lib_rss.php 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560
  1. <?php
  // Refuse to run on PHP versions older than 5.3.8.
  if (version_compare(PHP_VERSION, '5.3.8') < 0) {
      die('FreshRSS error: FreshRSS requires PHP 5.3.8+!');
  }

  // Fallback for installations without a native json_decode():
  // delegate to the bundled Services_JSON implementation.
  if (!function_exists('json_decode')) {
      require_once(__DIR__ . '/JSON.php');
      function json_decode($var, $assoc = false) {
          $decoder = new Services_JSON($assoc ? SERVICES_JSON_LOOSE_TYPE : 0);
          return $decoder->decode($var);
      }
  }

  // Fallback for installations without a native json_encode().
  if (!function_exists('json_encode')) {
      require_once(__DIR__ . '/JSON.php');
      function json_encode($var) {
          $encoder = new Services_JSON();
          return $encoder->encodeUnsafe($var);
      }
  }

  // Make sure the constant exists so callers can reference it unconditionally.
  if (!defined('JSON_UNESCAPED_UNICODE')) {
      define('JSON_UNESCAPED_UNICODE', 256); //PHP 5.3
  }
  /**
   * Build a path by gluing directory names together with the
   * platform's directory separator.
   *
   * The directory names are passed as separate arguments (variadic call).
   *
   * @return a string corresponding to the final pathname
   *         (an empty string when called without arguments)
   */
  function join_path() {
      return implode(DIRECTORY_SEPARATOR, func_get_args());
  }
  //<Auto-loading>
  /**
   * Autoloader mapping class names to files by prefix.
   *
   * - "FreshRSS"         => APP_PATH/FreshRSS.php
   * - "FreshRSS_X"       => APP_PATH/Models/X.php
   * - "FreshRSS_X_Y"     => APP_PATH/Ys/XY.php (Controllers, Exceptions)
   * - "Minz..."          => LIB_PATH/<name with "_" replaced by "/">.php
   * - "SimplePie..."     => LIB_PATH/SimplePie/<name with "_" replaced by "/">.php
   *
   * Any other class name is ignored.
   *
   * @param $class the name of the class to load
   */
  function classAutoloader($class) {
      if (strpos($class, 'FreshRSS') === 0) {
          $parts = explode('_', $class);
          $depth = count($parts);
          if ($depth === 1) {
              include(APP_PATH . '/' . $parts[0] . '.php');
          } elseif ($depth === 2) {
              include(APP_PATH . '/Models/' . $parts[1] . '.php');
          } elseif ($depth === 3) { //Controllers, Exceptions
              include(APP_PATH . '/' . $parts[2] . 's/' . $parts[1] . $parts[2] . '.php');
          }
          return;
      }

      if (strpos($class, 'Minz') === 0) {
          include(LIB_PATH . '/' . str_replace('_', '/', $class) . '.php');
          return;
      }

      if (strpos($class, 'SimplePie') === 0) {
          include(LIB_PATH . '/SimplePie/' . str_replace('_', '/', $class) . '.php');
      }
  }

  spl_autoload_register('classAutoloader');
  //</Auto-loading>
  /**
   * Convert the host part of a URL to its ASCII (Punycode) form.
   *
   * The URL is returned unchanged when the intl function idn_to_ascii() is
   * not available, when no host can be extracted, or when the conversion
   * of the host fails.
   *
   * @param $url the URL whose host should be converted
   * @return the URL with its host replaced by the converted host, or the
   *         original URL when nothing could be converted
   */
  function idn_to_puny($url) {
      if (!function_exists('idn_to_ascii')) {
          return $url;
      }

      $parts = parse_url($url);
      if (empty($parts['host'])) {
          return $url;
      }

      $idn = $parts['host'];
      // INTL_IDNA_VARIANT_UTS46 is defined starting in PHP 5.4
      if (defined('INTL_IDNA_VARIANT_UTS46')) {
          $puny = idn_to_ascii($idn, 0, INTL_IDNA_VARIANT_UTS46);
      } else {
          $puny = idn_to_ascii($idn);
      }

      // idn_to_ascii() returns false on failure: never splice that into the
      // URL, otherwise the host would silently be replaced by an empty string.
      if ($puny === false || $puny === '') {
          return $url;
      }

      $pos = strpos($url, $idn);
      if ($pos === false) {
          return $url;
      }
      return substr_replace($url, $puny, $pos, strlen($idn));
  }
  /**
   * Normalise and validate a URL.
   *
   * A missing http(s) scheme is completed with "http://", the host is passed
   * through idn_to_puny(), and the result is validated with FILTER_VALIDATE_URL.
   *
   * @param $url the URL to check
   * @return an empty string for an empty input, the normalised URL when it
   *         is valid, false otherwise
   */
  function checkUrl($url) {
      if ($url == '') {
          return '';
      }

      $has_scheme = preg_match('#^https?://#i', $url);
      if (!$has_scheme) {
          $url = 'http://' . $url;
      }

      $url = idn_to_puny($url); //PHP bug #53474 IDN

      return filter_var($url, FILTER_VALIDATE_URL) ? $url : false;
  }
  /**
   * Strip every byte below 32 and above 127 from a text.
   *
   * @param $text the text to filter
   * @return the filtered text
   */
  function safe_ascii($text) {
      $strip_flags = FILTER_FLAG_STRIP_LOW | FILTER_FLAG_STRIP_HIGH;
      return filter_var($text, FILTER_DEFAULT, $strip_flags);
  }
  /**
   * Test if a given server address is publicly accessible.
   *
   * Note: for the moment it tests only if address is corresponding to a
   * localhost address.
   *
   * The host is compared case-insensitively. An address given without a
   * scheme (bare IP or host name) is handled too: parse_url() finds no host
   * in such a value, so the address is retried with an "http://" prefix and,
   * as a last resort, compared as-is.
   *
   * @param $address the address to test, can be an IP or a URL.
   * @return true if server is accessible, false else.
   * @todo improve test with a more valid technique (e.g. test with an external server?)
   */
  function server_is_public($address) {
      $host = parse_url($address, PHP_URL_HOST);
      if (empty($host)) {
          // Bare "127.0.0.1" / "localhost": no scheme, hence no host component.
          $host = parse_url('http://' . $address, PHP_URL_HOST);
      }
      if (empty($host)) {
          $host = $address;
      }

      $local_hosts = array(
          '127.0.0.1',
          'localhost',
          'localhost.localdomain',
          '[::1]',
          'localhost6',
          'localhost6.localdomain6',
      );

      return !in_array(strtolower((string)$host), $local_hosts, true);
  }
  /**
   * Format a number with "." as decimal point and a narrow no-break space
   * (U+202F) as thousands separator.
   *
   * @param $n the number to format
   * @param $precision the number of decimals to keep
   * @return the formatted number as a UTF-8 string
   */
  function format_number($n, $precision = 0) {
      // number_format does not seem to be Unicode-compatible, so group with a
      // plain space first and swap it afterwards. The separator is written as
      // an explicit byte sequence so that it cannot be silently turned into a
      // regular space by an editor or an encoding conversion.
      $narrow_nbsp = "\xE2\x80\xAF"; // U+202F NARROW NO-BREAK SPACE
      return str_replace(' ', $narrow_nbsp, number_format($n, $precision, '.', ' '));
  }
  /**
   * Format a quantity of bytes with a unit suffix.
   *
   * @param $bytes the number of bytes (negative values are treated as 0)
   * @param $precision the number of decimals to keep
   * @param $system 'IEC' (base 1024, KiB...) or 'SI' (base 1000, KB...);
   *        any other value returns the plain formatted number without unit
   * @return the formatted string, e.g. "<number> MiB"
   */
  function format_bytes($bytes, $precision = 2, $system = 'IEC') {
      $systems = array(
          'IEC' => array(1024, array('B', 'KiB', 'MiB', 'GiB', 'TiB')),
          'SI' => array(1000, array('B', 'KB', 'MB', 'GB', 'TB')),
      );
      if (!is_string($system) || !isset($systems[$system])) {
          return format_number($bytes, $precision);
      }
      list($base, $units) = $systems[$system];

      $bytes = max(intval($bytes), 0);

      // Index of the largest unit not exceeding the value, capped to the last unit.
      $pow = 0;
      if ($bytes !== 0) {
          $pow = floor(log($bytes) / log($base));
      }
      $pow = min($pow, count($units) - 1);

      $bytes /= pow($base, $pow);
      return format_number($bytes, $precision) . ' ' . $units[$pow];
  }
  /**
   * Format a timestamp using translated date formats.
   *
   * The abbreviated month of the timestamp is looked up through _t() under
   * 'gen.date.<Mon>' and handed to the 'gen.date.format_date[_hour]'
   * translation, whose result is used as the date() format string.
   *
   * @param $t the Unix timestamp to format
   * @param $hour true to use the format including the hour, false otherwise
   * @return the formatted date
   */
  function timestamptodate ($t, $hour = true) {
      $month = _t('gen.date.' . date('M', $t));
      $format_key = $hour ? 'gen.date.format_date_hour' : 'gen.date.format_date';
      $format = _t($format_key, $month);
      return @date ($format, $t);
  }
  /**
   * Decode HTML named entities while preserving the XML ones.
   *
   * Entities from the HTML_ENTITIES table are replaced by their UTF-8
   * character, except those of the HTML_SPECIALCHARS table (&amp;, &lt;,
   * &gt;), which are left untouched. Quote entities are not part of either
   * table (ENT_NOQUOTES) and are therefore left untouched too.
   *
   * @param $text the text to decode
   * @return the text with HTML-only entities decoded
   */
  function html_only_entity_decode($text) {
      // Translation table, built once per request.
      static $htmlEntitiesOnly = null;
      if ($htmlEntitiesOnly === null) {
          // This file refuses to load below PHP 5.3.8, so the 'UTF-8' argument
          // (PHP 5.3.4+) is always available and no legacy fallback is needed.
          $htmlEntitiesOnly = array_flip(array_diff(
              get_html_translation_table(HTML_ENTITIES, ENT_NOQUOTES, 'UTF-8'), //Decode HTML entities
              get_html_translation_table(HTML_SPECIALCHARS, ENT_NOQUOTES, 'UTF-8') //Preserve XML entities
          ));
      }
      return strtr($text, $htmlEntitiesOnly);
  }
  /**
   * Create a SimplePie object configured for FreshRSS.
   *
   * Sets the user agent, syslog flag, cache location and duration, timeout,
   * cURL options, the HTML tags and attributes to strip or add, the
   * attributes holding URLs, and the list of domains to force to HTTPS
   * (read from force-https.default.txt and force-https.txt when readable).
   *
   * @param $attributes optional per-feed settings: 'timeout' (positive
   *        integer overriding the configured timeout) and 'ssl_verify'
   *        (enables or disables the SSL host and peer verification)
   * @return the configured SimplePie object (not yet initialised)
   */
  function customSimplePie($attributes = array()) {
      $system_conf = Minz_Configuration::get('system');
      $limits = $system_conf->limits;

      $feed = new SimplePie();
      $feed->set_useragent(FRESHRSS_USERAGENT);
      $feed->set_syslog($system_conf->simplepie_syslog_enabled);
      $feed->set_cache_location(CACHE_PATH);
      $feed->set_cache_duration($limits['cache_duration']);

      // A per-feed timeout wins over the global one only when strictly positive.
      $timeout = empty($attributes['timeout']) ? 0 : intval($attributes['timeout']);
      if ($timeout <= 0) {
          $timeout = $limits['timeout'];
      }
      $feed->set_timeout($timeout);

      $curl_options = $system_conf->curl_options;
      if (isset($attributes['ssl_verify'])) {
          $verify = (bool)$attributes['ssl_verify'];
          $curl_options[CURLOPT_SSL_VERIFYHOST] = $verify ? 2 : 0;
          $curl_options[CURLOPT_SSL_VERIFYPEER] = $verify;
      }
      $feed->set_curl_options($curl_options);

      $feed->strip_htmltags(array(
          'base', 'blink', 'body', 'doctype', 'embed',
          'font', 'form', 'frame', 'frameset', 'html',
          'link', 'input', 'marquee', 'meta', 'noscript',
          'object', 'param', 'plaintext', 'script', 'style',
      ));

      $extra_stripped_attributes = array(
          'autoplay', 'class', 'onload', 'onunload', 'onclick', 'ondblclick', 'onmousedown', 'onmouseup',
          'onmouseover', 'onmousemove', 'onmouseout', 'onfocus', 'onblur',
          'onkeypress', 'onkeydown', 'onkeyup', 'onselect', 'onchange', 'seamless', 'sizes', 'srcset',
      );
      $feed->strip_attributes(array_merge($feed->strip_attributes, $extra_stripped_attributes));

      $feed->add_attributes(array(
          'audio' => array('controls' => 'controls', 'preload' => 'none'),
          'iframe' => array('sandbox' => 'allow-scripts allow-same-origin'),
          'video' => array('controls' => 'controls', 'preload' => 'none'),
      ));

      $feed->set_url_replacements(array(
          'a' => 'href',
          'area' => 'href',
          'audio' => 'src',
          'blockquote' => 'cite',
          'del' => 'cite',
          'form' => 'action',
          'iframe' => 'src',
          'img' => array(
              'longdesc',
              'src'
          ),
          'input' => 'src',
          'ins' => 'cite',
          'q' => 'cite',
          'source' => 'src',
          'track' => 'src',
          'video' => array(
              'poster',
              'src',
          ),
      ));

      // Default list first, then the instance-specific one; unreadable files are skipped.
      $https_domains = array();
      $domain_lists = array(
          FRESHRSS_PATH . '/force-https.default.txt',
          DATA_PATH . '/force-https.txt',
      );
      foreach ($domain_lists as $domain_list) {
          $force = @file($domain_list, FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
          if (is_array($force)) {
              $https_domains = array_merge($https_domains, $force);
          }
      }
      $feed->set_https_domains($https_domains);

      return $feed;
  }
  /**
   * Sanitize a piece of HTML with the sanitizer of a SimplePie object
   * created by customSimplePie(), then decode the HTML-only entities.
   *
   * The SimplePie object is created and initialised on first call and
   * reused afterwards.
   *
   * @param $data the HTML to sanitize
   * @param $base the base URL handed to the sanitizer
   * @return the sanitized HTML
   */
  function sanitizeHTML($data, $base = '') {
      static $simplePie = null;
      if ($simplePie == null) {
          $simplePie = customSimplePie();
          $simplePie->init();
      }
      $clean = $simplePie->sanitize->sanitize($data, SIMPLEPIE_CONSTRUCT_HTML, $base);
      return html_only_entity_decode($clean);
  }
  /**
   * Retrieve the content of an article for a feed that does not provide
   * the full content.
   *
   * The page is downloaded, the elements matching the selector are
   * extracted, <img data-src="..."> attributes are moved to src, and the
   * result is sanitized.
   *
   * @param $url the URL of the article
   * @param $path the phpQuery selector of the content to extract
   * @return the sanitized HTML of the selected content
   * @throws Exception when the page could not be downloaded or is empty
   */
  function get_content_by_parsing ($url, $path) {
      require_once(LIB_PATH . '/lib_phpQuery.php');

      Minz_Log::notice('FreshRSS GET ' . SimplePie_Misc::url_remove_credentials($url));

      $html = file_get_contents($url);
      if (!$html) {
          throw new Exception();
      }

      $doc = phpQuery::newDocument($html);
      $content = $doc->find($path);

      foreach (pq('img[data-src]') as $img) {
          $image = pq($img);
          $lazy_source = $image->attr('data-src');
          if (strlen($lazy_source) <= 4) {
              continue;
          }
          $image->attr('src', $lazy_source);
          $image->removeAttr('data-src');
      }

      return sanitizeHTML($content->__toString(), $url);
  }
  /**
   * Add support of image lazy loading.
   *
   * For each <img> and <iframe> tag, the value of the src attribute is moved
   * to a data-original attribute and src is pointed to a placeholder icon.
   *
   * @param $content the HTML text to rewrite
   * @return the rewritten HTML
   */
  function lazyimg($content) {
      $pattern = '/<((?:img|iframe)[^>]+?)src=[\'"]([^"\']+)[\'"]([^>]*)>/i';
      $placeholder = Minz_Url::display('/themes/icons/grey.gif');
      $replacement = '<$1src="' . $placeholder . '" data-original="$2"$3>';
      return preg_replace($pattern, $replacement, $content);
  }
  /**
   * Return the current time in microseconds as a string of digits:
   * the seconds followed by the microseconds on exactly 6 digits.
   *
   * @return the current time, e.g. "1500000000000042"
   */
  function uTimeString() {
      $t = @gettimeofday();
      // Microseconds must be zero-padded on the LEFT (42 => "000042");
      // str_pad() pads on the right by default, which would give "420000".
      return $t['sec'] . str_pad((string)$t['usec'], 6, '0', STR_PAD_LEFT);
  }
  /**
   * Return the microsecond part of the current time on exactly 6 digits.
   *
   * @return a string of 6 digits, e.g. "000042"
   */
  function uSecString() {
      $t = @gettimeofday();
      // Zero-pad on the LEFT: the default right padding of str_pad() would
      // turn 42 microseconds into "420000".
      return str_pad((string)$t['usec'], 6, '0', STR_PAD_LEFT);
  }
  /**
   * Touch the log.txt file of a user.
   *
   * When the given username does not pass
   * FreshRSS_user_Controller::checkUsername(), the session parameter 'touch'
   * is set to the current time and the user of the current session is used
   * instead ('_' by default).
   *
   * @param $username the name of the user, or nothing for the current user
   * @return true if the file could be touched, false otherwise
   */
  function invalidateHttpCache($username = '') {
      if (!FreshRSS_user_Controller::checkUsername($username)) {
          Minz_Session::_param('touch', uTimeString());
          $username = Minz_Session::param('currentUser', '_');
      }
      $log_file = join_path(DATA_PATH, 'users', $username, 'log.txt');
      return touch($log_file);
  }
  /**
   * List the users having a configuration file.
   *
   * A user is a sub-directory of DATA_PATH/users which contains a config.php
   * file. The '_' entry and the entries starting with a dot are ignored.
   *
   * @return an array of user names
   */
  function listUsers() {
      $users = array();
      $base_path = join_path(DATA_PATH, 'users');

      $entries = array_values(array_diff(
          scandir($base_path),
          array('..', '.', '_')
      ));

      foreach ($entries as $entry) {
          if ($entry[0] === '.') {
              continue;
          }
          $user_dir = join_path($base_path, $entry);
          if (is_dir($user_dir) && file_exists(join_path($user_dir, 'config.php'))) {
              $users[] = $entry;
          }
      }

      return $users;
  }
  /**
   * Tell whether the maximum number of registrations has been reached.
   *
   * Note a max_registrations of 0 means there is no limit.
   *
   * @return true if number of users >= max registrations, false else.
   */
  function max_registrations_reached() {
      $limits = Minz_Configuration::get('system')->limits;
      $max_accounts = $limits['max_registrations'];
      $number_accounts = count(listUsers());

      if (!($max_accounts > 0)) {
          // No limit configured.
          return false;
      }
      return $number_accounts >= $max_accounts;
  }
  /**
   * Register and return the configuration of a given user.
   *
   * Note this function has been created to generate temporary configuration
   * objects. If you need a long-time configuration, please don't use this function.
   *
   * The configuration is registered under the namespace "user_<username>".
   * An already registered namespace is only logged as a warning and its
   * configuration is returned.
   *
   * @param $username the name of the user of which we want the configuration.
   * @return a Minz_Configuration object, null if the username is invalid or
   *         the configuration file does not exist.
   */
  function get_user_configuration($username) {
      if (!FreshRSS_user_Controller::checkUsername($username)) {
          return null;
      }

      $namespace = 'user_' . $username;
      try {
          $user_file = join_path(USERS_PATH, $username, 'config.php');
          $default_file = join_path(FRESHRSS_PATH, 'config-user.default.php');
          Minz_Configuration::register($namespace, $user_file, $default_file);
      } catch (Minz_ConfigurationNamespaceException $e) {
          // namespace already exists, do nothing.
          Minz_Log::warning($e->getMessage());
      } catch (Minz_FileNotExistException $e) {
          Minz_Log::warning($e->getMessage());
          return null;
      }

      return Minz_Configuration::get($namespace);
  }
  /**
   * Return the user name provided by the Web server authentication.
   *
   * REMOTE_USER is used when set, then REDIRECT_REMOTE_USER.
   *
   * @return the user name, or an empty string when none is set
   */
  function httpAuthUser() {
      foreach (array('REMOTE_USER', 'REDIRECT_REMOTE_USER') as $key) {
          if (isset($_SERVER[$key])) {
              return $_SERVER[$key];
          }
      }
      return '';
  }
  /**
   * Check that crypt() reproduces a known '$2y$' hash of the string 'password'.
   *
   * @return true if crypt() returns the expected hash, false otherwise
   *         (an exception is logged as a warning)
   */
  function cryptAvailable() {
      $known_hash = '$2y$04$usesomesillystringfore7hnbRJHxXVLeakoG8K30oukPsA.ztMG';
      try {
          return @crypt('password', $known_hash) === $known_hash;
      } catch (Exception $e) {
          Minz_Log::warning($e->getMessage());
          return false;
      }
  }
  /**
   * Check that the HTTP referer points to the same host and port as the
   * current request.
   *
   * The current host is taken from HTTP_HOST (SERVER_NAME when empty).
   * A missing port counts as 0 on both sides.
   *
   * @return true if the referer is empty or has the same host and port,
   *         false otherwise
   */
  function is_referer_from_same_domain() {
      if (empty($_SERVER['HTTP_REFERER'])) {
          return true; //Accept empty referer while waiting for good support of meta referrer same-origin policy in browsers
      }

      $is_https = isset($_SERVER['HTTPS']) && $_SERVER['HTTPS'] === 'on';
      $authority = empty($_SERVER['HTTP_HOST']) ? $_SERVER['SERVER_NAME'] : $_SERVER['HTTP_HOST'];
      $host = parse_url(($is_https ? 'https://' : 'http://') . $authority);
      $referer = parse_url($_SERVER['HTTP_REFERER']);

      if (empty($host['host']) || empty($referer['host'])) {
          return false;
      }
      if ($host['host'] !== $referer['host']) {
          return false;
      }

      //TODO: check 'scheme', taking into account the case of a proxy
      $host_port = isset($host['port']) ? $host['port'] : 0;
      $referer_port = isset($referer['port']) ? $referer['port'] : 0;
      return $host_port === $referer_port;
  }
  /**
   * Check PHP and its extensions are well-installed.
   *
   * @return array of tested values: each key ('php', 'minz', 'curl', 'pdo',
   *         'pcre', 'ctype', 'fileinfo', 'dom', 'json', 'zip') maps to true
   *         when the requirement is met, false otherwise.
   */
  function check_install_php() {
      // At least one of the supported PDO drivers is required.
      $has_pdo_driver = extension_loaded('pdo_mysql')
          || extension_loaded('pdo_sqlite')
          || extension_loaded('pdo_pgsql');

      $status = array();
      $status['php'] = version_compare(PHP_VERSION, '5.3.8') >= 0;
      $status['minz'] = file_exists(LIB_PATH . '/Minz');
      $status['curl'] = extension_loaded('curl');
      $status['pdo'] = $has_pdo_driver;
      foreach (array('pcre', 'ctype', 'fileinfo') as $extension) {
          $status[$extension] = extension_loaded($extension);
      }
      $status['dom'] = class_exists('DOMDocument');
      $status['json'] = extension_loaded('json');
      $status['zip'] = extension_loaded('zip');

      return $status;
  }
  /**
   * Check different data files and directories exist and are writable.
   *
   * @return array of tested values, keyed by 'data', 'cache', 'users',
   *         'favicons' and 'tokens'.
   */
  function check_install_files() {
      $status = array();
      $status['data'] = DATA_PATH && is_writable(DATA_PATH);
      $status['cache'] = CACHE_PATH && is_writable(CACHE_PATH);
      $status['users'] = USERS_PATH && is_writable(USERS_PATH);
      foreach (array('favicons', 'tokens') as $directory) {
          $status[$directory] = is_writable(DATA_PATH . '/' . $directory);
      }
      return $status;
  }
  /**
   * Check database is well-installed.
   *
   * 'connection' is set to false when a Minz_PDOConnectionException is
   * raised; the checks done before the exception keep their result, the
   * remaining ones stay false.
   *
   * @return array of tested values, keyed by 'connection', 'tables',
   *         'categories', 'feeds' and 'entries'.
   */
  function check_install_database() {
      $status = array('connection' => true)
          + array_fill_keys(array('tables', 'categories', 'feeds', 'entries'), false);

      try {
          $dao = FreshRSS_Factory::createDatabaseDAO();
          $status['tables'] = $dao->tablesAreCorrect();
          $status['categories'] = $dao->categoryIsCorrect();
          $status['feeds'] = $dao->feedIsCorrect();
          $status['entries'] = $dao->entryIsCorrect();
      } catch(Minz_PDOConnectionException $e) {
          $status['connection'] = false;
      }

      return $status;
  }
  /**
   * Remove a directory and everything it contains.
   *
   * From http://php.net/rmdir#110489
   *
   * @param $dir the directory to remove
   * @return true if $dir is not a directory, else the result of the final
   *         rmdir() call
   */
  function recursive_unlink($dir) {
      if (!is_dir($dir)) {
          return true;
      }

      foreach (scandir($dir) as $entry) {
          if ($entry === '.' || $entry === '..') {
              continue;
          }
          $path = $dir . '/' . $entry;
          if (!is_dir($path)) {
              unlink($path);
              continue;
          }
          // Best effort: make the sub-directory accessible before emptying it.
          @chmod($path, 0777);
          recursive_unlink($path);
      }

      return rmdir($dir);
  }
  /**
   * Remove queries where $get is appearing.
   *
   * @param $get the get attribute which should be removed.
   * @param $queries an array of queries.
   * @return the same array (keys preserved) without the queries whose
   *         'get' value is strictly equal to $get.
   */
  function remove_query_by_get($get, $queries) {
      $kept = array();
      foreach ($queries as $key => $query) {
          $is_target = !empty($query['get']) && $query['get'] === $get;
          if ($is_target) {
              continue;
          }
          $kept[$key] = $query;
      }
      return $kept;
  }
  /**
   * Append a value to an array unless the array already contains it
   * (loose comparison).
   *
   * @param $array the array in which we add the value (modified in place).
   * @param $value the value to add.
   */
  function array_push_unique(&$array, $value) {
      if (in_array($value, $array)) {
          return;
      }
      $array[] = $value;
  }
  /**
   * Remove every occurrence of a value from an array.
   *
   * The keys of the remaining elements are preserved (no re-indexing).
   *
   * @param $array the array from which value is removed (modified in place).
   * @param $value the value to remove.
   */
  function array_remove(&$array, $value) {
      $unwanted = array($value);
      $array = array_diff($array, $unwanted);
  }
  /**
   * Encode data with the URL-safe Base64 alphabet of RFC 4648:
   * "-" and "_" instead of "+" and "/", without "=" padding.
   *
   * @param $data the data to encode
   * @return the encoded string
   */
  function base64url_encode($data) {
      $unpadded = rtrim(base64_encode($data), '=');
      return str_replace(array('+', '/'), array('-', '_'), $unpadded);
  }
  /**
   * Decode data encoded with the URL-safe Base64 alphabet of RFC 4648
   * ("-" and "_" instead of "+" and "/").
   *
   * @param $data the string to decode
   * @return the decoded data
   */
  function base64url_decode($data) {
      $standard = str_replace(array('-', '_'), array('+', '/'), $data);
      return base64_decode($standard);
  }
  /**
   * Shortcut for FreshRSS_Themes::icon().
   *
   * @param $icon the icon identifier, passed through to FreshRSS_Themes::icon()
   * @param $url_only passed through unchanged as second argument
   * @return whatever FreshRSS_Themes::icon() returns
   */
  function _i($icon, $url_only = false) {
      $result = FreshRSS_Themes::icon($icon, $url_only);
      return $result;
  }