lib_rss.php 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327
  1. <?php
  2. if (!function_exists('json_decode')) {
  3. require_once('JSON.php');
  4. function json_decode($var) {
  5. $JSON = new Services_JSON;
  6. return (array)($JSON->decode($var));
  7. }
  8. }
  9. if (!function_exists('json_encode')) {
  10. require_once('JSON.php');
  11. function json_encode($var) {
  12. $JSON = new Services_JSON;
  13. return $JSON->encodeUnsafe($var);
  14. }
  15. }
  16. /**
  17. * Build a directory path by concatenating a list of directory names.
  18. *
  19. * @param $path_parts a list of directory names
  20. * @return a string corresponding to the final pathname
  21. */
  22. function join_path() {
  23. $path_parts = func_get_args();
  24. return join(DIRECTORY_SEPARATOR, $path_parts);
  25. }
  26. //<Auto-loading>
  27. function classAutoloader($class) {
  28. if (strpos($class, 'FreshRSS') === 0) {
  29. $components = explode('_', $class);
  30. switch (count($components)) {
  31. case 1:
  32. include(APP_PATH . '/' . $components[0] . '.php');
  33. return;
  34. case 2:
  35. include(APP_PATH . '/Models/' . $components[1] . '.php');
  36. return;
  37. case 3: //Controllers, Exceptions
  38. @include(APP_PATH . '/' . $components[2] . 's/' . $components[1] . $components[2] . '.php');
  39. return;
  40. }
  41. } elseif (strpos($class, 'Minz') === 0) {
  42. include(LIB_PATH . '/' . str_replace('_', '/', $class) . '.php');
  43. } elseif (strpos($class, 'SimplePie') === 0) {
  44. include(LIB_PATH . '/SimplePie/' . str_replace('_', '/', $class) . '.php');
  45. }
  46. }
  47. spl_autoload_register('classAutoloader');
  48. //</Auto-loading>
  49. function checkUrl($url) {
  50. if (empty ($url)) {
  51. return '';
  52. }
  53. if (!preg_match ('#^https?://#i', $url)) {
  54. $url = 'http://' . $url;
  55. }
  56. if (filter_var($url, FILTER_VALIDATE_URL) ||
  57. (version_compare(PHP_VERSION, '5.3.3', '<') && (strpos($url, '-') > 0) && //PHP bug #51192
  58. ($url === filter_var($url, FILTER_SANITIZE_URL)))) {
  59. return $url;
  60. } else {
  61. return false;
  62. }
  63. }
  64. function format_number($n, $precision = 0) {
  65. // number_format does not seem to be Unicode-compatible
  66. return str_replace(' ', ' ', //Espace fine insécable
  67. number_format($n, $precision, '.', ' ')
  68. );
  69. }
  70. function format_bytes($bytes, $precision = 2, $system = 'IEC') {
  71. if ($system === 'IEC') {
  72. $base = 1024;
  73. $units = array('B', 'KiB', 'MiB', 'GiB', 'TiB');
  74. } elseif ($system === 'SI') {
  75. $base = 1000;
  76. $units = array('B', 'KB', 'MB', 'GB', 'TB');
  77. }
  78. $bytes = max(intval($bytes), 0);
  79. $pow = $bytes === 0 ? 0 : floor(log($bytes) / log($base));
  80. $pow = min($pow, count($units) - 1);
  81. $bytes /= pow($base, $pow);
  82. return format_number($bytes, $precision) . ' ' . $units[$pow];
  83. }
  84. function timestamptodate ($t, $hour = true) {
  85. $month = _t('gen.date.' . date('M', $t));
  86. if ($hour) {
  87. $date = _t('gen.date.format_date_hour', $month);
  88. } else {
  89. $date = _t('gen.date.format_date', $month);
  90. }
  91. return @date ($date, $t);
  92. }
  93. function html_only_entity_decode($text) {
  94. static $htmlEntitiesOnly = null;
  95. if ($htmlEntitiesOnly === null) {
  96. if (version_compare(PHP_VERSION, '5.3.4') >= 0) {
  97. $htmlEntitiesOnly = array_flip(array_diff(
  98. get_html_translation_table(HTML_ENTITIES, ENT_NOQUOTES, 'UTF-8'), //Decode HTML entities
  99. get_html_translation_table(HTML_SPECIALCHARS, ENT_NOQUOTES, 'UTF-8') //Preserve XML entities
  100. ));
  101. } else {
  102. $htmlEntitiesOnly = array_map('utf8_encode', array_flip(array_diff(
  103. get_html_translation_table(HTML_ENTITIES, ENT_NOQUOTES), //Decode HTML entities
  104. get_html_translation_table(HTML_SPECIALCHARS, ENT_NOQUOTES) //Preserve XML entities
  105. )));
  106. }
  107. }
  108. return strtr($text, $htmlEntitiesOnly);
  109. }
  110. function customSimplePie() {
  111. $limits = Minz_Configuration::limits();
  112. $simplePie = new SimplePie();
  113. $simplePie->set_useragent(_t('gen.freshrss') . '/' . FRESHRSS_VERSION . ' (' . PHP_OS . '; ' . FRESHRSS_WEBSITE . ') ' . SIMPLEPIE_NAME . '/' . SIMPLEPIE_VERSION);
  114. $simplePie->set_cache_location(CACHE_PATH);
  115. $simplePie->set_cache_duration($limits['cache_duration']);
  116. $simplePie->set_timeout($limits['timeout']);
  117. $simplePie->strip_htmltags(array(
  118. 'base', 'blink', 'body', 'doctype', 'embed',
  119. 'font', 'form', 'frame', 'frameset', 'html',
  120. 'link', 'input', 'marquee', 'meta', 'noscript',
  121. 'object', 'param', 'plaintext', 'script', 'style',
  122. ));
  123. $simplePie->strip_attributes(array_merge($simplePie->strip_attributes, array(
  124. 'autoplay', 'onload', 'onunload', 'onclick', 'ondblclick', 'onmousedown', 'onmouseup',
  125. 'onmouseover', 'onmousemove', 'onmouseout', 'onfocus', 'onblur',
  126. 'onkeypress', 'onkeydown', 'onkeyup', 'onselect', 'onchange', 'seamless')));
  127. $simplePie->add_attributes(array(
  128. 'img' => array('lazyload' => '', 'postpone' => ''), //http://www.w3.org/TR/resource-priorities/
  129. 'audio' => array('lazyload' => '', 'postpone' => '', 'preload' => 'none'),
  130. 'iframe' => array('lazyload' => '', 'postpone' => '', 'sandbox' => 'allow-scripts allow-same-origin'),
  131. 'video' => array('lazyload' => '', 'postpone' => '', 'preload' => 'none'),
  132. ));
  133. $simplePie->set_url_replacements(array(
  134. 'a' => 'href',
  135. 'area' => 'href',
  136. 'audio' => 'src',
  137. 'blockquote' => 'cite',
  138. 'del' => 'cite',
  139. 'form' => 'action',
  140. 'iframe' => 'src',
  141. 'img' => array(
  142. 'longdesc',
  143. 'src'
  144. ),
  145. 'input' => 'src',
  146. 'ins' => 'cite',
  147. 'q' => 'cite',
  148. 'source' => 'src',
  149. 'track' => 'src',
  150. 'video' => array(
  151. 'poster',
  152. 'src',
  153. ),
  154. ));
  155. return $simplePie;
  156. }
  157. function sanitizeHTML($data, $base = '') {
  158. static $simplePie = null;
  159. if ($simplePie == null) {
  160. $simplePie = customSimplePie();
  161. $simplePie->init();
  162. }
  163. return html_only_entity_decode($simplePie->sanitize->sanitize($data, SIMPLEPIE_CONSTRUCT_HTML, $base));
  164. }
  165. /* permet de récupérer le contenu d'un article pour un flux qui n'est pas complet */
  166. function get_content_by_parsing ($url, $path) {
  167. require_once (LIB_PATH . '/lib_phpQuery.php');
  168. syslog(LOG_INFO, 'FreshRSS GET ' . $url);
  169. $html = file_get_contents ($url);
  170. if ($html) {
  171. $doc = phpQuery::newDocument ($html);
  172. $content = $doc->find ($path);
  173. return sanitizeHTML($content->__toString(), $url);
  174. } else {
  175. throw new Exception ();
  176. }
  177. }
  178. /**
  179. * Add support of image lazy loading
  180. * Move content from src attribute to data-original
  181. * @param content is the text we want to parse
  182. */
  183. function lazyimg($content) {
  184. return preg_replace(
  185. '/<((?:img|iframe)[^>]+?)src=[\'"]([^"\']+)[\'"]([^>]*)>/i',
  186. '<$1src="' . Minz_Url::display('/themes/icons/grey.gif') . '" data-original="$2"$3>',
  187. $content
  188. );
  189. }
  190. function uTimeString() {
  191. $t = @gettimeofday();
  192. return $t['sec'] . str_pad($t['usec'], 6, '0');
  193. }
  194. function uSecString() {
  195. $t = @gettimeofday();
  196. return str_pad($t['usec'], 6, '0');
  197. }
  198. function invalidateHttpCache() {
  199. Minz_Session::_param('touch', uTimeString());
  200. return touch(LOG_PATH . '/' . Minz_Session::param('currentUser', '_') . '.log');
  201. }
  202. function listUsers() {
  203. return array_values(array_diff(
  204. scandir(join_path(DATA_PATH, 'users')),
  205. array('..', '.')
  206. ));
  207. }
  208. function httpAuthUser() {
  209. return isset($_SERVER['REMOTE_USER']) ? $_SERVER['REMOTE_USER'] : '';
  210. }
  211. function cryptAvailable() {
  212. if (version_compare(PHP_VERSION, '5.3.3', '>=')) {
  213. try {
  214. $hash = '$2y$04$usesomesillystringfore7hnbRJHxXVLeakoG8K30oukPsA.ztMG';
  215. return $hash === @crypt('password', $hash);
  216. } catch (Exception $e) {
  217. }
  218. }
  219. return false;
  220. }
  221. function is_referer_from_same_domain() {
  222. if (empty($_SERVER['HTTP_REFERER'])) {
  223. return false;
  224. }
  225. $host = parse_url(((isset($_SERVER['HTTPS']) && $_SERVER['HTTPS'] === 'on') ? 'https://' : 'http://') .
  226. (empty($_SERVER['HTTP_HOST']) ? $_SERVER['SERVER_NAME'] : $_SERVER['HTTP_HOST']));
  227. $referer = parse_url($_SERVER['HTTP_REFERER']);
  228. if (empty($host['host']) || empty($referer['host']) || $host['host'] !== $referer['host']) {
  229. return false;
  230. }
  231. //TODO: check 'scheme', taking into account the case of a proxy
  232. if ((isset($host['port']) ? $host['port'] : 0) !== (isset($referer['port']) ? $referer['port'] : 0)) {
  233. return false;
  234. }
  235. return true;
  236. }
  237. /**
  238. * Check PHP and its extensions are well-installed.
  239. *
  240. * @return array of tested values.
  241. */
  242. function check_install_php() {
  243. $pdo_mysql = extension_loaded('pdo_mysql');
  244. $pdo_sqlite = extension_loaded('pdo_sqlite');
  245. return array(
  246. 'php' => version_compare(PHP_VERSION, '5.2.1') >= 0,
  247. 'minz' => file_exists(LIB_PATH . '/Minz'),
  248. 'curl' => extension_loaded('curl'),
  249. 'pdo' => $pdo_mysql || $pdo_sqlite,
  250. 'pcre' => extension_loaded('pcre'),
  251. 'ctype' => extension_loaded('ctype'),
  252. 'dom' => class_exists('DOMDocument'),
  253. 'json' => extension_loaded('json'),
  254. 'zip' => extension_loaded('zip'),
  255. );
  256. }
  257. /**
  258. * Check different data files and directories exist.
  259. *
  260. * @return array of tested values.
  261. */
  262. function check_install_files() {
  263. return array(
  264. 'data' => DATA_PATH && is_writable(DATA_PATH),
  265. 'cache' => CACHE_PATH && is_writable(CACHE_PATH),
  266. 'logs' => LOG_PATH && is_writable(LOG_PATH),
  267. 'favicons' => is_writable(DATA_PATH . '/favicons'),
  268. 'persona' => is_writable(DATA_PATH . '/persona'),
  269. 'tokens' => is_writable(DATA_PATH . '/tokens'),
  270. );
  271. }
  272. /**
  273. * Check database is well-installed.
  274. *
  275. * @return array of tested values.
  276. */
  277. function check_install_database() {
  278. $status = array(
  279. 'connection' => true,
  280. 'tables' => false,
  281. 'categories' => false,
  282. 'feeds' => false,
  283. 'entries' => false,
  284. );
  285. try {
  286. $dbDAO = FreshRSS_Factory::createDatabaseDAO();
  287. $status['tables'] = $dbDAO->tablesAreCorrect();
  288. $status['categories'] = $dbDAO->categoryIsCorrect();
  289. $status['feeds'] = $dbDAO->feedIsCorrect();
  290. $status['entries'] = $dbDAO->entryIsCorrect();
  291. } catch(Minz_PDOConnectionException $e) {
  292. $status['connection'] = false;
  293. }
  294. return $status;
  295. }