| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415 |
- <?php
- declare(strict_types=1);
- class FreshRSS_StatsDAO extends Minz_ModelPdo {
- public const ENTRY_COUNT_PERIOD = 30;
/**
 * Returns the number of seconds to add to UTC to obtain the time in PHP's
 * default timezone (date_default_timezone_get()), evaluated at the current instant.
 */
protected function getTimezoneOffset(): int {
    $utcNow = new DateTimeImmutable('now', new DateTimeZone('UTC'));
    $localZone = new DateTimeZone(date_default_timezone_get());
    return $localZone->getOffset($utcNow);
}
/**
 * Builds an SQL expression (based on FROM_UNIXTIME) that formats a timestamp field
 * as a date string truncated to the requested granularity, after shifting it by
 * the offset returned by getTimezoneOffset().
 *
 * @param string $field to use for the date; only letters, digits, `_` and `.` are accepted
 * @param int $precision divisor applied to the field to obtain seconds (1 for seconds, 1000 for milliseconds, 1000000 for microseconds)
 * @param 'day'|'month'|'year' $granularity of the date intervals
 * @throws InvalidArgumentException when the field name or the granularity is rejected
 */
protected function sqlDateToIsoGranularity(string $field, int $precision, string $granularity): string {
    // The field is interpolated into SQL, hence the strict whitelist of characters.
    if (preg_match('/^[a-zA-Z0-9_.]+$/', $field) !== 1) {
        throw new InvalidArgumentException('Invalid date field!');
    }
    $offset = $this->getTimezoneOffset();
    $format = match ($granularity) {
        'day' => '%Y-%m-%d',
        'month' => '%Y-%m',
        'year' => '%Y',
        default => throw new InvalidArgumentException('Invalid date granularity!'),
    };
    return "FROM_UNIXTIME(($field / $precision) + $offset, '$format')";
}
/**
 * Wraps an SQL expression in a FLOOR() call.
 * @param string $s SQL expression, inserted verbatim
 */
protected function sqlFloor(string $s): string {
    return 'FLOOR(' . $s . ')';
}
/**
 * Computes the entry repartition twice: once restricted to the main stream
 * and once over all feeds.
 *
 * @return array{'main_stream':array{'total':int,'count_unreads':int,'count_reads':int,'count_favorites':int}|false,'all_feeds':array{'total':int,'count_unreads':int,'count_reads':int,'count_favorites':int}|false}
 */
public function calculateEntryRepartition(): array {
    $mainStream = $this->calculateEntryRepartitionPerFeed(null, true);
    $allFeeds = $this->calculateEntryRepartitionPerFeed(null, false);
    return [
        'main_stream' => $mainStream,
        'all_feeds' => $allFeeds,
    ];
}
/**
 * Calculates entry repartition for the selection.
 * The repartition includes:
 * - total entries
 * - read entries
 * - unread entries
 * - favorite entries
 *
 * @param int|null $feed when not null, only entries of this feed are counted
 * @param bool $only_main when true, only feeds with priority 10 are counted
 *  (the selection exposed as 'main_stream' by calculateEntryRepartition())
 * @return array{total:int,count_unreads:int,count_reads:int,count_favorites:int}|false
 *  false when the query yields no usable row
 */
public function calculateEntryRepartitionPerFeed(?int $feed = null, bool $only_main = false): array|false {
    $conditions = [];
    if ($only_main) {
        $conditions[] = 'AND f.priority = 10';
    }
    if ($feed !== null) {
        $conditions[] = "AND e.id_feed = {$feed}";
    }
    // Joined with a space: plain concatenation produced "... = 10AND e.id_feed = N"
    // when both restrictions were requested at the same time.
    $filter = implode(' ', $conditions);
    $sql = <<<SQL
    SELECT COUNT(1) AS total,
    COUNT(1) - SUM(e.is_read) AS count_unreads,
    SUM(e.is_read) AS count_reads,
    SUM(e.is_favorite) AS count_favorites
    FROM `_entry` AS e, `_feed` AS f
    WHERE e.id_feed = f.id
    {$filter}
    SQL;
    $res = $this->fetchAssoc($sql);
    if (is_array($res) && !empty($res[0]) && is_array($res[0])) {
        // Every column is cast to int; a NULL sum becomes 0 through intval().
        $dao = array_map('intval', $res[0]);
        /** @var array{total:int,count_unreads:int,count_reads:int,count_favorites:int} $dao */
        return $dao;
    }
    return false;
}
/**
 * Counts entries per day over the ENTRY_COUNT_PERIOD days preceding today's midnight.
 * Keys are day offsets relative to that midnight (negative numbers); days without
 * entries keep the 0 provided by initEntryCountArray().
 * @return array<int,int> empty array when the query does not return an array
 */
public function calculateEntryCount(): array {
    $todayMidnight = mktime(0, 0, 0) ?: 0;
    $periodStart = $todayMidnight - (self::ENTRY_COUNT_PERIOD * 86400);
    // Number of whole days between the entry date and today's midnight
    $dayExpression = $this->sqlFloor("(date - $todayMidnight) / 86400");
    $sql = <<<SQL
    SELECT {$dayExpression} AS day,
    COUNT(*) as count
    FROM `_entry`
    WHERE date >= {$periodStart} AND date < {$todayMidnight}
    GROUP BY day
    ORDER BY day ASC
    SQL;
    $rows = $this->fetchAssoc($sql);
    if (!is_array($rows)) {
        return [];
    }
    $count = $this->initEntryCountArray();
    /** @var list<array{day:int,count:int}> $rows */
    foreach ($rows as $row) {
        $dayOffset = (int)($row['day']);
        $count[$dayOffset] = (int)($row['count']);
    }
    return $count;
}
/**
 * Builds the zero-filled array used by the entry count, keyed from
 * -ENTRY_COUNT_PERIOD up to -1.
 * @return array<int,int>
 */
protected function initEntryCountArray(): array {
    $firstDay = -self::ENTRY_COUNT_PERIOD;
    $lastDay = -1;
    return $this->initStatsArray($firstDay, $lastDay);
}
/**
 * Counts articles per hour of the day (grouping format '%H'), optionally for a single feed.
 * @return array<int,int>
 */
public function calculateEntryRepartitionPerFeedPerHour(?int $feed = null): array {
    $hourFormat = '%H';
    return $this->calculateEntryRepartitionPerFeedPerPeriod($hourFormat, $feed);
}
/**
 * Counts articles per day of the week (grouping format '%w'), optionally for a single feed.
 * @return array<int,int>
 */
public function calculateEntryRepartitionPerFeedPerDayOfWeek(?int $feed = null): array {
    $weekdayFormat = '%w';
    return $this->calculateEntryRepartitionPerFeedPerPeriod($weekdayFormat, $feed);
}
/**
 * Calculates the number of article per month per feed.
 *
 * The per-period result is keyed by month number (Jan=1, Dec=12). It is converted
 * to a list of exactly 12 values (index 0 = January, index 11 = December).
 *
 * @return array<int,int> empty array when the per-period computation returns nothing
 */
public function calculateEntryRepartitionPerFeedPerMonth(?int $feed = null): array {
    $perMonthNumber = $this->calculateEntryRepartitionPerFeedPerPeriod('%m', $feed);
    if ($perMonthNumber === []) {
        return [];
    }
    // Read months 1..12 explicitly instead of dropping the first element:
    // the per-period array is only pre-filled for keys 0..11, so dropping key 0
    // left 11 values whenever no entry had been published in December.
    $monthRepartition = [];
    for ($month = 1; $month <= 12; $month++) {
        $monthRepartition[] = $perMonthNumber[$month] ?? 0;
    }
    return $monthRepartition;
}
/**
 * Counts articles grouped by a date component, optionally for a single feed.
 * The result is pre-filled with zeros for keys 0 .. size-1, where size depends on
 * the format ('%H' => 24, '%w' => 7, '%m' => 12, anything else => 30); the counts
 * returned by the query are then written at the key given by the integer value of the period.
 * @param string $period format string to use for grouping (inserted into DATE_FORMAT)
 * @return array<int,int> empty array when the query returns nothing
 */
protected function calculateEntryRepartitionPerFeedPerPeriod(string $period, ?int $feed = null): array {
    $restrict = $feed ? "WHERE e.id_feed = {$feed}" : '';
    $offset = $this->getTimezoneOffset();
    $sql = <<<SQL
    SELECT DATE_FORMAT(FROM_UNIXTIME(e.date + {$offset}), '{$period}') AS period
    , COUNT(1) AS count
    FROM `_entry` AS e
    {$restrict}
    GROUP BY period
    ORDER BY period ASC
    SQL;
    $rows = $this->fetchAssoc($sql);
    if (!$rows) {
        return [];
    }
    $knownSizes = [
        '%H' => 24,
        '%w' => 7,
        '%m' => 12,
    ];
    $periodMax = $knownSizes[$period] ?? 30;
    $repartition = array_fill(0, $periodMax, 0);
    foreach ($rows as $row) {
        $slot = (int)$row['period'];
        $repartition[$slot] = (int)$row['count'];
    }
    return $repartition;
}
/**
 * Average number of articles per hour, optionally for a single feed
 * (uses a period of 1/24 of a day).
 */
public function calculateEntryAveragePerFeedPerHour(?int $feed = null): float {
    $hourInDays = 1 / 24;
    return $this->calculateEntryAveragePerFeedPerPeriod($hourInDays, $feed);
}
/**
 * Average number of articles per week, optionally for a single feed
 * (uses a period of 7 days).
 */
public function calculateEntryAveragePerFeedPerDayOfWeek(?int $feed = null): float {
    $weekInDays = 7;
    return $this->calculateEntryAveragePerFeedPerPeriod($weekInDays, $feed);
}
/**
 * Average number of articles per month, optionally for a single feed
 * (uses a period of 30 days).
 */
public function calculateEntryAveragePerFeedPerMonth(?int $feed = null): float {
    $monthInDays = 30;
    return $this->calculateEntryAveragePerFeedPerPeriod($monthInDays, $feed);
}
/**
 * Average number of articles per period, optionally for a single feed.
 * The number of days between the oldest and the newest entry date is divided by
 * $period to get a number of periods; the entry count is divided by that number.
 * @param float $period length of one period, expressed in days
 * @return float -1.0 when the query gives no usable row
 */
protected function calculateEntryAveragePerFeedPerPeriod(float $period, ?int $feed = null): float {
    $restrict = $feed ? "WHERE e.id_feed = {$feed}" : '';
    $sql = <<<SQL
    SELECT COUNT(1) AS count
    , MIN(date) AS date_min
    , MAX(date) AS date_max
    FROM `_entry` AS e
    {$restrict}
    SQL;
    $rows = $this->fetchAssoc($sql);
    $stats = $rows[0] ?? null;
    if (empty($stats)) {
        return -1.0;
    }
    $oldest = (new \DateTimeImmutable())->setTimestamp((int)($stats['date_min']));
    $newest = (new \DateTimeImmutable())->setTimestamp((int)($stats['date_max']));
    // '%a' is the total number of days of the (absolute) interval
    $days = (float)($newest->diff($oldest, true)->format('%a'));
    if ($days <= 0) {
        // Less than one day between both dates: use exactly one period,
        // so that the result is the plain entry count.
        $days = $period;
    }
    $periods = $days / $period;
    return (int)$stats['count'] / $periods;
}
/**
 * Builds an array whose keys are the integers of range($min, $max),
 * each mapped to 0.
 * @return array<int,int>
 */
protected function initStatsArray(int $min, int $max): array {
    $keys = range($min, $max);
    return array_fill_keys($keys, 0);
}
/**
 * Counts feeds per category name, largest count first.
 * @return list<array{'label':string,'data':int}> empty list when the query returns nothing
 */
public function calculateFeedByCategory(): array {
    $sql = <<<SQL
    SELECT c.name AS label
    , COUNT(f.id) AS data
    FROM `_category` AS c, `_feed` AS f
    WHERE c.id = f.category
    GROUP BY label
    ORDER BY data DESC
    SQL;
    $rows = $this->fetchAssoc($sql);
    /** @var list<array{'label':string,'data':int}>|null $rows */
    if ($rows == null) {
        return [];
    }
    return $rows;
}
/**
 * Counts entries per category name, largest count first.
 * @return list<array{'label':string,'data':int}> empty list when the query returns nothing
 */
public function calculateEntryByCategory(): array {
    $sql = <<<SQL
    SELECT c.name AS label
    , COUNT(e.id) AS data
    FROM `_category` AS c, `_feed` AS f, `_entry` AS e
    WHERE c.id = f.category
    AND f.id = e.id_feed
    GROUP BY label
    ORDER BY data DESC
    SQL;
    $rows = $this->fetchAssoc($sql);
    /** @var list<array{'label':string,'data':int}>|null $rows */
    if ($rows == null) {
        return [];
    }
    return $rows;
}
/**
 * Lists the 10 feeds having the most entries, with their category name
 * and entry count, largest count first.
 * @return list<array{'id':int,'name':string,'category':string,'count':int}>
 *  empty list when the query does not return an array
 */
public function calculateTopFeed(): array {
    $sql = <<<SQL
    SELECT f.id AS id
    , MAX(f.name) AS name
    , MAX(c.name) AS category
    , COUNT(e.id) AS count
    FROM `_category` AS c, `_feed` AS f, `_entry` AS e
    WHERE c.id = f.category
    AND f.id = e.id_feed
    GROUP BY f.id
    ORDER BY count DESC
    LIMIT 10
    SQL;
    $rows = $this->fetchAssoc($sql);
    /** @var list<array{'id':int,'name':string,'category':string,'count':int}>|null $rows */
    return is_array($rows) ? $rows : [];
}
/**
 * For each feed having entries, gives the most recent entry date and the
 * number of entries, ordered by feed name.
 * @return list<array{'id':int,'name':string,'last_date':int,'nb_articles':int}>
 *  empty list when the query does not return an array
 */
public function calculateFeedLastDate(): array {
    $sql = <<<SQL
    SELECT MAX(f.id) as id
    , MAX(f.name) AS name
    , MAX(date) AS last_date
    , COUNT(*) AS nb_articles
    FROM `_feed` AS f, `_entry` AS e
    WHERE f.id = e.id_feed
    GROUP BY f.id
    ORDER BY name
    SQL;
    $rows = $this->fetchAssoc($sql);
    /** @var list<array{'id':int,'name':string,'last_date':int,'nb_articles':int}>|null $rows */
    return is_array($rows) ? $rows : [];
}
/**
 * Gives the day names for graphs, Sunday first, by passing the day keys
 * to convertToTranslatedJson().
 * @return list<string>
 */
public function getDays(): array {
    $dayKeys = ['sun', 'mon', 'tue', 'wed', 'thu', 'fri', 'sat'];
    return $this->convertToTranslatedJson($dayKeys);
}
/**
 * Gives the month names for graphs, January first, by passing the month keys
 * to convertToTranslatedJson().
 * @return list<string>
 */
public function getMonths(): array {
    $monthKeys = [
        'jan', 'feb', 'mar', 'apr', 'may_', 'jun',
        'jul', 'aug', 'sep', 'oct', 'nov', 'dec',
    ];
    return $this->convertToTranslatedJson($monthKeys);
}
/**
 * Maps every key of the list to the result of _t() for 'gen.date.' followed by that key.
 * @param list<string> $data
 * @return list<string>
 */
private function convertToTranslatedJson(array $data = []): array {
    return array_map(
        static function (string $key) {
            return _t('gen.date.' . $key);
        },
        $data
    );
}
/**
 * Gets the date intervals with the largest number of unread articles,
 * largest count first (most recent interval first on equal counts).
 * Failures of the statement are logged through Minz_Log::error() and give an empty list.
 * @param 'id'|'date' $field to use for the date ('id' is divided by 1000000, 'date' is used as is)
 * @param 'day'|'month'|'year' $granularity of the date intervals
 * @param int $max maximum number of intervals returned
 * @param int $minPriority only feeds with at least this priority are considered
 * @return list<array{'granularity':string,'unread_count':int}>
 */
public function getMaxUnreadDates(string $field, string $granularity, int $max = 100, int $minPriority = FreshRSS_Feed::PRIORITY_HIDDEN): array {
    $precision = $field === 'id' ? 1000000 : 1;
    $dateExpression = $this->sqlDateToIsoGranularity('e.' . $field, precision: $precision, granularity: $granularity);
    $sql = <<<SQL
    SELECT
    {$dateExpression} AS granularity,
    COUNT(*) AS unread_count
    FROM `_entry` e
    INNER JOIN `_feed` f ON e.id_feed = f.id
    WHERE e.is_read = 0 AND f.priority >= :min_priority
    GROUP BY granularity
    ORDER BY unread_count DESC, granularity DESC
    LIMIT :max
    SQL;
    $stm = $this->pdo->prepare($sql);
    $executed = $stm !== false
        && $stm->bindValue(':min_priority', $minPriority, PDO::PARAM_INT)
        && $stm->bindValue(':max', $max, PDO::PARAM_INT)
        && $stm->execute();
    if ($executed) {
        $rows = $stm->fetchAll(PDO::FETCH_ASSOC);
        if (is_array($rows)) {
            /** @var list<array{granularity:string,unread_count:int}> $rows */
            return $rows;
        }
    }
    // Without a statement, the error details come from the connection itself
    $info = $stm === false ? $this->pdo->errorInfo() : $stm->errorInfo();
    Minz_Log::error('SQL error ' . __METHOD__ . json_encode($info));
    return [];
}
- }
|