From ba8e8f5fb86e4c44c290af77d90d306c87f6832f Mon Sep 17 00:00:00 2001 From: SansGuidon Date: Wed, 2 Apr 2025 05:01:43 +0000 Subject: [PATCH] change(indieblog): enable refreshing feed with a certain date --- cron/generate_indieblog_daily_rss.php | 76 +++++++++++++-------------- 1 file changed, 38 insertions(+), 38 deletions(-) diff --git a/cron/generate_indieblog_daily_rss.php b/cron/generate_indieblog_daily_rss.php index e2a0640..978c09c 100644 --- a/cron/generate_indieblog_daily_rss.php +++ b/cron/generate_indieblog_daily_rss.php @@ -1,12 +1,26 @@ str_replace('/', '\/', $pattern), $excludePatterns); - -// Crée une expression régulière unique pour matcher toutes les exclusions $excludeRegex = '/' . implode('|', $excludePatterns) . '/i'; -// Vérifier si le script est en mode dry run +// Check for dry-run mode $isDryRun = in_array('dry-run', $argv); -$maxResults = 100; // Limite par défaut pour la sortie +$maxResults = 100; // Default limit foreach ($argv as $arg) { if (preg_match('/^max-results=(\d+)$/', $arg, $matches)) { $maxResults = (int)$matches[1]; @@ -73,7 +77,7 @@ if (!$data) die("Error: Invalid JSON data from $jsonUrl\n"); $includedIds = file_exists($cacheFile) ? file($cacheFile, FILE_IGNORE_NEW_LINES) : []; -// Filtrer les articles récents, non déjà inclus, et ne contenant pas de termes exclus +// Filter recent articles, not already included, and not matching exclude regex $newItems = []; $excludedItems = []; @@ -81,11 +85,9 @@ foreach ($data as $item) { if (!isset($item['published'], $item['itemid'], $item['itemtitle'])) { continue; } - $published = $item['published']; $itemId = $item['itemid']; $itemTitle = $item['itemtitle']; - if (in_array($itemId, $includedIds) || $published < $cutoffDate || preg_match($excludeRegex, $itemTitle)) { $excludedItems[] = $item; } else { @@ -96,18 +98,15 @@ foreach ($data as $item) { usort($newItems, fn($a, $b) => $b['published'] <=> $a['published']); usort($excludedItems, fn($a, $b) => $b['published'] <=> $a['published']); +// Dry run: display filtered items if ($isDryRun) { - // Mode dry-run : afficher les entrées incluses et exclues echo "=== Dry Run Mode ===\n"; - $showIncluded = array_slice($newItems, 0, $maxResults); $showExcluded = array_slice($excludedItems, 0, $maxResults); - echo "Filtered IN (" . count($newItems) . " total, showing up to $maxResults):\n"; foreach ($showIncluded as $item) { echo "- " . ($item['itemtitle'] ?? 'No title') . "\n"; } - echo "\nFiltered OUT (" . count($excludedItems) . " total, showing up to $maxResults):\n"; foreach ($showExcluded as $item) { echo "- " . ($item['itemtitle'] ?? 'No title') . "\n"; @@ -115,12 +114,15 @@ if ($isDryRun) { exit(0); } -// Groupement par jour pour les nouveaux éléments +// Group items only for the target date $groupedByDay = []; foreach ($newItems as $item) { $day = isset($item['published']) && is_numeric($item['published']) ? date('Y-m-d', $item['published']) : date('Y-m-d'); + if ($day !== $targetDate) { + continue; + } $groupedByDay[$day][] = $item; } @@ -141,19 +143,16 @@ foreach ($groupedByDay as $day => $items) { $rssItem->addChild('link', "https://indieblog.page/$day#" . md5(json_encode($items))); $rssItem->addChild('guid', "https://indieblog.page/$day#" . md5(json_encode($items))); $rssItem->addChild('pubDate', date(DATE_RSS, strtotime($day))); - $description = ""; - addCData($rssItem->addChild('description'), $description); } @@ -169,3 +168,4 @@ function addCData(SimpleXMLElement $node, $content) $domOwner = $domNode->ownerDocument; $domNode->appendChild($domOwner->createCDATASection($content)); } +?>