2022-04-08 21:13:05 +02:00
|
|
|
<?php
|
|
|
|
|
|
|
|
class FeedMergeBridge extends FeedExpander
|
|
|
|
{
|
|
|
|
const MAINTAINER = 'dvikan';
|
|
|
|
const NAME = 'FeedMerge';
|
|
|
|
const URI = 'https://github.com/RSS-Bridge/rss-bridge';
|
|
|
|
const DESCRIPTION = <<<'TEXT'
|
2025-01-03 08:17:47 +01:00
|
|
|
This bridge merges two or more feeds into a single feed. <br>
|
|
|
|
Max 10 latest items are fetched from each individual feed. <br>
|
|
|
|
Items with identical url or title are considered duplicates (and are removed). <br>
|
|
|
|
TEXT;
|
2022-04-08 21:13:05 +02:00
|
|
|
|
|
|
|
const PARAMETERS = [
|
|
|
|
[
|
|
|
|
'feed_name' => [
|
|
|
|
'name' => 'Feed name',
|
|
|
|
'type' => 'text',
|
2023-07-08 17:07:08 +02:00
|
|
|
'exampleValue' => 'FeedMerge',
|
2022-04-08 21:13:05 +02:00
|
|
|
],
|
|
|
|
'feed_1' => [
|
|
|
|
'name' => 'Feed url',
|
|
|
|
'type' => 'text',
|
|
|
|
'required' => true,
|
|
|
|
'exampleValue' => 'https://lorem-rss.herokuapp.com/feed?unit=day'
|
|
|
|
],
|
|
|
|
'feed_2' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_3' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_4' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_5' => ['name' => 'Feed url', 'type' => 'text'],
|
2022-09-08 18:44:15 +02:00
|
|
|
'feed_6' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_7' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_8' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_9' => ['name' => 'Feed url', 'type' => 'text'],
|
|
|
|
'feed_10' => ['name' => 'Feed url', 'type' => 'text'],
|
2022-06-22 18:34:05 +02:00
|
|
|
'limit' => self::LIMIT,
|
2022-04-08 21:13:05 +02:00
|
|
|
]
|
|
|
|
];
|
|
|
|
|
2022-09-08 18:44:15 +02:00
|
|
|
/**
|
2025-01-03 08:17:47 +01:00
|
|
|
* TODO: Consider a strategy which produces a shorter feed url
|
2022-09-08 18:44:15 +02:00
|
|
|
*/
|
2022-04-08 21:13:05 +02:00
|
|
|
public function collectData()
|
|
|
|
{
|
2025-01-03 08:17:47 +01:00
|
|
|
$limit = (int)($this->getInput('limit') ?: 99);
|
2022-04-08 21:13:05 +02:00
|
|
|
$feeds = [
|
|
|
|
$this->getInput('feed_1'),
|
|
|
|
$this->getInput('feed_2'),
|
|
|
|
$this->getInput('feed_3'),
|
|
|
|
$this->getInput('feed_4'),
|
|
|
|
$this->getInput('feed_5'),
|
2022-09-08 18:44:15 +02:00
|
|
|
$this->getInput('feed_6'),
|
|
|
|
$this->getInput('feed_7'),
|
|
|
|
$this->getInput('feed_8'),
|
|
|
|
$this->getInput('feed_9'),
|
|
|
|
$this->getInput('feed_10'),
|
2022-04-08 21:13:05 +02:00
|
|
|
];
|
2022-07-05 15:39:00 +02:00
|
|
|
|
2022-04-08 21:13:05 +02:00
|
|
|
// Remove empty values
|
|
|
|
$feeds = array_filter($feeds);
|
2022-07-05 15:39:00 +02:00
|
|
|
|
2022-04-08 21:13:05 +02:00
|
|
|
foreach ($feeds as $feed) {
|
2023-07-05 05:41:01 +02:00
|
|
|
if (count($feeds) > 1) {
|
|
|
|
// Allow one or more feeds to fail
|
|
|
|
try {
|
2025-01-03 08:17:47 +01:00
|
|
|
$this->collectExpandableDatas($feed, 10);
|
2023-07-05 05:41:01 +02:00
|
|
|
} catch (HttpException $e) {
|
2023-09-21 22:05:55 +02:00
|
|
|
$this->logger->warning(sprintf('Exception in FeedMergeBridge: %s', create_sane_exception_message($e)));
|
2024-04-04 19:12:04 +02:00
|
|
|
// This feed item might be spammy. Considering dropping it.
|
2023-07-05 05:41:01 +02:00
|
|
|
$this->items[] = [
|
|
|
|
'title' => 'RSS-Bridge: ' . $e->getMessage(),
|
|
|
|
// Give current time so it sorts to the top
|
|
|
|
'timestamp' => time(),
|
|
|
|
];
|
|
|
|
continue;
|
2023-07-08 23:36:36 +02:00
|
|
|
} catch (\Exception $e) {
|
2024-04-04 19:12:04 +02:00
|
|
|
if (str_starts_with($e->getMessage(), 'Failed to parse xml')) {
|
2023-07-08 23:36:36 +02:00
|
|
|
// Allow this particular exception from FeedExpander
|
2023-09-21 22:05:55 +02:00
|
|
|
$this->logger->warning(sprintf('Exception in FeedMergeBridge: %s', create_sane_exception_message($e)));
|
2023-07-08 23:36:36 +02:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
throw $e;
|
2023-07-05 05:41:01 +02:00
|
|
|
}
|
|
|
|
} else {
|
2025-01-03 08:17:47 +01:00
|
|
|
$this->collectExpandableDatas($feed, 10);
|
2023-07-05 05:41:01 +02:00
|
|
|
}
|
2022-04-08 21:13:05 +02:00
|
|
|
}
|
2022-07-05 15:39:00 +02:00
|
|
|
|
2024-04-04 19:12:04 +02:00
|
|
|
// If $this->items is empty we should consider throw exception here
|
|
|
|
|
2025-01-03 08:17:47 +01:00
|
|
|
// Sort by timestamp, uri, title in descending order
|
2022-11-08 21:17:32 +01:00
|
|
|
usort($this->items, function ($a, $b) {
|
|
|
|
$t1 = $a['timestamp'] ?? $a['uri'] ?? $a['title'];
|
|
|
|
$t2 = $b['timestamp'] ?? $b['uri'] ?? $b['title'];
|
|
|
|
return $t2 <=> $t1;
|
|
|
|
});
|
2022-07-05 15:39:00 +02:00
|
|
|
|
2025-01-03 08:17:47 +01:00
|
|
|
// Remove duplicates by url
|
2022-07-05 15:39:00 +02:00
|
|
|
$items = [];
|
|
|
|
foreach ($this->items as $item) {
|
2025-01-03 08:17:47 +01:00
|
|
|
$uri = $item['uri'] ?? null;
|
|
|
|
if ($uri) {
|
|
|
|
// Insert or override the existing duplicate
|
|
|
|
$items[$uri] = $item;
|
2022-07-05 15:39:00 +02:00
|
|
|
} else {
|
2025-01-03 08:17:47 +01:00
|
|
|
// The item doesn't have a uri!
|
2022-07-05 15:39:00 +02:00
|
|
|
$items[] = $item;
|
|
|
|
}
|
|
|
|
}
|
2025-01-03 08:17:47 +01:00
|
|
|
$this->items = array_values($items);
|
|
|
|
|
|
|
|
// Remove duplicates by title
|
|
|
|
$items = [];
|
|
|
|
foreach ($this->items as $item) {
|
|
|
|
$title = $item['title'] ?? null;
|
|
|
|
if ($title) {
|
|
|
|
// Insert or override the existing duplicate
|
|
|
|
$items[$title] = $item;
|
|
|
|
} else {
|
|
|
|
// The item doesn't have a title!
|
|
|
|
$items[] = $item;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
$this->items = array_values($items);
|
|
|
|
|
|
|
|
$this->items = array_slice($this->items, 0, $limit);
|
2022-04-08 21:13:05 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public function getIcon()
|
|
|
|
{
|
|
|
|
return 'https://cdn.jsdelivr.net/npm/famfamfam-silk@1.0.0/dist/png/folder_feed.png';
|
|
|
|
}
|
|
|
|
|
|
|
|
public function getName()
|
|
|
|
{
|
2023-07-08 17:07:08 +02:00
|
|
|
return $this->getInput('feed_name') ?: 'FeedMerge';
|
2022-04-08 21:13:05 +02:00
|
|
|
}
|
|
|
|
}
|