2023-10-09 08:48:21 +02:00
|
|
|
<?php
|
|
|
|
|
|
|
|
class CssSelectorFeedExpanderBridge extends CssSelectorBridge
|
|
|
|
{
|
|
|
|
const MAINTAINER = 'ORelio';
|
|
|
|
const NAME = 'CSS Selector Feed Expander';
|
|
|
|
const URI = 'https://github.com/RSS-Bridge/rss-bridge/';
|
|
|
|
const DESCRIPTION = 'Expand any site RSS feed using CSS selectors (Advanced Users)';
|
|
|
|
const PARAMETERS = [
|
|
|
|
[
|
|
|
|
'feed' => [
|
|
|
|
'name' => 'Feed: URL of truncated RSS feed',
|
|
|
|
'exampleValue' => 'https://example.com/feed.xml',
|
|
|
|
'required' => true
|
|
|
|
],
|
|
|
|
'content_selector' => [
|
|
|
|
'name' => 'Selector for each article content',
|
|
|
|
'title' => <<<EOT
|
|
|
|
This bridge works using CSS selectors, e.g. "div.article" will match <div class="article">.
|
|
|
|
Everything inside that element becomes feed item content.
|
|
|
|
EOT,
|
|
|
|
'exampleValue' => 'article.content',
|
|
|
|
'required' => true
|
|
|
|
],
|
|
|
|
'content_cleanup' => [
|
|
|
|
'name' => '[Optional] Content cleanup: List of items to remove',
|
|
|
|
'title' => 'Selector for unnecessary elements to remove inside article contents.',
|
|
|
|
'exampleValue' => 'div.ads, div.comments',
|
|
|
|
],
|
|
|
|
'dont_expand_metadata' => [
|
|
|
|
'name' => '[Optional] Don\'t expand metadata',
|
|
|
|
'title' => "This bridge will attempt to fill missing fields using metadata from the webpage.\nCheck to disable.",
|
|
|
|
'type' => 'checkbox',
|
|
|
|
],
|
|
|
|
'discard_thumbnail' => [
|
|
|
|
'name' => '[Optional] Discard thumbnail set by site author',
|
|
|
|
'title' => 'Some sites set their logo as thumbnail for every article. Use this option to discard it.',
|
|
|
|
'type' => 'checkbox',
|
|
|
|
],
|
2024-01-19 21:30:53 +01:00
|
|
|
'thumbnail_as_header' => [
|
|
|
|
'name' => '[Optional] Insert thumbnail as article header',
|
|
|
|
'title' => 'Insert article main image on top of article contents.',
|
|
|
|
'type' => 'checkbox',
|
|
|
|
],
|
2023-10-09 08:48:21 +02:00
|
|
|
'limit' => self::LIMIT
|
|
|
|
]
|
|
|
|
];
|
|
|
|
|
|
|
|
public function collectData()
|
|
|
|
{
|
|
|
|
$url = $this->getInput('feed');
|
|
|
|
$content_selector = $this->getInput('content_selector');
|
|
|
|
$content_cleanup = $this->getInput('content_cleanup');
|
|
|
|
$dont_expand_metadata = $this->getInput('dont_expand_metadata');
|
|
|
|
$discard_thumbnail = $this->getInput('discard_thumbnail');
|
2024-01-19 21:30:53 +01:00
|
|
|
$thumbnail_as_header = $this->getInput('thumbnail_as_header');
|
2023-10-09 08:48:21 +02:00
|
|
|
$limit = $this->getInput('limit');
|
|
|
|
|
2023-10-16 02:58:03 +02:00
|
|
|
$feedParser = new FeedParser();
|
|
|
|
$xml = getContents($url);
|
|
|
|
$source_feed = $feedParser->parseFeed($xml);
|
2023-10-13 19:27:33 +02:00
|
|
|
$items = $source_feed['items'];
|
2023-10-12 22:14:04 +02:00
|
|
|
|
2023-10-13 19:27:33 +02:00
|
|
|
// Map Homepage URL (Default: Root page)
|
|
|
|
if (isset($source_feed['uri'])) {
|
|
|
|
$this->homepageUrl = $source_feed['uri'];
|
|
|
|
} else {
|
|
|
|
$this->homepageUrl = urljoin($url, '/');
|
|
|
|
}
|
|
|
|
|
|
|
|
// Map Feed Name (Default: Domain name)
|
|
|
|
if (isset($source_feed['title'])) {
|
|
|
|
$this->feedName = $source_feed['title'];
|
|
|
|
} else {
|
|
|
|
$this->feedName = explode('/', urljoin($url, '/'))[2];
|
|
|
|
}
|
2023-10-09 08:48:21 +02:00
|
|
|
|
2023-10-13 19:27:33 +02:00
|
|
|
// Apply item limit (Default: Global limit)
|
|
|
|
if ($limit > 0) {
|
|
|
|
$items = array_slice($items, 0, $limit);
|
|
|
|
}
|
2023-10-09 08:48:21 +02:00
|
|
|
|
2023-10-13 19:27:33 +02:00
|
|
|
// Expand feed items (CssSelectorBridge)
|
2023-10-09 08:48:21 +02:00
|
|
|
foreach ($items as $item_from_feed) {
|
|
|
|
$item_expanded = $this->expandEntryWithSelector(
|
|
|
|
$item_from_feed['uri'],
|
|
|
|
$content_selector,
|
|
|
|
$content_cleanup
|
|
|
|
);
|
|
|
|
|
|
|
|
if ($dont_expand_metadata) {
|
|
|
|
// Take feed item, only replace content from expanded data
|
|
|
|
$content = $item_expanded['content'];
|
|
|
|
$item_expanded = $item_from_feed;
|
|
|
|
$item_expanded['content'] = $content;
|
|
|
|
} else {
|
|
|
|
// Take expanded item, but give priority to metadata already in source item
|
|
|
|
foreach ($item_from_feed as $field => $val) {
|
2023-10-13 19:27:33 +02:00
|
|
|
if ($field !== 'content' && !empty($val)) {
|
2023-10-09 08:48:21 +02:00
|
|
|
$item_expanded[$field] = $val;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if ($discard_thumbnail && isset($item_expanded['enclosures'])) {
|
|
|
|
unset($item_expanded['enclosures']);
|
|
|
|
}
|
|
|
|
|
2024-01-19 21:30:53 +01:00
|
|
|
if ($thumbnail_as_header && isset($item_expanded['enclosures'][0])) {
|
|
|
|
$item_expanded['content'] = '<p><img src="'
|
|
|
|
. $item_expanded['enclosures'][0]
|
|
|
|
. '" /></p>'
|
|
|
|
. $item_expanded['content'];
|
|
|
|
}
|
|
|
|
|
2023-10-09 08:48:21 +02:00
|
|
|
$this->items[] = $item_expanded;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|