2017-12-23 15:57:40 -05:00
|
|
|
<?php
|
2022-07-01 15:10:30 +02:00
|
|
|
|
2017-12-23 15:57:40 -05:00
|
|
|
class PcGamerBridge extends BridgeAbstract
|
|
|
|
{
|
2022-07-01 15:10:30 +02:00
|
|
|
const NAME = 'PC Gamer';
|
|
|
|
const URI = 'https://www.pcgamer.com/';
|
|
|
|
const DESCRIPTION = 'PC Gamer is your source for exclusive reviews, demos,
|
2021-10-19 02:53:26 -04:00
|
|
|
updates and news on all your favorite PC gaming franchises.';
|
2022-07-01 15:10:30 +02:00
|
|
|
const MAINTAINER = 'IceWreck, mdemoss';
|
2017-12-23 15:57:40 -05:00
|
|
|
|
2022-07-01 15:10:30 +02:00
|
|
|
const PARAMETERS = [
|
|
|
|
[
|
|
|
|
'limit' => self::LIMIT,
|
|
|
|
]
|
|
|
|
];
|
2022-04-10 18:56:24 +02:00
|
|
|
|
2022-07-01 15:10:30 +02:00
|
|
|
public function collectData()
|
|
|
|
{
|
|
|
|
$html = getSimpleHTMLDOMCached($this->getURI(), 300);
|
|
|
|
$stories = $html->find('a.article-link');
|
|
|
|
$limit = $this->getInput('limit') ?? 10;
|
|
|
|
foreach (array_slice($stories, 0, $limit) as $element) {
|
|
|
|
$item = [];
|
|
|
|
$item['uri'] = $element->href;
|
|
|
|
$articleHtml = getSimpleHTMLDOMCached($item['uri']);
|
2020-02-27 02:40:09 +05:30
|
|
|
|
2022-07-01 15:10:30 +02:00
|
|
|
// Relying on meta tags ought to be more reliable.
|
|
|
|
$item['title'] = $articleHtml->find('meta[name=parsely-title]', 0)->content;
|
|
|
|
$item['content'] = html_entity_decode($articleHtml->find('meta[name=description]', 0)->content);
|
|
|
|
$item['author'] = $articleHtml->find('meta[name=parsely-author]', 0)->content;
|
2022-11-15 00:30:51 +01:00
|
|
|
|
|
|
|
$imageUrl = $articleHtml->find('meta[name=parsely-image-url]', 0);
|
|
|
|
if ($imageUrl) {
|
|
|
|
$item['enclosures'][] = $imageUrl->content;
|
|
|
|
}
|
|
|
|
|
2022-07-01 15:10:30 +02:00
|
|
|
/* I don't know why every article has two extra tags, but because
|
|
|
|
one matches another common tag, "guide," it needs to be removed. */
|
|
|
|
$item['categories'] = array_diff(
|
|
|
|
explode(',', $articleHtml->find('meta[name=parsely-tags]', 0)->content),
|
|
|
|
['van_buying_guide_progressive', 'serversidehawk']
|
|
|
|
);
|
|
|
|
$item['timestamp'] = strtotime($articleHtml->find('meta[name=pub_date]', 0)->content);
|
|
|
|
$this->items[] = $item;
|
|
|
|
}
|
|
|
|
}
|
2017-12-23 15:57:40 -05:00
|
|
|
}
|