2017-03-19 14:07:25 +01:00
|
|
|
<?php
|
2022-07-01 15:10:30 +02:00
|
|
|
|
2017-03-19 14:07:25 +01:00
|
|
|
/**
 * Bridge for Usbek & Rica (https://usbeketrica.com).
 *
 * Collects the <article> cards found on the page returned by getURI() and
 * turns each of them into a feed item (title, author, uri, content and an
 * optional image enclosure). When the "fullarticle" option is enabled the
 * linked article page is fetched and its body is used as item content,
 * falling back to the card excerpt if no body could be extracted.
 */
class UsbekEtRicaBridge extends BridgeAbstract
{
    const MAINTAINER = 'logmanoriginal';
    const NAME = 'Usbek & Rica Bridge';
    const URI = 'https://usbeketrica.com';
    const DESCRIPTION = 'Returns latest articles from the front page';

    const PARAMETERS = [
        [
            'limit' => [
                'name' => 'Number of articles to return',
                'type' => 'number',
                'required' => false,
                'title' => 'Specifies the maximum number of articles to return',
                'defaultValue' => -1
            ],
            'fullarticle' => [
                'name' => 'Load full article',
                'type' => 'checkbox',
                'required' => false,
                'title' => 'Activate to load full articles',
            ]
        ]
    ];

    /**
     * Scrapes the article cards and appends one entry per card to $this->items.
     *
     * Cards without an <h2> title are skipped. A "limit" input that is not
     * greater than zero (the default is -1) means "no limit".
     */
    public function collectData()
    {
        $limit = $this->getInput('limit');
        $fullarticle = $this->getInput('fullarticle');
        $html = getSimpleHTMLDOM($this->getURI());

        foreach ($html->find('article') as $article) {
            $title = $article->find('h2', 0);
            if (!$title) {
                // Sometimes we get rubbish, ignore.
                continue;
            }

            $item = [];
            $item['title'] = $title->plaintext;

            $author = $article->find('div.author span', 0);
            if ($author) {
                $item['author'] = $author->plaintext;
            }

            $content = null;

            // Only use the card link when it actually carries a target;
            // an absent/empty href must not turn into the bare site URI.
            $link = $article->find('a.card-img', 0);
            $href = $link ? trim((string) $link->href) : '';
            if ($href !== '') {
                $item['uri'] = $this->toAbsoluteUri($href);

                if ($fullarticle) {
                    $content = $this->loadFullArticle($item['uri']);
                }
            }

            // $content is only ever set when full articles were requested,
            // so a truthy value is enough to prefer it over the excerpt.
            if ($content) {
                $item['content'] = $content;
            } else {
                $excerpt = $article->find('div.card-excerpt', 0);
                if ($excerpt) {
                    $item['content'] = $excerpt->plaintext;
                }
            }

            // Skip images without a usable src instead of emitting an
            // empty enclosure entry.
            $image = $article->find('div.card-img img', 0);
            $src = $image ? trim((string) $image->src) : '';
            if ($src !== '') {
                $item['enclosures'] = [
                    $this->toAbsoluteUri($src)
                ];
            }

            $this->items[] = $item;

            if ($limit > 0 && count($this->items) >= $limit) {
                break;
            }
        }
    }

    /**
     * Turns a link taken from the page into an absolute URI.
     *
     * - URIs that already carry a scheme ("https://...", "mailto:...") are
     *   returned unchanged.
     * - Protocol-relative URIs ("//host/path") get the scheme of getURI().
     * - Everything else is appended to getURI() with exactly one slash in
     *   between. Paths without a leading slash are resolved against the
     *   site root, not against the current page.
     *
     * @param string $uri The URI as found in the document
     * @return string The absolute URI
     */
    private function toAbsoluteUri($uri)
    {
        $uri = trim((string) $uri);

        // Scheme syntax per RFC 3986: ALPHA *( ALPHA / DIGIT / "+" / "-" / "." ) ":"
        if (preg_match('#^[a-z][a-z0-9+.\-]*:#i', $uri) === 1) {
            return $uri;
        }

        $base = $this->getURI();

        if (substr($uri, 0, 2) === '//') {
            $scheme = parse_url($base, PHP_URL_SCHEME);
            return ($scheme ? $scheme : 'https') . ':' . $uri;
        }

        return rtrim($base, '/') . '/' . ltrim($uri, '/');
    }

    /**
     * Loads the full article and returns the contents
     *
     * The article body is taken from the second "div.rich-text" element
     * (index 1) of the fetched page.
     *
     * @param string $uri The article URI
     * @return string|null The article content, or null if it could not be
     * extracted
     */
    private function loadFullArticle($uri)
    {
        $html = getSimpleHTMLDOMCached($uri);

        // NOTE(review): guards against the helper yielding a falsy value
        // instead of a DOM object - confirm its failure contract. Returning
        // null lets the caller fall back to the card excerpt.
        if (!$html) {
            return null;
        }

        $content = $html->find('div.rich-text', 1);
        if ($content) {
            return $this->replaceUriInHtmlElement($content);
        }

        return null;
    }

    /**
     * Replaces root-relative URIs with absolute ones
     *
     * Rewrites href="/..." and src="/..." attribute values so they start
     * with getURI(). Protocol-relative values ("//host/...") are already
     * host-qualified and therefore left untouched.
     *
     * @param object $element A simplehtmldom element
     * @return string The $element->innertext with the URIs replaced
     */
    private function replaceUriInHtmlElement($element)
    {
        $base = rtrim($this->getURI(), '/');
        $markup = $element->innertext;

        // A callback is used so that $base is inserted literally, without
        // being interpreted as a replacement pattern.
        $rewritten = preg_replace_callback(
            '#\b(href|src)="/(?!/)#i',
            function ($match) use ($base) {
                return $match[1] . '="' . $base . '/';
            },
            $markup
        );

        // preg_replace_callback() returns null on a PCRE error; keep the
        // original markup in that case rather than dropping the content.
        return $rewritten === null ? $markup : $rewritten;
    }
}
|