mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2025-08-01 14:20:16 +02:00
[CourrierInternationalBridge] fix content parsing
Signed-off-by: Pierre Mazière <pierre.maziere@gmx.com>
This commit is contained in:
@@ -25,14 +25,20 @@ class CourrierInternationalBridge extends BridgeAbstract{
|
||||
$item['uri'] = self::URI.$item['uri'];
|
||||
}
|
||||
|
||||
$page = $this->getSimpleHTMLDOM($item['uri']);
|
||||
|
||||
$page = $this->getSimpleHTMLDOMCached($item['uri']);
|
||||
|
||||
$cleaner = new HTMLSanitizer();
|
||||
|
||||
$item['content'] = $cleaner->sanitize($page->find("div.article-text")[0]);
|
||||
$item['title'] = strip_tags($article->find(".title")[0]);
|
||||
$content = $page->find('.article-text',0);
|
||||
if(!$content){
|
||||
$content = $page->find('.depeche-text',0);
|
||||
}
|
||||
|
||||
$dateTime = date_parse($page->find("time")[0]);
|
||||
$item['content'] = $cleaner->sanitize($content);
|
||||
$item['title'] = strip_tags($article->find(".title",0));
|
||||
|
||||
$dateTime = date_parse($page->find("time",0));
|
||||
|
||||
$item['timestamp'] = mktime(
|
||||
$dateTime['hour'],
|
||||
|
Reference in New Issue
Block a user