mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2025-01-18 06:38:19 +01:00
6f24858124
This commit is a squash of all commits that fix coding styles for the new coding style policy. [ABCTabsBridge] Fix coding style [AcrimedBridge] Fix coding style [AllocineFRBridge] Fix coding style [AnimeUltimeBridge] Fix coding style [Arte7Bridge] Fix coding style [AskfmBridge] Fix coding style [BandcampBridge] Fix coding style [BastaBridge] Fix coding style [BlaguesDeMerdeBridge] Fix coding style [BooruprojectBridge] Fix coding style [CADBridge] Fix coding style [CNETBridge] Fix coding style [CastorusBridge] Fix coding style [CollegeDeFranceBridge] Fix coding style [CommonDreamsBridge] Fix coding style [CopieDoubleBridge] Fix coding style [CourrierInternationalBridge] Fix coding style [CpasbienBridge] Fix coding style [CryptomeBridge] Fix coding style [DailymotionBridge] Fix coding style [DanbooruBridge] Fix coding style [DansTonChatBridge] Fix coding style [DauphineLibereBridge] Fix coding style [DeveloppezDotComBridge] Fix coding style [DemoBridge] Fix coding style [DilbertBridge] Fix coding style [DuckDuckGoBridge] Fix coding style [DollbooruBridge] Fix coding style [EliteDangerousGalnetBridge] Fix coding style [ElsevierBridge] Fix coding style [EstCeQuonMetEnProdBridge] Fix coding style [EZTVBridge] Fix coding style [FacebookBridge] Fix coding style [FeedExpanderExampleBridge] Fix coding style [FB2Bridge] Fix coding style [FierPandaBridge] Fix coding style [FlickrBridge] Fix coding style [FootitoBridge] Fix coding style [FourchanBridge] Fix coding style [FuturaSciencesBridge] Fix coding style [GBAtempBridge] Fix coding style [GelbooruBridge] Fix coding style [GiphyBridge] Fix coding style [GithubIssueBridge] Fix coding style [GizmodoBridge] Fix coding style [GoComicsBridge] Fix coding style [GooglePlusPostBridge] Fix coding style [GoogleSearchBridge] Fix coding style [HDWallpapersBridge] Fix coding style [HentaiHavenBridge] Fix coding style [IdenticaBridge] Fix coding style [InstagramBridge] Fix coding style [IsoHuntBridge] Fix coding style [JapanExpoBridge] Fix coding style [KonachanBridge] Fix coding style [KoreusBridge] Fix coding style [KununuBridge] Fix coding style [LeBonCoinBridge] Fix coding style [LegifranceJOBBridge] Fix coding style [LeMondeInformatiqueBridge] Fix coding style [LesJoiesDuCodeBridge] Fix coding style [LichessBridge] Fix coding style [LinkedInCompanyBridge] Fix coding style [LolibooruBridge] Fix coding style [LWNprevBridge] Fix coding style [MangareaderBridge] Fix coding style [MilbooruBridge] Fix coding style [MixCloudBridge] Fix coding style [MoebooruBridge] Fix coding style [MondeDiploBridge] Fix coding style [MsnMondeBridge] Fix coding style [MspabooruBridge] Fix coding style [NasaApodBridge] Fix coding style [NeuviemeArtBridge] Fix coding style [NextgovBridge] Fix coding style [NextInpactBridge] Fix coding style [NiceMatinBridge] Fix coding style [NovelUpdatesBridge] Fix coding style [OpenClassroomsBridge] Fix coding style [ParuVenduImmoBridge] Fix coding style [PickyWallpapersBridge] Fix coding style [PinterestBridge] Fix coding style [PlanetLibreBridge] Fix coding style [ReadComicsBridge] Fix coding style [Releases3DSBridge] Fix coding style [ReporterreBridge] Fix coding style [RTBFBridge] Fix coding style [Rue89Bridge] Fix coding style [Rule34Bridge] Fix coding style [Rule34pahealBridge] Fix coding style [SafebooruBridge] Fix coding style [SakugabooruBridge] Fix coding style [ScmbBridge] Fix coding style [ScoopItBridge] Fix coding style [SensCritiqueBridge] Fix coding style [SexactuBridge] Fix coding style [ShanaprojectBridge] Fix coding style [Shimmie2Bridge] Fix coding style [SoundcloudBridge] Fix coding style [StripeAPIChangeLogBridge] Fix coding style [SuperbWallpapersBridge] Fix coding style [T411Bridge] Fix coding style [TagBoardBridge] Fix coding style [TbibBridge] Fix coding style [TheCodingLoveBridge] Fix coding style [TheHackerNewsBridge] Fix coding style [ThePirateBayBridge] Fix coding style [TheTVDBBridge] Fix coding style [Torrent9Bridge] Fix coding style [TwitterBridge] Fix coding style [UnsplashBridge] Fix coding style [ViadeoCompanyBridge] Fix coding style [VineBridge] Fix coding style [VkBridge] Fix coding style [WallpaperStopBridge] Fix coding style [WebfailBridge] Fix coding style [WeLiveSecurityBridge] Fix coding style [WhydBridge] Fix coding style [WikipediaBridge] Fix coding style [WordPressBridge] Fix coding style [WorldOfTanksBridge] Fix coding style [XbooruBridge] Fix coding style [YandereBridge] Fix coding style [YoutubeBridge] Fix coding style [ZDNetBridge] Fix coding style
303 lines
8.4 KiB
PHP
303 lines
8.4 KiB
PHP
<?php
|
|
|
|
define('WIKIPEDIA_SUBJECT_TFA', 0); // Today's featured article
|
|
define('WIKIPEDIA_SUBJECT_DYK', 1); // Did you know...
|
|
|
|
class WikipediaBridge extends BridgeAbstract {
|
|
const MAINTAINER = 'logmanoriginal';
|
|
const NAME = 'Wikipedia bridge for many languages';
|
|
const URI = 'https://www.wikipedia.org/';
|
|
const DESCRIPTION = 'Returns articles for a language of your choice';
|
|
|
|
const PARAMETERS = array( array(
|
|
'language' => array(
|
|
'name' => 'Language',
|
|
'type' => 'list',
|
|
'required' => true,
|
|
'title' => 'Select your language',
|
|
'exampleValue' => 'English',
|
|
'values' => array(
|
|
'English' => 'en',
|
|
'Dutch' => 'nl',
|
|
'Esperanto' => 'eo',
|
|
'French' => 'fr',
|
|
'German' => 'de',
|
|
)
|
|
),
|
|
'subject' => array(
|
|
'name' => 'Subject',
|
|
'type' => 'list',
|
|
'required' => true,
|
|
'title' => 'What subject are you interested in?',
|
|
'exampleValue' => 'Today\'s featured article',
|
|
'values' => array(
|
|
'Today\'s featured article' => 'tfa',
|
|
'Did you know…' => 'dyk'
|
|
)
|
|
),
|
|
'fullarticle' => array(
|
|
'name' => 'Load full article',
|
|
'type' => 'checkbox',
|
|
'title' => 'Activate to always load the full article'
|
|
)
|
|
));
|
|
|
|
public function getURI(){
|
|
return 'https://'
|
|
. strtolower($this->getInput('language'))
|
|
. '.wikipedia.org';
|
|
}
|
|
|
|
public function getName(){
|
|
switch($this->getInput('subject')){
|
|
case 'tfa':
|
|
$subject = WIKIPEDIA_SUBJECT_TFA;
|
|
break;
|
|
case 'dyk':
|
|
$subject = WIKIPEDIA_SUBJECT_DYK;
|
|
break;
|
|
default:
|
|
$subject = WIKIPEDIA_SUBJECT_TFA;
|
|
break;
|
|
}
|
|
|
|
switch($subject){
|
|
case WIKIPEDIA_SUBJECT_TFA:
|
|
$name = 'Today\'s featured article from '
|
|
. strtolower($this->getInput('language'))
|
|
. '.wikipedia.org';
|
|
break;
|
|
case WIKIPEDIA_SUBJECT_DYK:
|
|
$name = 'Did you know? - articles from '
|
|
. strtolower($this->getInput('language'))
|
|
. '.wikipedia.org';
|
|
break;
|
|
default:
|
|
$name = 'Articles from '
|
|
. strtolower($this->getInput('language'))
|
|
. '.wikipedia.org';
|
|
break;
|
|
}
|
|
return $name;
|
|
}
|
|
|
|
public function collectData(){
|
|
|
|
switch($this->getInput('subject')){
|
|
case 'tfa':
|
|
$subject = WIKIPEDIA_SUBJECT_TFA;
|
|
break;
|
|
case 'dyk':
|
|
$subject = WIKIPEDIA_SUBJECT_DYK;
|
|
break;
|
|
default:
|
|
$subject = WIKIPEDIA_SUBJECT_TFA;
|
|
break;
|
|
}
|
|
|
|
$fullArticle = $this->getInput('fullarticle');
|
|
|
|
// This will automatically send us to the correct main page in any language (try it!)
|
|
$html = getSimpleHTMLDOM($this->getURI() . '/wiki');
|
|
|
|
if(!$html)
|
|
returnServerError('Could not load site: ' . $this->getURI() . '!');
|
|
|
|
/*
|
|
* Now read content depending on the language (make sure to create one function per language!)
|
|
* We build the function name automatically, just make sure you create a private function ending
|
|
* with your desired language code, where the language code is upper case! (en -> getContentsEN).
|
|
*/
|
|
$function = 'getContents' . ucfirst(strtolower($this->getInput('language')));
|
|
|
|
if(!method_exists($this, $function))
|
|
returnServerError('A function to get the contents for your language is missing (\'' . $function . '\')!');
|
|
|
|
/*
|
|
* The method takes care of creating all items.
|
|
*/
|
|
$this->$function($html, $subject, $fullArticle);
|
|
}
|
|
|
|
/**
|
|
* Replaces all relative URIs with absolute ones
|
|
* @param $element A simplehtmldom element
|
|
* @return The $element->innertext with all URIs replaced
|
|
*/
|
|
private function replaceUriInHtmlElement($element){
|
|
return str_replace('href="/', 'href="' . $this->getURI() . '/', $element->innertext);
|
|
}
|
|
|
|
/*
|
|
* Adds a new item to $items using a generic operation (should work for most
|
|
* (all?) wikis) $anchorText can be specified if the wiki in question doesn't
|
|
* use '...' (like Dutch, French and Italian) $anchorFallbackIndex can be
|
|
* used to specify a different fallback link than the first
|
|
* (e.g., -1 for the last)
|
|
*/
|
|
private function addTodaysFeaturedArticleGeneric($element
|
|
, $fullArticle
|
|
, $anchorText = '...'
|
|
, $anchorFallbackIndex = 0){
|
|
// Clean the bottom of the featured article
|
|
if ($element->find('div', -1))
|
|
$element->find('div', -1)->outertext = '';
|
|
|
|
// The title and URI of the article can be found in an anchor containing
|
|
// the string '...' in most wikis ('full article ...')
|
|
$target = $element->find('p/a', $anchorFallbackIndex);
|
|
foreach($element->find('//a') as $anchor){
|
|
if(strpos($anchor->innertext, $anchorText) !== false){
|
|
$target = $anchor;
|
|
break;
|
|
}
|
|
}
|
|
|
|
$item = array();
|
|
$item['uri'] = $this->getURI() . $target->href;
|
|
$item['title'] = $target->title;
|
|
|
|
if(!$fullArticle)
|
|
$item['content'] = strip_tags($this->replaceUriInHtmlElement($element), '<a><p><br><img>');
|
|
else
|
|
$item['content'] = $this->loadFullArticle($item['uri']);
|
|
|
|
$this->items[] = $item;
|
|
}
|
|
|
|
/*
|
|
* Adds a new item to $items using a generic operation (should work for most (all?) wikis)
|
|
*/
|
|
private function addDidYouKnowGeneric($element, $fullArticle){
|
|
foreach($element->find('ul', 0)->find('li') as $entry){
|
|
$item = array();
|
|
|
|
// We can only use the first anchor, there is no way of finding the 'correct' one if there are multiple
|
|
$item['uri'] = $this->getURI() . $entry->find('a', 0)->href;
|
|
$item['title'] = strip_tags($entry->innertext);
|
|
|
|
if(!$fullArticle)
|
|
$item['content'] = $this->replaceUriInHtmlElement($entry);
|
|
else
|
|
$item['content'] = $this->loadFullArticle($item['uri']);
|
|
|
|
$this->items[] = $item;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Loads the full article from a given URI
|
|
*/
|
|
private function loadFullArticle($uri){
|
|
$content_html = getSimpleHTMLDOMCached($uri);
|
|
|
|
if(!$content_html)
|
|
returnServerError('Could not load site: ' . $uri . '!');
|
|
|
|
$content = $content_html->find('#mw-content-text', 0);
|
|
|
|
if(!$content)
|
|
returnServerError('Could not find content in page: ' . $uri . '!');
|
|
|
|
// Let's remove a couple of things from the article
|
|
$table = $content->find('#toc', 0); // Table of contents
|
|
if(!$table === false)
|
|
$table->outertext = '';
|
|
|
|
foreach($content->find('ol.references') as $reference) // References
|
|
$reference->outertext = '';
|
|
|
|
return str_replace('href="/', 'href="' . $this->getURI() . '/', $content->innertext);
|
|
}
|
|
|
|
/**
|
|
* Implementation for de.wikipedia.org
|
|
*/
|
|
private function getContentsDe($html, $subject, $fullArticle){
|
|
switch($subject){
|
|
case WIKIPEDIA_SUBJECT_TFA:
|
|
$element = $html->find('div[id=mf-tfa]', 0);
|
|
$this->addTodaysFeaturedArticleGeneric($element, $fullArticle);
|
|
break;
|
|
case WIKIPEDIA_SUBJECT_DYK:
|
|
$element = $html->find('div[id=mf-dyk]', 0);
|
|
$this->addDidYouKnowGeneric($element, $fullArticle);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Implementation for fr.wikipedia.org
|
|
*/
|
|
private function getContentsFr($html, $subject, $fullArticle){
|
|
switch($subject){
|
|
case WIKIPEDIA_SUBJECT_TFA:
|
|
$element = $html->find('div[id=accueil-lumieresur]', 0);
|
|
$this->addTodaysFeaturedArticleGeneric($element, $fullArticle, 'Lire la suite');
|
|
break;
|
|
case WIKIPEDIA_SUBJECT_DYK:
|
|
$element = $html->find('div[id=SaviezVous]', 0);
|
|
$this->addDidYouKnowGeneric($element, $fullArticle);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Implementation for en.wikipedia.org
|
|
*/
|
|
private function getContentsEn($html, $subject, $fullArticle){
|
|
switch($subject){
|
|
case WIKIPEDIA_SUBJECT_TFA:
|
|
$element = $html->find('div[id=mp-tfa]', 0);
|
|
$this->addTodaysFeaturedArticleGeneric($element, $fullArticle);
|
|
break;
|
|
case WIKIPEDIA_SUBJECT_DYK:
|
|
$element = $html->find('div[id=mp-dyk]', 0);
|
|
$this->addDidYouKnowGeneric($element, $fullArticle);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Implementation for eo.wikipedia.org
|
|
*/
|
|
private function getContentsEo($html, $subject, $fullArticle){
|
|
switch($subject){
|
|
case WIKIPEDIA_SUBJECT_TFA:
|
|
$element = $html->find('div[id=mf-artikolo-de-la-semajno]', 0);
|
|
$this->addTodaysFeaturedArticleGeneric($element, $fullArticle);
|
|
break;
|
|
case WIKIPEDIA_SUBJECT_DYK:
|
|
$element = $html->find('div[id=mw-content-text]', 0)->find('table', 4)->find('td', 4);
|
|
$this->addDidYouKnowGeneric($element, $fullArticle);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Implementation for nl.wikipedia.org
|
|
*/
|
|
private function getContentsNl($html, $subject, $fullArticle){
|
|
switch($subject){
|
|
case WIKIPEDIA_SUBJECT_TFA:
|
|
$element = $html->find('div[id=mf-uitgelicht]', 0);
|
|
$this->addTodaysFeaturedArticleGeneric($element, $fullArticle, 'Lees meer');
|
|
break;
|
|
case WIKIPEDIA_SUBJECT_DYK:
|
|
$element = $html->find('div[id=mw-content-text]', 0)->find('table', 4)->find('td', 2);
|
|
$this->addDidYouKnowGeneric($element, $fullArticle);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
}
|