2014-05-26 21:45:10 +04:00
|
|
|
<?php
|
|
|
|
class MsnMondeBridge extends BridgeAbstract{
|
|
|
|
|
2015-11-04 12:47:21 +03:00
|
|
|
public function loadMetadatas() {
|
|
|
|
|
|
|
|
$this->maintainer = "kranack";
|
|
|
|
$this->name = "MSN Actu Monde";
|
|
|
|
$this->uri = "http://www.msn.com/fr-fr/actualite/monde";
|
|
|
|
$this->description = "Returns the 10 newest posts from MSN Actualités (full text)";
|
|
|
|
$this->update = "2015-01-30";
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2014-05-26 21:45:10 +04:00
|
|
|
public function collectData(array $param){
|
|
|
|
|
2015-01-30 18:05:28 +03:00
|
|
|
function MsnMondeExtractContent($url, &$item) {
|
2016-06-26 00:17:42 +03:00
|
|
|
$html2 = $this->file_get_html($url);
|
2015-01-30 18:05:28 +03:00
|
|
|
$item->content = $html2->find('#content', 0)->find('article', 0)->find('section', 0)->plaintext;
|
|
|
|
$item->timestamp = strtotime($html2->find('.authorinfo-txt', 0)->find('time', 0)->datetime);
|
2014-05-26 21:45:10 +04:00
|
|
|
}
|
|
|
|
|
2016-06-26 00:17:42 +03:00
|
|
|
$html = $this->file_get_html('http://www.msn.com/fr-fr/actualite/monde') or $this->returnError('Could not request MsnMonde.', 404);
|
2015-01-30 18:05:28 +03:00
|
|
|
$limit = 0;
|
|
|
|
foreach($html->find('.smalla') as $article) {
|
|
|
|
if($limit < 10) {
|
2014-05-26 21:45:10 +04:00
|
|
|
$item = new \Item();
|
2015-01-30 18:05:28 +03:00
|
|
|
$item->title = utf8_decode($article->find('h4', 0)->innertext);
|
|
|
|
$item->uri = "http://www.msn.com" . utf8_decode($article->find('a', 0)->href);
|
|
|
|
MsnMondeExtractContent($item->uri, $item);
|
2014-05-26 21:45:10 +04:00
|
|
|
$this->items[] = $item;
|
|
|
|
$limit++;
|
2015-01-30 18:05:28 +03:00
|
|
|
}
|
|
|
|
}
|
2014-05-26 21:45:10 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
public function getName(){
|
|
|
|
return 'MSN Actu Monde';
|
|
|
|
}
|
|
|
|
|
|
|
|
public function getURI(){
|
2015-01-30 18:05:28 +03:00
|
|
|
return 'http://www.msn.com/fr-fr/actualite/monde';
|
2014-05-26 21:45:10 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
public function getCacheDuration(){
|
|
|
|
return 3600; // 1 hour
|
|
|
|
}
|
|
|
|
}
|