2014-05-26 21:45:10 +04:00
|
|
|
<?php
|
|
|
|
/**
 * Bridge for the MSN "Actualité / Monde" (world news) listing page.
 *
 * Collects up to ten articles from the listing. Every item carries a title
 * and a URI; the plain-text content and the timestamp are added when the
 * article page itself can be fetched and contains the expected markup.
 */
class MsnMondeBridge extends BridgeAbstract{

    const MAINTAINER = "kranack";
    const NAME = 'MSN Actu Monde';
    const URI = 'http://www.msn.com/';
    const DESCRIPTION = "Returns the 10 newest posts from MSN Actualités (full text)";

    /**
     * Returns the URI of the listing page this bridge scrapes.
     *
     * @return string
     */
    public function getURI(){
        return self::URI.'fr-fr/actualite/monde';
    }

    /**
     * Fetches an article page and fills in the item's content and timestamp.
     *
     * The item is left untouched for any field whose source element cannot be
     * found (or when the page cannot be loaded at all), so one broken article
     * does not abort the whole feed with a fatal error.
     *
     * @param string $url  Article URL to download.
     * @param array  $item Item to complete; modified in place.
     * @return void
     */
    private function MsnMondeExtractContent($url, &$item) {
        $html2 = $this->getSimpleHTMLDOM($url);
        if(!$html2) {
            // NOTE(review): assumes getSimpleHTMLDOM() yields a falsy value on
            // failure, as the `or` idiom in collectData() suggests - confirm.
            return;
        }

        // Walk #content > article > section one step at a time: find() with
        // an index returns null when nothing matches.
        $container = $html2->find('#content', 0);
        $articleNode = $container ? $container->find('article', 0) : null;
        $section = $articleNode ? $articleNode->find('section', 0) : null;
        if($section) {
            $item['content'] = $section->plaintext;
        }

        $authorInfo = $html2->find('.authorinfo-txt', 0);
        $timeNode = $authorInfo ? $authorInfo->find('time', 0) : null;
        if($timeNode) {
            $timestamp = strtotime($timeNode->datetime);
            // strtotime() returns false for an unparsable or missing value.
            if($timestamp !== false) {
                $item['timestamp'] = $timestamp;
            }
        }
    }

    /**
     * Scrapes the listing page and appends up to ten items to $this->items.
     *
     * Listing entries that lack a headline or a link are skipped and do not
     * count towards the limit.
     *
     * @return void
     */
    public function collectData(){
        $html = $this->getSimpleHTMLDOM($this->getURI()) or $this->returnServerError('Could not request MsnMonde.');

        $maxItems = 10;
        $collected = 0;

        foreach($html->find('.smalla') as $article) {
            // Stop as soon as the limit is reached instead of walking the
            // remaining listing entries for nothing.
            if($collected >= $maxItems) {
                break;
            }

            $heading = $article->find('h4', 0);
            $link = $article->find('a', 0);
            if(!$heading || !$link) {
                continue;
            }

            $item = array();
            // NOTE(review): utf8_decode() is deprecated as of PHP 8.2; kept
            // here so the emitted encoding stays exactly as before.
            $item['title'] = utf8_decode($heading->innertext);
            // self::URI ends with a slash; strip the href's leading slash so a
            // root-relative link does not produce "http://www.msn.com//...".
            $item['uri'] = rtrim(self::URI, '/') . '/' . ltrim(utf8_decode($link->href), '/');

            $this->MsnMondeExtractContent($item['uri'], $item);

            $this->items[] = $item;
            $collected++;
        }
    }
}
|