2014-02-04 20:54:18 +04:00
|
|
|
<?php
|
2017-02-11 18:16:56 +03:00
|
|
|
class SexactuBridge extends BridgeAbstract {
|
2014-02-04 20:54:18 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
const MAINTAINER = 'Riduidel';
|
|
|
|
const NAME = 'Sexactu';
|
|
|
|
const URI = 'https://www.gqmagazine.fr';
|
2016-09-25 18:04:28 +03:00
|
|
|
const CACHE_TIMEOUT = 7200; // 2h
|
2017-02-11 18:16:56 +03:00
|
|
|
const DESCRIPTION = 'Sexactu via rss-bridge';
|
2015-11-05 14:20:11 +03:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
public function collectData(){
|
|
|
|
$find = array(
|
|
|
|
'janvier',
|
|
|
|
'février',
|
|
|
|
'mars',
|
|
|
|
'avril',
|
|
|
|
'mai',
|
|
|
|
'juin',
|
|
|
|
'juillet',
|
|
|
|
'août',
|
|
|
|
'septembre',
|
|
|
|
'novembre',
|
|
|
|
'décembre'
|
|
|
|
);
|
2014-02-20 11:42:40 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
$replace = array(
|
|
|
|
'January',
|
|
|
|
'February',
|
|
|
|
'March',
|
|
|
|
'April',
|
|
|
|
'May',
|
|
|
|
'June',
|
|
|
|
'July',
|
|
|
|
'August',
|
|
|
|
'September',
|
|
|
|
'October',
|
|
|
|
'November',
|
|
|
|
'December'
|
|
|
|
);
|
2014-02-18 14:55:47 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
$html = getSimpleHTMLDOM($this->getURI())
|
|
|
|
or returnServerError('Could not request ' . $this->getURI());
|
2014-02-18 14:55:47 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
foreach($html->find('.content-holder') as $contentHolder){
|
|
|
|
// only use first list as second one only contains pages numbers
|
|
|
|
$articles = $contentHolder->find('ul', 0);
|
|
|
|
foreach($articles->find('li') as $element){
|
|
|
|
// if you ask about that method_exists, there seems to be a bug in simple html dom
|
|
|
|
// see stackoverflow for more details : http://stackoverflow.com/a/10828479/15619
|
|
|
|
if(is_object($element)){
|
|
|
|
$item = array();
|
|
|
|
// various metadata
|
|
|
|
$titleBlock = $element->find('.title-holder', 0);
|
|
|
|
if(is_object($titleBlock)){
|
|
|
|
$titleDetails = $titleBlock->find('.article-title', 0);
|
|
|
|
$titleData = $titleDetails->find('h2', 0)->find('a', 0);
|
|
|
|
$titleTimestamp = $titleDetails->find('h4', 0);
|
|
|
|
$item['title'] = $this->correctCase(trim($titleData->innertext));
|
|
|
|
$item['uri'] = self::URI . $titleData->href;
|
2014-02-20 11:42:40 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
// Fugly date parsing due to the fact my DNS-323 doesn't support php intl extension
|
|
|
|
$dateText = $titleTimestamp->innertext;
|
|
|
|
$dateText = substr($dateText, strpos($dateText, ',') + 1);
|
|
|
|
$dateText = str_replace($find, $replace, strtolower($dateText));
|
|
|
|
$date = strtotime($dateText);
|
|
|
|
$item['timestamp'] = $date;
|
2016-07-08 20:06:35 +03:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
$item['author'] = 'Maïa Mazaurette';
|
|
|
|
$elementText = $element->find('.text-container', 0);
|
|
|
|
// don't forget to replace images server url with gq one
|
|
|
|
foreach($elementText->find('img') as $image){
|
|
|
|
$image->src = self::URI . $image->src;
|
|
|
|
}
|
|
|
|
$item['content'] = $elementText->innertext;
|
|
|
|
$this->items[] = $item;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-07-08 20:06:35 +03:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
public function getURI(){
|
|
|
|
return self::URI . '/sexactu';
|
|
|
|
}
|
2014-02-04 20:54:18 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
private function correctCase($str){
|
|
|
|
$sentences = explode('.', mb_strtolower($str, 'UTF-8'));
|
|
|
|
$str = '';
|
|
|
|
$sep = '';
|
|
|
|
foreach ($sentences as $sentence){
|
|
|
|
//upper case first char
|
|
|
|
$sentence = ucfirst(trim($sentence));
|
2014-02-04 20:54:18 +04:00
|
|
|
|
2017-02-11 18:16:56 +03:00
|
|
|
//append sentence to output
|
|
|
|
$str = $str . $sep . $sentence;
|
|
|
|
$sep = '. ';
|
|
|
|
}
|
|
|
|
return $str;
|
|
|
|
}
|
2014-02-04 20:54:18 +04:00
|
|
|
}
|