rss-bridge/bridges/T411Bridge.php

89 lines
3.7 KiB
PHP
Raw Normal View History

2015-10-22 15:57:33 +03:00
<?php
/**
 * Bridge turning a t411 torrent search into a feed.
 *
 * The search result page only lists torrents, so every listed torrent's
 * detail page is requested as well to obtain its description and uploader.
 */
class T411Bridge extends BridgeAbstract {

    /** Maximum number of torrents turned into feed items per call. */
    const MAX_ITEMS = 10;

    /** Pause before each detail-page request, in microseconds (500 ms). */
    const REQUEST_DELAY_US = 500000;

    /** Markup the description is split on while filtering advertisement blocks. */
    const AD_BLOCK_DELIMITER = '<div class="align-center">';

    /**
     * Fills in the bridge metadata: maintainer, display name, site URI,
     * description, last update date and the single "search" parameter.
     */
    public function loadMetadatas() {
        $this->maintainer = 'ORelio';
        $this->name = 'T411 Bridge';
        $this->uri = 'https://t411.ch/';
        $this->description = 'Returns the 10 newest torrents with specified search terms <br /> Use url part after "?" mark when using their search engine.';
        $this->update = '2016-08-17';

        //JSON parameter description. The literal is kept verbatim: every
        //character between the quotes (line breaks included) is part of the string.
        $this->parameters[] =
'[
{
"name" : "Search criteria",
"identifier" : "search"
}
]';
    }

    /**
     * Returns the text located between two delimiters.
     *
     * This used to be a named function declared inside collectData(); PHP
     * registers such a function globally the first time the enclosing method
     * runs, so a second call to collectData() failed with a "cannot redeclare"
     * fatal error. As a private method it can be called any number of times.
     *
     * @param string $string Text to search in
     * @param string $start  Delimiter preceding the wanted text
     * @param string $end    Delimiter following the wanted text
     * @return string|false  Text between the first $start and the next $end,
     *                       or false when either delimiter is missing
     */
    private function extractFromDelimiters($string, $start, $end) {
        $start_pos = strpos($string, $start);
        if ($start_pos === false)
            return false;

        $section = substr($string, $start_pos + strlen($start));
        $end_pos = strpos($section, $end);
        if ($end_pos === false)
            return false; //Unterminated section: report it as not found

        return substr($section, 0, $end_pos);
    }

    /**
     * Removes advertisement blocks and the download links heading from a
     * torrent description.
     *
     * The description is split on AD_BLOCK_DELIMITER and every chunk mentioning
     * the ad provider is dropped. The delimiter is only put back in front of
     * chunks that were actually preceded by it, so the text located before the
     * first delimiter does not gain an extra, unbalanced opening div.
     *
     * @param string $description_html Raw inner HTML of the description block
     * @return string Cleaned HTML
     */
    private function cleanDescription($description_html) {
        $cleaned = '';
        foreach (explode(self::AD_BLOCK_DELIMITER, $description_html) as $index => $chunk) {
            if (strpos($chunk, 'adprovider.adlure.net') !== false)
                continue;
            $cleaned .= ($index === 0 ? '' : self::AD_BLOCK_DELIMITER).$chunk;
        }
        return preg_replace('/<h2 class="align-center">LIENS DE T..?L..?CHARGEMENT<\/h2>/i', '', $cleaned);
    }

    /**
     * Runs the search and appends up to MAX_ITEMS entries to $this->items.
     *
     * @param array $param Request parameters; $param['search'] holds the query
     *                     string copied from the site's own search URL
     */
    public function collectData(array $param) {

        //Ensure proper parameters have been provided
        if (empty($param['search'])) {
            $this->returnClientError('You must specify a search criteria');
            return; //NOTE(review): the error helpers presumably halt by themselves - confirm
        }

        //Retrieve torrent listing from search results, which does not contain torrent description
        $url = $this->uri.'torrents/search/?'.$param['search'].'&order=added&type=desc';
        $html = $this->getSimpleHTMLDOM($url);
        if (!$html) {
            $this->returnServerError('Could not request t411: '.$url);
            return;
        }

        $results = $html->find('table.results', 0);
        if (is_null($results)) {
            $this->returnServerError('No results from t411: '.$url);
            return;
        }

        //Process each item individually
        $limit = 0;
        foreach ($results->find('tr') as $element) {

            //Stop walking the table once enough items have been collected
            if ($limit >= self::MAX_ITEMS)
                break;

            //Ignore table header
            if (is_object($element->find('th', 0)))
                continue;

            //Retrieve data from the result row; a row without details link
            //cannot be resolved to a torrent page, so it is skipped before
            //spending a request (and a pause) on it
            $details_link = $element->find('a.nfo', 0);
            if (!is_object($details_link))
                continue;
            $item_id = $this->extractFromDelimiters($details_link->outertext, '?id=', '"');
            if ($item_id === false || $item_id === '')
                continue;

            $item_uri = $this->uri.'torrents/details/?id='.$item_id;
            $item_title = $this->extractFromDelimiters($element->outertext, '" title="', '"');
            $date_cell = $element->find('dd', 0);
            $item_date = is_object($date_cell) ? strtotime($date_cell->plaintext) : false;

            //Requests are rate-limited, so we need to wait before each of them
            usleep(self::REQUEST_DELAY_US);

            //Retrieve full description from torrent page
            $item_html = $this->getSimpleHTMLDOM($item_uri);
            if (!$item_html)
                continue; //Failed requests are skipped and do not count towards the limit

            //Retrieve data from page contents, tolerating missing nodes
            $description_node = $item_html->find('div.description', 0);
            $author_node = $item_html->find('a.profile', 0);
            $item_author = is_object($author_node) ? $author_node->innertext : '';

            //Cleanup advertisments
            $item_desc = is_object($description_node)
                ? $this->cleanDescription($description_node->innertext)
                : '';

            //Build and add final item
            $item = new \Item();
            $item->uri = $item_uri;
            $item->title = $item_title;
            $item->author = $item_author;
            $item->timestamp = $item_date;
            $item->content = $item_desc;
            $this->items[] = $item;
            $limit++;
        }
    }
}