mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2024-12-18 08:54:20 +03:00
37cb4091d4
When fetching website contents, exceptions already raise on fetching error
217 lines
6.5 KiB
PHP
217 lines
6.5 KiB
PHP
<?php
|
|
class AnidexBridge extends BridgeAbstract {
|
|
|
|
const MAINTAINER = 'ORelio';
|
|
const NAME = 'Anidex';
|
|
const URI = 'http://anidex.info/'; // anidex.info has ddos-guard so we need to use anidex.moe
|
|
const ALTERNATE_URI = 'https://anidex.moe/'; // anidex.moe returns 301 unless Host is set to anidex.info
|
|
const ALTERNATE_HOST = 'anidex.info'; // Correct host for requesting anidex.moe without 301 redirect
|
|
const DESCRIPTION = 'Returns the newest torrents, with optional search criteria.';
|
|
const PARAMETERS = array(
|
|
array(
|
|
'id' => array(
|
|
'name' => 'Category',
|
|
'type' => 'list',
|
|
'values' => array(
|
|
'All categories' => '0',
|
|
'Anime' => '1,2,3',
|
|
'Anime - Sub' => '1',
|
|
'Anime - Raw' => '2',
|
|
'Anime - Dub' => '3',
|
|
'Live Action' => '4,5',
|
|
'Live Action - Sub' => '4',
|
|
'Live Action - Raw' => '5',
|
|
'Light Novel' => '6',
|
|
'Manga' => '7,8',
|
|
'Manga - Translated' => '7',
|
|
'Manga - Raw' => '8',
|
|
'Music' => '9,10,11',
|
|
'Music - Lossy' => '9',
|
|
'Music - Lossless' => '10',
|
|
'Music - Video' => '11',
|
|
'Games' => '12',
|
|
'Applications' => '13',
|
|
'Pictures' => '14',
|
|
'Adult Video' => '15',
|
|
'Other' => '16'
|
|
)
|
|
),
|
|
'lang_id' => array(
|
|
'name' => 'Language',
|
|
'type' => 'list',
|
|
'values' => array(
|
|
'All languages' => '0',
|
|
'English' => '1',
|
|
'Japanese' => '2',
|
|
'Polish' => '3',
|
|
'Serbo-Croatian' => '4',
|
|
'Dutch' => '5',
|
|
'Italian' => '6',
|
|
'Russian' => '7',
|
|
'German' => '8',
|
|
'Hungarian' => '9',
|
|
'French' => '10',
|
|
'Finnish' => '11',
|
|
'Vietnamese' => '12',
|
|
'Greek' => '13',
|
|
'Bulgarian' => '14',
|
|
'Spanish (Spain)' => '15',
|
|
'Portuguese (Brazil)' => '16',
|
|
'Portuguese (Portugal)' => '17',
|
|
'Swedish' => '18',
|
|
'Arabic' => '19',
|
|
'Danish' => '20',
|
|
'Chinese (Simplified)' => '21',
|
|
'Bengali' => '22',
|
|
'Romanian' => '23',
|
|
'Czech' => '24',
|
|
'Mongolian' => '25',
|
|
'Turkish' => '26',
|
|
'Indonesian' => '27',
|
|
'Korean' => '28',
|
|
'Spanish (LATAM)' => '29',
|
|
'Persian' => '30',
|
|
'Malaysian' => '31'
|
|
)
|
|
),
|
|
'group_id' => array(
|
|
'name' => 'Group ID',
|
|
'type' => 'number'
|
|
),
|
|
'r' => array(
|
|
'name' => 'Hide Remakes',
|
|
'type' => 'checkbox'
|
|
),
|
|
'b' => array(
|
|
'name' => 'Only Batches',
|
|
'type' => 'checkbox'
|
|
),
|
|
'a' => array(
|
|
'name' => 'Only Authorized',
|
|
'type' => 'checkbox'
|
|
),
|
|
'q' => array(
|
|
'name' => 'Keyword',
|
|
'description' => 'Keyword(s)',
|
|
'type' => 'text'
|
|
),
|
|
'h' => array(
|
|
'name' => 'Adult content',
|
|
'type' => 'list',
|
|
'values' => array(
|
|
'No filter' => '0',
|
|
'Hide +18' => '1',
|
|
'Only +18' => '2'
|
|
)
|
|
)
|
|
)
|
|
);
|
|
|
|
public function collectData() {
|
|
|
|
// Build Search URL from user-provided parameters
|
|
$search_url = self::ALTERNATE_URI . '?s=upload_timestamp&o=desc';
|
|
foreach (array('id', 'lang_id', 'group_id') as $param_name) {
|
|
$param = $this->getInput($param_name);
|
|
if (!empty($param) && intval($param) != 0 && ctype_digit(str_replace(',', '', $param))) {
|
|
$search_url .= '&' . $param_name . '=' . $param;
|
|
}
|
|
}
|
|
foreach (array('r', 'b', 'a') as $param_name) {
|
|
$param = $this->getInput($param_name);
|
|
if (!empty($param) && boolval($param)) {
|
|
$search_url .= '&' . $param_name . '=1';
|
|
}
|
|
}
|
|
$query = $this->getInput('q');
|
|
if (!empty($query)) {
|
|
$search_url .= '&q=' . urlencode($query);
|
|
}
|
|
$opt = array();
|
|
$h = $this->getInput('h');
|
|
if (!empty($h) && intval($h) != 0 && ctype_digit($h)) {
|
|
$opt[CURLOPT_COOKIE] = 'anidex_h_toggle=' . $h;
|
|
}
|
|
|
|
// We need to use a different Host HTTP header to reach the correct page on ALTERNATE_URI
|
|
$headers = array('Host: ' . self::ALTERNATE_HOST);
|
|
|
|
// The HTTPS certificate presented by anidex.moe is for anidex.info. We need to ignore this.
|
|
// As a consequence, the bridge is intentionally marked as insecure by setting self::URI to http://
|
|
$opt[CURLOPT_SSL_VERIFYHOST] = 0;
|
|
$opt[CURLOPT_SSL_VERIFYPEER] = 0;
|
|
|
|
// Retrieve torrent listing from search results, which does not contain torrent description
|
|
$html = getSimpleHTMLDOM($search_url, $headers, $opt);
|
|
$links = $html->find('a');
|
|
$results = array();
|
|
foreach ($links as $link)
|
|
if (strpos($link->href, '/torrent/') === 0 && !in_array($link->href, $results))
|
|
$results[] = $link->href;
|
|
if (empty($results) && empty($this->getInput('q')))
|
|
returnServerError('No results from Anidex: ' . $search_url);
|
|
|
|
//Process each item individually
|
|
foreach ($results as $element) {
|
|
|
|
//Limit total amount of requests
|
|
if(count($this->items) >= 20) {
|
|
break;
|
|
}
|
|
|
|
$torrent_id = str_replace('/torrent/', '', $element);
|
|
|
|
//Ignore entries without valid torrent ID
|
|
if ($torrent_id != 0 && ctype_digit($torrent_id)) {
|
|
|
|
//Retrieve data for this torrent ID
|
|
$item_browse_uri = self::URI . 'torrent/' . $torrent_id;
|
|
$item_fetch_uri = self::ALTERNATE_URI . 'torrent/' . $torrent_id;
|
|
|
|
//Retrieve full description from torrent page (cached for 24 hours: 86400 seconds)
|
|
if ($item_html = getSimpleHTMLDOMCached($item_fetch_uri, 86400, $headers, $opt)) {
|
|
|
|
//Retrieve data from page contents
|
|
$item_title = str_replace(' (Torrent) - AniDex ', '', $item_html->find('title', 0)->plaintext);
|
|
$item_desc = $item_html->find('div.panel-body', 0);
|
|
$item_author = trim($item_html->find('span.fa-user', 0)->parent()->plaintext);
|
|
$item_date = strtotime(trim($item_html->find('span.fa-clock', 0)->parent()->plaintext));
|
|
$item_image = $this->getURI() . 'images/user_logos/default.png';
|
|
|
|
//Check for description-less torrent andn optionally extract image
|
|
$desc_title_found = false;
|
|
foreach ($item_html->find('h3.panel-title') as $h3) {
|
|
if (strpos($h3, 'Description') !== false) {
|
|
$desc_title_found = true;
|
|
break;
|
|
}
|
|
}
|
|
if ($desc_title_found) {
|
|
//Retrieve image for thumbnail or generic logo fallback
|
|
foreach ($item_desc->find('img') as $img) {
|
|
if (strpos($img->src, 'prez') === false) {
|
|
$item_image = $img->src;
|
|
break;
|
|
}
|
|
}
|
|
$item_desc = trim($item_desc->innertext);
|
|
} else {
|
|
$item_desc = '<em>No description.</em>';
|
|
}
|
|
|
|
//Build and add final item
|
|
$item = array();
|
|
$item['uri'] = $item_browse_uri;
|
|
$item['title'] = $item_title;
|
|
$item['author'] = $item_author;
|
|
$item['timestamp'] = $item_date;
|
|
$item['enclosures'] = array($item_image);
|
|
$item['content'] = $item_desc;
|
|
$this->items[] = $item;
|
|
}
|
|
}
|
|
$element = null;
|
|
}
|
|
$results = null;
|
|
}
|
|
}
|