2024-01-10 18:42:57 -05:00
|
|
|
|
<?php
|
|
|
|
|
|
|
|
|
|
class AnnasArchiveBridge extends BridgeAbstract
|
|
|
|
|
{
|
|
|
|
|
const NAME = 'Anna\'s Archive';
|
|
|
|
|
const MAINTAINER = 'phantop';
|
|
|
|
|
const URI = 'https://annas-archive.org/';
|
|
|
|
|
const DESCRIPTION = 'Returns books from Anna\'s Archive';
|
|
|
|
|
const PARAMETERS = [
|
|
|
|
|
[
|
|
|
|
|
'q' => [
|
|
|
|
|
'name' => 'Query',
|
|
|
|
|
'exampleValue' => 'apothecary diaries',
|
|
|
|
|
'required' => true,
|
|
|
|
|
],
|
|
|
|
|
'ext' => [
|
|
|
|
|
'name' => 'Extension',
|
|
|
|
|
'type' => 'list',
|
|
|
|
|
'values' => [
|
|
|
|
|
'Any' => null,
|
|
|
|
|
'azw3' => 'azw3',
|
|
|
|
|
'cbr' => 'cbr',
|
|
|
|
|
'cbz' => 'cbz',
|
|
|
|
|
'djvu' => 'djvu',
|
|
|
|
|
'epub' => 'epub',
|
|
|
|
|
'fb2' => 'fb2',
|
|
|
|
|
'fb2.zip' => 'fb2.zip',
|
|
|
|
|
'mobi' => 'mobi',
|
|
|
|
|
'pdf' => 'pdf',
|
|
|
|
|
]
|
|
|
|
|
],
|
|
|
|
|
'lang' => [
|
|
|
|
|
'name' => 'Language',
|
|
|
|
|
'type' => 'list',
|
|
|
|
|
'values' => [
|
|
|
|
|
'Any' => null,
|
|
|
|
|
'Afrikaans [af]' => 'af',
|
|
|
|
|
'Arabic [ar]' => 'ar',
|
|
|
|
|
'Bangla [bn]' => 'bn',
|
|
|
|
|
'Belarusian [be]' => 'be',
|
|
|
|
|
'Bulgarian [bg]' => 'bg',
|
|
|
|
|
'Catalan [ca]' => 'ca',
|
|
|
|
|
'Chinese [zh]' => 'zh',
|
|
|
|
|
'Church Slavic [cu]' => 'cu',
|
|
|
|
|
'Croatian [hr]' => 'hr',
|
|
|
|
|
'Czech [cs]' => 'cs',
|
|
|
|
|
'Danish [da]' => 'da',
|
|
|
|
|
'Dongxiang [sce]' => 'sce',
|
|
|
|
|
'Dutch [nl]' => 'nl',
|
|
|
|
|
'English [en]' => 'en',
|
|
|
|
|
'French [fr]' => 'fr',
|
|
|
|
|
'German [de]' => 'de',
|
|
|
|
|
'Greek [el]' => 'el',
|
|
|
|
|
'Hebrew [he]' => 'he',
|
|
|
|
|
'Hindi [hi]' => 'hi',
|
|
|
|
|
'Hungarian [hu]' => 'hu',
|
|
|
|
|
'Indonesian [id]' => 'id',
|
|
|
|
|
'Irish [ga]' => 'ga',
|
|
|
|
|
'Italian [it]' => 'it',
|
|
|
|
|
'Japanese [ja]' => 'ja',
|
|
|
|
|
'Kazakh [kk]' => 'kk',
|
|
|
|
|
'Korean [ko]' => 'ko',
|
|
|
|
|
'Latin [la]' => 'la',
|
|
|
|
|
'Latvian [lv]' => 'lv',
|
|
|
|
|
'Lithuanian [lt]' => 'lt',
|
|
|
|
|
'Luxembourgish [lb]' => 'lb',
|
|
|
|
|
'Ndolo [ndl]' => 'ndl',
|
|
|
|
|
'Norwegian [no]' => 'no',
|
|
|
|
|
'Persian [fa]' => 'fa',
|
|
|
|
|
'Polish [pl]' => 'pl',
|
|
|
|
|
'Portuguese [pt]' => 'pt',
|
|
|
|
|
'Romanian [ro]' => 'ro',
|
|
|
|
|
'Russian [ru]' => 'ru',
|
|
|
|
|
'Serbian [sr]' => 'sr',
|
|
|
|
|
'Spanish [es]' => 'es',
|
|
|
|
|
'Swedish [sv]' => 'sv',
|
|
|
|
|
'Tamil [ta]' => 'ta',
|
|
|
|
|
'Traditional Chinese [zh‑Hant]' => 'zh‑Hant',
|
|
|
|
|
'Turkish [tr]' => 'tr',
|
|
|
|
|
'Ukrainian [uk]' => 'uk',
|
|
|
|
|
'Unknown language' => '_empty',
|
|
|
|
|
'Unknown language [und]' => 'und',
|
|
|
|
|
'Unknown language [urdu]' => 'urdu',
|
|
|
|
|
'Urdu [ur]' => 'ur',
|
|
|
|
|
'Vietnamese [vi]' => 'vi',
|
|
|
|
|
'Welsh [cy]' => 'cy',
|
|
|
|
|
]
|
|
|
|
|
],
|
|
|
|
|
'content' => [
|
|
|
|
|
'name' => 'Type',
|
|
|
|
|
'type' => 'list',
|
|
|
|
|
'values' => [
|
|
|
|
|
'Any' => null,
|
|
|
|
|
'Book (fiction)' => 'book_fiction',
|
|
|
|
|
'Book (non‑fiction)' => 'book_nonfiction',
|
|
|
|
|
'Book (unknown)' => 'book_unknown',
|
|
|
|
|
'Comic book' => 'book_comic',
|
|
|
|
|
'Journal article' => 'journal_article',
|
|
|
|
|
'Magazine' => 'magazine',
|
|
|
|
|
'Standards document' => 'standards_document',
|
|
|
|
|
]
|
|
|
|
|
],
|
|
|
|
|
'src' => [
|
|
|
|
|
'name' => 'Source',
|
|
|
|
|
'type' => 'list',
|
|
|
|
|
'values' => [
|
|
|
|
|
'Any' => null,
|
|
|
|
|
'Internet Archive' => 'ia',
|
|
|
|
|
'Libgen.li' => 'lgli',
|
|
|
|
|
'Libgen.rs' => 'lgrs',
|
|
|
|
|
'Sci‑Hub' => 'scihub',
|
|
|
|
|
'Z‑Library' => 'zlib',
|
|
|
|
|
]
|
|
|
|
|
],
|
|
|
|
|
]
|
|
|
|
|
];
|
|
|
|
|
|
|
|
|
|
public function collectData()
|
|
|
|
|
{
|
|
|
|
|
$url = $this->getURI();
|
|
|
|
|
$list = getSimpleHTMLDOMCached($url);
|
|
|
|
|
$list = defaultLinkTo($list, self::URI);
|
|
|
|
|
|
|
|
|
|
// Don't attempt to do anything if not found message is given
|
|
|
|
|
if ($list->find('.js-not-found-additional')) {
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
2024-03-05 19:28:24 -05:00
|
|
|
|
$elements = $list->find('.w-full > .mb-4 > div');
|
2024-02-09 07:27:16 +01:00
|
|
|
|
foreach ($elements as $element) {
|
2024-03-05 19:28:24 -05:00
|
|
|
|
// stop added entries once partial match list starts
|
|
|
|
|
if (str_contains($element->innertext, 'partial match')) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
if ($element = $element->find('a', 0)) {
|
|
|
|
|
$item = [];
|
|
|
|
|
$item['title'] = $element->find('h3', 0)->plaintext;
|
|
|
|
|
$item['author'] = $element->find('div.italic', 0)->plaintext;
|
|
|
|
|
$item['uri'] = $element->href;
|
|
|
|
|
$item['content'] = $element->plaintext;
|
|
|
|
|
$item['uid'] = $item['uri'];
|
2024-01-10 18:42:57 -05:00
|
|
|
|
|
2024-03-05 19:28:24 -05:00
|
|
|
|
$item_html = getSimpleHTMLDOMCached($item['uri'], 86400 * 20);
|
|
|
|
|
if ($item_html) {
|
|
|
|
|
$item_html = defaultLinkTo($item_html, self::URI);
|
|
|
|
|
$item['content'] .= $item_html->find('main img', 0);
|
|
|
|
|
$item['content'] .= $item_html->find('main .mt-4', 0); // Summary
|
|
|
|
|
foreach ($item_html->find('main ul.mb-4 > li > a.js-download-link') as $file) {
|
|
|
|
|
if (!str_contains($file->href, 'fast_download')) {
|
|
|
|
|
$item['enclosures'][] = $file->href;
|
|
|
|
|
}
|
2024-01-10 18:42:57 -05:00
|
|
|
|
}
|
|
|
|
|
// Remove bulk torrents from enclosures list
|
|
|
|
|
$item['enclosures'] = array_diff($item['enclosures'], [self::URI . 'datasets']);
|
|
|
|
|
}
|
|
|
|
|
|
2024-03-05 19:28:24 -05:00
|
|
|
|
$this->items[] = $item;
|
|
|
|
|
}
|
2024-01-10 18:42:57 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public function getName()
|
|
|
|
|
{
|
|
|
|
|
$name = parent::getName();
|
|
|
|
|
if ($this->getInput('q') != null) {
|
|
|
|
|
$name .= ' - ' . $this->getInput('q');
|
|
|
|
|
}
|
|
|
|
|
return $name;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public function getURI()
|
|
|
|
|
{
|
|
|
|
|
$params = array_filter([ // Filter to remove non-provided parameters
|
|
|
|
|
'q' => $this->getInput('q'),
|
|
|
|
|
'ext' => $this->getInput('ext'),
|
|
|
|
|
'lang' => $this->getInput('lang'),
|
|
|
|
|
'src' => $this->getInput('src'),
|
|
|
|
|
'content' => $this->getInput('content'),
|
|
|
|
|
]);
|
|
|
|
|
$url = parent::getURI() . 'search?sort=newest&' . http_build_query($params);
|
|
|
|
|
return $url;
|
|
|
|
|
}
|
|
|
|
|
}
|