rss-bridge/bridges/ScribdBridge.php

79 lines
2 KiB
PHP
Raw Normal View History

2020-02-04 19:26:34 +03:00
<?php
/**
 * Bridge that returns the documents uploaded by a Scribd user.
 *
 * The user is identified by the profile URL passed in the `profile`
 * parameter. The profile's "uploads" page is scraped for documents, and each
 * document page is then fetched (cached) to read its Open Graph description,
 * preview image and interest tags.
 */
class ScribdBridge extends BridgeAbstract {
    const NAME = 'Scribd Bridge';
    const URI = 'https://www.scribd.com';
    const DESCRIPTION = 'Returns documents uploaded by a user.';
    const MAINTAINER = 'VerifiedJoseph';
    const PARAMETERS = array(array(
        'profile' => array(
            'name' => 'Profile URL',
            'type' => 'text',
            'required' => true,
            'title' => 'Profile URL. Example: https://www.scribd.com/user/164147088/Ars-Technica',
            'exampleValue' => 'https://www.scribd.com/user/'
        ),
    ));
    const CACHE_TIMEOUT = 3600;

    /** @var string Captures the "user/<numeric id>/<name>" part of a profile URL. */
    private $profileUrlRegex = '/scribd\.com\/(user\/[0-9]+\/[\w-]+)\/?/';

    /** @var string Feed title read from the uploads page; empty until collectData() finds one. */
    private $feedName = '';

    /** @var int Maximum number of documents added to the feed per run. */
    private $itemLimit = 15;

    /**
     * Scrapes the uploads page and fills $this->items with one entry per document.
     *
     * Collection stops once the item limit is reached. Listing entries without
     * a link are skipped instead of aborting the whole feed.
     *
     * @return void
     */
    public function collectData() {
        $uploadsUrl = $this->getURI();

        // NOTE(review): depending on the framework version the loader may
        // already raise on failure; this guard only covers a falsy return.
        $html = getSimpleHTMLDOM($uploadsUrl)
            or returnServerError('Could not load uploads page: ' . $uploadsUrl);

        // The page header holds the feed title; leave the name empty (so
        // getName() falls back to the parent) when the markup is missing.
        $header = $html->find('div.header', 0);
        if ($header) {
            $this->feedName = trim($header->plaintext);
        }

        foreach ($html->find('ul.document_cells > li') as $li) {
            $item = $this->buildItem($li);
            if ($item === null) {
                continue;
            }

            $this->items[] = $item;
            if (count($this->items) >= $this->itemLimit) {
                break;
            }
        }
    }

    /**
     * Returns the feed title, or the parent's name when no title was scraped.
     *
     * @return string
     */
    public function getName() {
        if (!$this->feedName) {
            return parent::getName();
        }

        return $this->feedName . ' - Scribd';
    }

    /**
     * Returns the uploads page URL for the configured profile.
     *
     * Falls back to the parent's URI when no `profile` input is set. Reports
     * a server error when the profile URL does not match the expected
     * "scribd.com/user/<id>/<name>" form.
     *
     * @return string
     */
    public function getURI() {
        $profile = $this->getInput('profile');
        if (is_null($profile)) {
            return parent::getURI();
        }

        // preg_match() yields 0 (no match) or false (error); both are failures.
        if (!preg_match($this->profileUrlRegex, $profile, $matches)) {
            returnServerError('Could not extract user ID and name from given profile URL.');
        }

        return self::URI . '/' . $matches[1] . '/uploads';
    }

    /**
     * Builds one feed item from a document entry of the uploads listing.
     *
     * @param object $li Listing element (a simple_html_dom node).
     * @return array|null The feed item, or null when the entry has no link.
     */
    private function buildItem($li) {
        $link = $li->find('a', 0);
        if (!$link || !$link->href) {
            // Without a link there is neither a URI nor a UID for the item.
            return null;
        }
        $documentUrl = $link->href;

        $item = array(
            'title' => $this->plaintextOf($li, 'div.under_title'),
            'uri' => $documentUrl,
            'author' => $this->plaintextOf($li, 'span.uploader'),
            'uid' => $documentUrl,
            'categories' => array(),
            'enclosures' => array(),
            'content' => '',
        );

        // Document pages are cached for an hour to avoid refetching them on every run.
        $pageHtml = getSimpleHTMLDOMCached($documentUrl, 3600);
        if (!$pageHtml) {
            return $item;
        }

        foreach ($pageHtml->find('ul.interest_pills li') as $pill) {
            $item['categories'][] = $pill->plaintext;
        }

        $description = $this->metaContent($pageHtml, 'og:description');
        $image = $this->metaContent($pageHtml, 'og:image');

        $content = '<p>' . $description . '</p>';
        if ($image !== '') {
            // Only reference the preview image when the page actually declares one.
            $content .= '<p><img src="' . $image . '"></p>';
            $item['enclosures'][] = $image;
        }
        $item['content'] = $content;

        return $item;
    }

    /**
     * Returns the plain text of the first element matching a selector.
     *
     * @param object $node     Node to search in (a simple_html_dom node).
     * @param string $selector CSS selector of the wanted element.
     * @return string The element's text, or an empty string when nothing matches.
     */
    private function plaintextOf($node, $selector) {
        $element = $node->find($selector, 0);

        return $element ? (string)$element->plaintext : '';
    }

    /**
     * Returns the `content` attribute of a `<meta property="...">` tag.
     *
     * @param object $dom      Parsed page (a simple_html_dom object).
     * @param string $property Value of the tag's `property` attribute, e.g. "og:image".
     * @return string The attribute value, or an empty string when the tag or attribute is missing.
     */
    private function metaContent($dom, $property) {
        $meta = $dom->find('meta[property="' . $property . '"]', 0);
        if (!$meta || !$meta->content) {
            return '';
        }

        return (string)$meta->content;
    }
}