mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2024-11-27 20:12:11 +03:00
37cb4091d4
When fetching website contents, exceptions already raise on fetching error
137 lines
3.3 KiB
PHP
137 lines
3.3 KiB
PHP
<?php
|
|
class HaveIBeenPwnedBridge extends BridgeAbstract {
|
|
const NAME = 'Have I Been Pwned (HIBP) Bridge';
|
|
const URI = 'https://haveibeenpwned.com';
|
|
const DESCRIPTION = 'Returns list of Pwned websites';
|
|
const MAINTAINER = 'VerifiedJoseph';
|
|
const PARAMETERS = array(array(
|
|
'order' => array(
|
|
'name' => 'Order by',
|
|
'type' => 'list',
|
|
'values' => array(
|
|
'Breach date' => 'breachDate',
|
|
'Date added to HIBP' => 'dateAdded',
|
|
),
|
|
'defaultValue' => 'dateAdded',
|
|
),
|
|
'item_limit' => array(
|
|
'name' => 'Limit number of returned items',
|
|
'type' => 'number',
|
|
'defaultValue' => 20,
|
|
)
|
|
));
|
|
|
|
const CACHE_TIMEOUT = 3600;
|
|
|
|
private $breachDateRegex = '/Breach date: ([0-9]{1,2} [A-Z-a-z]+ [0-9]{4})/';
|
|
private $dateAddedRegex = '/Date added to HIBP: ([0-9]{1,2} [A-Z-a-z]+ [0-9]{4})/';
|
|
private $accountsRegex = '/Compromised accounts: ([0-9,]+)/';
|
|
|
|
private $breaches = array();
|
|
|
|
public function collectData() {
|
|
|
|
$html = getSimpleHTMLDOM(self::URI . '/PwnedWebsites');
|
|
|
|
$breaches = array();
|
|
|
|
foreach($html->find('div.row') as $breach) {
|
|
$item = array();
|
|
|
|
if ($breach->class != 'row') {
|
|
continue;
|
|
}
|
|
|
|
preg_match($this->breachDateRegex, $breach->find('p', 1)->plaintext, $breachDate)
|
|
or returnServerError('Could not extract details');
|
|
|
|
preg_match($this->dateAddedRegex, $breach->find('p', 1)->plaintext, $dateAdded)
|
|
or returnServerError('Could not extract details');
|
|
|
|
preg_match($this->accountsRegex, $breach->find('p', 1)->plaintext, $accounts)
|
|
or returnServerError('Could not extract details');
|
|
|
|
$permalink = $breach->find('p', 1)->find('a', 0)->href;
|
|
|
|
// Remove permalink
|
|
$breach->find('p', 1)->find('a', 0)->outertext = '';
|
|
|
|
$item['title'] = html_entity_decode($breach->find('h3', 0)->plaintext, ENT_QUOTES)
|
|
. ' - ' . $accounts[1] . ' breached accounts';
|
|
$item['dateAdded'] = strtotime($dateAdded[1]);
|
|
$item['breachDate'] = strtotime($breachDate[1]);
|
|
$item['uri'] = self::URI . '/PwnedWebsites' . $permalink;
|
|
|
|
$item['content'] = '<p>' . $breach->find('p', 0)->innertext . '</p>';
|
|
$item['content'] .= '<p>' . $this->breachType($breach) . '</p>';
|
|
$item['content'] .= '<p>' . $breach->find('p', 1)->innertext . '</p>';
|
|
|
|
$this->breaches[] = $item;
|
|
}
|
|
|
|
$this->orderBreaches();
|
|
$this->createItems();
|
|
}
|
|
|
|
/**
|
|
* Extract data breach type(s)
|
|
*/
|
|
private function breachType($breach) {
|
|
|
|
$content = '';
|
|
|
|
if ($breach->find('h3 > i', 0)) {
|
|
|
|
foreach ($breach->find('h3 > i') as $i) {
|
|
$content .= $i->title . '.<br>';
|
|
}
|
|
|
|
}
|
|
|
|
return $content;
|
|
|
|
}
|
|
|
|
/**
|
|
* Order Breaches by date added or date breached
|
|
*/
|
|
private function orderBreaches() {
|
|
|
|
$sortBy = $this->getInput('order');
|
|
$sort = array();
|
|
|
|
foreach ($this->breaches as $key => $item) {
|
|
$sort[$key] = $item[$sortBy];
|
|
}
|
|
|
|
array_multisort($sort, SORT_DESC, $this->breaches);
|
|
|
|
}
|
|
|
|
/**
|
|
* Create items from breaches array
|
|
*/
|
|
private function createItems() {
|
|
|
|
$limit = $this->getInput('item_limit');
|
|
|
|
if ($limit < 1) {
|
|
$limit = 20;
|
|
}
|
|
|
|
foreach ($this->breaches as $breach) {
|
|
$item = array();
|
|
|
|
$item['title'] = $breach['title'];
|
|
$item['timestamp'] = $breach[$this->getInput('order')];
|
|
$item['uri'] = $breach['uri'];
|
|
$item['content'] = $breach['content'];
|
|
|
|
$this->items[] = $item;
|
|
|
|
if (count($this->items) >= $limit) {
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|