<?php

/**
 * Bridge for Diário de Notícias (dn.pt).
 *
 * In the "Tag" context it loads the tag page for the requested tag and turns
 * every <article> element found there into a feed item (title, link, optional
 * lead text and, when the link carries an edition date, a timestamp).
 */
class DiarioDeNoticiasBridge extends BridgeAbstract
{
    const NAME = 'Diário de Notícias (PT)';
    const URI = 'https://dn.pt';
    const DESCRIPTION = 'Diário de Notícias (DN.PT)';
    const MAINTAINER = 'somini';
    const PARAMETERS = [
        'Tag' => [
            'n' => [
                'name' => 'Tag Name',
                'required' => true,
                'exampleValue' => 'rogerio-casanova',
            ]
        ]
    ];

    /**
     * Portuguese three-letter month abbreviations, in calendar order.
     * The zero-based index plus one is the month number.
     */
    const MONPT = [
        'jan',
        'fev',
        'mar',
        'abr',
        'mai',
        'jun',
        'jul',
        'ago',
        'set',
        'out',
        'nov',
        'dez',
    ];

    /**
     * @return string URL of the icon used for this bridge.
     */
    public function getIcon()
    {
        return 'https://static.globalnoticias.pt/dn/common/images/favicons/favicon-128.png';
    }

    /**
     * @return string The bridge name, suffixed with the tag when in the "Tag" context.
     */
    public function getName()
    {
        if ($this->queriedContext === 'Tag') {
            return self::NAME . ' | Tag | ' . $this->getInput('n');
        }

        return self::NAME;
    }

    /**
     * @return string The tag page URL in the "Tag" context, otherwise the site root.
     */
    public function getURI()
    {
        if ($this->queriedContext === 'Tag') {
            // The tag comes from user input: encode it so it stays a single path segment.
            return self::URI . '/tag/' . rawurlencode((string) $this->getInput('n')) . '.html';
        }

        return self::URI;
    }

    /**
     * Fetches the page returned by getURI() and appends one entry to
     * $this->items per <article> that has both a title and a link.
     */
    public function collectData()
    {
        $html = getSimpleHTMLDOMCached($this->getURI());

        foreach ($html->find('article') as $element) {
            $title = $element->find('.t-am-title', 0);
            $link = $element->find('a.t-am-text', 0);

            // Articles without a title or a link cannot produce a usable item; skip them
            // instead of dereferencing a missing node.
            if (!$title || !$link) {
                continue;
            }

            $href = (string) $link->href;

            $item = [];
            $item['title'] = $title->plaintext;
            $item['uri'] = $this->resolveLink($href);

            $snippet = $element->find('.t-am-lead', 0);
            if ($snippet) {
                $item['content'] = $snippet->plaintext;
            }

            $timestamp = $this->parseEditionDate($href);
            if ($timestamp !== null) {
                $item['timestamp'] = $timestamp;
            }

            $this->items[] = $item;
        }
    }

    /**
     * Turns an article href into an absolute URL on the site.
     *
     * @param string $href Value of the link's href attribute.
     * @return string Absolute URL.
     */
    private function resolveLink($href)
    {
        // Already absolute: prefixing the site root would corrupt it.
        if (preg_match('#^https?://#i', $href) === 1) {
            return $href;
        }

        // Protocol-relative link.
        if (strpos($href, '//') === 0) {
            return 'https:' . $href;
        }

        // Site-relative link, with or without a leading slash.
        return self::URI . '/' . ltrim($href, '/');
    }

    /**
     * Extracts the edition date embedded in an article href
     * ("edicao-do-dia/DD-mon-YYYY", with a Portuguese month abbreviation).
     *
     * @param string $href Value of the link's href attribute.
     * @return string|null Date as "YYYY-MM-DD", or null when the href carries no
     *                     recognisable edition date.
     */
    private function parseEditionDate($href)
    {
        $matched = preg_match(
            '|edicao-do-dia\\/(?P<day>\d\d)-(?P<monpt>\w\w\w)-(?P<year>\d\d\d\d)|',
            $href,
            $d
        );
        if ($matched !== 1) {
            return null;
        }

        // Strict search: a missing month must yield false, which is rejected below
        // rather than being coerced to 0 and reported as January.
        $monthIndex = array_search(strtolower($d['monpt']), self::MONPT, true);
        if ($monthIndex === false) {
            return null;
        }

        return sprintf('%s-%02d-%s', $d['year'], $monthIndex + 1, $d['day']);
    }
}