[ 'splitGobbets' => [ 'name' => 'Split the short stories', 'type' => 'checkbox', 'defaultValue' => false, 'title' => 'Whether to split the short stories into separate entries' ], 'limit' => [ 'name' => 'Truncate headers for the short stories', 'type' => 'number', 'defaultValue' => 100 ], 'agenda' => [ 'name' => 'Add agenda for the day', 'type' => 'checkbox', 'defaultValue' => 'checked' ], 'agendaPictures' => [ 'name' => 'Include pictures to the agenda', 'type' => 'checkbox', 'defaultValue' => 'checked' ], 'quote' => [ 'name' => 'Include the quote of the day', 'type' => 'checkbox' ] ] ]; public function collectData() { $html = getSimpleHTMLDOM(self::URI); $gobbets = $html->find('._gobbets', 0); if ($this->getInput('splitGobbets') == 1) { $this->splitGobbets($gobbets); } else { $this->mergeGobbets($gobbets); }; if ($this->getInput('agenda') == 1) { $articles = $html->find('._articles', 0); $this->collectArticles($articles); } if ($this->getInput('quote') == 1) { $quote = $html->find('._quote-container', 0); $this->addQuote($quote); } } private function splitGobbets($gobbets) { $today = new Datetime(); $today->setTime(0, 0, 0, 0); $limit = $this->getInput('limit'); foreach ($gobbets->find('._gobbet') as $gobbet) { $title = $gobbet->plaintext; $match = preg_match('/[\.,]/', $title, $matches, PREG_OFFSET_CAPTURE); if ($match > 0) { $point = $matches[0][1]; $title = mb_substr($title, 0, $point); } if ($limit && mb_strlen($title) > $limit) { $title = mb_substr($title, 0, $limit) . '...'; } $item = [ 'uri' => self::URI, 'title' => $title, 'content' => $gobbet->innertext, 'timestamp' => $today->format('U'), 'uid' => md5($gobbet->plaintext) ]; $this->items[] = $item; } } private function mergeGobbets($gobbets) { $today = new Datetime(); $today->setTime(0, 0, 0, 0); $contents = ''; foreach ($gobbets->find('._gobbet') as $gobbet) { $contents .= "
{$gobbet->innertext}"; } $this->items[] = [ 'uri' => self::URI, 'title' => 'World in brief at ' . $today->format('Y.m.d'), 'content' => $contents, 'timestamp' => $today->format('U'), 'uid' => 'world-in-brief-' . $today->format('U') ]; } private function collectArticles($articles) { $i = 0; $today = new Datetime(); $today->setTime(0, 0, 0, 0); foreach ($articles->find('._article') as $article) { $title = $article->find('._headline', 0)->plaintext; $image = $article->find('._main-image', 0); $content = $article->find('._content', 0); $res_content = ''; if ($image != null && $this->getInput('agendaPictures') == 1) { $img = $image->find('img', 0); $res_content .= ''; } $res_content .= $content->innertext; $this->items[] = [ 'uri' => self::URI, 'title' => $title, 'content' => $res_content, 'timestamp' => $today->format('U'), 'uid' => 'story-' . $today->format('U') . "{$i}", ]; $i++; } } private function addQuote($quote) { $today = new Datetime(); $today->setTime(0, 0, 0, 0); $this->items[] = [ 'uri' => self::URI, 'title' => 'Quote of the day ' . $today->format('Y.m.d'), 'content' => $quote->innertext, 'timestamp' => $today->format('U'), 'uid' => 'quote-' . $today->format('U') ]; } }