mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2025-02-10 06:12:25 +00:00
![Bartosz Sosna](/assets/img/avatar_default.png)
* Add lfc.pl bridge * Adjust bridge * Add comments section * Fix a bug with page content when comments exist * Add brtsos to CONTRIBUTORS.md
110 lines
No EOL
3.4 KiB
PHP
110 lines
No EOL
3.4 KiB
PHP
<?php
|
|
|
|
class LfcPlBridge extends BridgeAbstract
|
|
{
|
|
const NAME = 'LFC (lfc.pl)';
|
|
const DESCRIPTION = 'LFC.pl - największa polska strona o Liverpool FC';
|
|
const URI = 'https://lfc.pl';
|
|
const MAINTAINER = 'brtsos';
|
|
const PARAMETERS = [
|
|
[
|
|
'comments' => [
|
|
'type' => 'list',
|
|
'name' => 'Include comments',
|
|
'title' => 'Include comments in the article content',
|
|
'values' => [
|
|
'No' => 'no',
|
|
'Yes' => 'yes',
|
|
],
|
|
]
|
|
]
|
|
];
|
|
|
|
public function collectData()
|
|
{
|
|
$dom = getSimpleHTMLDOM(self::URI . '/Archiwum/' . date('Y') . date('m'));
|
|
|
|
$list = $dom->find('#page .list-vertical li');
|
|
$list = array_reverse($list);
|
|
$list = array_slice($list, 0, 10);
|
|
|
|
foreach ($list as $li) {
|
|
$link = $li->find('a', 0);
|
|
$url = self::URI . $link->href;
|
|
|
|
$articleDom = getSimpleHTMLDOM($url);
|
|
|
|
$description = $this->getContent($articleDom);
|
|
if (mb_strpos($description, 'Artykuł sponsorowany') !== false) {
|
|
continue;
|
|
}
|
|
|
|
$image = '<img src="' . $this->getImage($articleDom) . '" alt="' . $link->plaintext . '" />';
|
|
|
|
$content = $image . '</br>' . $description;
|
|
|
|
$tagsToRemove = ['script', 'iframe', 'input', 'form'];
|
|
$content = sanitize($content, $tagsToRemove);
|
|
|
|
$footerArticle = $articleDom->find('.footer', 0)->find('.item', 0)->find('div', 1);
|
|
$author = $footerArticle->find('a', 0)->plaintext;
|
|
|
|
$dateTime = $footerArticle->find('div', 0)->plaintext;
|
|
$date = DateTime::createFromFormat('d.m.Y H:i', $dateTime);
|
|
$timestamp = $date->getTimestamp();
|
|
$this->items[] = [
|
|
'title' => $link->plaintext,
|
|
'uri' => $url,
|
|
'timestamp' => $timestamp,
|
|
'content' => $content,
|
|
'author' => $author,
|
|
];
|
|
}
|
|
}
|
|
|
|
private function getContent($article)
|
|
{
|
|
$content = $article->find('.news-body', 0)->innertext;
|
|
$commentsHtml = $article->find('#comments', 0);
|
|
|
|
$comments = '';
|
|
if ($this->withComment()) {
|
|
if ($commentsHtml) {
|
|
$commentsDom = $commentsHtml->find('.comment');
|
|
|
|
if (count($commentsDom) > 0) {
|
|
$comments = '<h3>Komentarze:</h3>';
|
|
}
|
|
|
|
foreach ($commentsDom as $comment) {
|
|
$header = $comment->find('.header', 0)->plaintext;
|
|
$commentContent = $comment->find('.content', 0)->plaintext;
|
|
$comments .= $header . '<br />' . $commentContent . '<br /><br />';
|
|
}
|
|
}
|
|
}
|
|
|
|
return $content . '<br /> <br />' . $comments;
|
|
}
|
|
|
|
private function getImage($article): ?string
|
|
{
|
|
$imgElement = $article->find('#news .img', 0);
|
|
if ($imgElement) {
|
|
$style = $imgElement->style;
|
|
|
|
if (preg_match('/background-image:\s*url\(([^)]+)\)/i', $style, $matches)) {
|
|
return self::URI . trim($matches[1], "'\"");
|
|
}
|
|
|
|
return null;
|
|
}
|
|
|
|
return null;
|
|
}
|
|
|
|
private function withComment(): bool
|
|
{
|
|
return $this->getInput('comments') === 'yes';
|
|
}
|
|
} |