mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2025-04-24 07:26:53 +00:00
commit
9e998abfd1
1
.gitignore
vendored
1
.gitignore
vendored
@ -226,3 +226,4 @@ pip-log.txt
|
||||
##############
|
||||
/cache
|
||||
/whitelist.txt
|
||||
DEBUG
|
||||
|
@ -113,6 +113,7 @@ Technical notes
|
||||
===
|
||||
* There is a cache so that source services won't ban you even if you hammer the rss-bridge with requests. Each bridge has a different duration for the cache. The `cache` subdirectory will be automatically created and cached objects older than 24 hours get purged.
|
||||
* To implement a new rss-bridge, [follow the specifications](CREATE_BRIDGE.md) and take a look at existing bridges for examples.
|
||||
* To enable debug mode (disabling cache and enabling error reporting), create an empty file named `DEBUG` in the root directory (next to `index.php`).
|
||||
|
||||
Rant
|
||||
===
|
||||
|
@ -33,10 +33,14 @@ class BandcampBridge extends BridgeAbstract{
|
||||
}
|
||||
|
||||
foreach($html->find('li.item') as $release) {
|
||||
$script = $release->find('div.art', 0)->getAttribute('onclick');
|
||||
$uri = ltrim($script, "return 'url(");
|
||||
$uri = rtrim($uri, "')");
|
||||
|
||||
$item = new \Item();
|
||||
$item->name = $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||
$item->title = $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||
$item->content = '<img src="' . $release->find('img.art',0)->src . '"/><br/>' . $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||
$item->content = '<img src="' . $uri . '"/><br/>' . $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||
$item->id = $release->find('a',0)->getAttribute('href');
|
||||
$item->uri = $release->find('a',0)->getAttribute('href');
|
||||
$this->items[] = $item;
|
||||
|
@ -9,7 +9,7 @@ class CNETBridge extends BridgeAbstract {
|
||||
$this->name = 'CNET News';
|
||||
$this->uri = 'http://www.cnet.com/';
|
||||
$this->description = 'Returns the newest articles. <br /> You may specify a topic found in some section URLs, else all topics are selected.';
|
||||
$this->update = '2016-02-06';
|
||||
$this->update = '2016-03-16';
|
||||
|
||||
$this->parameters[] =
|
||||
'[
|
||||
@ -76,7 +76,7 @@ class CNETBridge extends BridgeAbstract {
|
||||
if (is_object($article_thumbnail))
|
||||
$article_thumbnail = $article_thumbnail->find('img', 0)->src;
|
||||
|
||||
$article_content = trim(CleanArticle(ExtractFromDelimiters($article_html, '</div></div></div><div class="col-8">', '<footer>')));
|
||||
$article_content = trim(CleanArticle(ExtractFromDelimiters($article_html, '<div class="articleContent', '<footer>')));
|
||||
|
||||
$item = new \Item();
|
||||
$item->uri = $article_uri;
|
||||
|
@ -13,52 +13,49 @@ class CourrierInternationalBridge extends BridgeAbstract{
|
||||
|
||||
public function collectData(array $param){
|
||||
|
||||
function fetchArticle($link) {
|
||||
$html = '';
|
||||
|
||||
$page = file_get_html($link);
|
||||
|
||||
$contenu = $page->find(".article-text")[0];
|
||||
|
||||
return strip_tags($contenu);
|
||||
$html = file_get_html('http://www.courrierinternational.com/') or $this->returnError('Error.', 500);
|
||||
|
||||
|
||||
|
||||
}
|
||||
$element = $html->find("article");
|
||||
|
||||
$html = '';
|
||||
$article_count = 1;
|
||||
|
||||
$html = file_get_html('http://www.courrierinternational.com/article') or $this->returnError('Error.', 500);
|
||||
foreach($element as $article) {
|
||||
|
||||
$item = new \Item();
|
||||
|
||||
$item->uri = $article->parent->getAttribute("href");
|
||||
|
||||
$element = $html->find(".type-normal");
|
||||
if(strpos($item->uri, "http") === FALSE) {
|
||||
$item->uri = "http://courrierinternational.fr/".$item->uri;
|
||||
}
|
||||
|
||||
$article_count = 1;
|
||||
$page = file_get_html($item->uri);
|
||||
|
||||
foreach($element as $article) {
|
||||
$cleaner = new HTMLSanitizer();
|
||||
|
||||
$item = new \Item();
|
||||
$item->content = $cleaner->sanitize($page->find("div.article-text")[0]);
|
||||
$item->title = strip_tags($article->find(".title")[0]);
|
||||
|
||||
$item->uri = "http://www.courrierinternational.com".$article->find("a")[0]->getAttribute("href");
|
||||
$item->content = fetchArticle("http://www.courrierinternational.com".$article->find("a")[0]->getAttribute("href"));
|
||||
$item->title = strip_tags($article->find("h2")[0]);
|
||||
$dateTime = date_parse($page->find("time")[0]);
|
||||
|
||||
$dateTime = date_parse($article->find("time")[0]);
|
||||
|
||||
$item->timestamp = mktime(
|
||||
$item->timestamp = mktime(
|
||||
$dateTime['hour'],
|
||||
$dateTime['minute'],
|
||||
$dateTime['second'],
|
||||
$dateTime['month'],
|
||||
$dateTime['day'],
|
||||
$dateTime['year']
|
||||
);
|
||||
);
|
||||
|
||||
$this->items[] = $item;
|
||||
$article_count ++;
|
||||
if($article_count > 5) break;
|
||||
$this->items[] = $item;
|
||||
$article_count ++;
|
||||
if($article_count > 5) break;
|
||||
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
|
||||
|
@ -28,9 +28,9 @@ class Freenews extends RssExpander {
|
||||
$item->title = trim($newsItem->title);
|
||||
// $this->message("item has for title \"".$item->title."\"");
|
||||
if(empty($newsItem->guid)) {
|
||||
$item->uri = $newsItem->link;
|
||||
$item->uri = (string) $newsItem->link;
|
||||
} else {
|
||||
$item->uri = $newsItem->guid;
|
||||
$item->uri = (string) $newsItem->guid;
|
||||
}
|
||||
// now load that uri from cache
|
||||
// $this->message("now loading page ".$item->uri);
|
||||
|
219
bridges/FuturaSciencesBridge.php
Normal file
219
bridges/FuturaSciencesBridge.php
Normal file
@ -0,0 +1,219 @@
|
||||
<?php
|
||||
/**
 * Bridge for Futura-Sciences: reads one of the site's RSS feeds and expands
 * each entry with the cleaned-up article body fetched from the article page.
 */
class FuturaSciencesBridge extends BridgeAbstract {

    /**
     * Declares the bridge metadata and the single "feed" list parameter.
     *
     * Entries of the list with an empty value are group headers or blank
     * separators; selecting one of them is rejected by collectData().
     */
    public function loadMetadatas() {

        $this->maintainer = 'ORelio';
        $this->name = $this->getName();
        $this->uri = $this->getURI();
        $this->description = 'Returns the newest articles.';
        $this->update = '2016-03-20';

        $this->parameters[] =
        '[
            {
                "name" : "Feed",
                "type" : "list",
                "identifier" : "feed",
                "values" :
                [
                    { "name" : "---- Select ----", "value" : "" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux multi-magazines", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Sciences", "value" : "actualites" },
                    { "name" : " Les dernières définitions de Futura-Sciences", "value" : "definitions" },
                    { "name" : " Les dernières photos de Futura-Sciences", "value" : "photos" },
                    { "name" : " Les dernières questions - réponses de Futura-Sciences", "value" : "questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Sciences", "value" : "dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Services", "value" : "" },

                    { "name" : " Les cartes virtuelles de Futura-Sciences", "value" : "services/cartes-virtuelles" },
                    { "name" : " Les fonds d\'écran de Futura-Sciences", "value" : "services/fonds-ecran" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Santé", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Santé", "value" : "sante/actualites" },
                    { "name" : " Les dernières définitions de Futura-Santé", "value" : "sante/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Santé", "value" : "sante/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Santé", "value" : "sante/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux High-Tech", "value" : "" },

                    { "name" : " Les dernières actualités de Futura High-Tech", "value" : "high-tech/actualites" },
                    { "name" : " Les dernières astuces de Futura High-Tech", "value" : "high-tech/questions-reponses" },
                    { "name" : " Les dernières définitions de Futura High-Tech", "value" : "high-tech/definitions" },
                    { "name" : " Les derniers dossiers de Futura High-Tech", "value" : "high-tech/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Espace", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Espace", "value" : "espace/actualites" },
                    { "name" : " Les dernières définitions de Futura-Espace", "value" : "espace/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Espace", "value" : "espace/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Espace", "value" : "espace/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Environnement", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Environnement", "value" : "environnement/actualites" },
                    { "name" : " Les dernières définitions de Futura-Environnement", "value" : "environnement/definitions" },
                    { "name" : " Les dernières questions - réponses de Futura-Environnement", "value" : "environnement/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Environnement", "value" : "environnement/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Maison", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Maison", "value" : "maison/actualites" },
                    { "name" : " Les dernières astuces de Futura-Maison", "value" : "maison/questions-reponses" },
                    { "name" : " Les dernières définitions de Futura-Maison", "value" : "maison/definitions" },
                    { "name" : " Les derniers dossiers de Futura-Maison", "value" : "maison/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Nature", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Nature", "value" : "nature/actualites" },
                    { "name" : " Les dernières définitions de Futura-Nature", "value" : "nature/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Nature", "value" : "nature/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Nature", "value" : "nature/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Terre", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Terre", "value" : "terre/actualites" },
                    { "name" : " Les dernières définitions de Futura-Terre", "value" : "terre/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Terre", "value" : "terre/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Terre", "value" : "terre/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Matière", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Matière", "value" : "matiere/actualites" },
                    { "name" : " Les dernières définitions de Futura-Matière", "value" : "matiere/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Matière", "value" : "matiere/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Matière", "value" : "matiere/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Mathématiques", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Mathématiques", "value" : "mathematiques/actualites" },
                    { "name" : " Les derniers dossiers de Futura-Mathématiques", "value" : "mathematiques/dossiers" }
                ]
            }
        ]';

    }

    /**
     * Fetches the selected RSS feed and builds up to 10 items, each carrying
     * the full article body with navigation/sharing widgets stripped out.
     *
     * @param array $param Request parameters; 'feed' selects the RSS feed
     *                     (letters, dashes and at most one slash, max 64 chars).
     */
    public function collectData(array $param) {

        // NOTE(review): returnError() is assumed to abort execution (it is used
        // that way throughout this file) - confirm against BridgeAbstract.
        if (empty($param['feed']))
            $this->returnError('Please select a feed to display.', 400);

        $feed = $param['feed'];
        $sanitized = preg_replace('/[^a-zA-Z-\/]+/', '', $feed);
        // The length test used to read strlen($feed > 64), which measured the
        // string form of a boolean and therefore never rejected anything.
        if ($feed !== $sanitized || substr_count($feed, '/') > 1 || strlen($feed) > 64)
            $this->returnError('Invalid "feed" parameter.', 400);

        $url = $this->getURI().'rss/'.$feed.'.xml';
        $html = file_get_html($url) or $this->returnError('Could not request Futura-Sciences: '.$url, 500);
        $limit = 0;

        // Page fragments removed from the article body, identified by the
        // beginning of their opening <div> tag.
        $unwanted_divs = array(
            '<div class="clear',
            '<div class="sharebar2',
            '<div class="diaporamafullscreen"',
            '<div style="margin-bottom:10px;" class="noprint"',
            '<div class="ficheprevnext',
            '<div class="bar noprint',
            '<div class="toolbar noprint',
            '<div class="addthis_toolbox',
            '<div class="noprint',
            '<div class="bg bglight border border-full noprint',
            '<div class="httplogbar-wrapper noprint',
            '<div id="forumcomments'
        );

        foreach ($html->find('item') as $element) {

            // Stop as soon as the item limit is reached instead of walking
            // the rest of the feed for nothing.
            if ($limit >= 10)
                break;

            $guid = $element->find('guid', 0);
            if (!is_object($guid))
                continue;

            $article_url = str_replace('#xtor=RSS-8', '', $this->stripCDATA($guid->plaintext));
            $article = file_get_html($article_url) or $this->returnError('Could not request Futura-Sciences: '.$article_url, 500);

            // Skip articles whose page layout does not expose the expected
            // content container rather than dereferencing null.
            $content_node = $article->find('div.content', 0);
            if (!is_object($content_node))
                continue;
            $contents = $content_node->innertext;

            // Prefer the author shown on the article page, fall back to the feed.
            $author = '';
            $author_node = $article->find('span.author', 0);
            if (is_object($author_node))
                $author = trim(str_replace(', Futura-Sciences', '', $author_node->plaintext));
            if (empty($author)) {
                $feed_author = $element->find('author', 0);
                if (is_object($feed_author))
                    $author = $this->stripCDATA($feed_author->plaintext);
            }

            foreach ($unwanted_divs as $div_start) {
                $contents = $this->stripRecursiveHTMLSection($contents, 'div', $div_start);
            }

            $contents = $this->stripWithDelimiters($contents, '<hr ', '/>');
            $contents = $this->stripWithDelimiters($contents, '<p class="content-date', '</p>');
            $contents = $this->stripWithDelimiters($contents, '<h1 class="content-title', '</h1>');
            $contents = $this->stripWithDelimiters($contents, 'fs:definition="', '"');
            $contents = $this->stripWithDelimiters($contents, 'fs:xt:clicktype="', '"');
            $contents = $this->stripWithDelimiters($contents, 'fs:xt:clickname="', '"');

            $title_node = $element->find('title', 0);
            $enclosure = $element->find('enclosure', 0);
            $date_node = $element->find('pubDate', 0);

            $item = new \Item();
            $item->author = $author;
            $item->uri = $article_url;
            if (is_object($title_node))
                $item->title = $this->stripCDATA($title_node->innertext);
            if (is_object($enclosure))
                $item->thumbnailUri = $this->stripCDATA($enclosure->url);
            if (is_object($date_node))
                $item->timestamp = strtotime($this->stripCDATA($date_node->plaintext));
            $item->content = trim($contents);
            $this->items[] = $item;
            $limit++;
        }

    }

    /**
     * Removes CDATA wrappers ("<![CDATA[" and "]]>") from a string.
     *
     * This is a method rather than a function declared inside collectData():
     * a nested named function is registered globally when the enclosing code
     * runs, so a second call (or another bridge declaring the same name)
     * triggers a "Cannot redeclare" fatal error.
     */
    private function stripCDATA($string) {
        return str_replace(array('<![CDATA[', ']]>'), '', $string);
    }

    /**
     * Removes every section that begins with $start and ends with the first
     * $end found after it, delimiters included.
     *
     * The end delimiter is searched *after* the start delimiter, so a start
     * delimiter that itself contains the end delimiter (e.g. 'attr="' / '"')
     * removes the whole attribute instead of just its opening part. An
     * unterminated section is left untouched.
     */
    private function stripWithDelimiters($string, $start, $end) {
        $start_length = strlen($start);
        $end_length = strlen($end);

        while (($start_pos = strpos($string, $start)) !== false) {
            $end_pos = strpos($string, $end, $start_pos + $start_length);
            if ($end_pos === false)
                break; // no closing delimiter: nothing safe to remove

            $string = substr($string, 0, $start_pos).substr($string, $end_pos + $end_length);
        }

        return $string;
    }

    /**
     * Removes every element of type $tag_name whose opening tag begins with
     * $tag_start, including nested elements of the same type.
     *
     * The section is grown one closing tag at a time until it holds as many
     * closing tags as opening tags (at most 100 attempts). When no closing
     * tag is left the input is returned as it stands, which also guarantees
     * that the outer loop terminates.
     */
    private function stripRecursiveHTMLSection($string, $tag_name, $tag_start) {
        $open_tag = '<'.$tag_name;
        $close_tag = '</'.$tag_name.'>';
        $close_tag_length = strlen($close_tag);

        // $tag_start must be the beginning of an opening tag of that type.
        if (strpos($tag_start, $open_tag) !== 0)
            return $string;

        while (($section_start = strpos($string, $tag_start)) !== false) {
            $max_recursion = 100;
            $search_offset = $section_start;
            $section_to_remove = null;

            do {
                $max_recursion--;
                $section_end = strpos($string, $close_tag, $search_offset);
                if ($section_end === false)
                    return $string; // unbalanced markup: give up on this tag

                $search_offset = $section_end + $close_tag_length;
                $section_to_remove = substr($string, $section_start, $search_offset - $section_start);
                $open_tag_count = substr_count($section_to_remove, $open_tag);
                $close_tag_count = substr_count($section_to_remove, $close_tag);
            } while ($open_tag_count > $close_tag_count && $max_recursion > 0);

            $string = str_replace($section_to_remove, '', $string);
        }

        return $string;
    }

    /** Display name of the bridge. */
    public function getName() {
        return 'Futura-Sciences Bridge';
    }

    /** Base URI of the site, with a trailing slash. */
    public function getURI() {
        return 'http://www.futura-sciences.com/';
    }

    /** Cache lifetime in seconds. */
    public function getCacheDuration() {
        return 3600;
    }
}
|
61
bridges/LichessBridge.php
Normal file
61
bridges/LichessBridge.php
Normal file
@ -0,0 +1,61 @@
|
||||
<?php
|
||||
|
||||
/**
 * Bridge for the Lichess blog: reads the Atom feed and replaces each entry's
 * summary with the full post fetched from the blog page.
 */
class LichessBridge extends BridgeAbstract
{
    /** Declares the bridge metadata; this bridge takes no parameters. */
    public function loadMetadatas()
    {
        $this->maintainer = 'AmauryCarrade';
        $this->name = $this->getName() . ' Bridge';
        $this->uri = $this->getURI();
        $this->description = 'Returns the 5 newest posts from the Lichess blog (full text)';
        $this->update = "2016-03-22";
    }

    /**
     * Builds items for the 5 newest entries of the Lichess blog Atom feed.
     *
     * @param array $param Request parameters (unused).
     */
    public function collectData(array $param)
    {
        $xml_feed = file_get_html('http://fr.lichess.org/blog.atom') or $this->returnError('Could not retrieve Lichess blog feed.', 404);

        $posts_loaded = 0;
        foreach ($xml_feed->find('entry') as $entry)
        {
            // Stop once enough posts were loaded instead of iterating over
            // the remaining entries without doing anything.
            if ($posts_loaded >= 5)
            {
                break;
            }

            $item = new \Item();

            $item->title = html_entity_decode($entry->find('title', 0)->innertext);
            $item->author = $entry->find('author', 0)->find('name', 0)->innertext;
            $item->uri = $entry->find('id', 0)->plaintext;
            $item->timestamp = strtotime($entry->find('published', 0)->plaintext);

            $item->content = $this->retrieve_lichess_post($item->uri);

            $this->items[] = $item;
            $posts_loaded++;
        }
    }

    /**
     * Downloads a blog post and returns its lede and body as HTML.
     *
     * A failed download is reported through returnError(), like the feed
     * download above, instead of failing on a method call on a non-object.
     * Parts of the page that cannot be located are rendered as empty.
     *
     * @param string $blog_post_uri Absolute URI of the blog post.
     * @return string HTML fragment: the lede in <p><em>, the body in <div>.
     */
    private function retrieve_lichess_post($blog_post_uri)
    {
        $blog_post_html = file_get_html($blog_post_uri) or $this->returnError('Could not retrieve Lichess blog post: ' . $blog_post_uri, 404);

        $post_chapo = '';
        $post_content = '';

        $blog_post_div = $blog_post_html->find('#lichess_blog', 0);
        if (is_object($blog_post_div))
        {
            $lede_node = $blog_post_div->find('.shortlede', 0);
            if (is_object($lede_node))
            {
                $post_chapo = $lede_node->innertext;
            }

            $body_node = $blog_post_div->find('.body', 0);
            if (is_object($body_node))
            {
                $post_content = $body_node->innertext;
            }
        }

        $content = '<p><em>' . $post_chapo . '</em></p>';
        $content .= '<div>' . $post_content . '</div>';

        return $content;
    }

    /** Display name of the source; loadMetadatas() appends ' Bridge'. */
    public function getName()
    {
        return 'Lichess Blog';
    }

    /** URI of the blog. */
    public function getURI()
    {
        return 'http://lichess.org/blog';
    }
}
|
@ -5,7 +5,7 @@ class T411Bridge extends BridgeAbstract {
|
||||
|
||||
$this->maintainer = "ORelio";
|
||||
$this->name = "T411";
|
||||
$this->uri = "https://t411.in/";
|
||||
$this->uri = $this->getURI();
|
||||
$this->description = "Returns the 5 newest torrents with specified search terms <br /> Use url part after '?' mark when using their search engine";
|
||||
$this->update = "2016-02-06";
|
||||
|
||||
@ -34,8 +34,8 @@ class T411Bridge extends BridgeAbstract {
|
||||
$this->returnError('You must specify a search criteria', 400);
|
||||
}
|
||||
|
||||
//Retrieve torrent listing as truncated rss, which does not contain torrent description
|
||||
$url = 'http://www.t411.in/torrents/search/?'.$param['search'].'&order=added&type=desc';
|
||||
//Retrieve torrent listing from search results, which does not contain torrent description
|
||||
$url = $this->getURI().'torrents/search/?'.$param['search'].'&order=added&type=desc';
|
||||
$html = file_get_html($url) or $this->returnError('Could not request t411: '.$url, 500);
|
||||
$results = $html->find('table.results', 0);
|
||||
if (is_null($results))
|
||||
@ -52,7 +52,7 @@ class T411Bridge extends BridgeAbstract {
|
||||
usleep(500000); //So we need to wait (500ms)
|
||||
|
||||
//Retrieve data from RSS entry
|
||||
$item_uri = 'http://'.ExtractFromDelimiters($element->outertext, '<a href="//', '"');
|
||||
$item_uri = $this->getURI().'torrents/details/?id='.ExtractFromDelimiters($element->find('a.nfo', 0)->outertext, '?id=', '"');
|
||||
$item_title = ExtractFromDelimiters($element->outertext, '" title="', '"');
|
||||
$item_date = strtotime($element->find('dd', 0)->plaintext);
|
||||
|
||||
@ -64,7 +64,7 @@ class T411Bridge extends BridgeAbstract {
|
||||
$item_author = $item_html->find('a.profile', 0)->innertext;
|
||||
|
||||
//Retrieve image for thumbnail or generic logo fallback
|
||||
$item_image = 'http://www.t411.in/themes/blue/images/logo.png';
|
||||
$item_image = $this->getURI().'themes/blue/images/logo.png';
|
||||
foreach ($item_desc->find('img') as $img) {
|
||||
if (strpos($img->src, 'prez') === false) {
|
||||
$item_image = $img->src;
|
||||
@ -92,7 +92,7 @@ class T411Bridge extends BridgeAbstract {
|
||||
}
|
||||
|
||||
public function getURI() {
|
||||
return 'https://t411.in';
|
||||
return 'https://t411.ch/';
|
||||
}
|
||||
|
||||
public function getCacheDuration() {
|
||||
|
@ -41,7 +41,7 @@ class TheOatmealBridge extends RssExpander{
|
||||
$item = new Item();
|
||||
$item->title = trim($newsItem->title);
|
||||
$this->message("browsing Oatmeal item ".var_export($newsItem, true));
|
||||
$item->uri=$newsItem->attributes($namespaces['rdf'])->about;
|
||||
$item->uri=(string) $newsItem->attributes($namespaces['rdf'])->about;
|
||||
// now load that uri from cache
|
||||
$this->message("now loading page ".$item->uri);
|
||||
$articlePage = str_get_html($this->get_cached($item->uri));
|
||||
@ -53,7 +53,7 @@ class TheOatmealBridge extends RssExpander{
|
||||
$item->content = $content->innertext;
|
||||
|
||||
$this->message("dc content is ".var_export($dc, true));
|
||||
$item->name = $dc->creator;
|
||||
$item->name = (string) $dc->creator;
|
||||
$item->timestamp = DateTime::createFromFormat(DateTime::ISO8601, $dc->date)->getTimestamp();
|
||||
$this->message("writtem by ".$item->name." on ".$item->timestamp);
|
||||
return $item;
|
||||
|
59
bridges/VineBridge.php
Normal file
59
bridges/VineBridge.php
Normal file
@ -0,0 +1,59 @@
|
||||
<?php
|
||||
/**
 * Bridge for Vine: lists the posts shown on a user's page in "list" mode.
 */
class VineBridge extends BridgeAbstract {

    /** Declares the bridge metadata and the required "u" (user id) parameter. */
    public function loadMetadatas() {

        $this->maintainer = "ckiw";
        $this->name = "Vine bridge";
        $this->uri = "http://vine.co/";
        $this->description = "Returns the latests vines from vine user page";
        $this->update = "2016-03-12";

        $this->parameters[] =
        '[
            {
                "name" : "User id",
                "identifier" : "u",
                "type" : "text",
                "required" : "true"
            }
        ]';
    }

    /**
     * Fetches the user's page and creates one item per ".post" element.
     *
     * @param array $param Request parameters; 'u' is the Vine user id.
     */
    public function collectData(array $param){

        // NOTE(review): returnError() is assumed to abort execution - confirm
        // against BridgeAbstract.
        if (!isset($param['u']) || $param['u'] === '')
            $this->returnError('You must specify a user id (?u=...).', 400);

        // The user id comes straight from the request: encode it so it cannot
        // alter the structure of the requested URL.
        $uri = 'http://vine.co/u/'.rawurlencode($param['u']).'?mode=list';

        $html = file_get_html($uri) or $this->returnError('No results for this query.', 404);

        foreach($html->find('.post') as $element) {

            // A post without a link cannot be turned into a feed item.
            $a = $element->find('a', 0);
            if (!is_object($a))
                continue;
            $a->href = str_replace('https://', 'http://', $a->href);

            // Drop the "Uploaded at" label before parsing the date. ltrim()
            // is not suitable here: its second argument is a set of
            // characters, not a prefix, so it would also eat leading
            // characters of the date that happen to be in that set.
            $time = false;
            $date_node = $element->find('p', 0);
            if (is_object($date_node))
                $time = strtotime(preg_replace('/^\s*Uploaded at\s*/', '', $date_node->plaintext));

            $video = $element->find('video', 0);
            if (is_object($video))
                $video->controls = "true";

            // The heading is removed from the post markup used as content.
            $heading = $element->find('h2', 0);
            if (is_object($heading))
                $heading->outertext = '';

            $item = new \Item();
            $item->uri = $a->href;
            $item->timestamp = $time;
            $item->title = $a->plaintext;
            // Store the markup as a string rather than the DOM node itself.
            $item->content = $element->outertext;

            $this->items[] = $item;
        }

    }

    /** Display name of the source. */
    public function getName(){
        return 'Vine';
    }

    /** Base URI of the site. */
    public function getURI(){
        return 'http://vine.co';
    }

    /** Cache lifetime in seconds. */
    public function getCacheDuration(){
        return 10; //seconds
    }
}
|
58
bridges/ZoneTelechargementBridge.php
Normal file
58
bridges/ZoneTelechargementBridge.php
Normal file
@ -0,0 +1,58 @@
|
||||
<?php
|
||||
/**
 * Bridge for Zone Telechargement: proxies the site's RSS feed, either the
 * main one or the one of a given category.
 */
class ZoneTelechargementBridge extends BridgeAbstract {

    /** Declares the bridge metadata and the optional "category" parameter. */
    public function loadMetadatas() {

        $this->maintainer = 'ORelio';
        $this->name = $this->getName();
        $this->uri = $this->getURI();
        $this->description = 'RSS proxy returning the newest releases.<br />You may specify a category found in RSS URLs, else main feed is selected.';
        $this->update = "2016-03-16";

        $this->parameters[] =
        '[
            {
                "name" : "Category",
                "identifier" : "category"
            }
        ]';
    }

    /**
     * Fetches the RSS feed and creates one item per feed entry.
     *
     * @param array $param Request parameters; 'category' optionally selects a
     *                     category feed (path as found in the site's RSS URLs).
     */
    public function collectData(array $param) {

        // getURI() already ends with a slash, so the category path must not
        // start with one (the URL used to contain a double slash). Each path
        // segment is encoded because the value comes from the request.
        $path = '';
        if (!empty($param['category'])) {
            $segments = array_filter(explode('/', $param['category']), 'strlen');
            if (!empty($segments))
                $path = implode('/', array_map('rawurlencode', $segments)).'/';
        }

        $url = $this->getURI().$path.'rss.xml';
        $html = file_get_html($url) or $this->returnError('Could not request Zone Telechargement: '.$url, 500);

        foreach($html->find('item') as $element) {
            $item = new \Item();
            $item->title = $element->find('title', 0)->plaintext;
            $item->uri = str_replace('http://', 'https://', $element->find('guid', 0)->plaintext);
            $item->timestamp = strtotime($element->find('pubDate', 0)->plaintext);
            $item->content = $this->stripCDATA($element->find('description', 0)->innertext);
            $this->items[] = $item;
        }
    }

    /**
     * Removes CDATA wrappers ("<![CDATA[" and "]]>") from a string.
     *
     * This is a method rather than a function declared inside collectData():
     * a nested named function is registered globally when the enclosing code
     * runs, so a second call (or another bridge declaring the same name)
     * triggers a "Cannot redeclare" fatal error.
     */
    private function stripCDATA($string) {
        return str_replace(array('<![CDATA[', ']]>'), '', $string);
    }

    /** Display name of the bridge. */
    public function getName() {
        return 'Zone Telechargement Bridge';
    }

    /** Base URI of the site, with a trailing slash. */
    public function getURI() {
        return 'https://www.zone-telechargement.com/';
    }

    /** Cache lifetime in seconds. */
    public function getCacheDuration() {
        return 3600;
    }
}
|
10
index.php
10
index.php
@ -14,7 +14,13 @@ TODO :
|
||||
|
||||
date_default_timezone_set('UTC');
|
||||
error_reporting(0);
|
||||
//ini_set('display_errors','1'); error_reporting(E_ALL); // For debugging only.
|
||||
|
||||
if(file_exists("DEBUG")) {
|
||||
|
||||
ini_set('display_errors','1'); error_reporting(E_ALL); //Report all errors
|
||||
define("DEBUG", "true");
|
||||
|
||||
}
|
||||
|
||||
require_once __DIR__ . '/lib/RssBridge.php';
|
||||
|
||||
@ -84,7 +90,7 @@ try{
|
||||
|
||||
// Data retrieval
|
||||
$bridge = Bridge::create($bridge);
|
||||
if(isset($_REQUEST["disable_cache"])) {
|
||||
if(defined("DEBUG")) {
|
||||
} else {
|
||||
$bridge->setCache($cache); // just add disable cache to your query to disable caching
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user