mirror of
https://github.com/RSS-Bridge/rss-bridge.git
synced 2025-04-23 15:06:53 +00:00
commit
9e998abfd1
1
.gitignore
vendored
1
.gitignore
vendored
@ -226,3 +226,4 @@ pip-log.txt
|
|||||||
##############
|
##############
|
||||||
/cache
|
/cache
|
||||||
/whitelist.txt
|
/whitelist.txt
|
||||||
|
DEBUG
|
||||||
|
@ -113,6 +113,7 @@ Technical notes
|
|||||||
===
|
===
|
||||||
* There is a cache so that source services won't ban you even if you hammer the rss-bridge with requests. Each bridge has a different duration for the cache. The `cache` subdirectory will be automatically created and cached objects older than 24 hours get purged.
|
* There is a cache so that source services won't ban you even if you hammer the rss-bridge with requests. Each bridge has a different duration for the cache. The `cache` subdirectory will be automatically created and cached objects older than 24 hours get purged.
|
||||||
* To implement a new rss-bridge, [follow the specifications](CREATE_BRIDGE.md) and take a look at existing bridges for examples.
|
* To implement a new rss-bridge, [follow the specifications](CREATE_BRIDGE.md) and take a look at existing bridges for examples.
|
||||||
|
* To enable debug mode (disabling cache and enabling error reporting), create an empty file named `DEBUG` in the root directory (next to `index.php`).
|
||||||
|
|
||||||
Rant
|
Rant
|
||||||
===
|
===
|
||||||
|
@ -33,10 +33,14 @@ class BandcampBridge extends BridgeAbstract{
|
|||||||
}
|
}
|
||||||
|
|
||||||
foreach($html->find('li.item') as $release) {
|
foreach($html->find('li.item') as $release) {
|
||||||
|
$script = $release->find('div.art', 0)->getAttribute('onclick');
|
||||||
|
$uri = ltrim($script, "return 'url(");
|
||||||
|
$uri = rtrim($uri, "')");
|
||||||
|
|
||||||
$item = new \Item();
|
$item = new \Item();
|
||||||
$item->name = $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
$item->name = $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||||
$item->title = $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
$item->title = $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||||
$item->content = '<img src="' . $release->find('img.art',0)->src . '"/><br/>' . $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
$item->content = '<img src="' . $uri . '"/><br/>' . $release->find('div.itemsubtext',0)->plaintext . ' - ' . $release->find('div.itemtext',0)->plaintext;
|
||||||
$item->id = $release->find('a',0)->getAttribute('href');
|
$item->id = $release->find('a',0)->getAttribute('href');
|
||||||
$item->uri = $release->find('a',0)->getAttribute('href');
|
$item->uri = $release->find('a',0)->getAttribute('href');
|
||||||
$this->items[] = $item;
|
$this->items[] = $item;
|
||||||
|
@ -9,7 +9,7 @@ class CNETBridge extends BridgeAbstract {
|
|||||||
$this->name = 'CNET News';
|
$this->name = 'CNET News';
|
||||||
$this->uri = 'http://www.cnet.com/';
|
$this->uri = 'http://www.cnet.com/';
|
||||||
$this->description = 'Returns the newest articles. <br /> You may specify a topic found in some section URLs, else all topics are selected.';
|
$this->description = 'Returns the newest articles. <br /> You may specify a topic found in some section URLs, else all topics are selected.';
|
||||||
$this->update = '2016-02-06';
|
$this->update = '2016-03-16';
|
||||||
|
|
||||||
$this->parameters[] =
|
$this->parameters[] =
|
||||||
'[
|
'[
|
||||||
@ -76,7 +76,7 @@ class CNETBridge extends BridgeAbstract {
|
|||||||
if (is_object($article_thumbnail))
|
if (is_object($article_thumbnail))
|
||||||
$article_thumbnail = $article_thumbnail->find('img', 0)->src;
|
$article_thumbnail = $article_thumbnail->find('img', 0)->src;
|
||||||
|
|
||||||
$article_content = trim(CleanArticle(ExtractFromDelimiters($article_html, '</div></div></div><div class="col-8">', '<footer>')));
|
$article_content = trim(CleanArticle(ExtractFromDelimiters($article_html, '<div class="articleContent', '<footer>')));
|
||||||
|
|
||||||
$item = new \Item();
|
$item = new \Item();
|
||||||
$item->uri = $article_uri;
|
$item->uri = $article_uri;
|
||||||
|
@ -13,52 +13,49 @@ class CourrierInternationalBridge extends BridgeAbstract{
|
|||||||
|
|
||||||
public function collectData(array $param){
|
public function collectData(array $param){
|
||||||
|
|
||||||
function fetchArticle($link) {
|
$html = '';
|
||||||
|
|
||||||
$page = file_get_html($link);
|
$html = file_get_html('http://www.courrierinternational.com/') or $this->returnError('Error.', 500);
|
||||||
|
|
||||||
$contenu = $page->find(".article-text")[0];
|
|
||||||
|
|
||||||
return strip_tags($contenu);
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
}
|
$element = $html->find("article");
|
||||||
|
|
||||||
$html = '';
|
$article_count = 1;
|
||||||
|
|
||||||
$html = file_get_html('http://www.courrierinternational.com/article') or $this->returnError('Error.', 500);
|
foreach($element as $article) {
|
||||||
|
|
||||||
|
$item = new \Item();
|
||||||
|
|
||||||
|
$item->uri = $article->parent->getAttribute("href");
|
||||||
|
|
||||||
$element = $html->find(".type-normal");
|
if(strpos($item->uri, "http") === FALSE) {
|
||||||
|
$item->uri = "http://courrierinternational.fr/".$item->uri;
|
||||||
|
}
|
||||||
|
|
||||||
$article_count = 1;
|
$page = file_get_html($item->uri);
|
||||||
|
|
||||||
foreach($element as $article) {
|
$cleaner = new HTMLSanitizer();
|
||||||
|
|
||||||
$item = new \Item();
|
$item->content = $cleaner->sanitize($page->find("div.article-text")[0]);
|
||||||
|
$item->title = strip_tags($article->find(".title")[0]);
|
||||||
|
|
||||||
$item->uri = "http://www.courrierinternational.com".$article->find("a")[0]->getAttribute("href");
|
$dateTime = date_parse($page->find("time")[0]);
|
||||||
$item->content = fetchArticle("http://www.courrierinternational.com".$article->find("a")[0]->getAttribute("href"));
|
|
||||||
$item->title = strip_tags($article->find("h2")[0]);
|
|
||||||
|
|
||||||
$dateTime = date_parse($article->find("time")[0]);
|
$item->timestamp = mktime(
|
||||||
|
|
||||||
$item->timestamp = mktime(
|
|
||||||
$dateTime['hour'],
|
$dateTime['hour'],
|
||||||
$dateTime['minute'],
|
$dateTime['minute'],
|
||||||
$dateTime['second'],
|
$dateTime['second'],
|
||||||
$dateTime['month'],
|
$dateTime['month'],
|
||||||
$dateTime['day'],
|
$dateTime['day'],
|
||||||
$dateTime['year']
|
$dateTime['year']
|
||||||
);
|
);
|
||||||
|
|
||||||
$this->items[] = $item;
|
$this->items[] = $item;
|
||||||
$article_count ++;
|
$article_count ++;
|
||||||
if($article_count > 5) break;
|
if($article_count > 5) break;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
@ -28,9 +28,9 @@ class Freenews extends RssExpander {
|
|||||||
$item->title = trim($newsItem->title);
|
$item->title = trim($newsItem->title);
|
||||||
// $this->message("item has for title \"".$item->title."\"");
|
// $this->message("item has for title \"".$item->title."\"");
|
||||||
if(empty($newsItem->guid)) {
|
if(empty($newsItem->guid)) {
|
||||||
$item->uri = $newsItem->link;
|
$item->uri = (string) $newsItem->link;
|
||||||
} else {
|
} else {
|
||||||
$item->uri = $newsItem->guid;
|
$item->uri = (string) $newsItem->guid;
|
||||||
}
|
}
|
||||||
// now load that uri from cache
|
// now load that uri from cache
|
||||||
// $this->message("now loading page ".$item->uri);
|
// $this->message("now loading page ".$item->uri);
|
||||||
|
219
bridges/FuturaSciencesBridge.php
Normal file
219
bridges/FuturaSciencesBridge.php
Normal file
@ -0,0 +1,219 @@
|
|||||||
|
<?php
|
||||||
|
/**
 * Bridge for the Futura-Sciences RSS feeds.
 *
 * Reads one of the site's RSS feeds, then downloads each listed article page
 * and uses its cleaned-up "div.content" markup as the item content.
 */
class FuturaSciencesBridge extends BridgeAbstract {

    /**
     * Declares the bridge metadata and the "feed" list parameter.
     *
     * Entries of the list whose value is empty are visual separators or
     * section headings; collectData() rejects them as "no feed selected".
     */
    public function loadMetadatas() {

        $this->maintainer = 'ORelio';
        $this->name = $this->getName();
        $this->uri = $this->getURI();
        $this->description = 'Returns the newest articles.';
        $this->update = '2016-03-20';

        $this->parameters[] =
        '[
            {
                "name" : "Feed",
                "type" : "list",
                "identifier" : "feed",
                "values" :
                [
                    { "name" : "---- Select ----", "value" : "" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux multi-magazines", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Sciences", "value" : "actualites" },
                    { "name" : " Les dernières définitions de Futura-Sciences", "value" : "definitions" },
                    { "name" : " Les dernières photos de Futura-Sciences", "value" : "photos" },
                    { "name" : " Les dernières questions - réponses de Futura-Sciences", "value" : "questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Sciences", "value" : "dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Services", "value" : "" },

                    { "name" : " Les cartes virtuelles de Futura-Sciences", "value" : "services/cartes-virtuelles" },
                    { "name" : " Les fonds d\'écran de Futura-Sciences", "value" : "services/fonds-ecran" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Santé", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Santé", "value" : "sante/actualites" },
                    { "name" : " Les dernières définitions de Futura-Santé", "value" : "sante/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Santé", "value" : "sante/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Santé", "value" : "sante/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux High-Tech", "value" : "" },

                    { "name" : " Les dernières actualités de Futura High-Tech", "value" : "high-tech/actualites" },
                    { "name" : " Les dernières astuces de Futura High-Tech", "value" : "high-tech/questions-reponses" },
                    { "name" : " Les dernières définitions de Futura High-Tech", "value" : "high-tech/definitions" },
                    { "name" : " Les derniers dossiers de Futura High-Tech", "value" : "high-tech/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Espace", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Espace", "value" : "espace/actualites" },
                    { "name" : " Les dernières définitions de Futura-Espace", "value" : "espace/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Espace", "value" : "espace/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Espace", "value" : "espace/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Environnement", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Environnement", "value" : "environnement/actualites" },
                    { "name" : " Les dernières définitions de Futura-Environnement", "value" : "environnement/definitions" },
                    { "name" : " Les dernières questions - réponses de Futura-Environnement", "value" : "environnement/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Environnement", "value" : "environnement/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Maison", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Maison", "value" : "maison/actualites" },
                    { "name" : " Les dernières astuces de Futura-Maison", "value" : "maison/questions-reponses" },
                    { "name" : " Les dernières définitions de Futura-Maison", "value" : "maison/definitions" },
                    { "name" : " Les derniers dossiers de Futura-Maison", "value" : "maison/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Nature", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Nature", "value" : "nature/actualites" },
                    { "name" : " Les dernières définitions de Futura-Nature", "value" : "nature/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Nature", "value" : "nature/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Nature", "value" : "nature/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Terre", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Terre", "value" : "terre/actualites" },
                    { "name" : " Les dernières définitions de Futura-Terre", "value" : "terre/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Terre", "value" : "terre/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Terre", "value" : "terre/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Matière", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Matière", "value" : "matiere/actualites" },
                    { "name" : " Les dernières définitions de Futura-Matière", "value" : "matiere/definitions" },
                    { "name" : " Les dernières questions-réponses de Futura-Matière", "value" : "matiere/questions-reponses" },
                    { "name" : " Les derniers dossiers de Futura-Matière", "value" : "matiere/dossiers" },

                    { "name" : "", "value" : "" },
                    { "name" : "Les flux Mathématiques", "value" : "" },

                    { "name" : " Les dernières actualités de Futura-Mathématiques", "value" : "mathematiques/actualites" },
                    { "name" : " Les derniers dossiers de Futura-Mathématiques", "value" : "mathematiques/dossiers" }
                ]
            }
        ]';

    }

    /**
     * Fetches the selected feed and expands up to 10 entries into full items.
     *
     * @param array $param Request parameters; 'feed' is the feed path
     *                     (letters, dashes and at most one slash, 64 chars max).
     */
    public function collectData(array $param) {

        if (empty($param['feed']))
            $this->returnError('Please select a feed to display.', 400);

        // The feed value is inserted into the request URL, so only accept the
        // restricted character set used by the values declared in loadMetadatas().
        if ($param['feed'] !== preg_replace('/[^a-zA-Z-\/]+/', '', $param['feed'])
            || substr_count($param['feed'], '/') > 1
            || strlen($param['feed']) > 64)
            $this->returnError('Invalid "feed" parameter.', 400);

        $url = $this->getURI().'rss/'.$param['feed'].'.xml';
        $html = file_get_html($url) or $this->returnError('Could not request Futura-Sciences: '.$url, 500);
        $limit = 0;

        foreach ($html->find('item') as $element) {

            // Each item costs one extra HTTP request, so stop after 10.
            if ($limit >= 10)
                break;

            // The guid carries a tracking fragment that is not part of the article URL.
            $article_url = str_replace('#xtor=RSS-8', '', $this->stripCDATA($element->find('guid', 0)->plaintext));
            $article = file_get_html($article_url) or $this->returnError('Could not request Futura-Sciences: '.$article_url, 500);
            $contents = $article->find('div.content', 0)->innertext;

            // Prefer the author shown on the page; fall back to the feed entry.
            $author = trim(str_replace(', Futura-Sciences', '', $article->find('span.author', 0)->plaintext));
            if (empty($author))
                $author = $this->stripCDATA($element->find('author', 0)->plaintext);

            // Page furniture (share bars, toolbars, comments...) removed from the article body.
            foreach (array(
                '<div class="clear',
                '<div class="sharebar2',
                '<div class="diaporamafullscreen"',
                '<div style="margin-bottom:10px;" class="noprint"',
                '<div class="ficheprevnext',
                '<div class="bar noprint',
                '<div class="toolbar noprint',
                '<div class="addthis_toolbox',
                '<div class="noprint',
                '<div class="bg bglight border border-full noprint',
                '<div class="httplogbar-wrapper noprint',
                '<div id="forumcomments'
            ) as $div_start) {
                $contents = $this->stripRecursiveHTMLSection($contents, 'div', $div_start);
            }

            $contents = $this->stripWithDelimiters($contents, '<hr ', '/>');
            $contents = $this->stripWithDelimiters($contents, '<p class="content-date', '</p>');
            $contents = $this->stripWithDelimiters($contents, '<h1 class="content-title', '</h1>');
            $contents = $this->stripWithDelimiters($contents, 'fs:definition="', '"');
            $contents = $this->stripWithDelimiters($contents, 'fs:xt:clicktype="', '"');
            $contents = $this->stripWithDelimiters($contents, 'fs:xt:clickname="', '"');

            $item = new \Item();
            $item->author = $author;
            $item->uri = $article_url;
            $item->title = $this->stripCDATA($element->find('title', 0)->innertext);
            $item->thumbnailUri = $this->stripCDATA($element->find('enclosure', 0)->url);
            $item->timestamp = strtotime($this->stripCDATA($element->find('pubDate', 0)->plaintext));
            $item->content = trim($contents);
            $this->items[] = $item;
            $limit++;
        }

    }

    /**
     * Removes the CDATA opening and closing markers from a string.
     *
     * Implemented as a method rather than a function declared inside
     * collectData(): a nested named function is registered globally the first
     * time the enclosing method runs and cannot be declared a second time.
     */
    private function stripCDATA($string) {
        return str_replace(array('<![CDATA[', ']]>'), '', $string);
    }

    /**
     * Removes every "$start ... $end" section (delimiters included) from $string.
     *
     * The end delimiter is searched for after the start delimiter, so a start
     * token that itself contains the end token (e.g. 'attr="' with '"') removes
     * the whole attribute. A start without a matching end is left untouched.
     */
    private function stripWithDelimiters($string, $start, $end) {
        while (($section_start = strpos($string, $start)) !== false) {
            $section_end = strpos($string, $end, $section_start + strlen($start));
            if ($section_end === false)
                break; // unterminated section: nothing sensible to remove
            $string = substr($string, 0, $section_start).substr($string, $section_end + strlen($end));
        }
        return $string;
    }

    /**
     * Removes every element starting with $tag_start, including nested
     * elements of the same tag name, from $string.
     *
     * @param string $string    HTML to clean.
     * @param string $tag_name  Tag name, e.g. 'div'.
     * @param string $tag_start Beginning of the opening tag to look for; must
     *                          itself start with '<' followed by $tag_name,
     *                          otherwise $string is returned unchanged.
     */
    private function stripRecursiveHTMLSection($string, $tag_name, $tag_start) {
        $open_tag = '<'.$tag_name;
        $close_tag = '</'.$tag_name.'>';
        $close_tag_length = strlen($close_tag);

        if (strpos($tag_start, $open_tag) !== 0)
            return $string;

        while (($section_start = strpos($string, $tag_start)) !== false) {
            $max_recursion = 100; // upper bound on nested closing tags examined per section
            $search_offset = $section_start;

            // Extend the section one closing tag at a time until it holds as
            // many closing tags as opening tags.
            do {
                $max_recursion--;
                $section_end = strpos($string, $close_tag, $search_offset);
                if ($section_end === false)
                    return $string; // unbalanced markup: stop instead of looping forever
                $search_offset = $section_end + $close_tag_length;
                $section_to_remove = substr($string, $section_start, $search_offset - $section_start);
                $open_tag_count = substr_count($section_to_remove, $open_tag);
                $close_tag_count = substr_count($section_to_remove, $close_tag);
            } while ($open_tag_count > $close_tag_count && $max_recursion > 0);

            $string = str_replace($section_to_remove, '', $string);
        }

        return $string;
    }

    /** Returns the display name of this bridge. */
    public function getName() {
        return 'Futura-Sciences Bridge';
    }

    /** Returns the site base URL, with trailing slash. */
    public function getURI() {
        return 'http://www.futura-sciences.com/';
    }

    /** Returns the cache duration value for this bridge (3600). */
    public function getCacheDuration() {
        return 3600;
    }
}
|
61
bridges/LichessBridge.php
Normal file
61
bridges/LichessBridge.php
Normal file
@ -0,0 +1,61 @@
|
|||||||
|
<?php
|
||||||
|
|
||||||
|
/**
 * Bridge returning the newest Lichess blog posts with their full text,
 * fetched from each post page.
 */
class LichessBridge extends BridgeAbstract
{
    /** Declares the bridge metadata. */
    public function loadMetadatas()
    {
        $this->maintainer = 'AmauryCarrade';
        $this->name = $this->getName() . ' Bridge';
        $this->uri = $this->getURI();
        $this->description = 'Returns the 5 newest posts from the Lichess blog (full text)';
        $this->update = "2016-03-22";
    }

    /**
     * Reads the blog Atom feed and builds one item for each of the first 5 entries.
     *
     * @param array $param Request parameters (unused by this bridge).
     */
    public function collectData(array $param)
    {
        $xml_feed = file_get_html('http://fr.lichess.org/blog.atom') or $this->returnError('Could not retrieve Lichess blog feed.', 404);

        $posts_loaded = 0;
        foreach ($xml_feed->find('entry') as $entry)
        {
            // Every post needs its own page download, so stop at 5.
            if ($posts_loaded >= 5)
            {
                break;
            }

            // Guard the chained lookup: calling find() on a missing <author> would be fatal.
            $author = $entry->find('author', 0);
            $author_name = is_object($author) ? $author->find('name', 0) : null;

            $item = new \Item();

            $item->title = html_entity_decode($entry->find('title', 0)->innertext);
            $item->author = is_object($author_name) ? $author_name->innertext : '';
            $item->uri = $entry->find('id', 0)->plaintext;
            $item->timestamp = strtotime($entry->find('published', 0)->plaintext);

            $item->content = $this->retrieve_lichess_post($item->uri);

            $this->items[] = $item;
            $posts_loaded++;
        }
    }

    /**
     * Downloads a blog post page and returns its lede and body as HTML.
     *
     * @param string $blog_post_uri URL of the post page.
     * @return string HTML content; an empty string when the page has no
     *                '#lichess_blog' container.
     */
    private function retrieve_lichess_post($blog_post_uri)
    {
        $blog_post_html = file_get_html($blog_post_uri) or $this->returnError('Could not retrieve Lichess blog post: ' . $blog_post_uri, 500);

        $blog_post_div = $blog_post_html->find('#lichess_blog', 0);
        if (!is_object($blog_post_div))
        {
            // Unexpected page layout: keep the item, without content.
            return '';
        }

        $post_chapo = $blog_post_div->find('.shortlede', 0)->innertext;
        $post_content = $blog_post_div->find('.body', 0)->innertext;

        $content = '<p><em>' . $post_chapo . '</em></p>';
        $content .= '<div>' . $post_content . '</div>';

        return $content;
    }

    /** Returns the name of the source; loadMetadatas() appends ' Bridge' to it. */
    public function getName()
    {
        return 'Lichess Blog';
    }

    /** Returns the URL of the Lichess blog. */
    public function getURI()
    {
        return 'http://lichess.org/blog';
    }
}
|
@ -5,7 +5,7 @@ class T411Bridge extends BridgeAbstract {
|
|||||||
|
|
||||||
$this->maintainer = "ORelio";
|
$this->maintainer = "ORelio";
|
||||||
$this->name = "T411";
|
$this->name = "T411";
|
||||||
$this->uri = "https://t411.in/";
|
$this->uri = $this->getURI();
|
||||||
$this->description = "Returns the 5 newest torrents with specified search terms <br /> Use url part after '?' mark when using their search engine";
|
$this->description = "Returns the 5 newest torrents with specified search terms <br /> Use url part after '?' mark when using their search engine";
|
||||||
$this->update = "2016-02-06";
|
$this->update = "2016-02-06";
|
||||||
|
|
||||||
@ -34,8 +34,8 @@ class T411Bridge extends BridgeAbstract {
|
|||||||
$this->returnError('You must specify a search criteria', 400);
|
$this->returnError('You must specify a search criteria', 400);
|
||||||
}
|
}
|
||||||
|
|
||||||
//Retrieve torrent listing as truncated rss, which does not contain torrent description
|
//Retrieve torrent listing from search results, which does not contain torrent description
|
||||||
$url = 'http://www.t411.in/torrents/search/?'.$param['search'].'&order=added&type=desc';
|
$url = $this->getURI().'torrents/search/?'.$param['search'].'&order=added&type=desc';
|
||||||
$html = file_get_html($url) or $this->returnError('Could not request t411: '.$url, 500);
|
$html = file_get_html($url) or $this->returnError('Could not request t411: '.$url, 500);
|
||||||
$results = $html->find('table.results', 0);
|
$results = $html->find('table.results', 0);
|
||||||
if (is_null($results))
|
if (is_null($results))
|
||||||
@ -52,7 +52,7 @@ class T411Bridge extends BridgeAbstract {
|
|||||||
usleep(500000); //So we need to wait (500ms)
|
usleep(500000); //So we need to wait (500ms)
|
||||||
|
|
||||||
//Retrieve data from RSS entry
|
//Retrieve data from RSS entry
|
||||||
$item_uri = 'http://'.ExtractFromDelimiters($element->outertext, '<a href="//', '"');
|
$item_uri = $this->getURI().'torrents/details/?id='.ExtractFromDelimiters($element->find('a.nfo', 0)->outertext, '?id=', '"');
|
||||||
$item_title = ExtractFromDelimiters($element->outertext, '" title="', '"');
|
$item_title = ExtractFromDelimiters($element->outertext, '" title="', '"');
|
||||||
$item_date = strtotime($element->find('dd', 0)->plaintext);
|
$item_date = strtotime($element->find('dd', 0)->plaintext);
|
||||||
|
|
||||||
@ -64,7 +64,7 @@ class T411Bridge extends BridgeAbstract {
|
|||||||
$item_author = $item_html->find('a.profile', 0)->innertext;
|
$item_author = $item_html->find('a.profile', 0)->innertext;
|
||||||
|
|
||||||
//Retrieve image for thumbnail or generic logo fallback
|
//Retrieve image for thumbnail or generic logo fallback
|
||||||
$item_image = 'http://www.t411.in/themes/blue/images/logo.png';
|
$item_image = $this->getURI().'themes/blue/images/logo.png';
|
||||||
foreach ($item_desc->find('img') as $img) {
|
foreach ($item_desc->find('img') as $img) {
|
||||||
if (strpos($img->src, 'prez') === false) {
|
if (strpos($img->src, 'prez') === false) {
|
||||||
$item_image = $img->src;
|
$item_image = $img->src;
|
||||||
@ -92,7 +92,7 @@ class T411Bridge extends BridgeAbstract {
|
|||||||
}
|
}
|
||||||
|
|
||||||
public function getURI() {
|
public function getURI() {
|
||||||
return 'https://t411.in';
|
return 'https://t411.ch/';
|
||||||
}
|
}
|
||||||
|
|
||||||
public function getCacheDuration() {
|
public function getCacheDuration() {
|
||||||
|
@ -41,7 +41,7 @@ class TheOatmealBridge extends RssExpander{
|
|||||||
$item = new Item();
|
$item = new Item();
|
||||||
$item->title = trim($newsItem->title);
|
$item->title = trim($newsItem->title);
|
||||||
$this->message("browsing Oatmeal item ".var_export($newsItem, true));
|
$this->message("browsing Oatmeal item ".var_export($newsItem, true));
|
||||||
$item->uri=$newsItem->attributes($namespaces['rdf'])->about;
|
$item->uri=(string) $newsItem->attributes($namespaces['rdf'])->about;
|
||||||
// now load that uri from cache
|
// now load that uri from cache
|
||||||
$this->message("now loading page ".$item->uri);
|
$this->message("now loading page ".$item->uri);
|
||||||
$articlePage = str_get_html($this->get_cached($item->uri));
|
$articlePage = str_get_html($this->get_cached($item->uri));
|
||||||
@ -53,7 +53,7 @@ class TheOatmealBridge extends RssExpander{
|
|||||||
$item->content = $content->innertext;
|
$item->content = $content->innertext;
|
||||||
|
|
||||||
$this->message("dc content is ".var_export($dc, true));
|
$this->message("dc content is ".var_export($dc, true));
|
||||||
$item->name = $dc->creator;
|
$item->name = (string) $dc->creator;
|
||||||
$item->timestamp = DateTime::createFromFormat(DateTime::ISO8601, $dc->date)->getTimestamp();
|
$item->timestamp = DateTime::createFromFormat(DateTime::ISO8601, $dc->date)->getTimestamp();
|
||||||
$this->message("writtem by ".$item->name." on ".$item->timestamp);
|
$this->message("writtem by ".$item->name." on ".$item->timestamp);
|
||||||
return $item;
|
return $item;
|
||||||
|
59
bridges/VineBridge.php
Normal file
59
bridges/VineBridge.php
Normal file
@ -0,0 +1,59 @@
|
|||||||
|
<?php
|
||||||
|
/**
 * Bridge returning the vines listed on a Vine user page.
 */
class VineBridge extends BridgeAbstract {

    /** Declares the bridge metadata and the required "u" (user id) parameter. */
    public function loadMetadatas() {

        $this->maintainer = "ckiw";
        $this->name = "Vine bridge";
        $this->uri = "http://vine.co/";
        $this->description = "Returns the latests vines from vine user page";
        $this->update = "2016-03-12";

        $this->parameters[] =
        '[
            {
                "name" : "User id",
                "identifier" : "u",
                "type" : "text",
                "required" : "true"
            }
        ]';
    }

    /**
     * Loads the user's page in list mode and builds one item per '.post' element.
     *
     * @param array $param Request parameters; 'u' is the Vine user id.
     */
    public function collectData(array $param){

        if (empty($param['u']))
            $this->returnError('You must specify a user id.', 400);

        // The user id comes from the request, so encode it before building the URL.
        $uri = 'http://vine.co/u/'.urlencode($param['u']).'?mode=list';

        $html = file_get_html($uri) or $this->returnError('No results for this query.', 404);

        $prefix = 'Uploaded at ';

        foreach($html->find('.post') as $element) {

            $a = $element->find('a', 0);
            if (!is_object($a))
                continue; // no link: nothing to point the item at

            $a->href = str_replace('https://', 'http://', $a->href);

            // Remove the literal "Uploaded at " prefix. ltrim() cannot be used
            // for this: its second argument is a set of characters, not a prefix.
            $uploaded = trim($element->find('p', 0)->plaintext);
            if (strpos($uploaded, $prefix) === 0)
                $uploaded = substr($uploaded, strlen($prefix));
            $time = strtotime($uploaded);

            $video = $element->find('video', 0);
            if (is_object($video))
                $video->controls = "true";

            // Drop the heading from the markup used as item content.
            $heading = $element->find('h2', 0);
            if (is_object($heading))
                $heading->outertext = '';

            $item = new \Item();
            $item->uri = $a->href;
            $item->timestamp = $time;
            $item->title = $a->plaintext;
            // Store the markup as a string, not the DOM node object.
            $item->content = $element->outertext;

            $this->items[] = $item;
        }

    }

    /** Returns the name of the source. */
    public function getName(){
        return 'Vine';
    }

    /** Returns the base URL of the source. */
    public function getURI(){
        return 'http://vine.co';
    }

    /** Returns the cache duration, in seconds. */
    public function getCacheDuration(){
        return 10; //seconds
    }
}
|
58
bridges/ZoneTelechargementBridge.php
Normal file
58
bridges/ZoneTelechargementBridge.php
Normal file
@ -0,0 +1,58 @@
|
|||||||
|
<?php
|
||||||
|
/**
 * Bridge relaying the Zone Telechargement RSS feed, optionally for one category.
 */
class ZoneTelechargementBridge extends BridgeAbstract {

    /** Declares the bridge metadata and the optional "category" parameter. */
    public function loadMetadatas() {

        $this->maintainer = 'ORelio';
        $this->name = $this->getName();
        $this->uri = $this->getURI();
        $this->description = 'RSS proxy returning the newest releases.<br />You may specify a category found in RSS URLs, else main feed is selected.';
        $this->update = "2016-03-16";

        $this->parameters[] =
        '[
            {
                "name" : "Category",
                "identifier" : "category"
            }
        ]';
    }

    /**
     * Fetches the main or category feed and converts each entry into an item.
     *
     * @param array $param Request parameters; 'category' (optional) is the
     *                     path segment placed before 'rss.xml'.
     */
    public function collectData(array $param) {

        // getURI() already ends with a slash; build the path without adding
        // another one so the request URL contains no '//' after the host.
        $category = '';
        if (!empty($param['category']))
            $category = trim($param['category'], '/');
        if ($category !== '')
            $category .= '/';

        $url = $this->getURI().$category.'rss.xml';
        $html = file_get_html($url) or $this->returnError('Could not request Zone Telechargement: '.$url, 500);

        foreach($html->find('item') as $element) {
            $item = new \Item();
            $item->title = $element->find('title', 0)->plaintext;
            $item->uri = str_replace('http://', 'https://', $element->find('guid', 0)->plaintext);
            $item->timestamp = strtotime($element->find('pubDate', 0)->plaintext);
            $item->content = $this->stripCDATA($element->find('description', 0)->innertext);
            $this->items[] = $item;
        }
    }

    /**
     * Removes the CDATA opening and closing markers from a string.
     *
     * Implemented as a method rather than a function declared inside
     * collectData(): a nested named function is registered globally the first
     * time the enclosing method runs and cannot be declared a second time.
     */
    private function stripCDATA($string) {
        return str_replace(array('<![CDATA[', ']]>'), '', $string);
    }

    /** Returns the display name of this bridge. */
    public function getName() {
        return 'Zone Telechargement Bridge';
    }

    /** Returns the site base URL, with trailing slash. */
    public function getURI() {
        return 'https://www.zone-telechargement.com/';
    }

    /** Returns the cache duration value for this bridge (3600). */
    public function getCacheDuration() {
        return 3600;
    }
}
|
10
index.php
10
index.php
@ -14,7 +14,13 @@ TODO :
|
|||||||
|
|
||||||
date_default_timezone_set('UTC');
|
date_default_timezone_set('UTC');
|
||||||
error_reporting(0);
|
error_reporting(0);
|
||||||
//ini_set('display_errors','1'); error_reporting(E_ALL); // For debugging only.
|
|
||||||
|
if(file_exists("DEBUG")) {
|
||||||
|
|
||||||
|
ini_set('display_errors','1'); error_reporting(E_ALL); //Report all errors
|
||||||
|
define("DEBUG", "true");
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
require_once __DIR__ . '/lib/RssBridge.php';
|
require_once __DIR__ . '/lib/RssBridge.php';
|
||||||
|
|
||||||
@ -84,7 +90,7 @@ try{
|
|||||||
|
|
||||||
// Data retrieval
|
// Data retrieval
|
||||||
$bridge = Bridge::create($bridge);
|
$bridge = Bridge::create($bridge);
|
||||||
if(isset($_REQUEST["disable_cache"])) {
|
if(defined("DEBUG")) {
|
||||||
} else {
|
} else {
|
||||||
$bridge->setCache($cache); // just add disable cache to your query to disable caching
|
$bridge->setCache($cache); // just add disable cache to your query to disable caching
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user