diff --git a/bridges/AnidexBridge.php b/bridges/AnidexBridge.php new file mode 100644 index 00000000..a89cb567 --- /dev/null +++ b/bridges/AnidexBridge.php @@ -0,0 +1,207 @@ + array( + 'name' => 'Category', + 'type' => 'list', + 'values' => array( + 'All categories' => '0', + 'Anime' => '1,2,3', + 'Anime - Sub' => '1', + 'Anime - Raw' => '2', + 'Anime - Dub' => '3', + 'Live Action' => '4,5', + 'Live Action - Sub' => '4', + 'Live Action - Raw' => '5', + 'Light Novel' => '6', + 'Manga' => '7,8', + 'Manga - Translated' => '7', + 'Manga - Raw' => '8', + 'Music' => '9,10,11', + 'Music - Lossy' => '9', + 'Music - Lossless' => '10', + 'Music - Video' => '11', + 'Games' => '12', + 'Applications' => '13', + 'Pictures' => '14', + 'Adult Video' => '15', + 'Other' => '16' + ) + ), + 'lang_id' => array( + 'name' => 'Language', + 'type' => 'list', + 'values' => array( + 'All languages' => '0', + 'English' => '1', + 'Japanese' => '2', + 'Polish' => '3', + 'Serbo-Croatian' => '4', + 'Dutch' => '5', + 'Italian' => '6', + 'Russian' => '7', + 'German' => '8', + 'Hungarian' => '9', + 'French' => '10', + 'Finnish' => '11', + 'Vietnamese' => '12', + 'Greek' => '13', + 'Bulgarian' => '14', + 'Spanish (Spain)' => '15', + 'Portuguese (Brazil)' => '16', + 'Portuguese (Portugal)' => '17', + 'Swedish' => '18', + 'Arabic' => '19', + 'Danish' => '20', + 'Chinese (Simplified)' => '21', + 'Bengali' => '22', + 'Romanian' => '23', + 'Czech' => '24', + 'Mongolian' => '25', + 'Turkish' => '26', + 'Indonesian' => '27', + 'Korean' => '28', + 'Spanish (LATAM)' => '29', + 'Persian' => '30', + 'Malaysian' => '31' + ) + ), + 'group_id' => array( + 'name' => 'Group ID', + 'type' => 'number' + ), + 'r' => array( + 'name' => 'Hide Remakes', + 'type' => 'checkbox' + ), + 'b' => array( + 'name' => 'Only Batches', + 'type' => 'checkbox' + ), + 'a' => array( + 'name' => 'Only Authorized', + 'type' => 'checkbox' + ), + 'q' => array( + 'name' => 'Keyword', + 'description' => 'Keyword(s)', + 'type' => 'text' + ), + 'h' => array( + 'name' => 'Adult content', + 'type' => 'list', + 'values' => array( + 'No filter' => '0', + 'Hide +18' => '1', + 'Only +18' => '2' + ) + ) + ) + ); + + public function collectData() { + + // Build Search URL from user-provided parameters + $search_url = self::URI . '?s=upload_timestamp&o=desc'; + foreach (array('id', 'lang_id', 'group_id') as $param_name) { + $param = $this->getInput($param_name); + if (!empty($param) && intval($param) != 0 && ctype_digit(str_replace(',', '', $param))) { + $search_url .= '&' . $param_name . '=' . $param; + } + } + foreach (array('r', 'b', 'a') as $param_name) { + $param = $this->getInput($param_name); + if (!empty($param) && boolval($param)) { + $search_url .= '&' . $param_name . '=1'; + } + } + $query = $this->getInput('q'); + if (!empty($query)) { + $search_url .= '&q=' . urlencode($query); + } + $opt = array(); + $h = $this->getInput('h'); + if (!empty($h) && intval($h) != 0 && ctype_digit($h)) { + $opt[CURLOPT_COOKIE] = 'anidex_h_toggle=' . $h; + } + + // Retrieve torrent listing from search results, which does not contain torrent description + $html = getSimpleHTMLDOM($search_url, array(), $opt) + or returnServerError('Could not request Anidex: ' . $search_url); + $links = $html->find('a'); + $results = array(); + foreach ($links as $link) + if (strpos($link->href, '/torrent/') === 0 && !in_array($link->href, $results)) + $results[] = $link->href; + if (empty($results) && empty($this->getInput('q'))) + returnServerError('No results from Anidex: '.$search_url); + + //Process each item individually + foreach ($results as $element) { + + //Limit total amount of requests + if(count($this->items) >= 20) { + break; + } + + $torrent_id = str_replace('/torrent/', '', $element); + + //Ignore entries without valid torrent ID + if ($torrent_id != 0 && ctype_digit($torrent_id)) { + + //Retrieve data for this torrent ID + $item_uri = self::URI . 'torrent/'.$torrent_id; + + //Retrieve full description from torrent page + if ($item_html = getSimpleHTMLDOMCached($item_uri)) { + + //Retrieve data from page contents + $item_title = str_replace(' (Torrent) - AniDex ', '', $item_html->find('title', 0)->plaintext); + $item_desc = $item_html->find('div.panel-body', 0); + $item_author = trim($item_html->find('span.fa-user', 0)->parent()->plaintext); + $item_date = strtotime(trim($item_html->find('span.fa-clock', 0)->parent()->plaintext)); + $item_image = $this->getURI() . 'images/user_logos/default.png'; + + //Check for description-less torrent andn optionally extract image + $desc_title_found = false; + foreach ($item_html->find('h3.panel-title') as $h3) { + if (strpos($h3, 'Description') !== false) { + $desc_title_found = true; + break; + } + } + if ($desc_title_found) { + //Retrieve image for thumbnail or generic logo fallback + foreach ($item_desc->find('img') as $img) { + if (strpos($img->src, 'prez') === false) { + $item_image = $img->src; + break; + } + } + $item_desc = trim($item_desc->innertext); + } else { + $item_desc = 'No description.'; + } + + //Build and add final item + $item = array(); + $item['uri'] = $item_uri; + $item['title'] = $item_title; + $item['author'] = $item_author; + $item['timestamp'] = $item_date; + $item['enclosures'] = array($item_image); + $item['content'] = $item_desc; + $this->items[] = $item; + } + } + $element = null; + } + $results = null; + } +} diff --git a/bridges/AnimeUltimeBridge.php b/bridges/AnimeUltimeBridge.php index 6c5427e5..5c719b92 100644 --- a/bridges/AnimeUltimeBridge.php +++ b/bridges/AnimeUltimeBridge.php @@ -5,7 +5,7 @@ class AnimeUltimeBridge extends BridgeAbstract { const NAME = 'Anime-Ultime'; const URI = 'http://www.anime-ultime.net/'; const CACHE_TIMEOUT = 10800; // 3h - const DESCRIPTION = 'Returns the 10 newest releases posted on Anime-Ultime'; + const DESCRIPTION = 'Returns the newest releases posted on Anime-Ultime.'; const PARAMETERS = array( array( 'type' => array( 'name' => 'Type', @@ -65,6 +65,13 @@ class AnimeUltimeBridge extends BridgeAbstract { $item_link_element = $release->find('td', 0)->find('a', 0); $item_uri = self::URI . $item_link_element->href; $item_name = html_entity_decode($item_link_element->plaintext); + + $item_image = self::URI . substr( + $item_link_element->onmouseover, + 37, + strpos($item_link_element->onmouseover, ' ', 37) - 37 + ); + $item_episode = html_entity_decode( str_pad( $release->find('td', 1)->plaintext, @@ -79,8 +86,7 @@ class AnimeUltimeBridge extends BridgeAbstract { if(!empty($item_uri)) { - // Retrieve description from description page and - // convert relative image src info absolute image src + // Retrieve description from description page $html_item = getContents($item_uri) or returnServerError('Could not request Anime-Ultime: ' . $item_uri); $item_description = substr( @@ -91,10 +97,9 @@ class AnimeUltimeBridge extends BridgeAbstract { 0, strpos($item_description, '
') ); - $item_description = str_replace( - 'src="images', 'src="' . self::URI . 'images', - $item_description - ); + + // Convert relative image src into absolute image src, remove line breaks + $item_description = defaultLinkTo($item_description, self::URI); $item_description = str_replace("\r", '', $item_description); $item_description = str_replace("\n", '', $item_description); $item_description = utf8_encode($item_description); @@ -105,6 +110,7 @@ class AnimeUltimeBridge extends BridgeAbstract { $item['title'] = $item_name . ' ' . $item_type . ' ' . $item_episode; $item['author'] = $item_fansub; $item['timestamp'] = $item_date; + $item['enclosures'] = array($item_image); $item['content'] = $item_description; $this->items[] = $item; $processedOK++; diff --git a/bridges/CNETBridge.php b/bridges/CNETBridge.php new file mode 100644 index 00000000..bd41febc --- /dev/null +++ b/bridges/CNETBridge.php @@ -0,0 +1,109 @@ + array( + 'name' => 'Topic', + 'type' => 'list', + 'values' => array( + 'All articles' => '', + 'Apple' => 'apple', + 'Google' => 'google', + 'Microsoft' => 'tags-microsoft', + 'Computers' => 'topics-computers', + 'Mobile' => 'topics-mobile', + 'Sci-Tech' => 'topics-sci-tech', + 'Security' => 'topics-security', + 'Internet' => 'topics-internet', + 'Tech Industry' => 'topics-tech-industry' + ) + ) + ) + ); + + private function cleanArticle($article_html) { + $offset_p = strpos($article_html, '

'); + $offset_figure = strpos($article_html, '', '', $article_html); + $article_html = str_replace('', '', $article_html); + $article_html = StripWithDelimiters($article_html, ''); + $article_html = stripWithDelimiters($article_html, 'find('div.originalImage', 0); + if (empty($article_thumbnail)) + $article_thumbnail = $article_html->find('span.imageContainer', 0); + if (is_object($article_thumbnail)) + $article_thumbnail = $article_thumbnail->find('img', 0)->src; + + $article_content .= trim( + $this->cleanArticle( + extractFromDelimiters( + $article_html, 'items[] = $item; + } + } + } +} diff --git a/bridges/DilbertBridge.php b/bridges/DilbertBridge.php index 959a91a2..a84e5e87 100644 --- a/bridges/DilbertBridge.php +++ b/bridges/DilbertBridge.php @@ -9,8 +9,8 @@ class DilbertBridge extends BridgeAbstract { public function collectData(){ - $html = getSimpleHTMLDOM($this->getURI()) - or returnServerError('Could not request Dilbert: ' . $this->getURI()); + $html = getSimpleHTMLDOM(self::URI) + or returnServerError('Could not request Dilbert: ' . self::URI); foreach($html->find('section.comic-item') as $element) { diff --git a/bridges/EstCeQuonMetEnProdBridge.php b/bridges/EstCeQuonMetEnProdBridge.php index db9d1d5f..4439d694 100644 --- a/bridges/EstCeQuonMetEnProdBridge.php +++ b/bridges/EstCeQuonMetEnProdBridge.php @@ -7,19 +7,9 @@ class EstCeQuonMetEnProdBridge extends BridgeAbstract { const CACHE_TIMEOUT = 21600; // 6h const DESCRIPTION = 'Should we put a website in production today? (French)'; - public function collectData(){ - function extractFromDelimiters($string, $start, $end){ - if(strpos($string, $start) !== false) { - $section_retrieved = substr($string, strpos($string, $start) + strlen($start)); - $section_retrieved = substr($section_retrieved, 0, strpos($section_retrieved, $end)); - return $section_retrieved; - } - - return false; - } - - $html = getSimpleHTMLDOM($this->getURI()) - or returnServerError('Could not request EstCeQuonMetEnProd: ' . $this->getURI()); + public function collectData() { + $html = getSimpleHTMLDOM(self::URI) + or returnServerError('Could not request EstCeQuonMetEnProd: ' . self::URI); $item = array(); $item['uri'] = $this->getURI() . '#' . date('Y-m-d'); @@ -28,8 +18,8 @@ class EstCeQuonMetEnProdBridge extends BridgeAbstract { $item['timestamp'] = strtotime('today midnight'); $item['content'] = str_replace( 'src="/', - 'src="' . $this->getURI(), - trim(extractFromDelimiters($html->outertext, '', '

')) + 'src="' . self::URI, + trim(extractFromDelimiters($html->outertext, '', '