From 418f951dd19d205acef1845d2ac7f4b642d149c7 Mon Sep 17 00:00:00 2001 From: Dag Date: Sat, 15 Jan 2022 11:15:39 +0500 Subject: [PATCH] [ThePirateBayBridge] Repair broken bridge This is more like a refactor because they dont serve data in plain html anymore. Instead, the data is available from a json api at apibay.org Could possibly expand this bridge because their api has more to give. I learned about this api by grokking https://thepiratebay.org/static/main.js and by looking at browser ajax requests. For some unknown reason they host some static assets at https://torrindex.net/ which is used by the bridge to render magnet image and user status image. Signed-off-by: Dag --- bridges/ThePirateBayBridge.php | 372 ++++++++++++++++++++++----------- 1 file changed, 253 insertions(+), 119 deletions(-) mode change 100644 => 100755 bridges/ThePirateBayBridge.php diff --git a/bridges/ThePirateBayBridge.php b/bridges/ThePirateBayBridge.php old mode 100644 new mode 100755 index 0f417acc..e6b08ef9 --- a/bridges/ThePirateBayBridge.php +++ b/bridges/ThePirateBayBridge.php @@ -1,9 +1,13 @@ array( 'search' => 'search', 'category' => 'cat', - 'user' => 'usr' + 'user' => 'usr', ) ), 'catCheck' => array( @@ -38,140 +42,270 @@ class ThePirateBayBridge extends BridgeAbstract { ), )); - public function collectData(){ + const STATIC_SERVER = 'https://torrindex.net'; - $catBool = $this->getInput('catCheck'); - if($catBool) { - $catNum = $this->getInput('cat'); + const CATEGORIES = array( + '1' => 'Audio', + '2' => 'Video', + '3' => 'Applications', + '4' => 'Games', + '5' => 'Porn', + '6' => 'Other', + '101' => 'Music', + '102' => 'Audio Books', + '103' => 'Sound clips', + '104' => 'FLAC', + '199' => 'Other', + '201' => 'Movies', + '202' => 'Movies DVDR', + '203' => 'Music videos', + '204' => 'Movie Clips', + '205' => 'TV-Shows', + '206' => 'Handheld', + '207' => 'HD Movies', + '208' => 'HD TV-Shows', + '209' => '3D', + '299' => 'Other', + '301' => 'Windows', + '302' => 'Mac/Apple', + '303' => 'UNIX', + '304' => 'Handheld', + '305' => 'IOS(iPad/iPhone)', + '306' => 'Android', + '399' => 'Other OS', + '401' => 'PC', + '402' => 'Mac/Apple', + '403' => 'PSx', + '404' => 'XBOX360', + '405' => 'Wii', + '406' => 'Handheld', + '407' => 'IOS(iPad/iPhone)', + '408' => 'Android', + '499' => 'Other OS', + '501' => 'Movies', + '502' => 'Movies DVDR', + '503' => 'Pictures', + '504' => 'Games', + '505' => 'HD-Movies', + '506' => 'Movie Clips', + '599' => 'Other', + '601' => 'E-books', + '602' => 'Comics', + '603' => 'Pictures', + '604' => 'Covers', + '605' => 'Physibles', + '699' => 'Other', + ); + + public function collectData() { + $keywords = explode(';', $this->getInput('q')); + + foreach($keywords as $keyword) { + $this->processKeyword($keyword); } - $critList = $this->getInput('crit'); + } - $trustedBool = $this->getInput('trusted'); - $keywordsList = explode(';', $this->getInput('q')); - foreach($keywordsList as $keywords) { - switch($critList) { + private function processKeyword($keyword) + { + $keyword = trim($keyword); + switch ($this->getInput('crit')) { case 'search': - if($catBool == false) { - $html = getSimpleHTMLDOM( - self::URI . - 'search/' . - rawurlencode($keywords) . - '/0/3/0' + $catCheck = $this->getInput('catCheck'); + if ($catCheck) { + $categories = $this->getInput('cat'); + $query = sprintf( + '/q.php?q=%s&cat=%s', + rawurlencode($keyword), + rawurlencode($categories) ); } else { - $html = getSimpleHTMLDOM( - self::URI . - 'search/' . - rawurlencode($keywords) . - '/0/3/' . - rawurlencode($catNum) - ); + $query = sprintf('/q.php?q=%s', rawurlencode($keyword)); } break; case 'cat': - $html = getSimpleHTMLDOM( - self::URI . - 'browse/' . - rawurlencode($keywords) . - '/0/3/0' - ); + $query = sprintf('/q.php?q=category:%s', rawurlencode($keyword)); break; case 'usr': - $html = getSimpleHTMLDOM( - self::URI . - 'user/' . - rawurlencode($keywords) . - '/0/3/0' - ); + $query = sprintf('/q.php?q=user:%s', rawurlencode($keyword)); break; + default: + returnClientError('Impossible'); + } + $api = 'https://apibay.org'; + $json = getContents($api . $query); + $result = json_decode($json); + + if ($result[0]->name === 'No results returned') { + return; + } + foreach ($result as $torrent) { + // This is the check for whether to include results from Trusted or VIP users + if ($this->getInput('trusted') + && !in_array($torrent->status, array('vip', 'trusted')) + ) { + continue; } - - if ($html->find('table#searchResult', 0) == false) - returnServerError('No result for query ' . $keywords); - - foreach($html->find('tr') as $element) { - - if(!$trustedBool - || !is_null($element->find('img[alt=VIP]', 0)) - || !is_null($element->find('img[alt=Trusted]', 0))) { - $item = array(); - $item['uri'] = self::URI . $element->find('a.detLink', 0)->href; - $item['id'] = self::URI . $element->find('a.detLink', 0)->href; - $item['timestamp'] = $this->parseDateTimestamp($element); - $item['author'] = $element->find('a.detDesc', 0)->plaintext; - $item['title'] = $element->find('a.detLink', 0)->plaintext; - $item['magnet'] = $element->find('a', 3)->href; - $item['seeders'] = (int)$element->find('td', 2)->plaintext; - $item['leechers'] = (int)$element->find('td', 3)->plaintext; - $item['content'] = $element->find('font', 0)->plaintext - . '
seeders: ' - . $item['seeders'] - . ' | leechers: ' - . $item['leechers'] - . '
info page
magnet link'; - - if(isset($item['title'])) - $this->items[] = $item; - } - } + $this->processTorrent($torrent); } } - private function parseDateTimestamp($element){ - $guessedDate = $element->find('font', 0)->plaintext; - $guessedDate = explode('Uploaded ', $guessedDate)[1]; - $guessedDate = explode(',', $guessedDate)[0]; + private function processTorrent($torrent) + { + // Extracted these trackers from the magnet links on thepiratebay.org + $trackers = array( + 'udp://tracker.coppersurfer.tk:6969/announce', + 'udp://tracker.openbittorrent.com:6969/announce', + 'udp://9.rarbg.to:2710/announce', + 'udp://9.rarbg.me:2780/announce', + 'udp://9.rarbg.to:2730/announce', + 'udp://tracker.opentrackr.org:1337', + 'http://p4p.arenabg.com:1337/announce', + 'udp://tracker.torrent.eu.org:451/announce', + 'udp://tracker.tiny-vps.com:6969/announce', + 'udp://open.stealth.si:80/announce', + ); - if(count(explode(':', $guessedDate)) == 1) { - $guessedDate = strptime($guessedDate, '%m-%d %Y'); - $timestamp = mktime( - 0, - 0, - 0, - $guessedDate['tm_mon'] + 1, - $guessedDate['tm_mday'], - 1900 + $guessedDate['tm_year'] - ); - } elseif(explode(' ', $guessedDate)[0] == 'Today') { - $guessedDate = strptime( - explode(' ', $guessedDate)[1], '%H:%M' - ); + $magnetLink = sprintf( + 'magnet:?xt=urn:btih:%s&dn=%s', + $torrent->info_hash, + rawurlencode($torrent->name) + ); + foreach ($trackers as $tracker) { + // Build magnet link manually instead of using http_build_query because it + // creates undesirable query such as ?tr[0]=foo&tr[1]=bar&tr[2]=baz + $magnetLink .= '&tr=' . rawurlencode($tracker); + } - $timestamp = mktime( - $guessedDate['tm_hour'], - $guessedDate['tm_min'], - 0, - date('m'), - date('d'), - date('Y') - ); - } elseif(explode(' ', $guessedDate)[0] == 'Y-day') { - $guessedDate = strptime( - explode(' ', $guessedDate)[1], '%H:%M' - ); + $item = array(); - $timestamp = mktime( - $guessedDate['tm_hour'], - $guessedDate['tm_min'], - 0, - date('m', time() - 24 * 60 * 60), - date('d', time() - 24 * 60 * 60), - date('Y', time() - 24 * 60 * 60) - ); - } else { - $guessedDate = strptime($guessedDate, '%m-%d %H:%M'); - $timestamp = mktime( - $guessedDate['tm_hour'], - $guessedDate['tm_min'], - 0, - $guessedDate['tm_mon'] + 1, - $guessedDate['tm_mday'], - date('Y')); - } - return $timestamp; + $item['title'] = $torrent->name; + // This uri should be a magnet link so that feed readers can easily pick it up. + // However, rss-bridge only allows http or https schemes + $item['uri'] = sprintf('%s/description.php?id=%s', self::URI, $torrent->id); + $item['timestamp'] = $torrent->added; + $item['author'] = $torrent->username; + + $content = 'Type: ' + . $this->renderCategory($torrent->category) . '
'; + $content .= "Files: $torrent->num_files
"; + $content .= 'Size: ' . $this->renderSize($torrent->size) . '

'; + + $content .= 'Uploaded: ' + . $this->renderUploadDate($torrent->added) . '
'; + $content .= 'By: ' . $this->renderUser($torrent) . '
'; + + $content .= "Seeders: {$torrent->seeders}
"; + $content .= "Leechers: {$torrent->leechers}
"; + $content .= "Info hash: {$torrent->info_hash}

"; + + if ($torrent->imdb) { + $content .= 'Imdb: ' + . $this->renderImdbLink($torrent->imdb) . '

'; + } + + $html = << + GET THIS TORRENT + +
+HTML; + $content .= sprintf($html, $magnetLink, self::STATIC_SERVER); + + $item['content'] = $content; + + $this->items[] = $item; + } + + private function renderSize($size) + { + if ($size < 1024) return $size . ' B'; + if ($size < pow(1024, 2)) return round($size / 1024, 2) . ' KB'; + if ($size < pow(1024, 3)) return round($size / pow(1024, 2), 2) . ' MB'; + if ($size < pow(1024, 4)) return round($size / pow(1024, 3), 2) . ' GB'; + + return round($size / pow(1024, 4), 2) . ' TB'; + } + + private function renderUploadDate($added) + { + return date('Y-m-d', $added ?: time()); + } + + private function renderCategory($category) + { + $mainCategory = sprintf( + '%s', + self::URI, + $category[0] . '00', + self::CATEGORIES[$category[0]] + ); + + $subCategory = sprintf( + '%s', + self::URI, + $category, + self::CATEGORIES[$category] + ); + + return sprintf('%s > %s', $mainCategory, $subCategory); + } + + private function renderUser($torrent) + { + if ($torrent->username === 'Anonymous') { + return $torrent->username . ' ' . $this->renderStatusImage($torrent->status); + } + return sprintf( + '%s %s', + self::URI, + $torrent->username, + $torrent->username, + $this->renderStatusImage($torrent->status) + ); + } + + private function renderStatusImage($status) + { + if ($status == 'trusted') + return sprintf( + '', + self::STATIC_SERVER + ); + if ($status == 'vip') + return sprintf( + '', + self::STATIC_SERVER + ); + if ($status == 'helper') + return sprintf( + '', + self::STATIC_SERVER + ); + if ($status == 'moderator') + return sprintf( + '', + self::STATIC_SERVER + ); + if ($status == 'supermod') + return sprintf( + '', + self::STATIC_SERVER + ); + if ($status == 'admin') + return sprintf( + '', + self::STATIC_SERVER + ); + + return ''; + } + + private function renderImdbLink($imdb) + { + return sprintf( + '%s', + "https://www.imdb.com/title/$imdb", + "https://www.imdb.com/title/$imdb" + ); } }