diff --git a/lib/FeedExpander.php b/lib/FeedExpander.php index caface38..edfe99d4 100644 --- a/lib/FeedExpander.php +++ b/lib/FeedExpander.php @@ -102,7 +102,7 @@ abstract class FeedExpander extends BridgeAbstract $httpHeaders = ['Accept: ' . implode(', ', $mimeTypes)]; $content = getContents($url, $httpHeaders); if ($content === '') { - throw new \Exception(sprintf('Unable to parse xml from `%s` because we got the empty string', $url)); + throw new \Exception(sprintf('Unable to parse xml from `%s` because we got the empty string', $url), 10); } // Maybe move this call earlier up the stack frames // Disable triggering of the php error-handler and handle errors manually instead @@ -121,7 +121,7 @@ abstract class FeedExpander extends BridgeAbstract // Render only the first error into exception message $firstXmlErrorMessage = $xmlErrors[0]->message; } - throw new \Exception(sprintf('Unable to parse xml from `%s` %s', $url, $firstXmlErrorMessage ?? '')); + throw new \Exception(sprintf('Unable to parse xml from `%s` %s', $url, $firstXmlErrorMessage ?? ''), 11); } // Restore previous behaviour in case other code relies on it being off libxml_use_internal_errors(false); diff --git a/lib/contents.php b/lib/contents.php index 5dec2730..7f5ec2f2 100644 --- a/lib/contents.php +++ b/lib/contents.php @@ -178,29 +178,28 @@ function getContents( $response['content'] = $cache->loadData(); break; default: - if (Debug::isEnabled()) { - // Include a part of the response body in the exception message - throw new HttpException( - sprintf( - '%s resulted in `%s %s: %s`', - $url, - $result['code'], - Response::STATUS_CODES[$result['code']] ?? '', - mb_substr($result['body'], 0, 500), - ), - $result['code'] - ); - } else { - throw new HttpException( - sprintf( - '%s resulted in `%s %s`', - $url, - $result['code'], - Response::STATUS_CODES[$result['code']] ?? '', - ), - $result['code'] - ); + $exceptionMessage = sprintf( + '%s resulted in %s %s %s', + $url, + $result['code'], + Response::STATUS_CODES[$result['code']] ?? '', + // If debug, include a part of the response body in the exception message + Debug::isEnabled() ? mb_substr($result['body'], 0, 500) : '', + ); + + // The following code must be extracted if it grows too much + $cloudflareTitles = [ + '
+ RSS-Bridge tried to fetch a website. + The fetching was blocked by CloudFlare. + CloudFlare is anti-bot software. + Its purpose is to block non-humans. +
+ -The application could not run because of the following error:
+ getCode() === 404): ?> ++ RSS-Bridge tried to fetch a page on a website. + But it doesn't exists. +
+ + + getCode() === 429): ?> ++ RSS-Bridge tried to fetch a website. + They told us to try again later. +
+ + + + getCode() === 10): ?> ++ RSS-Bridge tried parse the empty string as xml. + The fetched url is not pointing to real xml. +
+ + + getCode() === 11): ?> ++ RSS-Bridge tried parse xml. It failed. The xml is probably broken. +
+ +