[EconomistBridge] Add cookie (#4173)

* [EconomistBridge] Add cookie

* [EconomistBridge] Fix lint
This commit is contained in:
Pavel Korytov 2024-07-30 23:10:57 +03:00 committed by GitHub
parent cb91afbd71
commit aa3989873c
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 32 additions and 2 deletions

View File

@ -8,6 +8,12 @@ class EconomistBridge extends FeedExpander
const CACHE_TIMEOUT = 3600; //1hour const CACHE_TIMEOUT = 3600; //1hour
const DESCRIPTION = 'Returns the latest articles for the selected category'; const DESCRIPTION = 'Returns the latest articles for the selected category';
const CONFIGURATION = [
'cookie' => [
'required' => false,
]
];
const PARAMETERS = [ const PARAMETERS = [
'global' => [ 'global' => [
'limit' => [ 'limit' => [
@ -99,8 +105,20 @@ class EconomistBridge extends FeedExpander
protected function parseItem(array $item) protected function parseItem(array $item)
{ {
$headers = [];
if ($this->getOption('cookie')) {
$headers = [
'Authority: www.economist.com',
'Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7',
'Accept-language: en-US,en;q=0.9',
'Cache-control: max-age=0',
'Cookie: ' . $this->getOption('cookie'),
'Upgrade-insecure-requests: 1',
'User-agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/112.0.0.0 Safari/537.36'
];
}
try { try {
$dom = getSimpleHTMLDOM($item['uri']); $dom = getSimpleHTMLDOM($item['uri'], $headers);
} catch (Exception $e) { } catch (Exception $e) {
$item['content'] = $e->getMessage(); $item['content'] = $e->getMessage();
return $item; return $item;
@ -209,6 +227,15 @@ class EconomistBridge extends FeedExpander
foreach ($elem->find('a.ds-link-with-arrow-icon') as $a) { foreach ($elem->find('a.ds-link-with-arrow-icon') as $a) {
$a->parent->removeChild($a); $a->parent->removeChild($a);
} }
// Sections like "Leaders on day X"
foreach ($elem->find('div[data-tracking-id=content-well-chapter-list]') as $div) {
$div->parent->removeChild($div);
}
// "Explore more" section
foreach ($elem->find('h3[id=article-tags]') as $h3) {
$div = $h3->parent;
$div->parent->removeChild($div);
}
// The Economist puts infographics into iframes, which doesn't // The Economist puts infographics into iframes, which doesn't
// work in any of my readers. So this replaces iframes with // work in any of my readers. So this replaces iframes with

View File

@ -1,4 +1,4 @@
# EconomistWorldInBriefBridge # EconomistWorldInBriefBridge and EconomistBridge
In May 2024, The Economist finally fixed its paywall, and it started requiring authorization. Which means you can't use this bridge unless you have an active subscription. In May 2024, The Economist finally fixed its paywall, and it started requiring authorization. Which means you can't use this bridge unless you have an active subscription.
@ -15,4 +15,7 @@ Once you've done this, add the cookie to your `config.ini.php`:
``` ```
[EconomistWorldInBriefBridge] [EconomistWorldInBriefBridge]
cookie = "<value>" cookie = "<value>"
[EconomistBridge]
cookie = "<value>"
``` ```