diff --git a/bridges/MerchantAndMillsBridge.php b/bridges/MerchantAndMillsBridge.php index 380f9cc0..dca043b6 100644 --- a/bridges/MerchantAndMillsBridge.php +++ b/bridges/MerchantAndMillsBridge.php @@ -6,6 +6,7 @@ class MerchantAndMillsBridge extends BridgeAbstract { const DESCRIPTION = 'The latest blog posts from Merchant and Mills.'; const MAINTAINER = 'caseykulm'; const CACHE_TIMEOUT = 43200; // 12h + const POST_LIMIT = 10; // Maximum number of blog posts to fetch const PARAMETERS = [[ 'selected_country_id' => [ 'name' => 'Country', @@ -19,8 +20,7 @@ class MerchantAndMillsBridge extends BridgeAbstract { ] ]]; - private function getCountryBlogPath($countryName): string - { + private function getCountryBlogPath($countryName): string { if ($countryName === 'European Union') { return '/eu/blog'; } @@ -36,57 +36,78 @@ class MerchantAndMillsBridge extends BridgeAbstract { return '/rw/blog'; } - public function collectData() - { + public function collectData() { $selectedCountryKey = $this->getKey('selected_country_id'); $selectedCountryBlogPath = $this->getCountryBlogPath($selectedCountryKey); $url = self::URI . $selectedCountryBlogPath; $html = getSimpleHTMLDOM($url) or returnServerError('Could not request ' . $url); + // Limit processing to POST_LIMIT blog posts + $counter = 0; foreach ($html->find('.products .post') as $post) { + if ($counter >= self::POST_LIMIT) { + break; // Stop when the limit is reached + } + $item = []; - // Extract image - $image = $post->find('.post_image img', 0); - if ($image) { - // Resolve the relative image URL - $imageUrl = $image->src; - if (!str_starts_with($imageUrl, 'http')) { - $imageUrl = rtrim(self::URI, '/') . '/' . ltrim($imageUrl, '/'); - } - $item['image'] = $imageUrl; - } else { - $item['image'] = ''; - } - - // Extract title + // Extract title and URI $titleLink = $post->find('.post_name a', 0); - $item['title'] = $titleLink ? trim($titleLink->plaintext) : ''; + $item['title'] = $titleLink ? trim($titleLink->plaintext) : 'No title'; $item['uri'] = $titleLink ? self::URI . $titleLink->href : ''; - // Extract date and views - $dateAndViews = $post->find('.post_date span'); - $item['date'] = isset($dateAndViews[0]) ? trim($dateAndViews[0]->plaintext) : ''; - $item['views'] = isset($dateAndViews[1]) ? trim(str_replace('Viewed:', '', $dateAndViews[1]->plaintext)) : ''; + // Extract date + $dateElement = $post->find('.post_date span', 0); + $item['timestamp'] = $dateElement ? strtotime(trim($dateElement->plaintext)) : null; - // Extract description - $description = $post->find('.post_desc', 0); - $item['content'] = ''; - - // Add the image and description to content - if (!empty($item['image'])) { - $item['content'] .= '