From 86a9383b53ecd4b21ffcbc4f4392fd0478169ed7 Mon Sep 17 00:00:00 2001 From: Hongbo Wu Date: Thu, 23 Jun 2022 21:11:23 +0800 Subject: [PATCH] Do not remove content in .container-banners class --- packages/readabilityjs/Readability-readerable.js | 2 +- packages/readabilityjs/Readability.js | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/packages/readabilityjs/Readability-readerable.js b/packages/readabilityjs/Readability-readerable.js index 0765c7144..8e9a7c779 100644 --- a/packages/readabilityjs/Readability-readerable.js +++ b/packages/readabilityjs/Readability-readerable.js @@ -23,7 +23,7 @@ var REGEXPS = { // NOTE: These two regular expressions are duplicated in // Readability.js. Please keep both copies in sync. - unlikelyCandidates: /-ad-|ai2html|banner|breadcrumbs|combx|comment|community|cover-wrap|disqus|extra|footer|gdpr|header|legends|menu|related|remark|replies|rss|shoutbox|sidebar|skyscraper|social|sponsor|supplemental|ad-break|agegate|pagination|pager|popup|yom-remote|copyright|keywords|outline/i, + unlikelyCandidates: /-ad-|ai2html|banner|breadcrumbs|breadcrumb|combx|comment|community|cover-wrap|disqus|extra|footer|gdpr|header|legends|menu|related|remark|replies|rss|shoutbox|sidebar|skyscraper|social|sponsor|supplemental|ad-break|agegate|pagination|pager(?!ow)|popup|yom-remote|copyright|keywords|outline|infinite-list|beta|recirculation|site-index|hide-for-print|post-end-share-cta|post-end-cta-full|post-footer|main-navigation|programtic-ads|outstream_article|hfeed|comment-holder|back-to-top|show-up-next|onward-journey|topic-tracker|list-nav|block-ad-entity|adSpecs/i, okMaybeItsACandidate: /and|article|body|column|content|main|shadow/i, }; diff --git a/packages/readabilityjs/Readability.js b/packages/readabilityjs/Readability.js index 13e1791ad..1d5f73ce1 100644 --- a/packages/readabilityjs/Readability.js +++ b/packages/readabilityjs/Readability.js @@ -174,7 +174,7 @@ Readability.prototype = { unlikelyCandidates: /-ad-|ai2html|banner|breadcrumbs|breadcrumb|combx|comment|community|cover-wrap|disqus|extra|footer|gdpr|header|legends|menu|related|remark|replies|rss|shoutbox|sidebar|skyscraper|social|sponsor|supplemental|ad-break|agegate|pagination|pager(?!ow)|popup|yom-remote|copyright|keywords|outline|infinite-list|beta|recirculation|site-index|hide-for-print|post-end-share-cta|post-end-cta-full|post-footer|main-navigation|programtic-ads|outstream_article|hfeed|comment-holder|back-to-top|show-up-next|onward-journey|topic-tracker|list-nav|block-ad-entity|adSpecs/i, // okMaybeItsACandidate: /and|article(?!-breadcrumb)|body|column|content|main|shadow|post-header/i, get okMaybeItsACandidate() { - return new RegExp(`and|(?