Return the published date if the class name is `omnivore-published-date`, which we added when we scraped the article

This commit is contained in:
Hongbo Wu
2023-03-13 12:08:01 +08:00
parent deb398112b
commit aae6759bcb
2 changed files with 12 additions and 2 deletions

View File

@@ -1055,7 +1055,10 @@ Readability.prototype = {
_checkPublishedDate: function (node, matchString) {
// Skipping meta tags
if (node.tagName.toLowerCase() === 'meta') return
// return published date if the class name is 'omnivore-published-date' which we added when we scraped the article
if (node.className === 'omnivore-published-date' && this._isValidPublishedDate(node.textContent)) {
return new Date(node.textContent);
}
// Searching for the real date in the text content
let dateRegExpFound = this.REGEXPS.DATES_REGEXPS.find(regexp => regexp.test(node.textContent.trim()))
dateRegExpFound && (dateRegExpFound = dateRegExpFound.exec(node.textContent.trim()))