Skip to content

Commit 08a8920

Browse files
mrichtarsky authored and josStorer committed
Look for class="article" for content
Quite a few sites use this, but fail the current heuristic.
1 parent 0d7d735 commit 08a8920

File tree

1 file changed

+10
-5
lines changed

1 file changed

+10
-5
lines changed

src/utils/get-core-content-text.mjs

Lines changed: 10 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -43,23 +43,28 @@ function findLargestElement(e) {
4343
}
4444

4545
export function getCoreContentText() {
46+
function getTextFrom(e) {
47+
return e.innerText || e.textContent
48+
}
49+
4650
for (const [siteName, selectors] of Object.entries(adapters)) {
4751
if (location.hostname.includes(siteName)) {
4852
const element = getPossibleElementByQuerySelector(selectors)
49-
if (element) return element.innerText || element.textContent
53+
if (element) return getTextFrom(element)
5054
break
5155
}
5256
}
5357

58+
const element = document.querySelector('article')
59+
if (element) {
60+
return getTextFrom(element)
61+
}
62+
5463
const largestElement = findLargestElement(document.body)
5564
const secondLargestElement = findLargestElement(largestElement)
5665
console.log(largestElement)
5766
console.log(secondLargestElement)
5867

59-
function getTextFrom(e) {
60-
return e.innerText || e.textContent
61-
}
62-
6368
let ret
6469
if (!largestElement) {
6570
ret = getTextFrom(document.body)

0 commit comments

Comments (0)