Skip to content

Commit f26c566

Browse files
mrichtarsky authored and josStorer committed
Make summarization work for text/plain content
document.body is available and text can be extracted from it. Fixes #521
1 parent 9085396 commit f26c566

File tree

1 file changed

+15
-4
lines changed

1 file changed

+15
-4
lines changed

src/utils/get-core-content-text.mjs

Lines changed: 15 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,9 @@ const adapters = {
1515
}
1616

1717
function findLargestElement(e) {
18+
if (!e) {
19+
return null
20+
}
1821
let maxArea = 0
1922
let largestElement = null
2023
const limitedArea = 0.8 * getArea(e)
@@ -50,14 +53,22 @@ export function getCoreContentText() {
5053
console.log(largestElement)
5154
console.log(secondLargestElement)
5255

53-
if (!largestElement) return
56+
function getTextFrom(e) {
57+
return e.innerText || e.textContent
58+
}
5459

5560
let ret
56-
if (secondLargestElement && getArea(secondLargestElement) > 0.5 * getArea(largestElement)) {
57-
ret = secondLargestElement.innerText || secondLargestElement.textContent
61+
if (!largestElement) {
62+
ret = getTextFrom(document.body)
63+
console.log('use document.body')
64+
} else if (
65+
secondLargestElement &&
66+
getArea(secondLargestElement) > 0.5 * getArea(largestElement)
67+
) {
68+
ret = getTextFrom(secondLargestElement)
5869
console.log('use second')
5970
} else {
60-
ret = largestElement.innerText || largestElement.textContent
71+
ret = getTextFrom(largestElement)
6172
console.log('use first')
6273
}
6374
return ret.trim().replaceAll(' ', '').replaceAll('\n\n', '').replaceAll(',,', '')

0 commit comments

Comments
 (0)