Skip to content

Commit 0dd6739

Browse files
authored
Merge pull request #418 from extractus/8.0.19
v8.0.19
2 parents 1da50a5 + 648d2ed commit 0dd6739

17 files changed, with 23 additions (+23) and 22 deletions (-22).

.github/workflows/ci-test.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ jobs:
1212

1313
strategy:
1414
matrix:
15-
node_version: [20.x, 22.x, 23.x]
15+
node_version: [20.x, 22.x, 24.x]
1616

1717
steps:
1818
- uses: actions/checkout@v4

eval.js

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
33
import { execSync } from 'node:child_process'
44
import { readFileSync, writeFileSync, existsSync } from 'node:fs'
55

6-
import { slugify } from 'bellajs'
6+
import { slugify } from '@ndaidong/bellajs'
77

88
import { isValid as isValidUrl } from './src/utils/linker.js'
99
import { extract, extractFromHtml } from './src/main.js'

package.json

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
{
2-
"version": "8.0.18",
2+
"version": "8.0.19",
33
"name": "@extractus/article-extractor",
44
"description": "To extract main article from given URL",
55
"homepage": "https://github.com/extractus/article-extractor",
@@ -31,16 +31,16 @@
3131
},
3232
"dependencies": {
3333
"@mozilla/readability": "^0.6.0",
34-
"bellajs": "^11.2.0",
34+
"@ndaidong/bellajs": "^12.0.1",
3535
"cross-fetch": "^4.1.0",
3636
"linkedom": "^0.18.10",
3737
"sanitize-html": "2.16.0"
3838
},
3939
"devDependencies": {
4040
"@eslint/js": "^9.26.0",
41-
"@types/sanitize-html": "^2.15.0",
41+
"@types/sanitize-html": "^2.16.0",
4242
"eslint": "^9.26.0",
43-
"globals": "^16.0.0",
43+
"globals": "^16.1.0",
4444
"https-proxy-agent": "^7.0.6",
4545
"nock": "^14.0.4"
4646
},

src/config.js

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
// config.js
22

3-
import { clone } from 'bellajs'
3+
import { clone } from '@ndaidong/bellajs'
44

55
const sanitizeHtmlOptions = {
66
allowedTags: [

src/main.js

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@
22

33
import {
44
isString
5-
} from 'bellajs'
5+
} from '@ndaidong/bellajs'
66

77
import retrieve from './utils/retrieve.js'
88
import parseFromHtml from './utils/parseFromHtml.js'

src/utils/extractLdSchema.js

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
// utils -> extractLdSchema.js
22

3-
import { isArray, isObject, isString } from 'bellajs'
3+
import { isArray, isObject, isString } from '@ndaidong/bellajs'
44

55
const typeSchemas = [
66
'aboutpage',
@@ -74,7 +74,7 @@ export default (document, entry) => {
7474

7575
const keyValue = ldJson[attr]
7676
const val = isArray(keyValue) ? keyValue[0] : isObject(keyValue) ? keyValue?.name || '' : keyValue
77-
if (isString(val)) {
77+
if (isString(val) && val !== '') {
7878
entry[key] = val.trim()
7979
}
8080
})

src/utils/extractMetaData.js

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -138,8 +138,9 @@ export default (html) => {
138138

139139
Array.from(doc.getElementsByTagName('meta')).forEach(node => {
140140
const result = getMetaContentByNameOrProperty(node, attributeLists)
141-
if (result) {
142-
entry[result.key] = result.content
141+
const val = result?.content || ''
142+
if (val !== '') {
143+
entry[result.key] = val
143144
}
144145
})
145146

src/utils/extractMetaData.test.js

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@ import assert from 'node:assert'
44

55
import { readFileSync } from 'node:fs'
66

7-
import { isObject, hasProperty } from 'bellajs'
7+
import { isObject, hasProperty } from '@ndaidong/bellajs'
88

99
import extractMetaData from './extractMetaData.js'
1010

src/utils/extractWithReadability.js

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@
22

33
import { Readability } from '@mozilla/readability'
44
import { DOMParser } from 'linkedom'
5-
import { isString } from 'bellajs'
5+
import { isString } from '@ndaidong/bellajs'
66

77
export default (html, url = '') => {
88
if (!isString(html)) {

src/utils/extractWithReadability.test.js

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,7 @@ import assert from 'node:assert'
55

66
import { readFileSync } from 'node:fs'
77

8-
import { isString } from 'bellajs'
8+
import { isString } from '@ndaidong/bellajs'
99

1010
import extractWithReadability, { extractTitleWithReadability } from './extractWithReadability.js'
1111

0 commit comments

Comments
 (0)