We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ad7bed0, commit 7ad5ff2 (Copy full SHA for 7ad5ff2)
extractnet/__init__.py
@@ -1,6 +1,6 @@
1
from extractnet.pipeline import Extractor
2
3
-__version__ = '2.0.3'
+__version__ = '2.0.4'
4
5
6
_LOADED_MODELS = {}
extractnet/metadata_extraction/metadata.py
@@ -77,7 +77,7 @@ def extract_json(tree, metadata):
77
if '"publisher"' in elem.text:
78
mymatch = JSON_PUBLISHER.search(elem.text)
79
if mymatch and not ',' in mymatch.group(1):
80
- candidate = normalize_json(mymatch.group(1))
+ candidate = url_normalizer(mymatch.group(1))
81
if metadata['sitename'] is None or len(metadata['sitename']) < len(candidate):
82
metadata['sitename'] = candidate
83
if metadata['sitename'].startswith('http') and not candidate.startswith('http'):
0 commit comments