Skip to content

Commit 930945f

Browse files
committed
v1.4.1: add trafilatura.utils to SENTRY_LOGGERS_TO_IGNORE
1 parent e51beb4 commit 930945f

File tree

3 files changed

+9
-5
lines changed

3 files changed

+9
-5
lines changed

CHANGELOG.md

+4 -1
Original file line number | Diff line number | Diff line change
@@ -4,14 +4,17 @@ Version History
44
Version 1
55
---------
66

7+
### V1.4.1
8+
* add trafilatura.utils to SENTRY_LOGGERS_TO_IGNORE
9+
710
### V1.4.0
811
* add ignore_loggers and sentry_ignore_loggers
912

1013
### V1.3.1
1114
* Fix CI Bug from out-of-date dependency
1215

1316
### V1.3.0
14-
* Add option to optionally override canonical_domain
17+
* Add option to optionally override canonical_domain
1518

1619
### V1.2.0
1720
* metadata now includes Canonical Url when available

mcmetadata/__init__.py

+4 -3
Original file line number | Diff line number | Diff line change
@@ -33,6 +33,7 @@
3333
# NOTE! in sorted order!
3434
"htmldate.utils",
3535
"trafilatura.core",
36+
"trafilatura.utils",
3637
]
3738

3839

@@ -102,9 +103,9 @@ def extract(
102103
is_shortened_url = urls.is_shortened_url(url)
103104
url_duration = time.monotonic() - t1
104105
stats_accumulator["url"] += url_duration
105-
106-
if 'canonical_domain' in overrides:
107-
canonical_domain = overrides['canonical_domain']
106+
107+
if "canonical_domain" in overrides:
108+
canonical_domain = overrides["canonical_domain"]
108109
else:
109110
canonical_domain = urls.canonical_domain(final_url)
110111

pyproject.toml

+1 -1
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@ build-backend = "flit_core.buildapi"
44

55
[project]
66
name = "mediacloud-metadata"
7-
version = "1.4.0"
7+
version = "1.4.1"
88
authors = [
99
{name='Rahul Bhargava', email='[email protected]'}
1010
]

0 commit comments

Comments
 (0)