-
Notifications
You must be signed in to change notification settings - Fork 6
Expand file tree
/
Copy pathpyproject.toml
More file actions
65 lines (60 loc) · 1.78 KB
/
pyproject.toml
File metadata and controls
65 lines (60 loc) · 1.78 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Build through flit's PEP 517 backend; any flit_core 3.x release from 3.2 onward is accepted.
[build-system]
requires = ["flit_core >=3.2,<4"]
build-backend = "flit_core.buildapi"
# Core package metadata.
[project]
name = "mediacloud-metadata"
version = "1.4.3"
description = "Media Cloud news article metadata extraction"
readme = "README.md"
requires-python = ">=3.10"
authors = [
    { name = "Rahul Bhargava", email = "rahul@mediacloud.org" },
]
classifiers = [
    "License :: OSI Approved :: Apache Software License",
    "Natural Language :: English",
    "Operating System :: OS Independent",
    "Programming Language :: Python",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
]
# Runtime requirements, grouped by the job each one does. Most are pinned to a
# single minor series (`==X.Y.*`), so only patch releases are picked up.
dependencies = [
    # Date guessing
    "htmldate==1.8.*",
    "dateparser==1.2.*",

    # Domain name and URL extraction
    "tldextract==5.1.*",
    "url-normalize==1.4.*",
    "furl==2.1.*",

    # Language detection
    "py3langid==0.2.*",

    # The various content extractors we try to use
    "newspaper3k==0.2.*",
    "goose3==3.1.*",
    "BeautifulSoup4==4.12.*",
    "readability-lxml==0.8.*",
    # Must stay below v1.11.* to allow easy extraction of canonical_url.
    "trafilatura==1.8.*",
    "boilerpy3==1.0.*",

    # Support libraries
    # Left un-versioned so the other dependencies can sort out which version is best.
    "requests",
    # BeautifulSoup4 speedup.
    "faust-cchardet==2.1.*",
    "surt==0.3.1",
]
# The importable module is "mcmetadata", which differs from the distribution
# name "mediacloud-metadata", so flit is given the module name explicitly.
[tool.flit.module]
name = "mcmetadata"
# Optional extras, installable as `mediacloud-metadata[dev]` / `mediacloud-metadata[test]`.
[project.optional-dependencies]
# Contributor tooling: git hooks, linting, type checking (plus stubs), import
# sorting and formatting.
dev = [
    "pre-commit==3.8.*",
    "flake8==6.1.*",
    "mypy==1.6.*",
    "isort==5.12.*",
    "types-urllib3==1.26.*",
    "types-requests==2.32.*",
    "black==24.4.*",
]
# Test-suite requirements; deliberately left without version pins here.
test = [
    "pytest",
    "parameterized",
]
# Links attached to the package metadata. Keys are the link labels; only labels
# containing a space need quoting.
[project.urls]
Homepage = "https://mediacloud.org"
"Bug Tracker" = "https://github.com/mediacloud/meta-extractor/issues"
"Source Code" = "https://github.com/mediacloud/meta-extractor"
# Use isort's "black" profile so import sorting agrees with the black formatter
# pinned in the dev extras.
[tool.isort]
profile = "black"