-
Notifications
You must be signed in to change notification settings - Fork 2
/
pyproject.toml
55 lines (52 loc) · 1.66 KB
/
pyproject.toml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
[project]
# Distribution metadata for the bicleaner-hardrules package.
name = "bicleaner-hardrules"
version = "2.10.6"
# NOTE(review): both email values below read "[email protected]", which looks
# like a redaction placeholder rather than a deliverable address. Confirm and
# restore the real addresses before publishing.
authors = [
    { name = "Prompsit Language Engineering", email = "[email protected]" },
]
maintainers = [
    { name = "Jaume Zaragoza", email = "[email protected]" },
]
description = "Pre-filtering step for obvious noise based on rules, poor language based on general language modelling and vulgar language based on specific language modelling"
readme = "README.md"
# Minimum supported interpreter; the version classifiers below must agree.
requires-python = ">=3.8"
dependencies = [
    "regex",
    "PyYAML",
    # NOTE(review): pytest is listed as a runtime requirement, so it is
    # installed for every user. If it is only needed to run the test suite,
    # consider moving it to an optional "test" extra. TODO confirm.
    "pytest",
    "toolwrapper>=1.0,<=3",
    "joblib",
    "sacremoses==0.0.53",
    "fasttext-wheel==0.9.2",
    "fastspell==0.11.1",
    "huggingface-hub>=0.15,<0.23",
]
classifiers = [
    "Environment :: Console",
    "Intended Audience :: Science/Research",
    # Python 3.7 is intentionally not listed: requires-python is ">=3.8".
    "Programming Language :: Python :: 3.8",
    "Programming Language :: Python :: 3.9",
    "Programming Language :: Python :: 3.10",
    "License :: OSI Approved :: GNU General Public License v3 (GPLv3)",
    "Operating System :: POSIX :: Linux",
    "Topic :: Text Processing :: Linguistic",
    "Topic :: Software Development :: Libraries :: Python Modules",
    "Topic :: Text Processing :: Filters",
]

[build-system]
# Backend invoked by the build frontend to produce the sdist and wheel.
build-backend = "setuptools.build_meta"
# Packages that must be present in the build environment before the backend runs.
requires = [
    "setuptools>=45.0,<66",
    "cmake>=3.18",
    "scikit-build==0.16.6",
    "ninja",
]

[project.scripts]
# Console command name on the left; "module:function" entry point on the right.
bicleaner-hardrules = "hardrules.bicleaner_hardrules:main"
[project.urls]
# Label = URL pairs. Labels containing spaces must stay quoted; the others
# are valid bare keys and parse to the same strings without quotes.
HomePage = "https://github.com/bitextor/bicleaner-hardrules"
"Prompsit Language Engineering" = "http://www.prompsit.com"
Paracrawl = "https://paracrawl.eu/"
MaCoCu = "https://macocu.eu"
"HPLT Project" = "https://hplt-project.org"