Feature/ner (#103)

NER und Sentiment-Pipeline mit Services zur Datenextraktion.

---------

Co-authored-by: Philipp Horstenkamp <philipp@horstenkamp.de>
Co-authored-by: TrisNol <tristan.nolde@yahoo.de>
This commit is contained in:
Sebastian
2023-10-16 19:54:24 +02:00
committed by GitHub
parent 99b61e7c2e
commit c680ac9759
28 changed files with 12509 additions and 10 deletions

View File

@@ -65,12 +65,18 @@ python = "^3.11"
python-dotenv = "^1.0.0"
seaborn = "^0.12.2"
selenium = "^4.12.0"
spacy = "^3.6.1"
spacy-sentiws = "^3.0.0"
torch = {version = "*", source = "torch-cpu"}
torchaudio = {version = "*", source = "torch-cpu"}
torchvision = {version = "*", source = "torch-cpu"}
tqdm = "^4.66.1"
transformers = {version = "*", extras = ["torch"]}
xmltodict = "^0.13.0"
[tool.poetry.extras]
# Optional dependency sets; each extra names packages from the main
# dependency table that are installed only when that extra is requested.
ingest = ["selenium", "deutschland", "xmltodict"]
# Packages backing the NER and sentiment pipeline. The key is assigned
# exactly once: TOML rejects a table that defines the same key twice.
transformation = [
    "spacy",
    "spacy-sentiws",
    "torch",
    "torchaudio",
    "torchvision",
    "transformers",
]
web-server = ["dash", "dash-auth", "dash-bootstrap-components", "matplotlib", "seaborn"]
[tool.poetry.group.develop.dependencies]
@@ -108,6 +114,7 @@ types-cachetools = "^5.3.0.6"
types-pyOpenSSL = "*"
types-requests = "^2.31.0.2"
types-setuptools = "*"
types-tabulate = "^0.9.0.3"
types-tqdm = "^4.66.0.2"
[tool.poetry.group.test.dependencies]
@@ -123,6 +130,11 @@ data-transformation = "aki_prj23_transparenzregister.utils.data_transfer:transfe
reset-sql = "aki_prj23_transparenzregister.utils.sql.connector:reset_all_tables_cli"
webserver = "aki_prj23_transparenzregister.ui.app:main"
# Additional package index serving the CPU-only PyTorch wheels. With
# priority "explicit", Poetry consults this index only for dependencies
# that select it via `source = "torch-cpu"`.
[[tool.poetry.source]]
name = "torch-cpu"
url = "https://download.pytorch.org/whl/cpu"
priority = "explicit"
[tool.ruff]
exclude = [
".bzr",