From 3b1f0425cf94f508dbb788fd9143087be118814b Mon Sep 17 00:00:00 2001 From: TrisNol Date: Sat, 21 Oct 2023 11:22:34 +0200 Subject: [PATCH] deps: Adding html5lib for table parsing via Pandas --- poetry.lock | 4 ++-- pyproject.toml | 3 ++- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/poetry.lock b/poetry.lock index 809c5e7..c476a34 100644 --- a/poetry.lock +++ b/poetry.lock @@ -7361,11 +7361,11 @@ test = ["coverage (>=5.0.3)", "zope.event", "zope.testing"] testing = ["coverage (>=5.0.3)", "zope.event", "zope.testing"] [extras] -ingest = ["deutschland", "selenium", "xmltodict"] +ingest = ["deutschland", "html5lib", "selenium", "xmltodict"] transformation = ["spacy", "spacy-sentiws", "torch", "torchaudio", "torchvision", "transformers"] web-server = ["dash", "dash-auth", "dash-bootstrap-components", "matplotlib", "networkx", "seaborn"] [metadata] lock-version = "2.0" python-versions = ">=3.11,<3.13" -content-hash = "0fb643247c09a91aeef5aae1286426f9296688dadff30f5a4a6085c3abe5399e" +content-hash = "5ca44ede811dc417faeda6b976c032682be7b4edadc16fc6c81e2ffe3dc4f946" diff --git a/pyproject.toml b/pyproject.toml index 77af5eb..a17ac8b 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -81,9 +81,10 @@ torchvision = {version = "*", source = "torch-cpu"} tqdm = "^4.66.1" transformers = {version = "*", extras = ["torch"]} xmltodict = "^0.13.0" +html5lib = "^1.1" [tool.poetry.extras] -ingest = ["selenium", "deutschland", "xmltodict"] +ingest = ["selenium", "deutschland", "xmltodict", "html5lib"] transformation = ["torch", "torchaudio", "torchvision", "transformers", "spacy-sentiws", "spacy"] web-server = ["dash", "dash-auth", "dash-bootstrap-components", "matplotlib", "seaborn", "networkx"]