diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-10-27 15:42:55 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-10-27 15:42:55 -0700 |
commit | b8e04dc6199a443d3d1e4f15e86420ad00ba9886 (patch) | |
tree | c0c445dc97a8afcf620555f862578fed755a636c /python/Pipfile | |
parent | ae851f3f205b741dbc826c3197cdd3cc9bde8802 (diff) | |
download | sandcrawler-b8e04dc6199a443d3d1e4f15e86420ad00ba9886.tar.gz sandcrawler-b8e04dc6199a443d3d1e4f15e86420ad00ba9886.zip |
new dependencies for HTML metadata parsing
Diffstat (limited to 'python/Pipfile')
-rw-r--r-- | python/Pipfile | 8 |
1 files changed, 8 insertions, 0 deletions
```diff
diff --git a/python/Pipfile b/python/Pipfile
index 17734ad..1a409e9 100644
--- a/python/Pipfile
+++ b/python/Pipfile
@@ -38,6 +38,14 @@ Flask = ">=1"
 urlcanon = "*"
 pillow = ">=3"
 python-poppler = ">=0.2.1"
+selectolax = ">=0.2"
+trafilatura = "*"
+pydantic = ">=1.7"
+dateparser = "*"
+
+# TODO:
+#dynaconf = ">=3"
+#sentry-sdk = { version = ">=0.14.0", extras = [] }
 
 # must lock black to an exact version because it is still "beta"
 # see: https://github.com/psf/black/issues/517
```