diff --git a/MANIFEST.in b/MANIFEST.in index 7256d988..c4c8c161 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -8,9 +8,5 @@ graft tests/resources/ exclude tests/realworld_tests.py recursive-exclude tests/cache/ -recursive-include docs/ conf.py Makefile make.bat *.rst *.gif *.jpg *.png -include docs/requirements.txt -recursive-include docs/_build/ *.gif *.jpg *.png - recursive-exclude * __pycache__ recursive-exclude * *.py[co] diff --git a/docs/index.rst b/docs/index.rst index 3bce9954..4c04b363 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -192,6 +192,15 @@ Jointly developed plugins and additional packages also contribute to the field o Corresponding posts on `Bits of Language `_ (blog). +Building the docs +----------------- + +Starting from the ``docs/`` folder of the repository: + +1. ``pip install -r requirements.txt`` +2. ``sphinx-build -b html . _build/`` (where ``_build`` is the target directory) + + Further documentation ===================== @@ -207,10 +216,4 @@ Further documentation used-by background - -Indices and tables -================== - * :ref:`genindex` -* :ref:`modindex` -* :ref:`search` diff --git a/pyproject.toml b/pyproject.toml index e1825e01..a08a5943 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -77,8 +77,7 @@ version = {attr = "trafilatura.__version__"} # https://setuptools.pypa.io/en/stable/userguide/datafiles.html [tool.setuptools.package-data] trafilatura = [ - "data/tei-schema-pickle.lzma", - "data/jt-stopwords-pickle.lzma", + "data/tei_corpus.dtd", "settings.cfg", ]