# automatically generated by g-sorcery
# please do not edit this file

# Ebuild API level this file is written against.
EAPI=8

# Upstream name and version, copied unchanged from PN / PV (neither is set in
# this file). DIGEST_SOURCES is presumably read by the gs-pypi eclass -- confirm.
REALNAME=${PN}
LITERALNAME=${PN}
REALVERSION=${PV}
DIGEST_SOURCES=yes

# Both settings are assigned ahead of `inherit`, so they are already in place
# when the eclasses below are sourced. The brace range expands to
# python3_11 python3_12 python3_13 python3_14.
PYTHON_COMPAT=( python3_{11..14} )
DISTUTILS_USE_PEP517=standalone

inherit python-r1 gs-pypi

# Human-readable summary, project site and licence of the package.
DESCRIPTION="This library contains a set of tools in order to extract and synthesize structured information from documents"
HOMEPAGE="https://pydoxtools.xyntopia.com"
LICENSE="MIT"

# Source tarball: the file name is built once and reused as the last component
# of the download URL. The URL path is sharded by the first character of
# REALNAME.
SOURCEFILE="${REALNAME}-${REALVERSION}.tar.gz"
SRC_URI="https://files.pythonhosted.org/packages/source/${REALNAME:0:1}/${REALNAME}/${SOURCEFILE}"

# Remaining package-manager metadata.
RESTRICT="test"
SLOT="0"
KEYWORDS="~amd64 ~x86"

# Optional feature sets exposed as USE flags; each one gates a group of the
# dependencies listed below.
IUSE="etl inference"
# Single dependency list shared by BDEPEND and RDEPEND at the end of this block.
# Atoms wrapped in `flag? ( ... )` apply only when that USE flag is enabled;
# bare atoms are unconditional. Some packages are listed once per flag
# (urlextract, beautifulsoup4, spacy, pandas, hnswlib) so that either flag on
# its own pulls them in.
# ${PYTHON_USEDEP} is not defined in this file -- presumably it is provided by
# the inherited python eclass; confirm.
# NOTE(review): "dev-python/Pint" is the only atom containing an upper-case
# letter -- confirm the package exists under exactly that name in the repository.
DEPENDENCIES="etl? ( dev-python/goose3[${PYTHON_USEDEP}] )
	etl? ( dev-python/readability-lxml[${PYTHON_USEDEP}] )
	<dev-python/appdirs-2.0.0[${PYTHON_USEDEP}]
	etl? ( dev-python/langdetect[${PYTHON_USEDEP}] )
	inference? ( dev-python/transformers[${PYTHON_USEDEP}] )
	etl? ( >=dev-python/tldextract-2.2.3[${PYTHON_USEDEP}] )
	etl? ( dev-python/pdfminer-six[${PYTHON_USEDEP}] )
	etl? ( dev-python/extruct[${PYTHON_USEDEP}] )
	etl? ( dev-python/quantulum3[${PYTHON_USEDEP}] )
	etl? ( >=dev-python/quantities-0.12.4[${PYTHON_USEDEP}] )
	inference? ( >=dev-python/tqdm-4.47.0[${PYTHON_USEDEP}] )
	etl? ( dev-python/urlextract[${PYTHON_USEDEP}] )
	inference? ( dev-python/urlextract[${PYTHON_USEDEP}] )
	<dev-python/pydantic-3.0.0[${PYTHON_USEDEP}]
	etl? ( >=dev-python/beautifulsoup4-4.8.0[${PYTHON_USEDEP}] )
	inference? ( >=dev-python/beautifulsoup4-4.8.0[${PYTHON_USEDEP}] )
	>=dev-python/lxml-4.6.2[${PYTHON_USEDEP}]
	etl? ( dev-python/stemming[${PYTHON_USEDEP}] )
	dev-python/Pint[${PYTHON_USEDEP}]
	>=dev-python/pikepdf-2.10.0[${PYTHON_USEDEP}]
	inference? ( dev-python/pytorch-lightning[${PYTHON_USEDEP}] )
	etl? ( dev-python/pdf2image[${PYTHON_USEDEP}] )
	<dev-python/shapely-2.0.0[${PYTHON_USEDEP}]
	inference? ( <dev-python/scikit-learn-2.0.0[${PYTHON_USEDEP}] )
	etl? ( dev-python/spacy[${PYTHON_USEDEP}] )
	inference? ( dev-python/spacy[${PYTHON_USEDEP}] )
	etl? ( <dev-python/pandas-3.0.0[${PYTHON_USEDEP}] )
	inference? ( <dev-python/pandas-3.0.0[${PYTHON_USEDEP}] )
	etl? ( dev-python/hnswlib[${PYTHON_USEDEP}] )
	inference? ( dev-python/hnswlib[${PYTHON_USEDEP}] )
	etl? ( <dev-python/networkx-3.0.0[${PYTHON_USEDEP}] )
	<dev-python/python-magic-0.5.0[${PYTHON_USEDEP}]
	etl? ( dev-python/openai[${PYTHON_USEDEP}] )
	etl? ( dev-python/python-pptx[${PYTHON_USEDEP}] )
	etl? ( dev-python/pandoc[${PYTHON_USEDEP}] )
	<dev-python/packaging-24.0[${PYTHON_USEDEP}]
	inference? ( dev-python/torch[${PYTHON_USEDEP}] )
	etl? ( <dev-python/pytesseract-0.4.0[${PYTHON_USEDEP}] )
	<dev-python/pyyaml-7.0[${PYTHON_USEDEP}]
	etl? ( dev-python/dask[${PYTHON_USEDEP}] )
	<dev-python/diskcache-6.0.0[${PYTHON_USEDEP}]
	<dev-python/chardet-6.0.0[${PYTHON_USEDEP}]
	inference? ( dev-python/gpt4all[${PYTHON_USEDEP}] )
	inference? ( dev-python/fastcoref[${PYTHON_USEDEP}] )
	inference? ( dev-python/timm[${PYTHON_USEDEP}] )
	etl? ( <dev-python/pygraphviz-2.0[${PYTHON_USEDEP}] )
	dev-python/pydantic-settings[${PYTHON_USEDEP}]
	<dev-python/tabulate-0.10.0[${PYTHON_USEDEP}]"
# The same list is used verbatim for both the build-time (BDEPEND) and the
# run-time (RDEPEND) dependency variables.
BDEPEND="${DEPENDENCIES}"
RDEPEND="${DEPENDENCIES}"