# View Raw Ebuild
# automatically generated by g-sorcery
# please do not edit this file
EAPI=8

# Upstream (PyPI) name and version. For this package they are identical to
# Portage's ${PN} and ${PV}. These are not standard ebuild variables;
# presumably they are read by the gs-pypi eclass inherited below -- TODO confirm.
REALNAME="${PN}"
LITERALNAME="${PN}"
REALVERSION="${PV}"
DIGEST_SOURCES="yes"

# PYTHON_COMPAT has to be defined before the Python eclasses are inherited.
# DISTUTILS_USE_PEP517 is a distutils-r1 knob; distutils-r1 is not inherited
# directly here, so it is presumably pulled in through gs-pypi -- TODO confirm.
PYTHON_COMPAT=( python{3_11,3_12,3_13,3_14} )
DISTUTILS_USE_PEP517=standalone
inherit python-r1 gs-pypi

DESCRIPTION="Curate scraped HTML for easy interpretation by large language models. Build more robust generative AI applications. Convert HTML to Markdown using Regex, BeautifulSoup4, and filter out useless content with Jina Embeddings."
# The generator left HOMEPAGE empty; point it at the PyPI project page, which
# exists for every package served from files.pythonhosted.org.
HOMEPAGE="https://pypi.org/project/${REALNAME}/"
LICENSE="MIT"

# PyPI sdist location: first letter of the name, the name, then the
# underscore-normalised file name (dashes in the project name become "_").
SRC_URI="https://files.pythonhosted.org/packages/source/${REALNAME::1}/${REALNAME}/${REALNAME//-/_}-${REALVERSION}.tar.gz"
SOURCEFILE="${REALNAME//-/_}-${REALVERSION}.tar.gz"

RESTRICT="test"
SLOT="0"
KEYWORDS="~amd64 ~x86"
IUSE=""

# Python package dependencies, shared by BDEPEND and RDEPEND below.
# dev-python/asyncio is intentionally not listed: asyncio has been part of the
# Python standard library since 3.4 and every PYTHON_COMPAT target above is
# >= 3.11, so the obsolete PyPI backport must not be pulled in.
DEPENDENCIES=">=dev-python/beautifulsoup4-4.12.2[${PYTHON_USEDEP}]
dev-python/markdownify[${PYTHON_USEDEP}]
dev-python/transformers[${PYTHON_USEDEP}]
dev-python/torch[${PYTHON_USEDEP}]
>=dev-python/aiofiles-23.2.1[${PYTHON_USEDEP}]"
BDEPEND="${DEPENDENCIES}"
RDEPEND="${DEPENDENCIES}"