Install this version:
emerge -a =sci-ml/sentencepiece-0.2.1
If this version is masked, you can unmask it using the autounmask tool or standard emerge options:
autounmask =sci-ml/sentencepiece-0.2.1
Or alternatively:
emerge --autounmask-write -a =sci-ml/sentencepiece-0.2.1
| Version | EAPI | Keywords | Slot |
|---|---|---|---|
| 0.2.1 | 8 | ~amd64 | 0 |
# Copyright 2025-2026 Gentoo Authors
# Distributed under the terms of the GNU General Public License v2
EAPI=8
DISTUTILS_USE_PEP517=setuptools
DISTUTILS_EXT=1
PYTHON_COMPAT=( python3_{11..14} )
inherit cmake distutils-r1 dot-a
DESCRIPTION="Text tokenizer for Neural Network-based text generation"
HOMEPAGE="https://github.com/google/sentencepiece"
SRC_URI="https://github.com/google/${PN}/archive/refs/tags/v${PV}.tar.gz
-> ${P}.tar.gz"
LICENSE="Apache-2.0"
SLOT="0"
KEYWORDS="~amd64"
# depends on abseil-cpp via protobuf targets
RDEPEND="
dev-cpp/abseil-cpp:=
dev-libs/protobuf:=
dev-util/google-perftools
!sci-ml/pysentencepiece
"
DEPEND="${RDEPEND}
dev-libs/darts
"
DOCS=(
README.md
doc/api.md
doc/experiments.md
doc/normalization.md
doc/options.md
doc/special_symbols.md
)
PATCHES=(
"${FILESDIR}"/${P}-cmake.patch
"${FILESDIR}"/${P}-noStatic.patch
"${FILESDIR}"/${P}-nostrip.patch
)
src_prepare() {
sed -i \
-e "s:third_party/darts_clone/darts.h:darts.h:" \
src/model_interface.h \
src/normalizer.h \
src/normalizer.cc \
src/unigram_model.h \
src/builder.cc \
|| die
distutils-r1_src_prepare
cmake_prepare
sed \
-e 's|@libprotobuf_lite@|protobuf-lite|' \
-e "s|@includedir_for_pc_file@|${S}/src|" \
-e "s|@libdir_for_pc_file@|${BUILD_DIR}/src|" \
${PN}.pc.in \
> python/${PN}.pc \
|| die
sed -e '/CMAKE_CXX_STANDARD /{s/)/ CACHE STRING "")/g}' -i CMakeLists.txt || die
}
src_configure() {
lto-guarantee-fat
local mycmakeargs=(
-DSPM_ABSL_PROVIDER=package
-DSPM_PROTOBUF_PROVIDER=package
)
if has_version ">=dev-cpp/abseil-cpp-20260107.0"; then
# needs >=c++20
mycmakeargs+=(
-DCMAKE_CXX_STANDARD=20
)
fi
cmake_src_configure
}
src_compile() {
cmake_src_compile
cd python
PKG_CONFIG_PATH=. distutils-r1_src_compile
}
src_test() {
LD_LIBRARY_PATH=${BUILD_DIR}/src distutils-r1_src_test
}
python_test() {
cd python
${EPYTHON} test/sentencepiece_test.py || die
}
src_install() {
cmake_src_install
distutils-r1_src_install
strip-lto-bytecode
}
dev-cpp/abseil-cpp:= dev-libs/protobuf:= dev-util/google-perftools !sci-ml/pysentencepiece dev-libs/darts
dev-cpp/abseil-cpp:= dev-libs/protobuf:= dev-util/google-perftools !sci-ml/pysentencepiece
| Type | File | Size | Source URLs |
|---|---|---|---|
| DIST | sentencepiece-0.2.1.tar.gz | 13485527 bytes | https://github.com/google/sentencepiece/archive/refs/tags/v0.2.1.tar.gz |