Install this version:
emerge -a =sci-ml/fastflowlm-0.9.43-r1
If this version is masked, you can unmask it using the autounmask tool or standard emerge options:
autounmask =sci-ml/fastflowlm-0.9.43-r1
Or alternatively:
emerge --autounmask-write -a =sci-ml/fastflowlm-0.9.43-r1
| Version | EAPI | Keywords | Slot |
|---|---|---|---|
| 0.9.43-r1 | 8 | ~amd64 | 0 |
# Copyright 2026 Gentoo Authors
# Distributed under the terms of the GNU General Public License v2
EAPI=8
inherit cmake systemd
DESCRIPTION="NPU-first LLM runtime for AMD Ryzen AI (XDNA2) processors"
HOMEPAGE="
https://fastflowlm.com/
https://github.com/FastFlowLM/FastFlowLM
"
# Submodule commit pins. tokenizers-cpp reverted to acbdc5a in 0.9.43
# (0.9.42 had bumped to 34885cf); nested sentencepiece + msgpack pins
# at acbdc5a still match the existing values.
TOKENIZERS_CPP_COMMIT="acbdc5a27ae01ba74cda756f94da698d40f11dfe"
SENTENCEPIECE_COMMIT="11051e3b73b3a6222a52acd720e39805dc7545ab"
MSGPACK_COMMIT="092bc69b6e815980bce7808595c914dd3a29f905"
SRC_URI="
https://github.com/FastFlowLM/FastFlowLM/archive/refs/tags/v${PV}.tar.gz
-> ${P}.tar.gz
https://github.com/mlc-ai/tokenizers-cpp/archive/${TOKENIZERS_CPP_COMMIT}.tar.gz
-> tokenizers-cpp-${TOKENIZERS_CPP_COMMIT}.tar.gz
https://github.com/google/sentencepiece/archive/${SENTENCEPIECE_COMMIT}.tar.gz
-> sentencepiece-${SENTENCEPIECE_COMMIT}.tar.gz
https://github.com/msgpack/msgpack-c/archive/${MSGPACK_COMMIT}.tar.gz
-> msgpack-c-${MSGPACK_COMMIT}.tar.gz
"
S="${WORKDIR}/FastFlowLM-${PV}"
# Orchestration / CLI is MIT (LICENSE_RUNTIME.txt); NPU compute kernels
# (xclbins) are proprietary (LICENSE_BINARY.txt → FastFlowLM-Binary).
LICENSE="MIT FastFlowLM-Binary"
SLOT="0"
KEYWORDS="~amd64"
IUSE="openrc systemd"
# Cargo (inside tokenizers-cpp/rust) fetches crates at build time.
# Proper GURU submission would require pre-vendored crates via cargo.eclass.
PROPERTIES="live"
RESTRICT="network-sandbox"
BDEPEND="
>=dev-build/cmake-3.22
dev-build/ninja
|| ( dev-lang/rust dev-lang/rust-bin )
"
RDEPEND="
dev-util/xrt
dev-libs/xdna-driver
dev-libs/xrt-xdna
media-video/ffmpeg:=
net-misc/curl:=
dev-libs/boost:=
sci-libs/fftw:3.0=
sys-libs/readline:=
"
DEPEND="${RDEPEND}"
CMAKE_USE_DIR="${S}/src"
src_unpack() {
default
rmdir "${S}/third_party/tokenizers-cpp" || die
mv "${WORKDIR}/tokenizers-cpp-${TOKENIZERS_CPP_COMMIT}" \
"${S}/third_party/tokenizers-cpp" || die
rmdir "${S}/third_party/tokenizers-cpp/sentencepiece" || die
mv "${WORKDIR}/sentencepiece-${SENTENCEPIECE_COMMIT}" \
"${S}/third_party/tokenizers-cpp/sentencepiece" || die
rmdir "${S}/third_party/tokenizers-cpp/msgpack" || die
mv "${WORKDIR}/msgpack-c-${MSGPACK_COMMIT}" \
"${S}/third_party/tokenizers-cpp/msgpack" || die
}
src_prepare() {
# Drop upstream's symlink-into-/usr/local/bin block; we provide our
# own wrapper via newbin + env.d below.
sed -i '/if.*NOT WIN32.*CMAKE_INSTALL_PREFIX/,/endif()/d' \
"${S}/src/CMakeLists.txt" || die
cmake_src_prepare
}
src_configure() {
# FLM_VERSION + NPU_VERSION + CMAKE_XCLBIN_PREFIX are set by the
# linux-default cmake preset upstream; we set them here directly
# because we don't drive the build via the preset. NPU_VERSION on
# Linux only satisfies a CMake guard (it's the Windows NPU driver
# version). CMAKE_XCLBIN_PREFIX must match the install rule
# (DESTINATION share/flm at src/CMakeLists.txt:345): without it the
# runtime's find_xclbin_path() falls back to dirname(/proc/self/exe)
# and looks for xclbins under bin/ instead of share/flm/ (#269).
# verified 2026-05-27 against fastflowlm-0.9.43 src/CMakeLists.txt
# (byte-identical to 0.9.42)
local mycmakeargs=(
-DCMAKE_INSTALL_PREFIX="/opt/fastflowlm"
-DCMAKE_XCLBIN_PREFIX="/opt/fastflowlm/share/flm"
-DFLM_VERSION="${PV}"
-DNPU_VERSION="32.0.203.304"
)
cmake_src_configure
}
src_install() {
cmake_src_install
# Wrapper so flm finds XRT and its own libs at runtime
# (lemonade-sdk/lemonade#1315).
newbin - flm <<-'EOF'
#!/usr/bin/env bash
set -euo pipefail
export LD_LIBRARY_PATH="/opt/fastflowlm/lib:/opt/xilinx/xrt/lib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"
export FLM_CONFIG_PATH="${FLM_CONFIG_PATH:-/opt/fastflowlm/share/flm/model_list.json}"
exec /opt/fastflowlm/bin/flm "$@"
EOF
# Helper that patches HuggingFace Whisper config.json so FLM's
# decoder-only LM_Config validator doesn't crash on it. Idempotent;
# user runs once after `flm pull whisper-v3:turbo`.
# Upstream bug: https://github.com/FastFlowLM/FastFlowLM/issues/545
newbin "${FILESDIR}/flm-patch-whisper" flm-patch-whisper
newenvd - 99fastflowlm <<-'EOF'
LDPATH="/opt/fastflowlm/lib"
PATH="/opt/fastflowlm/bin"
FLM_CONFIG_PATH="/opt/fastflowlm/share/flm/model_list.json"
EOF
if use openrc; then
newinitd "${FILESDIR}/${PN}.initd" "${PN}"
newconfd "${FILESDIR}/${PN}.confd" "${PN}"
fi
if use systemd; then
systemd_newunit "${FILESDIR}/${PN}.service" "${PN}@.service"
fi
}
pkg_postinst() {
elog ""
elog "FastFlowLM ${PV} installed to /opt/fastflowlm."
elog ""
elog "Quick start (manual):"
elog " flm validate # verify NPU stack"
elog " flm pull llama3.2:3b # download a model"
elog " flm run llama3.2:3b # chat with it"
elog ""
if use openrc; then
elog "OpenRC service (supervise-daemon; rlimit_memlock=unlimited set):"
elog " edit /etc/conf.d/fastflowlm and set FLM_USER (required)"
elog " other tunables (model, sidecars, port) have safe defaults"
elog " rc-service fastflowlm start"
elog " rc-update add fastflowlm default # auto-start at boot"
elog ""
fi
if use systemd; then
elog "systemd template service (one instance per user, mlock unlimited):"
elog " optionally create /etc/default/fastflowlm@<user> to override"
elog " FLM_MODEL / FLM_HOST / FLM_PORT / FLM_PMODE / FLM_ASR /"
elog " FLM_EMBED / FLM_EXTRA_OPTS"
elog " systemctl enable --now fastflowlm@<user>.service"
elog ""
fi
elog "Models stored in ~/.config/flm/ (override: FLM_MODEL_PATH)."
elog ""
elog "Ensure memlock is unlimited for INTERACTIVE 'flm run' use too."
if use openrc || use systemd; then
elog "(The installed service unit already sets memlock to unlimited.)"
fi
elog "If 'ulimit -l' is not 'unlimited' in your shell, add to"
elog "/etc/security/limits.d/99-amdxdna.conf:"
elog " * soft memlock unlimited"
elog " * hard memlock unlimited"
elog ""
ewarn ""
ewarn "Whisper ASR models (whisper-v3:turbo, ...) crash flm at startup"
ewarn "until their config.json is patched: FLM's LM_Config validator"
ewarn "asserts on decoder-only LM-shape fields that HuggingFace Whisper"
ewarn "configs don't carry."
ewarn "Upstream bug: https://github.com/FastFlowLM/FastFlowLM/issues/545"
ewarn ""
ewarn "After 'flm pull whisper-v3:turbo' (or any Whisper model), run"
ewarn " flm-patch-whisper"
ewarn "to patch the downloaded config.json idempotently."
ewarn ""
elog "Run 'env-update && source /etc/profile' to pick up paths."
}
Manage flags for this package:
euse -i <flag> -p sci-ml/fastflowlm |
euse -E <flag> -p sci-ml/fastflowlm |
euse -D <flag> -p sci-ml/fastflowlm
dev-util/xrt dev-libs/xdna-driver dev-libs/xrt-xdna media-video/ffmpeg:= net-misc/curl:= dev-libs/boost:= sci-libs/fftw:3.0= sys-libs/readline:=
dev-util/xrt dev-libs/xdna-driver dev-libs/xrt-xdna media-video/ffmpeg:= net-misc/curl:= dev-libs/boost:= sci-libs/fftw:3.0= sys-libs/readline:=
>=dev-build/cmake-3.22 dev-build/ninja || ( dev-lang/rust dev-lang/rust-bin )