summary refs log tree commit diff
path: root/textproc/py-tokenizers/Makefile
diff options
context:
space:
mode:
Diffstat (limited to '')
-rw-r--r-- textproc/py-tokenizers/Makefile 23
-rw-r--r-- textproc/py-tokenizers/Makefile.crates 215
2 files changed, 148 insertions, 90 deletions
diff --git a/textproc/py-tokenizers/Makefile b/textproc/py-tokenizers/Makefile
index cec8c52fa266..a2aa44437341 100644
--- a/textproc/py-tokenizers/Makefile
+++ b/textproc/py-tokenizers/Makefile
@@ -1,6 +1,5 @@
PORTNAME= tokenizers
-DISTVERSION= 0.21.1
-PORTREVISION= 2
+DISTVERSION= 0.22.0
CATEGORIES= textproc python
MASTER_SITES= PYPI
PKGNAMEPREFIX= ${PYTHON_PKGNAMEPREFIX}
@@ -15,16 +14,32 @@ LICENSE_FILE= ${WRKSRC}/tokenizers/LICENSE
BUILD_DEPENDS= ${PYTHON_PKGNAMEPREFIX}maturin>=1.0<2.0:devel/py-maturin@${PY_FLAVOR}
RUN_DEPENDS= ${PYTHON_PKGNAMEPREFIX}huggingface-hub>=0.16.4<1.0:misc/py-huggingface-hub@${PY_FLAVOR}
-TEST_DEPENDS= ${LOCALBASE}/libdata/pkgconfig/oniguruma.pc:devel/oniguruma
+TEST_DEPENDS= ${LOCALBASE}/libdata/pkgconfig/oniguruma.pc:devel/oniguruma \
+ ${PYTHON_PKGNAMEPREFIX}numpy>0:math/py-numpy@${PY_FLAVOR} \
+ ${PYTHON_PKGNAMEPREFIX}datasets>0:misc/py-datasets@${PY_FLAVOR} \
+ ${PYTHON_PKGNAMEPREFIX}requests>0:www/py-requests@${PY_FLAVOR}
USES= cargo python
-USE_PYTHON= autoplist pep517
+USE_PYTHON= autoplist pep517 pytest
+PYTEST_BROKEN_TESTS= test_gzip
CARGO_CARGOTOML=${WRKSRC}/bindings/python/Cargo.toml
CARGO_CARGOLOCK=${WRKSRC}/bindings/python/Cargo.lock
CARGO_BUILD= no
CARGO_INSTALL= no
+CARGO_TEST= no
+CARGO_TEST_ARGS= --no-default-features
+
+TEST_ARGS= tests
+TEST_ENV= PYTHONPATH=${STAGEDIR}${PYTHONPREFIX_SITELIBDIR}
BINARY_ALIAS= python3=${PYTHON_CMD}
+TEST_WRKSRC= ${WRKSRC}/bindings/python
+
+post-test:
+ cd ${TEST_WRKSRC} && \
+ ${SETENV} ${MAKE_ENV} ${CARGO_ENV} ${TEST_ENV} ${CARGO} test \
+ --manifest-path ${CARGO_CARGOTOML} --verbose --verbose ${CARGO_TEST_ARGS}
+
.include <bsd.port.mk>
diff --git a/textproc/py-tokenizers/Makefile.crates b/textproc/py-tokenizers/Makefile.crates
index 6fe57601c387..f1c05a287689 100644
--- a/textproc/py-tokenizers/Makefile.crates
+++ b/textproc/py-tokenizers/Makefile.crates
@@ -1,130 +1,173 @@
-CARGO_CRATES= aho-corasick-1.1.3 \
- anstream-0.6.18 \
- anstyle-1.0.10 \
- anstyle-parse-0.2.6 \
- anstyle-query-1.1.2 \
- anstyle-wincon-3.0.6 \
- autocfg-1.4.0 \
+CARGO_CRATES= addr2line-0.24.2 \
+ adler2-2.0.1 \
+ ahash-0.8.12 \
+ aho-corasick-1.1.3 \
+ anstream-0.6.20 \
+ anstyle-1.0.11 \
+ anstyle-parse-0.2.7 \
+ anstyle-query-1.1.4 \
+ anstyle-wincon-3.0.10 \
+ autocfg-1.5.0 \
+ backtrace-0.3.75 \
base64-0.13.1 \
- bitflags-1.3.2 \
- bitflags-2.6.0 \
- bumpalo-3.16.0 \
- byteorder-1.5.0 \
- cc-1.2.6 \
- cfg-if-1.0.0 \
- colorchoice-1.0.3 \
- console-0.15.10 \
+ bitflags-2.9.3 \
+ bumpalo-3.19.0 \
+ castaway-0.2.4 \
+ cc-1.2.34 \
+ cfg-if-1.0.3 \
+ colorchoice-1.0.4 \
+ compact_str-0.9.0 \
+ console-0.15.11 \
crossbeam-deque-0.8.6 \
crossbeam-epoch-0.9.18 \
crossbeam-utils-0.8.21 \
- darling-0.20.10 \
- darling_core-0.20.10 \
- darling_macro-0.20.10 \
+ darling-0.20.11 \
+ darling_core-0.20.11 \
+ darling_macro-0.20.11 \
+ dary_heap-0.3.7 \
derive_builder-0.20.2 \
derive_builder_core-0.20.2 \
derive_builder_macro-0.20.2 \
- either-1.13.0 \
+ either-1.15.0 \
encode_unicode-1.0.0 \
env_filter-0.1.3 \
- env_logger-0.11.6 \
- errno-0.3.10 \
+ env_logger-0.11.8 \
+ errno-0.3.13 \
esaxx-rs-0.1.10 \
fastrand-2.3.0 \
fnv-1.0.7 \
- getrandom-0.2.15 \
+ futures-0.3.31 \
+ futures-channel-0.3.31 \
+ futures-core-0.3.31 \
+ futures-executor-0.3.31 \
+ futures-io-0.3.31 \
+ futures-macro-0.3.31 \
+ futures-sink-0.3.31 \
+ futures-task-0.3.31 \
+ futures-util-0.3.31 \
+ getrandom-0.3.3 \
+ gimli-0.31.1 \
heck-0.5.0 \
- humantime-2.1.0 \
ident_case-1.0.1 \
- indicatif-0.17.9 \
- indoc-2.0.5 \
+ indicatif-0.17.11 \
+ indoc-2.0.6 \
+ io-uring-0.7.10 \
is_terminal_polyfill-1.70.1 \
- itertools-0.11.0 \
- itertools-0.12.1 \
- itertools-0.13.0 \
- itoa-1.0.14 \
- js-sys-0.3.76 \
- lazy_static-1.5.0 \
- libc-0.2.169 \
- linux-raw-sys-0.4.14 \
- log-0.4.22 \
- macro_rules_attribute-0.2.0 \
- macro_rules_attribute-proc_macro-0.2.0 \
- matrixmultiply-0.3.9 \
- memchr-2.7.4 \
+ itertools-0.14.0 \
+ itoa-1.0.15 \
+ jiff-0.2.15 \
+ jiff-static-0.2.15 \
+ js-sys-0.3.77 \
+ libc-0.2.175 \
+ linux-raw-sys-0.9.4 \
+ log-0.4.27 \
+ macro_rules_attribute-0.2.2 \
+ macro_rules_attribute-proc_macro-0.2.2 \
+ matrixmultiply-0.3.10 \
+ memchr-2.7.5 \
memoffset-0.9.1 \
minimal-lexical-0.2.1 \
- monostate-0.1.13 \
- monostate-impl-0.1.13 \
+ miniz_oxide-0.8.9 \
+ mio-1.0.4 \
+ monostate-0.1.14 \
+ monostate-impl-0.1.14 \
ndarray-0.16.1 \
nom-7.1.3 \
num-complex-0.4.6 \
num-integer-0.1.46 \
num-traits-0.2.19 \
number_prefix-0.4.0 \
- numpy-0.23.0 \
- once_cell-1.20.2 \
- onig-6.4.0 \
- onig_sys-69.8.1 \
+ numpy-0.25.0 \
+ object-0.36.7 \
+ once_cell-1.21.3 \
+ once_cell_polyfill-1.70.1 \
+ onig-6.5.1 \
+ onig_sys-69.9.1 \
paste-1.0.15 \
- pkg-config-0.3.31 \
- portable-atomic-1.10.0 \
+ pin-project-lite-0.2.16 \
+ pin-utils-0.1.0 \
+ pkg-config-0.3.32 \
+ portable-atomic-1.11.1 \
portable-atomic-util-0.2.4 \
- ppv-lite86-0.2.20 \
- proc-macro2-1.0.92 \
- pyo3-0.23.5 \
- pyo3-build-config-0.23.5 \
- pyo3-ffi-0.23.5 \
- pyo3-macros-0.23.5 \
- pyo3-macros-backend-0.23.5 \
- quote-1.0.38 \
- rand-0.8.5 \
- rand_chacha-0.3.1 \
- rand_core-0.6.4 \
+ ppv-lite86-0.2.21 \
+ proc-macro2-1.0.101 \
+ pyo3-0.25.1 \
+ pyo3-async-runtimes-0.25.0 \
+ pyo3-build-config-0.25.1 \
+ pyo3-ffi-0.25.1 \
+ pyo3-macros-0.25.1 \
+ pyo3-macros-backend-0.25.1 \
+ quote-1.0.40 \
+ r-efi-5.3.0 \
+ rand-0.9.2 \
+ rand_chacha-0.9.0 \
+ rand_core-0.9.3 \
rawpointer-0.2.1 \
- rayon-1.10.0 \
- rayon-cond-0.3.0 \
- rayon-core-1.12.1 \
- regex-1.11.1 \
- regex-automata-0.4.9 \
- regex-syntax-0.8.5 \
- rustc-hash-2.1.0 \
- rustix-0.38.42 \
- ryu-1.0.18 \
- serde-1.0.217 \
- serde_derive-1.0.217 \
- serde_json-1.0.134 \
+ rayon-1.11.0 \
+ rayon-cond-0.4.0 \
+ rayon-core-1.13.0 \
+ regex-1.11.2 \
+ regex-automata-0.4.10 \
+ regex-syntax-0.8.6 \
+ rustc-demangle-0.1.26 \
+ rustc-hash-2.1.1 \
+ rustix-1.0.8 \
+ rustversion-1.0.22 \
+ ryu-1.0.20 \
+ serde-1.0.219 \
+ serde_derive-1.0.219 \
+ serde_json-1.0.143 \
shlex-1.3.0 \
- smallvec-1.13.2 \
+ signal-hook-registry-1.4.6 \
+ slab-0.4.11 \
+ smallvec-1.15.1 \
spm_precompiled-0.1.4 \
+ static_assertions-1.1.0 \
strsim-0.11.1 \
- syn-2.0.93 \
- target-lexicon-0.12.16 \
- tempfile-3.14.0 \
- thiserror-2.0.9 \
- thiserror-impl-2.0.9 \
- unicode-ident-1.0.14 \
+ syn-2.0.106 \
+ target-lexicon-0.13.2 \
+ tempfile-3.21.0 \
+ thiserror-2.0.16 \
+ thiserror-impl-2.0.16 \
+ tokio-1.47.1 \
+ tokio-macros-2.5.0 \
+ unicode-ident-1.0.18 \
unicode-normalization-alignments-0.1.12 \
unicode-segmentation-1.12.0 \
- unicode-width-0.2.0 \
+ unicode-width-0.2.1 \
unicode_categories-0.1.1 \
- unindent-0.2.3 \
+ unindent-0.2.4 \
utf8parse-0.2.2 \
- wasi-0.11.0+wasi-snapshot-preview1 \
- wasm-bindgen-0.2.99 \
- wasm-bindgen-backend-0.2.99 \
- wasm-bindgen-macro-0.2.99 \
- wasm-bindgen-macro-support-0.2.99 \
- wasm-bindgen-shared-0.2.99 \
+ version_check-0.9.5 \
+ wasi-0.11.1+wasi-snapshot-preview1 \
+ wasi-0.14.3+wasi-0.2.4 \
+ wasm-bindgen-0.2.100 \
+ wasm-bindgen-backend-0.2.100 \
+ wasm-bindgen-macro-0.2.100 \
+ wasm-bindgen-macro-support-0.2.100 \
+ wasm-bindgen-shared-0.2.100 \
web-time-1.1.0 \
+ windows-link-0.1.3 \
windows-sys-0.59.0 \
+ windows-sys-0.60.2 \
windows-targets-0.52.6 \
+ windows-targets-0.53.3 \
windows_aarch64_gnullvm-0.52.6 \
+ windows_aarch64_gnullvm-0.53.0 \
windows_aarch64_msvc-0.52.6 \
+ windows_aarch64_msvc-0.53.0 \
windows_i686_gnu-0.52.6 \
+ windows_i686_gnu-0.53.0 \
windows_i686_gnullvm-0.52.6 \
+ windows_i686_gnullvm-0.53.0 \
windows_i686_msvc-0.52.6 \
+ windows_i686_msvc-0.53.0 \
windows_x86_64_gnu-0.52.6 \
+ windows_x86_64_gnu-0.53.0 \
windows_x86_64_gnullvm-0.52.6 \
+ windows_x86_64_gnullvm-0.53.0 \
windows_x86_64_msvc-0.52.6 \
- zerocopy-0.7.35 \
- zerocopy-derive-0.7.35
+ windows_x86_64_msvc-0.53.0 \
+ wit-bindgen-0.45.0 \
+ zerocopy-0.8.26 \
+ zerocopy-derive-0.8.26