{"bugs":[],"categories":[{"categoryid":450,"name":"dev-lang","summary":"The dev-lang category contains various programming language implementations and related tools."},{"categoryid":393,"name":"dev-libs","summary":"The dev-libs category contains various miscellaneous programming libraries."},{"categoryid":1597,"name":"sci-ml","summary":"The sci-ml category contains software and models that can be used for machine learning, natural language processing and similar"}],"changelog":[{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"506b570bac56b0e780ab9440f091e2e1e4f9719d","committime":"2025-11-21T20:30:48","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"cc17fc9c3c6000cdaf75002c5485ea5eb2bd05d7","committime":"2025-11-21T20:18:11","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: drop 0.21.4"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"fac1752607e77cf244fd7c846a99924f1fdad741","committime":"2025-09-25T17:33:38","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"ee41170140a8b1e4d97fc40eee8123acbe1bbe18","committime":"2025-09-25T17:27:44","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: add 0.22.1, drop 0.22.0"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"c0cf82cb45eb025ca2e676575dc37bd72b336471","committime":"2025-09-11T18:49:08","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"34ff68eb3224cbc7feb8046b134185d085dfa1be","committime":"2025-09-11T18:25:55","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: add 0.22.0"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"2b13bad5ef6ec58fff0c8e5dffb0b01e138431ee","committime":"2025-09-11T10:03:55","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"a05acc42551b68644bd7483f8c0095b98b9afb1f","committime":"2025-09-11T09:48:33","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: drop 0.21.0"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"4e7126b24a8bb478e22d59098ba05ed711fd3c6a","committime":"2025-09-11T09:47:10","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: add 0.21.4, rm 0.21.1-r1"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"577250a24536444f6fd497b0b64b40cb31c43fe7","committime":"2025-04-06T20:50:20","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"658f2ff4e204dba823e395f8649f7c42425e880a","committime":"2025-04-06T20:39:46","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: drop test failing in sandbox"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"b51356113421ae379e59ecd2dba22da4bfac9729","committime":"2025-04-06T15:55:05","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Closes: https:\/\/bugs.gentoo.org\/944852\nSigned-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"d30c629a79cd779ce24dfcdacea59edee57982f2","committime":"2025-04-06T13:20:46","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: fix for gcc-15"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"6f08fa0900f0a55f6a384d2d3ea3b710e891e076","committime":"2025-04-04T21:35:20","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"d960ba732ad4cd52bd21b1cbc265e3e327b11e50","committime":"2025-04-04T21:16:28","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: add 0.21.1"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"1a670c33cf1308b203648b3a19365fed766bd6d8","committime":"2025-04-02T10:50:15","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Closes: https:\/\/bugs.gentoo.org\/952696\nSigned-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"ed2bb3840ffd49fb2b5af3f4a98b28ea34c68579","committime":"2025-04-02T10:38:04","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: enable py3.13"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"ba6bc1b3ddaca15346ab88c427eef7cc8fd32318","committime":"2025-04-02T06:50:09","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"9f338745b0afa5209cefd3ac280616bc4e974ff2","committime":"2025-04-02T06:36:02","packageid":78202,"repoid":1,"summary":"sci-ml\/tokenizers: drop 0.20.1-r1"},{"authoremail":"repomirrorci@gentoo.org","authorname":"Repository mirror & CI","commitid":"6ef7ac681005cce5d994e80fa19330bb286897e4","committime":"2025-03-14T20:33:18","packageid":78202,"repoid":1,"summary":"Merge updates from master"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"d29b62cf9182d0ad45e92776e3b120c43b7a6f92","committime":"2025-03-14T20:23:56","packageid":78202,"repoid":1,"summary":"sci-ml\/*: mv sci-libs\/datasets to sci-ml\/"},{"authoremail":"tupone@gentoo.org","authorname":"Alfredo Tupone","body":"Signed-off-by: Alfredo Tupone <tupone@gentoo.org>","commitid":"ade42174a98ce3bb50ff879441a8d5c8184ed5a9","committime":"2025-03-14T20:16:36","packageid":78202,"repoid":1,"summary":"sci-ml\/*: mv sci-libs\/tokenizer to sci-ml\/"}],"dependencies":[{"block":false,"categoryid":450,"description":"An interpreted, interactive, object-oriented programming language","ebuildids":[877021,877021,877021],"firstseen":"2010-05-04T00:54:45.661860","maintainer":"python@gentoo.org","maintainername":"Python","name":"python","packageid":43095}],"depending":[{"block":false,"categoryid":1597,"description":"State-of-the-art Machine Learning for JAX, PyTorch and TensorFlow","ebuildids":[890088,893914],"firstseen":"2025-03-14T20:23:55.878103","name":"transformers","packageid":78201}],"ebuilds":[{"archs":["~amd64"],"ebuildid":877021,"firstseen":"2025-09-25T18:52:35.399782","license":"Apache-2.0 Apache-2.0 Apache-2.0-with-LLVM-exceptions BSD-2 BSD ISC MIT MPL-2.0 Unicode-DFS-2016","moddate":"2026-03-31T06:53:54","packageid":78202,"repoid":1,"slot":"0","uses":["debug","python_single_target_python3_11","python_single_target_python3_12","python_single_target_python3_13","test"],"version":"0.22.1"}],"masks":[],"package":{"categoryid":1597,"description":"Implementation of today's most used tokenizers","firstseen":"2025-03-14T20:43:59.868749","name":"tokenizers","packageid":78202},"rdependencies":[{"block":false,"categoryid":450,"description":"An interpreted, interactive, object-oriented programming language","ebuildids":[877021,877021,877021],"firstseen":"2010-05-04T00:54:45.661860","maintainer":"python@gentoo.org","maintainername":"Python","name":"python","packageid":43095},{"block":false,"categoryid":393,"description":"Regular expression library for different character encodings","ebuildids":[877021],"firstseen":"2010-05-04T00:54:45.661860","maintainer":"cjk@gentoo.org","maintainername":"Cjk","name":"oniguruma","packageid":53410,"summary":"Oniguruma is a regular expression library. The characteristics of this library is that different character encoding for every regular expression object can be specified. (Supported character encodings: ASCII, UTF-8, EUC-JP, Shift_JIS)"}],"repos":[{"branch":"master","lastcommit":"82366aa45a35f6900f43023917c2c86ccdbb00a3","name":"gentoo","path":"\/usr\/portage","repoid":1,"upstream":"origin"}],"tracked":false,"urls":["https:\/\/github.com\/huggingface\/tokenizers"],"uses":[{"description":"Enable extra debug codepaths, like asserts and extra output. If you want to get meaningful backtraces see https:\/\/wiki.gentoo.org\/wiki\/Project:Quality_Assurance\/Backtraces","isdefault":false,"use":"debug"},{"description":"Enable dependencies and\/or preparations necessary to run tests (usually controlled by FEATURES=test but can be toggled independently)","isdefault":false,"use":"test"},{"description":"Build for Python 3.11 only","group":"python_single_target","isdefault":false,"use":"python3_11"},{"description":"Build for Python 3.12 only","group":"python_single_target","isdefault":false,"use":"python3_12"},{"description":"Build for Python 3.13 only","group":"python_single_target","isdefault":false,"use":"python3_13"}]}