{"@context":"https://w3id.org/codemeta/3.0","@type":"SoftwareSourceCode","identifier":"pkg:pypi/python-ucto","name":"python-ucto","description":"This is a Python binding to the tokenizer Ucto. Tokenisation is one of the first steps in almost any Natural Language Processing task, yet it is not always as trivial a task as it appears to be. This binding makes the power of the ucto tokeniser available to Python. Ucto itself is a regular-expression based, extensible, and advanced tokeniser written in C++ (https://languagemachines.github.io/ucto).","version":"0.6.10","softwareVersion":"0.6.10","license":"https://spdx.org/licenses/GPL-3.0-only","codeRepository":"https://github.com/proycon/python-ucto","issueTracker":"https://github.com/proycon/python-ucto/issues","url":"https://github.com/proycon/python-ucto","keywords":["tokenizer","tokenization","tokeniser","tokenisation","nlp","computational_linguistics","ucto"],"programmingLanguage":{"@type":"ComputerLanguage","name":"Cython"},"maintainer":[{"@type":"Person","name":"proycon"}],"author":[{"@type":"Person","name":"proycon"}],"copyrightHolder":[{"@type":"Person","name":"proycon"}],"dateCreated":"2015-01-29","dateModified":"2026-02-02","datePublished":"2026-02-02","copyrightYear":2015,"downloadUrl":"https://files.pythonhosted.org/packages/d4/5c/6b3cf49a22fa3fa8230c7d642b5f4a8f6248c630ddb6ea2329ea358908ff/python_ucto-0.6.10-cp310-cp310-macosx_14_0_arm64.whl","softwareHelp":{"@type":"WebSite","url":"https://python-ucto.readthedocs.io/"},"applicationCategory":"pypi","runtimePlatform":"pypi","developmentStatus":"active","sameAs":["https://pypi.org/project/python-ucto/"],"https://www.w3.org/ns/activitystreams#likes":29,"https://forgefed.org/ns#forks":5}