python-ucto


Namepython-ucto JSON
Version 0.6.9 PyPI version JSON
download
home_pagehttps://github.com/proycon/python-ucto
SummaryThis is a Python binding to the tokenizer Ucto. Tokenisation is one of the first steps in almost any Natural Language Processing task, yet it is not always as trivial a task as it appears to be. This binding makes the power of the ucto tokeniser available to Python. Ucto itself is a regular-expression based, extensible, and advanced tokeniser written in C++ (https://languagemachines.github.io/ucto).
upload_time2024-12-17 11:56:39
maintainerNone
docs_urlNone
authorMaarten van Gompel
requires_pythonNone
licenseGPLv3
keywords tokenizer tokenization tokeniser tokenisation nlp computational_linguistics ucto
VCS
bugtrack_url
requirements Cython
Travis-CI No Travis.
coveralls test coverage No coveralls.
            
            

Raw data

            {
    "_id": null,
    "home_page": "https://github.com/proycon/python-ucto",
    "name": "python-ucto",
    "maintainer": null,
    "docs_url": null,
    "requires_python": null,
    "maintainer_email": null,
    "keywords": "tokenizer tokenization tokeniser tokenisation nlp computational_linguistics ucto",
    "author": "Maarten van Gompel",
    "author_email": "proycon@anaproy.nl",
    "download_url": "https://files.pythonhosted.org/packages/1f/af/4389468a5d4a0492469f088f9bc559898994cbe1423f8f6f9d60bf683d5c/python_ucto-0.6.9.tar.gz",
    "platform": null,
    "description": "",
    "bugtrack_url": null,
    "license": "GPLv3",
    "summary": "This is a Python binding to the tokenizer Ucto. Tokenisation is one of the first step in almost any Natural Language Processing task, yet it is not always as trivial a task as it appears to be. This binding makes the power of the ucto tokeniser available to Python. Ucto itself is a regular-expression based, extensible, and advanced tokeniser written in C++ (https://languagemachines.github.io/ucto).",
    "version": "0.6.9",
    "project_urls": {
        "Homepage": "https://github.com/proycon/python-ucto"
    },
    "split_keywords": [
        "tokenizer",
        "tokenization",
        "tokeniser",
        "tokenisation",
        "nlp",
        "computational_linguistics",
        "ucto"
    ],
    "urls": [
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "dadc1e7a93fe79c206448cda884c333c3c932b7ef4147702c1cdb763fd600fc6",
                "md5": "8b3a83b6f7f18823b46fe6ae719928c7",
                "sha256": "6c8e9899b453999c7cea3ccaea5319ba0486150005dd1dbe9b0108502d057c74"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp310-cp310-macosx_14_0_arm64.whl",
            "has_sig": false,
            "md5_digest": "8b3a83b6f7f18823b46fe6ae719928c7",
            "packagetype": "bdist_wheel",
            "python_version": "cp310",
            "requires_python": null,
            "size": 15976951,
            "upload_time": "2024-12-17T12:00:44",
            "upload_time_iso_8601": "2024-12-17T12:00:44.187373Z",
            "url": "https://files.pythonhosted.org/packages/da/dc/1e7a93fe79c206448cda884c333c3c932b7ef4147702c1cdb763fd600fc6/python_ucto-0.6.9-cp310-cp310-macosx_14_0_arm64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "a3bb3a29a4370d7bf685ce603067b20a1078ed290199fe6790ed255ab9f3503f",
                "md5": "e9114bfb10d53b3e726a6fbea9a6d304",
                "sha256": "3f56bba3d900b074042a5ec0856695137ca64389bcdf4a22980b61c5b035fe65"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp310-cp310-musllinux_1_1_x86_64.whl",
            "has_sig": false,
            "md5_digest": "e9114bfb10d53b3e726a6fbea9a6d304",
            "packagetype": "bdist_wheel",
            "python_version": "cp310",
            "requires_python": null,
            "size": 27013358,
            "upload_time": "2024-12-17T12:01:04",
            "upload_time_iso_8601": "2024-12-17T12:01:04.528707Z",
            "url": "https://files.pythonhosted.org/packages/a3/bb/3a29a4370d7bf685ce603067b20a1078ed290199fe6790ed255ab9f3503f/python_ucto-0.6.9-cp310-cp310-musllinux_1_1_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "764bd442afb2d7239926718af79ff4d63c449f959a780e922fc1e6c87a8cba33",
                "md5": "04e7e4f0f667c21e32fae707a152f07d",
                "sha256": "664fa27b6c55200debdfef1cc6a552f037794796dd06cdfcb5b16be97da4f182"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp311-cp311-macosx_14_0_arm64.whl",
            "has_sig": false,
            "md5_digest": "04e7e4f0f667c21e32fae707a152f07d",
            "packagetype": "bdist_wheel",
            "python_version": "cp311",
            "requires_python": null,
            "size": 15977107,
            "upload_time": "2024-12-17T12:01:09",
            "upload_time_iso_8601": "2024-12-17T12:01:09.931941Z",
            "url": "https://files.pythonhosted.org/packages/76/4b/d442afb2d7239926718af79ff4d63c449f959a780e922fc1e6c87a8cba33/python_ucto-0.6.9-cp311-cp311-macosx_14_0_arm64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "6e51ed1974dacdd61876c6149b1f9c07c33fc9b1139cc4af9b8f0a1508127fb9",
                "md5": "e7357edfe2efcedf2b6eb78ab8e36e9a",
                "sha256": "e07ae25c31d3340c523f5f3d373dc4c8c1a5cf2f3783b4e3d454984f9b6cbe5c"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp311-cp311-musllinux_1_1_x86_64.whl",
            "has_sig": false,
            "md5_digest": "e7357edfe2efcedf2b6eb78ab8e36e9a",
            "packagetype": "bdist_wheel",
            "python_version": "cp311",
            "requires_python": null,
            "size": 27044369,
            "upload_time": "2024-12-17T12:01:15",
            "upload_time_iso_8601": "2024-12-17T12:01:15.770653Z",
            "url": "https://files.pythonhosted.org/packages/6e/51/ed1974dacdd61876c6149b1f9c07c33fc9b1139cc4af9b8f0a1508127fb9/python_ucto-0.6.9-cp311-cp311-musllinux_1_1_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "4284694cbabbfe490d797168c8d3fe79fbb15ecb9a3a8e77d2f7f28267d555e0",
                "md5": "6643ee2581898f5dcd1cdff77fc6782f",
                "sha256": "b0302be43a5c10cff34c383c1ad60636c0da44baf2fee8b455e9efd4d4589532"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp312-cp312-macosx_14_0_arm64.whl",
            "has_sig": false,
            "md5_digest": "6643ee2581898f5dcd1cdff77fc6782f",
            "packagetype": "bdist_wheel",
            "python_version": "cp312",
            "requires_python": null,
            "size": 15976494,
            "upload_time": "2024-12-17T12:01:22",
            "upload_time_iso_8601": "2024-12-17T12:01:22.102780Z",
            "url": "https://files.pythonhosted.org/packages/42/84/694cbabbfe490d797168c8d3fe79fbb15ecb9a3a8e77d2f7f28267d555e0/python_ucto-0.6.9-cp312-cp312-macosx_14_0_arm64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "808f483f68ed7e677a86fbd01cc661985fc4db9d923bf266d33f4de4f9aae2b6",
                "md5": "e89f9b1f27ffb04742224db220ee24a3",
                "sha256": "33a5f7adcba4f320430bbab98c12431f25e872eaf3ee9d3c0a0f96123fa6ae78"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp312-cp312-musllinux_1_1_x86_64.whl",
            "has_sig": false,
            "md5_digest": "e89f9b1f27ffb04742224db220ee24a3",
            "packagetype": "bdist_wheel",
            "python_version": "cp312",
            "requires_python": null,
            "size": 27037041,
            "upload_time": "2024-12-17T12:01:30",
            "upload_time_iso_8601": "2024-12-17T12:01:30.575797Z",
            "url": "https://files.pythonhosted.org/packages/80/8f/483f68ed7e677a86fbd01cc661985fc4db9d923bf266d33f4de4f9aae2b6/python_ucto-0.6.9-cp312-cp312-musllinux_1_1_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "624173a8bc3fe41d94cf2607301f6bf7c80df25353c46c6594c79d3b60c650e3",
                "md5": "aea56e20e3f192a36d52b576c4749a99",
                "sha256": "b1274855d64f4345468d2f90a558b31ba1b30a06973210727c659bd276c3242c"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp313-cp313-macosx_14_0_arm64.whl",
            "has_sig": false,
            "md5_digest": "aea56e20e3f192a36d52b576c4749a99",
            "packagetype": "bdist_wheel",
            "python_version": "cp313",
            "requires_python": null,
            "size": 15975211,
            "upload_time": "2024-12-17T12:01:35",
            "upload_time_iso_8601": "2024-12-17T12:01:35.100831Z",
            "url": "https://files.pythonhosted.org/packages/62/41/73a8bc3fe41d94cf2607301f6bf7c80df25353c46c6594c79d3b60c650e3/python_ucto-0.6.9-cp313-cp313-macosx_14_0_arm64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "bcb973f9c492df11d35bf58ef5b2e0858cb6b4bb0e63780e84cf0cc11f685623",
                "md5": "6158012fe39ca5e0efb2d0c8eb7ee022",
                "sha256": "6904263bdf1c7a5f8fc069118fdda55ac3d61026d5279895f95d0b50e1b2b8bf"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp313-cp313-manylinux_2_28_x86_64.whl",
            "has_sig": false,
            "md5_digest": "6158012fe39ca5e0efb2d0c8eb7ee022",
            "packagetype": "bdist_wheel",
            "python_version": "cp313",
            "requires_python": null,
            "size": 25081709,
            "upload_time": "2024-12-17T12:01:39",
            "upload_time_iso_8601": "2024-12-17T12:01:39.924646Z",
            "url": "https://files.pythonhosted.org/packages/bc/b9/73f9c492df11d35bf58ef5b2e0858cb6b4bb0e63780e84cf0cc11f685623/python_ucto-0.6.9-cp313-cp313-manylinux_2_28_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "16a519fb930e0ad74bd3ae156685b63ad49728ff06a0455fff51ca10ddecb9f1",
                "md5": "aa640d54a7d26d56bae80a8579e31ddd",
                "sha256": "240234ee0ca0757b9ec743dc9076619d2b9c3f0b66799cb58b1af5b6dcce755f"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp313-cp313-musllinux_1_1_x86_64.whl",
            "has_sig": false,
            "md5_digest": "aa640d54a7d26d56bae80a8579e31ddd",
            "packagetype": "bdist_wheel",
            "python_version": "cp313",
            "requires_python": null,
            "size": 27034802,
            "upload_time": "2024-12-17T12:01:46",
            "upload_time_iso_8601": "2024-12-17T12:01:46.391311Z",
            "url": "https://files.pythonhosted.org/packages/16/a5/19fb930e0ad74bd3ae156685b63ad49728ff06a0455fff51ca10ddecb9f1/python_ucto-0.6.9-cp313-cp313-musllinux_1_1_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "435c55830da67f12322d60dbdb190b6c65e2a197dd04004b5511fd5c3d0f6137",
                "md5": "f76f6d14ca3bf28e630f622cb59c5e31",
                "sha256": "bcdc57963569823a1d045aa2b06f3f8b33482451e93e7daa9312938c409b75a0"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp38-cp38-manylinux_2_28_x86_64.whl",
            "has_sig": false,
            "md5_digest": "f76f6d14ca3bf28e630f622cb59c5e31",
            "packagetype": "bdist_wheel",
            "python_version": "cp38",
            "requires_python": null,
            "size": 25070479,
            "upload_time": "2024-12-17T12:01:53",
            "upload_time_iso_8601": "2024-12-17T12:01:53.786012Z",
            "url": "https://files.pythonhosted.org/packages/43/5c/55830da67f12322d60dbdb190b6c65e2a197dd04004b5511fd5c3d0f6137/python_ucto-0.6.9-cp38-cp38-manylinux_2_28_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "ad41b65b831360c439cc22da102168f523338ea076f15772ea8c7c151511feb3",
                "md5": "d7e0d969bf8537f099e1d8dc975df0cf",
                "sha256": "bfbdc816edef7b87bf7f2317e464a0b30e2510475638520db425ff95a8431ea8"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp38-cp38-musllinux_1_1_x86_64.whl",
            "has_sig": false,
            "md5_digest": "d7e0d969bf8537f099e1d8dc975df0cf",
            "packagetype": "bdist_wheel",
            "python_version": "cp38",
            "requires_python": null,
            "size": 27028545,
            "upload_time": "2024-12-17T12:01:59",
            "upload_time_iso_8601": "2024-12-17T12:01:59.173524Z",
            "url": "https://files.pythonhosted.org/packages/ad/41/b65b831360c439cc22da102168f523338ea076f15772ea8c7c151511feb3/python_ucto-0.6.9-cp38-cp38-musllinux_1_1_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "abef8912c8c7f28352636449b9151ba6edb95ba4ad2f4e7bbdafb8d92e985134",
                "md5": "da917d9bd114172a9d8ece7445a7baa0",
                "sha256": "53415b668092d8d1d11c19c60f0cbd13b1fbd227da05017bdda0f64af600a2d3"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp39-cp39-macosx_14_0_arm64.whl",
            "has_sig": false,
            "md5_digest": "da917d9bd114172a9d8ece7445a7baa0",
            "packagetype": "bdist_wheel",
            "python_version": "cp39",
            "requires_python": null,
            "size": 15977225,
            "upload_time": "2024-12-17T12:02:04",
            "upload_time_iso_8601": "2024-12-17T12:02:04.683032Z",
            "url": "https://files.pythonhosted.org/packages/ab/ef/8912c8c7f28352636449b9151ba6edb95ba4ad2f4e7bbdafb8d92e985134/python_ucto-0.6.9-cp39-cp39-macosx_14_0_arm64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "60f55a154396a00374c9a4834490e32a665fc7b5333b489495ce2a6300cdff33",
                "md5": "70439255fe30cc9df3cad0f769beada8",
                "sha256": "56a681aaadf7a15c223682eb950a36e2c2e54a7f0b4a0ef41294c1920cfda08a"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp39-cp39-manylinux_2_28_x86_64.whl",
            "has_sig": false,
            "md5_digest": "70439255fe30cc9df3cad0f769beada8",
            "packagetype": "bdist_wheel",
            "python_version": "cp39",
            "requires_python": null,
            "size": 25062941,
            "upload_time": "2024-12-17T12:02:09",
            "upload_time_iso_8601": "2024-12-17T12:02:09.588329Z",
            "url": "https://files.pythonhosted.org/packages/60/f5/5a154396a00374c9a4834490e32a665fc7b5333b489495ce2a6300cdff33/python_ucto-0.6.9-cp39-cp39-manylinux_2_28_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "af146c707c30eb82b046e832aae1b99d109e8f8cca854cbcd9cbaea995c6ac25",
                "md5": "2ce7776257e51a08d80dad5d59295acd",
                "sha256": "bf692d0819fe3e2d82707f8e6000f17e15df3714e61c657e99f19d24b1ca4309"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9-cp39-cp39-musllinux_1_1_x86_64.whl",
            "has_sig": false,
            "md5_digest": "2ce7776257e51a08d80dad5d59295acd",
            "packagetype": "bdist_wheel",
            "python_version": "cp39",
            "requires_python": null,
            "size": 27015168,
            "upload_time": "2024-12-17T12:02:15",
            "upload_time_iso_8601": "2024-12-17T12:02:15.121385Z",
            "url": "https://files.pythonhosted.org/packages/af/14/6c707c30eb82b046e832aae1b99d109e8f8cca854cbcd9cbaea995c6ac25/python_ucto-0.6.9-cp39-cp39-musllinux_1_1_x86_64.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "1faf4389468a5d4a0492469f088f9bc559898994cbe1423f8f6f9d60bf683d5c",
                "md5": "1c384d35c799b5faa09977dcd0c3c066",
                "sha256": "11fa5f8211842d7e06d1df978904c8263abb8d14f63b285d0020acfc2aa073ae"
            },
            "downloads": -1,
            "filename": "python_ucto-0.6.9.tar.gz",
            "has_sig": false,
            "md5_digest": "1c384d35c799b5faa09977dcd0c3c066",
            "packagetype": "sdist",
            "python_version": "source",
            "requires_python": null,
            "size": 110317,
            "upload_time": "2024-12-17T11:56:39",
            "upload_time_iso_8601": "2024-12-17T11:56:39.822447Z",
            "url": "https://files.pythonhosted.org/packages/1f/af/4389468a5d4a0492469f088f9bc559898994cbe1423f8f6f9d60bf683d5c/python_ucto-0.6.9.tar.gz",
            "yanked": false,
            "yanked_reason": null
        }
    ],
    "upload_time": "2024-12-17 11:56:39",
    "github": true,
    "gitlab": false,
    "bitbucket": false,
    "codeberg": false,
    "github_user": "proycon",
    "github_project": "python-ucto",
    "travis_ci": false,
    "coveralls": false,
    "github_actions": true,
    "requirements": [
        {
            "name": "Cython",
            "specs": []
        }
    ],
    "lcname": "python-ucto"
}
        
Elapsed time: 0.78076s