Raw data
{
"_id": null,
"home_page": "https://github.com/amir-zeldes/RFTokenizer",
"name": "rftokenizer",
"maintainer": "",
"docs_url": null,
"requires_python": "",
"maintainer_email": "",
"keywords": "NLP,tokenization,segmentation,morphology,morphological,Hebrew,Arabic,Coptic,word,splitting",
"author": "Amir Zeldes",
"author_email": "amir.zeldes@georgetown.edu",
"download_url": "https://files.pythonhosted.org/packages/cd/5f/5fefdd26db3bf85af6c9dd7a7fb0aab032e35e4bbe32413604a6d41d1886/rftokenizer-2.2.0.tar.gz",
"platform": null,
"description": "",
"bugtrack_url": null,
"license": "Apache License, Version 2.0",
"summary": "A character-wise tokenizer for morphologically rich languages",
"version": "2.2.0",
"project_urls": {
"Download": "https://github.com/amir-zeldes/RFTokenizer/releases/tag/v2.2.0",
"Homepage": "https://github.com/amir-zeldes/RFTokenizer"
},
"split_keywords": [
"nlp",
"tokenization",
"segmentation",
"morphology",
"morphological",
"hebrew",
"arabic",
"coptic",
"word",
"splitting"
],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "cd5f5fefdd26db3bf85af6c9dd7a7fb0aab032e35e4bbe32413604a6d41d1886",
"md5": "a9dcdc7803ca050fd18a67793ae0c329",
"sha256": "dd99f68889e147bdba260caf7f244e83bb1c82ff6bdde347a73edc0e0089a09a"
},
"downloads": -1,
"filename": "rftokenizer-2.2.0.tar.gz",
"has_sig": false,
"md5_digest": "a9dcdc7803ca050fd18a67793ae0c329",
"packagetype": "sdist",
"python_version": "source",
"requires_python": null,
"size": 68452282,
"upload_time": "2024-02-01T21:30:54",
"upload_time_iso_8601": "2024-02-01T21:30:54.123477Z",
"url": "https://files.pythonhosted.org/packages/cd/5f/5fefdd26db3bf85af6c9dd7a7fb0aab032e35e4bbe32413604a6d41d1886/rftokenizer-2.2.0.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2024-02-01 21:30:54",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "amir-zeldes",
"github_project": "RFTokenizer",
"travis_ci": false,
"coveralls": false,
"github_actions": false,
"requirements": [
{
"name": "scikit-learn",
"specs": [
[
"==",
"1.3.2"
]
]
},
{
"name": "joblib",
"specs": [
[
"==",
"1.3.2"
]
]
},
{
"name": "numpy",
"specs": []
},
{
"name": "pandas",
"specs": [
[
"==",
"2.1.2"
]
]
},
{
"name": "xgboost",
"specs": [
[
"==",
"2.0.3"
]
]
},
{
"name": "hyperopt",
"specs": []
},
{
"name": "flair",
"specs": [
[
"==",
"0.13.0"
]
]
}
],
"lcname": "rftokenizer"
}