TensorRT-LLM: A TensorRT Toolbox for Large Language Models
Raw data
{
"_id": null,
"home_page": "https://github.com/NVIDIA/TensorRT-LLM",
"name": "tensorrt-llm",
"maintainer": null,
"docs_url": null,
"requires_python": "<4,>=3.7",
"maintainer_email": null,
"keywords": "nvidia tensorrt deeplearning inference",
"author": "NVIDIA Corporation",
"author_email": null,
"download_url": "https://files.pythonhosted.org/packages/24/fb/540259e1fae2273d673236cf27fdd13f5e9707c3d5560d351aa719db47c3/tensorrt_llm-0.15.0.tar.gz",
"platform": null,
"description": "TensorRT-LLM: A TensorRT Toolbox for Large Language Models\n",
"bugtrack_url": null,
"license": "Apache License 2.0",
"summary": "TensorRT-LLM: A TensorRT Toolbox for Large Language Models",
"version": "0.15.0",
"project_urls": {
"Download": "https://github.com/NVIDIA/TensorRT-LLM/tags",
"Homepage": "https://github.com/NVIDIA/TensorRT-LLM"
},
"split_keywords": [
"nvidia",
"tensorrt",
"deeplearning",
"inference"
],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "24fb540259e1fae2273d673236cf27fdd13f5e9707c3d5560d351aa719db47c3",
"md5": "0878ba76d7e9dae292a5531aac20903f",
"sha256": "50a54f85fad484bbd6644786c22754ccd1fd2b80a5a9482f3670d5f008d6b5b1"
},
"downloads": -1,
"filename": "tensorrt_llm-0.15.0.tar.gz",
"has_sig": false,
"md5_digest": "0878ba76d7e9dae292a5531aac20903f",
"packagetype": "sdist",
"python_version": "source",
"requires_python": "<4,>=3.7",
"size": 1321,
"upload_time": "2024-12-04T06:38:32",
"upload_time_iso_8601": "2024-12-04T06:38:32.360000Z",
"url": "https://files.pythonhosted.org/packages/24/fb/540259e1fae2273d673236cf27fdd13f5e9707c3d5560d351aa719db47c3/tensorrt_llm-0.15.0.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2024-12-04 06:38:32",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "NVIDIA",
"github_project": "TensorRT-LLM",
"travis_ci": false,
"coveralls": false,
"github_actions": true,
"requirements": [
{
"name": "accelerate",
"specs": [
[
">=",
"0.25.0"
]
]
},
{
"name": "build",
"specs": []
},
{
"name": "colored",
"specs": []
},
{
"name": "cuda-python",
"specs": []
},
{
"name": "diffusers",
"specs": [
[
">=",
"0.27.0"
]
]
},
{
"name": "lark",
"specs": []
},
{
"name": "mpi4py",
"specs": []
},
{
"name": "numpy",
"specs": [
[
"<",
"2"
]
]
},
{
"name": "onnx",
"specs": [
[
">=",
"1.12.0"
]
]
},
{
"name": "onnx_graphsurgeon",
"specs": [
[
">=",
"0.5.2"
]
]
},
{
"name": "openai",
"specs": [
[
"==",
"1.54.3"
]
]
},
{
"name": "polygraphy",
"specs": []
},
{
"name": "psutil",
"specs": []
},
{
"name": "pynvml",
"specs": [
[
">=",
"11.5.0"
]
]
},
{
"name": "pulp",
"specs": []
},
{
"name": "pandas",
"specs": []
},
{
"name": "h5py",
"specs": [
[
"==",
"3.12.1"
]
]
},
{
"name": "StrEnum",
"specs": []
},
{
"name": "sentencepiece",
"specs": [
[
">=",
"0.1.99"
]
]
},
{
"name": "tensorrt",
"specs": [
[
"~=",
"10.7.0"
]
]
},
{
"name": "torch",
"specs": [
[
">=",
"2.5.1"
],
[
"<=",
"2.6.0a0"
]
]
},
{
"name": "torchvision",
"specs": []
},
{
"name": "nvidia-modelopt",
"specs": [
[
"~=",
"0.19.0"
]
]
},
{
"name": "nvidia-nccl-cu12",
"specs": []
},
{
"name": "transformers",
"specs": [
[
"<=",
"4.45.1"
],
[
">=",
"4.38.2"
]
]
},
{
"name": "pydantic",
"specs": [
[
">=",
"2.9.1"
]
]
},
{
"name": "pillow",
"specs": [
[
"==",
"10.3.0"
]
]
},
{
"name": "wheel",
"specs": []
},
{
"name": "optimum",
"specs": []
},
{
"name": "evaluate",
"specs": []
},
{
"name": "mpmath",
"specs": [
[
">=",
"1.3.0"
]
]
},
{
"name": "click",
"specs": []
},
{
"name": "click_option_group",
"specs": []
},
{
"name": "aenum",
"specs": []
},
{
"name": "pyzmq",
"specs": []
},
{
"name": "fastapi",
"specs": [
[
"==",
"0.115.4"
]
]
},
{
"name": "uvicorn",
"specs": []
},
{
"name": "httpx",
"specs": []
},
{
"name": "setuptools",
"specs": [
[
"==",
"70.3.0"
]
]
},
{
"name": "ordered-set",
"specs": []
}
],
"lcname": "tensorrt-llm"
}