TensorRT-LLM: A TensorRT Toolbox for Large Language Models
Raw data
{
"_id": null,
"home_page": "https://github.com/NVIDIA/TensorRT-LLM",
"name": "tensorrt-llm",
"maintainer": null,
"docs_url": null,
"requires_python": "<4,>=3.7",
"maintainer_email": null,
"keywords": "nvidia tensorrt deeplearning inference",
"author": "NVIDIA Corporation",
"author_email": null,
"download_url": "https://files.pythonhosted.org/packages/57/f2/d7432180af42bc4e10da2c6c5dfcf08bcbe800f2717ac36222fe4d111f5b/tensorrt_llm-0.20.0.tar.gz",
"platform": null,
"description": "TensorRT-LLM: A TensorRT Toolbox for Large Language Models\n",
"bugtrack_url": null,
"license": "Apache License 2.0",
"summary": "TensorRT-LLM: A TensorRT Toolbox for Large Language Models",
"version": "0.20.0",
"project_urls": {
"Download": "https://github.com/NVIDIA/TensorRT-LLM/tags",
"Homepage": "https://github.com/NVIDIA/TensorRT-LLM"
},
"split_keywords": [
"nvidia",
"tensorrt",
"deeplearning",
"inference"
],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "57f2d7432180af42bc4e10da2c6c5dfcf08bcbe800f2717ac36222fe4d111f5b",
"md5": "0651897c98e9d5c653cbe831dfd65683",
"sha256": "3fc586a851c016c49186a6ab71b96c544dca52d15819b4f5da9bc8e8f32688e2"
},
"downloads": -1,
"filename": "tensorrt_llm-0.20.0.tar.gz",
"has_sig": false,
"md5_digest": "0651897c98e9d5c653cbe831dfd65683",
"packagetype": "sdist",
"python_version": "source",
"requires_python": "<4,>=3.7",
"size": 1553,
"upload_time": "2025-06-19T02:38:47",
"upload_time_iso_8601": "2025-06-19T02:38:47.386822Z",
"url": "https://files.pythonhosted.org/packages/57/f2/d7432180af42bc4e10da2c6c5dfcf08bcbe800f2717ac36222fe4d111f5b/tensorrt_llm-0.20.0.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2025-06-19 02:38:47",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "NVIDIA",
"github_project": "TensorRT-LLM",
"travis_ci": false,
"coveralls": false,
"github_actions": true,
"requirements": [
{
"name": "accelerate",
"specs": [
[
">=",
"0.25.0"
]
]
},
{
"name": "build",
"specs": []
},
{
"name": "colored",
"specs": []
},
{
"name": "cuda-python",
"specs": []
},
{
"name": "diffusers",
"specs": [
[
">=",
"0.27.0"
]
]
},
{
"name": "lark",
"specs": []
},
{
"name": "mpi4py",
"specs": []
},
{
"name": "numpy",
"specs": [
[
"<",
"2"
]
]
},
{
"name": "onnx",
"specs": [
[
">=",
"1.12.0"
]
]
},
{
"name": "onnx_graphsurgeon",
"specs": [
[
">=",
"0.5.2"
]
]
},
{
"name": "openai",
"specs": []
},
{
"name": "polygraphy",
"specs": []
},
{
"name": "psutil",
"specs": []
},
{
"name": "nvidia-ml-py",
"specs": [
[
"<",
"13"
],
[
">=",
"12"
]
]
},
{
"name": "pynvml",
"specs": [
[
"==",
"12.0.0"
]
]
},
{
"name": "pulp",
"specs": []
},
{
"name": "pandas",
"specs": []
},
{
"name": "h5py",
"specs": [
[
"==",
"3.12.1"
]
]
},
{
"name": "StrEnum",
"specs": []
},
{
"name": "sentencepiece",
"specs": [
[
">=",
"0.1.99"
]
]
},
{
"name": "tensorrt",
"specs": [
[
"~=",
"10.11.0"
]
]
},
{
"name": "torch",
"specs": [
[
"<=",
"2.8.0a0"
],
[
">=",
"2.7.1"
]
]
},
{
"name": "torchvision",
"specs": []
},
{
"name": "nvidia-modelopt",
"specs": [
[
"~=",
"0.33.0"
]
]
},
{
"name": "nvidia-nccl-cu12",
"specs": []
},
{
"name": "nvidia-cuda-nvrtc-cu12",
"specs": []
},
{
"name": "transformers",
"specs": [
[
"==",
"4.53.1"
]
]
},
{
"name": "pydantic",
"specs": [
[
">=",
"2.9.1"
]
]
},
{
"name": "pydantic-settings",
"specs": []
},
{
"name": "pillow",
"specs": [
[
"==",
"10.3.0"
]
]
},
{
"name": "wheel",
"specs": [
[
"<=",
"0.45.1"
]
]
},
{
"name": "optimum",
"specs": []
},
{
"name": "datasets",
"specs": [
[
"==",
"3.1.0"
]
]
},
{
"name": "evaluate",
"specs": []
},
{
"name": "mpmath",
"specs": [
[
">=",
"1.3.0"
]
]
},
{
"name": "click",
"specs": []
},
{
"name": "click_option_group",
"specs": []
},
{
"name": "aenum",
"specs": []
},
{
"name": "pyzmq",
"specs": []
},
{
"name": "fastapi",
"specs": [
[
"==",
"0.115.4"
]
]
},
{
"name": "uvicorn",
"specs": []
},
{
"name": "setuptools",
"specs": [
[
"<",
"80"
]
]
},
{
"name": "ordered-set",
"specs": []
},
{
"name": "peft",
"specs": []
},
{
"name": "einops",
"specs": []
},
{
"name": "flashinfer-python",
"specs": [
[
"==",
"0.2.5"
]
]
},
{
"name": "opencv-python-headless",
"specs": []
},
{
"name": "xgrammar",
"specs": [
[
"==",
"0.1.19"
]
]
},
{
"name": "backoff",
"specs": []
},
{
"name": "nvtx",
"specs": []
},
{
"name": "matplotlib",
"specs": []
},
{
"name": "meson",
"specs": []
},
{
"name": "ninja",
"specs": []
},
{
"name": "etcd3",
"specs": []
},
{
"name": "blake3",
"specs": []
},
{
"name": "llguidance",
"specs": [
[
"==",
"0.7.29"
]
]
},
{
"name": "soundfile",
"specs": []
}
],
"lcname": "tensorrt-llm"
}