Name | smoothquant JSON |
Version |
0.0.1.dev0
JSON |
| download |
home_page | |
Summary | SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models |
upload_time | 2023-03-19 01:18:24 |
maintainer | |
docs_url | None |
author | Shadow Walker |
requires_python | |
license | |
keywords |
smoothquant
|
VCS |
|
bugtrack_url |
|
requirements |
No requirements were recorded.
|
Travis-CI |
No Travis.
|
coveralls test coverage |
No coveralls.
|
# SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models
> SmoothQuant enables an INT8 quantization of both weights and activations for all the matrix multiplications in LLMs, including OPT-175B, BLOOM-176B, GLM-130B, and MT-NLG 530B.
Raw data
{
"_id": null,
"home_page": "",
"name": "smoothquant",
"maintainer": "",
"docs_url": null,
"requires_python": "",
"maintainer_email": "",
"keywords": "smoothquant",
"author": "Shadow Walker",
"author_email": "",
"download_url": "",
"platform": null,
"description": "# SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models\n\n> SmoothQuant enables an INT8 quantization of both weights and activations for all the matrix multiplications in LLMs, including OPT-175B, BLOOM-176B, GLM-130B, and MT-NLG 530B.\n\n\n\n\n\n",
"bugtrack_url": null,
"license": "",
"summary": "SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models",
"version": "0.0.1.dev0",
"split_keywords": [
"smoothquant"
],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "baff1e9097dc819baf2ba154ce23f62e20f0cff2932af05a6e2f52eef4e423b2",
"md5": "6d1444de90256aadc7b0bf0c5c04b81c",
"sha256": "2281ba9f4f6c3463f2258b8de1b8fa8a1e73e008d764f73f24d415cc688cf865"
},
"downloads": -1,
"filename": "smoothquant-0.0.1.dev0-py3-none-any.whl",
"has_sig": false,
"md5_digest": "6d1444de90256aadc7b0bf0c5c04b81c",
"packagetype": "bdist_wheel",
"python_version": "py3",
"requires_python": null,
"size": 1519,
"upload_time": "2023-03-19T01:18:24",
"upload_time_iso_8601": "2023-03-19T01:18:24.833512Z",
"url": "https://files.pythonhosted.org/packages/ba/ff/1e9097dc819baf2ba154ce23f62e20f0cff2932af05a6e2f52eef4e423b2/smoothquant-0.0.1.dev0-py3-none-any.whl",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2023-03-19 01:18:24",
"github": false,
"gitlab": false,
"bitbucket": false,
"lcname": "smoothquant"
}