| Name | smoothquant JSON | 
            
| Version | 
                  0.0.1.dev0
                   
                  JSON | 
            
 | download  | 
            
| home_page |   | 
            
| Summary | SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models | 
            | upload_time | 2023-03-19 01:18:24 | 
            | maintainer |  | 
            
            | docs_url | None | 
            | author | Shadow Walker | 
            
            | requires_python |  | 
            
            
            | license |  | 
            | keywords | 
                
                    smoothquant
                 | 
            | VCS | 
                
                    | 
                
            
            | bugtrack_url | 
                
                 | 
             
            
            | requirements | 
                
                  No requirements were recorded.
                
             | 
            
| Travis-CI | 
                
                   No Travis.
                
             | 
            | coveralls test coverage | 
                
                   No coveralls.
                
             | 
        
        
            
            # SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models
> SmoothQuant enables an INT8 quantization of both weights and activations for all the matrix multiplications in LLMs, including OPT-175B, BLOOM-176B, GLM-130B, and MT-NLG 530B.
            
         
        Raw data
        
            {
    "_id": null,
    "home_page": "",
    "name": "smoothquant",
    "maintainer": "",
    "docs_url": null,
    "requires_python": "",
    "maintainer_email": "",
    "keywords": "smoothquant",
    "author": "Shadow Walker",
    "author_email": "",
    "download_url": "",
    "platform": null,
    "description": "# SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models\n\n> SmoothQuant enables an INT8 quantization of both weights and activations for all the matrix multiplications in LLMs, including OPT-175B, BLOOM-176B, GLM-130B, and MT-NLG 530B.\n\n\n\n\n\n",
    "bugtrack_url": null,
    "license": "",
    "summary": "SmoothQuant: Accurate and Efficient Post-Training Quantization for Large Language Models",
    "version": "0.0.1.dev0",
    "split_keywords": [
        "smoothquant"
    ],
    "urls": [
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "baff1e9097dc819baf2ba154ce23f62e20f0cff2932af05a6e2f52eef4e423b2",
                "md5": "6d1444de90256aadc7b0bf0c5c04b81c",
                "sha256": "2281ba9f4f6c3463f2258b8de1b8fa8a1e73e008d764f73f24d415cc688cf865"
            },
            "downloads": -1,
            "filename": "smoothquant-0.0.1.dev0-py3-none-any.whl",
            "has_sig": false,
            "md5_digest": "6d1444de90256aadc7b0bf0c5c04b81c",
            "packagetype": "bdist_wheel",
            "python_version": "py3",
            "requires_python": null,
            "size": 1519,
            "upload_time": "2023-03-19T01:18:24",
            "upload_time_iso_8601": "2023-03-19T01:18:24.833512Z",
            "url": "https://files.pythonhosted.org/packages/ba/ff/1e9097dc819baf2ba154ce23f62e20f0cff2932af05a6e2f52eef4e423b2/smoothquant-0.0.1.dev0-py3-none-any.whl",
            "yanked": false,
            "yanked_reason": null
        }
    ],
    "upload_time": "2023-03-19 01:18:24",
    "github": false,
    "gitlab": false,
    "bitbucket": false,
    "lcname": "smoothquant"
}