shtec-rlhf


Name: shtec-rlhf JSON
Version: 1.0.5 PyPI version JSON
download
home_page: None
Summary: shtec-rlhf: Safe Reinforcement Learning from Human Feedback
upload_time: 2024-06-24 05:55:07
maintainer: None
docs_url: None
author: PKU-Alignment Team
requires_python: >=3.8
license: Apache License, Version 2.0
keywords: reinforcement learning, safe reinforcement learning, reinforcement learning from human feedback, safe reinforcement learning from human feedback, large language model, language model, rlhf, safe rlhf, llm
VCS
bugtrack_url
requirements No requirements were recorded.
Travis-CI No Travis.
coveralls test coverage No coveralls.
            <h1 align="center">Some part of the code is fork from the Safe-RLHF project by PKU Alignment</h1>

            

Raw data

            {
    "_id": null,
    "home_page": null,
    "name": "shtec-rlhf",
    "maintainer": null,
    "docs_url": null,
    "requires_python": ">=3.8",
    "maintainer_email": null,
    "keywords": "Reinforcement Learning, Safe Reinforcement Learning, Reinforcement Learning from Human Feedback, Safe Reinforcement Learning from Human Feedback, Large Language Model, Language Model, RLHF, Safe RLHF, LLM",
    "author": "PKU-Alignment Team",
    "author_email": null,
    "download_url": "https://files.pythonhosted.org/packages/fe/5e/1c6a5d1254fe36eb10d266f37eb840e47fdab985fedc3b871cd249fb551a/shtec-rlhf-1.0.5.tar.gz",
    "platform": null,
    "description": "<h1 align=\"center\">Some part of the code is fork from the Safe-RLHF project by PKU Alignment</h1>\n",
    "bugtrack_url": null,
    "license": "Apache License, Version 2.0",
    "summary": "shtec-rlhf: Safe Reinforcement Learning from Human Feedback",
    "version": "1.0.5",
    "project_urls": {
        "Bug Report": "https://github.com/PKU-Alignment/shtec-rlhf",
        "Documentation": "https://shtec-rlhf.readthedocs.io",
        "Homepage": "https://github.com/PKU-Alignment/shtec-rlhf",
        "Repository": "https://github.com/PKU-Alignment/shtec-rlhf"
    },
    "split_keywords": [
        "reinforcement learning",
        " safe reinforcement learning",
        " reinforcement learning from human feedback",
        " safe reinforcement learning from human feedback",
        " large language model",
        " language model",
        " rlhf",
        " safe rlhf",
        " llm"
    ],
    "urls": [
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "07a1d2019172152e594a869e4ff673c7eb652e56012c8b344e8c54ec6bcf6d37",
                "md5": "6f8043a3f8a2fa8eb796e9a4b6dddea4",
                "sha256": "2c211da6704b7d4f922b943f6ddcc8ae8739e59fecf7d861c3b4c5b825989eaf"
            },
            "downloads": -1,
            "filename": "shtec_rlhf-1.0.5-py3-none-any.whl",
            "has_sig": false,
            "md5_digest": "6f8043a3f8a2fa8eb796e9a4b6dddea4",
            "packagetype": "bdist_wheel",
            "python_version": "py3",
            "requires_python": ">=3.8",
            "size": 301429,
            "upload_time": "2024-06-24T05:55:05",
            "upload_time_iso_8601": "2024-06-24T05:55:05.527087Z",
            "url": "https://files.pythonhosted.org/packages/07/a1/d2019172152e594a869e4ff673c7eb652e56012c8b344e8c54ec6bcf6d37/shtec_rlhf-1.0.5-py3-none-any.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "fe5e1c6a5d1254fe36eb10d266f37eb840e47fdab985fedc3b871cd249fb551a",
                "md5": "eef5a35730a5bc7ccff0da40c819edd9",
                "sha256": "56e9504ab77b25322431decba6edd0d258a6ce788fd50db2bd67c7add3c6f37f"
            },
            "downloads": -1,
            "filename": "shtec-rlhf-1.0.5.tar.gz",
            "has_sig": false,
            "md5_digest": "eef5a35730a5bc7ccff0da40c819edd9",
            "packagetype": "sdist",
            "python_version": "source",
            "requires_python": ">=3.8",
            "size": 76951,
            "upload_time": "2024-06-24T05:55:07",
            "upload_time_iso_8601": "2024-06-24T05:55:07.324345Z",
            "url": "https://files.pythonhosted.org/packages/fe/5e/1c6a5d1254fe36eb10d266f37eb840e47fdab985fedc3b871cd249fb551a/shtec-rlhf-1.0.5.tar.gz",
            "yanked": false,
            "yanked_reason": null
        }
    ],
    "upload_time": "2024-06-24 05:55:07",
    "github": true,
    "gitlab": false,
    "bitbucket": false,
    "codeberg": false,
    "github_user": "PKU-Alignment",
    "github_project": "shtec-rlhf",
    "github_not_found": true,
    "lcname": "shtec-rlhf"
}
        
Elapsed time: 0.49407s