shtec-rlhf

Name	shtec-rlhf JSON
Version	1.0.5 JSON
	download
home_page	None
Summary	shtec-rlhf: Safe Reinforcement Learning from Human Feedback
upload_time	2024-06-24 05:55:07
maintainer	None
docs_url	None
author	PKU-Alignment Team
requires_python	>=3.8
license	Apache License, Version 2.0
keywords	reinforcement learning, safe reinforcement learning, reinforcement learning from human feedback, safe reinforcement learning from human feedback, large language model, language model, rlhf, safe rlhf, llm
VCS
bugtrack_url
requirements	No requirements were recorded.
Travis-CI	No Travis.
coveralls test coverage	No coveralls.

            <h1 align="center">Some parts of the code are forked from the Safe-RLHF project by PKU-Alignment</h1>

Raw data

            {
    "_id": null,
    "home_page": null,
    "name": "shtec-rlhf",
    "maintainer": null,
    "docs_url": null,
    "requires_python": ">=3.8",
    "maintainer_email": null,
    "keywords": "Reinforcement Learning, Safe Reinforcement Learning, Reinforcement Learning from Human Feedback, Safe Reinforcement Learning from Human Feedback, Large Language Model, Language Model, RLHF, Safe RLHF, LLM",
    "author": "PKU-Alignment Team",
    "author_email": null,
    "download_url": "https://files.pythonhosted.org/packages/fe/5e/1c6a5d1254fe36eb10d266f37eb840e47fdab985fedc3b871cd249fb551a/shtec-rlhf-1.0.5.tar.gz",
    "platform": null,
    "description": "<h1 align=\"center\">Some part of the code is fork from the Safe-RLHF project by PKU Alignment</h1>\n",
    "bugtrack_url": null,
    "license": "Apache License, Version 2.0",
    "summary": "shtec-rlhf: Safe Reinforcement Learning from Human Feedback",
    "version": "1.0.5",
    "project_urls": {
        "Bug Report": "https://github.com/PKU-Alignment/shtec-rlhf",
        "Documentation": "https://shtec-rlhf.readthedocs.io",
        "Homepage": "https://github.com/PKU-Alignment/shtec-rlhf",
        "Repository": "https://github.com/PKU-Alignment/shtec-rlhf"
    },
    "split_keywords": [
        "reinforcement learning",
        " safe reinforcement learning",
        " reinforcement learning from human feedback",
        " safe reinforcement learning from human feedback",
        " large language model",
        " language model",
        " rlhf",
        " safe rlhf",
        " llm"
    ],
    "urls": [
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "07a1d2019172152e594a869e4ff673c7eb652e56012c8b344e8c54ec6bcf6d37",
                "md5": "6f8043a3f8a2fa8eb796e9a4b6dddea4",
                "sha256": "2c211da6704b7d4f922b943f6ddcc8ae8739e59fecf7d861c3b4c5b825989eaf"
            },
            "downloads": -1,
            "filename": "shtec_rlhf-1.0.5-py3-none-any.whl",
            "has_sig": false,
            "md5_digest": "6f8043a3f8a2fa8eb796e9a4b6dddea4",
            "packagetype": "bdist_wheel",
            "python_version": "py3",
            "requires_python": ">=3.8",
            "size": 301429,
            "upload_time": "2024-06-24T05:55:05",
            "upload_time_iso_8601": "2024-06-24T05:55:05.527087Z",
            "url": "https://files.pythonhosted.org/packages/07/a1/d2019172152e594a869e4ff673c7eb652e56012c8b344e8c54ec6bcf6d37/shtec_rlhf-1.0.5-py3-none-any.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": "",
            "digests": {
                "blake2b_256": "fe5e1c6a5d1254fe36eb10d266f37eb840e47fdab985fedc3b871cd249fb551a",
                "md5": "eef5a35730a5bc7ccff0da40c819edd9",
                "sha256": "56e9504ab77b25322431decba6edd0d258a6ce788fd50db2bd67c7add3c6f37f"
            },
            "downloads": -1,
            "filename": "shtec-rlhf-1.0.5.tar.gz",
            "has_sig": false,
            "md5_digest": "eef5a35730a5bc7ccff0da40c819edd9",
            "packagetype": "sdist",
            "python_version": "source",
            "requires_python": ">=3.8",
            "size": 76951,
            "upload_time": "2024-06-24T05:55:07",
            "upload_time_iso_8601": "2024-06-24T05:55:07.324345Z",
            "url": "https://files.pythonhosted.org/packages/fe/5e/1c6a5d1254fe36eb10d266f37eb840e47fdab985fedc3b871cd249fb551a/shtec-rlhf-1.0.5.tar.gz",
            "yanked": false,
            "yanked_reason": null
        }
    ],
    "upload_time": "2024-06-24 05:55:07",
    "github": true,
    "gitlab": false,
    "bitbucket": false,
    "codeberg": false,
    "github_user": "PKU-Alignment",
    "github_project": "shtec-rlhf",
    "github_not_found": true,
    "lcname": "shtec-rlhf"
}

PKU-Alignment Team