{"id":123951,"url":"https://github.com/PKU-Alignment/safe-rlhf","last_synced_at":"2026-06-02T07:30:44.413Z","repository":{"id":165616429,"uuid":"640914148","full_name":"PKU-Alignment/safe-rlhf","owner":"PKU-Alignment","description":"Safe RLHF: Constrained Value Alignment via Safe Reinforcement Learning from Human Feedback","archived":false,"fork":false,"pushed_at":"2025-11-24T04:07:51.000Z","size":4105,"stargazers_count":1593,"open_issues_count":18,"forks_count":132,"subscribers_count":15,"default_branch":"main","last_synced_at":"2026-03-30T00:40:21.465Z","etag":null,"topics":["ai-safety","alpaca","beaver","datasets","deepspeed","gpt","large-language-models","llama","llm","llms","reinforcement-learning","reinforcement-learning-from-human-feedback","rlhf","safe-reinforcement-learning","safe-reinforcement-learning-from-human-feedback","safe-rlhf","safety","transformer","transformers","vicuna"],"latest_commit_sha":null,"homepage":"https://pku-beaver.github.io","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/PKU-Alignment.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":"CODE_OF_CONDUCT.md","threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null,"notice":null,"maintainers":null,"copyright":null,"agents":null,"dco":null,"cla":null}},"created_at":"2023-05-15T11:47:08.000Z","updated_at":"2026-03-27T06:00:29.000Z","dependencies_parsed_at":"2023-10-10T17:14:48.010Z","dependency_job_id":"cacf5197-a7a4-4374-8fb8-a3ac2e7ef687","html_url":"https://github.com/PKU-Alignment/safe-rlhf","commit_stats":{"total_commits":111,"total_committers":4,"mean_commits":27.75,"dds":0.2072072072072072,"last_synced_commit":"e8cca16665ef2340ac92c6514f05519310251581"},"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/PKU-Alignment/safe-rlhf","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/PKU-Alignment","download_url":"https://codeload.github.com/PKU-Alignment/safe-rlhf/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":286080680,"owners_count":31260121,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2026-04-01T00:21:46.390Z","status":"ssl_error","status_checked_at":"2026-04-01T00:09:28.497Z","response_time":111,"last_error":"SSL_read: unexpected eof while reading","robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":false,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"PKU-Alignment","name":"PKU-Alignment","uuid":"129283536","kind":"organization","description":"Loves Sharing and Open-Source, Making AI Safer.","email":"yaodong.yang@outlook.com","website":null,"location":"China","twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/129283536?v=4","repositories_count":3,"last_synced_at":"2023-05-15T17:22:58.200Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/PKU-Alignment","funding_links":[],"total_stars":null,"followers":null,"following":null,"created_at":"2023-04-15T20:21:21.546Z","updated_at":"2023-05-15T17:22:58.218Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/PKU-Alignment","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/PKU-Alignment/repositories"},"packages":[],"commits":{"id":1639489,"full_name":"PKU-Alignment/safe-rlhf","default_branch":"main","total_commits":111,"total_committers":4,"total_bot_commits":0,"total_bot_committers":0,"mean_commits":27.75,"dds":0.2072072072072072,"past_year_total_commits":0,"past_year_total_committers":0,"past_year_total_bot_commits":0,"past_year_total_bot_committers":0,"past_year_mean_commits":0.0,"past_year_dds":0.0,"last_synced_at":"2026-04-01T01:02:01.667Z","last_synced_commit":"e8cca16665ef2340ac92c6514f05519310251581","created_at":"2024-07-25T15:27:01.340Z","updated_at":"2026-04-01T01:02:01.601Z","committers":[{"name":"Xuehai Pan","email":"XuehaiPan@pku.edu.cn","login":"XuehaiPan","count":88},{"name":"Ruiyang Sun","email":"rockmagma02@gmail.com","login":"rockmagma02","count":13},{"name":"Calico","email":"93032279+calico-1226","login":"calico-1226","count":9},{"name":"Jiaming Ji","email":"73586554+zmsn-2077","login":"zmsn-2077","count":1}],"past_year_committers":[],"commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2026-04-05T00:00:09.419Z","repositories_count":6211086,"commits_count":926601344,"contributors_count":35760976,"owners_count":1145205,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues":{"table":{"full_name":"PKU-Alignment/safe-rlhf","html_url":"https://github.com/PKU-Alignment/safe-rlhf","last_synced_at":"2025-12-26T02:04:27.111Z","status":"active","issues_count":63,"pull_requests_count":59,"avg_time_to_close_issue":2010364.8541666667,"avg_time_to_close_pull_request":176701.74545454545,"issues_closed_count":48,"pull_requests_closed_count":55,"pull_request_authors_count":6,"issue_authors_count":46,"avg_comments_per_issue":3.3015873015873014,"avg_comments_per_pull_request":0.0847457627118644,"merged_pull_requests_count":54,"bot_issues_count":0,"bot_pull_requests_count":3,"past_year_issues_count":2,"past_year_pull_requests_count":4,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":1216.0,"past_year_issues_closed_count":0,"past_year_pull_requests_closed_count":1,"past_year_pull_request_authors_count":2,"past_year_issue_authors_count":2,"past_year_avg_comments_per_issue":1.0,"past_year_avg_comments_per_pull_request":0.25,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":3,"past_year_merged_pull_requests_count":0,"created_at":"2024-07-25T15:27:32.986Z","updated_at":"2025-12-26T02:04:27.111Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/PKU-Alignment%2Fsafe-rlhf/issues","issue_labels_count":{"table":{"question":45,"bug":11,"enhancement":9,"need information":9,"invalid":4,"cuda":3,"new feature":3,"dependency":3,"upstream":3,"installation":3,"evaluation":3,"in progress":2}},"pull_request_labels_count":{"table":{"enhancement":35,"bug":15,"new feature":15,"documentation":6,"evaluation":4,"github_actions":3,"dependency":3,"dependencies":3,"installation":2,"upstream":2,"cuda":1}},"issue_author_associations_count":{"table":{"NONE":60,"MEMBER":2,"CONTRIBUTOR":1}},"pull_request_author_associations_count":{"table":{"MEMBER":45,"CONTRIBUTOR":10,"NONE":4}},"issue_authors":{"table":{"zhaobinNF":6,"liumingzhu6060":4,"jc-ryan":3,"Harry-mic":3,"Ruibn":2,"iamsile":2,"pxyWaterMoon":2,"feiliya333":2,"nonstopfor":2,"Mandy0016":1,"AAAhWei":1,"DwarfWarriors":1,"skepsun":1,"dizzyvn":1,"calico-1226":1,"renqibing":1,"xyjsjruiliu":1,"SpongebBob":1,"cemiu":1,"Tinker250":1,"AlexXx-Wu":1,"XuehaiPan":1,"shuoyinn":1,"SliencerX":1,"Benjamin-eecs":1,"LiuShixing":1,"lierer007":1,"70557dzqc":1,"gao-xiao-bai":1,"Yanfei-Qin":1,"cyzhh":1,"RajatDandekar":1,"rockmagma02":1,"EthenZhang":1,"diehualong":1,"sh-qiangchen":1,"HaixHan":1,"HaoshengZou":1,"leezy18":1,"wqw547243068":1,"peter-xbs":1,"haorannlp":1,"xinqiaozhang":1,"icemoon-creative":1,"yifan123":1,"NNStrings":1}},"pull_request_authors":{"table":{"XuehaiPan":37,"rockmagma02":10,"calico-1226":7,"dependabot[bot]":3,"ColdSilence989":1,"zmsn-2077":1}},"host":{"table":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2026-04-05T00:00:08.668Z","repositories_count":14079050,"issues_count":34456365,"pull_requests_count":112426587,"authors_count":11225778,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"}},"past_year_issue_labels_count":{"table":{"bug":1}},"past_year_pull_request_labels_count":{"table":{"dependencies":3,"github_actions":3}},"past_year_issue_author_associations_count":{"table":{"NONE":1}},"past_year_pull_request_author_associations_count":{"table":{"NONE":4}},"past_year_issue_authors":{"table":{"RajatDandekar":1}},"past_year_pull_request_authors":{"table":{"dependabot[bot]":3,"ColdSilence989":1}},"maintainers":[{"table":{"login":"XuehaiPan","count":38,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/XuehaiPan"}},{"table":{"login":"calico-1226","count":8,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/calico-1226"}},{"table":{"login":"zmsn-2077","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/zmsn-2077"}}],"active_maintainers":[]}},"events":{"total":{"PullRequestEvent":6,"ForkEvent":13,"DiscussionEvent":1,"IssuesEvent":6,"WatchEvent":215,"IssueCommentEvent":8,"CreateEvent":2},"last_year":{"PullRequestEvent":6,"ForkEvent":10,"DiscussionEvent":1,"IssuesEvent":1,"WatchEvent":83,"CreateEvent":2}},"keywords":["ai-safety","alpaca","beaver","datasets","deepspeed","gpt","large-language-models","llama","llm","llms","reinforcement-learning","reinforcement-learning-from-human-feedback","rlhf","safe-reinforcement-learning","safe-reinforcement-learning-from-human-feedback","safe-rlhf","safety","transformer","transformers","vicuna"],"dependencies":[{"ecosystem":"actions","filepath":".github/workflows/lint.yml","sha":null,"kind":"manifest","created_at":"2023-07-10T07:01:56.790Z","updated_at":"2023-07-10T07:01:56.790Z","repository_link":"https://github.com/PKU-Alignment/safe-rlhf/blob/main/.github/workflows/lint.yml","dependencies":[{"id":11283843616,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":11283843618,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v4","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"docker","filepath":"Dockerfile","sha":null,"kind":"manifest","created_at":"2023-07-10T07:01:56.857Z","updated_at":"2023-07-10T07:01:56.857Z","repository_link":"https://github.com/PKU-Alignment/safe-rlhf/blob/main/Dockerfile","dependencies":[{"id":11283844503,"package_name":"nvidia/cuda","ecosystem":"docker","requirements":"\"${cuda_docker_tag}\"","direct":true,"kind":"build","optional":false}]},{"ecosystem":"pypi","filepath":"pyproject.toml","sha":null,"kind":"manifest","created_at":"2023-07-10T07:01:57.399Z","updated_at":"2023-07-10T07:01:57.399Z","repository_link":"https://github.com/PKU-Alignment/safe-rlhf/blob/main/pyproject.toml","dependencies":[{"id":11283849548,"package_name":"torch","ecosystem":"pypi","requirements":"\u003e= 1.13","direct":true,"kind":"runtime","optional":false},{"id":11283849557,"package_name":"transformers","ecosystem":"pypi","requirements":"\u003e= 4.28","direct":true,"kind":"runtime","optional":false},{"id":11283849561,"package_name":"datasets","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283849565,"package_name":"tokenizers","ecosystem":"pypi","requirements":"\u003e= 0.13.3","direct":true,"kind":"runtime","optional":false},{"id":11283849567,"package_name":"accelerate","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283849570,"package_name":"deepspeed","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850208,"package_name":"numpy","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850209,"package_name":"scipy","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850210,"package_name":"sentencepiece","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850211,"package_name":"wandb","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850212,"package_name":"tensorboard","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850213,"package_name":"optree","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850254,"package_name":"matplotlib","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850255,"package_name":"tqdm","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850256,"package_name":"rich","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"requirements.txt","sha":null,"kind":"manifest","created_at":"2023-07-10T07:01:57.920Z","updated_at":"2023-07-10T07:01:57.920Z","repository_link":"https://github.com/PKU-Alignment/safe-rlhf/blob/main/requirements.txt","dependencies":[{"id":11283850287,"package_name":"torch","ecosystem":"pypi","requirements":"\u003e=1.13","direct":true,"kind":"runtime","optional":false},{"id":11283850288,"package_name":"transformers","ecosystem":"pypi","requirements":"\u003e=4.28","direct":true,"kind":"runtime","optional":false},{"id":11283850289,"package_name":"datasets","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850290,"package_name":"tokenizers","ecosystem":"pypi","requirements":"\u003e=0.13.3","direct":true,"kind":"runtime","optional":false},{"id":11283850291,"package_name":"accelerate","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850292,"package_name":"deepspeed","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850293,"package_name":"numpy","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850294,"package_name":"scipy","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850295,"package_name":"sentencepiece","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850296,"package_name":"wandb","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850297,"package_name":"tensorboard","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850298,"package_name":"optree","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850299,"package_name":"matplotlib","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850300,"package_name":"tqdm","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11283850301,"package_name":"rich","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"setup.py","sha":null,"kind":"manifest","created_at":"2023-10-10T17:14:47.995Z","updated_at":"2023-10-10T17:14:47.995Z","repository_link":"https://github.com/PKU-Alignment/safe-rlhf/blob/main/setup.py","dependencies":[]}],"score":8.770904744296864,"created_at":"2024-07-25T15:26:06.420Z","updated_at":"2026-06-02T07:30:44.413Z","avatar_url":"https://github.com/PKU-Alignment.png","language":"Python","codemeta":null,"publiccode":null,"project_url":"https://summary.ecosyste.ms/api/v1/projects/123951","html_url":"https://summary.ecosyste.ms/projects/123951"}