{"id":124302,"url":"https://github.com/pjlab-sys4nlp/llama-moe","last_synced_at":"2026-06-15T17:00:52.621Z","repository":{"id":214003487,"uuid":"670026629","full_name":"pjlab-sys4nlp/llama-moe","owner":"pjlab-sys4nlp","description":"⛷️ LLaMA-MoE: Building Mixture-of-Experts from LLaMA with Continual Pre-training (EMNLP 2024)","archived":false,"fork":false,"pushed_at":"2024-12-06T04:47:07.000Z","size":1774,"stargazers_count":1003,"open_issues_count":7,"forks_count":61,"subscribers_count":8,"default_branch":"main","last_synced_at":"2026-06-09T14:04:07.622Z","etag":null,"topics":["continual-pre-training","expert-partition","llama","llm","mixture-of-experts","moe"],"latest_commit_sha":null,"homepage":"https://arxiv.org/abs/2406.16554","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/pjlab-sys4nlp.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2023-07-24T06:15:51.000Z","updated_at":"2026-06-04T02:57:43.000Z","dependencies_parsed_at":"2023-12-25T04:19:31.657Z","dependency_job_id":"2090a98c-a999-43ce-8ee4-e8f4b2040d3c","html_url":"https://github.com/pjlab-sys4nlp/llama-moe","commit_stats":{"total_commits":142,"total_committers":5,"mean_commits":28.4,"dds":0.471830985915493,"last_synced_commit":"b17aff436cce58e2fcd7327789c7fadafe15d19e"},"previous_names":["pjlab-sys4nlp/llama-moe"],"tags_count":4,"template":false,"template_full_name":null,"purl":"pkg:github/pjlab-sys4nlp/llama-moe","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/pjlab-sys4nlp","download_url":"https://codeload.github.com/pjlab-sys4nlp/llama-moe/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":286080680,"owners_count":34372130,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2026-05-26T15:22:16.424Z","status":"online","status_checked_at":"2026-06-15T02:00:07.085Z","response_time":63,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"pjlab-sys4nlp","name":"pjlab-sys4nlp","uuid":"124339599","kind":"organization","description":null,"email":null,"website":null,"location":null,"twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/124339599?v=4","repositories_count":1,"last_synced_at":"2023-10-12T20:41:01.548Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/pjlab-sys4nlp","funding_links":[],"total_stars":null,"followers":null,"following":null,"created_at":"2023-10-12T20:41:01.552Z","updated_at":"2023-10-12T20:41:01.552Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/pjlab-sys4nlp","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/pjlab-sys4nlp/repositories"},"packages":[],"commits":{"id":1639826,"full_name":"pjlab-sys4nlp/llama-moe","default_branch":"main","total_commits":142,"total_committers":5,"total_bot_commits":0,"total_bot_committers":0,"mean_commits":28.4,"dds":0.471830985915493,"past_year_total_commits":0,"past_year_total_committers":0,"past_year_total_bot_commits":0,"past_year_total_bot_committers":0,"past_year_mean_commits":0.0,"past_year_dds":0.0,"last_synced_at":"2026-06-11T15:04:20.160Z","last_synced_commit":"b17aff436cce58e2fcd7327789c7fadafe15d19e","created_at":"2024-07-25T15:31:33.917Z","updated_at":"2026-06-11T15:04:20.129Z","committers":[{"name":"zhutong","email":"tzhu1997@outlook.com","login":"Spico197","count":75},{"name":"Daize Dong","email":"dzdong2019@gmail.com","login":"DaizeDong","count":58},{"name":"XiaoYee","email":"503843998@qq.com","login":"XiaoYee","count":4},{"name":"jcruan","email":"jcruan@163.com","login":"JCruan519","count":3},{"name":"tongjingqi","email":"2389508713@qq.com","login":"tongjingqi","count":2}],"past_year_committers":[],"commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2026-06-15T00:00:11.107Z","repositories_count":6259889,"commits_count":882492512,"contributors_count":35088204,"owners_count":1166796,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues":{"table":{"full_name":"pjlab-sys4nlp/llama-moe","html_url":"https://github.com/pjlab-sys4nlp/llama-moe","last_synced_at":"2026-04-27T17:03:10.541Z","status":"error","issues_count":25,"pull_requests_count":50,"avg_time_to_close_issue":1043598.6315789474,"avg_time_to_close_pull_request":188664.04081632654,"issues_closed_count":19,"pull_requests_closed_count":49,"pull_request_authors_count":4,"issue_authors_count":23,"avg_comments_per_issue":2.28,"avg_comments_per_pull_request":0.14,"merged_pull_requests_count":46,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":6,"past_year_pull_requests_count":1,"past_year_avg_time_to_close_issue":218239.75,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":4,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":1,"past_year_issue_authors_count":6,"past_year_avg_comments_per_issue":1.6666666666666667,"past_year_avg_comments_per_pull_request":0.0,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0,"created_at":"2024-07-25T15:32:12.949Z","updated_at":"2026-04-27T17:03:10.541Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/pjlab-sys4nlp%2Fllama-moe/issues","issue_labels_count":{"table":{}},"pull_request_labels_count":{"table":{}},"issue_author_associations_count":{"table":{"NONE":24}},"pull_request_author_associations_count":{"table":{"COLLABORATOR":54}},"issue_authors":{"table":{"rzr002":2,"Minami-su":2,"18600709862":1,"theblackcat102":1,"bulaikexiansheng":1,"qiuzh20":1,"DoubleVII":1,"xyjsjruiliu":1,"exhyy":1,"abhinand5":1,"WangRongsheng":1,"Tangkexian":1,"apoorvcodes":1,"Xingxiangrui":1,"ZeyuTeng96":1,"He-JYang":1,"linyubupa":1,"Attention-is-All-I-Need":1,"kevin3567":1,"bestfleer":1,"ftgreat":1,"YixinSong-e":1}},"pull_request_authors":{"table":{"DaizeDong":29,"Spico197":23,"tongjingqi":1,"JCruan519":1}},"host":{"table":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2026-06-09T00:00:17.805Z","repositories_count":14786729,"issues_count":33482993,"pull_requests_count":110239305,"authors_count":11297234,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"}},"past_year_issue_labels_count":{"table":{}},"past_year_pull_request_labels_count":{"table":{}},"past_year_issue_author_associations_count":{"table":{}},"past_year_pull_request_author_associations_count":{"table":{}},"past_year_issue_authors":{"table":{}},"past_year_pull_request_authors":{"table":{}},"maintainers":[{"table":{"login":"DaizeDong","count":29,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/DaizeDong"}},{"table":{"login":"Spico197","count":23,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/Spico197"}},{"table":{"login":"tongjingqi","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/tongjingqi"}},{"table":{"login":"JCruan519","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/JCruan519"}}],"active_maintainers":[]}},"events":{"total":{"PullRequestEvent":1,"ForkEvent":12,"IssuesEvent":7,"WatchEvent":125,"IssueCommentEvent":11,"PushEvent":2},"last_year":{"ForkEvent":1,"WatchEvent":23}},"keywords":["continual-pre-training","expert-partition","llama","llm","mixture-of-experts","moe"],"dependencies":[{"ecosystem":"pypi","filepath":"requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-25T04:19:31.252Z","updated_at":"2023-12-25T04:19:31.252Z","repository_link":"https://github.com/pjlab-sys4nlp/llama-moe/blob/main/requirements.txt","dependencies":[{"id":15263655522,"package_name":"deepspeed","ecosystem":"pypi","requirements":"==0.10.0","direct":true,"kind":"runtime","optional":false},{"id":15263655523,"package_name":"flake8","ecosystem":"pypi","requirements":"==6.0.0","direct":true,"kind":"runtime","optional":false},{"id":15263655524,"package_name":"huggingface-hub","ecosystem":"pypi","requirements":"==0.16.4","direct":true,"kind":"runtime","optional":false},{"id":15263655525,"package_name":"isort","ecosystem":"pypi","requirements":"==5.12.0","direct":true,"kind":"runtime","optional":false},{"id":15263655526,"package_name":"k-means-constrained","ecosystem":"pypi","requirements":"==0.7.3","direct":true,"kind":"runtime","optional":false},{"id":15263655527,"package_name":"nltk","ecosystem":"pypi","requirements":"==3.8.1","direct":true,"kind":"runtime","optional":false},{"id":15263655528,"package_name":"ninja","ecosystem":"pypi","requirements":"==1.11.1","direct":true,"kind":"runtime","optional":false},{"id":15263655529,"package_name":"omegaconf","ecosystem":"pypi","requirements":"==2.0.6","direct":true,"kind":"runtime","optional":false},{"id":15263655530,"package_name":"packaging","ecosystem":"pypi","requirements":"==23.1","direct":true,"kind":"runtime","optional":false},{"id":15263655531,"package_name":"peft","ecosystem":"pypi","requirements":"==0.4.0","direct":true,"kind":"runtime","optional":false},{"id":15263655532,"package_name":"pre-commit","ecosystem":"pypi","requirements":"==3.3.3","direct":true,"kind":"runtime","optional":false},{"id":15263655533,"package_name":"pytest","ecosystem":"pypi","requirements":"==7.4.0","direct":true,"kind":"runtime","optional":false},{"id":15263655534,"package_name":"safetensors","ecosystem":"pypi","requirements":"==0.3.1","direct":true,"kind":"runtime","optional":false},{"id":15263655535,"package_name":"scikit-learn","ecosystem":"pypi","requirements":"==1.3.0","direct":true,"kind":"runtime","optional":false},{"id":15263655536,"package_name":"sentencepiece","ecosystem":"pypi","requirements":"==0.1.99","direct":true,"kind":"runtime","optional":false},{"id":15263655537,"package_name":"tensorboard","ecosystem":"pypi","requirements":"==2.13.0","direct":true,"kind":"runtime","optional":false},{"id":15263655538,"package_name":"tokenizers","ecosystem":"pypi","requirements":"==0.13.3","direct":true,"kind":"runtime","optional":false},{"id":15263655539,"package_name":"torch","ecosystem":"pypi","requirements":"==2.0.1","direct":true,"kind":"runtime","optional":false},{"id":15263655540,"package_name":"torchaudio","ecosystem":"pypi","requirements":"==2.0.2","direct":true,"kind":"runtime","optional":false},{"id":15263655541,"package_name":"torchvision","ecosystem":"pypi","requirements":"==0.15.2","direct":true,"kind":"runtime","optional":false},{"id":15263655542,"package_name":"tqdm","ecosystem":"pypi","requirements":"==4.65.0","direct":true,"kind":"runtime","optional":false},{"id":15263655543,"package_name":"transformers","ecosystem":"pypi","requirements":"==4.31.0","direct":true,"kind":"runtime","optional":false},{"id":15263655544,"package_name":"triton","ecosystem":"pypi","requirements":"==2.0.0","direct":true,"kind":"runtime","optional":false},{"id":15263655545,"package_name":"trl","ecosystem":"pypi","requirements":"==0.4.7","direct":true,"kind":"runtime","optional":false},{"id":15263655546,"package_name":"wandb","ecosystem":"pypi","requirements":"==0.15.6","direct":true,"kind":"runtime","optional":false},{"id":15263655547,"package_name":"xformers","ecosystem":"pypi","requirements":"==0.0.20","direct":true,"kind":"runtime","optional":false},{"id":15263655548,"package_name":"pebble","ecosystem":"pypi","requirements":"==5.0.3","direct":true,"kind":"runtime","optional":false},{"id":15263655549,"package_name":"matplotlib","ecosystem":"pypi","requirements":"==3.7.2","direct":true,"kind":"runtime","optional":false},{"id":15263655550,"package_name":"python-dotenv","ecosystem":"pypi","requirements":"==1.0.0","direct":true,"kind":"runtime","optional":false},{"id":15263655551,"package_name":"sentence-transformers","ecosystem":"pypi","requirements":"==2.2.2","direct":true,"kind":"runtime","optional":false},{"id":15263655552,"package_name":"Pillow","ecosystem":"pypi","requirements":"==9.4.0","direct":true,"kind":"runtime","optional":false},{"id":15263655553,"package_name":"numpy","ecosystem":"pypi","requirements":"==1.25.0","direct":true,"kind":"runtime","optional":false},{"id":15263655554,"package_name":"opencv-python","ecosystem":"pypi","requirements":"==4.8.1.78","direct":true,"kind":"runtime","optional":false},{"id":15263655555,"package_name":"pynvml","ecosystem":"pypi","requirements":"==11.5.0","direct":true,"kind":"runtime","optional":false},{"id":15263655556,"package_name":"PyYaml","ecosystem":"pypi","requirements":"==6.0.1","direct":true,"kind":"runtime","optional":false},{"id":15263655557,"package_name":"pandas","ecosystem":"pypi","requirements":"\u003c2.1.0","direct":true,"kind":"runtime","optional":false},{"id":15263655517,"package_name":"accelerate","ecosystem":"pypi","requirements":"==0.21.0","direct":true,"kind":"runtime","optional":false},{"id":15263655518,"package_name":"black","ecosystem":"pypi","requirements":"==23.7.0","direct":true,"kind":"runtime","optional":false},{"id":15263655519,"package_name":"coverage","ecosystem":"pypi","requirements":"==7.2.7","direct":true,"kind":"runtime","optional":false},{"id":15263655520,"package_name":"datasets","ecosystem":"pypi","requirements":"==2.14.1","direct":true,"kind":"runtime","optional":false},{"id":15263655521,"package_name":"debugpy","ecosystem":"pypi","requirements":"==1.6.7","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"setup.py","sha":null,"kind":"manifest","created_at":"2023-12-25T04:19:31.522Z","updated_at":"2023-12-25T04:19:31.522Z","repository_link":"https://github.com/pjlab-sys4nlp/llama-moe/blob/main/setup.py","dependencies":[{"id":15263655558,"package_name":"scikit-learn","ecosystem":"pypi","requirements":"==1.3.0","direct":true,"kind":"runtime","optional":false},{"id":15263655559,"package_name":"omegaconf","ecosystem":"pypi","requirements":"==2.0.6","direct":true,"kind":"runtime","optional":false},{"id":15263655560,"package_name":"tqdm","ecosystem":"pypi","requirements":"==4.65.0","direct":true,"kind":"runtime","optional":false},{"id":15263655561,"package_name":"datasets","ecosystem":"pypi","requirements":"==2.14.1","direct":true,"kind":"runtime","optional":false},{"id":15263655562,"package_name":"transformers","ecosystem":"pypi","requirements":"==4.31.0","direct":true,"kind":"runtime","optional":false},{"id":15263655563,"package_name":"peft","ecosystem":"pypi","requirements":"==0.4.0","direct":true,"kind":"runtime","optional":false},{"id":15263655564,"package_name":"tensorboard","ecosystem":"pypi","requirements":"==2.13.0","direct":true,"kind":"runtime","optional":false}]}],"score":8.527143522269405,"created_at":"2024-07-25T15:26:09.572Z","updated_at":"2026-06-15T17:00:52.621Z","avatar_url":"https://github.com/pjlab-sys4nlp.png","language":"Python","codemeta":null,"publiccode":null,"project_url":"https://summary.ecosyste.ms/api/v1/projects/124302","html_url":"https://summary.ecosyste.ms/projects/124302"}