{"id":124835,"url":"https://github.com/microsoft/sarathi-serve","last_synced_at":"2026-06-02T06:30:30.580Z","repository":{"id":239106343,"uuid":"713419018","full_name":"microsoft/sarathi-serve","owner":"microsoft","description":"A low-latency \u0026 high-throughput serving engine for LLMs","archived":false,"fork":false,"pushed_at":"2026-01-08T05:10:57.000Z","size":2877,"stargazers_count":504,"open_issues_count":16,"forks_count":63,"subscribers_count":7,"default_branch":"main","last_synced_at":"2026-05-26T09:35:37.278Z","etag":null,"topics":["llama","llm-inference","pytorch","transformer"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/microsoft.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":"CONTRIBUTING.md","funding":null,"license":"LICENSE","code_of_conduct":"CODE_OF_CONDUCT.md","threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":"SECURITY.md","support":"SUPPORT.md","governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null,"notice":null,"maintainers":null,"copyright":null,"agents":null,"dco":null,"cla":null}},"created_at":"2023-11-02T13:38:16.000Z","updated_at":"2026-05-26T07:50:52.000Z","dependencies_parsed_at":"2024-05-10T03:32:59.958Z","dependency_job_id":"42ad6e6a-84c5-4800-9f9f-a268e4b4d2cc","html_url":"https://github.com/microsoft/sarathi-serve","commit_stats":null,"previous_names":["microsoft/sarathi-serve"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/microsoft/sarathi-serve","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/microsoft","download_url":"https://codeload.github.com/microsoft/sarathi-serve/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":286080680,"owners_count":33632928,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2026-05-26T15:22:16.424Z","status":"online","status_checked_at":"2026-05-28T02:00:06.440Z","response_time":99,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"microsoft","name":"Microsoft","uuid":"6154722","kind":"organization","description":"Open source projects and samples from Microsoft","email":"opensource@microsoft.com","website":"https://opensource.microsoft.com","location":"Redmond, WA","twitter":"OpenAtMicrosoft","company":null,"icon_url":"https://avatars.githubusercontent.com/u/6154722?v=4","repositories_count":7804,"last_synced_at":"2026-05-19T00:57:03.114Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/microsoft","funding_links":[],"total_stars":3954942,"followers":119968,"following":0,"created_at":"2022-11-02T16:20:12.368Z","updated_at":"2026-05-19T00:57:03.114Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/microsoft","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/microsoft/repositories"},"packages":[],"commits":{"id":1640327,"full_name":"microsoft/sarathi-serve","default_branch":"main","total_commits":33,"total_committers":10,"total_bot_commits":1,"total_bot_committers":1,"mean_commits":3.3,"dds":0.4545454545454546,"past_year_total_commits":3,"past_year_total_committers":3,"past_year_total_bot_commits":0,"past_year_total_bot_committers":0,"past_year_mean_commits":1.0,"past_year_dds":0.6666666666666667,"last_synced_at":"2025-11-18T00:58:06.258Z","last_synced_commit":"3a210e76f5fb0be82b568097d45486401119a967","created_at":"2024-07-25T15:38:10.548Z","updated_at":"2025-11-18T00:56:37.219Z","committers":[{"name":"Amey Agrawal","email":"agrawalamey12@gmail.com","login":"AgrawalAmey","count":18},{"name":"Microsoft Open Source","email":"microsoftopensource","login":"microsoftopensource","count":5},{"name":"Nitin Kedia","email":"nitinkedia7@gmail.com","login":"nitinkedia7","count":3},{"name":"yuhkalhic","email":"146904269+yuhkalhic","login":"yuhkalhic","count":1},{"name":"microsoft-github-operations[bot]","email":"55726097+microsoft-github-operations[bot]","login":"microsoft-github-operations[bot]","count":1},{"name":"Varun Komperla","email":"144953849+kompy99","login":"kompy99","count":1},{"name":"Mohammed Wazir Adain","email":"mwadain@gmail.com","login":"MohammedAdain","count":1},{"name":"Kasra Alexander Sohrab","email":"67869617+kasohrab","login":"kasohrab","count":1},{"name":"Ashish Panwar","email":"31126399+apanwariisc","login":"apanwariisc","count":1},{"name":"Anirudha Agrawal","email":"44918113+Anirudhaagrawal","login":"Anirudhaagrawal","count":1}],"past_year_committers":[{"name":"yuhkalhic","email":"146904269+yuhkalhic","login":"yuhkalhic","count":1},{"name":"Mohammed Wazir Adain","email":"mwadain@gmail.com","login":"MohammedAdain","count":1},{"name":"Anirudha Agrawal","email":"44918113+Anirudhaagrawal","login":"Anirudhaagrawal","count":1}],"commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-11-20T00:00:13.077Z","repositories_count":6111778,"commits_count":924606049,"contributors_count":36012494,"owners_count":1117574,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues":{"table":{"full_name":"microsoft/sarathi-serve","html_url":"https://github.com/microsoft/sarathi-serve","last_synced_at":"2025-10-23T18:18:50.824Z","status":"active","issues_count":28,"pull_requests_count":65,"avg_time_to_close_issue":605297.8823529412,"avg_time_to_close_pull_request":156463.23913043478,"issues_closed_count":17,"pull_requests_closed_count":46,"pull_request_authors_count":12,"issue_authors_count":24,"avg_comments_per_issue":1.4285714285714286,"avg_comments_per_pull_request":0.47692307692307695,"merged_pull_requests_count":42,"bot_issues_count":2,"bot_pull_requests_count":4,"past_year_issues_count":11,"past_year_pull_requests_count":19,"past_year_avg_time_to_close_issue":528347.5,"past_year_avg_time_to_close_pull_request":1846294.5,"past_year_issues_closed_count":2,"past_year_pull_requests_closed_count":2,"past_year_pull_request_authors_count":8,"past_year_issue_authors_count":11,"past_year_avg_comments_per_issue":0.45454545454545453,"past_year_avg_comments_per_pull_request":0.7894736842105263,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":4,"past_year_merged_pull_requests_count":1,"created_at":"2024-07-25T15:38:20.011Z","updated_at":"2025-10-23T18:18:50.824Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/microsoft%2Fsarathi-serve/issues","issue_labels_count":{"table":{}},"pull_request_labels_count":{"table":{"dependencies":4,"python":4}},"issue_author_associations_count":{"table":{"NONE":28}},"pull_request_author_associations_count":{"table":{"COLLABORATOR":40,"NONE":16,"CONTRIBUTOR":9}},"issue_authors":{"table":{"Sunt-ing":4,"microsoft-github-policy-service[bot]":2,"Hudayday":1,"amansahu278":1,"lambda7xx":1,"Jaxcong":1,"zhypku":1,"irasin":1,"marwage":1,"Mrxiangli":1,"aniketmaurya":1,"deciding":1,"JuiceLemonLemon":1,"yunoJ":1,"genglinWang":1,"yuhkalhic":1,"zhanggj821":1,"Albert-Zhao-2020":1,"jumbo-q":1,"azamikram":1,"kjain1810":1,"hatttoomma":1,"MohammedAdain":1,"BigCousin-z":1}},"pull_request_authors":{"table":{"AgrawalAmey":34,"nitinkedia7":7,"kasohrab":6,"dependabot[bot]":4,"jadewang21":2,"alvi75":2,"vmehrotra50":2,"kompy99":2,"tianhao909":2,"yuhkalhic":2,"MohammedAdain":1,"apanwariisc":1}},"host":{"table":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-11-20T00:00:08.556Z","repositories_count":11680247,"issues_count":35493608,"pull_requests_count":115270548,"authors_count":11044964,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"}},"past_year_issue_labels_count":{"table":{}},"past_year_pull_request_labels_count":{"table":{"dependencies":4,"python":4}},"past_year_issue_author_associations_count":{"table":{"NONE":10}},"past_year_pull_request_author_associations_count":{"table":{"NONE":12,"CONTRIBUTOR":5}},"past_year_issue_authors":{"table":{"aniketmaurya":1,"BigCousin-z":1,"genglinWang":1,"hatttoomma":1,"Hudayday":1,"kjain1810":1,"marwage":1,"MohammedAdain":1,"yuhkalhic":1,"zhanggj821":1}},"past_year_pull_request_authors":{"table":{"dependabot[bot]":4,"yuhkalhic":2,"vmehrotra50":2,"jadewang21":2,"kasohrab":2,"tianhao909":2,"AgrawalAmey":2,"MohammedAdain":1}},"maintainers":[{"table":{"login":"AgrawalAmey","count":32,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/AgrawalAmey"}},{"table":{"login":"nitinkedia7","count":7,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/nitinkedia7"}},{"table":{"login":"apanwariisc","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/apanwariisc"}}],"active_maintainers":[]}},"events":{"total":{"IssuesEvent":11,"WatchEvent":188,"DeleteEvent":1,"MemberEvent":2,"IssueCommentEvent":20,"PushEvent":1,"PullRequestReviewEvent":4,"PullRequestEvent":12,"ForkEvent":31,"CreateEvent":1},"last_year":{"IssuesEvent":9,"WatchEvent":151,"DeleteEvent":1,"MemberEvent":2,"IssueCommentEvent":12,"PushEvent":1,"PullRequestReviewEvent":4,"PullRequestEvent":11,"ForkEvent":27,"CreateEvent":1}},"keywords":["llama","llm-inference","pytorch","transformer"],"dependencies":[{"ecosystem":"actions","filepath":".github/workflows/yapf.yml","sha":null,"kind":"manifest","created_at":"2024-05-10T03:32:58.205Z","updated_at":"2024-05-10T03:32:58.205Z","repository_link":"https://github.com/microsoft/sarathi-serve/blob/main/.github/workflows/yapf.yml","dependencies":[{"id":18004640139,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v2","direct":true,"kind":"composite","optional":false},{"id":18004640140,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v2","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"pypi","filepath":"pyproject.toml","sha":null,"kind":"manifest","created_at":"2024-05-10T03:32:58.322Z","updated_at":"2024-05-10T03:32:58.322Z","repository_link":"https://github.com/microsoft/sarathi-serve/blob/main/pyproject.toml","dependencies":[]},{"ecosystem":"pypi","filepath":"requirements-dev.txt","sha":null,"kind":"manifest","created_at":"2024-05-10T03:32:58.359Z","updated_at":"2024-05-10T03:32:58.359Z","repository_link":"https://github.com/microsoft/sarathi-serve/blob/main/requirements-dev.txt","dependencies":[{"id":18004640141,"package_name":"yapf","ecosystem":"pypi","requirements":"==0.40.2","direct":true,"kind":"development","optional":false},{"id":18004640142,"package_name":"pylint","ecosystem":"pypi","requirements":"==2.8.2","direct":true,"kind":"development","optional":false},{"id":18004640143,"package_name":"types-PyYAML","ecosystem":"pypi","requirements":"*","direct":true,"kind":"development","optional":false},{"id":18004640144,"package_name":"types-requests","ecosystem":"pypi","requirements":"*","direct":true,"kind":"development","optional":false},{"id":18004640145,"package_name":"types-setuptools","ecosystem":"pypi","requirements":"*","direct":true,"kind":"development","optional":false},{"id":18004640146,"package_name":"nbdime","ecosystem":"pypi","requirements":"*","direct":true,"kind":"development","optional":false}]},{"ecosystem":"pypi","filepath":"requirements.txt","sha":null,"kind":"manifest","created_at":"2024-05-10T03:32:58.397Z","updated_at":"2024-05-10T03:32:58.397Z","repository_link":"https://github.com/microsoft/sarathi-serve/blob/main/requirements.txt","dependencies":[{"id":18004640147,"package_name":"ninja","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640148,"package_name":"psutil","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640149,"package_name":"ray","ecosystem":"pypi","requirements":"\u003e=2.5.1","direct":true,"kind":"runtime","optional":false},{"id":18004640150,"package_name":"pandas","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640151,"package_name":"pyarrow","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640152,"package_name":"sentencepiece","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640153,"package_name":"numpy","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640154,"package_name":"torch","ecosystem":"pypi","requirements":"==2.2.2","direct":true,"kind":"runtime","optional":false},{"id":18004640155,"package_name":"transformers","ecosystem":"pypi","requirements":"\u003e=4.37.0","direct":true,"kind":"runtime","optional":false},{"id":18004640156,"package_name":"matplotlib","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640157,"package_name":"plotly_express","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640158,"package_name":"seaborn","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640159,"package_name":"wandb","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640160,"package_name":"kaleido","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640161,"package_name":"ddsketch","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640162,"package_name":"jupyterlab","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640163,"package_name":"flashinfer","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640164,"package_name":"pillow","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640165,"package_name":"tiktoken","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640166,"package_name":"grpcio","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":18004640167,"package_name":"tqdm","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"setup.py","sha":null,"kind":"manifest","created_at":"2024-05-10T03:32:59.874Z","updated_at":"2024-05-10T03:32:59.874Z","repository_link":"https://github.com/microsoft/sarathi-serve/blob/main/setup.py","dependencies":[]}],"score":8.556413904569519,"created_at":"2024-07-25T15:26:14.089Z","updated_at":"2026-06-02T06:30:30.580Z","avatar_url":"https://github.com/microsoft.png","language":"Python","codemeta":null,"publiccode":null,"project_url":"https://summary.ecosyste.ms/api/v1/projects/124835","html_url":"https://summary.ecosyste.ms/projects/124835"}