{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"vllm","owner":"vllm-project","isFork":false,"description":"A high-throughput and memory-efficient inference and serving engine for LLMs","allTopics":["amd","cuda","inference","pytorch","transformer","llama","gpt","rocm","model-serving","mlops","llm","inferentia","llmops","llm-serving","trainium"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":277,"issueCount":879,"starsCount":20880,"forksCount":2888,"license":"Apache License 2.0","participation":[22,15,19,10,13,11,6,11,6,10,7,17,20,21,16,23,7,21,4,14,10,10,31,11,30,32,40,11,2,16,19,25,26,26,14,23,31,33,28,58,45,62,39,56,52,57,62,52,48,29,64,75],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-12T10:05:15.896Z"}},{"type":"Public","name":"flash-attention","owner":"vllm-project","isFork":true,"description":"Fast and memory-efficient exact attention","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":1016,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[0,0,6,3,8,19,14,0,17,19,20,28,9,13,13,2,6,1,2,0,0,3,6,5,1,0,2,20,0,6,12,18,7,4,18,2,6,2,0,6,3,9,5,0,4,0,7,0,4,3,2,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T01:53:57.411Z"}},{"type":"Public archive","name":"vllm-nccl","owner":"vllm-project","isFork":false,"description":"Manages vllm-nccl dependency","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":16,"forksCount":2,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6,3,1,1,2,0,0,0,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-03T22:00:55.924Z"}},{"type":"Public","name":"dashboard","owner":"vllm-project","isFork":false,"description":"vLLM performance dashboard","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":12,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19,2,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T06:13:47.853Z"}}],"repositoryCount":4,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}