{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"vllm","owner":"vllm-project","isFork":false,"description":"A high-throughput and memory-efficient inference and serving engine for LLMs","topicNames":["amd","cuda","inference","pytorch","transformer","llama","gpt","rocm","model-serving","mlops"],"topicsNotShown":5,"allTopics":["amd","cuda","inference","pytorch","transformer","llama","gpt","rocm","model-serving","mlops","llm","inferentia","llmops","llm-serving","trainium"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":255,"issueCount":873,"starsCount":20004,"forksCount":2701,"license":"Apache License 2.0","participation":[4,7,7,22,18,19,6,14,8,12,5,5,14,11,20,18,21,21,8,16,14,1,21,10,17,23,26,19,39,30,6,11,17,21,24,28,15,24,27,33,31,49,41,70,42,53,43,64,66,47,49,38],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-26T04:29:51.804Z"}},{"type":"Public","name":"flash-attention","owner":"vllm-project","isFork":true,"description":"Fast and memory-efficient exact attention","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":2,"forksCount":991,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-22T22:53:28.236Z"}},{"type":"Public","name":"vllm-nccl","owner":"vllm-project","isFork":false,"description":"Manages vllm-nccl dependency","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":13,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-01T20:54:28.924Z"}},{"type":"Public","name":"dashboard","owner":"vllm-project","isFork":false,"description":"vLLM performance dashboard","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":12,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,6,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T06:13:47.853Z"}}],"repositoryCount":4,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}