{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"FlexGen","owner":"FMInference","isFork":false,"description":"Running large language models on a single GPU for throughput-oriented scenarios.","topicNames":["machine-learning","offloading","high-throughput","opt","gpt-3","large-language-models","deep-learning"],"topicsNotShown":0,"allTopics":["machine-learning","offloading","high-throughput","opt","gpt-3","large-language-models","deep-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":49,"starsCount":9038,"forksCount":527,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-19T19:33:37.171Z"}},{"type":"Public","name":"H2O","owner":"FMInference","isFork":false,"description":"[NeurIPS'23] H2O: Heavy-Hitter Oracle for Efficient Generative Inference of Large Language Models.","topicNames":["sparsity","high-throughput","heavy-hitters","kv-cache","gpt-3","large-language-models"],"topicsNotShown":0,"allTopics":["sparsity","high-throughput","heavy-hitters","kv-cache","gpt-3","large-language-models"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":20,"starsCount":293,"forksCount":25,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-17T15:10:12.258Z"}},{"type":"Public","name":"DejaVu","owner":"FMInference","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":19,"starsCount":230,"forksCount":29,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-02T21:51:45.539Z"}}],"repositoryCount":3,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}