{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"vllm","owner":"deepinfra","isFork":true,"description":"A high-throughput and memory-efficient inference and serving engine for LLMs","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":5,"issueCount":0,"starsCount":0,"forksCount":3496,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-31T01:00:16.708Z"}},{"type":"Public","name":"tensorrtllm_backend","owner":"deepinfra","isFork":true,"description":"The Triton TensorRT-LLM Backend","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":88,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-26T19:04:51.824Z"}},{"type":"Public","name":"TensorRT-LLM","owner":"deepinfra","isFork":true,"description":"TensorRT-LLM provides users with an easy-to-use Python API to define Large Language Models (LLMs) and build TensorRT engines that contain state-of-the-art optimizations to perform inference efficiently on NVIDIA GPUs. TensorRT-LLM also contains components to create Python and C++ runtimes that execute those TensorRT engines.","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":852,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-26T19:04:35.199Z"}},{"type":"Public","name":"ngx-http-auth-jwt-module","owner":"deepinfra","isFork":true,"description":"Secure your NGINX locations with JWT","allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":118,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T15:27:47.646Z"}},{"type":"Public","name":"deepctl","owner":"deepinfra","isFork":false,"description":"Command line tool for Deep Infra cloud ML inference service","allTopics":[],"primaryLanguage":{"name":"Rust","color":"#dea584"},"pullRequestCount":0,"issueCount":1,"starsCount":23,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-10T16:32:04.770Z"}},{"type":"Public","name":"langchainjs","owner":"deepinfra","isFork":true,"description":"🦜🔗 Build context-aware reasoning applications 🦜🔗","allTopics":[],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":2010,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T04:26:54.049Z"}},{"type":"Public","name":"deepinfra-node","owner":"deepinfra","isFork":false,"description":"Official TypeScript wrapper for DeepInfra Inference API","allTopics":["javascript","api","wrapper","typescript","deep-learning","api-client","llm","llm-inference"],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":1,"issueCount":4,"starsCount":6,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-13T10:21:59.758Z"}},{"type":"Public","name":"lm-evaluation-harness","owner":"deepinfra","isFork":true,"description":"A framework for few-shot evaluation of language models.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1609,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-29T19:46:52.415Z"}},{"type":"Public","name":"langchain","owner":"deepinfra","isFork":true,"description":"⚡ Building applications with LLMs through composability ⚡","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":14282,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-22T16:08:02.212Z"}},{"type":"Public","name":"litellm","owner":"deepinfra","isFork":true,"description":"Call all LLM APIs using the OpenAI format. Use Azure, OpenAI, Cohere, Anthropic, Ollama, VLLM, Sagemaker, HuggingFace, Replicate (100+ LLMs)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1265,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-08T16:54:36.867Z"}},{"type":"Public","name":"text-generation-inference","owner":"deepinfra","isFork":true,"description":"Large Language Model Text Generation Inference","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":0,"starsCount":9,"forksCount":974,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-15T21:31:46.309Z"}},{"type":"Public","name":"fetch-stream-parser","owner":"deepinfra","isFork":true,"description":"fetch-stream","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-06T10:25:30.293Z"}},{"type":"Public","name":"fetch-event-source","owner":"deepinfra","isFork":true,"description":"A better API for making Event Source requests, with all the features of fetch()","allTopics":[],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":128,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-18T17:45:57.113Z"}},{"type":"Public","name":"cog","owner":"deepinfra","isFork":true,"description":"Containers for machine learning","allTopics":[],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":525,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-01T16:28:12.845Z"}},{"type":"Public","name":"cog-llama-2","owner":"deepinfra","isFork":false,"description":"A cog for running llama-2 using llama.cpp server","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-01T09:47:41.913Z"}},{"type":"Public","name":"transformers","owner":"deepinfra","isFork":true,"description":"🤗 Transformers: State-of-the-art Machine Learning for Pytorch, TensorFlow, and JAX.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":25876,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-24T10:35:53.787Z"}},{"type":"Public","name":"superfans-gpu-controller","owner":"deepinfra","isFork":true,"description":"NVIDIA GPU-based FAN controller for SUPERMICRO server","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":3,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-04-25T05:37:42.213Z"}},{"type":"Public","name":"whisper-timestamped","owner":"deepinfra","isFork":true,"description":"Multilingual Automatic Speech Recognition with word-level timestamps and confidence","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":144,"license":"GNU Affero General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-03-07T01:50:35.963Z"}},{"type":"Public","name":"sentence-transformers","owner":"deepinfra","isFork":true,"description":"Multilingual Sentence & Image Embeddings with BERT","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":2412,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-28T16:03:55.829Z"}},{"type":"Public","name":"full-stack-deep-learning-website","owner":"deepinfra","isFork":true,"description":"Source for https://fullstackdeeplearning.com","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":202,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-14T00:23:56.547Z"}}],"repositoryCount":20,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"deepinfra repositories"}