{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"sdft","owner":"sail-sg","isFork":false,"description":"[ACL 2024] The official codebase for the paper \"Self-Distillation Bridges Distribution Gap in Language Model Fine-tuning\".","allTopics":["language-model","self-distillation","supervised-finetuning"],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":0,"starsCount":44,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-28T07:06:03.365Z"}},{"type":"Public","name":"envpool","owner":"sail-sg","isFork":false,"description":"C++-based high-performance parallel environment execution engine (vectorized env) for general RL environments.","allTopics":["robotics","gym","high-performance-computing","cpp17","box2d","vizdoom","parallel-processing","threadpool","pybind11","atari-games","mujoco","lock-free-queue","dm-control","reinforcement-learning-environments","dm-env","reinforcement-learning"],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":7,"issueCount":52,"starsCount":1032,"forksCount":89,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-28T00:23:01.309Z"}},{"type":"Public","name":"zero-bubble-pipeline-parallelism","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":11,"starsCount":198,"forksCount":2001,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-27T03:11:40.146Z"}},{"type":"Public","name":"sailor-llm","owner":"sail-sg","isFork":false,"description":"Sailor: Open Language Models for South-East Asia","allTopics":["indonesia","thai","language-model","sea","vietnam","lao","malay"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":78,"forksCount":5,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,31,0,0,0,1,4,0,1,0,1,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T06:20:00.449Z"}},{"type":"Public","name":"sailcraft","owner":"sail-sg","isFork":false,"description":"Data Toolkit for Sailor Language Models","allTopics":["data-deduplication","data-cleaning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":65,"forksCount":6,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,9,0,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T08:37:25.218Z"}},{"type":"Public","name":"d4ft","owner":"sail-sg","isFork":false,"description":"A JAX library for Density Functional Theory.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":29,"forksCount":2,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,4,0,7,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-04T10:45:14.584Z"}},{"type":"Public","name":"finetune-fair-diffusion","owner":"sail-sg","isFork":false,"description":"Code of the paper: Finetuning Text-to-Image Diffusion Models for Fairness","allTopics":["text-to-image","fairness","diffusion-models","trustworthy-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":29,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T05:38:20.646Z"}},{"type":"Public","name":"MDT","owner":"sail-sg","isFork":false,"description":"Masked Diffusion Transformer is the SOTA for image synthesis. (ICCV 2023)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":11,"starsCount":461,"forksCount":32,"license":"Apache License 2.0","participation":[2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,2,0,1,2,0,0,0,0,2,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-23T18:53:04.939Z"}},{"type":"Public","name":"CLoT","owner":"sail-sg","isFork":false,"description":"CVPR'24, Official Codebase of our Paper: \"Let's Think Outside the Box: Exploring Leap-of-Thought in Large Language Models with Creative Humor Generation\".","allTopics":["association","multimodal-deep-learning","humor-generation","large-language-models","leap-of-thought"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":10,"starsCount":247,"forksCount":10,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-13T01:52:28.174Z"}},{"type":"Public","name":"AnyDoor","owner":"sail-sg","isFork":false,"description":"AnyDoor: Test-Time Backdoor Attacks on Multimodal Large Language Models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":34,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,2,0,0,0,0,0,0,1,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T04:59:17.025Z"}},{"type":"Public","name":"Adan","owner":"sail-sg","isFork":false,"description":"Adan: Adaptive Nesterov Momentum Algorithm for Faster Optimizing Deep Models","allTopics":["artificial-intelligence","resnet","vit","diffusion","mae","fairseq","cuda-programming","bert-model","gpt2","transformer-xl","timm","convnext","adan","dreamfusion","deep-learning","optimizer","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":727,"forksCount":63,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-04T14:06:15.005Z"}},{"type":"Public","name":"InfNeRF","owner":"sail-sg","isFork":false,"description":"InfNeRF: Towards Infinite Scale NeRF Rendering with O(log n) Space Complexity","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-04T03:17:00.830Z"}},{"type":"Public","name":"Agent-Smith","owner":"sail-sg","isFork":false,"description":"[ICML2024] Agent Smith: A Single Image Can Jailbreak One Million Multimodal LLM Agents Exponentially Fast","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":53,"forksCount":6,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-26T03:54:24.189Z"}},{"type":"Public","name":"GDPO","owner":"sail-sg","isFork":false,"description":"Graph Diffusion Policy Optimization","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":20,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-17T13:27:35.826Z"}},{"type":"Public","name":"lm-random-memory-access","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":6,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-12T07:12:31.614Z"}},{"type":"Public","name":"Consistent3D","owner":"sail-sg","isFork":false,"description":"The official PyTorch implementation of Consistent3D (CVPR 2024)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":55,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-02T03:59:42.100Z"}},{"type":"Public","name":"EditAnything","owner":"sail-sg","isFork":false,"description":"Edit anything in images powered by segment-anything, ControlNet, StableDiffusion, etc. (ACM MM)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":43,"starsCount":3164,"forksCount":174,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-29T14:37:00.394Z"}},{"type":"Public","name":"zero-bubble-megatron-deepspeed","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism implemented on Megatron-Deepspeed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":2001,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-21T09:18:32.294Z"}},{"type":"Public","name":"autofd","owner":"sail-sg","isFork":false,"description":"Automatic Functional Differentiation in JAX","allTopics":["automatic-differentiation","jax","neural-operator","variational-calculus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":44,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-20T23:11:54.843Z"}},{"type":"Public","name":"mugs","owner":"sail-sg","isFork":false,"description":"A PyTorch implementation of Mugs proposed by our paper \"Mugs: A Multi-Granular Self-Supervised Learning Framework\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":81,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-13T13:51:09.006Z"}},{"type":"Public","name":"MMCBench","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":23,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T22:30:23.803Z"}},{"type":"Public","name":"D-TRAK","owner":"sail-sg","isFork":false,"description":"Intriguing Properties of Data Attribution on Diffusion Models (ICLR 2024)","allTopics":["attribution","interpretability","influence-functions","diffusion-models","ddpm","data-valuation","data-centric-ai","stable-diffusion","data-attribution"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":19,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T07:03:39.548Z"}},{"type":"Public","name":"Megatron-LLM","owner":"sail-sg","isFork":true,"description":"distributed trainer for LLMs","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":72,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-19T09:20:36.534Z"}},{"type":"Public","name":"metaformer","owner":"sail-sg","isFork":false,"description":"MetaFormer Baselines for Vision (TPAMI 2024)","allTopics":["transformer","metaformer","starrelu"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":2,"starsCount":370,"forksCount":21,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-15T01:35:03.849Z"}},{"type":"Public","name":"sewformer","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":118,"forksCount":12,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-28T09:03:16.969Z"}},{"type":"Public","name":"jax_xc","owner":"sail-sg","isFork":false,"description":"Exchange correlation functionals translated from libxc to jax","allTopics":["python","density-functional-theory","libxc","jax"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":39,"forksCount":2,"license":"Mozilla Public License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T15:58:08.899Z"}},{"type":"Public","name":"lorahub","owner":"sail-sg","isFork":false,"description":"The official repository of paper \"LoraHub: Efficient Cross-Task Generalization via Dynamic LoRA Composition\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":528,"forksCount":34,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-30T15:18:34.754Z"}},{"type":"Public","name":"inceptionnext","owner":"sail-sg","isFork":false,"description":"InceptionNeXt: When Inception Meets ConvNeXt (CVPR 2024)","allTopics":["convolutional-neural-networks"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":13,"starsCount":200,"forksCount":15,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-20T01:07:59.543Z"}},{"type":"Public","name":"edp","owner":"sail-sg","isFork":false,"description":"[NeurIPS 2023] Efficient Diffusion Policy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":58,"forksCount":5,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-31T03:16:36.663Z"}},{"type":"Public","name":"ScaleLong","owner":"sail-sg","isFork":false,"description":"The official repository of paper \"ScaleLong: Towards More Stable Training of Diffusion Model via Scaling Network Long Skip Connection\" (NeurIPS 2023)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":47,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-23T01:54:49.074Z"}}],"repositoryCount":55,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}