{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"zero-bubble-pipeline-parallelism","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":16,"starsCount":223,"forksCount":2114,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T10:31:10.748Z"}},{"type":"Public","name":"sailor-llm","owner":"sail-sg","isFork":false,"description":"Sailor: Open Language Models for South-East Asia","allTopics":["indonesia","thai","language-model","sea","vietnam","lao","malay"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":83,"forksCount":7,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,31,0,0,1,0,4,0,1,1,0,0,1,0,0,0,0,0,0,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T02:59:30.449Z"}},{"type":"Public","name":"sailcraft","owner":"sail-sg","isFork":false,"description":"Data Toolkit for Sailor Language Models","allTopics":["data-deduplication","data-cleaning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":68,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T02:58:47.218Z"}},{"type":"Public","name":"regmix","owner":"sail-sg","isFork":false,"description":"🧬 RegMix: Data Mixture as Regression for Language Model Pre-training ","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":43,"forksCount":0,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,19,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T02:56:47.114Z"}},{"type":"Public","name":"dice","owner":"sail-sg","isFork":false,"description":"Official implementation of Bootstrapping Language Models via DPO Implicit Rewards","allTopics":["alignment","preference-learning","large-language-models","rlhf"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":25,"forksCount":1,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,3,0,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-03T10:00:07.618Z"}},{"type":"Public","name":"Adan","owner":"sail-sg","isFork":false,"description":"Adan: Adaptive Nesterov Momentum Algorithm for Faster Optimizing Deep Models","allTopics":["deep-learning","optimizer","pytorch","artificial-intelligence","moe","resnet","vit","diffusion","mae","fairseq","cuda-programming","bert-model","gpt2","transformer-xl","timm","convnext","adan","llms","dreamfusion","llm-training"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":739,"forksCount":63,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-02T18:26:36.005Z"}},{"type":"Public","name":"envpool","owner":"sail-sg","isFork":false,"description":"C++-based high-performance parallel environment execution engine (vectorized env) for general RL environments.","allTopics":["robotics","gym","high-performance-computing","cpp17","box2d","vizdoom","parallel-processing","threadpool","pybind11","atari-games","mujoco","lock-free-queue","dm-control","reinforcement-learning-environments","dm-env","reinforcement-learning"],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":8,"issueCount":54,"starsCount":1044,"forksCount":93,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,1,0,0,0,0,0,0,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-27T22:05:12.383Z"}},{"type":"Public archive","name":"zero-bubble-megatron-deepspeed","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism implemented on Megatron-Deepspeed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":2114,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-27T08:51:04.973Z"}},{"type":"Public","name":"CPO","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":16,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-14T04:35:07.252Z"}},{"type":"Public","name":"sailcompass","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-13T13:24:47.321Z"}},{"type":"Public","name":"I-FSJ","owner":"sail-sg","isFork":false,"description":"Improved Few-Shot Jailbreaking Can Circumvent Aligned Language Models and Their Defenses (NextGenAISafety @ ICML 2024)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":28,"forksCount":3,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T00:59:42.643Z"}},{"type":"Public","name":"optim4rl","owner":"sail-sg","isFork":false,"description":"Optim4RL is a Jax framework of learning to optimize for reinforcement learning.","allTopics":["reinforcement-learning","optimization","optimizer","reinforcement-learning-algorithms","optimization-algorithms","meta-learning","jax","learning-to-learn","optimizers","meta-learning-algorithms","learning-to-optimize","meta-learning-algorithm"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":21,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-04T07:21:58.237Z"}},{"type":"Public","name":"metaformer","owner":"sail-sg","isFork":false,"description":"MetaFormer Baselines for Vision (TPAMI 2024)","allTopics":["transformer","metaformer","starrelu"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":383,"forksCount":21,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T15:32:57.849Z"}},{"type":"Public","name":"poolformer","owner":"sail-sg","isFork":false,"description":"PoolFormer: MetaFormer Is Actually What You Need for Vision (CVPR 2022 Oral)","allTopics":["transformer","image-classification","mlp","pooling","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":12,"starsCount":1264,"forksCount":116,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T15:19:56.549Z"}},{"type":"Public","name":"sdft","owner":"sail-sg","isFork":false,"description":"[ACL 2024] The official codebase for the paper \"Self-Distillation Bridges Distribution Gap in Language Model Fine-tuning\".","allTopics":["language-model","self-distillation","supervised-finetuning"],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":0,"starsCount":58,"forksCount":4,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-28T07:06:03.365Z"}},{"type":"Public","name":"d4ft","owner":"sail-sg","isFork":false,"description":"A JAX library for Density Functional Theory.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":30,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-04T10:45:14.584Z"}},{"type":"Public","name":"finetune-fair-diffusion","owner":"sail-sg","isFork":false,"description":"Code of the paper: Finetuning Text-to-Image Diffusion Models for Fairness","allTopics":["text-to-image","fairness","diffusion-models","trustworthy-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":33,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T05:38:20.646Z"}},{"type":"Public","name":"MDT","owner":"sail-sg","isFork":false,"description":"Masked Diffusion Transformer is the SOTA for image synthesis. (ICCV 2023)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":12,"starsCount":486,"forksCount":35,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-23T18:53:04.939Z"}},{"type":"Public","name":"CLoT","owner":"sail-sg","isFork":false,"description":"CVPR'24, Official Codebase of our Paper: \"Let's Think Outside the Box: Exploring Leap-of-Thought in Large Language Models with Creative Humor Generation\".","allTopics":["association","multimodal-deep-learning","humor-generation","large-language-models","leap-of-thought"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":11,"starsCount":260,"forksCount":10,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-13T01:52:28.174Z"}},{"type":"Public","name":"AnyDoor","owner":"sail-sg","isFork":false,"description":"AnyDoor: Test-Time Backdoor Attacks on Multimodal Large Language Models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":34,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T04:59:17.025Z"}},{"type":"Public","name":"InfNeRF","owner":"sail-sg","isFork":false,"description":"InfNeRF: Towards Infinite Scale NeRF Rendering with O(log n) Space Complexity","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-04T03:17:00.830Z"}},{"type":"Public","name":"Agent-Smith","owner":"sail-sg","isFork":false,"description":"[ICML2024] Agent Smith: A Single Image Can Jailbreak One Million Multimodal LLM Agents Exponentially Fast","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":64,"forksCount":9,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-26T03:54:24.189Z"}},{"type":"Public","name":"GDPO","owner":"sail-sg","isFork":false,"description":"Graph Diffusion Policy Optimization","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":20,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-17T13:27:35.826Z"}},{"type":"Public","name":"lm-random-memory-access","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":8,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-12T07:12:31.614Z"}},{"type":"Public","name":"Consistent3D","owner":"sail-sg","isFork":false,"description":"The official PyTorch implementation of Consistent3D (CVPR 2024)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":60,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-02T03:59:42.100Z"}},{"type":"Public","name":"EditAnything","owner":"sail-sg","isFork":false,"description":"Edit anything in images powered by segment-anything, ControlNet, StableDiffusion, etc. (ACM MM)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":43,"starsCount":3230,"forksCount":181,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-29T14:37:00.394Z"}},{"type":"Public","name":"autofd","owner":"sail-sg","isFork":false,"description":"Automatic Functional Differentiation in JAX","allTopics":["automatic-differentiation","jax","neural-operator","variational-calculus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":49,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-20T23:11:54.843Z"}},{"type":"Public","name":"mugs","owner":"sail-sg","isFork":false,"description":"A PyTorch implementation of Mugs proposed by our paper \"Mugs: A Multi-Granular Self-Supervised Learning Framework\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":81,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-13T13:51:09.006Z"}},{"type":"Public","name":"MMCBench","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":23,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T22:30:23.803Z"}},{"type":"Public","name":"D-TRAK","owner":"sail-sg","isFork":false,"description":"Intriguing Properties of Data Attribution on Diffusion Models (ICLR 2024)","allTopics":["attribution","interpretability","influence-functions","diffusion-models","ddpm","data-valuation","data-centric-ai","stable-diffusion","data-attribution"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":21,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T07:03:39.548Z"}}],"repositoryCount":60,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"sail-sg repositories"}