{"payload":{"pageCount":3,"repositories":[{"type":"Public","name":"zero-bubble-pipeline-parallelism","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":18,"starsCount":237,"forksCount":2168,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-07T07:42:01.164Z"}},{"type":"Public","name":"optim4rl","owner":"sail-sg","isFork":false,"description":"Optim4RL is a Jax framework of learning to optimize for reinforcement learning.","allTopics":["reinforcement-learning","optimization","optimizer","reinforcement-learning-algorithms","optimization-algorithms","meta-learning","jax","learning-to-learn","optimizers","meta-learning-algorithms","learning-to-optimize","meta-learning-algorithm"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":21,"forksCount":1,"license":"Apache License 2.0","participation":[1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-06T04:57:03.237Z"}},{"type":"Public","name":"scaling-with-vocab","owner":"sail-sg","isFork":false,"description":"📈 Scaling Laws with Vocabulary: Larger Models Deserve Larger Vocabularies","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":40,"forksCount":2,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,3,4],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-05T05:13:56.967Z"}},{"type":"Public","name":"I-FSJ","owner":"sail-sg","isFork":false,"description":"Improved Few-Shot Jailbreaking Can Circumvent Aligned Language Models and Their Defenses (NextGenAISafety @ ICML 2024)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":32,"forksCount":3,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-03T10:35:09.643Z"}},{"type":"Public","name":"dice","owner":"sail-sg","isFork":false,"description":"Official implementation of Bootstrapping Language Models via DPO Implicit Rewards","allTopics":["alignment","preference-learning","large-language-models","rlhf"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":29,"forksCount":1,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,0,0,2,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-29T03:55:13.618Z"}},{"type":"Public","name":"regmix","owner":"sail-sg","isFork":false,"description":"🧬 RegMix: Data Mixture as Regression for Language Model Pre-training ","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":56,"forksCount":2,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,8,11,1,4,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-25T08:36:33.114Z"}},{"type":"Public","name":"lorahub","owner":"sail-sg","isFork":false,"description":"[COLM 2024] LoraHub: Efficient Cross-Task Generalization via Dynamic LoRA Composition","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":554,"forksCount":35,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-22T00:38:28.754Z"}},{"type":"Public","name":"envpool","owner":"sail-sg","isFork":false,"description":"C++-based high-performance parallel environment execution engine (vectorized env) for general RL environments.","allTopics":["robotics","gym","high-performance-computing","cpp17","box2d","vizdoom","parallel-processing","threadpool","pybind11","atari-games","mujoco","lock-free-queue","dm-control","reinforcement-learning-environments","dm-env","reinforcement-learning"],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":9,"issueCount":56,"starsCount":1057,"forksCount":98,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-16T09:21:10.123Z"}},{"type":"Public","name":"sailor-llm","owner":"sail-sg","isFork":false,"description":"⚓️ Sailor: Open Language Models for South-East Asia","allTopics":["indonesia","thai","language-model","sea","vietnam","lao","malay"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":87,"forksCount":7,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T02:59:30.449Z"}},{"type":"Public","name":"sailcraft","owner":"sail-sg","isFork":false,"description":"🚢 Data Toolkit for Sailor Language Models","allTopics":["data-deduplication","data-cleaning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":70,"forksCount":7,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,9,0,0,1,0,0,0,0,0,0,1,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T02:58:47.218Z"}},{"type":"Public","name":"Adan","owner":"sail-sg","isFork":false,"description":"Adan: Adaptive Nesterov Momentum Algorithm for Faster Optimizing Deep Models","allTopics":["deep-learning","optimizer","pytorch","artificial-intelligence","moe","resnet","vit","diffusion","mae","fairseq","cuda-programming","bert-model","gpt2","transformer-xl","timm","convnext","adan","llms","dreamfusion","llm-training"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":743,"forksCount":63,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-02T18:26:36.005Z"}},{"type":"Public archive","name":"zero-bubble-megatron-deepspeed","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism implemented on Megatron-Deepspeed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":2168,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-27T08:51:04.973Z"}},{"type":"Public","name":"CPO","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":19,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-14T04:35:07.252Z"}},{"type":"Public","name":"sailcompass","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-13T13:24:47.321Z"}},{"type":"Public","name":"metaformer","owner":"sail-sg","isFork":false,"description":"MetaFormer Baselines for Vision (TPAMI 2024)","allTopics":["transformer","metaformer","starrelu"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":386,"forksCount":21,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T15:32:57.849Z"}},{"type":"Public","name":"poolformer","owner":"sail-sg","isFork":false,"description":"PoolFormer: MetaFormer Is Actually What You Need for Vision (CVPR 2022 Oral)","allTopics":["transformer","image-classification","mlp","pooling","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":12,"starsCount":1270,"forksCount":116,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T15:19:56.549Z"}},{"type":"Public","name":"sdft","owner":"sail-sg","isFork":false,"description":"[ACL 2024] The official codebase for the paper \"Self-Distillation Bridges Distribution Gap in Language Model Fine-tuning\".","allTopics":["language-model","self-distillation","supervised-finetuning"],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":1,"starsCount":65,"forksCount":4,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-28T07:06:03.365Z"}},{"type":"Public","name":"d4ft","owner":"sail-sg","isFork":false,"description":"A JAX library for Density Functional Theory.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":37,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-04T10:45:14.584Z"}},{"type":"Public","name":"finetune-fair-diffusion","owner":"sail-sg","isFork":false,"description":"Code of the paper: Finetuning Text-to-Image Diffusion Models for Fairness","allTopics":["text-to-image","fairness","diffusion-models","trustworthy-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":35,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T05:38:20.646Z"}},{"type":"Public","name":"MDT","owner":"sail-sg","isFork":false,"description":"Masked Diffusion Transformer is the SOTA for image synthesis. (ICCV 2023)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":14,"starsCount":491,"forksCount":35,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-23T18:53:04.939Z"}},{"type":"Public","name":"CLoT","owner":"sail-sg","isFork":false,"description":"CVPR'24, Official Codebase of our Paper: \"Let's Think Outside the Box: Exploring Leap-of-Thought in Large Language Models with Creative Humor Generation\".","allTopics":["association","multimodal-deep-learning","humor-generation","large-language-models","leap-of-thought"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":13,"starsCount":286,"forksCount":11,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-13T01:52:28.174Z"}},{"type":"Public","name":"AnyDoor","owner":"sail-sg","isFork":false,"description":"AnyDoor: Test-Time Backdoor Attacks on Multimodal Large Language Models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":35,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T04:59:17.025Z"}},{"type":"Public","name":"InfNeRF","owner":"sail-sg","isFork":false,"description":"InfNeRF: Towards Infinite Scale NeRF Rendering with O(log n) Space Complexity","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-04T03:17:00.830Z"}},{"type":"Public","name":"Agent-Smith","owner":"sail-sg","isFork":false,"description":"[ICML2024] Agent Smith: A Single Image Can Jailbreak One Million Multimodal LLM Agents Exponentially Fast","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":65,"forksCount":9,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-26T03:54:24.189Z"}},{"type":"Public","name":"GDPO","owner":"sail-sg","isFork":false,"description":"Graph Diffusion Policy Optimization","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":21,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-17T13:27:35.826Z"}},{"type":"Public","name":"lm-random-memory-access","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-12T07:12:31.614Z"}},{"type":"Public","name":"Consistent3D","owner":"sail-sg","isFork":false,"description":"The official PyTorch implementation of Consistent3D (CVPR 2024)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":63,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-02T03:59:42.100Z"}},{"type":"Public","name":"EditAnything","owner":"sail-sg","isFork":false,"description":"Edit anything in images powered by segment-anything, ControlNet, StableDiffusion, etc. (ACM MM)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":43,"starsCount":3253,"forksCount":186,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-29T14:37:00.394Z"}},{"type":"Public","name":"autofd","owner":"sail-sg","isFork":false,"description":"Automatic Functional Differentiation in JAX","allTopics":["automatic-differentiation","jax","neural-operator","variational-calculus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":50,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-20T23:11:54.843Z"}},{"type":"Public","name":"mugs","owner":"sail-sg","isFork":false,"description":"A PyTorch implementation of Mugs proposed by our paper \"Mugs: A Multi-Granular Self-Supervised Learning Framework\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":81,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-13T13:51:09.006Z"}}],"repositoryCount":61,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"sail-sg repositories"}