{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"metaformer","owner":"sail-sg","isFork":false,"description":"MetaFormer Baselines for Vision (TPAMI 2024)","allTopics":["transformer","metaformer","starrelu"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":370,"forksCount":21,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T15:32:57.849Z"}},{"type":"Public","name":"poolformer","owner":"sail-sg","isFork":false,"description":"PoolFormer: MetaFormer Is Actually What You Need for Vision (CVPR 2022 Oral)","allTopics":["transformer","image-classification","mlp","pooling","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":12,"starsCount":1255,"forksCount":116,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T15:19:56.549Z"}},{"type":"Public","name":"zero-bubble-pipeline-parallelism","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":12,"starsCount":199,"forksCount":2006,"license":"Other","participation":[33,8,9,20,39,37,43,22,39,27,70,70,37,45,50,33,50,79,127,128,102,38,24,61,6,10,2,1,0,1,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-27T03:11:40.146Z"}},{"type":"Public","name":"sailor-llm","owner":"sail-sg","isFork":false,"description":"Sailor: Open Language Models for South-East Asia","allTopics":["indonesia","thai","language-model","sea","vietnam","lao","malay"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":78,"forksCount":6,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T06:20:00.449Z"}},{"type":"Public","name":"sailcraft","owner":"sail-sg","isFork":false,"description":"Data Toolkit for Sailor Language Models","allTopics":["data-deduplication","data-cleaning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":65,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T08:37:25.218Z"}},{"type":"Public","name":"d4ft","owner":"sail-sg","isFork":false,"description":"A JAX library for Density Functional Theory.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":29,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-04T10:45:14.584Z"}},{"type":"Public","name":"finetune-fair-diffusion","owner":"sail-sg","isFork":false,"description":"Code of the paper: Finetuning Text-to-Image Diffusion Models for Fairness","allTopics":["text-to-image","fairness","diffusion-models","trustworthy-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":29,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T05:38:20.646Z"}},{"type":"Public","name":"MDT","owner":"sail-sg","isFork":false,"description":"Masked Diffusion Transformer is the SOTA for image synthesis. (ICCV 2023)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":12,"starsCount":464,"forksCount":32,"license":"Apache License 2.0","participation":[2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,5,0,0,3,0,0,0,0,0,2,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-23T18:53:04.939Z"}},{"type":"Public","name":"CLoT","owner":"sail-sg","isFork":false,"description":"CVPR'24, Official Codebase of our Paper: \"Let's Think Outside the Box: Exploring Leap-of-Thought in Large Language Models with Creative Humor Generation\".","allTopics":["association","multimodal-deep-learning","humor-generation","large-language-models","leap-of-thought"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":11,"starsCount":247,"forksCount":10,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-13T01:52:28.174Z"}},{"type":"Public","name":"AnyDoor","owner":"sail-sg","isFork":false,"description":"AnyDoor: Test-Time Backdoor Attacks on Multimodal Large Language Models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":34,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T04:59:17.025Z"}},{"type":"Public","name":"Adan","owner":"sail-sg","isFork":false,"description":"Adan: Adaptive Nesterov Momentum Algorithm for Faster Optimizing Deep Models","allTopics":["artificial-intelligence","resnet","vit","diffusion","mae","fairseq","cuda-programming","bert-model","gpt2","transformer-xl","timm","convnext","adan","dreamfusion","deep-learning","optimizer","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":728,"forksCount":63,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-04T14:06:15.005Z"}},{"type":"Public","name":"Agent-Smith","owner":"sail-sg","isFork":false,"description":"[ICML2024] Agent Smith: A Single Image Can Jailbreak One Million Multimodal LLM Agents Exponentially Fast","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":53,"forksCount":6,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-26T03:54:24.189Z"}},{"type":"Public","name":"GDPO","owner":"sail-sg","isFork":false,"description":"Graph Diffusion Policy Optimization","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":20,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-17T13:27:35.826Z"}},{"type":"Public","name":"lm-random-memory-access","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":6,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-12T07:12:31.614Z"}},{"type":"Public","name":"Consistent3D","owner":"sail-sg","isFork":false,"description":"The official PyTorch implementation of Consistent3D (CVPR 2024)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":55,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-02T03:59:42.100Z"}},{"type":"Public","name":"EditAnything","owner":"sail-sg","isFork":false,"description":"Edit anything in images powered by segment-anything, ControlNet, StableDiffusion, etc. (ACM MM)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":43,"starsCount":3181,"forksCount":175,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-29T14:37:00.394Z"}},{"type":"Public","name":"zero-bubble-megatron-deepspeed","owner":"sail-sg","isFork":true,"description":"Zero Bubble Pipeline Parallelism implemented on Megatron-Deepspeed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":2,"forksCount":2006,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T07:15:05.711Z"}},{"type":"Public","name":"autofd","owner":"sail-sg","isFork":false,"description":"Automatic Functional Differentiation in JAX","allTopics":["automatic-differentiation","jax","neural-operator","variational-calculus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":45,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-20T23:11:54.843Z"}},{"type":"Public","name":"mugs","owner":"sail-sg","isFork":false,"description":"A PyTorch implementation of Mugs proposed by our paper \"Mugs: A Multi-Granular Self-Supervised Learning Framework\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":81,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-13T13:51:09.006Z"}},{"type":"Public","name":"MMCBench","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":23,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T22:30:23.803Z"}},{"type":"Public","name":"Megatron-LLM","owner":"sail-sg","isFork":true,"description":"distributed trainer for LLMs","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":72,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-19T09:20:36.534Z"}},{"type":"Public","name":"sewformer","owner":"sail-sg","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":9,"starsCount":117,"forksCount":12,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-28T09:03:16.969Z"}},{"type":"Public","name":"jax_xc","owner":"sail-sg","isFork":false,"description":"Exchange correlation functionals translated from libxc to jax","allTopics":["python","density-functional-theory","libxc","jax"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":39,"forksCount":2,"license":"Mozilla Public License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T15:58:08.899Z"}},{"type":"Public","name":"lorahub","owner":"sail-sg","isFork":false,"description":"The official repository of paper \"LoraHub: Efficient Cross-Task Generalization via Dynamic LoRA Composition\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":528,"forksCount":34,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-30T15:18:34.754Z"}},{"type":"Public","name":"inceptionnext","owner":"sail-sg","isFork":false,"description":"InceptionNeXt: When Inception Meets ConvNeXt (CVPR 2024)","allTopics":["convolutional-neural-networks"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":13,"starsCount":202,"forksCount":15,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-20T01:07:59.543Z"}},{"type":"Public","name":"edp","owner":"sail-sg","isFork":false,"description":"[NeurIPS 2023] Efficient Diffusion Policy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":58,"forksCount":5,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-31T03:16:36.663Z"}},{"type":"Public","name":"ScaleLong","owner":"sail-sg","isFork":false,"description":"The official repository of paper \"ScaleLong: Towards More Stable Training of Diffusion Model via Scaling Network Long Skip Connection\" (NeurIPS 2023)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":47,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-23T01:54:49.074Z"}},{"type":"Public","name":"DiffMemorize","owner":"sail-sg","isFork":false,"description":"On Memorization in Diffusion Models","allTopics":["generative-model","memorization","diffusion-models"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":20,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-05T06:04:17.894Z"}},{"type":"Public","name":"numcc","owner":"sail-sg","isFork":false,"description":"NU-MCC: Multiview Compressive Coding with Neighborhood Decoder and Repulsive UDF","allTopics":["3d-reconstruction","single-view-reconstruction"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":11,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-28T06:17:49.129Z"}},{"type":"Public","name":"optim4rl","owner":"sail-sg","isFork":false,"description":"Optim4RL is a Jax framework of learning to optimize for reinforcement learning.","allTopics":["reinforcement-learning","optimization","optimizer","reinforcement-learning-algorithms","optimization-algorithms","meta-learning","jax","learning-to-learn","optimizers","meta-learning-algorithms","learning-to-optimize","meta-learning-algorithm"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":21,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-09T20:08:16.237Z"}}],"repositoryCount":47,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}