{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"MotionLLM","owner":"IDEA-Research","isFork":false,"description":"[Arxiv-2024] MotionLLM: Understanding Human Behaviors from Human Motions and Videos","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":212,"forksCount":5,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8,4,2,2,1,0,0,0,0,0,0,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-08T07:45:34.268Z"}},{"type":"Public","name":"Grounded-SAM-2","owner":"IDEA-Research","isFork":false,"description":"Grounded SAM 2: Ground and Track Anything in Videos with Grounding DINO, Florence-2 and SAM 2","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":18,"starsCount":647,"forksCount":46,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,14,51,18,5,6,5],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-06T12:44:58.355Z"}},{"type":"Public","name":"Grounded-Segment-Anything","owner":"IDEA-Research","isFork":false,"description":"Grounded SAM: Marrying Grounding DINO with Segment Anything &amp; Stable Diffusion &amp; Recognize Anything - Automatically Detect , Segment and Generate Anything","allTopics":["speech","image-editing","caption","data-generation","3d-whole-body-pose-estimation","open-vocabulary-detection","open-vocabulary-segmentation","automatic-labeling-system"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":1,"issueCount":277,"starsCount":14698,"forksCount":1360,"license":"Apache License 2.0","participation":[1,0,0,0,1,1,0,0,0,1,5,0,2,5,0,2,0,0,2,2,1,0,0,0,3,1,3,0,0,0,2,1,0,0,0,2,2,0,0,0,0,0,0,0,0,0,2,0,0,0,2,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-05T06:07:32.279Z"}},{"type":"Public","name":"Motion-X","owner":"IDEA-Research","isFork":false,"description":"[NeurIPS 2023] Official implementation of the paper \"Motion-X: A Large-scale 3D Expressive Whole-body Human Motion Dataset\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":60,"starsCount":528,"forksCount":13,"license":"Other","participation":[0,0,0,0,3,16,37,5,0,7,0,4,0,0,3,2,0,6,2,2,0,1,0,0,0,0,0,0,0,0,0,3,1,0,0,0,0,0,0,5,0,0,0,0,0,0,0,0,0,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-01T13:12:40.310Z"}},{"type":"Public","name":"T-Rex","owner":"IDEA-Research","isFork":false,"description":"[ECCV2024] API code for T-Rex2: Towards Generic Object Detection via Text-Visual Prompt Synergy","allTopics":["interactive","object-detection","open-set","object-counting","text-prompt","visual-prompt"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":2139,"forksCount":124,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,13,0,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,10,9,2,0,2,0,0,0,1,0,0,2,0,0,3,0,0,0,0,0,1,0,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-29T02:16:03.094Z"}},{"type":"Public","name":"OSX","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"One-Stage 3D Whole-Body Mesh Recovery with Component Aware Transformer\"","allTopics":["human-pose-estimation","smpl-model","smplx","3d-body-recovery","whole-body-pose-estimation","cvpr2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":23,"starsCount":622,"forksCount":54,"license":"MIT License","participation":[0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-26T07:47:17.570Z"}},{"type":"Public","name":"TAPTR","owner":"IDEA-Research","isFork":false,"description":"[ECCV 2024] Official implementation of the paper \"TAPTR: Tracking Any Point with Transformers as Detection\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":180,"forksCount":10,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,13,6,3,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-18T03:09:26.906Z"}},{"type":"Public","name":"X-Pose","owner":"IDEA-Research","isFork":false,"description":"[ECCV 2024] Official implementation of the paper \"X-Pose: Detecting Any Keypoints\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":18,"starsCount":414,"forksCount":18,"license":"Other","participation":[0,0,0,0,6,2,0,4,3,0,0,2,0,0,0,0,0,0,0,4,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,7,2,0,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-16T15:22:44.069Z"}},{"type":"Public","name":"detrex","owner":"IDEA-Research","isFork":false,"description":"detrex is a research platform for DETR-based object detection, segmentation, pose estimation and other visual recognition tasks.","allTopics":["segmentation","pose-estimation","dino","state-of-the-art","deta","detr","deformable-detr","dab-detr","mask-dino","dn-detr","conditional-detr","h-detr","group-detr","anchor-detr","pytorch","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":65,"starsCount":1969,"forksCount":206,"license":"Apache License 2.0","participation":[0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-15T09:24:30.749Z"}},{"type":"Public","name":"GroundingDINO","owner":"IDEA-Research","isFork":false,"description":"[ECCV 2024] Official implementation of the paper \"Grounding DINO: Marrying DINO with Grounded Pre-Training for Open-Set Object Detection\"","allTopics":["open-world","object-detection","vision-language","vision-language-transformer","open-world-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":242,"starsCount":6209,"forksCount":650,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,3,1,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,1,0,0,1,1,0,0,0,0,1,0,1,0,3,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-12T08:52:02.313Z"}},{"type":"Public","name":"Grounding-DINO-1.5-API","owner":"IDEA-Research","isFork":false,"description":"API for Grounding DINO 1.5: IDEA Research's Most Capable Open-World Object Detection Model Series","allTopics":["open-world","object-detection","open-set","zero-shot-object-detection","foundation-model","open-vocabulary-detection","grounding-dino"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":24,"starsCount":701,"forksCount":21,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,25,3,1,2,1,0,0,0,0,0,0,1,1,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-09T07:04:58.767Z"}},{"type":"Public","name":"detrex-storage","owner":"IDEA-Research","isFork":false,"description":"","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-06T09:20:52.520Z"}},{"type":"Public","name":"DINO","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2023] Official implementation of the paper \"DINO: DETR with Improved DeNoising Anchor Boxes for End-to-End Object Detection\"","allTopics":["computer-vision","deep-learning","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":140,"starsCount":2155,"forksCount":234,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-31T13:56:21.232Z"}},{"type":"Public","name":"DreamWaltz","owner":"IDEA-Research","isFork":false,"description":"[NeurIPS 2023] Official implementation of the paper \"DreamWaltz: Make a Scene with Complex 3D Animatable Avatars\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":173,"forksCount":8,"license":"Other","participation":[0,0,0,0,2,1,0,0,0,0,0,0,0,0,0,0,0,2,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-23T07:37:56.449Z"}},{"type":"Public","name":"awesome-detection-transformer","owner":"IDEA-Research","isFork":false,"description":"Collect some papers about transformer for detection and segmentation. Awesome Detection Transformer for Computer Vision (CV)","allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":7,"starsCount":1260,"forksCount":111,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-04T09:42:46.257Z"}},{"type":"Public","name":"HumanTOMATO","owner":"IDEA-Research","isFork":false,"description":"[ICML 2024] 🍅HumanTOMATO: Text-aligned Whole-body Motion Generation","allTopics":["motion","generation","gpt","whole-body","smplx","motion-generation","whole-body-motion"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":267,"forksCount":8,"license":"Other","participation":[0,0,0,0,0,7,1,0,0,5,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,4,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-19T04:51:49.661Z"}},{"type":"Public","name":"TOSS","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2024] Official implementation of the paper \"Toss: High-quality text-guided novel view synthesis from a single image\"","allTopics":["open-world","3d-generation","novel-view-synthesis"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":12,"forksCount":1,"license":"Apache License 2.0","participation":[0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-05T20:25:37.167Z"}},{"type":"Public","name":"Stable-DINO","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"Detection Transformer with Stable Matching\"","allTopics":["transformer","object-detection","dino","detection-transformer","detrex"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":208,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-29T10:25:46.372Z"}},{"type":"Public","name":"deepdataspace","owner":"IDEA-Research","isFork":false,"description":"The Go-To Choice for CV Data Visualization, Annotation, and Model Analysis.","allTopics":["computer-vision","model-analysis","labeling-tool","dataset-visualization","intelligent-annotation","collaborative-annotation"],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":0,"issueCount":3,"starsCount":212,"forksCount":16,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-19T09:43:56.667Z"}},{"type":"Public","name":"IYFC","owner":"IDEA-Research","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-19T02:56:11.667Z"}},{"type":"Public","name":"OpenSeeD","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"A Simple Framework for Open-Vocabulary Segmentation and Detection\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":16,"starsCount":637,"forksCount":39,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,3,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-22T14:12:04.770Z"}},{"type":"Public","name":"DN-DETR","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2022 Oral] Official implementation of DN-DETR","allTopics":["object-detection","detr"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":34,"starsCount":535,"forksCount":61,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-20T07:06:23.532Z"}},{"type":"Public","name":"MaskDINO","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"Mask DINO: Towards A Unified Transformer-based Framework for Object Detection and Segmentation\"","allTopics":["object-detection","semantic-segmentation","instance-segmentation","panoptic-segmentation"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":52,"starsCount":1149,"forksCount":102,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-20T07:05:03.227Z"}},{"type":"Public","name":"DWPose","owner":"IDEA-Research","isFork":false,"description":"\"Effective Whole-body Pose Estimation with Two-stages Distillation\" (ICCV 2023, CV4Metaverse Workshop)","allTopics":["knowledge-distillation","pose-estimation","stable-diffusion-webui","controlnet"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":29,"starsCount":2154,"forksCount":141,"license":"Apache License 2.0","participation":[0,0,0,0,1,0,0,0,1,0,0,1,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T02:54:23.076Z"}},{"type":"Public","name":"HumanSD","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] The official implementation of paper \"HumanSD: A Native Skeleton-Guided Diffusion Model for Human Image Generation\"","allTopics":["deep-learning","image-generation","iccv","conditional-image-generation","iccv2023","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":271,"forksCount":18,"license":"Apache License 2.0","participation":[0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-24T08:18:16.437Z"}},{"type":"Public","name":"MP-Former","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper: MP-Former: Mask-Piloted Transformer for Image Segmentation","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":115,"forksCount":6,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-22T02:34:06.363Z"}},{"type":"Public","name":"Click-Pose","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"Neural Interactive Keypoint Detection\"","allTopics":["annotation-tool","pose-estimation","human-in-the-loop","iccv2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":68,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-12T08:29:50.105Z"}},{"type":"Public","name":"HumanArt","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] The official implementation of CVPR 2023 paper \"Human-Art: A Versatile Human-Centric Dataset Bridging Natural and Artificial Scenes\"","allTopics":["image-generation","human-pose-estimation","datasets","cvpr","pose-estimation","multi-scenario","multi-scene","cvpr2023"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":2,"starsCount":217,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-03T07:29:58.420Z"}},{"type":"Public","name":"3D-deformable-attention","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"DFA3D: 3D Deformable Attention For 2D-to-3D Feature Lifting\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":144,"forksCount":2,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-20T14:09:07.000Z"}},{"type":"Public","name":"ED-Pose","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2023] Official implementation of the paper \"Explicit Box Detection Unifies End-to-End Multi-Person Pose Estimation \"","allTopics":["end-to-end","multi-person-pose-estimation","iclr2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":152,"forksCount":10,"license":"Other","participation":[0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-20T02:07:21.728Z"}}],"repositoryCount":37,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"IDEA-Research repositories"}