{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"Grounding-DINO-1.5-API","owner":"IDEA-Research","isFork":false,"description":"API for Grounding DINO 1.5: IDEA Research's Most Capable Open-World Object Detection Model Series","allTopics":["open-world","object-detection","open-set","zero-shot-object-detection","foundation-model","open-vocabulary-detection","grounding-dino"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":11,"starsCount":481,"forksCount":16,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T02:31:25.767Z"}},{"type":"Public","name":"T-Rex","owner":"IDEA-Research","isFork":false,"description":"API for T-Rex2: Towards Generic Object Detection via Text-Visual Prompt Synergy","allTopics":["interactive","object-detection","open-set","object-counting","text-prompt","visual-prompt"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":1943,"forksCount":120,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,13,0,2,0,2,0,0,0,0,0,0,0,0,0,0,0,0,7,11,3,0,2,0,0,0,0,1,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-04T06:30:32.094Z"}},{"type":"Public","name":"MotionLLM","owner":"IDEA-Research","isFork":false,"description":"[Arxiv-2024] MotionLLM: Understanding Human Behaviors from Human Motions and Videos","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":127,"forksCount":1,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,5],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T00:09:55.268Z"}},{"type":"Public","name":"Grounded-Segment-Anything","owner":"IDEA-Research","isFork":false,"description":"Grounded SAM: Marrying Grounding DINO with Segment Anything &amp; Stable Diffusion &amp; Recognize Anything - Automatically Detect , Segment and Generate Anything","allTopics":["speech","image-editing","caption","data-generation","3d-whole-body-pose-estimation","open-vocabulary-detection","open-vocabulary-segmentation","automatic-labeling-system"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":1,"issueCount":269,"starsCount":13859,"forksCount":1277,"license":"Apache License 2.0","participation":[7,10,6,2,2,2,2,0,0,0,0,1,1,1,0,0,0,0,2,0,0,0,1,3,2,0,5,2,1,1,0,1,1,3,0,0,0,2,2,1,2,0,0,2,1,0,0,0,0,4,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-23T12:11:52.408Z"}},{"type":"Public","name":"GroundingDINO","owner":"IDEA-Research","isFork":false,"description":"Official implementation of the paper \"Grounding DINO: Marrying DINO with Grounded Pre-Training for Open-Set Object Detection\"","allTopics":["open-world","vision-language","vision-language-transformer","open-world-detection","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":222,"starsCount":5303,"forksCount":559,"license":"Apache License 2.0","participation":[2,3,5,0,0,1,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,1,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,1,0,0,0,2,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-23T12:10:37.380Z"}},{"type":"Public","name":"HumanTOMATO","owner":"IDEA-Research","isFork":false,"description":"[ICML 2024] 🍅HumanTOMATO: Text-aligned Whole-body Motion Generation","allTopics":["motion","generation","gpt","whole-body","smplx","motion-generation","whole-body-motion"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":9,"starsCount":226,"forksCount":5,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,4,0,0,5,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-16T02:17:14.661Z"}},{"type":"Public","name":"DreamWaltz","owner":"IDEA-Research","isFork":false,"description":"[NeurIPS 2023] Official implementation of the paper \"DreamWaltz: Make a Scene with Complex 3D Animatable Avatars\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":163,"forksCount":6,"license":"Other","participation":[0,0,0,8,1,0,0,0,0,0,0,0,0,0,0,0,0,2,1,0,0,0,0,0,0,0,0,0,0,0,2,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-08T09:04:20.449Z"}},{"type":"Public","name":"TOSS","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2024] Official implementation of the paper \"Toss: High-quality text-guided novel view synthesis from a single image\"","allTopics":["open-world","3d-generation","novel-view-synthesis"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":11,"forksCount":1,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-05T20:25:37.167Z"}},{"type":"Public","name":"detrex","owner":"IDEA-Research","isFork":false,"description":"detrex is a research platform for DETR-based object detection, segmentation, pose estimation and other visual recognition tasks.","allTopics":["segmentation","pose-estimation","dino","state-of-the-art","deta","detr","deformable-detr","dab-detr","mask-dino","dn-detr","conditional-detr","h-detr","group-detr","anchor-detr","pytorch","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":56,"starsCount":1862,"forksCount":196,"license":"Apache License 2.0","participation":[9,0,0,3,1,4,2,2,0,1,2,1,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-01T01:12:39.213Z"}},{"type":"Public","name":"Stable-DINO","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"Detection Transformer with Stable Matching\"","allTopics":["transformer","object-detection","dino","detection-transformer","detrex"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":15,"starsCount":192,"forksCount":3,"license":"Apache License 2.0","participation":[6,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-29T10:25:46.372Z"}},{"type":"Public","name":"Motion-X","owner":"IDEA-Research","isFork":false,"description":"[NeurIPS 2023] Official implementation of the paper \"Motion-X: A Large-scale 3D Expressive Whole-body Human Motion Dataset\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":51,"starsCount":470,"forksCount":11,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-25T07:09:56.310Z"}},{"type":"Public","name":"deepdataspace","owner":"IDEA-Research","isFork":false,"description":"The Go-To Choice for CV Data Visualization, Annotation, and Model Analysis.","allTopics":["computer-vision","model-analysis","labeling-tool","dataset-visualization","intelligent-annotation","collaborative-annotation"],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":0,"issueCount":2,"starsCount":200,"forksCount":14,"license":"Apache License 2.0","participation":[33,18,23,22,43,44,20,3,4,0,3,11,6,6,16,17,0,0,0,0,0,0,0,0,0,0,15,0,1,10,4,0,0,7,6,0,1,14,2,6,0,15,0,12,0,4,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-19T09:43:56.667Z"}},{"type":"Public","name":"DINO","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2023] Official implementation of the paper \"DINO: DETR with Improved DeNoising Anchor Boxes for End-to-End Object Detection\"","allTopics":["computer-vision","deep-learning","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":136,"starsCount":2036,"forksCount":228,"license":"Apache License 2.0","participation":[0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-07T01:59:52.232Z"}},{"type":"Public","name":"awesome-detection-transformer","owner":"IDEA-Research","isFork":false,"description":"Collect some papers about transformer for detection and segmentation. Awesome Detection Transformer for Computer Vision (CV)","allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":6,"starsCount":1202,"forksCount":109,"license":null,"participation":[0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-29T03:18:27.359Z"}},{"type":"Public","name":"UniPose","owner":"IDEA-Research","isFork":false,"description":"Official implementation of the paper \"UniPose : Detecting Any Keypoints\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":9,"starsCount":247,"forksCount":10,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-19T16:13:03.069Z"}},{"type":"Public","name":"IYFC","owner":"IDEA-Research","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-19T02:56:11.667Z"}},{"type":"Public","name":"OpenSeeD","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"A Simple Framework for Open-Vocabulary Segmentation and Detection\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":601,"forksCount":36,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-22T14:12:04.770Z"}},{"type":"Public","name":"DN-DETR","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2022 Oral] Official implementation of DN-DETR","allTopics":["object-detection","detr"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":33,"starsCount":523,"forksCount":57,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-20T07:06:23.532Z"}},{"type":"Public","name":"MaskDINO","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"Mask DINO: Towards A Unified Transformer-based Framework for Object Detection and Segmentation\"","allTopics":["object-detection","semantic-segmentation","instance-segmentation","panoptic-segmentation"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":45,"starsCount":1067,"forksCount":95,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-20T07:05:03.227Z"}},{"type":"Public","name":"detrex-storage","owner":"IDEA-Research","isFork":false,"description":"","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":0,"license":"Apache License 2.0","participation":[2,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-15T18:42:28.520Z"}},{"type":"Public","name":"DWPose","owner":"IDEA-Research","isFork":false,"description":"\"Effective Whole-body Pose Estimation with Two-stages Distillation\" (ICCV 2023, CV4Metaverse Workshop)","allTopics":["knowledge-distillation","pose-estimation","stable-diffusion-webui","controlnet"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":22,"starsCount":1971,"forksCount":132,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,1,15,14,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,1,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T02:54:23.076Z"}},{"type":"Public","name":"HumanSD","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] The official implementation of paper \"HumanSD: A Native Skeleton-Guided Diffusion Model for Human Image Generation\"","allTopics":["deep-learning","image-generation","iccv","conditional-image-generation","iccv2023","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":7,"starsCount":254,"forksCount":18,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-24T08:18:16.437Z"}},{"type":"Public","name":"MP-Former","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper: MP-Former: Mask-Piloted Transformer for Image Segmentation","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":108,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-22T02:34:06.363Z"}},{"type":"Public","name":"OSX","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"One-Stage 3D Whole-Body Mesh Recovery with Component Aware Transformer\"","allTopics":["human-pose-estimation","smpl-model","smplx","3d-body-recovery","whole-body-pose-estimation","cvpr2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":587,"forksCount":49,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-12T11:15:43.570Z"}},{"type":"Public","name":"Click-Pose","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"Neural Interactive Keypoint Detection\"","allTopics":["annotation-tool","pose-estimation","human-in-the-loop","iccv2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":62,"forksCount":2,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-12T08:29:50.105Z"}},{"type":"Public","name":"HumanArt","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] The official implementation of CVPR 2023 paper \"Human-Art: A Versatile Human-Centric Dataset Bridging Natural and Artificial Scenes\"","allTopics":["image-generation","human-pose-estimation","datasets","cvpr","pose-estimation","multi-scenario","multi-scene","cvpr2023"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":1,"starsCount":201,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-03T07:29:58.420Z"}},{"type":"Public","name":"3D-deformable-attention","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"DFA3D: 3D Deformable Attention For 2D-to-3D Feature Lifting\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":138,"forksCount":2,"license":"Other","participation":[0,0,0,0,0,0,3,0,0,0,3,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-20T14:09:07.000Z"}},{"type":"Public","name":"ED-Pose","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2023] Official implementation of the paper \"Explicit Box Detection Unifies End-to-End Multi-Person Pose Estimation \"","allTopics":["end-to-end","multi-person-pose-estimation","iclr2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":141,"forksCount":9,"license":"Other","participation":[0,0,0,0,0,0,0,0,3,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-20T02:07:21.728Z"}},{"type":"Public","name":"DiffHOI","owner":"IDEA-Research","isFork":false,"description":"Official implementation of the paper \"Boosting Human-Object Interaction Detection with Text-to-Image Diffusion Model\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":37,"forksCount":0,"license":"Other","participation":[0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-09T02:42:15.720Z"}},{"type":"Public","name":"DisCo-CLIP","owner":"IDEA-Research","isFork":false,"description":"Official PyTorch implementation of the paper \"DisCo-CLIP: A Distributed Contrastive Loss for Memory Efficient CLIP Training\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":39,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-02T07:46:29.818Z"}}],"repositoryCount":35,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}