{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"Grounding-DINO-1.5-API","owner":"IDEA-Research","isFork":false,"description":"API for Grounding DINO 1.5: IDEA Research's Most Capable Open-World Object Detection Model Series","allTopics":["open-world","object-detection","open-set","zero-shot-object-detection","foundation-model","open-vocabulary-detection","grounding-dino"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":11,"starsCount":480,"forksCount":16,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,13,1,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T02:31:25.767Z"}},{"type":"Public","name":"T-Rex","owner":"IDEA-Research","isFork":false,"description":"API for T-Rex2: Towards Generic Object Detection via Text-Visual Prompt Synergy","allTopics":["interactive","object-detection","open-set","object-counting","text-prompt","visual-prompt"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":1943,"forksCount":120,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,13,0,2,0,2,0,0,0,0,0,0,0,0,0,0,0,0,7,11,3,0,2,0,0,0,0,1,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-04T06:30:32.094Z"}},{"type":"Public","name":"MotionLLM","owner":"IDEA-Research","isFork":false,"description":"[Arxiv-2024] MotionLLM: Understanding Human Behaviors from Human Motions and Videos","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":126,"forksCount":1,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,5],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T00:09:55.268Z"}},{"type":"Public","name":"GroundingDINO","owner":"IDEA-Research","isFork":false,"description":"Official implementation of the paper \"Grounding DINO: Marrying DINO with Grounded Pre-Training for Open-Set Object Detection\"","allTopics":["open-world","vision-language","vision-language-transformer","open-world-detection","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":222,"starsCount":5302,"forksCount":559,"license":"Apache License 2.0","participation":[2,3,5,0,0,1,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,1,0,0,1,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,1,0,0,0,2,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-23T12:10:37.380Z"}},{"type":"Public","name":"HumanTOMATO","owner":"IDEA-Research","isFork":false,"description":"[ICML 2024] 🍅HumanTOMATO: Text-aligned Whole-body Motion Generation","allTopics":["motion","generation","gpt","whole-body","smplx","motion-generation","whole-body-motion"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":9,"starsCount":226,"forksCount":5,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,4,0,0,5,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-16T02:17:14.661Z"}},{"type":"Public","name":"DreamWaltz","owner":"IDEA-Research","isFork":false,"description":"[NeurIPS 2023] Official implementation of the paper \"DreamWaltz: Make a Scene with Complex 3D Animatable Avatars\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":163,"forksCount":6,"license":"Other","participation":[0,0,0,8,1,0,0,0,0,0,0,0,0,0,0,0,0,2,1,0,0,0,0,0,0,0,0,0,0,0,2,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-08T09:04:20.449Z"}},{"type":"Public","name":"TOSS","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2024] Official implementation of the paper \"Toss: High-quality text-guided novel view synthesis from a single image\"","allTopics":["open-world","3d-generation","novel-view-synthesis"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":11,"forksCount":1,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-05T20:25:37.167Z"}},{"type":"Public","name":"detrex","owner":"IDEA-Research","isFork":false,"description":"detrex is a research platform for DETR-based object detection, segmentation, pose estimation and other visual recognition tasks.","allTopics":["segmentation","pose-estimation","dino","state-of-the-art","deta","detr","deformable-detr","dab-detr","mask-dino","dn-detr","conditional-detr","h-detr","group-detr","anchor-detr","pytorch","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":56,"starsCount":1862,"forksCount":196,"license":"Apache License 2.0","participation":[9,0,0,3,1,4,2,2,0,1,2,1,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-01T01:12:39.213Z"}},{"type":"Public","name":"Stable-DINO","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"Detection Transformer with Stable Matching\"","allTopics":["transformer","object-detection","dino","detection-transformer","detrex"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":15,"starsCount":192,"forksCount":3,"license":"Apache License 2.0","participation":[6,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-29T10:25:46.372Z"}},{"type":"Public","name":"Motion-X","owner":"IDEA-Research","isFork":false,"description":"[NeurIPS 2023] Official implementation of the paper \"Motion-X: A Large-scale 3D Expressive Whole-body Human Motion Dataset\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":51,"starsCount":470,"forksCount":11,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-25T07:09:56.310Z"}},{"type":"Public","name":"DINO","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2023] Official implementation of the paper \"DINO: DETR with Improved DeNoising Anchor Boxes for End-to-End Object Detection\"","allTopics":["computer-vision","deep-learning","object-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":136,"starsCount":2036,"forksCount":228,"license":"Apache License 2.0","participation":[0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-07T01:59:52.232Z"}},{"type":"Public","name":"UniPose","owner":"IDEA-Research","isFork":false,"description":"Official implementation of the paper \"UniPose : Detecting Any Keypoints\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":9,"starsCount":247,"forksCount":10,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8,0,4,3,0,0,2,0,0,0,0,0,0,0,4,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-19T16:13:03.069Z"}},{"type":"Public","name":"OpenSeeD","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"A Simple Framework for Open-Vocabulary Segmentation and Detection\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":601,"forksCount":36,"license":"Apache License 2.0","participation":[0,0,0,0,0,3,1,0,0,0,10,0,0,0,0,0,0,0,0,3,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-22T14:12:04.770Z"}},{"type":"Public","name":"DN-DETR","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2022 Oral] Official implementation of DN-DETR","allTopics":["object-detection","detr"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":33,"starsCount":523,"forksCount":57,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-20T07:06:23.532Z"}},{"type":"Public","name":"MaskDINO","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"Mask DINO: Towards A Unified Transformer-based Framework for Object Detection and Segmentation\"","allTopics":["object-detection","semantic-segmentation","instance-segmentation","panoptic-segmentation"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":45,"starsCount":1067,"forksCount":95,"license":"Apache License 2.0","participation":[0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-20T07:05:03.227Z"}},{"type":"Public","name":"DWPose","owner":"IDEA-Research","isFork":false,"description":"\"Effective Whole-body Pose Estimation with Two-stages Distillation\" (ICCV 2023, CV4Metaverse Workshop)","allTopics":["knowledge-distillation","pose-estimation","stable-diffusion-webui","controlnet"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":22,"starsCount":1971,"forksCount":132,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,1,15,14,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,1,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T02:54:23.076Z"}},{"type":"Public","name":"HumanSD","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] The official implementation of paper \"HumanSD: A Native Skeleton-Guided Diffusion Model for Human Image Generation\"","allTopics":["deep-learning","image-generation","iccv","conditional-image-generation","iccv2023","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":7,"starsCount":254,"forksCount":18,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-24T08:18:16.437Z"}},{"type":"Public","name":"MP-Former","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper: MP-Former: Mask-Piloted Transformer for Image Segmentation","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":108,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-22T02:34:06.363Z"}},{"type":"Public","name":"OSX","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"One-Stage 3D Whole-Body Mesh Recovery with Component Aware Transformer\"","allTopics":["human-pose-estimation","smpl-model","smplx","3d-body-recovery","whole-body-pose-estimation","cvpr2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":16,"starsCount":587,"forksCount":49,"license":"MIT License","participation":[0,0,0,2,2,2,0,4,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-12T11:15:43.570Z"}},{"type":"Public","name":"Click-Pose","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"Neural Interactive Keypoint Detection\"","allTopics":["annotation-tool","pose-estimation","human-in-the-loop","iccv2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":62,"forksCount":2,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,15,0,5,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-12T08:29:50.105Z"}},{"type":"Public","name":"3D-deformable-attention","owner":"IDEA-Research","isFork":false,"description":"[ICCV 2023] Official implementation of the paper \"DFA3D: 3D Deformable Attention For 2D-to-3D Feature Lifting\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":138,"forksCount":2,"license":"Other","participation":[0,0,0,0,0,0,3,0,0,0,3,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-20T14:09:07.000Z"}},{"type":"Public","name":"ED-Pose","owner":"IDEA-Research","isFork":false,"description":"[ICLR 2023] Official implementation of the paper \"Explicit Box Detection Unifies End-to-End Multi-Person Pose Estimation \"","allTopics":["end-to-end","multi-person-pose-estimation","iclr2023"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":141,"forksCount":9,"license":"Other","participation":[0,0,0,0,0,0,0,0,3,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-20T02:07:21.728Z"}},{"type":"Public","name":"DiffHOI","owner":"IDEA-Research","isFork":false,"description":"Official implementation of the paper \"Boosting Human-Object Interaction Detection with Text-to-Image Diffusion Model\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":37,"forksCount":0,"license":"Other","participation":[0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-09T02:42:15.720Z"}},{"type":"Public","name":"DisCo-CLIP","owner":"IDEA-Research","isFork":false,"description":"Official PyTorch implementation of the paper \"DisCo-CLIP: A Distributed Contrastive Loss for Memory Efficient CLIP Training\".","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":39,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-02T07:46:29.818Z"}},{"type":"Public","name":"LipsFormer","owner":"IDEA-Research","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":31,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-07T12:45:05.924Z"}},{"type":"Public","name":"Lite-DETR","owner":"IDEA-Research","isFork":false,"description":"[CVPR 2023] Official implementation of the paper \"Lite DETR : An Interleaved Multi-Scale Encoder for Efficient DETR\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":11,"starsCount":176,"forksCount":14,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-01T07:11:44.637Z"}},{"type":"Public","name":"hana","owner":"IDEA-Research","isFork":false,"description":"Implementation and checkpoints of Imagen, Google's text-to-image synthesis neural network, in Pytorch","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":17,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-12-22T14:20:12.205Z"}}],"repositoryCount":27,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}