{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"Groma","owner":"FoundationVision","isFork":false,"description":"Grounded Multimodal Large Language Model with Localized Visual Tokenization","topicNames":["llama","multimodal","grounding","foundation-models","large-language-models","llm","mllm","vision-language-model","llama2"],"topicsNotShown":0,"allTopics":["llama","multimodal","grounding","foundation-models","large-language-models","llm","mllm","vision-language-model","llama2"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":384,"forksCount":50,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T13:31:20.383Z"}},{"type":"Public","name":"GLEE","owner":"FoundationVision","isFork":false,"description":"[CVPR2024 Highlight]GLEE: General Object Foundation Model for Images and Videos at Scale","topicNames":["tracking","open-world","object-detection","interactive-segmentation","video-object-segmentation","referring-expression-segmentation","referring-expression-comprehension","video-instance-segmentation","zero-shot-object-detection","referring-video-object-segmentation"],"topicsNotShown":5,"allTopics":["tracking","open-world","object-detection","interactive-segmentation","video-object-segmentation","referring-expression-segmentation","referring-expression-comprehension","video-instance-segmentation","zero-shot-object-detection","referring-video-object-segmentation","foundation-model","segment-anything","open-vocabulary-detection","open-vocabulary-segmentation","open-vocabulary-video-segmentation"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":21,"starsCount":930,"forksCount":74,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-08T15:11:16.544Z"}},{"type":"Public","name":"VAR","owner":"FoundationVision","isFork":false,"description":"[GPT beats diffusion🔥] [scaling laws in visual generation📈] Official impl. of \"Visual Autoregressive Modeling: Scalable Image Generation via Next-Scale Prediction\". An *ultra-simple, user-friendly yet state-of-the-art* codebase for autoregressive image generation!","topicNames":["transformers","generative-model","image-generation","auto-regressive-model","gpt","gpt-2","diffusion-models","autoregressive-models","vision-transformer","large-language-models"],"topicsNotShown":1,"allTopics":["transformers","generative-model","image-generation","auto-regressive-model","gpt","gpt-2","diffusion-models","autoregressive-models","vision-transformer","large-language-models","generative-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":3565,"forksCount":274,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-30T13:34:27.499Z"}},{"type":"Public","name":"GenerateU","owner":"FoundationVision","isFork":false,"description":"[CVPR2024] Generative Region-Language Pretraining for Open-Ended Object Detection","topicNames":["open-world","object-detection","multimodality","open-vocabulary","mllm","open-vocabulary-detection"],"topicsNotShown":0,"allTopics":["open-world","object-detection","multimodality","open-vocabulary","mllm","open-vocabulary-detection"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":99,"forksCount":5,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-25T02:24:16.947Z"}},{"type":"Public","name":"UniRef","owner":"FoundationVision","isFork":false,"description":"[ICCV2023] Segment Every Reference Object in Spatial and Temporal Spaces ","topicNames":["object-segmentation","unified-model"],"topicsNotShown":0,"allTopics":["object-segmentation","unified-model"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":227,"forksCount":12,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-10T04:34:32.219Z"}}],"repositoryCount":5,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}