{ "_id": "621ffdc136468d709f17a32e", "id": "dandelin/vilt-b32-finetuned-vqa", "private": false, "pipeline_tag": "visual-question-answering", "library_name": "transformers", "tags": [ "transformers", "pytorch", "vilt", "visual-question-answering", "arxiv:2102.03334", "license:apache-2.0", "endpoints_compatible", "region:us" ], "downloads": 1182512, "likes": 407, "modelId": "dandelin/vilt-b32-finetuned-vqa", "author": "dandelin", "sha": "d0a1f6ab88522427a7ae76ceb6e1e1e7b68a1d08", "lastModified": "2022-08-02T13:03:04.000Z", "gated": false, "disabled": false, "widgetData": [ { "text": "What's the animal doing?", "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg" }, { "text": "What is on top of the building?", "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg" } ], "model-index": null, "config": { "architectures": [ "ViltForVisualQuestionAnswering" ], "model_type": "vilt", "tokenizer_config": { "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]" } }, "cardData": { "tags": [ "visual-question-answering" ], "license": "apache-2.0", "widget": [ { "text": "What's the animal doing?", "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg" }, { "text": "What is on top of the building?", "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg" } ] }, "transformersInfo": { "auto_model": "ViltForVisualQuestionAnswering", "processor": "AutoProcessor" }, "siblings": [ { "rfilename": ".gitattributes" }, { "rfilename": "README.md" }, { "rfilename": "config.json" }, { "rfilename": "preprocessor_config.json" }, { "rfilename": "pytorch_model.bin" }, { "rfilename": "special_tokens_map.json" }, { "rfilename": "tokenizer.json" }, { "rfilename": "tokenizer_config.json" }, { "rfilename": "vocab.txt" } ], "spaces": [ "microsoft/HuggingGPT", "gunship999/SexyImages", "Yntec/ToyWorld", "llamameta/flux-pro-uncensored", "Nymbo/Compare-6", "Yntec/PrintingPress", "Uthar/SexyReality", "nielsr/comparing-VQA-models", "llamameta/fluxproV2", "Yntec/ToyWorldXL", "phenixrhyder/NSFW-ToyWorld", "Yntec/blitz_diffusion", "nielsr/vilt-vqa", "ethanchern/Anole", "John6666/Diffusion80XX4sg", "John6666/PrintingPress4", "llamameta/fast-sd3.5-large", "Yntec/Image-Models-Test-April-2024", "DemiPoto/TestDifs", "Abinivesh/Multi-models-prompt-to-image-generation", "Yntec/Image-Models-Test-2024", "martynka/TasiaExperiment", "Yntec/Image-Models-Test", "yergyerg/ImgGenClone", "John6666/hfd_test_nostopbutton", "Yntec/Image-Models-Test-May-2024", "taesiri/HuggingGPT-Lite", "Nymbo/Diffusion80XX4sg", "Yntec/Image-Models-Test-September-2024", "DemiPoto/testSortModels", "Yntec/MiniToyWorld", "kaleidoskop-hug/PrintingPress", "Madhuri/vqa_audiobot", "ixxan/cross-lingual-vqa", "John6666/ToyWorld4", "John6666/Diffusion80XX4g", "SAITAN666/StableDiffusion35Large-Image-Models-Test-November-2024", "NativeAngels/HuggingfaceDiffusion", "Yntec/Image-Models-Test-December-2024", "huggingfacejs/doc-vis-qa", "John6666/Diffusion80XX4", "K00B404/HuggingfaceDiffusion_custom", "John6666/blitz_diffusion4", "John6666/blitz_diffusion_builtin", "NativeAngels/Compare-6", "K00B404/SimpleBrothel", "Babyloncoder/chat-with-an-image", "Yntec/Image-Models-Test-July-2024", "Blane187/multi-diffusion", "OpenXAIProject/pnpxai-image-classification", "Uthar/LewdExperiments", "Uthar/BodyPaint", "Uthar/HighFashion", "Yntec/open-craiyon", "BarBar288/Chatbot", "hayas-tohoku-workshop-2023/comparing-VQA-models", "dreamdrop-art/000555111", "SeyedAli/Persian-Visual-Question-Answering-1", "sathvikparasa20/vqa-vitgpt", "NativeAngels/ToyWorld", "Uthar/Harvester", "Yntec/Image-Models-Test-January-2025", "Yeeezus/SexyImages", "John6666/MiniToyWorld", "ccarr0807/HuggingGPT", "theholycityweb/HuggingGPT", "gtx4010661/dandelin-vilt-b32-finetuned-vqa", "Alfasign/HuggingGPT-Lite", "roontoon/Demo-TTI-dandelin-vilt-b32-finetuned-vqa", "nilaymodi/dandelin-vilt-b32-finetuned-vqa", "saurshaz/HuggingGPT", "Akoloskov/image-recon", "optowo/dandelin-vilt-b32-finetuned-vqa", "Nikhil0987/omm", "wendys-llc/comparing-VQA-models", "SilvusTV/Test", "roshithindia/imageQuestionAnswering", "mahitha11/vqa-vitgpt", "TotoB12/dandelin-vilt-b32-finetuned-vqa", "NativeAngels/blitz_diffusion", "NativeAngels/PrintingPress4", "NativeAngels/PrintingPress", "Uthar/HRGiger", "romadanskiy/open-source-models-hg", "dehua68/ToyWorld", "tushar888/Zeinural.ai", "JarvisOnSolana/Jarvis", "codelion/sentinel", "Yntec/Image-Models-Test-February-2025", "MrRokot/GENFLUX", "Hadiil/home23", "BarBar288/AI_Tools", "burman-ai/Printing-Press", "Yntec/Image-Models-Test-March-2025", "chrisW6825/HuggingGPT", "Shenziqian/HuggingGPT", "hema1/Text-Visual-QA", "lokutus/HuggingGPT", "mimiqiao/HuggingGPT", "tsgbalakarthik/HuggingGPT" ], "createdAt": "2022-03-02T23:29:05.000Z", "inference": "warm", "usedStorage": 940815323 }