← Back to index
dandelin/vilt-b32-finetuned-vqa
Inference API
Inference API (serverless) is disabled for an unknown reason. Please open a Discussion in the Community tab.
			{
  "_id": "621ffdc136468d709f17a32e",
  "id": "dandelin/vilt-b32-finetuned-vqa",
  "private": false,
  "pipeline_tag": "visual-question-answering",
  "library_name": "transformers",
  "tags": [
    "transformers",
    "pytorch",
    "vilt",
    "visual-question-answering",
    "arxiv:2102.03334",
    "license:apache-2.0",
    "endpoints_compatible",
    "region:us"
  ],
  "downloads": 1182512,
  "likes": 407,
  "modelId": "dandelin/vilt-b32-finetuned-vqa",
  "author": "dandelin",
  "sha": "d0a1f6ab88522427a7ae76ceb6e1e1e7b68a1d08",
  "lastModified": "2022-08-02T13:03:04.000Z",
  "gated": false,
  "disabled": false,
  "widgetData": [
    {
      "text": "What's the animal doing?",
      "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg"
    },
    {
      "text": "What is on top of the building?",
      "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg"
    }
  ],
  "model-index": null,
  "config": {
    "architectures": [
      "ViltForVisualQuestionAnswering"
    ],
    "model_type": "vilt",
    "tokenizer_config": {
      "unk_token": "[UNK]",
      "sep_token": "[SEP]",
      "pad_token": "[PAD]",
      "cls_token": "[CLS]",
      "mask_token": "[MASK]"
    }
  },
  "cardData": {
    "tags": [
      "visual-question-answering"
    ],
    "license": "apache-2.0",
    "widget": [
      {
        "text": "What's the animal doing?",
        "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg"
      },
      {
        "text": "What is on top of the building?",
        "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg"
      }
    ]
  },
  "transformersInfo": {
    "auto_model": "ViltForVisualQuestionAnswering",
    "processor": "AutoProcessor"
  },
  "siblings": [
    {
      "rfilename": ".gitattributes"
    },
    {
      "rfilename": "README.md"
    },
    {
      "rfilename": "config.json"
    },
    {
      "rfilename": "preprocessor_config.json"
    },
    {
      "rfilename": "pytorch_model.bin"
    },
    {
      "rfilename": "special_tokens_map.json"
    },
    {
      "rfilename": "tokenizer.json"
    },
    {
      "rfilename": "tokenizer_config.json"
    },
    {
      "rfilename": "vocab.txt"
    }
  ],
  "spaces": [
    "microsoft/HuggingGPT",
    "gunship999/SexyImages",
    "Yntec/ToyWorld",
    "llamameta/flux-pro-uncensored",
    "Nymbo/Compare-6",
    "Yntec/PrintingPress",
    "Uthar/SexyReality",
    "nielsr/comparing-VQA-models",
    "llamameta/fluxproV2",
    "Yntec/ToyWorldXL",
    "phenixrhyder/NSFW-ToyWorld",
    "Yntec/blitz_diffusion",
    "nielsr/vilt-vqa",
    "ethanchern/Anole",
    "John6666/Diffusion80XX4sg",
    "John6666/PrintingPress4",
    "llamameta/fast-sd3.5-large",
    "Yntec/Image-Models-Test-April-2024",
    "DemiPoto/TestDifs",
    "Abinivesh/Multi-models-prompt-to-image-generation",
    "Yntec/Image-Models-Test-2024",
    "martynka/TasiaExperiment",
    "Yntec/Image-Models-Test",
    "yergyerg/ImgGenClone",
    "John6666/hfd_test_nostopbutton",
    "Yntec/Image-Models-Test-May-2024",
    "taesiri/HuggingGPT-Lite",
    "Nymbo/Diffusion80XX4sg",
    "Yntec/Image-Models-Test-September-2024",
    "DemiPoto/testSortModels",
    "Yntec/MiniToyWorld",
    "kaleidoskop-hug/PrintingPress",
    "Madhuri/vqa_audiobot",
    "ixxan/cross-lingual-vqa",
    "John6666/ToyWorld4",
    "John6666/Diffusion80XX4g",
    "SAITAN666/StableDiffusion35Large-Image-Models-Test-November-2024",
    "NativeAngels/HuggingfaceDiffusion",
    "Yntec/Image-Models-Test-December-2024",
    "huggingfacejs/doc-vis-qa",
    "John6666/Diffusion80XX4",
    "K00B404/HuggingfaceDiffusion_custom",
    "John6666/blitz_diffusion4",
    "John6666/blitz_diffusion_builtin",
    "NativeAngels/Compare-6",
    "K00B404/SimpleBrothel",
    "Babyloncoder/chat-with-an-image",
    "Yntec/Image-Models-Test-July-2024",
    "Blane187/multi-diffusion",
    "OpenXAIProject/pnpxai-image-classification",
    "Uthar/LewdExperiments",
    "Uthar/BodyPaint",
    "Uthar/HighFashion",
    "Yntec/open-craiyon",
    "BarBar288/Chatbot",
    "hayas-tohoku-workshop-2023/comparing-VQA-models",
    "dreamdrop-art/000555111",
    "SeyedAli/Persian-Visual-Question-Answering-1",
    "sathvikparasa20/vqa-vitgpt",
    "NativeAngels/ToyWorld",
    "Uthar/Harvester",
    "Yntec/Image-Models-Test-January-2025",
    "Yeeezus/SexyImages",
    "John6666/MiniToyWorld",
    "ccarr0807/HuggingGPT",
    "theholycityweb/HuggingGPT",
    "gtx4010661/dandelin-vilt-b32-finetuned-vqa",
    "Alfasign/HuggingGPT-Lite",
    "roontoon/Demo-TTI-dandelin-vilt-b32-finetuned-vqa",
    "nilaymodi/dandelin-vilt-b32-finetuned-vqa",
    "saurshaz/HuggingGPT",
    "Akoloskov/image-recon",
    "optowo/dandelin-vilt-b32-finetuned-vqa",
    "Nikhil0987/omm",
    "wendys-llc/comparing-VQA-models",
    "SilvusTV/Test",
    "roshithindia/imageQuestionAnswering",
    "mahitha11/vqa-vitgpt",
    "TotoB12/dandelin-vilt-b32-finetuned-vqa",
    "NativeAngels/blitz_diffusion",
    "NativeAngels/PrintingPress4",
    "NativeAngels/PrintingPress",
    "Uthar/HRGiger",
    "romadanskiy/open-source-models-hg",
    "dehua68/ToyWorld",
    "tushar888/Zeinural.ai",
    "JarvisOnSolana/Jarvis",
    "codelion/sentinel",
    "Yntec/Image-Models-Test-February-2025",
    "MrRokot/GENFLUX",
    "Hadiil/home23",
    "BarBar288/AI_Tools",
    "burman-ai/Printing-Press",
    "Yntec/Image-Models-Test-March-2025",
    "chrisW6825/HuggingGPT",
    "Shenziqian/HuggingGPT",
    "hema1/Text-Visual-QA",
    "lokutus/HuggingGPT",
    "mimiqiao/HuggingGPT",
    "tsgbalakarthik/HuggingGPT"
  ],
  "createdAt": "2022-03-02T23:29:05.000Z",
  "inference": "warm",
  "usedStorage": 940815323
}