← Back to index
dandelin/vilt-b32-finetuned-vqa
Inference API is disabled for an unknown reason. Please open a Discussion in the Community tab.
			{
  "_id": "621ffdc136468d709f17a32e",
  "id": "dandelin/vilt-b32-finetuned-vqa",
  "modelId": "dandelin/vilt-b32-finetuned-vqa",
  "author": "dandelin",
  "sha": "d0a1f6ab88522427a7ae76ceb6e1e1e7b68a1d08",
  "lastModified": "2022-08-02T13:03:04.000Z",
  "private": false,
  "disabled": false,
  "gated": false,
  "pipeline_tag": "visual-question-answering",
  "tags": [
    "transformers",
    "pytorch",
    "vilt",
    "visual-question-answering",
    "arxiv:2102.03334",
    "license:apache-2.0",
    "endpoints_compatible",
    "has_space",
    "region:us"
  ],
  "downloads": 60207,
  "library_name": "transformers",
  "widgetData": [
    {
      "text": "What's the animal doing?",
      "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg"
    },
    {
      "text": "What is on top of the building?",
      "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg"
    }
  ],
  "likes": 296,
  "model-index": null,
  "config": {
    "architectures": [
      "ViltForVisualQuestionAnswering"
    ],
    "model_type": "vilt"
  },
  "cardData": {
    "tags": [
      "visual-question-answering"
    ],
    "license": "apache-2.0",
    "widget": [
      {
        "text": "What's the animal doing?",
        "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg"
      },
      {
        "text": "What is on top of the building?",
        "src": "https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg"
      }
    ]
  },
  "transformersInfo": {
    "auto_model": "ViltForVisualQuestionAnswering",
    "processor": "AutoProcessor"
  },
  "spaces": [
    "microsoft/HuggingGPT",
    "nielsr/comparing-VQA-models",
    "nielsr/vilt-vqa",
    "taesiri/HuggingGPT-Lite",
    "Madhuri/vqa_audiobot",
    "ixxan/multilingual-vqa",
    "huggingfacejs/doc-vis-qa",
    "hayas-tohoku-workshop-2023/comparing-VQA-models",
    "SeyedAli/Persian-Visual-Question-Answering-1",
    "gtx4010661/dandelin-vilt-b32-finetuned-vqa",
    "ccarr0807/HuggingGPT",
    "theholycityweb/HuggingGPT",
    "contluForse/HuggingGPT",
    "Alfasign/HuggingGPT-Lite",
    "roontoon/Demo-TTI-dandelin-vilt-b32-finetuned-vqa",
    "saurshaz/HuggingGPT",
    "nilaymodi/dandelin-vilt-b32-finetuned-vqa",
    "Nikhil0987/omm",
    "roshithindia/imageQuestionAnswering",
    "Anniek/VQA",
    "Frvvhencjsbydhehdhgwgbdujeocmfikdkcsshdnjs/dandelin-vilt-b32-finetuned-vqa",
    "kingli999/dandelin-vilt-b32-finetuned-vqa23",
    "kingli999/dandelin-vilt-b32-finetuned-vqa14421",
    "yinuozh/dandelin-vilt-b32-finetuned-vqa",
    "treeindex/dandelin-vilt-b32-finetuned-vqa",
    "hema1/Tab",
    "kanishka207004/project7",
    "sakshamm/project7",
    "keaneu/HuggingGPT",
    "viscosity/HuggingGPT",
    "Mcdof/HuggingGPT",
    "BMukhtar/BMA",
    "chrisW6825/HuggingGPT",
    "Shenziqian/HuggingGPT",
    "lokutus/HuggingGPT",
    "mimiqiao/HuggingGPT",
    "tsgbalakarthik/HuggingGPT",
    "wowochkin/HuggingGPT",
    "Msp/HuggingGPT",
    "ryan12439/HuggingGPTpub",
    "FANCHIYU/HuggingGPT",
    "Betacuckgpt/HuggingGPT",
    "cashqin/HuggingGPT",
    "felixfriday/MICROSOFTT_JARVIS_HuggingGPT",
    "Meffordh/HuggingGPT",
    "lzqfree/HuggingGPT",
    "bountyfuljr/HuggingGPTplaypublic",
    "mearjunsha/HuggingGPT",
    "turbowed/HuggingGPT",
    "Chokyounghoon/HuggingGPT",
    "lollo21/Will-GPT",
    "Pfs2021Funny/HuggingGPT",
    "irritablebro/HuggingGPT",
    "MagKoz/HuggingGPT",
    "zhangdream/HuggingGPT",
    "calliber/HuggingGPT",
    "Pitak/HuggingGPT",
    "gaocegege/HuggingGPT",
    "apgarmd/jarvis",
    "apgarmd/jarvis2",
    "mukulnag/HuggingGPT1",
    "lugifudun/HuggingGPT",
    "leadmaister/HuggingGPT",
    "pors/HuggingGPT",
    "vs4vijay/HuggingGPT",
    "vvmnnnkv/doc-vis-qa",
    "mckeeboards/HuggingGPT",
    "mastere00/JarvisMeetsProfessor",
    "passthebutter/HuggingGPT",
    "manu1435/HuggingGPT",
    "rafaelcalleja/HuggingGPT",
    "NaamanSaif/HuggingGPT",
    "CollaalloC/HuggingGPT",
    "dwolfe66/HuggingGPT",
    "CODERHUE/dandelin-vilt-b32-finetuned-vqa",
    "xian-sheng/HuggingGPT",
    "Aygtljl518866/HuggingGPT",
    "bageltoes/dandelin-vilt-b32-finetuned-vqa",
    "Hemi1403/HuggingGPT",
    "trhacknon/HuggingGPT",
    "Vito99/HuggingGPT-Lite",
    "EinfachOlder/HuggingGPT-Lite",
    "innovativeillusions/HuggingGPT",
    "priiyanshu/dandelin-vilt-b32-finetuned-vqa",
    "jaidev21/dandelin-vilt-b32-finetuned-vqa",
    "Matteogonzo02/dandelin-vilt-b32-finetuned-vqa",
    "ph33bs/dandelin-vilt-b32-finetuned-vqa",
    "nouman-10/VQArt",
    "cduck/italystory",
    "yalan/dandelin-vilt-b32-finetuned-vqa",
    "seanshahkarami/vilt-for-vqa",
    "ricklon/nlp-vit",
    "ylavie/HuggingGPT3",
    "ylavie/HuggingGPT-Lite",
    "AppleSeedThriver/dandelin-vilt-b32-finetuned-vqa",
    "FRKSIHJG5AEHTRSJ/dandelin-vilt-b32-finetuned-vqa",
    "CCYAO/HuggingGPT",
    "ActivatedOne/dandelin-vilt-b32-finetuned-vqa",
    "dcams/HuggingGPT",
    "Minqin/carets_finetune_vqa",
    "teganmosi/chatbot",
    "AnimaLab/vision_model_init",
    "Insightly/Image_Reader",
    "CS4NLP/vqa_demo",
    "BlakeCDA/dandelin-vilt-b32-finetuned-vqa",
    "Dobator/dandelin-vilt-b32-finetuned-vqa",
    "Akoloskov/image-recon",
    "zhuguangbin86/dandelin-vilt-b32-finetuned-vqa",
    "shannon-paul/dandelin-vilt-b32-finetuned-vqa",
    "CosmoAI/CosmoS",
    "rjiang12/comparing-VQA-models",
    "diffaccessor0012/dandelin-vilt-b32-finetuned-vqa",
    "cndavy/HuggingGPT",
    "sykang/dandelin-vilt-b32-finetuned-vqa",
    "pbshayar/dandelin-vilt-b32-finetuned-vqa",
    "ojeromyo/dandelin-vilt-b32-finetuned-vqa",
    "PlsReload9382/Bildsuche",
    "ribokle/vilt",
    "mmuzzamil/dandelin-vilt-b32-finetuned-vqa",
    "reshav1/P.A",
    "adeaven/dandelin-vilt-b32-finetuned-vqa",
    "jeanmauriceport/dandelin-vilt-b32-finetuned-vqa",
    "SilvusTV/Test",
    "devangel007/dandelin-vilt-b32-finetuned-vqa",
    "trezero/dandelin-vilt-b32-finetuned-vqa",
    "anon4757/BiasTestVQA",
    "Aseel17/dandelin-vilt-b32-finetuned-vqa",
    "Amiralasady/dandelin-vilt-b32-finetuned-vqa",
    "SSHAMZZ/Host_trial_1",
    "ZeroTwo3/dandelin-vilt-b32-finetuned-vqa",
    "Exalt-company/ai-with-eyes",
    "ZackBradshaw/omni_bot",
    "hema1/QA-YT-Video-Summarization",
    "kukiui/dandelin-vilt-b32-finetuned-vqa",
    "Anon4445/VQA",
    "sms07/Georgios-Ioannou-Visual-Question-Answering-With-Hugging-Face",
    "sms07/Georgios-Ioannou-Visual-Question-Answering-With-Hugging-Face-FINAL",
    "ZackBradshaw/swarms"
  ],
  "siblings": [
    {
      "rfilename": ".gitattributes"
    },
    {
      "rfilename": "README.md"
    },
    {
      "rfilename": "config.json"
    },
    {
      "rfilename": "preprocessor_config.json"
    },
    {
      "rfilename": "pytorch_model.bin"
    },
    {
      "rfilename": "special_tokens_map.json"
    },
    {
      "rfilename": "tokenizer.json"
    },
    {
      "rfilename": "tokenizer_config.json"
    },
    {
      "rfilename": "vocab.txt"
    }
  ],
  "createdAt": "2022-03-02T23:29:05.000Z"
}