{"passport":{"unfragile":{"@version":"1.0","version":"2026-05","artifact":{"id":"papers-with-code-vqav2","slug":"vqav2","name":"VQAv2","type":"dataset","url":"https://paperswithcode.com/dataset/vqav2","page_url":"https://unfragile.ai/vqav2","categories":["testing-quality"],"tags":["benchmark","evaluation","visual-qa","vision-language"],"pricing":{"model":"open_source","free":true,"starting_price":null},"status":"active","verified":false},"capabilities":[{"id":"papers-with-code-vqav2__cap_0","uri":"capability://data.processing.analysis.multimodal.question.answering.evaluation","name":"multimodal question-answering evaluation","description":"VQAv2 serves as a benchmark for evaluating vision-language models by providing a dataset of 1.1 million questions paired with 650,000 images from the COCO dataset. It requires models to understand both visual content and generate natural language answers, utilizing a diverse set of question types such as color identification and quantity assessment. This dual requirement distinguishes it from other benchmarks that may focus solely on either vision or language tasks.","intents":["How can I evaluate my vision-language model's performance on diverse question types?","What dataset should I use to benchmark my multimodal AI system?","How do I assess the accuracy of image-based question answering in my application?"],"best_for":["researchers developing and testing vision-language models"],"limitations":["Limited to questions that can be answered based on the provided images; may not cover all visual contexts."],"requires":["Access to the VQAv2 dataset","Familiarity with evaluation metrics for machine learning"],"input_types":["image","text"],"output_types":["text"],"categories":["data-processing-analysis","benchmarking"],"confidence":0.5,"matches":0,"success_rate":0}],"trust":{"score":46,"verified":false,"data_access_risk":"low","permissions":["Access to the VQAv2 dataset","Familiarity with evaluation metrics for machine learning"],"failure_modes":["Limited to questions that can be answered based on the provided images; may not cover all visual contexts.","builder identity is not verified yet","no observed match outcomes yet"],"rank_breakdown":{"adoption":0.8,"quality":0.27,"ecosystem":0.42,"match_graph":0.25,"freshness":0.75,"weights":{"adoption":0.3,"quality":0.25,"ecosystem":0.1,"match_graph":0.3,"freshness":0.05}},"observed_outcomes":{"matches":0,"success_rate":0,"avg_confidence":0,"top_intents":[],"last_matched_at":null},"maintenance":{"status":"active","updated_at":"2026-05-24T12:16:25.060Z","last_scraped_at":"2026-05-03T15:20:49.428Z","last_commit":null},"community":{"stars":null,"forks":null,"weekly_downloads":null,"model_downloads":null,"model_likes":null}},"distribution":{"claim_url":"https://unfragile.ai/submit?claim=vqav2","compare_url":"https://unfragile.ai/compare?artifact=vqav2"}},"signature":"1yM6StBjM8uK9csDE1J3IbQteq91SxBpoCFkRaougfyuu1FeVGYiu6yPP4PmRzWEsOnNNiMENHUoBCjJ1V4wCQ==","signedAt":"2026-06-22T22:27:19.434Z","signedBy":"unfragile.ai","version":1},"_links":{"self":"https://unfragile.ai/api/v1/passport/vqav2","artifact":"https://unfragile.ai/vqav2","verify":"https://unfragile.ai/api/v1/verify?slug=vqav2","publicKey":"https://unfragile.ai/api/v1/trust-passport-public-key","spec":"https://unfragile.ai/trust","schema":"https://unfragile.ai/schema.json","docs":"https://unfragile.ai/docs"}}