{"passport":{"unfragile":{"@version":"1.0","version":"2026-05","artifact":{"id":"reddit-1st9v81","slug":"we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old","name":"We benchmarked 18 LLMs on OCR (7k+ calls) — cheaper/old models oftentimes win. Full dataset + framework open-sourced. [R]","type":"benchmark","url":"https://github.com/ArbitrHq/ocr-mini-bench","page_url":"https://unfragile.ai/we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old","categories":["model-training"],"tags":["machinelearning"],"pricing":{"model":"open_source","free":true,"starting_price":null},"status":"active","verified":false},"capabilities":[{"id":"reddit-1st9v81__cap_0","uri":"capability://data.processing.analysis.benchmarking.llms.for.ocr.performance","name":"benchmarking llms for ocr performance","description":"This capability benchmarks 18 different LLMs on Optical Character Recognition (OCR) tasks using a comprehensive dataset of over 7,000 calls. It employs a systematic evaluation framework that allows for the comparison of model performance across various metrics, such as accuracy and processing speed. The open-sourced framework enables users to replicate the benchmarks and adapt the methodology for their specific needs, promoting transparency and reproducibility in research.","intents":["How do different LLMs perform on OCR tasks?","What is the best model for OCR based on cost and performance?","Can I replicate these benchmarks for my own LLM evaluation?"],"best_for":["researchers evaluating LLM performance for OCR","developers selecting OCR models for applications","data scientists conducting comparative analysis"],"limitations":["Limited to the 18 LLMs included in the benchmark; results may not generalize to other models.","Performance may vary based on specific OCR tasks not covered in the dataset."],"requires":["Python 3.8+","Access to the benchmark dataset provided in the repository"],"input_types":["text","image"],"output_types":["structured data","performance metrics"],"categories":["data-processing-analysis","benchmarking"],"confidence":0.5,"matches":0,"success_rate":0}],"trust":{"score":36,"verified":false,"data_access_risk":"low","permissions":["Python 3.8+","Access to the benchmark dataset provided in the repository"],"failure_modes":["Limited to the 18 LLMs included in the benchmark; results may not generalize to other models.","Performance may vary based on specific OCR tasks not covered in the dataset.","builder identity is not verified yet","no observed match outcomes yet"],"rank_breakdown":{"adoption":0.5,"quality":0.27,"ecosystem":0.33,"match_graph":0.25,"freshness":0.9,"weights":{"adoption":0.25,"quality":0.35,"ecosystem":0.15,"match_graph":0.2,"freshness":0.05}},"observed_outcomes":{"matches":0,"success_rate":0,"avg_confidence":0,"top_intents":[],"last_matched_at":null},"maintenance":{"status":"active","updated_at":"2026-05-24T12:16:25.061Z","last_scraped_at":"2026-05-04T07:50:58.215Z","last_commit":null},"community":{"stars":null,"forks":null,"weekly_downloads":null,"model_downloads":null,"model_likes":null}},"distribution":{"claim_url":"https://unfragile.ai/submit?claim=we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old","compare_url":"https://unfragile.ai/compare?artifact=we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old"}},"signature":"pQFr+4NKiKytr15j53geOHfUSOCpdskADh8UdCI5fg4P4UuVYfDlWO85Acft0K1KJjQxm4XvN8KaNNKypHxkCQ==","signedAt":"2026-06-15T06:56:08.856Z","signedBy":"unfragile.ai","version":1},"_links":{"self":"https://unfragile.ai/api/v1/passport/we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old","artifact":"https://unfragile.ai/we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old","verify":"https://unfragile.ai/api/v1/verify?slug=we-benchmarked-18-llms-on-ocr-7k-calls-cheaper-old","publicKey":"https://unfragile.ai/api/v1/trust-passport-public-key","spec":"https://unfragile.ai/trust","schema":"https://unfragile.ai/schema.json","docs":"https://unfragile.ai/docs"}}