{"passport":{"unfragile":{"@version":"1.0","version":"2026-05","artifact":{"id":"hn-46540794","slug":"watch-llms-play-21-000-hands-of-poker","name":"Watch LLMs play 21,000 hands of Poker","type":"benchmark","url":"https://pokerbench.adfontes.io/run/Large_Models","page_url":"https://unfragile.ai/watch-llms-play-21-000-hands-of-poker","categories":["testing-quality"],"tags":["hackernews","show-hn"],"pricing":{"model":"unknown","free":false,"starting_price":null},"status":"active","verified":false},"capabilities":[{"id":"hn-46540794__cap_0","uri":"capability://data.processing.analysis.simulated.poker.gameplay.analysis","name":"simulated poker gameplay analysis","description":"This capability allows users to observe and analyze the performance of LLMs as they play 21,000 hands of poker. It utilizes a custom-built simulation environment that integrates LLM decision-making processes with poker game rules, enabling real-time tracking of strategies, outcomes, and player interactions. The architecture supports detailed logging and performance metrics, providing insights into the models' decision-making patterns and effectiveness in various scenarios.","intents":["How well do LLMs perform in poker compared to human players?","What strategies do LLMs employ when playing poker?","Can I analyze the decision-making process of LLMs in poker games?"],"best_for":["researchers studying AI decision-making in games","developers building AI models for strategic gameplay"],"limitations":["Limited to poker; does not support other card games or variations","Performance metrics may not reflect real-world poker scenarios"],"requires":["Web browser for accessing the simulation","No specific software installation required"],"input_types":["text (game rules, player actions)","structured data (game state)"],"output_types":["structured data (game results, performance metrics)","text (game commentary)"],"categories":["data-processing-analysis","ai research"],"confidence":0.5,"matches":0,"success_rate":0}],"trust":{"score":28,"verified":false,"data_access_risk":"low","permissions":["Web browser for accessing the simulation","No specific software installation required"],"failure_modes":["Limited to poker; does not support other card games or variations","Performance metrics may not reflect real-world poker scenarios","builder identity is not verified yet","no observed match outcomes yet"],"rank_breakdown":{"adoption":0.46,"quality":0.12,"ecosystem":0.21000000000000002,"match_graph":0.25,"freshness":0.75,"weights":{"adoption":0.25,"quality":0.35,"ecosystem":0.15,"match_graph":0.2,"freshness":0.05}},"observed_outcomes":{"matches":0,"success_rate":0,"avg_confidence":0,"top_intents":[],"last_matched_at":null},"maintenance":{"status":"active","updated_at":"2026-05-24T12:16:23.326Z","last_scraped_at":"2026-05-04T08:09:56.918Z","last_commit":null},"community":{"stars":null,"forks":null,"weekly_downloads":null,"model_downloads":null,"model_likes":null}},"distribution":{"claim_url":"https://unfragile.ai/submit?claim=watch-llms-play-21-000-hands-of-poker","compare_url":"https://unfragile.ai/compare?artifact=watch-llms-play-21-000-hands-of-poker"}},"signature":"lANwgeBuViGOmc89NYulzTG1rewHXUMlKVeBCkUn12OrRkezHhoWz2uJG2rAVSeJ2zRuAgmL56msFXEvNvX3Dw==","signedAt":"2026-06-19T08:47:06.708Z","signedBy":"unfragile.ai","version":1},"_links":{"self":"https://unfragile.ai/api/v1/passport/watch-llms-play-21-000-hands-of-poker","artifact":"https://unfragile.ai/watch-llms-play-21-000-hands-of-poker","verify":"https://unfragile.ai/api/v1/verify?slug=watch-llms-play-21-000-hands-of-poker","publicKey":"https://unfragile.ai/api/v1/trust-passport-public-key","spec":"https://unfragile.ai/trust","schema":"https://unfragile.ai/schema.json","docs":"https://unfragile.ai/docs"}}