{"passport":{"unfragile":{"@version":"1.0","version":"2026-05","artifact":{"id":"hf-dataset-jat-project--jat-dataset","slug":"jat-project--jat-dataset","name":"jat-dataset","type":"dataset","url":"https://huggingface.co/datasets/jat-project/jat-dataset","page_url":"https://unfragile.ai/jat-project--jat-dataset","categories":["model-training"],"tags":["task_categories:reinforcement-learning","task_categories:text-generation","task_categories:question-answering","annotations_creators:found","annotations_creators:machine-generated","source_datasets:conceptual-captions","source_datasets:ok-vqa","source_datasets:oscar","license:apache-2.0","size_categories:100M<n<1B","format:parquet","modality:image","modality:text","modality:timeseries","library:datasets","library:dask","library:mlcroissant","library:polars","arxiv:2402.09844","arxiv:2303.03915"],"pricing":{"model":"open_source","free":true,"starting_price":null},"status":"active","verified":false},"capabilities":[{"id":"hf-dataset-jat-project--jat-dataset__cap_0","uri":"capability://data.processing.analysis.multi.modal.dataset.integration","name":"multi-modal dataset integration","description":"jat-dataset integrates multiple modalities including text, images, and timeseries data, allowing for comprehensive training and evaluation of models across different formats. It utilizes a parquet format for efficient storage and retrieval, enabling fast access to large datasets. The dataset is designed to support various tasks such as reinforcement learning, text generation, and question answering, making it versatile for researchers and developers.","intents":["How can I access a multi-modal dataset for training my AI models?","What datasets are available for reinforcement learning tasks?","Where can I find a dataset that includes both text and image data?"],"best_for":["researchers developing multi-modal AI applications","developers building models for reinforcement learning"],"limitations":["Dataset size may require significant storage and processing power","Limited documentation on specific use cases"],"requires":["Python 3.8+","Dask library for handling large datasets"],"input_types":["text","image","timeseries"],"output_types":["structured data","parquet files"],"categories":["data-processing-analysis","research"],"confidence":0.5,"matches":0,"success_rate":0},{"id":"hf-dataset-jat-project--jat-dataset__cap_1","uri":"capability://data.processing.analysis.large.scale.dataset.accessibility","name":"large-scale dataset accessibility","description":"jat-dataset is hosted on Hugging Face, providing easy access and download capabilities for users. The dataset supports over 391,137 downloads, indicating its popularity and reliability. Its open-source nature allows for community contributions and enhancements, fostering a collaborative environment for dataset improvement.","intents":["How can I easily download a large dataset for my project?","What are the benefits of using an open-source dataset?","Where can I find community-supported datasets for AI research?"],"best_for":["developers looking for reliable datasets","researchers needing community-supported resources"],"limitations":["Potential download speed limitations based on user bandwidth","May require familiarity with Hugging Face platform"],"requires":["Internet access","Hugging Face account for certain features"],"input_types":["N/A"],"output_types":["N/A"],"categories":["data-processing-analysis","open-source"],"confidence":0.5,"matches":0,"success_rate":0}],"trust":{"score":21,"verified":false,"data_access_risk":"low","permissions":["Python 3.8+","Dask library for handling large datasets","Internet access","Hugging Face account for certain features"],"failure_modes":["Dataset size may require significant storage and processing power","Limited documentation on specific use cases","Potential download speed limitations based on user bandwidth","May require familiarity with Hugging Face platform","builder identity is not verified yet","no observed match outcomes yet"],"rank_breakdown":{"adoption":0.05,"quality":0.14,"ecosystem":0.5000000000000001,"match_graph":0.25,"freshness":0.75,"weights":{"adoption":0.3,"quality":0.25,"ecosystem":0.1,"match_graph":0.3,"freshness":0.05}},"observed_outcomes":{"matches":0,"success_rate":0,"avg_confidence":0,"top_intents":[],"last_matched_at":null},"maintenance":{"status":"active","updated_at":"2026-05-24T12:16:22.764Z","last_scraped_at":"2026-05-03T14:22:48.064Z","last_commit":null},"community":{"stars":null,"forks":null,"weekly_downloads":null,"model_downloads":null,"model_likes":null}},"distribution":{"claim_url":"https://unfragile.ai/submit?claim=jat-project--jat-dataset","compare_url":"https://unfragile.ai/compare?artifact=jat-project--jat-dataset"}},"signature":"o4yBSHwALmScqdQSqxyu3gIT+Gy5ihnXWGOhLQ6PfJsD/NZ0bdMIBaO2vd2OczlCXa18Xn4s+cLArgwRXcBJDA==","signedAt":"2026-06-22T02:50:16.189Z","signedBy":"unfragile.ai","version":1},"_links":{"self":"https://unfragile.ai/api/v1/passport/jat-project--jat-dataset","artifact":"https://unfragile.ai/jat-project--jat-dataset","verify":"https://unfragile.ai/api/v1/verify?slug=jat-project--jat-dataset","publicKey":"https://unfragile.ai/api/v1/trust-passport-public-key","spec":"https://unfragile.ai/trust","schema":"https://unfragile.ai/schema.json","docs":"https://unfragile.ai/docs"}}