{"passport":{"unfragile":{"@version":"1.0","version":"2026-05","artifact":{"id":"hf-model-microsoft--vibevoice-1.5b","slug":"microsoft--vibevoice-1.5b","name":"VibeVoice-1.5B","type":"model","url":"https://huggingface.co/microsoft/VibeVoice-1.5B","page_url":"https://unfragile.ai/microsoft--vibevoice-1.5b","categories":["voice-audio"],"tags":["transformers","safetensors","vibevoice","text-generation","Podcast","text-to-speech","en","zh","arxiv:2508.19205","arxiv:2412.08635","license:mit","endpoints_compatible","region:us"],"pricing":{"model":"open_source","free":true,"starting_price":null},"status":"active","verified":false},"capabilities":[{"id":"hf-model-microsoft--vibevoice-1.5b__cap_0","uri":"capability://text.generation.language.natural.language.text.to.speech.synthesis","name":"natural language text-to-speech synthesis","description":"VibeVoice-1.5B employs a transformer-based architecture to convert text input into natural-sounding speech. It utilizes a large pre-trained model that leverages attention mechanisms to capture contextual nuances in language, ensuring that the generated speech closely mimics human intonation and rhythm. This model is fine-tuned on diverse datasets to enhance its ability to produce high-quality audio outputs across various languages and accents.","intents":["How can I convert written scripts into spoken audio for my podcast?","What tools can I use to generate voiceovers for my videos?","How do I create realistic speech from text for my application?"],"best_for":["content creators producing audio content","developers integrating TTS into applications","educators creating learning materials"],"limitations":["Limited to supported languages; may not perform well with niche dialects or accents","Audio output quality may vary based on input complexity"],"requires":["Python 3.7+","Hugging Face Transformers library 4.0+","sufficient computational resources for inference"],"input_types":["text"],"output_types":["audio"],"categories":["text-generation-language","audio"],"confidence":0.5,"matches":0,"success_rate":0}],"trust":{"score":43,"verified":false,"data_access_risk":"low","permissions":["Python 3.7+","Hugging Face Transformers library 4.0+","sufficient computational resources for inference"],"failure_modes":["Limited to supported languages; may not perform well with niche dialects or accents","Audio output quality may vary based on input complexity","builder identity is not verified yet","no observed match outcomes yet"],"rank_breakdown":{"adoption":0.6804511812945822,"quality":0.12,"ecosystem":0.5000000000000001,"match_graph":0.25,"freshness":0.9,"weights":{"adoption":0.35,"quality":0.2,"ecosystem":0.1,"match_graph":0.3,"freshness":0.05}},"observed_outcomes":{"matches":0,"success_rate":0,"avg_confidence":0,"top_intents":[],"last_matched_at":null},"maintenance":{"status":"active","updated_at":"2026-05-24T12:16:22.765Z","last_scraped_at":"2026-05-03T14:22:51.286Z","last_commit":null},"community":{"stars":null,"forks":null,"weekly_downloads":null,"model_downloads":261587,"model_likes":2353}},"distribution":{"claim_url":"https://unfragile.ai/submit?claim=microsoft--vibevoice-1.5b","compare_url":"https://unfragile.ai/compare?artifact=microsoft--vibevoice-1.5b"}},"signature":"LiX2gR3y2kqvxTgF09o9WQX+/vWqBN7tF1GhRCgWLa3pmR8iGGsCadD0gE1DqoBtwKJO9IWWFH+NjncSnoApBA==","signedAt":"2026-06-15T17:51:01.980Z","signedBy":"unfragile.ai","version":1},"_links":{"self":"https://unfragile.ai/api/v1/passport/microsoft--vibevoice-1.5b","artifact":"https://unfragile.ai/microsoft--vibevoice-1.5b","verify":"https://unfragile.ai/api/v1/verify?slug=microsoft--vibevoice-1.5b","publicKey":"https://unfragile.ai/api/v1/trust-passport-public-key","spec":"https://unfragile.ai/trust","schema":"https://unfragile.ai/schema.json","docs":"https://unfragile.ai/docs"}}