{"passport":{"unfragile":{"@version":"1.0","version":"2026-05","artifact":{"id":"smithery_chirag127-mcp-hierarchical-scraper","slug":"chirag127-mcp-hierarchical-scraper","name":"mcp-hierarchical-scraper","type":"mcp","url":"https://github.com/chirag127/mcp-hierarchical-scraper","page_url":"https://unfragile.ai/chirag127-mcp-hierarchical-scraper","categories":["rag-knowledge","testing-quality"],"tags":["mcp","model-context-protocol","web-browsing","smithery:chirag127/mcp-hierarchical-scraper"],"pricing":{"model":"open_source","free":true,"starting_price":null},"status":"active","verified":false},"capabilities":[{"id":"smithery_chirag127-mcp-hierarchical-scraper__cap_0","uri":"capability://data.processing.analysis.recursive.web.crawling.for.hierarchical.mapping","name":"recursive web crawling for hierarchical mapping","description":"This capability utilizes a depth-first search algorithm to recursively crawl websites, building a hierarchical map of pages. It identifies links and follows them while maintaining a record of the site structure, enabling users to visualize the relationships between pages. This approach is distinct as it optimally manages state and context during the crawl, ensuring that the hierarchy reflects the actual site architecture.","intents":["How can I visualize the structure of a website for better navigation?","I need to understand the relationships between different pages on a site.","Can I get a complete map of a website's content for analysis?"],"best_for":["web developers analyzing site structure","researchers mapping content relationships"],"limitations":["May encounter rate limiting on some websites, affecting crawl depth","Not optimized for sites with heavy JavaScript rendering"],"requires":["Node.js 14+","Access to the target website"],"input_types":["URL"],"output_types":["structured data (JSON)"],"categories":["data-processing-analysis","web-crawling"],"confidence":0.5,"matches":0,"success_rate":0},{"id":"smithery_chirag127-mcp-hierarchical-scraper__cap_1","uri":"capability://text.generation.language.html.to.markdown.conversion","name":"html to markdown conversion","description":"This capability transforms HTML content into clean, LLM-ready Markdown by stripping out boilerplate code and unnecessary tags. It uses a custom parser that identifies semantic elements and converts them into Markdown equivalents, ensuring that the output is both readable and suitable for machine learning applications. This approach allows for high fidelity in content representation while simplifying the format.","intents":["How can I convert web content into a format suitable for LLM training?","I need to clean up HTML content for better readability.","Can I extract text from a webpage while preserving its structure?"],"best_for":["data scientists preparing training data","content creators needing clean text formats"],"limitations":["Complex HTML structures may not convert perfectly","Limited support for advanced CSS styles"],"requires":["Node.js 14+","Access to HTML content"],"input_types":["HTML"],"output_types":["Markdown"],"categories":["text-generation-language","content-cleaning"],"confidence":0.5,"matches":0,"success_rate":0},{"id":"smithery_chirag127-mcp-hierarchical-scraper__cap_2","uri":"capability://search.retrieval.contextual.web.content.retrieval","name":"contextual web content retrieval","description":"This capability allows users to retrieve web content based on contextual queries by leveraging the hierarchical map built during the crawling process. It employs a semantic search algorithm that matches user queries with the structured data, providing relevant snippets and links. This ensures that users receive contextually appropriate results that are directly tied to their search intent.","intents":["How can I find specific information from a website based on context?","I need to retrieve content that matches certain keywords from my crawled data.","Can I get relevant snippets from a website for my research?"],"best_for":["researchers needing targeted information","developers building search functionalities"],"limitations":["Search results depend on the quality of the initial crawl","May not handle ambiguous queries effectively"],"requires":["Node.js 14+","Crawled data in structured format"],"input_types":["text (search query)"],"output_types":["text (snippets)","structured data (links)"],"categories":["search-retrieval","contextual-search"],"confidence":0.5,"matches":0,"success_rate":0}],"trust":{"score":30,"verified":false,"data_access_risk":"moderate","permissions":["Node.js 14+","Access to the target website","Access to HTML content","Crawled data in structured format"],"failure_modes":["May encounter rate limiting on some websites, affecting crawl depth","Not optimized for sites with heavy JavaScript rendering","Complex HTML structures may not convert perfectly","Limited support for advanced CSS styles","Search results depend on the quality of the initial crawl","May not handle ambiguous queries effectively","builder identity is not verified yet","no observed match outcomes yet"],"rank_breakdown":{"adoption":0.05,"quality":0.31,"ecosystem":0.62,"match_graph":0.25,"freshness":0.5,"weights":{"adoption":0.25,"quality":0.25,"ecosystem":0.15,"match_graph":0.23,"freshness":0.12}},"observed_outcomes":{"matches":0,"success_rate":0,"avg_confidence":0,"top_intents":[],"last_matched_at":null},"maintenance":{"status":"active","updated_at":"2026-05-24T12:16:25.636Z","last_scraped_at":"2026-05-03T15:19:18.599Z","last_commit":null},"community":{"stars":null,"forks":null,"weekly_downloads":null,"model_downloads":null,"model_likes":null}},"distribution":{"claim_url":"https://unfragile.ai/submit?claim=chirag127-mcp-hierarchical-scraper","compare_url":"https://unfragile.ai/compare?artifact=chirag127-mcp-hierarchical-scraper"}},"signature":"6H2OCkhw72Xs/AX2J3JLmiZrtDFAc/BCGDmq4XlVQvq23r/KMhlgKsdAytG43uKB9fwRfTBoOjC9ZDGVjNFFCA==","signedAt":"2026-06-21T00:22:12.712Z","signedBy":"unfragile.ai","version":1},"_links":{"self":"https://unfragile.ai/api/v1/passport/chirag127-mcp-hierarchical-scraper","artifact":"https://unfragile.ai/chirag127-mcp-hierarchical-scraper","verify":"https://unfragile.ai/api/v1/verify?slug=chirag127-mcp-hierarchical-scraper","publicKey":"https://unfragile.ai/api/v1/trust-passport-public-key","spec":"https://unfragile.ai/trust","schema":"https://unfragile.ai/schema.json","docs":"https://unfragile.ai/docs"}}