{"version":"1.0","workflow_uuid":"c2ba9909-f624-414f-8aeb-fbd95c50766e","workflow_title":"Unstructured — Document ETL for LLM Pipelines","install_contract":{"version":"1.0","installReady":false,"title":"Unstructured — Document ETL for LLM Pipelines","summary":"Extract clean data from PDFs, DOCX, HTML, images, and emails for RAG and LLM ingestion. 14K+ GitHub stars.","assetType":"MCP Configs","pageUrl":"https://tokrepo.com/en/workflows/c2ba9909-f624-414f-8aeb-fbd95c50766e","sourceUrl":"https://github.com/Unstructured-IO","intendedFor":[],"firstActions":[],"agentFirstSteps":[],"targetPaths":[],"verification":[],"startingPoints":[],"example":"","successOutcome":"","boundaries":[],"askUserIf":["the current workspace stack cannot be matched to a safe upstream template","the target path is not the project root, or an existing file should be merged instead of overwritten"]}}