{"id":"96e9a05e-45aa-4d41-bca9-80d38b6115f8","shortId":"WZw7Eg","kind":"skill","title":"Tesseract OCR Engine for Image-to-Text Workflows","tagline":"Tesseract OCR is a widely used open source optical character recognition engine with command line and library interfaces. It can extract text from images and scanned documents, supports more than 100 languages, and outputs plain text, hOCR, TSV, and PDF variants.","description":"# Tesseract OCR Engine for Image-to-Text Workflows\n\nTesseract OCR is a widely used open source optical character recognition engine with command line and library interfaces. It can extract text from images and scanned documents, supports more than 100 languages, and outputs plain text, hOCR, TSV, and PDF variants.\n\n## Prerequisites\n\ngo\n\n## Installation\n\nRequirements and caveats from upstream:\n- **NOTE**: This software depends on other packages that may be licensed under different open source licenses.\n\nBasic usage or getting-started notes:\n- It also needs [traineddata](https://tesseract-ocr.github.io/tessdoc/Data-Files.html) files which support the legacy engine, for example those from the [tessdata](https://github.com/tesseract-ocr/tessdata) repository.\n- Basic **[command line usage](https://tesseract-ocr.github.io/tessdoc/Command-Line-Usage.html)**:\n- Examples can be found in the [documentation](https://tesseract-ocr.github.io/tessdoc/Command-Line-Usage.html#simplest-invocation-to-ocr-an-image).\n\n- Source: https://github.com/tesseract-ocr/tesseract\n- Extracted from upstream docs: https://raw.githubusercontent.com/tesseract-ocr/tesseract/HEAD/README.md\n\n## Documentation\n\n- https://tesseract-ocr.github.io/tessdoc/Planning.html\n\n## Source\n\n- [Agent Skill Exchange](https://agentskillexchange.com/skills/tesseract-ocr-engine-for-image-to-text-workflows/)","tags":["tesseract","ocr","engine","for","image","text","workflows","skills","agentskillexchange","agent-skills","ai-agents","ai-tools"],"capabilities":["skill","source-agentskillexchange","skill-tesseract-ocr-engine-for-image-to-text-workflows","topic-agent-skills","topic-ai-agents","topic-ai-tools","topic-awesome-list","topic-claude-code","topic-codex","topic-cursor","topic-llm","topic-mcp","topic-npx-skills","topic-openclaw","topic-skills-catalog"],"categories":["skills"],"synonyms":[],"warnings":[],"endpointUrl":"https://skills.sh/agentskillexchange/skills/tesseract-ocr-engine-for-image-to-text-workflows","protocol":"skill","transport":"skills-sh","auth":{"type":"none","details":{"cli":"npx skills add agentskillexchange/skills","source_repo":"https://github.com/agentskillexchange/skills","install_from":"skills.sh"}},"qualityScore":"0.454","qualityRationale":"deterministic score 0.45 from registry signals: · indexed on github topic:agent-skills · 8 github stars · SKILL.md body (1,372 chars)","verified":false,"liveness":"unknown","lastLivenessCheck":null,"agentReviews":{"count":0,"score_avg":null,"cost_usd_avg":null,"success_rate":null,"latency_p50_ms":null,"narrative_summary":null,"summary_updated_at":null},"enrichmentModel":"deterministic:skill-github:v1","enrichmentVersion":1,"enrichedAt":"2026-05-18T19:12:49.991Z","embedding":null,"createdAt":"2026-05-18T13:19:55.688Z","updatedAt":"2026-05-18T19:12:49.991Z","lastSeenAt":"2026-05-18T19:12:49.991Z","tsv":"'/skills/tesseract-ocr-engine-for-image-to-text-workflows/)':193 '/tessdoc/command-line-usage.html#simplest-invocation-to-ocr-an-image).':171 '/tessdoc/command-line-usage.html)**:':161 '/tessdoc/data-files.html)':138 '/tessdoc/planning.html':186 '/tesseract-ocr/tessdata)':153 '/tesseract-ocr/tesseract':175 '/tesseract-ocr/tesseract/head/readme.md':182 '100':40,90 'agent':188 'agentskillexchange.com':192 'agentskillexchange.com/skills/tesseract-ocr-engine-for-image-to-text-workflows/)':191 'also':133 'basic':125,155 'caveat':106 'charact':19,69 'command':23,73,156 'depend':112 'differ':121 'doc':179 'document':36,86,168,183 'engin':3,21,53,71,144 'exampl':146,162 'exchang':190 'extract':30,80,176 'file':139 'found':165 'get':129 'getting-start':128 'github.com':152,174 'github.com/tesseract-ocr/tessdata)':151 'github.com/tesseract-ocr/tesseract':173 'go':102 'hocr':46,96 'imag':6,33,56,83 'image-to-text':5,55 'instal':103 'interfac':27,77 'languag':41,91 'legaci':143 'librari':26,76 'licens':119,124 'line':24,74,157 'may':117 'need':134 'note':109,131 'ocr':2,11,52,61 'open':16,66,122 'optic':18,68 'output':43,93 'packag':115 'pdf':49,99 'plain':44,94 'prerequisit':101 'raw.githubusercontent.com':181 'raw.githubusercontent.com/tesseract-ocr/tesseract/head/readme.md':180 'recognit':20,70 'repositori':154 'requir':104 'scan':35,85 'skill':189 'skill-tesseract-ocr-engine-for-image-to-text-workflows' 'softwar':111 'sourc':17,67,123,172,187 'source-agentskillexchange' 'start':130 'support':37,87,141 'tessdata':150 'tesseract':1,10,51,60 'tesseract-ocr.github.io':137,160,170,185 'tesseract-ocr.github.io/tessdoc/command-line-usage.html#simplest-invocation-to-ocr-an-image).':169 'tesseract-ocr.github.io/tessdoc/command-line-usage.html)**:':159 'tesseract-ocr.github.io/tessdoc/data-files.html)':136 'tesseract-ocr.github.io/tessdoc/planning.html':184 'text':8,31,45,58,81,95 'topic-agent-skills' 'topic-ai-agents' 'topic-ai-tools' 'topic-awesome-list' 'topic-claude-code' 'topic-codex' 'topic-cursor' 'topic-llm' 'topic-mcp' 'topic-npx-skills' 'topic-openclaw' 'topic-skills-catalog' 'traineddata':135 'tsv':47,97 'upstream':108,178 'usag':126,158 'use':15,65 'variant':50,100 'wide':14,64 'workflow':9,59","prices":[{"id":"aa93722f-ce73-473f-86f8-26317e8662b4","listingId":"96e9a05e-45aa-4d41-bca9-80d38b6115f8","amountUsd":"0","unit":"free","nativeCurrency":null,"nativeAmount":null,"chain":null,"payTo":null,"paymentMethod":"skill-free","isPrimary":true,"details":{"org":"agentskillexchange","category":"skills","install_from":"skills.sh"},"createdAt":"2026-05-18T13:19:55.688Z"}],"sources":[{"listingId":"96e9a05e-45aa-4d41-bca9-80d38b6115f8","source":"github","sourceId":"agentskillexchange/skills/tesseract-ocr-engine-for-image-to-text-workflows","sourceUrl":"https://github.com/agentskillexchange/skills/tree/main/skills/tesseract-ocr-engine-for-image-to-text-workflows","isPrimary":false,"firstSeenAt":"2026-05-18T13:19:55.688Z","lastSeenAt":"2026-05-18T19:12:49.991Z"}],"details":{"listingId":"96e9a05e-45aa-4d41-bca9-80d38b6115f8","quickStartSnippet":null,"exampleRequest":null,"exampleResponse":null,"schema":null,"openapiUrl":null,"agentsTxtUrl":null,"citations":[],"useCases":[],"bestFor":[],"notFor":[],"kindDetails":{"org":"agentskillexchange","slug":"tesseract-ocr-engine-for-image-to-text-workflows","github":{"repo":"agentskillexchange/skills","stars":8,"topics":["agent-skills","ai-agents","ai-tools","awesome-list","claude-code","codex","cursor","llm","mcp","npx-skills","openclaw","skills-catalog"],"license":"mit","html_url":"https://github.com/agentskillexchange/skills","pushed_at":"2026-05-18T19:02:17Z","description":"The open catalog of AI agent skills — 2,000+ security-scanned skills for Claude Code, Cursor, Codex, and more.","skill_md_sha":"16de2f5c3a26143bb3d773ad439aeb3b19c9e032","skill_md_path":"skills/tesseract-ocr-engine-for-image-to-text-workflows/SKILL.md","default_branch":"main","skill_tree_url":"https://github.com/agentskillexchange/skills/tree/main/skills/tesseract-ocr-engine-for-image-to-text-workflows"},"layout":"multi","source":"github","category":"skills","frontmatter":{"name":"Tesseract OCR Engine for Image-to-Text Workflows","description":"Tesseract OCR is a widely used open source optical character recognition engine with command line and library interfaces. It can extract text from images and scanned documents, supports more than 100 languages, and outputs plain text, hOCR, TSV, and PDF variants."},"skills_sh_url":"https://skills.sh/agentskillexchange/skills/tesseract-ocr-engine-for-image-to-text-workflows"},"updatedAt":"2026-05-18T19:12:49.991Z"}}