[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"extension-skill-claude-office-skills-smart-ocr-id":3,"guides-for-claude-office-skills-smart-ocr":226,"similar-k1782aqmjfqy0qysysgq76w9z1867e3x":227},{"_creationTime":4,"_id":5,"children":6,"community":7,"display":9,"evaluation":22,"identity":192,"isFallback":197,"parentExtension":198,"providers":199,"relations":203,"repo":205,"workflow":223},1778053148350.4734,"k1782aqmjfqy0qysysgq76w9z1867e3x",[],{"reviewCount":8},0,{"description":10,"installMethods":11,"name":12,"sourceUrl":13,"tags":14},">",{},"Smart OCR Skill","https://github.com/claude-office-skills/skills/tree/HEAD/smart-ocr",[15,16,17,18,19,20,21],"ocr","parsing","multilingual","paddleocr","extraction","image-processing","document-processing",{"_creationTime":23,"_id":24,"extensionId":5,"locale":25,"result":26,"trustSignals":180,"workflow":190},1778053561145.7488,"kn7e85709hrh43p1g03kstbvks867p8p","en",{"checks":27,"evaluatedAt":170,"extensionSummary":171,"promptVersionExtension":172,"promptVersionScoring":173,"rationale":174,"score":175,"summary":176,"tags":177,"targetMarket":178,"tier":179},[28,33,36,39,43,47,52,56,59,62,66,70,73,77,80,83,86,89,92,95,99,103,107,111,115,118,121,124,129,132,135,138,141,144,148,151,154,157,160,163,167],{"category":29,"check":30,"severity":31,"summary":32},"Practical Utility","Problem relevance","pass","The description clearly states the problem: extracting text from images and scanned documents with high accuracy using PaddleOCR.",{"category":29,"check":34,"severity":31,"summary":35},"Unique selling proposition","The skill leverages PaddleOCR, a powerful OCR engine supporting over 100 languages, offering specialized multilingual OCR capabilities beyond basic text extraction.",{"category":29,"check":37,"severity":31,"summary":38},"Production readiness","The skill is production-ready, supporting OCR for images, scanned PDFs, and handwritten documents, with detailed explanations of configuration and processing different sources.",{"category":40,"check":41,"severity":31,"summary":42},"Scope","Single responsibility principle","The skill has a single, well-defined responsibility: performing optical character recognition (OCR) on various document and image types.",{"category":40,"check":44,"severity":45,"summary":46},"Description quality","warning","The 'Displayed Description' field is minimal (a single '>'), providing no useful information about the skill's functionality.",{"category":48,"check":49,"severity":50,"summary":51},"Invocation","Scoped tools","not_applicable","This skill primarily relies on external libraries (PaddleOCR) and does not expose distinct, narrow tools in the typical sense; its functionality is a single, integrated OCR process.",{"category":53,"check":54,"severity":31,"summary":55},"Documentation","Configuration & parameter reference","The SKILL.md file provides detailed documentation for PaddleOCR configuration options, including defaults and explanations for various settings.",{"category":40,"check":57,"severity":31,"summary":58},"Tool naming","The primary tool/capability is 'smart-ocr', which is descriptive of its function. Underlying library functions are not user-facing tool names.",{"category":40,"check":60,"severity":31,"summary":61},"Minimal I/O surface","The skill's input is the document/image and optional language specifications, and its output is structured text data with confidence and bounding box information, which is appropriate for OCR.",{"category":63,"check":64,"severity":31,"summary":65},"License","License usability","The extension explicitly uses the MIT license, which is a permissive open-source license, and includes a LICENSE file.",{"category":67,"check":68,"severity":50,"summary":69},"Maintenance","Commit recency","No commit history is available for this specific skill file or its associated repository in the provided context.",{"category":67,"check":71,"severity":31,"summary":72},"Dependency Management","The SKILL.md file lists necessary dependencies (paddlepaddle, paddleocr, pdf2image, Pillow) and provides installation instructions for both CPU and GPU versions.",{"category":74,"check":75,"severity":50,"summary":76},"Security","Secret Management","The skill does not appear to handle any secrets or sensitive user credentials.",{"category":74,"check":78,"severity":31,"summary":79},"Injection","The skill focuses on OCR and text extraction; there is no indication of loading external data as instructions or executing arbitrary code from external sources.",{"category":74,"check":81,"severity":31,"summary":82},"Transitive Supply-Chain Grenades","The skill's dependencies are standard Python libraries and it processes local files or fetched bytes. It does not perform runtime code fetches or remote script executions.",{"category":74,"check":84,"severity":31,"summary":85},"Sandbox Isolation","The skill operates on provided files and does not appear to modify files outside its designated scope or interact with the user's OS in a destructive manner.",{"category":74,"check":87,"severity":31,"summary":88},"Sandbox escape primitives","No sandbox escape primitives like detached processes or retry loops around denied calls were found in the provided script snippets.",{"category":74,"check":90,"severity":31,"summary":91},"Data Exfiltration","The skill's primary function is local text extraction. There are no apparent outbound calls to submit confidential data, and external resources like fonts are standard and documented.",{"category":74,"check":93,"severity":31,"summary":94},"Hidden Text Tricks","The bundled content is free of hidden-steering tricks, and descriptions appear to be clean ASCII.",{"category":96,"check":97,"severity":31,"summary":98},"Hooks","Opaque code execution","The code snippets provided are standard Python and do not exhibit obfuscation, base64 payloads, or runtime script fetching.",{"category":100,"check":101,"severity":31,"summary":102},"Portability","Structural Assumption","The skill primarily operates on provided file paths or bytes and does not make assumptions about user-specific project organization beyond what's typical for Python scripts.",{"category":104,"check":105,"severity":50,"summary":106},"Trust","Issues Attention","No GitHub issues data is available for this skill.",{"category":108,"check":109,"severity":31,"summary":110},"Versioning","Release Management","The SKILL.md frontmatter explicitly declares a 'version: \"1.0\"'.",{"category":112,"check":113,"severity":45,"summary":114},"Code Execution","Validation","While configuration options are documented, the provided Python snippets for processing images and PDFs do not explicitly show the use of a schema library for input validation or sanitization of file paths and arguments.",{"category":74,"check":116,"severity":50,"summary":117},"Unguarded Destructive Operations","The skill is primarily read-only, focused on text extraction, and does not perform any destructive operations.",{"category":112,"check":119,"severity":31,"summary":120},"Error Handling","The provided Python code examples demonstrate basic error handling for file operations and OCR processing, with clear steps to extract text and process results.",{"category":112,"check":122,"severity":31,"summary":123},"Logging","The `show_log=False` option in PaddleOCR suggests logging can be controlled, and the provided Python examples focus on processing results rather than extensive logging, aligning with typical skill behavior.",{"category":125,"check":126,"severity":127,"summary":128},"Compliance","GDPR","info","The skill processes document content which may include personal data. While not directly submitting this data to a 3rd party, it's processed by the LLM, and no explicit sanitization is detailed.",{"category":125,"check":130,"severity":31,"summary":131},"Target market","The skill supports over 100 languages and processes general document types, with no specific regional or jurisdictional logic detected. The target market is global.",{"category":100,"check":133,"severity":31,"summary":134},"Runtime stability","The skill relies on standard Python libraries and the PaddleOCR engine, with clear installation instructions for CPU and GPU, indicating good portability across systems.",{"category":48,"check":136,"severity":31,"summary":137},"Precise Purpose","The SKILL.md clearly states the skill performs OCR using PaddleOCR, supports 100+ languages, and lists example prompts for common use cases like screenshots and scanned PDFs.",{"category":48,"check":139,"severity":31,"summary":140},"Concise Frontmatter","The frontmatter is concise and self-contained, clearly defining the skill's name, description, version, and capabilities within the first ~160 characters.",{"category":53,"check":142,"severity":31,"summary":143},"Concise Body","The SKILL.md body is well-structured, using code blocks for explanations and separating detailed procedural code into logical sections, staying within a reasonable length.",{"category":145,"check":146,"severity":31,"summary":147},"Context","Progressive Disclosure","The SKILL.md uses inline code blocks for explanations and examples, and provides links to external resources like the PaddleOCR GitHub repository, effectively disclosing information progressively.",{"category":145,"check":149,"severity":50,"summary":150},"Forked exploration","This skill performs a specific task (OCR) and does not involve deep exploration or code review that would necessitate 'context: fork'.",{"category":29,"check":152,"severity":31,"summary":153},"Usage examples","The skill provides three comprehensive, ready-to-use examples demonstrating business card reading, receipt scanning, and multilingual document processing, including input, invocation, and expected output.",{"category":29,"check":155,"severity":31,"summary":156},"Edge cases","The 'Limitations' section addresses potential edge cases such as handwritten text accuracy, small text detection, complex backgrounds, and rotated text, offering context and implicit recovery through the skill's design.",{"category":112,"check":158,"severity":50,"summary":159},"Tool Fallback","The skill does not appear to rely on external MCP tools that would require a fallback mechanism; it's self-contained with its Python dependencies.",{"category":100,"check":161,"severity":31,"summary":162},"Stack assumptions","The SKILL.md clearly states stack assumptions (Python, specific libraries) and provides installation instructions for both CPU and GPU versions, along with interpreter information.",{"category":164,"check":165,"severity":31,"summary":166},"Safety","Halt on unexpected state","The skill's design, focusing on processing provided inputs, and the structure of the Python examples imply that unexpected states like malformed input would likely result in an error rather than proceeding destructively.",{"category":100,"check":168,"severity":31,"summary":169},"Cross-skill coupling","The skill is self-contained and performs a specific OCR task, not implicitly relying on other skills or cross-linking to adjacent ones.",1778053463874,"This skill leverages the PaddleOCR engine to extract text from images, scanned PDFs, and handwritten documents. It supports multilingual processing, provides detailed configuration options, and includes practical examples for business cards, receipts, and multi-language documents.","2.0.0","3.4.0","The 'smart-ocr' skill is highly functional, well-documented, and adheres to best practices for code execution and security. The primary finding is the missing 'Displayed Description', which is a significant documentation gap, alongside a minor concern regarding explicit input validation schema usage in the provided code snippets. However, the comprehensive documentation, clear examples, and robust implementation of core functionalities position it as a high-quality, verified skill.",92,"A highly capable and well-documented skill for performing optical character recognition on various document types and images across over 100 languages.",[15,16,17,18,19,20,21],"global","verified",{"codeQuality":181,"collectedAt":182,"documentation":183,"maintenance":185,"security":186,"testCoverage":189},{},1778053451905,{"descriptionLength":184,"readmeSize":8},1,{},{"hasNpmPackage":187,"license":188,"smitheryVerified":187},false,"MIT",{"hasCi":187,"hasTests":187},{"updatedAt":191},1778053561145,{"githubOwner":193,"githubRepo":194,"locale":25,"slug":195,"type":196},"claude-office-skills","skills","smart-ocr","skill",true,null,{"extract":200,"llm":202},{"commitSha":201,"license":188},"9c4c7d5cd2813a8936bf2c9fdb174ea883b85a11",{"promptVersionExtension":172,"promptVersionScoring":173,"score":175,"targetMarket":178,"tier":179},{"repoId":204},"kd7fw7xbj58qc2z8whrrjptbed8659db",{"_creationTime":206,"_id":204,"identity":207,"providers":209,"workflow":220},1777995558409.8474,{"githubOwner":193,"githubRepo":194,"sourceUrl":208},"https://github.com/claude-office-skills/skills",{"discover":210,"github":213},{"sources":211},[212],"skills-sh",{"closedIssues90d":8,"forks":214,"license":188,"openIssues90d":215,"pushedAt":216,"readmeSize":217,"stars":218,"topics":219},27,2,1769868236000,29630,98,[],{"discoverAt":221,"extractAt":222,"githubAt":222,"updatedAt":222},1777995558409,1778053155657,{"anyEnrichmentAt":224,"extractAt":225,"githubAt":224,"llmAt":191,"updatedAt":191},1778053151766,1778053148350,[],[228,248,274,306,327,346],{"_creationTime":229,"_id":230,"community":231,"display":232,"identity":241,"providers":243,"relations":246,"workflow":247},1778053148350.4373,"k1776t2fdx4h35mkwpc5h201dd866zms",{"reviewCount":8},{"description":10,"installMethods":233,"name":234,"sourceUrl":235,"tags":236},{},"Document Parser Skill","https://github.com/claude-office-skills/skills/tree/HEAD/doc-parser",[16,21,237,238,15,19,239,240],"pdf","python","layout-analysis","docling",{"githubOwner":193,"githubRepo":194,"locale":25,"slug":242,"type":196},"doc-parser",{"extract":244,"llm":245},{"commitSha":201,"license":188},{"promptVersionExtension":172,"promptVersionScoring":173,"score":175,"targetMarket":178,"tier":179},{"repoId":204},{"anyEnrichmentAt":224,"extractAt":225,"githubAt":224,"llmAt":191,"updatedAt":191},{"_creationTime":249,"_id":250,"community":251,"display":252,"identity":259,"providers":263,"relations":268,"workflow":270},1778053339109.673,"k170fjdnm4zmjtz1rgs8zwq4418663pv",{"reviewCount":8},{"description":253,"installMethods":254,"name":255,"sourceUrl":256,"tags":257},"Use this skill to extract structured Markdown/JSON from PDFs and document images—tables with cell-level precision, formulas as LaTeX, figures, seals, charts, headers/footers, multi-column layout and correct reading order. Trigger terms: 文档解析, 版面分析, 版面还原, 表格提取, 公式识别, 多栏排版, 扫描件结构化, 发票, 财报, 复杂 PDF, PDF转Markdown, 图表, 阅读顺序; reading order, formula, LaTeX, layout parsing, structure extraction, PP-StructureV3, PaddleOCR-VL.",{},"PaddleOCR Document Parsing","https://github.com/aidenwu0209/paddleocr-skills/tree/HEAD/skills/paddleocr-doc-parsing",[237,258,15,239,18,238],"document-parsing",{"githubOwner":260,"githubRepo":261,"locale":25,"slug":262,"type":196},"aidenwu0209","paddleocr-skills","paddleocr-doc-parsing",{"extract":264,"llm":267},{"commitSha":265,"license":266},"ca41406b66e5a475f43b073a5b731dfd1b9c50b1","Apache-2.0",{"promptVersionExtension":172,"promptVersionScoring":173,"score":218,"targetMarket":178,"tier":179},{"repoId":269},"kd7b1t00prnctc7258swvw0hs5865sjq",{"anyEnrichmentAt":271,"extractAt":272,"githubAt":271,"llmAt":273,"updatedAt":273},1778053339393,1778053339109,1778053352237,{"_creationTime":275,"_id":276,"community":277,"display":278,"identity":291,"providers":295,"relations":300,"workflow":302},1778054812528.7214,"k17c4avaab2db2m79et4f4hnwn867qj1",{"reviewCount":8},{"description":279,"installMethods":280,"name":281,"sourceUrl":282,"tags":283},"Multimodal AI processing via Google Gemini API (2M tokens context). Capabilities: audio (transcription, 9.5hr max, summarization, music analysis), images (captioning, OCR, object detection, segmentation, visual Q&A), video (scene detection, 6hr max, YouTube URLs, temporal analysis), documents (PDF extraction, tables, forms, charts), image generation (text-to-image, editing). Actions: transcribe, analyze, extract, caption, detect, segment, generate from media. Keywords: Gemini API, audio transcription, image captioning, OCR, object detection, video analysis, PDF extraction, text-to-image, multimodal, speech recognition, visual Q&A, scene detection, YouTube transcription, table extraction, form processing, image generation, Imagen. Use when: transcribing audio/video, analyzing images/screenshots, extracting data from PDFs, processing YouTube videos, generating images from text, implementing multimodal AI features.",{},"AI Multimodal Processing Skill","https://github.com/samhvw8/dot-claude/tree/HEAD/skills/ai-multimodal",[284,285,286,287,288,21,289,15,290],"gemini-api","multimodal","audio","image","video","text-to-image","transcription",{"githubOwner":292,"githubRepo":293,"locale":25,"slug":294,"type":196},"samhvw8","dot-claude","ai-multimodal",{"extract":296,"llm":298},{"commitSha":297,"license":188},"28c76162116d2eedab131c0e1548fdc76a2999f7",{"promptVersionExtension":172,"promptVersionScoring":173,"score":299,"targetMarket":178,"tier":179},95,{"repoId":301},"kd79ad9dpqazy79y2s6rvajgjn865xek",{"anyEnrichmentAt":303,"extractAt":304,"githubAt":303,"llmAt":305,"updatedAt":305},1778054813688,1778054812528,1778054896678,{"_creationTime":307,"_id":308,"community":309,"display":310,"identity":320,"providers":322,"relations":325,"workflow":326},1778053148350.4636,"k171dtxahnz3h8q0jz3gk6akks867ym1",{"reviewCount":8},{"description":311,"installMethods":312,"name":313,"sourceUrl":314,"tags":315},"Extract text, tables, and metadata from PDFs using pdfplumber",{},"PDF Extraction","https://github.com/claude-office-skills/skills/tree/HEAD/pdf-extraction",[237,19,316,317,318,319,21],"text","tables","metadata","pdfplumber",{"githubOwner":193,"githubRepo":194,"locale":25,"slug":321,"type":196},"pdf-extraction",{"extract":323,"llm":324},{"commitSha":201,"license":188},{"promptVersionExtension":172,"promptVersionScoring":173,"score":299,"targetMarket":178,"tier":179},{"repoId":204},{"anyEnrichmentAt":224,"extractAt":225,"githubAt":224,"llmAt":191,"updatedAt":191},{"_creationTime":328,"_id":329,"community":330,"display":331,"identity":338,"providers":340,"relations":344,"workflow":345},1778053148350.4768,"k17c4t5g480bzq5t7qrjgbjsys867fb5",{"reviewCount":8},{"description":10,"installMethods":332,"name":333,"sourceUrl":334,"tags":335},{},"Table Extractor","https://github.com/claude-office-skills/skills/tree/HEAD/table-extractor",[237,19,336,337,16],"table","camelot",{"githubOwner":193,"githubRepo":194,"locale":25,"slug":339,"type":196},"table-extractor",{"extract":341,"llm":342},{"commitSha":201,"license":188},{"promptVersionExtension":172,"promptVersionScoring":173,"score":175,"targetMarket":178,"tier":343},"flagged",{"repoId":204},{"anyEnrichmentAt":224,"extractAt":225,"githubAt":224,"llmAt":191,"updatedAt":191},{"_creationTime":347,"_id":348,"community":349,"display":350,"identity":358,"providers":360,"relations":364,"workflow":365},1778053148350.4524,"k1768qh208by3vwy8tre4tmw59866348",{"reviewCount":8},{"description":10,"installMethods":351,"name":352,"sourceUrl":353,"tags":354},{},"Layout Analyzer","https://github.com/claude-office-skills/skills/tree/HEAD/layout-analyzer",[355,356,15,357,237,16],"document-analysis","layout","surya",{"githubOwner":193,"githubRepo":194,"locale":25,"slug":359,"type":196},"layout-analyzer",{"extract":361,"llm":362},{"commitSha":201,"license":188},{"promptVersionExtension":172,"promptVersionScoring":173,"score":363,"targetMarket":178,"tier":179},90,{"repoId":204},{"anyEnrichmentAt":224,"extractAt":225,"githubAt":224,"llmAt":191,"updatedAt":191}]