[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"extension-skill-jacob-g-park-polaris-datainsight-doc-extract-zh-CN":3,"guides-for-jacob-g-park-polaris-datainsight-doc-extract":289,"similar-k179a6hzxwhnrt79a8f8r0b89s86m035-zh-CN":290},{"_creationTime":4,"_id":5,"children":6,"community":7,"display":9,"evaluation":15,"identity":243,"isFallback":232,"parentExtension":248,"providers":249,"relations":256,"repo":259,"tags":285,"workflow":286},1778691275162.481,"k179a6hzxwhnrt79a8f8r0b89s86m035",[],{"reviewCount":8},0,{"description":10,"installMethods":11,"name":13,"sourceUrl":14},"使用 Polaris AI DataInsight Doc Extract API 从 Office 文档（DOCX、PPTX、XLSX、HWP、HWPX）中提取结构化数据。当用户想要解析、分析或提取文档文件中的文本、表格、图表、图像或形状时使用。每当用户提及从 Word、PowerPoint、Excel、HWP 或 HWPX 文件提取内容、想要解析文档结构、需要为 RAG 管道转换文档数据，或询问有关读取 Office 格式文档中的表格、图表或文本时，都可以调用此技能 — 即使他们没有明确提到“DataInsight”或“Polaris”。",{"claudeCode":12},"jacob-g-park/polaris-datainsight-doc-extract","Polaris AI DataInsight — 文档提取技能","https://github.com/jacob-g-park/polaris-datainsight-doc-extract",{"_creationTime":16,"_id":17,"extensionId":5,"locale":18,"result":19,"trustSignals":230,"workflow":241},1778691275162.4812,"kn72ydec3kwdhxj99rx4f0aejh86mcgz","zh-CN",{"checks":20,"evaluatedAt":192,"extensionSummary":193,"features":194,"nonGoals":199,"practices":203,"prerequisites":204,"promptVersionExtension":206,"promptVersionScoring":207,"purpose":208,"rationale":209,"score":210,"summary":211,"tags":212,"tier":218,"useCases":219,"workflow":224},[21,26,29,33,37,41,45,48,52,56,60,63,66,69,73,76,79,82,85,88,92,96,99,102,105,108,111,114,117,120,124,127,131,135,138,141,144,147,151,154,157,160,163,166,169,173,177,182,185,189],{"category":22,"check":23,"severity":24,"summary":25},"调用","精确的目的","pass","描述清楚地说明了技能的功能（通过 Polaris API 从 Office 文档中提取数据），并提供了具体的用例和调用触发器。",{"category":22,"check":27,"severity":24,"summary":28},"简洁的前端内容","前端内容简洁且自成一体，在字符限制内有效地总结了核心功能，并提供了清晰的触发短语。",{"category":30,"check":31,"severity":24,"summary":32},"文档","简洁的正文","SKILL.md 的正文结构良好，对高级主题使用渐进披露，并避免了不必要的冗余。",{"category":34,"check":35,"severity":24,"summary":36},"上下文","渐进披露","SKILL.md 使用相对路径链接到 API 响应结构和用法模式等详细信息，避免了直接嵌入大型数据结构。",{"category":34,"check":38,"severity":39,"summary":40},"分支探索","not_applicable","此技能不是需要分支上下文的探索性强的技能。",{"category":42,"check":43,"severity":24,"summary":44},"实用性","使用示例","SKILL.md 提供了清晰、可直接使用的 Python 和 curl 示例，用于基本和高级用法，展示了输入、调用和预期输出。",{"category":42,"check":46,"severity":24,"summary":47},"边缘情况","SKILL.md 记录了文件大小、超时和速率限制，并讨论了使用模式，有效地涵盖了潜在的失败模式和限制。",{"category":49,"check":50,"severity":39,"summary":51},"代码执行","工具回退","该技能不依赖外部 MCP 工具；它直接与描述的 API 端点交互。",{"category":53,"check":54,"severity":39,"summary":55},"安全","意外状态下停止","该技能的工作流程似乎不涉及破坏性操作或复杂的有状态管理，因此不需要明确的前置条件检查和停止。",{"category":57,"check":58,"severity":24,"summary":59},"可移植性","跨技能耦合","该技能是独立的，并且似乎不隐式依赖其他技能；未提及跨技能协调是其要求。",{"category":42,"check":61,"severity":24,"summary":62},"问题相关性","描述清楚地指出了用户从各种 Office 文档格式中提取结构化数据的痛点。",{"category":42,"check":64,"severity":24,"summary":65},"独特卖点","该技能利用特定的 API（Polaris AI DataInsight Doc Extract）从多种文档类型中提供结构化数据提取，其价值超越了一般 LLM 的功能。",{"category":42,"check":67,"severity":24,"summary":68},"生产就绪性","该技能详细说明了 API 身份验证、端点、请求/响应结构，并提供了清晰的使用示例，涵盖了其规定用例的完整生命周期。",{"category":70,"check":71,"severity":24,"summary":72},"范围","单一职责原则","该技能专注于单一职责：使用特定的 API 从指定的文档类型中提取结构化数据。",{"category":70,"check":74,"severity":24,"summary":75},"描述质量","描述准确地反映了技能的功能和限制，并且格式良好，便于用户阅读。",{"category":22,"check":77,"severity":39,"summary":78},"作用域工具","此技能不公开多个工具；它代表一种单一的、由 API 驱动的功能。",{"category":30,"check":80,"severity":24,"summary":81},"配置和参数参考","SKILL.md 清楚地记录了 API 端点、必需的标头（包括通过环境变量设置的 API 密钥）以及支持的文件格式和限制。",{"category":70,"check":83,"severity":39,"summary":84},"工具命名","这是一个技能，而不是一组具有名称的不同工具。",{"category":70,"check":86,"severity":24,"summary":87},"最小 I/O 表面","技能的输入是文件路径和 API 密钥（通过环境变量），输出是结构化 JSON，符合所述任务。",{"category":89,"check":90,"severity":24,"summary":91},"许可证","许可证可用性","该技能定义是在 Apache 2.0 许可下，服务使用受 Polaris AI 条款的约束，这一点已清楚说明。",{"category":93,"check":94,"severity":24,"summary":95},"维护","提交新鲜度","上次提交是在 2026-02-27，在过去 3 个月内。",{"category":93,"check":97,"severity":39,"summary":98},"依赖管理","该技能似乎没有需要显式管理在包内的第三方依赖项。",{"category":53,"check":100,"severity":24,"summary":101},"秘密管理","API 密钥通过环境变量处理，并且不回显在输出中，遵循最佳实践。",{"category":53,"check":103,"severity":24,"summary":104},"注入","该技能处理文件输入和 API 交互；没有迹象表明正在加载和执行不受信任的第三方数据作为指令。",{"category":53,"check":106,"severity":24,"summary":107},"传递供应链炸弹","该技能与文档化的 API 端点交互，并且在运行时不获取或执行外部代码或内容。",{"category":53,"check":109,"severity":24,"summary":110},"沙箱隔离","该技能的主要交互是与外部 API；它似乎不会修改其预期范围之外的文件。",{"category":53,"check":112,"severity":24,"summary":113},"沙箱逃逸原语","在提供的技能描述和示例中，没有发现分离的进程或拒绝重试循环的证据。",{"category":53,"check":115,"severity":24,"summary":116},"数据泄露","该技能仅对 Polaris API 进行已记录的调用，并且似乎不会泄露机密数据。",{"category":53,"check":118,"severity":24,"summary":119},"隐藏文本技巧","捆绑的内容和描述似乎没有隐藏的操控技巧或混淆。",{"category":121,"check":122,"severity":24,"summary":123},"钩子","不透明的代码执行","提供的 Python 代码示例清晰易读，没有证据表明存在混淆或不透明执行。",{"category":57,"check":125,"severity":24,"summary":126},"结构假设","该技能假设存在用于输入的​​文件路径和用于 API 密钥的环境变量，这些都是标准且有文档记录的。",{"category":128,"check":129,"severity":39,"summary":130},"信任","问题关注","没有可供评估的开放或已关闭的问题数据。",{"category":132,"check":133,"severity":24,"summary":134},"版本控制","发布管理","该技能定义在 SKILL.md 前端内容中有 `name` 和 `description`，并且代码已提交，这表明了一种版本控制形式。",{"category":49,"check":136,"severity":24,"summary":137},"验证","Python 示例演示了对 API 响应和文件操作的基本错误处理，暗示了一定程度的验证。",{"category":53,"check":139,"severity":24,"summary":140},"无保护的破坏性操作","该技能对用户文件是只读的；其主要操作是出站 API 调用。",{"category":49,"check":142,"severity":24,"summary":143},"错误处理","提供的 Python 示例包括对 API 状态码和 ZIP 文件解析的显式错误处理。",{"category":49,"check":145,"severity":39,"summary":146},"日志记录","该技能侧重于 API 交互，不涉及需要本地审计日志记录的本地破坏性操作或出站调用。",{"category":148,"check":149,"severity":39,"summary":150},"合规性","GDPR","该技能处理文档内容，但似乎不专门针对或处理需要 GDPR 清理的个人数据。",{"category":148,"check":152,"severity":24,"summary":153},"目标市场","该技能的功能是全球性的；它处理文档并与 API 交互，没有区域限制。",{"category":57,"check":155,"severity":24,"summary":156},"运行时稳定性","该技能使用标准的 Python 库并进行 API 调用，使其与 Python 环境具有广泛的兼容性。",{"category":30,"check":158,"severity":39,"summary":159},"README","SKILL.md 文件充当主要文档，并满足 README 的要求。",{"category":70,"check":161,"severity":39,"summary":162},"工具表面大小","此技能代表一种单一功能，而不是一组工具。",{"category":22,"check":164,"severity":39,"summary":165},"重叠的近义词工具","此技能不公开可能接近同义词的多个工具。",{"category":30,"check":167,"severity":24,"summary":168},"幻影功能","所有已记录的功能，例如 API 交互和结构化输出，都按描述实现。",{"category":170,"check":171,"severity":24,"summary":172},"安装","安装说明","SKILL.md 提供了清晰的安装步骤（API 密钥设置）以及可复制粘贴的 Python 和 curl 示例。",{"category":174,"check":175,"severity":24,"summary":176},"错误","可操作的错误消息","Python 示例演示了对 API 响应和文件操作的可操作错误处理，提供了状态码和错误文本。",{"category":178,"check":179,"severity":180,"summary":181},"执行","固定的依赖项","info","Python 脚本依赖于标准库，但未固定特定版本，这可能导致兼容性问题。",{"category":70,"check":183,"severity":39,"summary":184},"试运行预览","该技能的主要功能是通过 API 进行数据提取，而不是需要试运行预览的状态更改操作。",{"category":186,"check":187,"severity":24,"summary":188},"协议","幂等重试和超时","Python 示例包括基本的 HTTP 错误处理，并通过 API 自身的限制以及明确提及 10 分钟超时时间来暗示超时机制。",{"category":148,"check":190,"severity":24,"summary":191},"遥测选择加入","没有提到此技能会发出遥测数据；因此，它被视为默认选择加入（无遥测）。",1778691255638,"此技能使用 Polaris AI DataInsight Doc Extract API 从 Office 文档格式（DOCX、PPTX、XLSX、HWP、HWPX）中提取结构化数据（文本、表格、图表、图像、形状）。它处理身份验证、文件上传、ZIP 响应处理，并以统一模式的 JSON 格式提供数据。",[195,196,197,198],"从文档中提取文本、表格、图表、图像、形状、公式","支持 DOCX、PPTX、XLSX、HWP、HWPX 文件格式","以结构化的 `unifiedSchema` JSON 格式提供数据","处理 API 身份验证和响应解析",[200,201,202],"编辑或修改文档","提取列表中未包含的文件格式的数据","替换 Polaris AI DataInsight API 本身",[],[205],"Polaris AI DataInsight API 密钥（存储在 POLARIS_DATAINSIGHT_API_KEY 环境变量中）","3.0.0","4.4.0","使您能够使用专用 API 解析、分析和提取各种 Office 文档类型中的结构化内容。","该技能文档齐全、已准备好投入生产，并遵循安全最佳实践。唯一的小问题是 Python 依赖项缺少显式的版本固定，但这仅供参考。",99,"通过 Polaris API 从 Office 文档中提取结构化数据的高质量技能。",[213,214,215,216,217],"document-processing","api","office-suite","data-extraction","rag","verified",[220,221,222,223],"解析和分析 Office 文档内容","为 RAG 管道转换文档数据","将表格和图表提取为结构化格式（CSV、JSON）","自动化从文档文件中提取数据",[225,226,227,228,229],"使用提供的 API 密钥与 Polaris DataInsight API 进行身份验证。","通过 multipart/form-data POST 上传目标文档文件（DOCX、PPTX、XLSX、HWP、HWPX）。","从 API 接收 ZIP 文件响应。","解压 ZIP 文件并加载包含的 `unifiedSchema` JSON。","返回结构化的 JSON 数据，按页面和元素类型组织。",{"codeQuality":231,"collectedAt":233,"documentation":234,"maintenance":236,"security":239,"testCoverage":240},{"hasLockfile":232},false,1778691238101,{"descriptionLength":235,"readmeSize":8},582,{"closedIssues90d":8,"forks":8,"hasChangelog":232,"openIssues90d":8,"pushedAt":237,"stars":238},1772181340000,2,{"hasNpmPackage":232,"smitheryVerified":232},{"hasCi":232,"hasTests":232},{"updatedAt":242},1778691275162,{"basePath":244,"githubOwner":245,"githubRepo":246,"locale":18,"slug":246,"type":247},"skills/polaris-datainsight-doc-extract","jacob-g-park","polaris-datainsight-doc-extract","skill",null,{"evaluate":250,"extract":253},{"promptVersionExtension":206,"promptVersionScoring":207,"score":210,"tags":251,"targetMarket":252,"tier":218},[213,214,215,216,217],"global",{"commitSha":254,"license":255},"HEAD","Apache-2.0",{"repoId":257,"translatedFrom":258},"kd712xd320svz04am16hb3z7gs86nnp8","k179pfttbef03w90924p19s63x86nz28",{"_creationTime":260,"_id":257,"identity":261,"providers":262,"workflow":281},1778689987483.1523,{"githubOwner":245,"githubRepo":246,"sourceUrl":14},{"classify":263,"discover":275,"github":278},{"commitSha":254,"extensions":264},[265],{"basePath":244,"description":266,"displayName":246,"installMethods":267,"rationale":268,"selectedPaths":269,"source":273,"sourceLanguage":274,"type":247},"Extract structured data from Office documents (DOCX, PPTX, XLSX, HWP, HWPX) using the Polaris AI DataInsight Doc Extract API. Use when the user wants to parse, analyze, or extract text, tables, charts, images, or shapes from document files. Invoke this skill whenever the user mentions extracting content from Word, PowerPoint, Excel, HWP, or HWPX files, wants to parse document structure, needs to convert document data for RAG pipelines, or asks about reading tables, charts, or text from Office-format documents — even if they don't explicitly mention \"DataInsight\" or \"Polaris\".",{"claudeCode":12},"SKILL.md frontmatter at skills/polaris-datainsight-doc-extract/SKILL.md",[270],{"path":271,"priority":272},"SKILL.md","mandatory","rule","en",{"sources":276},[277],"manual",{"closedIssues90d":8,"description":279,"forks":8,"openIssues90d":8,"pushedAt":237,"readmeSize":8,"stars":238,"topics":280},"",[],{"classifiedAt":282,"discoverAt":283,"extractAt":284,"githubAt":284,"updatedAt":282},1778691222473,1778689987483,1778691220794,[214,216,213,215,217],{"evaluatedAt":287,"extractAt":288,"updatedAt":242},1778691255755,1778691222643,[],[291,321,340,359,380,402],{"_creationTime":292,"_id":293,"community":294,"display":295,"identity":301,"providers":305,"relations":314,"tags":317,"workflow":318},1778691104676.009,"k178w7wd1nma48cbwy5hbrnq7s86nyvy",{"reviewCount":8},{"description":296,"installMethods":297,"name":299,"sourceUrl":300},"Extract typed JSON from public website pages using a schema.",{"claudeCode":298},"iterationlayer/skills","website-extraction-api","https://github.com/iterationlayer/skills",{"basePath":302,"githubOwner":303,"githubRepo":304,"locale":274,"slug":299,"type":247},"skills/website-extraction-api","iterationlayer","skills",{"evaluate":306,"extract":313},{"promptVersionExtension":206,"promptVersionScoring":207,"score":307,"tags":308,"targetMarket":252,"tier":218},100,[309,216,310,311,214,312],"web-scraping","json","schema","automation",{"commitSha":254},{"parentExtensionId":315,"repoId":316},"k1721s0xmp59902ybtpakrrffn86n10s","kd76p4g2qmtrkgx99cnab3683d86n4g8",[214,312,216,310,311,309],{"evaluatedAt":319,"extractAt":320,"updatedAt":319},1778694012840,1778691104676,{"_creationTime":322,"_id":323,"community":324,"display":325,"identity":329,"providers":331,"relations":336,"tags":337,"workflow":338},1778691104675.9915,"k172qd89p5z3xybe3h8ncdmns586nd5g",{"reviewCount":8},{"description":326,"installMethods":327,"name":328,"sourceUrl":300},"Extract SKUs, product names, unit prices, availability, and minimum order quantities from a supplier catalog page.",{"claudeCode":298},"extract-supplier-catalog-from-website",{"basePath":330,"githubOwner":303,"githubRepo":304,"locale":274,"slug":328,"type":247},"skills/extract-supplier-catalog-from-website",{"evaluate":332,"extract":335},{"promptVersionExtension":206,"promptVersionScoring":207,"score":307,"tags":333,"targetMarket":252,"tier":218},[309,216,334,214,312],"procurement",{"commitSha":254},{"parentExtensionId":315,"repoId":316},[214,312,216,334,309],{"evaluatedAt":339,"extractAt":320,"updatedAt":339},1778692514878,{"_creationTime":341,"_id":342,"community":343,"display":344,"identity":348,"providers":350,"relations":355,"tags":356,"workflow":357},1778691104675.9893,"k172n42pm2yc36v1fmx3f243t986n52g",{"reviewCount":8},{"description":345,"installMethods":346,"name":347,"sourceUrl":300},"Extract property address, price, room count, and features from a listing document into structured JSON for MLS and property platforms.",{"claudeCode":298},"extract-real-estate-listing",{"basePath":349,"githubOwner":303,"githubRepo":304,"locale":274,"slug":347,"type":247},"skills/extract-real-estate-listing",{"evaluate":351,"extract":354},{"promptVersionExtension":206,"promptVersionScoring":207,"score":307,"tags":352,"targetMarket":252,"tier":218},[213,216,353,310,312],"real-estate",{"commitSha":254},{"parentExtensionId":315,"repoId":316},[312,216,213,310,353],{"evaluatedAt":358,"extractAt":320,"updatedAt":358},1778692318469,{"_creationTime":360,"_id":361,"community":362,"display":363,"identity":367,"providers":369,"relations":376,"tags":377,"workflow":378},1778691104675.9834,"k17bwxnh9scy64bmm9anmf7bbx86mtvn",{"reviewCount":8},{"description":364,"installMethods":365,"name":366,"sourceUrl":300},"Extract vehicle identification, owner details, registration dates, and technical specifications from vehicle registration documents.",{"claudeCode":298},"extract-fleet-vehicle-registration",{"basePath":368,"githubOwner":303,"githubRepo":304,"locale":274,"slug":366,"type":247},"skills/extract-fleet-vehicle-registration",{"evaluate":370,"extract":375},{"promptVersionExtension":206,"promptVersionScoring":207,"score":307,"tags":371,"targetMarket":252,"tier":218},[213,216,372,373,374],"fleet-management","api-integration","pdf",{"commitSha":254},{"parentExtensionId":315,"repoId":316},[373,216,213,372,374],{"evaluatedAt":379,"extractAt":320,"updatedAt":379},1778691789036,{"_creationTime":381,"_id":382,"community":383,"display":384,"identity":388,"providers":390,"relations":398,"tags":399,"workflow":400},1778691104675.9897,"k17fpgdfkq2ktrjw2phyx6c9f586ma8t",{"reviewCount":8},{"description":385,"installMethods":386,"name":387,"sourceUrl":300},"Extract merchant, date, line items, tax, and total from receipts.",{"claudeCode":298},"extract-receipt-data",{"basePath":389,"githubOwner":303,"githubRepo":304,"locale":274,"slug":387,"type":247},"skills/extract-receipt-data",{"evaluate":391,"extract":397},{"promptVersionExtension":206,"promptVersionScoring":207,"score":210,"tags":392,"targetMarket":252,"tier":218},[393,394,395,213,396,216],"receipts","finance","extraction","ocr",{"commitSha":254},{"parentExtensionId":315,"repoId":316},[216,213,395,394,396,393],{"evaluatedAt":401,"extractAt":320,"updatedAt":401},1778692373588,{"_creationTime":403,"_id":404,"community":405,"display":406,"identity":410,"providers":412,"relations":416,"tags":417,"workflow":418},1778691104675.988,"k1717wt59hjn0j8kydze6s09ph86nf9r",{"reviewCount":8},{"description":407,"installMethods":408,"name":409,"sourceUrl":300},"Extract appraised value, property details, and comparable sales from a property appraisal report into structured JSON.",{"claudeCode":298},"extract-property-appraisal",{"basePath":411,"githubOwner":303,"githubRepo":304,"locale":274,"slug":409,"type":247},"skills/extract-property-appraisal",{"evaluate":413,"extract":415},{"promptVersionExtension":206,"promptVersionScoring":207,"score":210,"tags":414,"targetMarket":252,"tier":218},[213,353,216,310,214],{"commitSha":254},{"parentExtensionId":315,"repoId":316},[214,216,213,310,353],{"evaluatedAt":419,"extractAt":320,"updatedAt":419},1778692195131]