<?xml version="1.0" encoding="utf-8" standalone="yes"?><rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom"><channel><title>Table on Sawyer Zheng's Blog</title><link>https://elated-raman-42e0c2.netlify.app/tags/table/</link><description>Recent content in Table on Sawyer Zheng's Blog</description><generator>Hugo</generator><language>zh-cn</language><lastBuildDate>Wed, 01 Feb 2023 18:11:43 +0800</lastBuildDate><atom:link href="https://elated-raman-42e0c2.netlify.app/tags/table/index.xml" rel="self" type="application/rss+xml"/><item><title>Table</title><link>https://elated-raman-42e0c2.netlify.app/post/notes/ai/nlp/table/</link><pubDate>Fri, 04 Nov 2022 00:00:00 +0000</pubDate><guid>https://elated-raman-42e0c2.netlify.app/post/notes/ai/nlp/table/</guid><description>&lt;div id="outline-container-headline-1" class="outline-2"&gt;
&lt;h2 id="headline-1"&gt;
表格抽取工具收集
&lt;/h2&gt;
&lt;div id="outline-text-headline-1" class="outline-text-2"&gt;
&lt;ul&gt;
&lt;li&gt;
&lt;p&gt;列表网站&lt;/p&gt;
&lt;ul&gt;
&lt;li&gt;
&lt;p&gt;&lt;a href="https://nanonets.com/blog/extract-tables-from-pdf/"&gt;How to Extract Tables from PDF - PDF to Table Extractor&lt;/a&gt;&lt;/p&gt;
&lt;ul&gt;
&lt;li&gt;有不同工具的对比说明&lt;/li&gt;
&lt;/ul&gt;
&lt;/li&gt;
&lt;/ul&gt;
&lt;/li&gt;
&lt;li&gt;
&lt;p&gt;tabula-py&lt;/p&gt;
&lt;ul&gt;
&lt;li&gt;&lt;a href="https://github.com/chezou/tabula-py"&gt;GitHub - chezou/tabula-py: Simple wrapper of tabula-java: extract table from …&lt;/a&gt;&lt;/li&gt;
&lt;li&gt;底层调用 tabula-java&lt;/li&gt;
&lt;/ul&gt;
&lt;/li&gt;
&lt;li&gt;
&lt;p&gt;PDFPatcher&lt;/p&gt;
&lt;ul&gt;
&lt;li&gt;&lt;a href="https://github.com/wmjordan/PDFPatcher"&gt;GitHub - wmjordan/PDFPatcher: PDF补丁丁——PDF工具箱，可以编辑书签、剪裁旋转页面、解除限制、提取或合并文档，探查文档结…&lt;/a&gt;&lt;/li&gt;
&lt;li&gt;支持 OCR 图片表格&lt;/li&gt;
&lt;/ul&gt;
&lt;/li&gt;
&lt;li&gt;
&lt;p&gt;camelot&lt;/p&gt;
&lt;/li&gt;
&lt;/ul&gt;
&lt;/div&gt;
&lt;/div&gt;</description></item></channel></rss>