<?xml version="1.0" encoding="UTF-8"?>
<!-- RSS 2.0 feed of releases for the PyPI project document-data-extractor.
     Each item is one released version; items appear newest first by pubDate. -->
<rss version="2.0">
  <channel>
    <!-- Channel metadata: feed title, project page, summary, language. -->
    <title>PyPI recent updates for document-data-extractor</title>
    <link>https://pypi.org/project/document-data-extractor/</link>
    <description>Recent updates to the Python Package Index for document-data-extractor</description>
    <language>en</language>

    <!-- Release 1.0.4 -->
    <item>
      <title>1.0.4</title>
      <link>https://pypi.org/project/document-data-extractor/1.0.4/</link>
      <description>Best open-source document to markdown extractor for LLM training data. Convert PDF, Word, PowerPoint, Excel, images, URLs to clean markdown, JSON, HTML locally. Alternative to Unstructured, Docling, Marker, MarkItDown, MinerU, PaddleOCR, Tesseract</description>
      <author>team@nanonets.com</author>
      <pubDate>Tue, 29 Jul 2025 08:25:54 GMT</pubDate>
    </item>

    <!-- Release 1.0.3 -->
    <item>
      <title>1.0.3</title>
      <link>https://pypi.org/project/document-data-extractor/1.0.3/</link>
      <description>Best open-source document to markdown extractor for LLM training data. Convert PDF, Word, PowerPoint, Excel, images, URLs to clean markdown, JSON, HTML locally. Alternative to Unstructured, Docling, Marker, MarkItDown, MinerU, PaddleOCR, Tesseract</description>
      <author>team@nanonets.com</author>
      <pubDate>Mon, 28 Jul 2025 14:00:12 GMT</pubDate>
    </item>

    <!-- Release 1.0.2 -->
    <item>
      <title>1.0.2</title>
      <link>https://pypi.org/project/document-data-extractor/1.0.2/</link>
      <description>Best open-source document to markdown extractor for LLM training data. Convert PDF, Word, PowerPoint, Excel, images, URLs to clean markdown, JSON, HTML locally. Alternative to Unstructured, Docling, Marker, MarkItDown, MinerU, PaddleOCR, Tesseract</description>
      <author>team@nanonets.com</author>
      <pubDate>Mon, 28 Jul 2025 12:27:29 GMT</pubDate>
    </item>

    <!-- Release 1.0.1 -->
    <item>
      <title>1.0.1</title>
      <link>https://pypi.org/project/document-data-extractor/1.0.1/</link>
      <description>Best open-source document to markdown extractor for LLM training data. Convert PDF, Word, PowerPoint, Excel, images, URLs to clean markdown, JSON, HTML locally. Alternative to Unstructured, Docling, Marker, MarkItDown, MinerU, PaddleOCR, Tesseract</description>
      <author>team@nanonets.com</author>
      <pubDate>Mon, 28 Jul 2025 12:22:48 GMT</pubDate>
    </item>

    <!-- Release 1.0.0 -->
    <item>
      <title>1.0.0</title>
      <link>https://pypi.org/project/document-data-extractor/1.0.0/</link>
      <description>Best open-source document to markdown extractor for LLM training data. Convert PDF, Word, PowerPoint, Excel, images, URLs to clean markdown, JSON, HTML locally. Alternative to Unstructured, Docling, Marker, MarkItDown, MinerU, PaddleOCR, Tesseract</description>
      <author>team@nanonets.com</author>
      <pubDate>Mon, 28 Jul 2025 12:19:56 GMT</pubDate>
    </item>
  </channel>
</rss>