<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Index the document in Alfresco Forum</title>
    <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110524#M30904</link>
    <description>&lt;P&gt;Content&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Wed, 06 Nov 2019 14:52:13 GMT</pubDate>
    <dc:creator>Mahesha</dc:creator>
    <dc:date>2019-11-06T14:52:13Z</dc:date>
    <item>
      <title>Index the document</title>
      <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110522#M30902</link>
      <description>&lt;P&gt;I am new to Alfresco.&lt;/P&gt;&lt;P&gt;I use Alfresco Community Edition.&lt;/P&gt;&lt;P&gt;I want to index a Word document and also an image.&lt;/P&gt;&lt;P&gt;Can anyone explain how I can achieve this?&lt;/P&gt;</description>
      <pubDate>Wed, 06 Nov 2019 12:48:01 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110522#M30902</guid>
      <dc:creator>Mahesha</dc:creator>
      <dc:date>2019-11-06T12:48:01Z</dc:date>
    </item>
    <item>
      <title>Re: Index the document</title>
      <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110523#M30903</link>
      <description>&lt;P&gt;are you using Alfresco Content or Process?&lt;/P&gt;</description>
      <pubDate>Wed, 06 Nov 2019 14:48:54 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110523#M30903</guid>
      <dc:creator>jljwoznica</dc:creator>
      <dc:date>2019-11-06T14:48:54Z</dc:date>
    </item>
    <item>
      <title>Re: Index the document</title>
      <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110524#M30904</link>
      <description>&lt;P&gt;Content&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 06 Nov 2019 14:52:13 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110524#M30904</guid>
      <dc:creator>Mahesha</dc:creator>
      <dc:date>2019-11-06T14:52:13Z</dc:date>
    </item>
    <item>
      <title>Re: Index the document</title>
      <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110525#M30905</link>
      <description>&lt;P&gt;Can you provide a little more information? You want to add a document and have it full text indexed and also generated into an image file?&lt;/P&gt;</description>
      <pubDate>Wed, 20 Nov 2019 20:16:52 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110525#M30905</guid>
      <dc:creator>jljwoznica</dc:creator>
      <dc:date>2019-11-20T20:16:52Z</dc:date>
    </item>
    <item>
      <title>Re: Index the document</title>
      <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110526#M30906</link>
      <description>&lt;P&gt;Hi &lt;A href="https://migration33.stage.lithium.com/t5/user/viewprofilepage/user-id/2080"&gt;@jljwoznica&lt;/A&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;1. I scan documents in bulk to get images, and then I need to upload them to Alfresco.&lt;/P&gt;&lt;P&gt;2. I also need to upload a bulk of non-readable PDFs to Alfresco.&lt;/P&gt;&lt;P&gt;3. I need to name/index both types of document for easy searching.&lt;/P&gt;&lt;P&gt;Can you please help me solve this problem?&lt;/P&gt;&lt;P&gt;&lt;SPAN class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Capture.PNG" style="width: 742px;"&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://connect.hyland.com/t5/image/serverpage/image-id/366i3290889E5F58AA85/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 21 Nov 2019 06:02:22 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110526#M30906</guid>
      <dc:creator>Mahesha</dc:creator>
      <dc:date>2019-11-21T06:02:22Z</dc:date>
    </item>
    <item>
      <title>Re: Index the document</title>
      <link>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110527#M30907</link>
      <description>&lt;P&gt;Ok - so these are image files that are not in a readable format (not yet OCRed). Alfresco does not provide those tools out of the box, but there are plenty of options. You can integrate with another tool, like AWS Textract (I am not sure of your architecture - on premise or cloud, etc.). You can also use transformations to perform OCR with other tools.&amp;nbsp;&lt;/P&gt;
&lt;P&gt;However, based on what you are trying to do, the best method might be a capture (ingestion) provider - like Ephesoft. These tools can be trained to find specific information (by zone or surrounding text), run optical character recognition on it, and then either save the result as full text or apply the information found to particular custom metadata fields.&lt;/P&gt;
&lt;P&gt;However, you will need another product to work in conjunction with Alfresco - or at least that is my experience.&lt;/P&gt;</description>
      <pubDate>Thu, 21 Nov 2019 15:13:01 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-forum/index-the-document/m-p/110527#M30907</guid>
      <dc:creator>jljwoznica</dc:creator>
      <dc:date>2019-11-21T15:13:01Z</dc:date>
    </item>
  </channel>
</rss>

