<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF in Alfresco Archive</title>
    <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65466#M41455</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Estou com um problema nesse diretório também, e não faço a mínima ideia de como resolver&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;13:52:44,956 ERROR [org.alfresco.repo.search.impl.lucene.index.IndexInfo] Failed building filter reader beneath f041ae5b-d09c-4d84-9670-12ea5bc1aa2e&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;java.io.EOFException&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at java.io.DataInputStream.readInt(DataInputStream.java:375)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getDeletions(IndexInfo.java:1091)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.createMainIndexReader(IndexInfo.java:2056)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getMainIndexReferenceCountingReadOnlyIndexReader(IndexInfo.java:1219)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.AbstractLuceneBase.getSearcher(AbstractLuceneBase.java:168)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.ADMLuceneSearcherImpl.query(ADMLuceneSearcherImpl.java:286)&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Caused by: org.alfresco.repo.search.impl.lucene.LuceneIndexException: 03130000 Failed to open IndexSarcher for /opt/alfresco-3.4.d/alf_data/lucene-indexes/workspace/SpacesStore/&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.AbstractLuceneBase.getSearcher(AbstractLuceneBase.java:184)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.ADMLuceneSearcherImpl.query(ADMLuceneSearcherImpl.java:286)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.SearcherComponent.query(SearcherComponent.java:78)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent.isTxnIdPresentInIndex(AbstractReindexComponent.java:500)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent.isTxnPresentInIndex(AbstractReindexComponent.java:421)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.FullIndexRecoveryComponent.areTxnsInStartSample(FullIndexRecoveryComponent.java:265)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.FullIndexRecoveryComponent.reindexImpl(FullIndexRecoveryComponent.java:188)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent$1.execute(AbstractReindexComponent.java:300)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.transaction.RetryingTransactionHelper.doInTransaction(RetryingTransactionHelper.java:381)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.transaction.RetryingTransactionHelper.doInTransaction(RetryingTransactionHelper.java:272)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent.reindex(AbstractReindexComponent.java:306)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;… 35 more&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Caused by: java.io.EOFException&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at java.io.DataInputStream.readInt(DataInputStream.java:375)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getDeletions(IndexInfo.java:1091)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.createMainIndexReader(IndexInfo.java:2056)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getMainIndexReferenceCountingReadOnlyIndexReader(IndexInfo.java:1219)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.AbstractLuceneBase.getSearcher(AbstractLuceneBase.java:168)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;… 45 more&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:06,749 INFO [org.springframework.extensions.webscripts.DeclarativeRegistry] Registered 264 Web Scripts (+0 failed), 274 URLs&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:06,751 INFO [org.springframework.extensions.webscripts.DeclarativeRegistry] Registered 8 Package Description Documents (+0 failed)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:06,751 INFO [org.springframework.extensions.webscripts.DeclarativeRegistry] Registered 0 Schema Description Documents (+0 failed)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:07,354 INFO [org.springframework.extensions.webscripts.AbstractRuntimeContainer] Initialised Spring Surf Container Web Script Container (in 4490.937ms)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:07,524 INFO [org.springframework.extensions.webscripts.TemplateProcessorRegistry] Registered template processor freemarker for extension ftl&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:07,871 INFO [org.springframework.extensions.webscripts.ScriptProcessorRegistry] Registered script processor javascript for extension js&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,351 INFO [org.springframework.extensions.webscripts.TemplateProcessorRegistry] Registered template processor freemarker for extension ftl&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,370 INFO [org.springframework.extensions.webscripts.ScriptProcessorRegistry] Registered script processor javascript for extension js&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,614 INFO [org.springframework.extensions.webscripts.TemplateProcessorRegistry] Registered template processor freemarker for extension ftl&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,625 INFO [org.springframework.extensions.webscripts.ScriptProcessorRegistry] Registered script processor javascript for extension js&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:09,038 INFO [org.alfresco.web.site.servlet.SSOAuthenticationFilter] NTLMAuthenticationFilter initialised. &amp;lt;code/&amp;gt;&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Thu, 14 Apr 2016 15:19:00 GMT</pubDate>
    <dc:creator>sammuel</dc:creator>
    <dc:date>2016-04-14T15:19:00Z</dc:date>
    <item>
      <title>Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65460#M41449</link>
      <description>Boa tarde a todos,Tenho obtido falhas em pesquisas Lucene, sobre diversos documentos PDF.Para exemplo, fiz o upload de dois ficheiros para teste, com características idênticas (tamanho, motor de conversão PDF, programa que os converteu, versão do formato PDF, etc.). Estão ambos colocados no mesmo es</description>
      <pubDate>Fri, 19 Feb 2010 18:39:22 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65460#M41449</guid>
      <dc:creator>ricardoc-moreda</dc:creator>
      <dc:date>2010-02-19T18:39:22Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65461#M41450</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Olá Ricardo,&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; Poderia dar maiores detalhes desses documentos.:&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;ficheiros para teste, com características idênticas (tamanho, motor de conversão PDF, programa que os converteu, versão do formato PDF, etc.). Estão ambos colocados no mesmo espaço.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Qual o tipo de ferramenta vc. usou para conversão dos documentos para o formato PDF.Independente do Alfresco usar o Lucene como motor de pesquisa e indexão o Alfresco utiliza o&amp;nbsp; "pdf2swf "do SWF Tools&amp;nbsp; para visualizar os documentos.Já efetuei esses mesmos testes em pesquisas no repositório tanto em documentos como conteúdo de arquivos .doc,docx,.pdf ,etc.com sucesso.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&lt;SPAN&gt; Faça o mesmo teste com o Alfresco Share criando um projeto comum tanto para o Alfresco DM e para o Alfresco Share no espaço"Company Home &amp;gt; Web Projects &amp;gt; documentLibrary ".Apesar de utulizar o SO Windows e Alfresco Community Edition 3.2r creio que isso seja&amp;nbsp; indiferente. se puder envie os arquivos para o meu e-mail&amp;nbsp; - &lt;/SPAN&gt;&lt;A class="jive-link-email-small" href="mailto:wos.silva@uol.com.br" rel="nofollow noopener noreferrer"&gt;wos.silva@uol.com.br&lt;/A&gt;&lt;SPAN&gt; -.&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;O ideal é vc. renomear a sua pasta alfresco e fazer uma nova instalação sem alterar o "contentModel.xml",estude uma forma também de etiquetar os seus documentos usando "categorias".&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Verifique se está apontando para o "espaço" correto ao usar a pesquisa avançada.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Mande um abraço ao pessoal da Moredata&amp;nbsp; ai em&amp;nbsp; portugal, gosto muito do trabalho de vcs.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Qualquer coisa retorne ok….&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;sds.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Sun, 21 Feb 2010 23:26:38 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65461#M41450</guid>
      <dc:creator>williamsilva</dc:creator>
      <dc:date>2010-02-21T23:26:38Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65462#M41451</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;WilliamSilva wrote: Olá Ricardo,&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; Poderia dar maiores detalhes desses documentos.:&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;ficheiros para teste, com características idênticas (tamanho, motor de conversão PDF, programa que os converteu, versão do formato PDF, etc.). Estão ambos colocados no mesmo espaço.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Qual o tipo de ferramenta vc. usou para conversão dos documentos para o formato PDF.Independente do Alfresco usar o Lucene como motor de pesquisa e indexão o Alfresco utiliza o&amp;nbsp; "pdf2swf "do SWF Tools&amp;nbsp; para visualizar os documentos.Já efetuei esses mesmos testes em pesquisas no repositório tanto em documentos como conteúdo de arquivos .doc,docx,.pdf ,etc.com sucesso.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&lt;SPAN&gt; Faça o mesmo teste com o Alfresco Share criando um projeto comum tanto para o Alfresco DM e para o Alfresco Share no espaço"Company Home &amp;gt; Web Projects &amp;gt; documentLibrary ".Apesar de utulizar o SO Windows e Alfresco Community Edition 3.2r creio que isso seja&amp;nbsp; indiferente. se puder envie os arquivos para o meu e-mail&amp;nbsp; - &lt;/SPAN&gt;&lt;A class="jive-link-email-small" href="mailto:wos.silva@uol.com.br" rel="nofollow noopener noreferrer"&gt;wos.silva@uol.com.br&lt;/A&gt;&lt;SPAN&gt; -.&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;O ideal é vc. renomear a sua pasta alfresco e fazer uma nova instalação sem alterar o "contentModel.xml",estude uma forma também de etiquetar os seus documentos usando "categorias".&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Verifique se está apontando para o "espaço" correto ao usar a pesquisa avançada.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Mande um abraço ao pessoal da Moredata&amp;nbsp; ai em&amp;nbsp; portugal, gosto muito do trabalho de vcs.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Qualquer coisa retorne ok….&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;sds.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Viva William,&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Antes do mais, agradeço a resposta.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Os links para estes dois documentos são:&lt;/SPAN&gt;&lt;BR /&gt;&lt;A href="http://ecmarchitect.com/images/articles/alfresco-actions/actions-article.pdf" rel="nofollow noopener noreferrer"&gt;http://ecmarchitect.com/images/articles/alfresco-actions/actions-article.pdf&lt;/A&gt;&lt;BR /&gt;&lt;A href="http://ecmarchitect.com/images/articles/alfresco-content/content-article.pdf" rel="nofollow noopener noreferrer"&gt;http://ecmarchitect.com/images/articles/alfresco-content/content-article.pdf&lt;/A&gt;&lt;SPAN&gt; &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Mas posso adiantar as suas características (para ambos):&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Producer - OpenOffice 2.0&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Creator - Writer&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Security - No&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Format - PDF-1.4&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Tanto quanto sei, o Alfresco usa PDFBox para transformar o conteúdo dos documentos PDF em texto. Mas neste caso, apenas estou a testar acesso aos metadados das properties "creator" e "modifier", definidas em contentModel.xml. Quanto a alterações a este ficheiro, apenas me limitei a criar as linhas para forçar a indexação destas propriedades:&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;true&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;false&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;both&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Isto porque as pesquisas iniciais sem estas linhas também falhavam, e procurei esta solução. Sem qualquer bom resultado, infelizmente.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Para além destas duas propriedades padrão dos documentos em Alfresco, estou a utilizar um modelo personalizado onde acrescento outras propriedades, mas que passam pelo mesmo problema. Daí ter colocado nos exemplos apenas estas duas. O modelo personalizado torna-se irrelevante para esta análise. Mas essa é a razão porque não estou a utilizar categorias. Nos vários tipos de documentos descritos nesse modelo personalizado, utilizo inúmeras propriedades para cada um (data de saída, classificação, processo, destinatário, origem, etc.). Não se tornaria prático com categorias, imagino. &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Estou apontando para o espaço correctamente, como se pode ver nos três exemplos de pesquisa que coloquei. O estranho aqui é que, se procurar documentos nesse espaço obtenho os tais dois, se acrescentar à pesquisa o TEXT:*admin* já só obtenho um (apesar de ambos os documentos terem as mesmas propriedades, rigorosamente), e se o acréscimo for por TEXT:admin simplesmente nenhum documento é encontrado!&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Haverá alguma explicação para isto?!&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 22 Feb 2010 10:38:14 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65462#M41451</guid>
      <dc:creator>ricardoc-moreda</dc:creator>
      <dc:date>2010-02-22T10:38:14Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65463#M41452</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Ah! Um grande abraço de todo o pessoal da MoreData para o amigo William.&amp;nbsp; &lt;img id="smileyhappy" class="emoticon emoticon-smileyhappy" src="https://connect.hyland.com/i/smilies/16x16_smiley-happy.png" alt="Smiley Happy" title="Smiley Happy" /&gt; &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;É sempre bom sabermos que temos amigos para lá do Atlântico.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 22 Feb 2010 10:42:40 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65463#M41452</guid>
      <dc:creator>ricardoc-moreda</dc:creator>
      <dc:date>2010-02-22T10:42:40Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65464#M41453</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Olá Ricardo,&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt; Um link sobre .:&lt;/SPAN&gt;&lt;BR /&gt;&lt;A href="http://forums.alfresco.com/en/viewtopic.php?f=8&amp;amp;t=24033&amp;amp;start=0&amp;amp;st=0&amp;amp;sk=t&amp;amp;sd=a" rel="nofollow noopener noreferrer"&gt;http://forums.alfresco.com/en/viewtopic.php?f=8&amp;amp;t=24033&amp;amp;start=0&amp;amp;st=0&amp;amp;sk=t&amp;amp;sd=a&lt;/A&gt;&lt;BR /&gt;&lt;SPAN&gt; Na customização/implantação que comentei acima foi utilizado o "Adobe Acrobat 9.0 Pro", pois uma das regras do projeto pedia&amp;nbsp; pesquisa "container + navio",&amp;nbsp; os documentos foram convertidos para PDF, tratados (= análise, revisão, aprovação, etc) antecipadamente e depois povoados no DM com os metadados.No momento estou em transito , mais&amp;nbsp;&amp;nbsp; estarei lendo com mais calma o post e com certeza acharemos uma resposta.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;abraços.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;sds.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 22 Feb 2010 15:42:10 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65464#M41453</guid>
      <dc:creator>williamsilva</dc:creator>
      <dc:date>2010-02-22T15:42:10Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65465#M41454</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Obrigado William,&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Estive a ler esses posts que me indicaste. Segundo entendi, o problema residia na forma como o PDF era gerado ou modificado, certo?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Contudo, nos exemplos que eu coloquei, os dois ficheiros foram gerados pelo mesmo mecanismo (OpenOffice Writer 2.0), e não sofreram qualquer modificação. Além disso, até têm tamanhos idênticos. Logo, ambos estão em igualdade de circunstâncias. Mas numa das pesquisas pelo Node Browser que indiquei (TEXT:*admin*), apenas um deles é encontrado e, mais estranho ainda, com TEXT:admin, nenhum aparece! Apesar de ambos terem metadados com 'admin', como indiquei.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Ou será que me escapou alguma coisa nesses posts?&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 22 Feb 2010 16:47:41 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65465#M41454</guid>
      <dc:creator>ricardoc-moreda</dc:creator>
      <dc:date>2010-02-22T16:47:41Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65466#M41455</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Estou com um problema nesse diretório também, e não faço a mínima ideia de como resolver&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;13:52:44,956 ERROR [org.alfresco.repo.search.impl.lucene.index.IndexInfo] Failed building filter reader beneath f041ae5b-d09c-4d84-9670-12ea5bc1aa2e&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;java.io.EOFException&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at java.io.DataInputStream.readInt(DataInputStream.java:375)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getDeletions(IndexInfo.java:1091)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.createMainIndexReader(IndexInfo.java:2056)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getMainIndexReferenceCountingReadOnlyIndexReader(IndexInfo.java:1219)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.AbstractLuceneBase.getSearcher(AbstractLuceneBase.java:168)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.ADMLuceneSearcherImpl.query(ADMLuceneSearcherImpl.java:286)&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Caused by: org.alfresco.repo.search.impl.lucene.LuceneIndexException: 03130000 Failed to open IndexSarcher for /opt/alfresco-3.4.d/alf_data/lucene-indexes/workspace/SpacesStore/&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.AbstractLuceneBase.getSearcher(AbstractLuceneBase.java:184)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.ADMLuceneSearcherImpl.query(ADMLuceneSearcherImpl.java:286)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.SearcherComponent.query(SearcherComponent.java:78)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent.isTxnIdPresentInIndex(AbstractReindexComponent.java:500)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent.isTxnPresentInIndex(AbstractReindexComponent.java:421)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.FullIndexRecoveryComponent.areTxnsInStartSample(FullIndexRecoveryComponent.java:265)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.FullIndexRecoveryComponent.reindexImpl(FullIndexRecoveryComponent.java:188)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent$1.execute(AbstractReindexComponent.java:300)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.transaction.RetryingTransactionHelper.doInTransaction(RetryingTransactionHelper.java:381)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.transaction.RetryingTransactionHelper.doInTransaction(RetryingTransactionHelper.java:272)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.node.index.AbstractReindexComponent.reindex(AbstractReindexComponent.java:306)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;… 35 more&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Caused by: java.io.EOFException&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at java.io.DataInputStream.readInt(DataInputStream.java:375)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getDeletions(IndexInfo.java:1091)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.createMainIndexReader(IndexInfo.java:2056)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.index.IndexInfo.getMainIndexReferenceCountingReadOnlyIndexReader(IndexInfo.java:1219)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;at org.alfresco.repo.search.impl.lucene.AbstractLuceneBase.getSearcher(AbstractLuceneBase.java:168)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;… 45 more&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:06,749 INFO [org.springframework.extensions.webscripts.DeclarativeRegistry] Registered 264 Web Scripts (+0 failed), 274 URLs&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:06,751 INFO [org.springframework.extensions.webscripts.DeclarativeRegistry] Registered 8 Package Description Documents (+0 failed)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:06,751 INFO [org.springframework.extensions.webscripts.DeclarativeRegistry] Registered 0 Schema Description Documents (+0 failed)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:07,354 INFO [org.springframework.extensions.webscripts.AbstractRuntimeContainer] Initialised Spring Surf Container Web Script Container (in 4490.937ms)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:07,524 INFO [org.springframework.extensions.webscripts.TemplateProcessorRegistry] Registered template processor freemarker for extension ftl&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:07,871 INFO [org.springframework.extensions.webscripts.ScriptProcessorRegistry] Registered script processor javascript for extension js&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,351 INFO [org.springframework.extensions.webscripts.TemplateProcessorRegistry] Registered template processor freemarker for extension ftl&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,370 INFO [org.springframework.extensions.webscripts.ScriptProcessorRegistry] Registered script processor javascript for extension js&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,614 INFO [org.springframework.extensions.webscripts.TemplateProcessorRegistry] Registered template processor freemarker for extension ftl&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:08,625 INFO [org.springframework.extensions.webscripts.ScriptProcessorRegistry] Registered script processor javascript for extension js&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;13:53:09,038 INFO [org.alfresco.web.site.servlet.SSOAuthenticationFilter] NTLMAuthenticationFilter initialised. &amp;lt;code/&amp;gt;&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 14 Apr 2016 15:19:00 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65466#M41455</guid>
      <dc:creator>sammuel</dc:creator>
      <dc:date>2016-04-14T15:19:00Z</dc:date>
    </item>
    <item>
      <title>Re: Pesquisa Lucene e indexação de conteúdo em documentos PDF</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65467#M41456</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;O seu problema parece diferente.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Pelas mensagens de erro, eu diria que os arquivos de index do solr estão corrompidos.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Nesse caso, o ideal seria você forçar a reindexação de toda a base e ver se isso corrige seu problema.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Qual a versão do Alfresco que você está usando?&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Fri, 22 Apr 2016 13:04:45 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/pesquisa-lucene-e-indexa%C3%A7%C3%A3o-de-conte%C3%BAdo-em-documentos-pdf/m-p/65467#M41456</guid>
      <dc:creator>douglascrp</dc:creator>
      <dc:date>2016-04-22T13:04:45Z</dc:date>
    </item>
  </channel>
</rss>

