<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Office 2007 (docx...) Extract Common Metadata in Alfresco Archive</title>
    <link>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203846#M156976</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Is there support in the current version of Alfresco 3.0 Stable through the use of the POI version installed to extract docx document properties (custom ones?)&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I have been struggling with this for a while and it seems to work for doc files but not docx.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Anyone&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Regards&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Kenneth Thorman&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Thu, 02 Apr 2009 09:53:16 GMT</pubDate>
    <dc:creator>kenneth_thorman</dc:creator>
    <dc:date>2009-04-02T09:53:16Z</dc:date>
    <item>
      <title>Office 2007 (docx...) Extract Common Metadata</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203846#M156976</link>
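      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Is there support in the current version of Alfresco 3.0 Stable through the use of the POI version installed to extract docx document properties (custom ones?)&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I have been struggling with this for a while and it seems to work for doc files but not docx.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Anyone&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Regards&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Kenneth Thorman&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>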
      <pubDate>Thu, 02 Apr 2009 09:53:16 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203846#M156976</guid>
      <dc:creator>kenneth_thorman</dc:creator>
      <dc:date>2009-04-02T09:53:16Z</dc:date>
    </item>
    <item>
      <title>Re: Office 2007 (docx...) Extract Common Metadata</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203847#M156977</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;In the current release 3.0 Stable of Alfresco the POI library version 3.1 is used.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;If this is changed to 3.5 (beta) we're getting a detailed exception and it says "The supplied data appears to be in the Office 2007+ XML. You are calling the part of POI that deals with OLE2 Office Documents. You need to call a different part of POI to process this data (eg XSSF instead of HSSF)"&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;So I guess a bit of the code will have to be changed.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Any pointers, anyone?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Regards&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Kenneth Thorman&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Apr 2009 11:00:33 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203847#M156977</guid>
      <dc:creator>kenneth_thorman</dc:creator>
      <dc:date>2009-04-02T11:00:33Z</dc:date>
    </item>
    <item>
      <title>Re: Office 2007 (docx...) Extract Common Metadata</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203848#M156978</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi,&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;yup, .doc is a binary file format, .docx is a special xml format.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;You'll have to write your own metadata extractor, map it to docx file extension and use the XSSF part of jakarta POI.&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;I'm not sure if the old extractors are still working with a 3.5 POI jar…&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Cheers, Jan&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 02 Apr 2009 12:07:35 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203848#M156978</guid>
      <dc:creator>jpfi</dc:creator>
      <dc:date>2009-04-02T12:07:35Z</dc:date>
    </item>
    <item>
      <title>Re: Office 2007 (docx...) Extract Common Metadata</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203849#M156979</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;We have been waiting for this feature, not wanting to implement this if Alfresco was going to come out with this functionality.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I have been searching high and low now since POI 3.5 has come out.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Is it correct that this feature (office 2007 file format metadata awareness) is still not available?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Regards&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;Kenneth Thorman&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 01 Dec 2009 14:46:50 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/office-2007-docx-extract-common-metadata/m-p/203849#M156979</guid>
      <dc:creator>kenneth_thorman</dc:creator>
      <dc:date>2009-12-01T14:46:50Z</dc:date>
    </item>
  </channel>
</rss>

