<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Alfresco write-read 500 MO when adding a 200 ko pdf document in Alfresco Archive</title>
    <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256091#M209221</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Our Alfresco output 500 MO to and from the disk where lucene-indexes are located, for each document added to the repository.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Our documents are only small pieces of PDFA files (200 ko) !&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;So, it takes more than 10 seconds to process a document and 2000 documents are inserted per days.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;This scenario appear in our quality and production environment.&lt;/SPAN&gt;&lt;BR /&gt;&lt;STRONG&gt;Configuration information :&lt;/STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;UL&gt;Alfresco is installed in a virtual environment (Vmware).&lt;BR /&gt;Indexes and documents are in separate disk.&lt;BR /&gt;The database is installed in a other server.&lt;/UL&gt;&lt;UL&gt;Alfresco version : Community 3.4.e&lt;BR /&gt;Java version&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; : Java(TM) SE Runtime Environment (build 1.6.0_27-b07) Java HotSpot(TM) 64-Bit Server VM &lt;BR /&gt;OS Distribution&amp;nbsp; : Centos 6.2 2.6.32-220.4.1.el6.x86_64&lt;BR /&gt;Database&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; : PostgreSQL 9.0.8 /Linux&lt;BR /&gt;Repository size&amp;nbsp; : 240 GO for 1'600'000 documents&lt;BR /&gt;Indexes size&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; : 6.6 GO&lt;/UL&gt;&lt;STRONG&gt;JVM Parameters&amp;nbsp; &lt;/STRONG&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/SPAN&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;&amp;nbsp; $JAVA_OPTS="-Xss512K -XX:MaxPermSize=256m -Xms2048m -Xmx2048m&amp;nbsp; &lt;BR 
/&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Dalfresco.home=/soi/app/alfresco-ged34e&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Dhttp.proxyHost=xx.xx.xx.xx -Dhttp.proxyPort=xxxx&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Duser.dir=${CATALINA_HOME}/user.dir&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Duser.home=${CATALINA_HOME}/user.home&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Dcom.sun.management.jmxremote -Dcom.sun.management.jmxremote.port=xxxx&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Dcom.sun.management.jmxremote.ssl=false -Dcom.sun.management.jmxremote.authenticate=false&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Djava.rmi.server.hostname=myserver.mydomain.ch&amp;nbsp;&amp;nbsp; &lt;BR 
/&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -server -Dsun.security.ssl.allowUnsafeRenegotiation=true&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -Dfile.encoding=UTF-8 -Duser.country=CH -Duser.language=fr -Duser.timezone=Europe/Zurich&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -XX:NewRatio=1 -XX:+UseConcMarkSweepGC -XX:+CMSIncrementalMode&amp;nbsp; &lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; -XX:CMSInitiatingOccupancyFraction=80"&amp;nbsp; &lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;[size=150]&lt;/SPAN&gt;&lt;STRONG&gt;Full description &lt;/STRONG&gt;&lt;SPAN&gt;[/size]&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;STRONG&gt;Addind a new document produce 500 MO &lt;/STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;iotop&amp;nbsp; show more than 500 MO writed and readed for inserting a only 200 ko PDFA file&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;Total DISK READ: 0.00 B/s | Total DISK WRITE: 0.00 
B/s&lt;BR /&gt;&amp;nbsp; TID&amp;nbsp; PRIO&amp;nbsp; USER&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; DISK READ&amp;nbsp; DISK WRITE&amp;nbsp; SWAPIN&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; IO&amp;gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; COMMAND&lt;BR /&gt;21138 be/4 alfresco&amp;nbsp;&amp;nbsp;&amp;nbsp; 526.40 M&amp;nbsp;&amp;nbsp;&amp;nbsp; 584.30 M&amp;nbsp; 0.00 % 10.17 % java -Dnop -Xss512K -XX:MaxPermSize=256m -Xms1024~t/tem&lt;BR /&gt;21186 be/4 alfresco&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 17.55 M&amp;nbsp;&amp;nbsp;&amp;nbsp; 448.00 K&amp;nbsp; 0.00 %&amp;nbsp; 3.50 % java -Dnop -Xss512K -XX:MaxPermSize=256m -Xms1024~t/tem&lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;At the same time, the cpu works hard &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp; &lt;/SPAN&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;PID USER&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; PR&amp;nbsp; NI&amp;nbsp; VIRT&amp;nbsp; RES&amp;nbsp; SHR S %CPU %MEM&amp;nbsp;&amp;nbsp;&amp;nbsp; TIME+&amp;nbsp; COMMAND&lt;BR /&gt;21068 alfresco&amp;nbsp; 20&amp;nbsp;&amp;nbsp; 0 2119m 1.2g&amp;nbsp; 14m S 92.2 63.2&amp;nbsp;&amp;nbsp; 6:43.85 java&lt;BR /&gt;21197 root&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 20&amp;nbsp;&amp;nbsp; 0&amp;nbsp; 177m 9252 2528 S&amp;nbsp; 0.7&amp;nbsp; 0.5&amp;nbsp;&amp;nbsp; 0:04.51 iotop&lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;STRONG&gt;Output log &lt;/STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;below is just end of the log when adding a document. 
At the end of the log, there is 8 seconds elapsed between these two lines &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;2012-09-04 09:56:33,514 User:myuser DEBUG [lucene.fts.FullTextSearchIndexerImpl] FTS index request for workspace://SpacesStore&lt;BR /&gt;2012-09-04 09:56:41,987&amp;nbsp; DEBUG [lucene.fts.FullTextSearchIndexerImpl] FTS Indexing workspace://SpacesStore at Tue Sep 04 09:56:41 CEST 2012&lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;SPAN&gt; &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:02,912 User:myuser DEBUG [impl.lucene.ADMLuceneIndexerImpl] Creating indexer&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:02,912 User:myuser DEBUG [impl.lucene.ADMLuceneIndexerImpl] Update node workspace://SpacesStore/9efb97f2-c2e3-4b96-a0af-52fbf61d5158&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:02,921 User:myuser DEBUG [impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 40c30117-e988-4db0-b0a8-52eb18408da8 (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:02,937 User:myuser DEBUG [impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 707e8a54-c785-453b-8722-6acb5d5d3e46 (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:03,263 User:myuser DEBUG [impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 75f2c3d4-6885-47a9-b3cd-2285245fefc9 (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:04,527 User:myuser DEBUG [impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 4968aab5-4fff-4dda-bb8e-c079cbf8c8ac (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:05,416 User:myuser DEBUG 
[impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 4c33d483-5ff5-4b1f-9d5c-e74446bfe3d3 (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,323 User:myuser DEBUG [impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 27b977cf-4739-4e5c-84ce-27bda6d4d526 (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,334 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using EXACT_LANGUAGE_AND_ALL is [, {fr}]&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,347 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using EXACT_LANGUAGE_AND_ALL is [, {fr}]&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,358 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,358 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,359 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,359 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,359 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,360 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,361 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,361 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH 
using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,361 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,366 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,366 User:myuser DEBUG [impl.lucene.LuceneAnalyser] Loaded org.alfresco.repo.search.impl.lucene.analysis.AlfrescoStandardAnalyser for type {&lt;/SPAN&gt;&lt;A href="http://www.alfresco.org/model/dictionary/1.0}boolean" rel="nofollow noopener noreferrer"&gt;http://www.alfresco.org/model/dictionary/1.0}boolean&lt;/A&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,366 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,367 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,369 User:myuser DEBUG [impl.lucene.LuceneAnalyser] Loaded org.alfresco.repo.search.impl.lucene.analysis.DateAnalyser for type {&lt;/SPAN&gt;&lt;A href="http://www.alfresco.org/model/dictionary/1.0}datetime" rel="nofollow noopener noreferrer"&gt;http://www.alfresco.org/model/dictionary/1.0}datetime&lt;/A&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,370 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,371 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,371 User:myuser DEBUG [impl.lucene.LuceneAnalyser] Loaded org.alfresco.repo.search.impl.lucene.analysis.DateAnalyser for type {&lt;/SPAN&gt;&lt;A href="http://www.alfresco.org/model/dictionary/1.0}datetime" rel="nofollow noopener 
noreferrer"&gt;http://www.alfresco.org/model/dictionary/1.0}datetime&lt;/A&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,372 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,373 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,374 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,374 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,375 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,376 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using EXACT_LANGUAGE_AND_ALL is [, {fr}]&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,377 User:myuser DEBUG [impl.lucene.LuceneAnalyser] Loaded org.alfresco.repo.search.impl.lucene.analysis.LongAnalyser for type {&lt;/SPAN&gt;&lt;A href="http://www.alfresco.org/model/dictionary/1.0}long" rel="nofollow noopener noreferrer"&gt;http://www.alfresco.org/model/dictionary/1.0}long&lt;/A&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,377 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,378 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,381 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,381 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale 
fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,382 User:myuser DEBUG [lucene.analysis.MLAnalayser] Loading org.apache.lucene.analysis.fr.FrenchAnalyzer for fr_CH&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:06,382 User:myuser DEBUG [lucene.analysis.MLTokenDuplicator] Locale fr_CH using ALL_ONLY is []&lt;/SPAN&gt;&lt;BR /&gt;&lt;STRONG&gt;2012-09-04 09:56:33,514 User:myuser DEBUG [lucene.fts.FullTextSearchIndexerImpl] FTS index request for workspace://SpacesStore&lt;BR /&gt;2012-09-04 09:56:41,987&amp;nbsp; DEBUG [lucene.fts.FullTextSearchIndexerImpl] FTS Indexing workspace://SpacesStore at Tue Sep 04 09:56:41 CEST 2012&lt;/STRONG&gt;&lt;SPAN&gt;2012-09-04 09:56:41,988&amp;nbsp; DEBUG [impl.lucene.ADMLuceneIndexerImpl] Creating indexer&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:41,989&amp;nbsp; DEBUG [impl.lucene.FilterIndexReaderByStringId] Applying deletions FOR 5bcc8dd0-8b6c-4874-adc8-31db4c61264a (the index ito which these are applied is the previous one …)&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;2012-09-04 09:56:42,399&amp;nbsp; DEBUG [lucene.fts.FullTextSearchIndexerImpl] FTS index completed for workspace://SpacesStore … 0 remaining&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;STRONG&gt;When starting, Alfresco read 7 GO&lt;/STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I also noticed that when Alfresco starts, it reads 7 GO before the webapp is alive. 
&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Mesured with iotop :&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;/SPAN&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;Total DISK READ: 0.00 B/s | Total DISK WRITE: 0.00 B/s&lt;BR /&gt;&amp;nbsp; TID&amp;nbsp; PRIO&amp;nbsp; USER&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; DISK READ&amp;nbsp; DISK WRITE&amp;nbsp; SWAPIN&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; IO&amp;gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; COMMAND&lt;BR /&gt;21070 be/4 alfresco&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 7.17 G&amp;nbsp;&amp;nbsp;&amp;nbsp; 121.76 M&amp;nbsp; 0.02 % 23.50 &lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;STRONG&gt;No change when disabling cm:content indexing &lt;/STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp; &amp;lt;type name="cm:content"&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;title&amp;gt;Content&amp;lt;/title&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;parent&amp;gt;cm:cmobject&amp;lt;/parent&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;archive&amp;gt;true&amp;lt;/archive&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;properties&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;property name="cm:content"&amp;gt;&lt;BR 
/&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;type&amp;gt;d:content&amp;lt;/type&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;mandatory&amp;gt;false&amp;lt;/mandatory&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;!– Although content is marked as indexed atomically it may end up asynchronous –&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;!– if the content conversion will take too long. Content that does not require conversion –&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;!– to UTF8 test/plain will always be indexed atomically –&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;index enabled="false"&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;atomic&amp;gt;true&amp;lt;/atomic&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;stored&amp;gt;false&amp;lt;/stored&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 
&amp;lt;tokenised&amp;gt;true&amp;lt;/tokenised&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;/index&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;/property&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;/properties&amp;gt;&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &amp;lt;/type&amp;gt;&lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;SPAN&gt;For our business solution, whe don't need fulltext search, so I do understand why Lucene output 500 MO when cm:content indexing is disabled !&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;STRONG&gt;Conclusion&lt;/STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I looking for a solution to reduce these IO writing, any help welcome !&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Best regards &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Pierre-André&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Tue, 04 Sep 2012 10:16:50 GMT</pubDate>
    <dc:creator>dbas2000</dc:creator>
    <dc:date>2012-09-04T10:16:50Z</dc:date>
    <item>
      <title>Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256091#M209221</link>
      <description>Our Alfresco output 500 MO to and from the disk where lucene-indexes are located, for each document added to the repository. Our documents are only small pieces of PDFA files (200 ko) ! So, it takes more than 10 seconds to process a document and 2000 documents are inserted per days. This scenario appear…</description>
      <pubDate>Tue, 04 Sep 2012 10:16:50 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256091#M209221</guid>
      <dc:creator>dbas2000</dc:creator>
      <dc:date>2012-09-04T10:16:50Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256092#M209222</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;The indexes are used for more than just full text search.&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;And although Lucene is IO heavy it should not be a problem.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;The recommendation I've always seen is to put your indexes on your fastest local disk.&amp;nbsp;&amp;nbsp; &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN&gt;And make sure it's not configured with a filesystem with unnecessary features like slow and safe RAID settings or a virus scanner.&amp;nbsp; The index is derived data; it can be regenerated.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;The usual problem with running Alfresco in a JVM is too little RAM.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 04 Sep 2012 16:18:11 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256092#M209222</guid>
      <dc:creator>mrogers</dc:creator>
      <dc:date>2012-09-04T16:18:11Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256093#M209223</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi,&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BLOCKQUOTE class="jive-quote"&gt;I looking for a solution to reduce these IO writing, any help welcome !&lt;/BLOCKQUOTE&gt;&lt;BR /&gt;&lt;SPAN&gt;How do you know the absolute amount of write I/O is your problem?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I guess your problem is indexing speed, correct? Then, sync is likely the most time-consuming operation as the index file gets fragmented. And it would be mostly caused by the index merger, which could be improved by tuning the index writer's RAM buffer size. Otherwise, it could only be improved by some kind of sharding if you don't change your hardware.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;But anyway, I think you need to make your problem clear and nail it down further to find your real bottleneck.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Wed, 05 Sep 2012 08:51:57 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256093#M209223</guid>
      <dc:creator>t_sato</dc:creator>
      <dc:date>2012-09-05T08:51:57Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256094#M209224</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Thanks to mrogers and t_sato for your post.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;After more investigations, I discovered that is the merge process that produce this traffic.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;With the tool &lt;/SPAN&gt;&lt;STRONG&gt;iotop&lt;/STRONG&gt;&lt;SPAN&gt;, we can see that the IO traffic is produced whatever segments are merged.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;The mergeFactor is fixed to 5 but every 2 documents a segment is flushed to the disk.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Below is the result from the IndexInfo.jar against the SpacesStore. &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Does somebody knows how to analyse these output ?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;The contentStore holds 1'600'000 documents and the first segment holds 3'029'531 documents !&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;java -Xmx512m -cp ./IndexInfo.jar org.alfresco.repo.search.impl.lucene.index.IndexInfo C:\\labs\\backup-lucene-indexes\\workspace\\SpacesStore&amp;nbsp; &lt;BR /&gt;Entry List for lucene-indexes\workspace\SpacesStore &lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;&amp;nbsp;&amp;nbsp; Size = 9&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 0&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=0ab76c3f-be42-4486-bf5d-0716df6084f9 Type=INDEX Status=COMMITTED Docs=3029531 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 1&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=12f3f5b3-047b-4179-808a-c5e55dab6ba4 Type=INDEX Status=COMMITTED Docs=1745366 Deletions=0&lt;BR 
/&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 2&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=adfdcb27-3e94-4cfe-9826-072335af142b Type=INDEX Status=COMMITTED Docs=1128625 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 3&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=3ad8cb8c-3515-47e2-b26b-6c342e8a5b26 Type=INDEX Status=COMMITTED Docs=725190 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 4&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=c15f8d81-79ed-4a55-985a-1f7b8a1a1188 Type=INDEX Status=COMMITTED Docs=316397 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 5&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=9d21316f-64b4-406c-8029-011bbc029970 Type=DELTA Status=COMMITTED Docs=40 Deletions=29&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 6&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=de201603-4374-4cf1-975c-673fe5cc2d7b Type=DELTA Status=COMMITTED Docs=80 Deletions=65&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 7&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=d85fb371-5b9f-4938-a3e2-4d7aac73c5ff Type=DELTA Status=COMMITTED Docs=128 Deletions=86&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 8&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=5b1d1df9-3e96-4334-9914-0fd2e996a775 Type=DELTA Status=COMMITTED Docs=119 Deletions=119&lt;SPAN 
class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Thank's for any help.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Pierre-André&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 10 Sep 2012 13:09:41 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256094#M209224</guid>
      <dc:creator>dbas2000</dc:creator>
      <dc:date>2012-09-10T13:09:41Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256095#M209225</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi Pierre, &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;So now &lt;/SPAN&gt;&lt;A href="http://wiki.alfresco.com/wiki/Index_Merging_Performance" rel="nofollow noopener noreferrer"&gt;this&lt;/A&gt;&lt;SPAN&gt; must be the wiki you want to take a look at.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;It says:&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BLOCKQUOTE class="jive-quote"&gt;It is usually a good practice that the highest-numbered INDEX entries (which contains the least documents, number 4 in the examples above) do not contain more than a few hundred documents. If it's not the case, it could lead to massive amount of IO pressure on the index directories for merging operations.&lt;/BLOCKQUOTE&gt;&lt;BR /&gt;&lt;SPAN&gt;You have the default merge factor, 5, so it applies to you as well. You have 316397 documents in the highest-numbered INDEX entry. It is far more than hundreds! So increasing the merge factor is definitely an option to improve indexing performance. &lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;These Lucene pages are also helpful to understand how the Lucene index works.&lt;/SPAN&gt;&lt;BR /&gt;&lt;A href="http://lucene.apache.org/core/old_versioned_docs/versions/2_9_3/api/all/org/apache/lucene/index/IndexWriter.html" rel="nofollow noopener noreferrer"&gt;IndexWriter(2.9.3)&lt;/A&gt;&lt;BR /&gt;&lt;A href="http://wiki.apache.org/lucene-java/ImproveIndexingSpeed" rel="nofollow noopener noreferrer"&gt;Improve Index Speed from Lucene wiki&lt;/A&gt;&lt;BR /&gt;&lt;A href="http://wiki.alfresco.com/wiki/Full-Text_Search_Configuration" rel="nofollow noopener noreferrer"&gt;Full Text Search Configuration from Alfresco wiki&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Hope this helps.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 11 Sep 2012 04:10:36 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256095#M209225</guid>
      <dc:creator>t_sato</dc:creator>
      <dc:date>2012-09-11T04:10:36Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256096#M209226</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi t_sato,&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;So I changed the configuration with these parameters and the FULL reindexing process is currently running - Wait and see !&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;lucene.indexer.mergerTargetIndexCount=8&lt;BR /&gt;lucene.indexer.maxRamInMbForInMemoryMerge=48&lt;BR /&gt;lucene.indexer.writerRamBufferSizeMb=48&lt;BR /&gt;lucene.indexer.mergerRamBufferSizeMb=48&lt;BR /&gt;lucene.indexer.maxRamInMbForInMemoryIndex=48&lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;SPAN&gt;I will post the result once re-indexing is completed.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Pierre-André&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Tue, 11 Sep 2012 06:19:39 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256096#M209226</guid>
      <dc:creator>dbas2000</dc:creator>
      <dc:date>2012-09-11T06:19:39Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256097#M209227</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Hi,&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Here is the indexes status after the FULL indexes rebuilding. 24 hours for 1'600'000 documents :&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;&amp;nbsp; &lt;/SPAN&gt;&lt;PRE class="language-none line-numbers"&gt;&lt;CODE&gt;Size = 7&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 0&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=facae57d-2997-4964-b710-6bf7a88e1345 Type=INDEX Status=COMMITTED Docs=5527866 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 1&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=32064b10-d4dd-4514-a652-5bd55921892a Type=INDEX Status=COMMITTED Docs=845705 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 2&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=a68a0558-9429-4217-a44e-7f696e79a113 Type=INDEX Status=COMMITTED Docs=517370 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 3&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=0482c5b5-0c3f-4c2d-ae87-ad848466faac Type=INDEX Status=COMMITTED Docs=49291 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 4&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=d0b834a1-ce86-4493-bd13-a1905360c893 Type=INDEX Status=COMMITTED Docs=4751 Deletions=0&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 5&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=27e26039-1ce6-4336-bea3-dd45f9fc4533 Type=DELTA Status=COMMITTED Docs=18 Deletions=11&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 
6&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; Name=0563c9a4-daf6-4dea-91a1-96d1936cf651 Type=DELTA Status=COMMITTED Docs=50 Deletions=50&lt;SPAN class="line-numbers-rows"&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;SPAN&gt;‍&lt;/SPAN&gt;&lt;/SPAN&gt;&lt;/CODE&gt;&lt;/PRE&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;I think it's a lot better than the previous status !&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;My questions are :&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;In order to keep the production online, is it possible to launch the reindexing process on another server and then replace the production indexes with the rebuilt indexes ?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;In the first segment there is &lt;/SPAN&gt;&lt;STRONG&gt;Docs=5'527'866&lt;/STRONG&gt;&lt;SPAN&gt;.&amp;nbsp; Does &lt;/SPAN&gt;&lt;STRONG&gt;Docs &lt;/STRONG&gt;&lt;SPAN&gt; represent the number of indexed files, because the contentstore holds only 1'600'000 documents ?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Thanks&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Pierre-André&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 13 Sep 2012 13:06:46 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256097#M209227</guid>
      <dc:creator>dbas2000</dc:creator>
      <dc:date>2012-09-13T13:06:46Z</dc:date>
    </item>
    <item>
      <title>Re: Alfresco write-read 500 MO when adding a 200 ko pdf document</title>
      <link>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256098#M209228</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Looks good!&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BLOCKQUOTE class="jive-quote"&gt;In order to keep the production online, does it possible to launch the reindexing process in an other server and then replace de production indexes with the rebuilded indexes ?&lt;/BLOCKQUOTE&gt;&lt;BR /&gt;&lt;SPAN&gt;I'm afraid not, unless you can keep your system read-only during the rebuilding process (24 hours?).&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;You may need a professional Alfresco consulting service for the best possible deployment in production.&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BLOCKQUOTE class="jive-quote"&gt;In the first segment there is Docs=5'527'866. Does Docs represents the number of indexed files, because the contenstore hold only 1'600'000 documents ?&lt;/BLOCKQUOTE&gt;&lt;BR /&gt;&lt;SPAN&gt;I guess DOCS comes from numDocs of IndexReader. Then yes, it is the number of indexed documents. I don't know the details, but it means (not surprisingly) that 2 or 3 additional system documents are stored per user document.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Fri, 14 Sep 2012 03:09:25 GMT</pubDate>
      <guid>https://connect.hyland.com/t5/alfresco-archive/alfresco-write-read-500-mo-when-adding-a-200-ko-pdf-document/m-p/256098#M209228</guid>
      <dc:creator>t_sato</dc:creator>
      <dc:date>2012-09-14T03:09:25Z</dc:date>
    </item>
  </channel>
</rss>

