Mailing-List: contact java-user-help@lucene.apache.org; run by ezmlm
Precedence: bulk
Reply-To: java-user@lucene.apache.org
Received-SPF: pass (athena.apache.org: domain of ian.lea@gmail.com designates
 209.85.213.176 as permitted sender)
MIME-Version: 1.0
In-Reply-To: 
 <CAL4PpoTnZvJb_u1JXMq9m3WZKO_ujDd_UDHsRU1=4HqefWKq=w@mail.gmail.com>
References: 
 <CAL4PpoRskNxoZEqACPR=v7kRg2yhJUoczv+uQ1vrODEq83VGTw@mail.gmail.com>
 <CAE9W93PVi0yKPuDOCTjHTuxResVDe+U5hYDrf=VMrn8+crpAOQ@mail.gmail.com>
 <CAL4PpoTnZvJb_u1JXMq9m3WZKO_ujDd_UDHsRU1=4HqefWKq=w@mail.gmail.com>
From: Ian Lea <ian.lea@gmail.com>
Date: Fri, 18 May 2012 17:58:11 +0100
Message-ID: 
 <CAEY5pxWUm9UDTPE_htfRLuhb9=6m6gA7UnStMvMUhYu3og3ycQ@mail.gmail.com>
Subject: Re: old fashioned....."Too many open files"!
To: java-user@lucene.apache.org
Content-Type: text/plain; charset=ISO-8859-1
Content-Transfer-Encoding: quoted-printable

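You may need to cut it down to something simpler, but I can't see any
reader.close() calls. Every call to getSearcher() opens a new reader on
each writer via IndexReader.open(iw, true), and those readers are never
closed, so the files of segments that have since been merged away and
deleted stay open.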


--
Ian.


On Fri, May 18, 2012 at 5:47 PM, Michel Blase <mblase23@gmail.com> wrote:
> This is the code in charge of managing the Lucene index. Thanks for your
> help!
>
>
>
> package luz.aurora.lucene;
>
> import java.io.File;
> import java.io.IOException;
> import java.util.*;
> import luz.aurora.search.ExtendedQueryParser;
> import org.apache.lucene.analysis.Analyzer;
> import org.apache.lucene.analysis.standard.StandardAnalyzer;
> import org.apache.lucene.document.Document;
> import org.apache.lucene.index.*;
> import org.apache.lucene.queryParser.ParseException;
> import org.apache.lucene.search.IndexSearcher;
> import org.apache.lucene.search.Query;
> import org.apache.lucene.search.TopDocs;
> import org.apache.lucene.search.highlight.Highlighter;
> import org.apache.lucene.search.highlight.QueryScorer;
> import org.apache.lucene.search.highlight.SimpleHTMLFormatter;
> import org.apache.lucene.search.highlight.SimpleSpanFragmenter;
> import org.apache.lucene.store.Directory;
> import org.apache.lucene.store.FSDirectory;
>
>
> public class LuceneManager {
>
> =A0 =A0private HashMap<Integer,String> IndexesPaths;
> =A0 =A0private HashMap<Integer,IndexWriter> Writers;
>
> =A0 =A0private int CurrentOpenIndex_ID;
> =A0 =A0private String CurrentOpenIndex_TablePrefix;
>
> =A0 =A0public =A0LuceneManager(int CurrentOpenIndex_ID,String
> CurrentOpenIndex_TablePrefix, HashMap<Integer,String> IndexesPaths) throw=
s
> Exception {
> =A0 =A0 =A0 =A0this.CurrentOpenIndex_ID =3D CurrentOpenIndex_ID;
> =A0 =A0 =A0 =A0this.IndexesPaths =3D IndexesPaths;
> =A0 =A0 =A0 =A0this.Writers =3D new HashMap<Integer,IndexWriter>();
> =A0 =A0 =A0 =A0this.CurrentOpenIndex_TablePrefix =3D CurrentOpenIndex_Tab=
lePrefix;
>
> =A0 =A0 =A0 =A0SetUpWriters();
> =A0 =A0}
>
> =A0 =A0private void SetUpWriters() throws Exception {
> =A0 =A0 =A0 =A0Set set =3D IndexesPaths.entrySet();
> =A0 =A0 =A0 =A0Iterator i =3D set.iterator();
>
> =A0 =A0 =A0 =A0while(i.hasNext()){
> =A0 =A0 =A0 =A0 =A0 =A0Map.Entry index =3D (Map.Entry)i.next();
> =A0 =A0 =A0 =A0 =A0 =A0int id =3D (Integer)index.getKey();
> =A0 =A0 =A0 =A0 =A0 =A0String path =3D (String)index.getValue();
>
> =A0 =A0 =A0 =A0 =A0 =A0File app =3D new File(path);
> =A0 =A0 =A0 =A0 =A0 =A0Directory dir =3D FSDirectory.open(app);
> =A0 =A0 =A0 =A0 =A0 =A0IndexWriterConfig config =3D new
> IndexWriterConfig(LuceneVersion.CurrentVersion,new
> StandardAnalyzer(LuceneVersion.CurrentVersion));
>
> =A0 =A0 =A0 =A0 =A0 =A0//config.setMaxBufferedDocs(50);
> =A0 =A0 =A0 =A0 =A0 =A0config.setRAMBufferSizeMB(400);
> =A0 =A0 =A0 =A0 =A0 =A0TieredMergePolicy mp =3D
> (TieredMergePolicy)config.getMergePolicy();
> =A0 =A0 =A0 =A0 =A0 =A0mp.setUseCompoundFile(true);
> =A0 =A0 =A0 =A0 =A0 =A0config.setMergePolicy(mp);
>
> =A0 =A0 =A0 =A0 =A0 =A0/*
> =A0 =A0 =A0 =A0 =A0 =A0LogMergePolicy lmp =3D (LogMergePolicy)config.getM=
ergePolicy();
> =A0 =A0 =A0 =A0 =A0 =A0lmp.setUseCompoundFile(true);
> =A0 =A0 =A0 =A0 =A0 =A0lmp.setMaxMergeDocs(10000);
> =A0 =A0 =A0 =A0 =A0 =A0config.setMergePolicy(lmp);
> =A0 =A0 =A0 =A0 =A0 =A0*/
>
> =A0 =A0 =A0 =A0 =A0 =A0Writers.put(id, new IndexWriter(dir,config));
> =A0 =A0 =A0 =A0}
> =A0 =A0}
>
> =A0 =A0public void AddDocument(int IndexId,Document doc,Analyzer analyzer=
)
> throws CorruptIndexException, IOException {
> =A0 =A0 =A0 =A0IndexWriter im =3D Writers.get(IndexId);
> =A0 =A0 =A0 =A0im.addDocument(doc, analyzer);
> =A0 =A0}
>
> =A0 =A0public void AddDocument(Document doc,Analyzer analyzer) throws
> CorruptIndexException, IOException {
> =A0 =A0 =A0 =A0IndexWriter im =3D Writers.get(this.CurrentOpenIndex_ID);
> =A0 =A0 =A0 =A0im.addDocument(doc, analyzer);
> =A0 =A0}
>
> =A0 =A0public void DeleteDoc(int IndexId,int SegmentIdFromDb) throws
> CorruptIndexException, IOException {
> =A0 =A0 =A0 =A0IndexWriter im =3D Writers.get(IndexId);
> =A0 =A0 =A0 =A0Term term =3D new Term("SegmentID",Integer.toString(Segmen=
tIdFromDb));
> =A0 =A0 =A0 =A0im.deleteDocuments(term);
> =A0 =A0}
>
> =A0 =A0public void DeleteDocuments(String query) throws ParseException,
> CorruptIndexException, IOException {
>
> =A0 =A0 =A0 =A0ExtendedQueryParser parser =3D new
> ExtendedQueryParser(LuceneVersion.CurrentVersion,"ID",new
> StandardAnalyzer(LuceneVersion.CurrentVersion));
> Query q =3D parser.parse(query);
>
> =A0 =A0 =A0 =A0Set set =3D Writers.entrySet();
> =A0 =A0 =A0 =A0Iterator i =3D set.iterator();
>
> =A0 =A0 =A0 =A0while(i.hasNext()){
> =A0 =A0 =A0 =A0 =A0 =A0Map.Entry app =3D (Map.Entry)i.next();
> =A0 =A0 =A0 =A0 =A0 =A0IndexWriter im =3D (IndexWriter)app.getValue();
> =A0 =A0 =A0 =A0 =A0 =A0im.deleteDocuments(q);
> =A0 =A0 =A0 =A0}
> =A0 =A0}
>
> =A0 =A0private IndexSearcher getSearcher() throws CorruptIndexException,
> IOException {
> =A0 =A0 =A0 =A0int NumberOfIndexes =3D Writers.size();
>
> =A0 =A0 =A0 =A0ArrayList<IndexReader> readers =3D new ArrayList<IndexRead=
er>();
> =A0 =A0 =A0 =A0IndexReader[] readerList =3D new IndexReader[NumberOfIndex=
es];
>
> =A0 =A0 =A0 =A0Set set =3D Writers.entrySet();
> =A0 =A0 =A0 =A0Iterator i =3D set.iterator();
> =A0 =A0 =A0 =A0while(i.hasNext()){
> =A0 =A0 =A0 =A0 =A0 =A0Map.Entry index =3D (Map.Entry)i.next();
> =A0 =A0 =A0 =A0 =A0 =A0IndexWriter iw =3D (IndexWriter)index.getValue();
> =A0 =A0 =A0 =A0 =A0 =A0readers.add(IndexReader.open(iw, true));
> =A0 =A0 =A0 =A0}
>
> =A0 =A0 =A0 =A0MultiReader mr =3D new MultiReader(readers.toArray(readerL=
ist));
> =A0 =A0 =A0 =A0return new IndexSearcher(mr);
> =A0 =A0}
>
> =A0 =A0public void close() throws CorruptIndexException, IOException {
> =A0 =A0 =A0 =A0Set set =3D Writers.entrySet();
> =A0 =A0 =A0 =A0Iterator i =3D set.iterator();
> =A0 =A0 =A0 =A0while(i.hasNext()){
> =A0 =A0 =A0 =A0 =A0 =A0Map.Entry index =3D (Map.Entry)i.next();
> =A0 =A0 =A0 =A0 =A0 =A0IndexWriter iw =3D (IndexWriter)index.getValue();
> =A0 =A0 =A0 =A0 =A0 =A0iw.close();
> =A0 =A0 =A0 =A0}
> =A0 =A0}
>
> =A0 =A0public void commit() throws CorruptIndexException, IOException,
> Exception {
> =A0 =A0 =A0 =A0Set set =3D Writers.entrySet();
> =A0 =A0 =A0 =A0Iterator i =3D set.iterator();
> =A0 =A0 =A0 =A0while(i.hasNext()){
> =A0 =A0 =A0 =A0 =A0 =A0Map.Entry index =3D (Map.Entry)i.next();
> =A0 =A0 =A0 =A0 =A0 =A0IndexWriter iw =3D (IndexWriter)index.getValue();
> =A0 =A0 =A0 =A0 =A0 =A0iw.commit();
> =A0 =A0 =A0 =A0}
>
> =A0 =A0}
>
> =A0 =A0public int getCurrentOpenIndexId() {
> =A0 =A0 =A0 =A0return this.CurrentOpenIndex_ID;
> =A0 =A0}
>
> =A0 =A0public String getCurrentOpenIndexTablePrefix() {
> =A0 =A0 =A0 =A0return this.CurrentOpenIndex_TablePrefix;
> =A0 =A0}
>
>
> =A0 =A0//SEARCH START
>
> =A0 =A0public TopDocs Search(String q,Analyzer analyzer,int NumberOfResul=
ts)
> throws Exception {
> =A0 =A0 =A0 =A0ExtendedQueryParser parser =3D new
> ExtendedQueryParser(LuceneVersion.CurrentVersion,"ID",analyzer);
> Query query =3D parser.parse(q);
> =A0 =A0 =A0 =A0//Filter f =3D NumericRangeFilter.newIntRange("SegmentID",=
 393, 393,
> true, true);
> //FilteredQuery fq =3D new FilteredQuery(query,f);
> //TopDocs docs =3D searcher.search(fq, NumberOfResults);
> //System.out.println(searcher.getIndexReader().)
> return getSearcher().search(query, NumberOfResults);
> =A0 =A0}
>
> =A0 =A0public TopDocs SearchAndHighlight(String q,Analyzer analyzer,int
> NumberOfResults) throws Exception {
> =A0 =A0 =A0 =A0ExtendedQueryParser parser =3D new
> ExtendedQueryParser(LuceneVersion.CurrentVersion,"ID",analyzer);
> Query query =3D parser.parse(q);
> =A0 =A0 =A0 =A0return getSearcher().search(query, NumberOfResults);
> =A0 =A0}
>
> =A0 =A0public Highlighter getHighlighter(String query,Analyzer analyzer,S=
tring
> OpeningTag,String ClosingTag) throws ParseException {
> =A0 =A0 =A0 =A0ExtendedQueryParser qp =3D new
> ExtendedQueryParser(LuceneVersion.CurrentVersion,"ID",analyzer);
> =A0 =A0 =A0 =A0Query q =3D qp.parse(query);
> =A0 =A0 =A0 =A0QueryScorer qs =3D new QueryScorer(q);
> =A0 =A0 =A0 =A0SimpleHTMLFormatter formatter =3D =A0new
> SimpleHTMLFormatter(OpeningTag,ClosingTag);
> =A0 =A0 =A0 =A0Highlighter hl =3D new Highlighter(formatter,qs);
> =A0 =A0 =A0 =A0hl.setTextFragmenter(new SimpleSpanFragmenter(qs));
> =A0 =A0 =A0 =A0return hl;
> =A0 =A0}
>
> =A0 =A0public Document getDoc(int i) throws CorruptIndexException, IOExce=
ption
> {
> =A0 =A0 =A0 =A0return getSearcher().doc(i);
> =A0 =A0}
>
>
>
> }
>
>
>
>
>
> On Thu, May 17, 2012 at 10:37 PM, findbestopensource <
> findbestopensource@gmail.com> wrote:
>
>> Post the complete code. You are not closing the objects (IndexWriter /
>> IndexSearcher) properly.
>>
>> Regards
>> Aditya
>> www.findbestopensource.com
>>
>>
>> On Fri, May 18, 2012 at 6:51 AM, Michel Blase <mblase23@gmail.com> wrote=
:
>>
>> > Hi all,
>> >
>> > I have a few problems indexing. I keep hitting "Too many open files". It
>> > seems like Lucene is not releasing file handles after deleting
>> segments.
>> >
>> > This is a piece from the lsof output showing the problem:
>> >
>> >
>> > java =A0 =A023024 root *347r =A0 =A0 =A0REG =A0 =A0 =A0251,0 =A0 =A0 2=
660 149376
>> > /home/INDEXES_ROOT/SMPL_1/_bvq.cfs (deleted)
>> > java =A0 =A023024 root *348r =A0 =A0 =A0REG =A0 =A0 =A0251,0 =A0 =A0 2=
477 149382
>> > /home/INDEXES_ROOT/SMPL_1/_bvr.cfs (deleted)
>> > java =A0 =A023024 root *349r =A0 =A0 =A0REG =A0 =A0 =A0251,0 =A0 =A0 2=
747 149392
>> > /home/INDEXES_ROOT/SMPL_1/_bvu.cfs (deleted)
>> > java =A0 =A023024 root *350r =A0 =A0 =A0REG =A0 =A0 =A0251,0 =A0 =A0 2=
339 149384
>> > /home/INDEXES_ROOT/SMPL_1/_bvs.cfs (deleted)
>> >
>> > and this is the code I'm using (I'm using Lucene3.6)
>> >
>> > -- IndexWriter creation:
>> >
>> > File app =3D new File(path);
>> > Directory dir =3D FSDirectory.open(app);
>> > IndexWriterConfig config =3D new
>> > IndexWriterConfig(LuceneVersion.CurrentVersion,new
>> > StandardAnalyzer(LuceneVersion.CurrentVersion));
>> >
>> > //these are random tries attempting to solve the problem:
>> > config.setRAMBufferSizeMB(400);
>> > TieredMergePolicy mp =3D (TieredMergePolicy)config.getMergePolicy();
>> > mp.setUseCompoundFile(true);
>> > config.setMergePolicy(mp);
>> > IndexWriter im =3D new IndexWriter(dir,config);
>> >
>> > -- Then just a loop over my doc list calling for indexing:
>> > im.addDocument(doc, analyzer);
>> >
>> >
>> > Any idea?
>> > Thanks,
>> > Luca
>> >
>>

---------------------------------------------------------------------
To unsubscribe, e-mail: java-user-unsubscribe@lucene.apache.org
For additional commands, e-mail: java-user-help@lucene.apache.org