File | Doc | Category | Size | Date | Package
TestSegmentTermEnum.java | API Doc | Apache Lucene 1.4.3 | 2862 | Mon Jun 14 02:16:06 BST 2004 | org.apache.lucene.index

TestSegmentTermEnum

public class TestSegmentTermEnum extends TestCase
author
goller

Fields Summary
Directory
dir
Constructors Summary
Methods Summary
private voidaddDoc(org.apache.lucene.index.IndexWriter writer, java.lang.String value)

    Document doc = new Document();
    doc.add(Field.UnStored("content", value));

    try {
      writer.addDocument(doc);
    }
    catch (IOException e) {
      e.printStackTrace();
    }
  
public voidtestTermEnum()


    
  
    IndexWriter writer = null;

    try {
      writer  = new IndexWriter(dir, new WhitespaceAnalyzer(), true);

      // add 100 documents with term : aaa
      // add 100 documents with terms: aaa bbb
      // Therefore, term 'aaa' has document frequency of 200 and term 'bbb' 100
      for (int i = 0; i < 100; i++) {
        addDoc(writer, "aaa");
        addDoc(writer, "aaa bbb");
      }

      writer.close();
    }
    catch (IOException e) {
      e.printStackTrace();
    }

    try {
      // verify document frequency of terms in an unoptimized index
      verifyDocFreq();

      // merge segments by optimizing the index
      writer = new IndexWriter(dir, new WhitespaceAnalyzer(), false);
      writer.optimize();
      writer.close();

      // verify document frequency of terms in an optimized index
      verifyDocFreq();
    }
    catch (IOException e2) {
      e2.printStackTrace();
    }
  
/*
 * Opens a reader on 'dir' and checks the term enumeration twice:
 *   1. over all terms, starting before the first term;
 *   2. starting at Term("content", "aaa").
 * In both passes the expected sequence is 'aaa' with document frequency 200
 * followed by 'bbb' with document frequency 100.
 *
 * NOTE(review): the reader opened below is not closed anywhere in the lines
 * visible here -- confirm whether a reader.close() follows or is missing.
 * NOTE(review): the boolean result of termEnum.next() is never checked; the
 * assertions that follow are relied on to catch a missing term -- confirm
 * that term() behaves acceptably when the enumeration is exhausted.
 */
private voidverifyDocFreq()

      IndexReader reader = IndexReader.open(dir);
      TermEnum termEnum = null;

    // --- pass 1: enumerate every term in the index ---
    // create enumeration of all terms
    termEnum = reader.terms();
    // go to the first term (aaa); next() is called before the first term is read
    termEnum.next();
    // assert that term is 'aaa'
    assertEquals("aaa", termEnum.term().text());
    assertEquals(200, termEnum.docFreq());
    // go to the second term (bbb)
    termEnum.next();
    // assert that term is 'bbb'
    assertEquals("bbb", termEnum.term().text());
    assertEquals(100, termEnum.docFreq());

    termEnum.close();


    // --- pass 2: enumerate starting at a given term ---
    // create enumeration of terms after term 'aaa', including 'aaa'
    termEnum = reader.terms(new Term("content", "aaa"));
    // assert that term is 'aaa' (no next() call here: the term is read directly)
    assertEquals("aaa", termEnum.term().text());
    assertEquals(200, termEnum.docFreq());
    // go to term 'bbb'
    termEnum.next();
    // assert that term is 'bbb'
    assertEquals("bbb", termEnum.term().text());
    assertEquals(100, termEnum.docFreq());

    termEnum.close();