bmesser 2004/12/29 13:38:41
Modified: src/test/org/apache/lucene/index TestSegmentReader.java
TestIndexReader.java TestSegmentMerger.java
Log:
adjust test cases to make use of the new IndexReader.getFieldNames method
Revision Changes Path
1.7 +5 -5
jakarta-lucene/src/test/org/apache/lucene/index/TestSegmentReader.java
Index: TestSegmentReader.java
===================================================================
RCS file:
/home/cvs/jakarta-lucene/src/test/org/apache/lucene/index/TestSegmentReader.java,v
retrieving revision 1.6
retrieving revision 1.7
diff -u -r1.6 -r1.7
--- TestSegmentReader.java 19 Dec 2004 14:58:49 -0000 1.6
+++ TestSegmentReader.java 29 Dec 2004 21:38:41 -0000 1.7
@@ -104,7 +104,7 @@
}
public void testGetFieldNameVariations() {
- Collection result = reader.getFieldNames();
+ Collection result = reader.getFieldNames(IndexReader.FieldOption.ALL);
assertTrue(result != null);
assertTrue(result.size() == 6);
for (Iterator iter = result.iterator(); iter.hasNext();) {
@@ -112,7 +112,7 @@
//System.out.println("Name: " + s);
assertTrue(DocHelper.nameValues.containsKey(s) == true ||
s.equals(""));
}
- result = reader.getFieldNames(true);
+ result = reader.getFieldNames(IndexReader.FieldOption.INDEXED);
assertTrue(result != null);
assertTrue(result.size() == 5);
for (Iterator iter = result.iterator(); iter.hasNext();) {
@@ -120,15 +120,15 @@
assertTrue(DocHelper.nameValues.containsKey(s) == true ||
s.equals(""));
}
- result = reader.getFieldNames(false);
+ result = reader.getFieldNames(IndexReader.FieldOption.UNINDEXED);
assertTrue(result != null);
assertTrue(result.size() == 1);
//Get all indexed fields that are storing term vectors
- result = reader.getIndexedFieldNames(true);
+ result =
reader.getFieldNames(IndexReader.FieldOption.INDEXED_WITH_TERMVECTOR);
assertTrue(result != null);
assertTrue(result.size() == 2);
- result = reader.getIndexedFieldNames(false);
+ result =
reader.getFieldNames(IndexReader.FieldOption.INDEXED_NO_TERMVECTOR);
assertTrue(result != null);
assertTrue(result.size() == 3);
}
1.12 +63 -17
jakarta-lucene/src/test/org/apache/lucene/index/TestIndexReader.java
Index: TestIndexReader.java
===================================================================
RCS file:
/home/cvs/jakarta-lucene/src/test/org/apache/lucene/index/TestIndexReader.java,v
retrieving revision 1.11
retrieving revision 1.12
diff -u -r1.11 -r1.12
--- TestIndexReader.java 22 Dec 2004 19:43:05 -0000 1.11
+++ TestIndexReader.java 29 Dec 2004 21:38:41 -0000 1.12
@@ -62,7 +62,7 @@
writer.close();
// set up reader
IndexReader reader = IndexReader.open(d);
- Collection fieldNames = reader.getFieldNames();
+ Collection fieldNames =
reader.getFieldNames(IndexReader.FieldOption.ALL);
assertTrue(fieldNames.contains("keyword"));
assertTrue(fieldNames.contains("text"));
assertTrue(fieldNames.contains("unindexed"));
@@ -79,11 +79,17 @@
{
addDocumentWithDifferentFields(writer);
}
+ // new termvector fields
+ for (int i = 0; i < 5*writer.getMergeFactor(); i++)
+ {
+ addDocumentWithTermVectorFields(writer);
+ }
+
writer.close();
// verify fields again
reader = IndexReader.open(d);
- fieldNames = reader.getFieldNames();
- assertEquals(8, fieldNames.size()); // the following fields
+ fieldNames = reader.getFieldNames(IndexReader.FieldOption.ALL);
+ assertEquals(13, fieldNames.size()); // the following fields
assertTrue(fieldNames.contains("keyword"));
assertTrue(fieldNames.contains("text"));
assertTrue(fieldNames.contains("unindexed"));
@@ -92,22 +98,50 @@
assertTrue(fieldNames.contains("text2"));
assertTrue(fieldNames.contains("unindexed2"));
assertTrue(fieldNames.contains("unstored2"));
-
+ assertTrue(fieldNames.contains("tvnot"));
+ assertTrue(fieldNames.contains("termvector"));
+ assertTrue(fieldNames.contains("tvposition"));
+ assertTrue(fieldNames.contains("tvoffset"));
+ assertTrue(fieldNames.contains("tvpositionoffset"));
+
// verify that only indexed fields were returned
- Collection indexedFieldNames = reader.getFieldNames(true);
- assertEquals(6, indexedFieldNames.size());
- assertTrue(indexedFieldNames.contains("keyword"));
- assertTrue(indexedFieldNames.contains("text"));
- assertTrue(indexedFieldNames.contains("unstored"));
- assertTrue(indexedFieldNames.contains("keyword2"));
- assertTrue(indexedFieldNames.contains("text2"));
- assertTrue(indexedFieldNames.contains("unstored2"));
-
+ fieldNames = reader.getFieldNames(IndexReader.FieldOption.INDEXED);
+ assertEquals(11, fieldNames.size()); // 6 original + the 5
termvector fields
+ assertTrue(fieldNames.contains("keyword"));
+ assertTrue(fieldNames.contains("text"));
+ assertTrue(fieldNames.contains("unstored"));
+ assertTrue(fieldNames.contains("keyword2"));
+ assertTrue(fieldNames.contains("text2"));
+ assertTrue(fieldNames.contains("unstored2"));
+ assertTrue(fieldNames.contains("tvnot"));
+ assertTrue(fieldNames.contains("termvector"));
+ assertTrue(fieldNames.contains("tvposition"));
+ assertTrue(fieldNames.contains("tvoffset"));
+ assertTrue(fieldNames.contains("tvpositionoffset"));
+
// verify that only unindexed fields were returned
- Collection unindexedFieldNames = reader.getFieldNames(false);
- assertEquals(2, unindexedFieldNames.size()); // the following
fields
- assertTrue(unindexedFieldNames.contains("unindexed"));
- assertTrue(unindexedFieldNames.contains("unindexed2"));
+ fieldNames = reader.getFieldNames(IndexReader.FieldOption.UNINDEXED);
+ assertEquals(2, fieldNames.size()); // the following fields
+ assertTrue(fieldNames.contains("unindexed"));
+ assertTrue(fieldNames.contains("unindexed2"));
+
+ // verify index term vector fields
+ fieldNames =
reader.getFieldNames(IndexReader.FieldOption.TERMVECTOR);
+ assertEquals(1, fieldNames.size()); // 1 field has term vector
only
+ assertTrue(fieldNames.contains("termvector"));
+
+ fieldNames =
reader.getFieldNames(IndexReader.FieldOption.TERMVECTOR_WITH_POSITION);
+ assertEquals(1, fieldNames.size()); // 4 fields are indexed with
term vectors
+ assertTrue(fieldNames.contains("tvposition"));
+
+ fieldNames =
reader.getFieldNames(IndexReader.FieldOption.TERMVECTOR_WITH_OFFSET);
+ assertEquals(1, fieldNames.size()); // 4 fields are indexed with
term vectors
+ assertTrue(fieldNames.contains("tvoffset"));
+
+ fieldNames =
reader.getFieldNames(IndexReader.FieldOption.TERMVECTOR_WITH_POSITION_OFFSET);
+ assertEquals(1, fieldNames.size()); // 4 fields are indexed with
term vectors
+ assertTrue(fieldNames.contains("tvpositionoffset"));
+
}
@@ -431,6 +465,18 @@
writer.addDocument(doc);
}
+ private void addDocumentWithTermVectorFields(IndexWriter writer) throws
IOException
+ {
+ Document doc = new Document();
+ doc.add(new Field("tvnot","tvnot", Field.Store.YES,
Field.Index.TOKENIZED, Field.TermVector.NO));
+ doc.add(new Field("termvector","termvector", Field.Store.YES,
Field.Index.TOKENIZED, Field.TermVector.YES));
+ doc.add(new Field("tvoffset","tvoffset", Field.Store.YES,
Field.Index.TOKENIZED, Field.TermVector.WITH_OFFSETS));
+ doc.add(new Field("tvposition","tvposition", Field.Store.YES,
Field.Index.TOKENIZED, Field.TermVector.WITH_POSITIONS));
+ doc.add(new Field("tvpositionoffset","tvpositionoffset",
Field.Store.YES, Field.Index.TOKENIZED,
Field.TermVector.WITH_POSITIONS_OFFSETS));
+
+ writer.addDocument(doc);
+ }
+
private void addDoc(IndexWriter writer, String value)
{
Document doc = new Document();
1.7 +2 -2
jakarta-lucene/src/test/org/apache/lucene/index/TestSegmentMerger.java
Index: TestSegmentMerger.java
===================================================================
RCS file:
/home/cvs/jakarta-lucene/src/test/org/apache/lucene/index/TestSegmentMerger.java,v
retrieving revision 1.6
retrieving revision 1.7
diff -u -r1.6 -r1.7
--- TestSegmentMerger.java 5 Oct 2004 17:30:47 -0000 1.6
+++ TestSegmentMerger.java 29 Dec 2004 21:38:41 -0000 1.7
@@ -95,9 +95,9 @@
assertTrue(termDocs != null);
assertTrue(termDocs.next() == true);
- Collection stored = mergedReader.getIndexedFieldNames(true);
+ Collection stored =
mergedReader.getFieldNames(IndexReader.FieldOption.INDEXED_WITH_TERMVECTOR);
assertTrue(stored != null);
- //System.out.println("stored size: " + stored.size());
+ System.out.println("stored size: " + stored.size());
assertTrue(stored.size() == 2);
TermFreqVector vector = mergedReader.getTermFreqVector(0,
DocHelper.TEXT_FIELD_2_KEY);
---------------------------------------------------------------------
To unsubscribe, e-mail: [EMAIL PROTECTED]
For additional commands, e-mail: [EMAIL PROTECTED]