com.leavesfly.lia.tool.ChainedFilterTest.java Source code

Java tutorial

Introduction

Here is the source code for com.leavesfly.lia.tool.ChainedFilterTest.java

Source

package com.leavesfly.lia.tool;

/**
 * Copyright Manning Publications Co.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific lan      
 */

import junit.framework.TestCase;

import org.apache.lucene.store.RAMDirectory;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.BooleanClause;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.TermRangeFilter;
import org.apache.lucene.search.QueryWrapperFilter;
import org.apache.lucene.search.CachingWrapperFilter;
import org.apache.lucene.search.Filter;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.DateTools;
import org.apache.lucene.document.Field;
import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.misc.ChainedFilter;

import com.leavesfly.lia.commom.TestUtil;

import java.util.Calendar;

// From chapter 9
public class ChainedFilterTest extends TestCase {
    public static final int MAX = 500;
    private RAMDirectory directory;
    private IndexSearcher searcher;
    private Query query;
    private Filter dateFilter;
    private Filter bobFilter;
    private Filter sueFilter;

    public void setUp() throws Exception {
        directory = new RAMDirectory();
        IndexWriter writer = new IndexWriter(directory, new WhitespaceAnalyzer(),
                IndexWriter.MaxFieldLength.UNLIMITED);

        Calendar cal = Calendar.getInstance();
        cal.set(2009, 1, 1, 0, 0); // A

        for (int i = 0; i < MAX; i++) {
            Document doc = new Document();
            doc.add(new Field("key", "" + (i + 1), Field.Store.YES, Field.Index.NOT_ANALYZED));
            doc.add(new Field("owner", (i < MAX / 2) ? "bob" : "sue", Field.Store.YES, Field.Index.NOT_ANALYZED));
            doc.add(new Field("date", DateTools.timeToString(cal.getTimeInMillis(), DateTools.Resolution.DAY),
                    Field.Store.YES, Field.Index.NOT_ANALYZED));
            writer.addDocument(doc);

            cal.add(Calendar.DATE, 1);
        }

        writer.close();

        searcher = new IndexSearcher(directory);

        BooleanQuery bq = new BooleanQuery(); // B
        bq.add(new TermQuery(new Term("owner", "bob")), // B
                BooleanClause.Occur.SHOULD); // B
        bq.add(new TermQuery(new Term("owner", "sue")), // B
                BooleanClause.Occur.SHOULD); // B
        query = bq;

        cal.set(2099, 1, 1, 0, 0);
        dateFilter = TermRangeFilter.Less("date", // C
                DateTools.timeToString( // C
                        cal.getTimeInMillis(), // C
                        DateTools.Resolution.DAY));// C

        bobFilter = new CachingWrapperFilter( // D
                new QueryWrapperFilter( // D
                        new TermQuery(new Term("owner", "bob")))); // D

        sueFilter = new CachingWrapperFilter( // E
                new QueryWrapperFilter( // E
                        new TermQuery(new Term("owner", "sue")))); // E
    }

    /*
     * #A 2009 January 01 #B BooleanQuery that matches all documents #C Date
     * filter also matches all documents #D Matches only Bob's documents #E
     * Matches only Sue's documents
     */

    public void testSingleFilter() throws Exception {
        ChainedFilter chain = new ChainedFilter(new Filter[] { dateFilter });
        TopDocs hits = searcher.search(query, chain, 10);
        assertEquals(MAX, hits.totalHits);

        chain = new ChainedFilter(new Filter[] { bobFilter });
        assertEquals(MAX / 2, TestUtil.hitCount(searcher, query, chain), hits.totalHits);
    }

    public void testOR() throws Exception {
        ChainedFilter chain = new ChainedFilter(new Filter[] { sueFilter, bobFilter });

        assertEquals("OR matches all", MAX, TestUtil.hitCount(searcher, query, chain));
    }

    public void testAND() throws Exception {
        ChainedFilter chain = new ChainedFilter(new Filter[] { dateFilter, bobFilter }, ChainedFilter.AND);
        TopDocs hits = searcher.search(query, chain, 10);
        assertEquals("AND matches just Bob", MAX / 2, hits.totalHits);
        Document firstDoc = searcher.doc(hits.scoreDocs[0].doc);
        assertEquals("bob", firstDoc.get("owner"));
    }

    public void testXOR() throws Exception {
        ChainedFilter chain = new ChainedFilter(new Filter[] { dateFilter, bobFilter }, ChainedFilter.XOR);
        TopDocs hits = searcher.search(query, chain, 10);
        assertEquals("XOR matches Sue", MAX / 2, hits.totalHits);
        Document firstDoc = searcher.doc(hits.scoreDocs[0].doc);
        assertEquals("sue", firstDoc.get("owner"));
    }

    public void testANDNOT() throws Exception {
        ChainedFilter chain = new ChainedFilter(new Filter[] { dateFilter, sueFilter },
                new int[] { ChainedFilter.AND, ChainedFilter.ANDNOT });

        TopDocs hits = searcher.search(query, chain, 10);
        assertEquals("ANDNOT matches just Bob", MAX / 2, hits.totalHits);
        Document firstDoc = searcher.doc(hits.scoreDocs[0].doc);
        assertEquals("bob", firstDoc.get("owner"));
    }
}