aos.lucene.search.advanced.MultiPhraseQueryTest.java Source code

Java tutorial

Introduction

Here is the source code for aos.lucene.search.advanced.MultiPhraseQueryTest.java

Source

/****************************************************************
 * Licensed to the AOS Community (AOS) under one or more        *
 * contributor license agreements.  See the NOTICE file         *
 * distributed with this work for additional information        *
 * regarding copyright ownership.  The AOS licenses this file   *
 * to you under the Apache License, Version 2.0 (the            *
 * "License"); you may not use this file except in compliance   *
 * with the License.  You may obtain a copy of the License at   *
 *                                                              *
 *   http://www.apache.org/licenses/LICENSE-2.0                 *
 *                                                              *
 * Unless required by applicable law or agreed to in writing,   *
 * software distributed under the License is distributed on an  *
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY       *
 * KIND, either express or implied.  See the License for the    *
 * specific language governing permissions and limitations      *
 * under the License.                                           *
 ****************************************************************/
package aos.lucene.search.advanced;

import junit.framework.TestCase;

import org.apache.lucene.queryParser.QueryParser;
import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.PhraseQuery;
import org.apache.lucene.search.MultiPhraseQuery;
import org.apache.lucene.search.BooleanClause;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.RAMDirectory;
import org.apache.lucene.util.Version;

import io.aos.lucene.analysis.synonym.SynonymAnalyzer;
import io.aos.lucene.analysis.synonym.SynonymEngine;

import java.io.IOException;

// From chapter 5
public class MultiPhraseQueryTest extends TestCase {
    private IndexSearcher searcher;

    protected void setUp() throws Exception {
        Directory directory = new RAMDirectory();
        IndexWriter writer = new IndexWriter(directory, new WhitespaceAnalyzer(Version.LUCENE_46),
                IndexWriter.MaxFieldLength.UNLIMITED);
        Document doc1 = new Document();
        doc1.add(new Field("field", "the quick brown fox jumped over the lazy dog", Field.Store.YES,
                Field.Index.ANALYZED));
        writer.addDocument(doc1);
        Document doc2 = new Document();
        doc2.add(new Field("field", "the fast fox hopped over the hound", Field.Store.YES, Field.Index.ANALYZED));
        writer.addDocument(doc2);
        writer.close();

        searcher = new IndexSearcher(directory);
    }

    public void testBasic() throws Exception {
        MultiPhraseQuery query = new MultiPhraseQuery();
        query.add(new Term[] { // #A
                new Term("field", "quick"), // #A
                new Term("field", "fast") // #A
        });
        query.add(new Term("field", "fox")); // #B
        LOGGER.info(query);

        TopDocs hits = searcher.search(query, 10);
        assertEquals("fast fox match", 1, hits.totalHits);

        query.setSlop(1);
        hits = searcher.search(query, 10);
        assertEquals("both match", 2, hits.totalHits);
    }
    /*
    #A Any of these terms may be in first position to match
    #B Only one in second position
    */

    public void testAgainstOR() throws Exception {
        PhraseQuery quickFox = new PhraseQuery();
        quickFox.setSlop(1);
        quickFox.add(new Term("field", "quick"));
        quickFox.add(new Term("field", "fox"));

        PhraseQuery fastFox = new PhraseQuery();
        fastFox.add(new Term("field", "fast"));
        fastFox.add(new Term("field", "fox"));

        BooleanQuery query = new BooleanQuery();
        query.add(quickFox, BooleanClause.Occur.SHOULD);
        query.add(fastFox, BooleanClause.Occur.SHOULD);
        TopDocs hits = searcher.search(query, 10);
        assertEquals(2, hits.totalHits);
    }

    public void testQueryParser() throws Exception {
        SynonymEngine engine = new SynonymEngine() {
            public String[] getSynonyms(String s) {
                if (s.equals("quick"))
                    return new String[] { "fast" };
                else
                    return null;
            }
        };

        Query q = new QueryParser(Version.LUCENE_46, "field", new SynonymAnalyzer(engine)).parse("\"quick fox\"");

        assertEquals("analyzed", "field:\"(quick fast) fox\"", q.toString());
        assertTrue("parsed as MultiPhraseQuery", q instanceof MultiPhraseQuery);
    }

    private void debug(TopDocs hits) throws IOException {
        for (ScoreDoc sd : hits.scoreDocs) {
            Document doc = searcher.doc(sd.doc);
            LOGGER.info(sd.score + ": " + doc.get("field"));
        }

    }
}