org.sindice.siren.search.TestSirenTermScorer.java Source code

Java tutorial

Introduction

Here is the source code for org.sindice.siren.search.TestSirenTermScorer.java

Source

/**
 * Copyright 2009, Renaud Delbru
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
/**
 * @project siren
 * @author Renaud Delbru [ 10 Dec 2009 ]
 * @link http://renaud.delbru.fr/
 * @copyright Copyright (C) 2009 by Renaud Delbru, All rights reserved.
 */
package org.sindice.siren.search;

import static org.junit.Assert.*;

import java.io.IOException;

import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermPositions;
import org.apache.lucene.search.DefaultSimilarity;
import org.apache.lucene.search.DocIdSetIterator;
import org.junit.Test;

public class TestSirenTermScorer extends AbstractTestSirenScorer {

    @Test(expected = RuntimeException.class)
    public void testNextPositionFail() throws Exception {
        _helper.addDocument("<http://renaud.delbru.fr/> . ");
        final Term term = new Term(QueryTestingHelper.DEFAULT_FIELD, "renaud");
        final IndexReader reader = _helper.getIndexReader();
        final TermPositions termPositions = reader.termPositions(term);

        final SirenTermScorer scorer = new SirenTermScorer(new ConstantWeight(), termPositions,
                new DefaultSimilarity(), reader.norms(term.field()));
        scorer.nextPosition();
    }

    @Test
    public void testNextWithURI() throws Exception {
        this.assertTo(new AssertNextEntityFunctor(),
                new String[] { "<http://renaud.delbru.fr/> <http://renaud.delbru.fr/> . " },
                new String[] { "renaud" }, 1, new int[] { 1 }, new int[] { 2 }, new int[] { 0 }, new int[] { 0 },
                new int[] { 0 }, new int[] { 0 });
        this.assertTo(new AssertNextEntityFunctor(),
                new String[] { "<http://renaud.delbru.fr/> <http://renaud.delbru.fr/> . ",
                        "<http://renaud.delbru.fr/> <http://test/name> \"Renaud Delbru\" . " },
                new String[] { "renaud" }, 2, new int[] { 1, 1 }, new int[] { 2, 2 }, new int[] { 0, 1 },
                new int[] { 0, 0 }, new int[] { 0, 0 }, new int[] { 0, 0 });
    }

    @Test
    public void testNextPositionWithURI() throws Exception {
        this.assertTo(new AssertNextPositionEntityFunctor(),
                new String[] { "<http://renaud.delbru.fr/> <http://renaud.delbru.fr/> . " },
                new String[] { "renaud" }, 1, new int[] { 1 }, new int[] { 2 }, new int[] { 0, 0 },
                new int[] { 0, 0 }, new int[] { 0, 1 }, new int[] { 0, 2 });
        this.assertTo(new AssertNextPositionEntityFunctor(),
                new String[] { "<http://renaud.delbru.fr/> <http://renaud.delbru.fr/> . \n"
                        + "<http://renaud.delbru.fr/> <http://test/name> \"Renaud Delbru\" . " },
                new String[] { "renaud" }, 1, new int[] { 2 }, new int[] { 2, 2 }, new int[] { 0, 0, 0, 0 },
                new int[] { 0, 0, 1, 1 }, new int[] { 0, 1, 0, 2 }, new int[] { 0, 2, 4, 8 });
    }

    @Test
    public void testSkipToEntityTupleCell() throws Exception {
        for (int i = 0; i < 32; i++)
            _helper.addDocument("<http://renaud.delbru.fr/> . \"renaud delbru\" \"renaud delbru\" . ");
        final SirenScorer scorer = this.getTermScorer(QueryTestingHelper.DEFAULT_FIELD, "renaud");
        assertFalse(scorer.advance(16, 1, 1) == DocIdSetIterator.NO_MORE_DOCS);
        assertEquals(16, scorer.docID());
        assertEquals(16, scorer.entity());
        assertEquals(1, scorer.tuple());
        assertEquals(1, scorer.cell());
        assertEquals(-1, scorer.dataset());
        assertEquals(4, scorer.pos());
    }

    @Test
    public void testSkipToNonExistingEntityTupleCell() throws Exception {
        for (int i = 0; i < 32; i++)
            _helper.addDocument("<http://renaud.delbru.fr/> . \"renaud delbru\" \"renaud delbru\" . ");
        final SirenScorer scorer = this.getTermScorer(QueryTestingHelper.DEFAULT_FIELD, "renaud");
        // does not exist, should skip to entity 17 and first cell
        assertFalse(scorer.advance(16, 3, 2) == DocIdSetIterator.NO_MORE_DOCS);
        assertEquals(17, scorer.docID());
        assertEquals(17, scorer.entity());
        assertEquals(0, scorer.tuple());
        assertEquals(0, scorer.cell());
        assertEquals(-1, scorer.dataset());
        assertEquals(0, scorer.pos());
    }

    @Test
    public void testSkipToEntityTupleCellNextPosition() throws Exception {
        for (int i = 0; i < 32; i++)
            _helper.addDocument("<http://renaud.delbru.fr/> . \"renaud delbru\" \"renaud delbru\" . ");
        final SirenScorer scorer = this.getTermScorer(QueryTestingHelper.DEFAULT_FIELD, "delbru");
        assertFalse(scorer.advance(16, 1, 0) == DocIdSetIterator.NO_MORE_DOCS);
        assertEquals(16, scorer.docID());
        assertEquals(16, scorer.entity());
        assertEquals(1, scorer.tuple());
        assertEquals(0, scorer.cell());
        assertEquals(-1, scorer.dataset());
        assertEquals(3, scorer.pos());

        // Should not return match in first tuple (tuple 0)
        assertFalse(scorer.nextPosition() == SirenIdIterator.NO_MORE_POS);
        assertEquals(1, scorer.tuple());
        assertEquals(1, scorer.cell());
        assertEquals(-1, scorer.dataset());
        assertEquals(5, scorer.pos());

        assertTrue(scorer.nextPosition() == SirenIdIterator.NO_MORE_POS);
    }

    @Test(expected = Exception.class)
    public void testInvalidScoreCall() throws IOException {
        _helper.addDocument("\"Renaud\" . ");

        final Term t = new Term(QueryTestingHelper.DEFAULT_FIELD, "renaud");
        final IndexReader reader = _helper.getIndexReader();
        final TermPositions termPositions = reader.termPositions(t);

        final SirenTermScorer scorer = new SirenTermScorer(new ConstantWeight(), termPositions,
                new DefaultSimilarity(), reader.norms(QueryTestingHelper.DEFAULT_FIELD));

        assertNotNull("scorer is null and it shouldn't be", scorer);

        // Invalid call
        scorer.score();
    }

    @Test
    public void testScore() throws IOException {
        _helper.addDocument("\"Renaud\" . ");

        final Term t = new Term(QueryTestingHelper.DEFAULT_FIELD, "renaud");
        final IndexReader reader = _helper.getIndexReader();
        final TermPositions termPositions = reader.termPositions(t);

        final SirenTermScorer scorer = new SirenTermScorer(new ConstantWeight(), termPositions,
                new DefaultSimilarity(), reader.norms(QueryTestingHelper.DEFAULT_FIELD));
        assertNotNull("scorer is null and it shouldn't be", scorer);

        assertNotNull("next returns null and it shouldn't be", scorer.nextDoc());
        assertEquals(0, scorer.entity());
        // All it does is returning the term frequency since weight is constant
        assertEquals(1.0, scorer.score(), 0.01);
    }

    ///////////////////////////////////
    //
    // END OF TESTS
    // START HELPER METHODS AND CLASSES
    //
    ///////////////////////////////////

    @Override
    protected void assertTo(final AssertFunctor functor, final String[] input, final String[] terms,
            final int expectedNumDocs, final int[] expectedNumTuples, final int[] expectedNumCells,
            final int[] expectedEntityID, final int[] expectedTupleID, final int[] expectedCellID,
            final int[] expectedPos) throws Exception {
        _helper.reset();
        _helper.addDocuments(input);
        final IndexReader reader = _helper.getIndexReader();
        assertEquals(expectedNumDocs, reader.numDocs());

        SirenTermScorer scorer = null;
        for (final String t : terms) {
            scorer = this.getTermScorer(QueryTestingHelper.DEFAULT_FIELD, t);
            functor.run(scorer, expectedNumDocs, expectedNumTuples, expectedNumCells, expectedEntityID,
                    expectedTupleID, expectedCellID, expectedPos);
        }
        reader.close();
    }

}