Example usage for the org.apache.lucene.codecs.simpletext.SimpleTextCodec constructor SimpleTextCodec()

List of usage examples for the org.apache.lucene.codecs.simpletext.SimpleTextCodec constructor SimpleTextCodec()

Introduction

On this page you can find example usages of the no-argument constructor SimpleTextCodec() of the class org.apache.lucene.codecs.simpletext.SimpleTextCodec.

Prototype

public SimpleTextCodec() 

Source Link

Usage

From source file: nicta.com.au.patent.pac.index.PACIndexer.java

/**
 * Opens an {@link IndexWriter} on {@code indexDir} that writes its index
 * with {@link SimpleTextCodec} and without compound files.
 *
 * <p>The writer analyzes the Title, Abstract, Description and Claims fields
 * with an {@code EnglishAnalyzer} built from the stop-word set dedicated to
 * that field; the wrapper is given a {@code StandardAnalyzer} as its default.
 * A separate general-purpose English analyzer is also stored in
 * {@code analyzer}; it is not passed to the writer configuration here.
 *
 * @param indexDir path of the directory that holds the index
 * @throws IOException if the index directory or writer cannot be opened
 */
public PACIndexer(String indexDir) throws IOException {
    // One English analyzer per patent section, each with its own stop words.
    Map<String, Analyzer> perFieldAnalyzers = new HashMap<>();
    perFieldAnalyzers.put(PatentDocument.Title,
            new EnglishAnalyzer(Version.LUCENE_48, PatentsStopWords.TITLE_ENGLISH_STOP_WORDS_SET));
    perFieldAnalyzers.put(PatentDocument.Abstract,
            new EnglishAnalyzer(Version.LUCENE_48, PatentsStopWords.ABSTRACT_ENGLISH_STOP_WORDS_SET));
    perFieldAnalyzers.put(PatentDocument.Description,
            new EnglishAnalyzer(Version.LUCENE_48, PatentsStopWords.DESCRIPTION_ENGLISH_STOP_WORDS_SET));
    perFieldAnalyzers.put(PatentDocument.Claims,
            new EnglishAnalyzer(Version.LUCENE_48, PatentsStopWords.CLAIMS_ENGLISH_STOP_WORDS_SET));

    // Default analyzer handed to the wrapper alongside the per-field map.
    Analyzer fallbackAnalyzer = new StandardAnalyzer(Version.LUCENE_48);
    aWrapper = new PerFieldAnalyzerWrapper(fallbackAnalyzer, perFieldAnalyzers);

    analyzer = new EnglishAnalyzer(Version.LUCENE_48, PatentsStopWords.ENGLISH_STOP_WORDS_SET);

    IndexWriterConfig writerConfig = new IndexWriterConfig(Version.LUCENE_48, aWrapper);
    writerConfig.setCodec(new SimpleTextCodec());
    writerConfig.setUseCompoundFile(false);

    writer = new IndexWriter(FSDirectory.open(new File(indexDir)), writerConfig);
}

From source file: org.apache.solr.codecs.test.testSimpleTextCodec.java

License:Apache License

/**
 * Smoke test for {@link SimpleTextCodec}: recreates a plain-text index under
 * {@code INDEX_ROOT_FOLDER/plaintext}, adds three documents, checks that a
 * fresh reader reports exactly three documents, and then runs a sample
 * search through {@code searchIndex}.
 *
 * <p>Any failure is caught and its stack trace printed.
 *
 * @param args unused
 */
public static void main(String[] args) {
    try {
        plaintextDir = assureDirectoryExists(new File(INDEX_ROOT_FOLDER, "plaintext"));

        //----------- index documents -------
        StandardAnalyzer analyzer = new StandardAnalyzer(Version.LUCENE_48);
        IndexWriterConfig config = new IndexWriterConfig(Version.LUCENE_48, analyzer);
        // recreate the index on each execution
        config.setOpenMode(IndexWriterConfig.OpenMode.CREATE);
        config.setCodec(new SimpleTextCodec());
        // NOTE(review): presumably disabled so the codec's text files are not packed
        // into a compound file -- confirm.
        config.setUseCompoundFile(false);

        // try-with-resources guarantees the directory, writer and reader are released
        // (including the index write lock) even when indexing or verification fails.
        try (Directory luceneDir = FSDirectory.open(plaintextDir)) {
            try (IndexWriter writer = new IndexWriter(luceneDir, config)) {
                writer.addDocument(Arrays.asList(new TextField("title", "The title of my first document", Store.YES),
                        new TextField("content", "The content of the first document", Store.YES)));
                writer.addDocument(Arrays.asList(new TextField("title", "The tAtle of the second document", Store.YES),
                        new TextField("content", "The content of the second document", Store.YES)));
                writer.addDocument(Arrays.asList(new TextField("title", "The title of the third document", Store.YES),
                        new TextField("content", "The content of the third document", Store.YES)));
                writer.commit();
            }

            // now test for docs
            try (IndexReader reader = DirectoryReader.open(luceneDir)) {
                int numDocs = reader.numDocs();
                if (numDocs != 3) {
                    // The check is an inequality, so report both counts instead of claiming "less than".
                    throw new IOException("expected 3 indexed docs but reader returned " + numDocs);
                }
                System.out.println("test passed");
            }
        }

        searchIndex("content", "third");
    } catch (Throwable te) {
        te.printStackTrace();
    }
}

From source file: org.apache.solr.core.SimpleTextCodecFactory.java

License:Apache License

/**
 * Initializes the factory via the superclass and then installs a new
 * {@link SimpleTextCodec} as this factory's codec.
 *
 * <p>With assertions enabled, fails if a codec has already been set.
 *
 * @param args initialization arguments, forwarded unchanged to {@code super.init}
 */
@Override
public void init(NamedList args) {
    super.init(args);

    // Guard against a second initialization overwriting an existing codec.
    assert codec == null;

    SimpleTextCodec plainTextCodec = new SimpleTextCodec();
    codec = plainTextCodec;
}