Example usage for org.apache.lucene.analysis.it ItalianAnalyzer ItalianAnalyzer

List of usage examples for org.apache.lucene.analysis.it ItalianAnalyzer ItalianAnalyzer

Introduction

On this page you can find example usages of the no-argument constructor ItalianAnalyzer() of the class org.apache.lucene.analysis.it.ItalianAnalyzer.

Prototype

public ItalianAnalyzer() 

Source Link

Document

Builds an analyzer with the default stop words (see DEFAULT_STOPWORD_FILE).

Usage

From source file:de.mirkosertic.desktopsearch.AnalyzerCache.java

License:Open Source License

public AnalyzerCache(Configuration aConfiguration) {
    standardAnalyzer = configure(new StandardAnalyzer());
    analyzerByLanguage = new HashMap<>();

    registerIfEnabled(SupportedLanguage.ar, aConfiguration, configure(new ArabicAnalyzer()));
    registerIfEnabled(SupportedLanguage.bg, aConfiguration, configure(new BulgarianAnalyzer()));
    registerIfEnabled(SupportedLanguage.br, aConfiguration, configure(new BrazilianAnalyzer()));
    registerIfEnabled(SupportedLanguage.ca, aConfiguration, configure(new CatalanAnalyzer()));
    registerIfEnabled(SupportedLanguage.ckb, aConfiguration, configure(new SoraniAnalyzer()));
    registerIfEnabled(SupportedLanguage.cz, aConfiguration, configure(new CzechAnalyzer()));
    registerIfEnabled(SupportedLanguage.da, aConfiguration, configure(new DanishAnalyzer()));
    registerIfEnabled(SupportedLanguage.de, aConfiguration, configure(new GermanAnalyzer()));
    registerIfEnabled(SupportedLanguage.el, aConfiguration, configure(new GreekAnalyzer()));
    registerIfEnabled(SupportedLanguage.en, aConfiguration, configure(new EnglishAnalyzer()));
    registerIfEnabled(SupportedLanguage.es, aConfiguration, configure(new SpanishAnalyzer()));
    registerIfEnabled(SupportedLanguage.eu, aConfiguration, configure(new BasqueAnalyzer()));
    registerIfEnabled(SupportedLanguage.fa, aConfiguration, configure(new PersianAnalyzer()));
    registerIfEnabled(SupportedLanguage.fi, aConfiguration, configure(new FinnishAnalyzer()));
    registerIfEnabled(SupportedLanguage.fr, aConfiguration, configure(new FrenchAnalyzer()));
    registerIfEnabled(SupportedLanguage.ga, aConfiguration, configure(new IrishAnalyzer()));
    registerIfEnabled(SupportedLanguage.gl, aConfiguration, configure(new GalicianAnalyzer()));
    registerIfEnabled(SupportedLanguage.hi, aConfiguration, configure(new HindiAnalyzer()));
    registerIfEnabled(SupportedLanguage.hu, aConfiguration, configure(new HungarianAnalyzer()));
    registerIfEnabled(SupportedLanguage.hy, aConfiguration, configure(new ArmenianAnalyzer()));
    registerIfEnabled(SupportedLanguage.id, aConfiguration, configure(new IndonesianAnalyzer()));
    registerIfEnabled(SupportedLanguage.it, aConfiguration, configure(new ItalianAnalyzer()));
    registerIfEnabled(SupportedLanguage.lv, aConfiguration, configure(new LatvianAnalyzer()));
    registerIfEnabled(SupportedLanguage.nl, aConfiguration, configure(new DutchAnalyzer()));
    registerIfEnabled(SupportedLanguage.no, aConfiguration, configure(new NorwegianAnalyzer()));
    registerIfEnabled(SupportedLanguage.pt, aConfiguration, configure(new PortugueseAnalyzer()));
    registerIfEnabled(SupportedLanguage.ro, aConfiguration, configure(new RomanianAnalyzer()));
    registerIfEnabled(SupportedLanguage.ru, aConfiguration, configure(new RussianAnalyzer()));
    registerIfEnabled(SupportedLanguage.sv, aConfiguration, configure(new SwedishAnalyzer()));
    registerIfEnabled(SupportedLanguage.th, aConfiguration, configure(new ThaiAnalyzer()));
    registerIfEnabled(SupportedLanguage.tr, aConfiguration, configure(new TurkishAnalyzer()));
}

From source file:evalita.q4faq.baseline.Index.java

License:Open Source License

/**
 * Builds a Lucene index from a semicolon-delimited CSV file.
 * <p>
 * Every record is read by the column names {@code id}, {@code question},
 * {@code answer} and {@code tag}. The id is parsed as an integer and stored
 * as an untokenized string field; question, answer and tag are indexed as
 * text (not stored), with commas in the tag value replaced by spaces. Text
 * is analyzed with {@code ItalianAnalyzer}.
 * <p>
 * I/O problems and invalid arguments or input (including a non-numeric id)
 * are logged at {@code SEVERE} level rather than propagated.
 *
 * @param args the command line arguments: {@code args[0]} is the CSV input
 *             file, {@code args[1]} is the index directory
 */
public static void main(String[] args) {
    try {
        if (args.length <= 1) {
            throw new IllegalArgumentException("Number of arguments not valid");
        }
        // try-with-resources closes both the CSV reader and the index writer
        // on every exit path; previously the reader was never closed and the
        // writer was left open whenever a record failed to parse or index.
        try (Reader in = new FileReader(args[0]);
                IndexWriter writer = new IndexWriter(FSDirectory.open(new File(args[1])),
                        new IndexWriterConfig(Version.LATEST, new ItalianAnalyzer()))) {
            Iterable<CSVRecord> records = CSVFormat.EXCEL.withHeader().withDelimiter(';').parse(in);
            for (CSVRecord record : records) {
                // Parsing validates that the id is numeric and normalizes its text form.
                int id = Integer.parseInt(record.get("id"));
                String question = record.get("question");
                String answer = record.get("answer");
                String tag = record.get("tag");

                Document doc = new Document();
                doc.add(new StringField("id", String.valueOf(id), Field.Store.YES));
                doc.add(new TextField("question", question, Field.Store.NO));
                doc.add(new TextField("answer", answer, Field.Store.NO));
                // Tags arrive comma-separated; spaces let the analyzer split them into terms.
                doc.add(new TextField("tag", tag.replace(",", " "), Field.Store.NO));
                writer.addDocument(doc);
            }
        }
    } catch (IOException | IllegalArgumentException ex) {
        Logger.getLogger(Index.class.getName()).log(Level.SEVERE, null, ex);
    }
}

From source file:evalita.q4faq.baseline.Search.java

License:Open Source License

/**
 * Runs every query from a tab-separated query file against an existing
 * index and writes the top hits to an output file.
 * <p>
 * Each non-blank input line must have the form {@code <query id>\t<query text>}.
 * The characters {@code ?}, {@code !} and {@code /} in the query text are
 * replaced by spaces before parsing. The query is parsed over the fields
 * {@code question}, {@code answer} and {@code tag} with boosts 4, 2 and 1
 * respectively, using {@code ItalianAnalyzer}. For each of the up to 25
 * best hits one line {@code <query id>\t<document id>\t<score>} is written.
 * <p>
 * I/O problems, query parse errors and invalid arguments or input lines
 * are logged at {@code SEVERE} level rather than propagated.
 *
 * @param args the command line arguments: {@code args[0]} is the index
 *             directory, {@code args[1]} the query file, {@code args[2]}
 *             the output file
 */
public static void main(String[] args) {
    try {
        if (args.length <= 2) {
            throw new IllegalArgumentException("Number of arguments not valid");
        }
        // try-with-resources guarantees the index reader, the query file and
        // the (buffered) output file are closed on every exit path, so output
        // already produced is flushed even when a later query fails.
        try (DirectoryReader indexReader = DirectoryReader.open(FSDirectory.open(new File(args[0])));
                BufferedReader reader = new BufferedReader(new FileReader(args[1]));
                BufferedWriter writer = new BufferedWriter(new FileWriter(args[2]))) {
            IndexSearcher searcher = new IndexSearcher(indexReader);
            String[] fields = new String[] { "question", "answer", "tag" };
            Map<String, Float> boosts = new HashMap<>();
            boosts.put("question", 4f);
            boosts.put("answer", 2f);
            boosts.put("tag", 1f);
            QueryParser parser = new MultiFieldQueryParser(fields, new ItalianAnalyzer(), boosts);

            // readLine() returning null is the reliable end-of-input signal;
            // ready() only reports whether a read would block.
            String line;
            while ((line = reader.readLine()) != null) {
                if (line.trim().isEmpty()) {
                    continue; // tolerate blank lines, e.g. at the end of the file
                }
                String[] split = line.split("\t");
                if (split.length < 2) {
                    throw new IllegalArgumentException(
                            "Malformed query line, expected <id><TAB><query>: " + line);
                }
                Query q = parser.parse(split[1].replace("?", " ").replace("!", " ").replace("/", " "));
                TopDocs topdocs = searcher.search(q, 25);
                for (ScoreDoc res : topdocs.scoreDocs) {
                    writer.append(split[0]).append("\t");
                    writer.append(searcher.doc(res.doc).get("id")).append("\t");
                    writer.append(String.valueOf(res.score));
                    writer.newLine();
                }
            }
        }
    } catch (IOException | IllegalArgumentException | ParseException ex) {
        Logger.getLogger(Search.class.getName()).log(Level.SEVERE, null, ex);
    }
}