o código padrão é esse
public void simpleLucene() throws CorruptIndexException, LockObtainFailedException, IOException, ParseException {
Analyzer analyzer = new StandardAnalyzer(Version.LUCENE_CURRENT);
// Store the index in memory:
Directory directory = new RAMDirectory();
// To store an index on disk, use this instead (note that the
// parameter true will overwrite the index in that directory
// if one exists):
// Directory directory = FSDirectory.open(new File("/tmp/testindex"));
IndexWriter iwriter = new IndexWriter(directory, analyzer, true, new IndexWriter.MaxFieldLength(25000));
Document doc = new Document();
String text = "O Brasil é um país da América do Sul.";
doc.add(new Field("fieldname", text, Field.Store.YES, Field.Index.ANALYZED));
iwriter.addDocument(doc);
doc = new Document();
text = "Brasilia é a capital do Brasil";
doc.add(new Field("fieldname", text, Field.Store.YES, Field.Index.ANALYZED));
iwriter.addDocument(doc);
iwriter.close();
// Now search the index:
IndexSearcher isearcher = new IndexSearcher(directory);
// Parse a simple query that searches for "text":
QueryParser parser = new QueryParser(Version.LUCENE_CURRENT, "fieldname", analyzer);
Query query = parser.parse("Brasli"); //errado intencionalmente
TopScoreDocCollector collector = TopScoreDocCollector.create(10, true);
isearcher.search(query, collector);
System.out.println("collector.getTotalHits()=" + collector.getTotalHits());
// assertEquals(2, collector.getTotalHits());
// Iterate through the results:
ScoreDoc[] hits = collector.topDocs().scoreDocs;
for (int i = 0; i < hits.length; i++) {
Document hitDoc = isearcher.doc(hits[i].doc);
System.out.println("hitDoc.get(\"fieldname\")=" + hitDoc.get("fieldname"));
}
isearcher.close();
directory.close();
}
gostaria que ele devolvesse “Brasil” 2 ocorrências mesmo o parâmetro de busca estando errado, semelhante as consultas do google