2021-02-03 13:48:30 +01:00
|
|
|
package it.cavallium.dbengine.client;
|
|
|
|
|
2021-03-02 01:53:36 +01:00
|
|
|
import it.cavallium.dbengine.client.query.QueryUtils;
|
|
|
|
import it.cavallium.dbengine.client.query.current.data.QueryParams;
|
|
|
|
import it.cavallium.dbengine.client.query.current.data.ScoreMode;
|
|
|
|
import it.cavallium.dbengine.client.query.current.data.ScoreSort;
|
2021-02-03 13:48:30 +01:00
|
|
|
import it.cavallium.dbengine.database.LLDocument;
|
|
|
|
import it.cavallium.dbengine.database.LLItem;
|
|
|
|
import it.cavallium.dbengine.database.LLLuceneIndex;
|
2021-03-03 15:03:25 +01:00
|
|
|
import it.cavallium.dbengine.database.LLSignal;
|
2021-02-03 13:48:30 +01:00
|
|
|
import it.cavallium.dbengine.database.LLTerm;
|
2021-03-02 01:53:36 +01:00
|
|
|
import it.cavallium.dbengine.database.disk.LLLocalDatabaseConnection;
|
2021-02-04 22:42:57 +01:00
|
|
|
import it.cavallium.dbengine.lucene.LuceneUtils;
|
|
|
|
import it.cavallium.dbengine.lucene.analyzer.TextFieldsAnalyzer;
|
|
|
|
import it.cavallium.dbengine.lucene.analyzer.TextFieldsSimilarity;
|
2021-02-03 13:48:30 +01:00
|
|
|
import java.io.IOException;
|
|
|
|
import java.nio.file.Files;
|
|
|
|
import java.nio.file.Path;
|
|
|
|
import java.time.Duration;
|
|
|
|
import java.util.Comparator;
|
|
|
|
import java.util.StringJoiner;
|
|
|
|
import java.util.concurrent.CompletionException;
|
|
|
|
import org.apache.lucene.document.Field.Store;
|
|
|
|
import reactor.core.publisher.Mono;
|
|
|
|
import reactor.core.scheduler.Schedulers;
|
|
|
|
|
|
|
|
public class IndicizationExample {
|
|
|
|
|
|
|
|
public static void main(String[] args) {
|
|
|
|
tempIndex(true)
|
|
|
|
.flatMap(index -> index
|
|
|
|
.addDocument(new LLTerm("id", "123"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "123", Store.YES),
|
2021-02-04 22:42:57 +01:00
|
|
|
LLItem.newTextField("name", "Mario", Store.NO),
|
2021-02-03 13:48:30 +01:00
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
)
|
|
|
|
.then(index.refresh())
|
2021-02-14 13:46:11 +01:00
|
|
|
.then(index.search(null,
|
2021-03-02 01:53:36 +01:00
|
|
|
QueryParams
|
|
|
|
.builder()
|
|
|
|
.query(QueryUtils.exactSearch(TextFieldsAnalyzer.N4GramPartialString, "name", "Mario"))
|
|
|
|
.limit(1)
|
|
|
|
.sort(ScoreSort.of())
|
|
|
|
.scoreMode(ScoreMode.of(false, true))
|
|
|
|
.build(),
|
2021-02-14 13:46:11 +01:00
|
|
|
"id"
|
|
|
|
))
|
2021-03-03 15:03:25 +01:00
|
|
|
.flatMap(results -> Mono.from(results
|
2021-02-03 13:48:30 +01:00
|
|
|
.results()
|
|
|
|
.flatMap(r -> r)
|
2021-03-03 15:03:25 +01:00
|
|
|
.doOnNext(signal -> {
|
|
|
|
if (signal.isValue()) {
|
|
|
|
System.out.println("Value: " + signal.getValue());
|
|
|
|
}
|
|
|
|
})
|
|
|
|
.filter(LLSignal::isTotalHitsCount))
|
2021-02-03 13:48:30 +01:00
|
|
|
)
|
|
|
|
.doOnNext(count -> System.out.println("Total hits: " + count))
|
|
|
|
.doOnTerminate(() -> System.out.println("Completed"))
|
|
|
|
.then(index.close())
|
|
|
|
)
|
|
|
|
.subscribeOn(Schedulers.parallel())
|
2022-07-02 11:44:13 +02:00
|
|
|
.transform(LLUtils::handleDiscard)
|
2021-02-03 13:48:30 +01:00
|
|
|
.block();
|
2021-02-04 22:42:57 +01:00
|
|
|
tempIndex(true)
|
|
|
|
.flatMap(index ->
|
|
|
|
index
|
|
|
|
.addDocument(new LLTerm("id", "126"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "126", Store.YES),
|
|
|
|
LLItem.newTextField("name", "Marioxq", Store.NO),
|
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
)
|
|
|
|
.then(index
|
|
|
|
.addDocument(new LLTerm("id", "123"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "123", Store.YES),
|
|
|
|
LLItem.newTextField("name", "Mario", Store.NO),
|
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
))
|
|
|
|
.then(index
|
|
|
|
.addDocument(new LLTerm("id", "124"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "124", Store.YES),
|
|
|
|
LLItem.newTextField("name", "Mariossi", Store.NO),
|
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
))
|
|
|
|
.then(index
|
|
|
|
.addDocument(new LLTerm("id", "125"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "125", Store.YES),
|
|
|
|
LLItem.newTextField("name", "Mario marios", Store.NO),
|
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
))
|
|
|
|
.then(index
|
|
|
|
.addDocument(new LLTerm("id", "128"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "128", Store.YES),
|
|
|
|
LLItem.newTextField("name", "Marion", Store.NO),
|
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
))
|
|
|
|
.then(index
|
|
|
|
.addDocument(new LLTerm("id", "127"),
|
|
|
|
new LLDocument(new LLItem[]{
|
|
|
|
LLItem.newStringField("id", "127", Store.YES),
|
|
|
|
LLItem.newTextField("name", "Mariotto", Store.NO),
|
|
|
|
LLItem.newStringField("surname", "Rossi", Store.NO)
|
|
|
|
})
|
|
|
|
))
|
|
|
|
.then(index.refresh())
|
2021-03-02 01:53:36 +01:00
|
|
|
.then(index.search(null,
|
|
|
|
QueryParams
|
|
|
|
.builder()
|
|
|
|
.query(QueryUtils.exactSearch(TextFieldsAnalyzer.N4GramPartialString, "name", "Mario"))
|
|
|
|
.limit(10)
|
|
|
|
.sort(MultiSort.topScore().getQuerySort())
|
|
|
|
.scoreMode(ScoreMode.of(false, true))
|
|
|
|
.build(),
|
|
|
|
"id"
|
|
|
|
))
|
2021-03-03 17:29:14 +01:00
|
|
|
.flatMap(results -> LuceneUtils.mergeSignalStreamRaw(results
|
2021-02-22 01:54:25 +01:00
|
|
|
.results(), MultiSort.topScoreRaw(), 10L)
|
2021-02-04 22:42:57 +01:00
|
|
|
.doOnNext(value -> System.out.println("Value: " + value))
|
2021-03-03 15:03:25 +01:00
|
|
|
.then(Mono.from(results
|
|
|
|
.results()
|
|
|
|
.flatMap(part -> part)
|
|
|
|
.filter(LLSignal::isTotalHitsCount)
|
|
|
|
.map(LLSignal::getTotalHitsCount)))
|
2021-02-04 22:42:57 +01:00
|
|
|
)
|
|
|
|
.doOnNext(count -> System.out.println("Total hits: " + count))
|
|
|
|
.doOnTerminate(() -> System.out.println("Completed"))
|
|
|
|
.then(index.close())
|
|
|
|
)
|
|
|
|
.subscribeOn(Schedulers.parallel())
|
2022-07-02 11:44:13 +02:00
|
|
|
.transform(LLUtils::handleDiscard)
|
2021-02-04 22:42:57 +01:00
|
|
|
.block();
|
2021-02-03 13:48:30 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static final class CurrentCustomType {
|
|
|
|
|
|
|
|
private final int number;
|
|
|
|
|
|
|
|
public CurrentCustomType(int number) {
|
|
|
|
this.number = number;
|
|
|
|
}
|
|
|
|
|
|
|
|
public int getNumber() {
|
|
|
|
return number;
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public String toString() {
|
|
|
|
return new StringJoiner(", ", CurrentCustomType.class.getSimpleName() + "[", "]")
|
|
|
|
.add("number=" + number)
|
|
|
|
.toString();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private static <U> Mono<? extends LLLuceneIndex> tempIndex(boolean delete) {
|
|
|
|
var wrkspcPath = Path.of("/tmp/tempdb/");
|
|
|
|
return Mono
|
|
|
|
.fromCallable(() -> {
|
|
|
|
if (delete && Files.exists(wrkspcPath)) {
|
|
|
|
Files.walk(wrkspcPath).sorted(Comparator.reverseOrder()).forEach(file -> {
|
|
|
|
try {
|
|
|
|
Files.delete(file);
|
|
|
|
} catch (IOException ex) {
|
|
|
|
throw new CompletionException(ex);
|
|
|
|
}
|
|
|
|
});
|
|
|
|
}
|
|
|
|
Files.createDirectories(wrkspcPath);
|
|
|
|
return null;
|
|
|
|
})
|
|
|
|
.subscribeOn(Schedulers.boundedElastic())
|
|
|
|
.then(new LLLocalDatabaseConnection(wrkspcPath, true).connect())
|
|
|
|
.flatMap(conn -> conn.getLuceneIndex("testindices",
|
2021-02-04 22:42:57 +01:00
|
|
|
10,
|
2021-02-06 19:21:31 +01:00
|
|
|
TextFieldsAnalyzer.N4GramPartialString,
|
2021-02-04 22:42:57 +01:00
|
|
|
TextFieldsSimilarity.NGramBM25Plus,
|
2021-02-03 13:48:30 +01:00
|
|
|
Duration.ofSeconds(5),
|
|
|
|
Duration.ofSeconds(5),
|
|
|
|
false
|
|
|
|
));
|
|
|
|
}
|
|
|
|
}
|