mirror of
https://github.com/AppFlowy-IO/AppFlowy.git
synced 2024-08-30 18:12:39 +00:00
54 lines
1.7 KiB
Rust
54 lines
1.7 KiB
Rust
|
use tantivy::collector::TopDocs;
|
||
|
use tantivy::query::QueryParser;
|
||
|
use tantivy::schema::*;
|
||
|
use tantivy::{doc, DocAddress, Index, Score};
|
||
|
|
||
|
#[test]
|
||
|
fn search_folder_test() {
|
||
|
let mut schema_builder = Schema::builder();
|
||
|
let id = schema_builder.add_text_field("id", TEXT);
|
||
|
let title = schema_builder.add_text_field("title", TEXT | STORED);
|
||
|
let schema = schema_builder.build();
|
||
|
|
||
|
// Indexing documents
|
||
|
let index = Index::create_from_tempdir(schema.clone()).unwrap();
|
||
|
|
||
|
// Here we use a buffer of 100MB that will be split
|
||
|
// between indexing threads.
|
||
|
let mut index_writer = index.writer(100_000_000).unwrap();
|
||
|
|
||
|
// Let's index one documents!
|
||
|
index_writer
|
||
|
.add_document(doc!(
|
||
|
id => "123456789",
|
||
|
title => "The Old Man and the Seawhale",
|
||
|
))
|
||
|
.unwrap();
|
||
|
|
||
|
// We need to call .commit() explicitly to force the
|
||
|
// index_writer to finish processing the documents in the queue,
|
||
|
// flush the current index to the disk, and advertise
|
||
|
// the existence of new documents.
|
||
|
index_writer.commit().unwrap();
|
||
|
|
||
|
// # Searching
|
||
|
let reader = index.reader().unwrap();
|
||
|
|
||
|
let searcher = reader.searcher();
|
||
|
|
||
|
let mut query_parser = QueryParser::for_index(&index, vec![title]);
|
||
|
query_parser.set_field_fuzzy(title, true, 2, true);
|
||
|
let query = query_parser.parse_query("sewhals").unwrap();
|
||
|
|
||
|
// Perform search.
|
||
|
// `topdocs` contains the 10 most relevant doc ids, sorted by decreasing scores...
|
||
|
let top_docs: Vec<(Score, DocAddress)> =
|
||
|
searcher.search(&query, &TopDocs::with_limit(10)).unwrap();
|
||
|
|
||
|
for (_score, doc_address) in top_docs {
|
||
|
// Retrieve the actual content of documents given its `doc_address`.
|
||
|
let retrieved_doc = searcher.doc(doc_address).unwrap();
|
||
|
println!("{}", schema.to_json(&retrieved_doc));
|
||
|
}
|
||
|
}
|