You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

50 lines
1.8KB

  1. use clap::ArgMatches;
  2. use serde_json;
  3. use std::convert::From;
  4. use std::path::Path;
  5. use std::path::PathBuf;
  6. use tantivy;
  7. use tantivy::query::QueryParser;
  8. use tantivy::schema::Field;
  9. use tantivy::schema::FieldType;
  10. use tantivy::Index;
  11. pub fn run_search_cli(matches: &ArgMatches) -> Result<(), String> {
  12. let index_directory = PathBuf::from(matches.value_of("index").unwrap());
  13. let query = matches.value_of("query").unwrap();
  14. run_search(&index_directory, &query).map_err(|e| format!("{:?}", e))
  15. }
  16. fn run_search(directory: &Path, query: &str) -> tantivy::Result<()> {
  17. let index = Index::open_in_dir(directory)?;
  18. let schema = index.schema();
  19. let default_fields: Vec<Field> = schema
  20. .fields()
  21. .iter()
  22. .enumerate()
  23. .filter(|&(_, ref field_entry)| match *field_entry.field_type() {
  24. FieldType::Str(ref text_field_options) => {
  25. text_field_options.get_indexing_options().is_some()
  26. }
  27. _ => false,
  28. })
  29. .map(|(i, _)| Field(i as u32))
  30. .collect();
  31. let query_parser = QueryParser::new(schema.clone(), default_fields, index.tokenizers().clone());
  32. let query = query_parser.parse_query(query)?;
  33. let searcher = index.reader()?.searcher();
  34. let weight = query.weight(&searcher, false)?;
  35. let schema = index.schema();
  36. for segment_reader in searcher.segment_readers() {
  37. let mut scorer = weight.scorer(segment_reader)?;
  38. let store_reader = segment_reader.get_store_reader();
  39. while scorer.advance() {
  40. let doc_id = scorer.doc();
  41. let doc = store_reader.get(doc_id)?;
  42. let named_doc = schema.to_named_doc(&doc);
  43. println!("{}", serde_json::to_string(&named_doc).unwrap());
  44. }
  45. }
  46. Ok(())
  47. }