You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

53 lines
1.8KB

  1. use clap::ArgMatches;
  2. use std::convert::From;
  3. use std::path::Path;
  4. use std::path::PathBuf;
  5. use tantivy;
  6. use tantivy::Index;
  7. use tantivy::query::QueryParser;
  8. use tantivy::schema::Field;
  9. use serde_json;
  10. use tantivy::schema::FieldType;
  11. pub fn run_search_cli(matches: &ArgMatches) -> Result<(), String> {
  12. let index_directory = PathBuf::from(matches.value_of("index").unwrap());
  13. let query = matches.value_of("query").unwrap();
  14. run_search(&index_directory, &query)
  15. .map_err(|e| format!("{:?}", e))
  16. }
  17. fn run_search(directory: &Path, query: &str) -> tantivy::Result<()> {
  18. let index = Index::open(directory)?;
  19. let schema = index.schema();
  20. let default_fields: Vec<Field> = schema
  21. .fields()
  22. .iter()
  23. .enumerate()
  24. .filter(
  25. |&(_, ref field_entry)|
  26. match *field_entry.field_type() {
  27. FieldType::Str(ref text_field_options) => {
  28. text_field_options.get_indexing_options().is_some()
  29. },
  30. _ => false
  31. }
  32. )
  33. .map(|(i, _)| Field(i as u32))
  34. .collect();
  35. let query_parser = QueryParser::new(schema.clone(), default_fields, index.tokenizers().clone());
  36. let query = query_parser.parse_query(query)?;
  37. let searcher = index.searcher();
  38. let weight = query.weight(&searcher, false)?;
  39. let schema = index.schema();
  40. for segment_reader in searcher.segment_readers() {
  41. let mut scorer = weight.scorer(segment_reader)?;
  42. while scorer.advance() {
  43. let doc_id = scorer.doc();
  44. let doc = segment_reader.doc(doc_id)?;
  45. let named_doc = schema.to_named_doc(&doc);
  46. println!("{}", serde_json::to_string(&named_doc).unwrap());
  47. }
  48. }
  49. Ok(())
  50. }