Files
tantivy/src/schema/field_entry.rs

204 lines
6.2 KiB
Rust

use serde::{Deserialize, Serialize};
use crate::schema::bytes_options::BytesOptions;
use crate::schema::{
is_valid_field_name, DateOptions, FacetOptions, FieldType, JsonObjectOptions, NumericOptions,
TextOptions,
};
/// A `FieldEntry` represents a field and its configuration.
/// `Schema` are a collection of `FieldEntry`
///
/// It consists of
/// - a field name
/// - a field type, itself wrapping up options describing
/// how the field should be indexed.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct FieldEntry {
name: String,
#[serde(flatten)]
field_type: FieldType,
}
impl FieldEntry {
/// Creates a new field entry given a name and a field type
pub fn new(field_name: String, field_type: FieldType) -> FieldEntry {
assert!(is_valid_field_name(&field_name));
FieldEntry {
name: field_name,
field_type,
}
}
/// Creates a new text field entry.
pub fn new_text(field_name: String, text_options: TextOptions) -> FieldEntry {
Self::new(field_name, FieldType::Str(text_options))
}
/// Creates a new u64 field entry.
pub fn new_u64(field_name: String, int_options: NumericOptions) -> FieldEntry {
Self::new(field_name, FieldType::U64(int_options))
}
/// Creates a new i64 field entry.
pub fn new_i64(field_name: String, int_options: NumericOptions) -> FieldEntry {
Self::new(field_name, FieldType::I64(int_options))
}
/// Creates a new f64 field entry.
pub fn new_f64(field_name: String, f64_options: NumericOptions) -> FieldEntry {
Self::new(field_name, FieldType::F64(f64_options))
}
/// Creates a new bool field entry.
pub fn new_bool(field_name: String, bool_options: NumericOptions) -> FieldEntry {
Self::new(field_name, FieldType::Bool(bool_options))
}
/// Creates a new date field entry.
pub fn new_date(field_name: String, date_options: DateOptions) -> FieldEntry {
Self::new(field_name, FieldType::Date(date_options))
}
/// Creates a field entry for a facet.
pub fn new_facet(field_name: String, facet_options: FacetOptions) -> FieldEntry {
Self::new(field_name, FieldType::Facet(facet_options))
}
/// Creates a field entry for a bytes field
pub fn new_bytes(field_name: String, bytes_options: BytesOptions) -> FieldEntry {
Self::new(field_name, FieldType::Bytes(bytes_options))
}
/// Creates a field entry for a json field
pub fn new_json(field_name: String, json_object_options: JsonObjectOptions) -> FieldEntry {
Self::new(field_name, FieldType::JsonObject(json_object_options))
}
/// Returns the name of the field
pub fn name(&self) -> &str {
&self.name
}
/// Returns the field type
pub fn field_type(&self) -> &FieldType {
&self.field_type
}
/// Returns true if the field is indexed.
///
/// An indexed field is searchable.
pub fn is_indexed(&self) -> bool {
self.field_type.is_indexed()
}
/// Returns true if the field is normed
pub fn has_fieldnorms(&self) -> bool {
self.field_type.has_fieldnorms()
}
/// Returns true if the field is a fast field
pub fn is_fast(&self) -> bool {
self.field_type.is_fast()
}
/// Returns true if the field is stored
pub fn is_stored(&self) -> bool {
match self.field_type {
FieldType::U64(ref options)
| FieldType::I64(ref options)
| FieldType::F64(ref options)
| FieldType::Bool(ref options) => options.is_stored(),
FieldType::Date(ref options) => options.is_stored(),
FieldType::Str(ref options) => options.is_stored(),
FieldType::Facet(ref options) => options.is_stored(),
FieldType::Bytes(ref options) => options.is_stored(),
FieldType::JsonObject(ref options) => options.is_stored(),
}
}
}
#[cfg(test)]
mod tests {
use serde_json;
use super::*;
use crate::schema::{Schema, TextFieldIndexing, TEXT};
use crate::Index;
#[test]
#[should_panic]
fn test_invalid_field_name_should_panic() {
FieldEntry::new_text("-hello".to_string(), TEXT);
}
#[test]
fn test_json_serialization() {
let field_value = FieldEntry::new_text(String::from("title"), TEXT);
let expected = r#"{
"name": "title",
"type": "text",
"options": {
"indexing": {
"record": "position",
"fieldnorms": true,
"tokenizer": "default"
},
"stored": false,
"fast": false
}
}"#;
let field_value_json = serde_json::to_string_pretty(&field_value).unwrap();
assert_eq!(expected, &field_value_json);
let field_value: FieldEntry = serde_json::from_str(expected).unwrap();
assert_eq!("title", field_value.name);
match field_value.field_type {
FieldType::Str(_) => {}
_ => panic!("expected FieldType::Str"),
}
}
#[test]
fn test_json_deserialization() {
let json_str = r#"{
"name": "title",
"options": {
"indexing": {
"record": "position",
"fieldnorms": true,
"tokenizer": "default"
},
"stored": false
},
"type": "text"
}"#;
let field_entry: FieldEntry = serde_json::from_str(json_str).unwrap();
match field_entry.field_type {
FieldType::Str(_) => {}
_ => panic!("expected FieldType::Str"),
}
}
#[test]
fn test_missing_fieldnorms() -> crate::Result<()> {
let mut schema_builder = Schema::builder();
let no_field_norm = TextOptions::default()
.set_indexing_options(TextFieldIndexing::default().set_fieldnorms(false));
let text = schema_builder.add_text_field("text", no_field_norm);
let schema = schema_builder.build();
let index = Index::create_in_ram(schema);
let mut index_writer = index.writer_for_tests()?;
index_writer.add_document(doc!(text=>"abc"))?;
index_writer.commit()?;
let searcher = index.reader()?.searcher();
let err = searcher.segment_reader(0u32).get_fieldnorms_reader(text);
assert!(matches!(err, Err(crate::TantivyError::SchemaError(_))));
Ok(())
}
}