mirror of
https://github.com/quickwit-oss/tantivy.git
synced 2026-01-13 04:22:54 +00:00
219 lines
6.8 KiB
Rust
219 lines
6.8 KiB
Rust
use serde::{Deserialize, Serialize};
|
|
|
|
use super::ip_options::IpAddrOptions;
|
|
use crate::schema::bytes_options::BytesOptions;
|
|
use crate::schema::{
|
|
is_valid_field_name, DateOptions, FacetOptions, FieldType, JsonObjectOptions, NumericOptions,
|
|
TextOptions,
|
|
};
|
|
|
|
/// A `FieldEntry` represents a field and its configuration.
|
|
/// `Schema` are a collection of `FieldEntry`
|
|
///
|
|
/// It consists of
|
|
/// - a field name
|
|
/// - a field type, itself wrapping up options describing
|
|
/// how the field should be indexed.
|
|
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
|
|
pub struct FieldEntry {
|
|
name: String,
|
|
#[serde(flatten)]
|
|
field_type: FieldType,
|
|
}
|
|
|
|
impl FieldEntry {
|
|
/// Creates a new field entry given a name and a field type
|
|
pub fn new(field_name: String, field_type: FieldType) -> FieldEntry {
|
|
assert!(is_valid_field_name(&field_name));
|
|
FieldEntry {
|
|
name: field_name,
|
|
field_type,
|
|
}
|
|
}
|
|
|
|
/// Creates a new text field entry.
|
|
pub fn new_text(field_name: String, text_options: TextOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::Str(text_options))
|
|
}
|
|
|
|
/// Creates a new u64 field entry.
|
|
pub fn new_u64(field_name: String, int_options: NumericOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::U64(int_options))
|
|
}
|
|
|
|
/// Creates a new i64 field entry.
|
|
pub fn new_i64(field_name: String, int_options: NumericOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::I64(int_options))
|
|
}
|
|
|
|
/// Creates a new f64 field entry.
|
|
pub fn new_f64(field_name: String, f64_options: NumericOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::F64(f64_options))
|
|
}
|
|
|
|
/// Creates a new bool field entry.
|
|
pub fn new_bool(field_name: String, bool_options: NumericOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::Bool(bool_options))
|
|
}
|
|
|
|
/// Creates a new date field entry.
|
|
pub fn new_date(field_name: String, date_options: DateOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::Date(date_options))
|
|
}
|
|
|
|
/// Creates a new ip address field entry.
|
|
pub fn new_ip_addr(field_name: String, ip_options: IpAddrOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::IpAddr(ip_options))
|
|
}
|
|
|
|
/// Creates a field entry for a facet.
|
|
pub fn new_facet(field_name: String, facet_options: FacetOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::Facet(facet_options))
|
|
}
|
|
|
|
/// Creates a field entry for a bytes field
|
|
pub fn new_bytes(field_name: String, bytes_options: BytesOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::Bytes(bytes_options))
|
|
}
|
|
|
|
/// Creates a field entry for a json field
|
|
pub fn new_json(field_name: String, json_object_options: JsonObjectOptions) -> FieldEntry {
|
|
Self::new(field_name, FieldType::JsonObject(json_object_options))
|
|
}
|
|
|
|
/// Returns the name of the field
|
|
pub fn name(&self) -> &str {
|
|
&self.name
|
|
}
|
|
|
|
/// Returns the field type
|
|
pub fn field_type(&self) -> &FieldType {
|
|
&self.field_type
|
|
}
|
|
|
|
/// Returns true if the field is indexed.
|
|
///
|
|
/// An indexed field is searchable.
|
|
pub fn is_indexed(&self) -> bool {
|
|
self.field_type.is_indexed()
|
|
}
|
|
|
|
/// Returns true if the field is normed
|
|
pub fn has_fieldnorms(&self) -> bool {
|
|
self.field_type.has_fieldnorms()
|
|
}
|
|
|
|
/// Returns true if the field is a fast field
|
|
pub fn is_fast(&self) -> bool {
|
|
self.field_type.is_fast()
|
|
}
|
|
|
|
/// Returns true if the field has the expand dots option set (for json fields)
|
|
pub fn is_expand_dots_enabled(&self) -> bool {
|
|
match self.field_type {
|
|
FieldType::JsonObject(ref options) => options.is_expand_dots_enabled(),
|
|
_ => false,
|
|
}
|
|
}
|
|
|
|
/// Returns true if the field is stored
|
|
#[inline]
|
|
pub fn is_stored(&self) -> bool {
|
|
match self.field_type {
|
|
FieldType::U64(ref options)
|
|
| FieldType::I64(ref options)
|
|
| FieldType::F64(ref options)
|
|
| FieldType::Bool(ref options) => options.is_stored(),
|
|
FieldType::Date(ref options) => options.is_stored(),
|
|
FieldType::Str(ref options) => options.is_stored(),
|
|
FieldType::Facet(ref options) => options.is_stored(),
|
|
FieldType::Bytes(ref options) => options.is_stored(),
|
|
FieldType::JsonObject(ref options) => options.is_stored(),
|
|
FieldType::IpAddr(ref options) => options.is_stored(),
|
|
}
|
|
}
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
|
|
use super::*;
|
|
use crate::schema::{Schema, TextFieldIndexing, TEXT};
|
|
use crate::Index;
|
|
|
|
#[test]
|
|
#[should_panic]
|
|
fn test_invalid_field_name_should_panic() {
|
|
FieldEntry::new_text("-hello".to_string(), TEXT);
|
|
}
|
|
|
|
#[test]
|
|
fn test_json_serialization() {
|
|
let field_value = FieldEntry::new_text(String::from("title"), TEXT);
|
|
|
|
let expected = r#"{
|
|
"name": "title",
|
|
"type": "text",
|
|
"options": {
|
|
"indexing": {
|
|
"record": "position",
|
|
"fieldnorms": true,
|
|
"tokenizer": "default"
|
|
},
|
|
"stored": false,
|
|
"fast": false
|
|
}
|
|
}"#;
|
|
let field_value_json = serde_json::to_string_pretty(&field_value).unwrap();
|
|
|
|
assert_eq!(expected, &field_value_json);
|
|
|
|
let field_value: FieldEntry = serde_json::from_str(expected).unwrap();
|
|
|
|
assert_eq!("title", field_value.name);
|
|
|
|
match field_value.field_type {
|
|
FieldType::Str(_) => {}
|
|
_ => panic!("expected FieldType::Str"),
|
|
}
|
|
}
|
|
|
|
#[test]
|
|
fn test_json_deserialization() {
|
|
let json_str = r#"{
|
|
"name": "title",
|
|
"options": {
|
|
"indexing": {
|
|
"record": "position",
|
|
"fieldnorms": true,
|
|
"tokenizer": "default"
|
|
},
|
|
"stored": false
|
|
},
|
|
"type": "text"
|
|
}"#;
|
|
let field_entry: FieldEntry = serde_json::from_str(json_str).unwrap();
|
|
match field_entry.field_type {
|
|
FieldType::Str(_) => {}
|
|
_ => panic!("expected FieldType::Str"),
|
|
}
|
|
}
|
|
|
|
#[test]
|
|
fn test_missing_fieldnorms() -> crate::Result<()> {
|
|
let mut schema_builder = Schema::builder();
|
|
let no_field_norm = TextOptions::default()
|
|
.set_indexing_options(TextFieldIndexing::default().set_fieldnorms(false));
|
|
let text = schema_builder.add_text_field("text", no_field_norm);
|
|
let schema = schema_builder.build();
|
|
let index = Index::create_in_ram(schema);
|
|
let mut index_writer = index.writer_for_tests()?;
|
|
index_writer.add_document(doc!(text=>"abc"))?;
|
|
index_writer.commit()?;
|
|
let searcher = index.reader()?.searcher();
|
|
let err = searcher.segment_reader(0u32).get_fieldnorms_reader(text);
|
|
assert!(matches!(err, Err(crate::TantivyError::SchemaError(_))));
|
|
Ok(())
|
|
}
|
|
}
|