use std::fmt; use serde::de::Visitor; use serde::{Deserialize, Deserializer, Serialize, Serializer}; use serde_json::Map; use crate::schema::Facet; use crate::tokenizer::PreTokenizedString; use crate::DateTime; /// Value represents the value of a any field. /// It is an enum over all over all of the possible field type. #[derive(Debug, Clone, PartialEq)] pub enum Value { /// The str type is used for any text information. Str(String), /// Pre-tokenized str type, PreTokStr(PreTokenizedString), /// Unsigned 64-bits Integer `u64` U64(u64), /// Signed 64-bits Integer `i64` I64(i64), /// 64-bits Float `f64` F64(f64), /// Bool value Bool(bool), /// Date/time with microseconds precision Date(DateTime), /// Facet Facet(Facet), /// Arbitrarily sized byte array Bytes(Vec), /// Json object value. JsonObject(serde_json::Map), } impl Eq for Value {} impl Serialize for Value { fn serialize(&self, serializer: S) -> Result where S: Serializer { match *self { Value::Str(ref v) => serializer.serialize_str(v), Value::PreTokStr(ref v) => v.serialize(serializer), Value::U64(u) => serializer.serialize_u64(u), Value::I64(u) => serializer.serialize_i64(u), Value::F64(u) => serializer.serialize_f64(u), Value::Bool(b) => serializer.serialize_bool(b), Value::Date(ref date) => time::serde::rfc3339::serialize(&date.into_utc(), serializer), Value::Facet(ref facet) => facet.serialize(serializer), Value::Bytes(ref bytes) => serializer.serialize_bytes(bytes), Value::JsonObject(ref obj) => obj.serialize(serializer), } } } impl<'de> Deserialize<'de> for Value { fn deserialize(deserializer: D) -> Result where D: Deserializer<'de> { struct ValueVisitor; impl<'de> Visitor<'de> for ValueVisitor { type Value = Value; fn expecting(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result { formatter.write_str("a string or u32") } fn visit_i64(self, v: i64) -> Result { Ok(Value::I64(v)) } fn visit_u64(self, v: u64) -> Result { Ok(Value::U64(v)) } fn visit_f64(self, v: f64) -> Result { Ok(Value::F64(v)) } fn visit_bool(self, v: bool) -> Result { Ok(Value::Bool(v)) } fn visit_str(self, v: &str) -> Result { Ok(Value::Str(v.to_owned())) } fn visit_string(self, v: String) -> Result { Ok(Value::Str(v)) } } deserializer.deserialize_any(ValueVisitor) } } impl Value { /// Returns the text value, provided the value is of the `Str` type. /// (Returns `None` if the value is not of the `Str` type). pub fn as_text(&self) -> Option<&str> { if let Value::Str(text) = self { Some(text) } else { None } } /// Returns the facet value, provided the value is of the `Facet` type. /// (Returns `None` if the value is not of the `Facet` type). pub fn as_facet(&self) -> Option<&Facet> { if let Value::Facet(facet) = self { Some(facet) } else { None } } /// Returns the tokenized text, provided the value is of the `PreTokStr` type. /// (Returns `None` if the value is not of the `PreTokStr` type.) pub fn tokenized_text(&self) -> Option<&PreTokenizedString> { if let Value::PreTokStr(tokenized_text) = self { Some(tokenized_text) } else { None } } /// Returns the u64-value, provided the value is of the `U64` type. /// (Returns `None` if the value is not of the `U64` type) pub fn as_u64(&self) -> Option { if let Value::U64(val) = self { Some(*val) } else { None } } /// Returns the i64-value, provided the value is of the `I64` type. /// /// Returns `None` if the value is not of type `I64`. pub fn as_i64(&self) -> Option { if let Value::I64(val) = self { Some(*val) } else { None } } /// Returns the f64-value, provided the value is of the `F64` type. /// /// Returns `None` if the value is not of type `F64`. pub fn as_f64(&self) -> Option { if let Value::F64(value) = self { Some(*value) } else { None } } /// Returns the bool value, provided the value is of the `Bool` type. /// /// Returns `None` if the value is not of type `Bool`. pub fn as_bool(&self) -> Option { if let Value::Bool(value) = self { Some(*value) } else { None } } /// Returns the Date-value, provided the value is of the `Date` type. /// /// Returns `None` if the value is not of type `Date`. pub fn as_date(&self) -> Option { if let Value::Date(date) = self { Some(*date) } else { None } } /// Returns the Bytes-value, provided the value is of the `Bytes` type. /// /// Returns `None` if the value is not of type `Bytes`. pub fn as_bytes(&self) -> Option<&[u8]> { if let Value::Bytes(bytes) = self { Some(bytes) } else { None } } /// Returns the json object, provided the value is of the `JsonObject` type. /// /// Returns `None` if the value is not of type `JsonObject`. pub fn as_json(&self) -> Option<&Map> { if let Value::JsonObject(json) = self { Some(json) } else { None } } } impl From for Value { fn from(s: String) -> Value { Value::Str(s) } } impl From for Value { fn from(v: u64) -> Value { Value::U64(v) } } impl From for Value { fn from(v: i64) -> Value { Value::I64(v) } } impl From for Value { fn from(v: f64) -> Value { Value::F64(v) } } impl From for Value { fn from(b: bool) -> Self { Value::Bool(b) } } impl From for Value { fn from(dt: DateTime) -> Value { Value::Date(dt) } } impl<'a> From<&'a str> for Value { fn from(s: &'a str) -> Value { Value::Str(s.to_string()) } } impl<'a> From<&'a [u8]> for Value { fn from(bytes: &'a [u8]) -> Value { Value::Bytes(bytes.to_vec()) } } impl From for Value { fn from(facet: Facet) -> Value { Value::Facet(facet) } } impl From> for Value { fn from(bytes: Vec) -> Value { Value::Bytes(bytes) } } impl From for Value { fn from(pretokenized_string: PreTokenizedString) -> Value { Value::PreTokStr(pretokenized_string) } } impl From> for Value { fn from(json_object: serde_json::Map) -> Value { Value::JsonObject(json_object) } } impl From for Value { fn from(json_value: serde_json::Value) -> Value { match json_value { serde_json::Value::Object(json_object) => Value::JsonObject(json_object), _ => { panic!("Expected a json object."); } } } } mod binary_serialize { use std::io::{self, Read, Write}; use common::{f64_to_u64, u64_to_f64, BinarySerializable}; use super::Value; use crate::schema::Facet; use crate::tokenizer::PreTokenizedString; use crate::DateTime; const TEXT_CODE: u8 = 0; const U64_CODE: u8 = 1; const I64_CODE: u8 = 2; const HIERARCHICAL_FACET_CODE: u8 = 3; const BYTES_CODE: u8 = 4; const DATE_CODE: u8 = 5; const F64_CODE: u8 = 6; const EXT_CODE: u8 = 7; const JSON_OBJ_CODE: u8 = 8; const BOOL_CODE: u8 = 9; // extended types const TOK_STR_CODE: u8 = 0; impl BinarySerializable for Value { fn serialize(&self, writer: &mut W) -> io::Result<()> { match *self { Value::Str(ref text) => { TEXT_CODE.serialize(writer)?; text.serialize(writer) } Value::PreTokStr(ref tok_str) => { EXT_CODE.serialize(writer)?; TOK_STR_CODE.serialize(writer)?; if let Ok(text) = serde_json::to_string(tok_str) { text.serialize(writer) } else { Err(io::Error::new( io::ErrorKind::Other, "Failed to dump Value::PreTokStr(_) to json.", )) } } Value::U64(ref val) => { U64_CODE.serialize(writer)?; val.serialize(writer) } Value::I64(ref val) => { I64_CODE.serialize(writer)?; val.serialize(writer) } Value::F64(ref val) => { F64_CODE.serialize(writer)?; f64_to_u64(*val).serialize(writer) } Value::Bool(ref val) => { BOOL_CODE.serialize(writer)?; val.serialize(writer) } Value::Date(ref val) => { DATE_CODE.serialize(writer)?; let DateTime { timestamp_micros, .. } = val; timestamp_micros.serialize(writer) } Value::Facet(ref facet) => { HIERARCHICAL_FACET_CODE.serialize(writer)?; facet.serialize(writer) } Value::Bytes(ref bytes) => { BYTES_CODE.serialize(writer)?; bytes.serialize(writer) } Value::JsonObject(ref map) => { JSON_OBJ_CODE.serialize(writer)?; serde_json::to_writer(writer, &map)?; Ok(()) } } } fn deserialize(reader: &mut R) -> io::Result { let type_code = u8::deserialize(reader)?; match type_code { TEXT_CODE => { let text = String::deserialize(reader)?; Ok(Value::Str(text)) } U64_CODE => { let value = u64::deserialize(reader)?; Ok(Value::U64(value)) } I64_CODE => { let value = i64::deserialize(reader)?; Ok(Value::I64(value)) } F64_CODE => { let value = u64_to_f64(u64::deserialize(reader)?); Ok(Value::F64(value)) } BOOL_CODE => { let value = bool::deserialize(reader)?; Ok(Value::Bool(value)) } DATE_CODE => { let timestamp_micros = i64::deserialize(reader)?; Ok(Value::Date(DateTime::from_timestamp_micros( timestamp_micros, ))) } HIERARCHICAL_FACET_CODE => Ok(Value::Facet(Facet::deserialize(reader)?)), BYTES_CODE => Ok(Value::Bytes(Vec::::deserialize(reader)?)), EXT_CODE => { let ext_type_code = u8::deserialize(reader)?; match ext_type_code { TOK_STR_CODE => { let str_val = String::deserialize(reader)?; if let Ok(value) = serde_json::from_str::(&str_val) { Ok(Value::PreTokStr(value)) } else { Err(io::Error::new( io::ErrorKind::Other, "Failed to parse string data as Value::PreTokStr(_).", )) } } _ => Err(io::Error::new( io::ErrorKind::InvalidData, format!( "No extended field type is associated with code {:?}", ext_type_code ), )), } } JSON_OBJ_CODE => { // As explained in // https://docs.serde.rs/serde_json/fn.from_reader.html // // `T::from_reader(..)` expects EOF after reading the object, // which is not what we want here. // // For this reason we need to create our own `Deserializer`. let mut de = serde_json::Deserializer::from_reader(reader); let json_map = as serde::Deserialize>::deserialize(&mut de)?; Ok(Value::JsonObject(json_map)) } _ => Err(io::Error::new( io::ErrorKind::InvalidData, format!("No field type is associated with code {:?}", type_code), )), } } } } #[cfg(test)] mod tests { use super::Value; use crate::time::format_description::well_known::Rfc3339; use crate::time::OffsetDateTime; use crate::DateTime; #[test] fn test_serialize_date() { let value = Value::from(DateTime::from_utc( OffsetDateTime::parse("1996-12-20T00:39:57+00:00", &Rfc3339).unwrap(), )); let serialized_value_json = serde_json::to_string_pretty(&value).unwrap(); assert_eq!(serialized_value_json, r#""1996-12-20T00:39:57Z""#); let value = Value::from(DateTime::from_utc( OffsetDateTime::parse("1996-12-20T00:39:57-01:00", &Rfc3339).unwrap(), )); let serialized_value_json = serde_json::to_string_pretty(&value).unwrap(); // The time zone information gets lost by conversion into `Value::Date` and // implicitly becomes UTC. assert_eq!(serialized_value_json, r#""1996-12-20T01:39:57Z""#); } }