#![allow(clippy::unreadable_literal)]

use crate::error::{invalid_data_error, Infallible};
use crate::model::xsd::*;
use crate::model::*;
use rand::random;
use rio_api::model as rio;
use siphasher::sip128::{Hasher128, SipHasher24};
use std::collections::HashMap;
use std::error::Error;
use std::hash::Hash;
use std::hash::Hasher;
use std::io::Read;
use std::mem::size_of;
use std::{fmt, io, str};

/// A 128-bit hash of a string, used as a fixed-size stand-in for that string.
#[derive(Ord, PartialOrd, Eq, PartialEq, Debug, Copy, Clone, Hash)]
#[repr(transparent)]
pub struct StrHash {
    hash: u128,
}

impl StrHash {
    /// Hashes the UTF-8 bytes of `value` with a `SipHasher24` created by
    /// `SipHasher24::new()` and keeps the full 128-bit result.
    pub fn new(value: &str) -> Self {
        let mut hasher = SipHasher24::new();
        hasher.write(value.as_bytes());
        Self {
            hash: hasher.finish128().into(),
        }
    }

    /// Rebuilds a hash from its 16-byte big-endian representation
    /// (the inverse of [`StrHash::to_be_bytes`]).
    #[inline]
    pub fn from_be_bytes(bytes: [u8; 16]) -> Self {
        Self {
            hash: u128::from_be_bytes(bytes),
        }
    }

    /// Returns the hash as 16 big-endian bytes.
    #[inline]
    pub fn to_be_bytes(&self) -> [u8; 16] {
        self.hash.to_be_bytes()
    }
}

// One-byte tags, one per kind of encoded term; `EncodedTerm::type_id` maps each
// variant to its tag (booleans get one tag per value).
// NOTE(review): presumably these are persisted by the serialization code, in
// which case the numeric values must stay stable — confirm before renumbering.
const TYPE_DEFAULT_GRAPH_ID: u8 = 0;
const TYPE_NAMED_NODE_ID: u8 = 1;
const TYPE_INLINE_BLANK_NODE_ID: u8 = 2;
const TYPE_NAMED_BLANK_NODE_ID: u8 = 3;
const TYPE_LANG_STRING_LITERAL_ID: u8 = 4;
const TYPE_TYPED_LITERAL_ID: u8 = 5;
const TYPE_STRING_LITERAL: u8 = 6;
const TYPE_BOOLEAN_LITERAL_TRUE: u8 = 7;
const TYPE_BOOLEAN_LITERAL_FALSE: u8 = 8;
const TYPE_FLOAT_LITERAL: u8 = 9;
const TYPE_DOUBLE_LITERAL: u8 = 10;
const TYPE_INTEGER_LITERAL: u8 = 11;
const TYPE_DECIMAL_LITERAL: u8 = 12;
const TYPE_DATE_TIME_LITERAL: u8 = 13;
const TYPE_DATE_LITERAL: u8 = 14;
const TYPE_TIME_LITERAL: u8 = 15;
const TYPE_DURATION_LITERAL: u8 = 16;
const TYPE_YEAR_MONTH_DURATION_LITERAL: u8 = 17;
const TYPE_DAY_TIME_DURATION_LITERAL: u8 = 18;

/// A compact, `Copy` representation of a term.
///
/// String-valued components are stored as [`StrHash`] values rather than as the
/// strings themselves; several literal kinds carry their value inline.
#[derive(Debug, Clone, Copy)]
pub enum EncodedTerm {
    /// The default graph.
    DefaultGraph,
    /// A named node, identified by the hash of its IRI.
    NamedNode {
        iri_id: StrHash,
    },
    /// A blank node whose identifier is stored inline as a 128-bit integer.
    InlineBlankNode {
        id: u128,
    },
    /// A blank node whose identifier is a string, stored as its hash.
    NamedBlankNode {
        id_id: StrHash,
    },
    /// A plain string literal; the value is stored as its hash.
    StringLiteral {
        value_id: StrHash,
    },
    /// A language-tagged string literal; value and language tag are stored as hashes.
    LangStringLiteral {
        value_id: StrHash,
        language_id: StrHash,
    },
    /// A literal with an explicit datatype; value and datatype are stored as hashes.
    TypedLiteral {
        value_id: StrHash,
        datatype_id: StrHash,
    },
    /// A boolean literal stored inline.
    BooleanLiteral(bool),
    /// A single-precision floating point literal stored inline.
    FloatLiteral(f32),
    /// A double-precision floating point literal stored inline.
    DoubleLiteral(f64),
    /// An integer literal stored inline.
    IntegerLiteral(i64),
    /// A decimal literal stored inline.
    DecimalLiteral(Decimal),
    /// A date literal stored inline.
    DateLiteral(Date),
    /// A time literal stored inline.
    TimeLiteral(Time),
    /// A date-time literal stored inline.
    DateTimeLiteral(DateTime),
    /// A duration literal stored inline.
    DurationLiteral(Duration),
    /// A year-month duration literal stored inline.
    YearMonthDurationLiteral(YearMonthDuration),
    /// A day-time duration literal stored inline.
    DayTimeDurationLiteral(DayTimeDuration),
}

/// Structural equality between terms of the same kind.
///
/// Terms of different kinds are never equal. Unlike IEEE 754 comparison, two
/// NaN floats (or doubles) compare equal here, which keeps the relation
/// reflexive so that `Eq` can be implemented.
impl PartialEq for EncodedTerm {
    fn eq(&self, other: &Self) -> bool {
        match (self, other) {
            (EncodedTerm::DefaultGraph, EncodedTerm::DefaultGraph) => true,
            (
                EncodedTerm::NamedNode { iri_id: iri_id_a },
                EncodedTerm::NamedNode { iri_id: iri_id_b },
            ) => iri_id_a == iri_id_b,
            (
                EncodedTerm::InlineBlankNode { id: id_a },
                EncodedTerm::InlineBlankNode { id: id_b },
            ) => id_a == id_b,
            (
                EncodedTerm::NamedBlankNode { id_id: id_a },
                EncodedTerm::NamedBlankNode { id_id: id_b },
            ) => id_a == id_b,
            (
                EncodedTerm::StringLiteral {
                    value_id: value_id_a,
                },
                EncodedTerm::StringLiteral {
                    value_id: value_id_b,
                },
            ) => value_id_a == value_id_b,
            (
                EncodedTerm::LangStringLiteral {
                    value_id: value_id_a,
                    language_id: language_id_a,
                },
                EncodedTerm::LangStringLiteral {
                    value_id: value_id_b,
                    language_id: language_id_b,
                },
            ) => value_id_a == value_id_b && language_id_a == language_id_b,
            (
                EncodedTerm::TypedLiteral {
                    value_id: value_id_a,
                    datatype_id: datatype_id_a,
                },
                EncodedTerm::TypedLiteral {
                    value_id: value_id_b,
                    datatype_id: datatype_id_b,
                },
            ) => value_id_a == value_id_b && datatype_id_a == datatype_id_b,
            (EncodedTerm::BooleanLiteral(a), EncodedTerm::BooleanLiteral(b)) => a == b,
            (EncodedTerm::FloatLiteral(a), EncodedTerm::FloatLiteral(b)) => {
                // Any NaN equals any other NaN; everything else uses `==`.
                if a.is_nan() {
                    b.is_nan()
                } else {
                    a == b
                }
            }
            (EncodedTerm::DoubleLiteral(a), EncodedTerm::DoubleLiteral(b)) => {
                // Same NaN rule as for floats.
                if a.is_nan() {
                    b.is_nan()
                } else {
                    a == b
                }
            }
            (EncodedTerm::IntegerLiteral(a), EncodedTerm::IntegerLiteral(b)) => a == b,
            (EncodedTerm::DecimalLiteral(a), EncodedTerm::DecimalLiteral(b)) => a == b,
            (EncodedTerm::DateLiteral(a), EncodedTerm::DateLiteral(b)) => a == b,
            (EncodedTerm::TimeLiteral(a), EncodedTerm::TimeLiteral(b)) => a == b,
            (EncodedTerm::DateTimeLiteral(a), EncodedTerm::DateTimeLiteral(b)) => a == b,
            (EncodedTerm::DurationLiteral(a), EncodedTerm::DurationLiteral(b)) => a == b,
            (
                EncodedTerm::YearMonthDurationLiteral(a),
                EncodedTerm::YearMonthDurationLiteral(b),
            ) => a == b,
            (EncodedTerm::DayTimeDurationLiteral(a), EncodedTerm::DayTimeDurationLiteral(b)) => {
                a == b
            }
            (_, _) => false,
        }
    }
}

impl Eq for EncodedTerm {}

/// Hashes only the payload of the term (the variant itself is not mixed in).
///
/// Floats and doubles are hashed through a canonical bit pattern so that values
/// which compare equal under `PartialEq` (all NaNs; `0.0` and `-0.0`) also hash
/// identically, as the `Hash`/`Eq` contract requires. All other floating point
/// values hash exactly the bytes returned by `to_ne_bytes`.
impl Hash for EncodedTerm {
    fn hash<H: Hasher>(&self, state: &mut H) {
        match self {
            EncodedTerm::NamedNode { iri_id } => iri_id.hash(state),
            EncodedTerm::InlineBlankNode { id } => id.hash(state),
            EncodedTerm::NamedBlankNode { id_id } => id_id.hash(state),
            EncodedTerm::DefaultGraph => (),
            EncodedTerm::StringLiteral { value_id } => value_id.hash(state),
            EncodedTerm::LangStringLiteral {
                value_id,
                language_id,
            } => {
                value_id.hash(state);
                language_id.hash(state);
            }
            EncodedTerm::TypedLiteral {
                value_id,
                datatype_id,
            } => {
                value_id.hash(state);
                datatype_id.hash(state);
            }
            EncodedTerm::BooleanLiteral(value) => value.hash(state),
            EncodedTerm::FloatLiteral(value) => {
                let bits: u32 = if value.is_nan() {
                    // One fixed quiet-NaN pattern for every NaN payload/sign.
                    0x7fc0_0000
                } else if *value == 0.0 {
                    // `-0.0 == 0.0`, so both hash as positive zero.
                    0
                } else {
                    value.to_bits()
                };
                state.write(&bits.to_ne_bytes())
            }
            EncodedTerm::DoubleLiteral(value) => {
                let bits: u64 = if value.is_nan() {
                    // One fixed quiet-NaN pattern for every NaN payload/sign.
                    0x7ff8_0000_0000_0000
                } else if *value == 0.0 {
                    // `-0.0 == 0.0`, so both hash as positive zero.
                    0
                } else {
                    value.to_bits()
                };
                state.write(&bits.to_ne_bytes())
            }
            EncodedTerm::IntegerLiteral(value) => value.hash(state),
            EncodedTerm::DecimalLiteral(value) => value.hash(state),
            EncodedTerm::DateLiteral(value) => value.hash(state),
            EncodedTerm::TimeLiteral(value) => value.hash(state),
            EncodedTerm::DateTimeLiteral(value) => value.hash(state),
            EncodedTerm::DurationLiteral(value) => value.hash(state),
            EncodedTerm::YearMonthDurationLiteral(value) => value.hash(state),
            EncodedTerm::DayTimeDurationLiteral(value) => value.hash(state),
        }
    }
}

impl EncodedTerm {
    /// Returns `true` if this term is a named node.
    pub fn is_named_node(&self) -> bool {
        match self {
            EncodedTerm::NamedNode { .. } => true,
            _ => false,
        }
    }

    /// Returns `true` if this term is a blank node (inline or named).
    pub fn is_blank_node(&self) -> bool {
        match self {
            EncodedTerm::InlineBlankNode { .. } | EncodedTerm::NamedBlankNode { .. } => true,
            _ => false,
        }
    }

    /// Returns `true` if this term is any kind of literal.
    pub fn is_literal(&self) -> bool {
        match self {
            EncodedTerm::StringLiteral { .. }
            | EncodedTerm::LangStringLiteral { .. }
            | EncodedTerm::TypedLiteral { .. }
            | EncodedTerm::BooleanLiteral(_)
            | EncodedTerm::FloatLiteral(_)
            | EncodedTerm::DoubleLiteral(_)
            | EncodedTerm::IntegerLiteral(_)
            | EncodedTerm::DecimalLiteral(_)
            | EncodedTerm::DateLiteral(_)
            | EncodedTerm::TimeLiteral(_)
            | EncodedTerm::DateTimeLiteral(_)
            | EncodedTerm::DurationLiteral(_)
            | EncodedTerm::YearMonthDurationLiteral(_)
            | EncodedTerm::DayTimeDurationLiteral(_) => true,
            _ => false,
        }
    }

    /// Returns the one-byte `TYPE_*` tag for this term's kind.
    ///
    /// Boolean literals map to two different tags, one for `true` and one for
    /// `false`. The match is exhaustive on purpose: adding a variant without a
    /// tag is a compile error.
    fn type_id(&self) -> u8 {
        match self {
            EncodedTerm::DefaultGraph { .. } => TYPE_DEFAULT_GRAPH_ID,
            EncodedTerm::NamedNode { .. } => TYPE_NAMED_NODE_ID,
            EncodedTerm::InlineBlankNode { .. } => TYPE_INLINE_BLANK_NODE_ID,
            EncodedTerm::NamedBlankNode { .. } => TYPE_NAMED_BLANK_NODE_ID,
            EncodedTerm::StringLiteral { .. } => TYPE_STRING_LITERAL,
            EncodedTerm::LangStringLiteral { .. } => TYPE_LANG_STRING_LITERAL_ID,
            EncodedTerm::TypedLiteral { .. } => TYPE_TYPED_LITERAL_ID,
            EncodedTerm::BooleanLiteral(true) => TYPE_BOOLEAN_LITERAL_TRUE,
            EncodedTerm::BooleanLiteral(false) => TYPE_BOOLEAN_LITERAL_FALSE,
            EncodedTerm::FloatLiteral(_) => TYPE_FLOAT_LITERAL,
            EncodedTerm::DoubleLiteral(_) => TYPE_DOUBLE_LITERAL,
            EncodedTerm::IntegerLiteral(_) => TYPE_INTEGER_LITERAL,
            EncodedTerm::DecimalLiteral(_) => TYPE_DECIMAL_LITERAL,
            EncodedTerm::DateLiteral(_) => TYPE_DATE_LITERAL,
            EncodedTerm::TimeLiteral(_) => TYPE_TIME_LITERAL,
            EncodedTerm::DateTimeLiteral(_) => TYPE_DATE_TIME_LITERAL,
            EncodedTerm::DurationLiteral(_) => TYPE_DURATION_LITERAL,
            EncodedTerm::YearMonthDurationLiteral(_) => TYPE_YEAR_MONTH_DURATION_LITERAL,
            EncodedTerm::DayTimeDurationLiteral(_) => TYPE_DAY_TIME_DURATION_LITERAL,
        }
    }
}

/// Wraps a `bool` as a boolean literal.
impl From<bool> for EncodedTerm {
    fn from(value: bool) -> Self {
        EncodedTerm::BooleanLiteral(value)
    }
}

/// Wraps an `i64` as an integer literal.
impl From<i64> for EncodedTerm {
    fn from(value: i64) -> Self {
        EncodedTerm::IntegerLiteral(value)
    }
}

/// Widens an `i32` to `i64` and wraps it as an integer literal.
impl From<i32> for EncodedTerm {
    fn from(value: i32) -> Self {
        EncodedTerm::IntegerLiteral(value.into())
    }
}

/// Widens a `u32` to `i64` and wraps it as an integer literal.
impl From<u32> for EncodedTerm {
    fn from(value: u32) -> Self {
        EncodedTerm::IntegerLiteral(value.into())
    }
}

/// Widens a `u8` to `i64` and wraps it as an integer literal.
impl From<u8> for EncodedTerm {
    fn from(value: u8) -> Self {
        EncodedTerm::IntegerLiteral(value.into())
    }
}

/// Wraps an `f32` as a float literal.
impl From<f32> for EncodedTerm {
    fn from(value: f32) -> Self {
        EncodedTerm::FloatLiteral(value)
    }
}

/// Wraps an `f64` as a double literal.
impl From<f64> for EncodedTerm {
    fn from(value: f64) -> Self {
        EncodedTerm::DoubleLiteral(value)
    }
}

/// Wraps a `Decimal` as a decimal literal.
impl From<Decimal> for EncodedTerm {
    fn from(value: Decimal) -> Self {
        EncodedTerm::DecimalLiteral(value)
    }
}

/// Wraps a `Date` as a date literal.
impl From<Date> for EncodedTerm {
    fn from(value: Date) -> Self {
        EncodedTerm::DateLiteral(value)
    }
}

impl From