use crate::sparql::algebra::QueryDataset; use crate::sparql::EvaluationError; use crate::store::numeric_encoder::{ EncodedQuad, EncodedTerm, ReadEncoder, StrContainer, StrEncodingAware, StrHash, StrId, StrLookup, }; use crate::store::ReadableEncodedStore; use std::cell::RefCell; use std::collections::HashMap; use std::iter::{empty, once, Once}; pub(crate) struct DatasetView { store: S, extra: RefCell>, dataset: EncodedDatasetSpec, } impl DatasetView { pub fn new(store: S, dataset: &QueryDataset) -> Result { let dataset = EncodedDatasetSpec { default: dataset .default_graph_graphs() .map(|graphs| { graphs .iter() .flat_map(|g| store.get_encoded_graph_name(g.as_ref()).transpose()) .collect::, _>>() }) .transpose() .map_err(|e| e.into())?, named: dataset .available_named_graphs() .map(|graphs| { graphs .iter() .flat_map(|g| { store .get_encoded_named_or_blank_node(g.as_ref()) .transpose() }) .collect::, _>>() }) .transpose() .map_err(|e| e.into())?, }; Ok(Self { store, extra: RefCell::new(HashMap::default()), dataset, }) } #[allow(clippy::needless_collect)] fn encoded_quads_for_pattern_in_dataset( &self, subject: Option>, predicate: Option>, object: Option>, graph_name: Option>, ) -> Box>, EvaluationError>>> { if let Some(graph_name) = graph_name { if graph_name.is_default_graph() { if let Some(default_graph_graphs) = &self.dataset.default { if default_graph_graphs.len() == 1 { // Single graph optimization Box::new( map_iter(self.store.encoded_quads_for_pattern( subject, predicate, object, Some(default_graph_graphs[0]), )) .map(|quad| { let quad = quad?; Ok(EncodedQuad::new( quad.subject, quad.predicate, quad.object, EncodedTerm::DefaultGraph, )) }), ) } else { let iters = default_graph_graphs .iter() .map(|graph_name| { self.store.encoded_quads_for_pattern( subject, predicate, object, Some(*graph_name), ) }) .collect::>(); Box::new(map_iter(iters.into_iter().flatten()).map(|quad| { let quad = quad?; Ok(EncodedQuad::new( quad.subject, quad.predicate, quad.object, EncodedTerm::DefaultGraph, )) })) } } else { Box::new(map_iter( self.store .encoded_quads_for_pattern(subject, predicate, object, None), )) } } else if self .dataset .named .as_ref() .map_or(true, |d| d.contains(&graph_name)) { Box::new(map_iter(self.store.encoded_quads_for_pattern( subject, predicate, object, Some(graph_name), ))) } else { Box::new(empty()) } } else if let Some(named_graphs) = &self.dataset.named { let iters = named_graphs .iter() .map(|graph_name| { self.store.encoded_quads_for_pattern( subject, predicate, object, Some(*graph_name), ) }) .collect::>(); Box::new(map_iter(iters.into_iter().flatten())) } else { Box::new( map_iter( self.store .encoded_quads_for_pattern(subject, predicate, object, None), ) .filter(|quad| match quad { Err(_) => true, Ok(quad) => quad.graph_name != EncodedTerm::DefaultGraph, }), ) } } } impl StrEncodingAware for DatasetView { type Error = EvaluationError; type StrId = DatasetStrId; } impl StrLookup for DatasetView { fn get_str(&self, id: DatasetStrId) -> Result, EvaluationError> { match id { DatasetStrId::Store(id) => self.store.get_str(id).map_err(|e| e.into()), DatasetStrId::Temporary(id) => Ok(self.extra.borrow().get(&id).cloned()), } } fn get_str_id(&self, value: &str) -> Result>, EvaluationError> { let id = StrHash::new(value); if self.extra.borrow().contains_key(&id) { Ok(Some(DatasetStrId::Temporary(id))) } else { Ok(self .store .get_str_id(value) .map_err(|e| e.into())? .map(DatasetStrId::Store)) } } } impl ReadableEncodedStore for DatasetView { type QuadsIter = Box>, EvaluationError>>>; type GraphsIter = Once>, EvaluationError>>; fn encoded_quads_for_pattern( &self, subject: Option>, predicate: Option>, object: Option>, graph_name: Option>, ) -> Box>, EvaluationError>>> { if let Some((subject, predicate, object, graph_name)) = try_map_quad_pattern(subject, predicate, object, graph_name) { self.encoded_quads_for_pattern_in_dataset(subject, predicate, object, graph_name) } else { Box::new(empty()) } } fn encoded_named_graphs(&self) -> Self::GraphsIter { once(Err(EvaluationError::msg( "Graphs lookup is not implemented by DatasetView", ))) } fn contains_encoded_named_graph( &self, _: EncodedTerm, ) -> Result { Err(EvaluationError::msg( "Graphs lookup is not implemented by DatasetView", )) } } fn map_iter<'a, I: StrId>( iter: impl Iterator, impl Into>> + 'a, ) -> impl Iterator>, EvaluationError>> + 'a { iter.map(|t| { t.map(|q| EncodedQuad { subject: q.subject.map_id(DatasetStrId::Store), predicate: q.predicate.map_id(DatasetStrId::Store), object: q.object.map_id(DatasetStrId::Store), graph_name: q.graph_name.map_id(DatasetStrId::Store), }) .map_err(|e| e.into()) }) } type QuadPattern = ( Option>, Option>, Option>, Option>, ); fn try_map_quad_pattern( subject: Option>>, predicate: Option>>, object: Option>>, graph_name: Option>>, ) -> Option> { Some(( transpose(subject.map(|t| t.try_map_id(unwrap_store_id).ok()))?, transpose(predicate.map(|t| t.try_map_id(unwrap_store_id).ok()))?, transpose(object.map(|t| t.try_map_id(unwrap_store_id).ok()))?, transpose(graph_name.map(|t| t.try_map_id(unwrap_store_id).ok()))?, )) } fn transpose(o: Option>) -> Option> { match o { Some(Some(v)) => Some(Some(v)), Some(None) => None, None => Some(None), } } fn unwrap_store_id(id: DatasetStrId) -> Result { match id { DatasetStrId::Store(id) => Ok(id), DatasetStrId::Temporary(_) => Err(()), } } impl<'a, S: ReadableEncodedStore> StrContainer for &'a DatasetView { fn insert_str(&mut self, value: &str) -> Result { if let Some(id) = self.store.get_str_id(value).map_err(|e| e.into())? { Ok(DatasetStrId::Store(id)) } else { let hash = StrHash::new(value); self.extra .borrow_mut() .entry(hash) .or_insert_with(|| value.to_owned()); Ok(DatasetStrId::Temporary(hash)) } } } #[derive(Eq, PartialEq, Debug, Copy, Clone, Hash)] pub enum DatasetStrId { Store(I), Temporary(StrHash), } impl StrId for DatasetStrId {} struct EncodedDatasetSpec { default: Option>>, named: Option>>, }