|
|
|
use crate::sparql::algebra::QueryDataset;
|
|
|
|
use crate::sparql::EvaluationError;
|
|
|
|
use crate::store::numeric_encoder::{
|
|
|
|
EncodedQuad, EncodedTerm, ReadEncoder, StrContainer, StrEncodingAware, StrHash, StrId,
|
|
|
|
StrLookup,
|
|
|
|
};
|
|
|
|
use crate::store::ReadableEncodedStore;
|
|
|
|
use std::cell::RefCell;
|
|
|
|
use std::collections::HashMap;
|
|
|
|
use std::iter::{empty, once, Once};
|
|
|
|
|
|
|
|
pub(crate) struct DatasetView<S: ReadableEncodedStore> {
|
|
|
|
store: S,
|
|
|
|
extra: RefCell<HashMap<StrHash, String>>,
|
|
|
|
dataset: EncodedDatasetSpec<S::StrId>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<S: ReadableEncodedStore> DatasetView<S> {
|
|
|
|
pub fn new(store: S, dataset: &QueryDataset) -> Result<Self, EvaluationError> {
|
|
|
|
let dataset = EncodedDatasetSpec {
|
|
|
|
default: dataset
|
|
|
|
.default_graph_graphs()
|
|
|
|
.map(|graphs| {
|
|
|
|
graphs
|
|
|
|
.iter()
|
|
|
|
.flat_map(|g| store.get_encoded_graph_name(g.as_ref()).transpose())
|
|
|
|
.collect::<Result<Vec<_>, _>>()
|
|
|
|
})
|
|
|
|
.transpose()
|
|
|
|
.map_err(|e| e.into())?,
|
|
|
|
named: dataset
|
|
|
|
.available_named_graphs()
|
|
|
|
.map(|graphs| {
|
|
|
|
graphs
|
|
|
|
.iter()
|
|
|
|
.flat_map(|g| {
|
|
|
|
store
|
|
|
|
.get_encoded_named_or_blank_node(g.as_ref())
|
|
|
|
.transpose()
|
|
|
|
})
|
|
|
|
.collect::<Result<Vec<_>, _>>()
|
|
|
|
})
|
|
|
|
.transpose()
|
|
|
|
.map_err(|e| e.into())?,
|
|
|
|
};
|
|
|
|
Ok(Self {
|
|
|
|
store,
|
|
|
|
extra: RefCell::new(HashMap::default()),
|
|
|
|
dataset,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
#[allow(clippy::needless_collect)]
|
|
|
|
fn encoded_quads_for_pattern_in_dataset(
|
|
|
|
&self,
|
|
|
|
subject: Option<EncodedTerm<S::StrId>>,
|
|
|
|
predicate: Option<EncodedTerm<S::StrId>>,
|
|
|
|
object: Option<EncodedTerm<S::StrId>>,
|
|
|
|
graph_name: Option<EncodedTerm<S::StrId>>,
|
|
|
|
) -> Box<dyn Iterator<Item = Result<EncodedQuad<DatasetStrId<S::StrId>>, EvaluationError>>>
|
|
|
|
{
|
|
|
|
if let Some(graph_name) = graph_name {
|
|
|
|
if graph_name.is_default_graph() {
|
|
|
|
if let Some(default_graph_graphs) = &self.dataset.default {
|
|
|
|
if default_graph_graphs.len() == 1 {
|
|
|
|
// Single graph optimization
|
|
|
|
Box::new(
|
|
|
|
map_iter(self.store.encoded_quads_for_pattern(
|
|
|
|
subject,
|
|
|
|
predicate,
|
|
|
|
object,
|
|
|
|
Some(default_graph_graphs[0]),
|
|
|
|
))
|
|
|
|
.map(|quad| {
|
|
|
|
let quad = quad?;
|
|
|
|
Ok(EncodedQuad::new(
|
|
|
|
quad.subject,
|
|
|
|
quad.predicate,
|
|
|
|
quad.object,
|
|
|
|
EncodedTerm::DefaultGraph,
|
|
|
|
))
|
|
|
|
}),
|
|
|
|
)
|
|
|
|
} else {
|
|
|
|
let iters = default_graph_graphs
|
|
|
|
.iter()
|
|
|
|
.map(|graph_name| {
|
|
|
|
self.store.encoded_quads_for_pattern(
|
|
|
|
subject,
|
|
|
|
predicate,
|
|
|
|
object,
|
|
|
|
Some(*graph_name),
|
|
|
|
)
|
|
|
|
})
|
|
|
|
.collect::<Vec<_>>();
|
|
|
|
Box::new(map_iter(iters.into_iter().flatten()).map(|quad| {
|
|
|
|
let quad = quad?;
|
|
|
|
Ok(EncodedQuad::new(
|
|
|
|
quad.subject,
|
|
|
|
quad.predicate,
|
|
|
|
quad.object,
|
|
|
|
EncodedTerm::DefaultGraph,
|
|
|
|
))
|
|
|
|
}))
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
Box::new(map_iter(
|
|
|
|
self.store
|
|
|
|
.encoded_quads_for_pattern(subject, predicate, object, None),
|
|
|
|
))
|
|
|
|
}
|
|
|
|
} else if self
|
|
|
|
.dataset
|
|
|
|
.named
|
|
|
|
.as_ref()
|
|
|
|
.map_or(true, |d| d.contains(&graph_name))
|
|
|
|
{
|
|
|
|
Box::new(map_iter(self.store.encoded_quads_for_pattern(
|
|
|
|
subject,
|
|
|
|
predicate,
|
|
|
|
object,
|
|
|
|
Some(graph_name),
|
|
|
|
)))
|
|
|
|
} else {
|
|
|
|
Box::new(empty())
|
|
|
|
}
|
|
|
|
} else if let Some(named_graphs) = &self.dataset.named {
|
|
|
|
let iters = named_graphs
|
|
|
|
.iter()
|
|
|
|
.map(|graph_name| {
|
|
|
|
self.store.encoded_quads_for_pattern(
|
|
|
|
subject,
|
|
|
|
predicate,
|
|
|
|
object,
|
|
|
|
Some(*graph_name),
|
|
|
|
)
|
|
|
|
})
|
|
|
|
.collect::<Vec<_>>();
|
|
|
|
Box::new(map_iter(iters.into_iter().flatten()))
|
|
|
|
} else {
|
|
|
|
Box::new(
|
|
|
|
map_iter(
|
|
|
|
self.store
|
|
|
|
.encoded_quads_for_pattern(subject, predicate, object, None),
|
|
|
|
)
|
|
|
|
.filter(|quad| match quad {
|
|
|
|
Err(_) => true,
|
|
|
|
Ok(quad) => quad.graph_name != EncodedTerm::DefaultGraph,
|
|
|
|
}),
|
|
|
|
)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<S: ReadableEncodedStore> StrEncodingAware for DatasetView<S> {
|
|
|
|
type Error = EvaluationError;
|
|
|
|
type StrId = DatasetStrId<S::StrId>;
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<S: ReadableEncodedStore> StrLookup for DatasetView<S> {
|
|
|
|
fn get_str(&self, id: DatasetStrId<S::StrId>) -> Result<Option<String>, EvaluationError> {
|
|
|
|
match id {
|
|
|
|
DatasetStrId::Store(id) => self.store.get_str(id).map_err(|e| e.into()),
|
|
|
|
DatasetStrId::Temporary(id) => Ok(self.extra.borrow().get(&id).cloned()),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn get_str_id(&self, value: &str) -> Result<Option<DatasetStrId<S::StrId>>, EvaluationError> {
|
|
|
|
let id = StrHash::new(value);
|
|
|
|
if self.extra.borrow().contains_key(&id) {
|
|
|
|
Ok(Some(DatasetStrId::Temporary(id)))
|
|
|
|
} else {
|
|
|
|
Ok(self
|
|
|
|
.store
|
|
|
|
.get_str_id(value)
|
|
|
|
.map_err(|e| e.into())?
|
|
|
|
.map(DatasetStrId::Store))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<S: ReadableEncodedStore> ReadableEncodedStore for DatasetView<S> {
|
|
|
|
type QuadsIter =
|
|
|
|
Box<dyn Iterator<Item = Result<EncodedQuad<DatasetStrId<S::StrId>>, EvaluationError>>>;
|
|
|
|
type GraphsIter = Once<Result<EncodedTerm<DatasetStrId<S::StrId>>, EvaluationError>>;
|
|
|
|
|
|
|
|
fn encoded_quads_for_pattern(
|
|
|
|
&self,
|
|
|
|
subject: Option<EncodedTerm<Self::StrId>>,
|
|
|
|
predicate: Option<EncodedTerm<Self::StrId>>,
|
|
|
|
object: Option<EncodedTerm<Self::StrId>>,
|
|
|
|
graph_name: Option<EncodedTerm<Self::StrId>>,
|
|
|
|
) -> Box<dyn Iterator<Item = Result<EncodedQuad<DatasetStrId<S::StrId>>, EvaluationError>>>
|
|
|
|
{
|
|
|
|
if let Some((subject, predicate, object, graph_name)) =
|
|
|
|
try_map_quad_pattern(subject, predicate, object, graph_name)
|
|
|
|
{
|
|
|
|
self.encoded_quads_for_pattern_in_dataset(subject, predicate, object, graph_name)
|
|
|
|
} else {
|
|
|
|
Box::new(empty())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn encoded_named_graphs(&self) -> Self::GraphsIter {
|
|
|
|
once(Err(EvaluationError::msg(
|
|
|
|
"Graphs lookup is not implemented by DatasetView",
|
|
|
|
)))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn contains_encoded_named_graph(
|
|
|
|
&self,
|
|
|
|
_: EncodedTerm<Self::StrId>,
|
|
|
|
) -> Result<bool, EvaluationError> {
|
|
|
|
Err(EvaluationError::msg(
|
|
|
|
"Graphs lookup is not implemented by DatasetView",
|
|
|
|
))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn map_iter<'a, I: StrId>(
|
|
|
|
iter: impl Iterator<Item = Result<EncodedQuad<I>, impl Into<EvaluationError>>> + 'a,
|
|
|
|
) -> impl Iterator<Item = Result<EncodedQuad<DatasetStrId<I>>, EvaluationError>> + 'a {
|
|
|
|
iter.map(|t| {
|
|
|
|
t.map(|q| EncodedQuad {
|
|
|
|
subject: q.subject.map_id(DatasetStrId::Store),
|
|
|
|
predicate: q.predicate.map_id(DatasetStrId::Store),
|
|
|
|
object: q.object.map_id(DatasetStrId::Store),
|
|
|
|
graph_name: q.graph_name.map_id(DatasetStrId::Store),
|
|
|
|
})
|
|
|
|
.map_err(|e| e.into())
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
type QuadPattern<I> = (
|
|
|
|
Option<EncodedTerm<I>>,
|
|
|
|
Option<EncodedTerm<I>>,
|
|
|
|
Option<EncodedTerm<I>>,
|
|
|
|
Option<EncodedTerm<I>>,
|
|
|
|
);
|
|
|
|
|
|
|
|
fn try_map_quad_pattern<I: StrId>(
|
|
|
|
subject: Option<EncodedTerm<DatasetStrId<I>>>,
|
|
|
|
predicate: Option<EncodedTerm<DatasetStrId<I>>>,
|
|
|
|
object: Option<EncodedTerm<DatasetStrId<I>>>,
|
|
|
|
graph_name: Option<EncodedTerm<DatasetStrId<I>>>,
|
|
|
|
) -> Option<QuadPattern<I>> {
|
|
|
|
Some((
|
|
|
|
transpose(subject.map(|t| t.try_map_id(unwrap_store_id).ok()))?,
|
|
|
|
transpose(predicate.map(|t| t.try_map_id(unwrap_store_id).ok()))?,
|
|
|
|
transpose(object.map(|t| t.try_map_id(unwrap_store_id).ok()))?,
|
|
|
|
transpose(graph_name.map(|t| t.try_map_id(unwrap_store_id).ok()))?,
|
|
|
|
))
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Swaps the meaning of the two `Option` layers.
///
/// * `None` becomes `Some(None)`,
/// * `Some(None)` becomes `None`,
/// * `Some(Some(v))` is returned unchanged.
fn transpose<T>(o: Option<Option<T>>) -> Option<Option<T>> {
    match o {
        None => Some(None),
        Some(inner) => inner.map(Some),
    }
}
|
|
|
|
|
|
|
|
fn unwrap_store_id<I: StrId>(id: DatasetStrId<I>) -> Result<I, ()> {
|
|
|
|
match id {
|
|
|
|
DatasetStrId::Store(id) => Ok(id),
|
|
|
|
DatasetStrId::Temporary(_) => Err(()),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a, S: ReadableEncodedStore> StrContainer for &'a DatasetView<S> {
|
|
|
|
fn insert_str(&mut self, value: &str) -> Result<Self::StrId, EvaluationError> {
|
|
|
|
if let Some(id) = self.store.get_str_id(value).map_err(|e| e.into())? {
|
|
|
|
Ok(DatasetStrId::Store(id))
|
|
|
|
} else {
|
|
|
|
let hash = StrHash::new(value);
|
|
|
|
self.extra
|
|
|
|
.borrow_mut()
|
|
|
|
.entry(hash)
|
|
|
|
.or_insert_with(|| value.to_owned());
|
|
|
|
Ok(DatasetStrId::Temporary(hash))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Eq, PartialEq, Debug, Copy, Clone, Hash)]
|
|
|
|
pub enum DatasetStrId<I: StrId> {
|
|
|
|
Store(I),
|
|
|
|
Temporary(StrHash),
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Marks [`DatasetStrId`] as usable wherever a string id is expected.
impl<I: StrId> StrId for DatasetStrId<I> {}
|
|
|
|
|
|
|
|
struct EncodedDatasetSpec<I: StrId> {
|
|
|
|
default: Option<Vec<EncodedTerm<I>>>,
|
|
|
|
named: Option<Vec<EncodedTerm<I>>>,
|
|
|
|
}
|