Simplifies Sophia traits implementation

pull/171/head
Tpt 4 years ago
parent 943d116f56
commit 13ee6bf80c
  1. 179
      lib/src/store/sophia.rs

@ -1,51 +1,33 @@
//! This crate provides implementation of [Sophia](https://docs.rs/sophia/) traits for the `store` module. //! This crate provides implementation of [Sophia](https://docs.rs/sophia/) traits for the `store` module.
use crate::model::*;
use crate::model::{
BlankNodeRef, GraphNameRef, LiteralRef, NamedNodeRef, NamedOrBlankNodeRef, Quad, QuadRef, Term,
TermRef,
};
use crate::sparql::{EvaluationError, QueryResults}; use crate::sparql::{EvaluationError, QueryResults};
use crate::store::*; use crate::store::SledStore;
use sophia_api::dataset::*; use sophia_api::dataset::{
CollectibleDataset, DQuadSource, DResultTermSet, DTerm, Dataset, MDResult, MutableDataset,
};
use sophia_api::quad::stream::{QuadSource, StreamResult}; use sophia_api::quad::stream::{QuadSource, StreamResult};
use sophia_api::quad::streaming_mode::{ByValue, StreamedQuad}; use sophia_api::quad::streaming_mode::{ByValue, StreamedQuad};
use sophia_api::term::{TTerm, TermKind}; use sophia_api::term::{TTerm, TermKind};
use std::collections::HashSet; use std::collections::HashSet;
use std::hash::Hash; use std::hash::Hash;
use std::io::{Error, ErrorKind};
use std::iter::empty; use std::iter::empty;
type SophiaQuad = ([Term; 3], Option<Term>); type SophiaQuad = ([Term; 3], Option<Term>);
type StreamedSophiaQuad<'a> = StreamedQuad<'a, ByValue<SophiaQuad>>; type StreamedSophiaQuad<'a> = StreamedQuad<'a, ByValue<SophiaQuad>>;
/// Execute a SPARQL query in a store, and return the result as a HashSet, impl Dataset for SledStore {
/// mapping the error (if any) through the given function.
///
/// # Precondition
/// + the query must be a SELECT query with a single selected variable
/// + it must not produce NULL results
macro_rules! sparql_to_hashset {
($store: ident, $err_map: ident, $sparql: expr) => {{
(|| -> Result<HashSet<Term>, EvaluationError> {
if let QueryResults::Solutions(solutions) = $store.query($sparql)? {
solutions
.map(|r| r.map(|v| v.get(0).unwrap().clone()))
.collect()
} else {
unreachable!()
}
})()
.map_err($err_map)
}};
}
macro_rules! impl_dataset {
($store: ident, $error: ty, $quad_map: ident, $err_map: ident) => {
impl Dataset for $store {
type Quad = ByValue<SophiaQuad>; type Quad = ByValue<SophiaQuad>;
type Error = $error; type Error = Error;
fn quads(&self) -> DQuadSource<'_, Self> { fn quads(&self) -> DQuadSource<'_, Self> {
Box::new( Box::new(self.iter().map(io_quad_map))
self.quads_for_pattern(None, None, None, None)
.map($quad_map),
)
} }
fn quads_with_s<'s, TS>(&'s self, s: &'s TS) -> DQuadSource<'s, Self> fn quads_with_s<'s, TS>(&'s self, s: &'s TS) -> DQuadSource<'s, Self>
where where
TS: TTerm + ?Sized, TS: TTerm + ?Sized,
@ -55,7 +37,7 @@ macro_rules! impl_dataset {
if s.is_none() { if s.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, None, None, None).map($quad_map)) Box::new(self.quads_for_pattern(s, None, None, None).map(io_quad_map))
} }
} }
fn quads_with_p<'s, TP>(&'s self, p: &'s TP) -> DQuadSource<'s, Self> fn quads_with_p<'s, TP>(&'s self, p: &'s TP) -> DQuadSource<'s, Self>
@ -67,7 +49,7 @@ macro_rules! impl_dataset {
if p.is_none() { if p.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, p, None, None).map($quad_map)) Box::new(self.quads_for_pattern(None, p, None, None).map(io_quad_map))
} }
} }
fn quads_with_o<'s, TS>(&'s self, o: &'s TS) -> DQuadSource<'s, Self> fn quads_with_o<'s, TS>(&'s self, o: &'s TS) -> DQuadSource<'s, Self>
@ -79,7 +61,7 @@ macro_rules! impl_dataset {
if o.is_none() { if o.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, None, o, None).map($quad_map)) Box::new(self.quads_for_pattern(None, None, o, None).map(io_quad_map))
} }
} }
fn quads_with_g<'s, TS>(&'s self, g: Option<&'s TS>) -> DQuadSource<'s, Self> fn quads_with_g<'s, TS>(&'s self, g: Option<&'s TS>) -> DQuadSource<'s, Self>
@ -91,7 +73,7 @@ macro_rules! impl_dataset {
if g.is_none() { if g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, None, None, g).map($quad_map)) Box::new(self.quads_for_pattern(None, None, None, g).map(io_quad_map))
} }
} }
fn quads_with_sp<'s, TS, TP>(&'s self, s: &'s TS, p: &'s TP) -> DQuadSource<'s, Self> fn quads_with_sp<'s, TS, TP>(&'s self, s: &'s TS, p: &'s TP) -> DQuadSource<'s, Self>
@ -106,7 +88,7 @@ macro_rules! impl_dataset {
if s.is_none() || p.is_none() { if s.is_none() || p.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, p, None, None).map($quad_map)) Box::new(self.quads_for_pattern(s, p, None, None).map(io_quad_map))
} }
} }
fn quads_with_so<'s, TS, TO>(&'s self, s: &'s TS, o: &'s TO) -> DQuadSource<'s, Self> fn quads_with_so<'s, TS, TO>(&'s self, s: &'s TS, o: &'s TO) -> DQuadSource<'s, Self>
@ -121,14 +103,10 @@ macro_rules! impl_dataset {
if s.is_none() || o.is_none() { if s.is_none() || o.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, None, o, None).map($quad_map)) Box::new(self.quads_for_pattern(s, None, o, None).map(io_quad_map))
} }
} }
fn quads_with_sg<'s, TS, TG>( fn quads_with_sg<'s, TS, TG>(&'s self, s: &'s TS, g: Option<&'s TG>) -> DQuadSource<'s, Self>
&'s self,
s: &'s TS,
g: Option<&'s TG>,
) -> DQuadSource<'s, Self>
where where
TS: TTerm + ?Sized, TS: TTerm + ?Sized,
TG: TTerm + ?Sized, TG: TTerm + ?Sized,
@ -140,7 +118,7 @@ macro_rules! impl_dataset {
if s.is_none() || g.is_none() { if s.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, None, None, g).map($quad_map)) Box::new(self.quads_for_pattern(s, None, None, g).map(io_quad_map))
} }
} }
fn quads_with_po<'s, TP, TO>(&'s self, p: &'s TP, o: &'s TO) -> DQuadSource<'s, Self> fn quads_with_po<'s, TP, TO>(&'s self, p: &'s TP, o: &'s TO) -> DQuadSource<'s, Self>
@ -155,14 +133,10 @@ macro_rules! impl_dataset {
if p.is_none() || o.is_none() { if p.is_none() || o.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, p, o, None).map($quad_map)) Box::new(self.quads_for_pattern(None, p, o, None).map(io_quad_map))
} }
} }
fn quads_with_pg<'s, TP, TG>( fn quads_with_pg<'s, TP, TG>(&'s self, p: &'s TP, g: Option<&'s TG>) -> DQuadSource<'s, Self>
&'s self,
p: &'s TP,
g: Option<&'s TG>,
) -> DQuadSource<'s, Self>
where where
TP: TTerm + ?Sized, TP: TTerm + ?Sized,
TG: TTerm + ?Sized, TG: TTerm + ?Sized,
@ -174,14 +148,10 @@ macro_rules! impl_dataset {
if p.is_none() || g.is_none() { if p.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, p, None, g).map($quad_map)) Box::new(self.quads_for_pattern(None, p, None, g).map(io_quad_map))
} }
} }
fn quads_with_og<'s, TO, TG>( fn quads_with_og<'s, TO, TG>(&'s self, o: &'s TO, g: Option<&'s TG>) -> DQuadSource<'s, Self>
&'s self,
o: &'s TO,
g: Option<&'s TG>,
) -> DQuadSource<'s, Self>
where where
TO: TTerm + ?Sized, TO: TTerm + ?Sized,
TG: TTerm + ?Sized, TG: TTerm + ?Sized,
@ -193,7 +163,7 @@ macro_rules! impl_dataset {
if o.is_none() || g.is_none() { if o.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, None, o, g).map($quad_map)) Box::new(self.quads_for_pattern(None, None, o, g).map(io_quad_map))
} }
} }
fn quads_with_spo<'s, TS, TP, TO>( fn quads_with_spo<'s, TS, TP, TO>(
@ -216,7 +186,7 @@ macro_rules! impl_dataset {
if s.is_none() || p.is_none() || o.is_none() { if s.is_none() || p.is_none() || o.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, p, o, None).map($quad_map)) Box::new(self.quads_for_pattern(s, p, o, None).map(io_quad_map))
} }
} }
fn quads_with_spg<'s, TS, TP, TG>( fn quads_with_spg<'s, TS, TP, TG>(
@ -239,7 +209,7 @@ macro_rules! impl_dataset {
if s.is_none() || p.is_none() || g.is_none() { if s.is_none() || p.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, p, None, g).map($quad_map)) Box::new(self.quads_for_pattern(s, p, None, g).map(io_quad_map))
} }
} }
fn quads_with_sog<'s, TS, TO, TG>( fn quads_with_sog<'s, TS, TO, TG>(
@ -262,7 +232,7 @@ macro_rules! impl_dataset {
if s.is_none() || o.is_none() || g.is_none() { if s.is_none() || o.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, None, o, g).map($quad_map)) Box::new(self.quads_for_pattern(s, None, o, g).map(io_quad_map))
} }
} }
fn quads_with_pog<'s, TP, TO, TG>( fn quads_with_pog<'s, TP, TO, TG>(
@ -285,7 +255,7 @@ macro_rules! impl_dataset {
if p.is_none() || o.is_none() || g.is_none() { if p.is_none() || o.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(None, p, o, g).map($quad_map)) Box::new(self.quads_for_pattern(None, p, o, g).map(io_quad_map))
} }
} }
fn quads_with_spog<'s, TS, TP, TO, TG>( fn quads_with_spog<'s, TS, TP, TO, TG>(
@ -312,52 +282,48 @@ macro_rules! impl_dataset {
if s.is_none() || p.is_none() || o.is_none() || g.is_none() { if s.is_none() || p.is_none() || o.is_none() || g.is_none() {
Box::new(empty()) Box::new(empty())
} else { } else {
Box::new(self.quads_for_pattern(s, p, o, g).map($quad_map)) Box::new(self.quads_for_pattern(s, p, o, g).map(io_quad_map))
} }
} }
fn subjects(&self) -> DResultTermSet<Self> fn subjects(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!( sparql_to_hashset(
self, self,
$err_map, "SELECT DISTINCT ?s {{?s ?p ?o} UNION { GRAPH ?g {?s ?p ?o}}}",
"SELECT DISTINCT ?s {{?s ?p ?o} UNION { GRAPH ?g {?s ?p ?o}}}"
) )
} }
fn predicates(&self) -> DResultTermSet<Self> fn predicates(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!( sparql_to_hashset(
self, self,
$err_map, "SELECT DISTINCT ?p {{?s ?p ?o} UNION { GRAPH ?g {?s ?p ?o}}}",
"SELECT DISTINCT ?p {{?s ?p ?o} UNION { GRAPH ?g {?s ?p ?o}}}"
) )
} }
fn objects(&self) -> DResultTermSet<Self> fn objects(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!( sparql_to_hashset(
self, self,
$err_map, "SELECT DISTINCT ?o {{?s ?p ?o} UNION { GRAPH ?g {?s ?p ?o}}}",
"SELECT DISTINCT ?o {{?s ?p ?o} UNION { GRAPH ?g {?s ?p ?o}}}"
) )
} }
fn graph_names(&self) -> DResultTermSet<Self> fn graph_names(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!(self, $err_map, "SELECT DISTINCT ?g {GRAPH ?g {?s ?p ?o}}") sparql_to_hashset(self, "SELECT DISTINCT ?g {GRAPH ?g {?s ?p ?o}}")
} }
fn iris(&self) -> DResultTermSet<Self> fn iris(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!( sparql_to_hashset(
self, self,
$err_map,
"SELECT DISTINCT ?iri { "SELECT DISTINCT ?iri {
{?iri ?p ?o} UNION {?iri ?p ?o} UNION
{?s ?iri ?o} UNION {?s ?iri ?o} UNION
@ -367,16 +333,15 @@ macro_rules! impl_dataset {
{GRAPH ?g {?s ?iri ?o}} UNION {GRAPH ?g {?s ?iri ?o}} UNION
{GRAPH ?g {?s ?p ?iri}} {GRAPH ?g {?s ?p ?iri}}
FILTER isIRI(?iri) FILTER isIRI(?iri)
}" }",
) )
} }
fn bnodes(&self) -> DResultTermSet<Self> fn bnodes(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!( sparql_to_hashset(
self, self,
$err_map,
"SELECT DISTINCT ?bn { "SELECT DISTINCT ?bn {
{?bn ?p ?o} UNION {?bn ?p ?o} UNION
{?s ?p ?bn} UNION {?s ?p ?bn} UNION
@ -384,21 +349,20 @@ macro_rules! impl_dataset {
{GRAPH ?s {?bn ?p ?o}} UNION {GRAPH ?s {?bn ?p ?o}} UNION
{GRAPH ?g {?s ?p ?bn}} {GRAPH ?g {?s ?p ?bn}}
FILTER isBlank(?bn) FILTER isBlank(?bn)
}" }",
) )
} }
fn literals(&self) -> DResultTermSet<Self> fn literals(&self) -> DResultTermSet<Self>
where where
DTerm<Self>: Clone + Eq + Hash, DTerm<Self>: Clone + Eq + Hash,
{ {
sparql_to_hashset!( sparql_to_hashset(
self, self,
$err_map,
"SELECT DISTINCT ?lit { "SELECT DISTINCT ?lit {
{?s ?p ?lit} UNION {?s ?p ?lit} UNION
{ GRAPH ?g {?s ?p ?lit}} { GRAPH ?g {?s ?p ?lit}}
FILTER isLiteral(?lit) FILTER isLiteral(?lit)
}" }",
) )
} }
fn variables(&self) -> DResultTermSet<Self> fn variables(&self) -> DResultTermSet<Self>
@ -408,16 +372,9 @@ macro_rules! impl_dataset {
Ok(std::collections::HashSet::new()) Ok(std::collections::HashSet::new())
} }
} }
};
}
mod sled {
use super::*;
impl_dataset!(SledStore, std::io::Error, io_quad_map, io_err_map);
impl MutableDataset for SledStore { impl MutableDataset for SledStore {
type MutationError = std::io::Error; type MutationError = Error;
fn insert<TS, TP, TO, TG>( fn insert<TS, TP, TO, TG>(
&mut self, &mut self,
s: &TS, s: &TS,
@ -470,34 +427,25 @@ mod sled {
} }
impl CollectibleDataset for SledStore { impl CollectibleDataset for SledStore {
fn from_quad_source<QS: QuadSource>( fn from_quad_source<QS: QuadSource>(quads: QS) -> StreamResult<Self, QS::Error, Self::Error> {
quads: QS, let mut d = SledStore::new().map_err(sophia_api::quad::stream::StreamError::SinkError)?;
) -> StreamResult<Self, QS::Error, Self::Error> {
let mut d =
SledStore::new().map_err(sophia_api::quad::stream::StreamError::SinkError)?;
d.insert_all(quads)?; d.insert_all(quads)?;
Ok(d) Ok(d)
} }
} }
#[cfg(test)]
sophia_api::test_dataset_impl!(test, SledStore, false, false);
}
// helper functions // helper functions
fn io_quad_map<'a>( fn io_quad_map<'a>(res: Result<Quad, Error>) -> Result<StreamedSophiaQuad<'a>, Error> {
res: Result<Quad, std::io::Error>,
) -> Result<StreamedSophiaQuad<'a>, std::io::Error> {
res.map(|q| { res.map(|q| {
let q: SophiaQuad = q.into(); let q: SophiaQuad = q.into();
StreamedQuad::by_value(q) StreamedQuad::by_value(q)
}) })
} }
fn io_err_map(err: EvaluationError) -> std::io::Error { fn io_err_map(err: EvaluationError) -> Error {
match err { match err {
EvaluationError::Io(err) => err, EvaluationError::Io(err) => err,
_ => panic!("Unexpected error"), err => Error::new(ErrorKind::InvalidInput, err),
} }
} }
@ -576,7 +524,7 @@ fn convert_iri_raw<'a>(
suffix: Option<&'a str>, suffix: Option<&'a str>,
buffer: &'a mut String, buffer: &'a mut String,
) -> NamedNodeRef<'a> { ) -> NamedNodeRef<'a> {
let iri: &'a str = match suffix { NamedNodeRef::new_unchecked(match suffix {
Some(suffix) => { Some(suffix) => {
buffer.clear(); buffer.clear();
buffer.push_str(ns); buffer.push_str(ns);
@ -584,8 +532,7 @@ fn convert_iri_raw<'a>(
buffer buffer
} }
None => ns, None => ns,
}; })
NamedNodeRef::new_unchecked(iri)
} }
fn convert_quadref<'a, TS, TP, TO, TG>( fn convert_quadref<'a, TS, TP, TO, TG>(
@ -622,3 +569,23 @@ where
}; };
Some(QuadRef::new(s, p, o, g)) Some(QuadRef::new(s, p, o, g))
} }
/// Execute a SPARQL query in a store, and return the result as a HashSet,
/// mapping the error (if any) through the given function.
///
/// # Precondition
/// + the query must be a SELECT query with a single selected variable
/// + it must not produce NULL results
fn sparql_to_hashset(store: &SledStore, sparql: &str) -> Result<HashSet<Term>, Error> {
if let QueryResults::Solutions(solutions) = store.query(sparql).map_err(io_err_map)? {
solutions
.map(|r| r.map(|v| v.get(0).unwrap().clone()))
.collect::<Result<_, _>>()
.map_err(io_err_map)
} else {
unreachable!()
}
}
#[cfg(test)]
sophia_api::test_dataset_impl!(test, SledStore, false, false);

Loading…
Cancel
Save