orm shape type to sparql with select

feat/orm-diffs
Laurin Weger 18 hours ago
parent a6e6b18e42
commit 0753859d0d
No known key found for this signature in database
GPG Key ID: 9B372BB0B792770F
  1. 6
      engine/verifier/src/orm/initialize.rs
  2. 11
      engine/verifier/src/orm/process_changes.rs
  3. 336
      engine/verifier/src/orm/query.rs
  4. 13
      sdk/rust/src/tests/orm_creation.rs

@ -17,7 +17,7 @@ use std::collections::HashMap;
use std::sync::Arc;
use std::sync::RwLock;
use crate::orm::query::shape_type_to_sparql;
use crate::orm::query::shape_type_to_sparql_select;
use crate::orm::types::*;
use crate::orm::utils::nuri_to_string;
use crate::types::CancelFn;
@ -84,8 +84,8 @@ impl Verifier {
shape_type: &OrmShapeType,
) -> Result<Value, NgError> {
// Query triples for this shape
let shape_query = shape_type_to_sparql(&shape_type.schema, &shape_type.shape, None)?;
let shape_triples = self.query_sparql_construct(shape_query, Some(nuri_to_string(nuri)))?;
let shape_query = shape_type_to_sparql_select(&shape_type.schema, &shape_type.shape, None)?;
let shape_triples = self.query_sparql_select(shape_query, Some(nuri_to_string(nuri)))?;
let changes: OrmChanges =
self.apply_triple_changes(&shape_triples, &[], nuri, Some(session_id.clone()), true)?;

@ -22,7 +22,7 @@ use ng_repo::errors::NgError;
use ng_repo::log::*;
use crate::orm::add_remove_triples::add_remove_triples;
use crate::orm::query::shape_type_to_sparql;
use crate::orm::query::shape_type_to_sparql_select;
use crate::orm::types::*;
use crate::orm::utils::*;
use crate::orm::OrmChanges;
@ -353,10 +353,13 @@ impl Verifier {
if objects_to_fetch.len() > 0 {
// Create sparql query
let shape_query =
shape_type_to_sparql(&schema, &shape_iri, Some(objects_to_fetch))?;
let shape_query = shape_type_to_sparql_select(
&schema,
&shape_iri,
Some(objects_to_fetch),
)?;
let new_triples =
self.query_sparql_construct(shape_query, Some(nuri_to_string(nuri)))?;
self.query_sparql_select(shape_query, Some(nuri_to_string(nuri)))?;
log_info!(
"[process_changes_for_shape_and_session] Fetched {} triples, recursively processing nested objects",

@ -18,11 +18,64 @@ use crate::orm::utils::{escape_literal, is_iri};
use crate::verifier::*;
use ng_net::orm::*;
use ng_oxigraph::oxigraph::sparql::{Query, QueryResults};
use ng_oxigraph::oxrdf::Triple;
use ng_oxigraph::oxrdf::{NamedNode, Triple};
use ng_repo::errors::NgError;
use ng_repo::log::*;
impl Verifier {
pub fn query_sparql_select(
&self,
query: String,
nuri: Option<String>,
) -> Result<Vec<Triple>, NgError> {
let oxistore = self.graph_dataset.as_ref().unwrap();
let nuri_str = nuri.as_ref().map(|s| s.as_str());
log_debug!("querying select\n{}\n{}\n", nuri_str.unwrap(), query);
let parsed =
Query::parse(&query, nuri_str).map_err(|e| NgError::OxiGraphError(e.to_string()))?;
let results = oxistore
.query(parsed, nuri)
.map_err(|e| NgError::OxiGraphError(e.to_string()))?;
match results {
QueryResults::Solutions(solutions) => {
let mut result_triples: HashSet<Triple> = HashSet::new();
for s in solutions {
match s {
Err(e) => {
log_err!("{}", e.to_string());
return Err(NgError::SparqlError(e.to_string()));
}
Ok(solution) => {
let s = solution.get("s").unwrap();
let p = solution.get("p").unwrap();
let o = solution.get("o").unwrap();
// let g = solution.get("g"); // Optional
let triple = Triple {
subject: match s {
ng_oxigraph::oxrdf::Term::NamedNode(n) => {
ng_oxigraph::oxrdf::Subject::NamedNode(n.clone())
}
_ => panic!("Expected NamedNode for subject"),
},
predicate: match p {
ng_oxigraph::oxrdf::Term::NamedNode(n) => n.clone(),
_ => panic!(),
},
object: o.clone(),
};
log_debug!("triple fetched: {:?}", triple);
result_triples.insert(triple);
}
}
}
Ok(Vec::from_iter(result_triples))
}
_ => return Err(NgError::InvalidResponse),
}
}
pub fn query_sparql_construct(
&self,
query: String,
@ -92,7 +145,7 @@ pub fn literal_to_sparql_str(var: OrmSchemaDataType) -> Vec<String> {
}
}
pub fn shape_type_to_sparql(
pub fn shape_type_to_sparql_construct(
schema: &OrmSchema,
shape: &ShapeIri,
filter_subjects: Option<Vec<String>>,
@ -295,3 +348,282 @@ pub fn shape_type_to_sparql(
construct_body, where_body
))
}
pub fn shape_type_to_sparql_select(
schema: &OrmSchema,
shape: &ShapeIri,
filter_subjects: Option<Vec<String>>,
) -> Result<String, NgError> {
// Use a counter to generate unique variable names.
let mut var_counter = 0;
fn get_new_var_name(counter: &mut i32) -> String {
let name = format!("v{}", counter);
*counter += 1;
name
}
fn get_new_graph_var_name(counter: &mut i32) -> String {
let name = format!("g{}", counter);
*counter += 1;
name
}
// Collect SELECT branches (each produces bindings for ?s ?p ?o ?g) and shared WHERE constraints.
let mut select_branches: Vec<String> = Vec::new();
let mut where_statements: Vec<String> = Vec::new();
// Keep track of visited shapes while recursing to prevent infinite loops.
let mut visited_shapes: HashSet<ShapeIri> = HashSet::new();
// Recursive function to build constraints and output branches per shape layer.
// Returns nested WHERE blocks (already wrapped in appropriate GRAPH clauses) to be included at the parent scope.
fn process_shape(
schema: &OrmSchema,
shape: &OrmSchemaShape,
subject_var_name: &str,
current_graph_var_name: &str,
// If this shape is reached via a parent predicate, we pass the link to bind nested subject even when optional
link_from_parent: Option<(
&str, /* parent subj var */
&str, /* predicate IRI */
&str, /* parent graph var */
&str, /* this subj var */
)>,
select_branches: &mut Vec<String>,
where_statements: &mut Vec<String>,
var_counter: &mut i32,
visited_shapes: &mut HashSet<String>,
in_recursion: bool,
) -> Vec<String> {
// Prevent infinite recursion on cyclic schemas.
// TODO: We could handle this as IRI string reference.
if visited_shapes.contains(&shape.iri) {
return vec![];
}
let mut new_where_statements: Vec<String> = vec![];
visited_shapes.insert(shape.iri.clone());
// Add statements for each predicate of the current shape layer.
for predicate in &shape.predicates {
let mut union_triples: Vec<String> = Vec::new();
let mut nested_where_blocks: Vec<String> = Vec::new();
// Traverse acceptable nested shapes, if any.
for datatype in &predicate.dataTypes {
if datatype.valType == OrmSchemaValType::shape {
let shape_iri = &datatype.shape.clone().unwrap();
let nested_shape = schema.get(shape_iri).unwrap();
// Var for object at this branch
let obj_var_name = get_new_var_name(var_counter);
// This triple binds the nested subject for this branch (in current layer's graph)
let triple = format!(
" ?{} <{}> ?{}",
subject_var_name, predicate.iri, obj_var_name
);
union_triples.push(triple.clone());
// Output branch for the parent link triple itself (belongs to current layer) when not in recursive catch-all
if !in_recursion {
let branch = format!(
" GRAPH ?{} {{\n{}\n }}\n BIND(?{} AS ?s)\n BIND(<{}> AS ?p)\n BIND(?{} AS ?o)\n BIND(?{} AS ?g)",
current_graph_var_name,
triple,
subject_var_name,
predicate.iri,
obj_var_name,
current_graph_var_name
);
select_branches.push(format!("{{\n{}\n}}", branch));
}
// Recurse for nested shape: it has its own graph layer
let nested_graph_var = get_new_graph_var_name(var_counter);
let nested_blocks = process_shape(
schema,
nested_shape,
&obj_var_name,
&nested_graph_var,
Some((
subject_var_name,
&predicate.iri,
current_graph_var_name,
&obj_var_name,
)),
select_branches,
where_statements,
var_counter,
visited_shapes,
true,
);
nested_where_blocks.extend(nested_blocks);
}
}
// Build the WHERE part for this predicate in the current layer
let where_body: String;
if !union_triples.is_empty() {
let union_body = union_triples
.iter()
.map(|b| format!("{{\n{}\n}}", b))
.collect::<Vec<_>>()
.join(" UNION ");
if !nested_where_blocks.is_empty() {
let nested_joined = nested_where_blocks.join(" .\n");
where_body = format!("{} .\n{}", union_body, nested_joined);
} else {
where_body = union_body;
}
} else {
// Value predicate (non-shape)
let obj_var_name = get_new_var_name(var_counter);
let triple = format!(
" ?{} <{}> ?{}",
subject_var_name, predicate.iri, obj_var_name
);
where_body = triple.clone();
// Output branch for this value triple in current graph layer
if !in_recursion {
let branch = format!(
" GRAPH ?{} {{\n{}\n }}\n BIND(?{} AS ?s)\n BIND(<{}> AS ?p)\n BIND(?{} AS ?o)\n BIND(?{} AS ?g)",
current_graph_var_name,
triple,
subject_var_name,
predicate.iri,
obj_var_name,
current_graph_var_name
);
select_branches.push(format!("{{\n{}\n}}", branch));
}
}
// Optional wrapper, if needed
if predicate.minCardinality < 1 {
new_where_statements.push(format!(" OPTIONAL {{\n{}\n }}", where_body));
} else {
new_where_statements.push(where_body);
}
}
if in_recursion {
// In recursion, add a catch-all triple for this nested subject within its graph layer
let pred_var_name = get_new_var_name(var_counter);
let obj_var_name = get_new_var_name(var_counter);
let catch_all = format!(
" ?{} ?{} ?{}",
subject_var_name, pred_var_name, obj_var_name
);
// Output branch for nested triples: include the parent link triple to bind nested subject even when optional
if let Some((parent_subj, parent_pred, parent_graph, this_subj)) = link_from_parent {
let parent_link = format!(
" GRAPH ?{} {{\n ?{} <{}> ?{}\n }}",
parent_graph, parent_subj, parent_pred, this_subj
);
let nested_graph_block = format!(
" GRAPH ?{} {{\n{}\n }}",
current_graph_var_name, catch_all
);
let branch = format!(
"{}\n{}\n BIND(?{} AS ?s)\n BIND(?{} AS ?p)\n BIND(?{} AS ?o)\n BIND(?{} AS ?g)",
parent_link,
nested_graph_block,
subject_var_name,
pred_var_name,
obj_var_name,
current_graph_var_name
);
select_branches.push(format!("{{\n{}\n}}", branch));
} else {
// Fallback: no explicit parent link (shouldn't happen for nested shapes), still output within graph
let branch = format!(
" GRAPH ?{} {{\n{}\n }}\n BIND(?{} AS ?s)\n BIND(?{} AS ?p)\n BIND(?{} AS ?o)\n BIND(?{} AS ?g)",
current_graph_var_name,
catch_all,
subject_var_name,
pred_var_name,
obj_var_name,
current_graph_var_name
);
select_branches.push(format!("{{\n{}\n}}", branch));
}
// Combine catch-all with specific predicates of this nested shape inside its graph
let joined_where_statements = new_where_statements.join(" .\n");
let inner_union = if joined_where_statements.is_empty() {
format!("{{{}}}", catch_all)
} else {
format!(
"{{{}}} UNION {{\n {}\n }}",
catch_all, joined_where_statements
)
};
let nested_block = format!(
" GRAPH ?{} {{\n {}\n }}",
current_graph_var_name, inner_union
);
visited_shapes.remove(&shape.iri);
return vec![nested_block];
} else {
// Add current layer constraints wrapped in its graph
if !new_where_statements.is_empty() {
let body = new_where_statements.join(" .\n");
where_statements.push(format!(
" GRAPH ?{} {{\n{}\n }}",
current_graph_var_name, body
));
}
}
visited_shapes.remove(&shape.iri);
vec![]
}
let root_shape = schema.get(shape).ok_or(VerifierError::InvalidOrmSchema)?;
// Root subject and graph variable names
let root_var_name = get_new_var_name(&mut var_counter);
let root_graph_var = get_new_graph_var_name(&mut var_counter);
process_shape(
schema,
root_shape,
&root_var_name,
&root_graph_var,
None,
&mut select_branches,
&mut where_statements,
&mut var_counter,
&mut visited_shapes,
false,
);
// Filter subjects, if present (applies to the root subject var)
if let Some(subjects) = filter_subjects {
let subjects_str = subjects
.iter()
.map(|s| format!("<{}>", s))
.collect::<Vec<_>>()
.join(", ");
where_statements.push(format!(" FILTER(?v0 IN ({}))", subjects_str));
}
// Assemble final query
let mut where_parts: Vec<String> = Vec::new();
if !where_statements.is_empty() {
where_parts.push(where_statements.join(" .\n"));
}
if !select_branches.is_empty() {
let union_body = select_branches.join(" UNION ");
where_parts.push(union_body);
}
Ok(format!(
"SELECT DISTINCT ?s ?p ?o ?g\nWHERE {{\n{}\n}}",
where_parts.join(" .\n")
))
}

@ -17,8 +17,8 @@ use ng_net::orm::{
OrmShapeType,
};
use ng_repo::log_info;
use ng_verifier::orm::query::shape_type_to_sparql;
use ng_repo::{log_debug, log_info};
use ng_verifier::orm::query::shape_type_to_sparql_select;
use serde_json::json;
use std::collections::HashMap;
use std::sync::Arc;
@ -78,7 +78,7 @@ INSERT DATA {
};
// Generate and execute the CONSTRUCT query
let query = shape_type_to_sparql(&shape_type.schema, &shape_type.shape, None).unwrap();
let query = shape_type_to_sparql_select(&shape_type.schema, &shape_type.shape, None).unwrap();
let triples = doc_sparql_construct(session_id, query, Some(doc_nuri.clone()))
.await
@ -181,7 +181,7 @@ INSERT DATA {
};
// Generate and run query
let query = shape_type_to_sparql(&shape_type.schema, &shape_type.shape, None).unwrap();
let query = shape_type_to_sparql_select(&shape_type.schema, &shape_type.shape, None).unwrap();
let triples = doc_sparql_construct(session_id, query, Some(doc_nuri.clone()))
.await
.unwrap();
@ -244,7 +244,7 @@ INSERT DATA {
};
// Generate and run query
let query = shape_type_to_sparql(&shape_type.schema, &shape_type.shape, None).unwrap();
let query = shape_type_to_sparql_select(&shape_type.schema, &shape_type.shape, None).unwrap();
let triples = doc_sparql_construct(session_id, query, Some(doc_nuri.clone()))
.await
.unwrap();
@ -319,7 +319,7 @@ INSERT DATA {
};
// Generate and run query. This must not infinite loop.
let query = shape_type_to_sparql(&shape_type.schema, &shape_type.shape, None).unwrap();
let query = shape_type_to_sparql_select(&shape_type.schema, &shape_type.shape, None).unwrap();
let triples = doc_sparql_construct(session_id, query, Some(doc_nuri.clone()))
.await
.unwrap();
@ -619,6 +619,7 @@ INSERT DATA {
]);
let mut actual_mut = orm_json.clone();
log_info!("actual data for orm_root_array:\n{:?}", actual_mut);
assert_json_eq(&mut expected, &mut actual_mut);
break;

Loading…
Cancel
Save