#![allow(clippy::ignored_unit_patterns)] use crate::algebra::*; use crate::query::*; use crate::term::*; use crate::update::*; use oxilangtag::LanguageTag; use oxiri::{Iri, IriParseError}; use oxrdf::vocab::{rdf, xsd}; use peg::parser; use peg::str::LineCol; use rand::random; use std::collections::{HashMap, HashSet}; use std::error::Error; use std::mem::take; use std::str::FromStr; use std::{char, fmt}; /// Parses a SPARQL query with an optional base IRI to resolve relative IRIs in the query. pub fn parse_query(query: &str, base_iri: Option<&str>) -> Result { let mut state = ParserState { base_iri: if let Some(base_iri) = base_iri { Some(Iri::parse(base_iri.to_owned()).map_err(|e| ParseError { inner: ParseErrorKind::InvalidBaseIri(e), })?) } else { None }, namespaces: HashMap::default(), used_bnodes: HashSet::default(), currently_used_bnodes: HashSet::default(), aggregates: Vec::new(), }; parser::QueryUnit(query, &mut state).map_err(|e| ParseError { inner: ParseErrorKind::Parser(e), }) } /// Parses a SPARQL update with an optional base IRI to resolve relative IRIs in the query. pub fn parse_update(update: &str, base_iri: Option<&str>) -> Result { let mut state = ParserState { base_iri: if let Some(base_iri) = base_iri { Some(Iri::parse(base_iri.to_owned()).map_err(|e| ParseError { inner: ParseErrorKind::InvalidBaseIri(e), })?) } else { None }, namespaces: HashMap::default(), used_bnodes: HashSet::default(), currently_used_bnodes: HashSet::default(), aggregates: Vec::new(), }; let operations = parser::UpdateInit(update, &mut state).map_err(|e| ParseError { inner: ParseErrorKind::Parser(e), })?; Ok(Update { operations, base_iri: state.base_iri, }) } /// Error returned during SPARQL parsing. #[derive(Debug)] pub struct ParseError { inner: ParseErrorKind, } #[derive(Debug)] enum ParseErrorKind { InvalidBaseIri(IriParseError), Parser(peg::error::ParseError), } impl fmt::Display for ParseError { #[inline] fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { match &self.inner { ParseErrorKind::InvalidBaseIri(e) => { write!(f, "Invalid SPARQL base IRI provided: {e}") } ParseErrorKind::Parser(e) => e.fmt(f), } } } impl Error for ParseError { #[inline] fn source(&self) -> Option<&(dyn Error + 'static)> { match &self.inner { ParseErrorKind::InvalidBaseIri(e) => Some(e), ParseErrorKind::Parser(e) => Some(e), } } } struct AnnotatedTerm { term: TermPattern, annotations: Vec<(NamedNodePattern, Vec)>, } #[derive(Default)] struct FocusedTriplePattern { focus: F, patterns: Vec, } impl FocusedTriplePattern { fn new(focus: F) -> Self { Self { focus, patterns: Vec::new(), } } } impl From> for FocusedTriplePattern> { fn from(input: FocusedTriplePattern) -> Self { Self { focus: vec![input.focus], patterns: input.patterns, } } } #[derive(Clone, Debug)] enum VariableOrPropertyPath { Variable(Variable), PropertyPath(PropertyPathExpression), } impl From for VariableOrPropertyPath { fn from(var: Variable) -> Self { Self::Variable(var) } } impl From for VariableOrPropertyPath { fn from(pattern: NamedNodePattern) -> Self { match pattern { NamedNodePattern::NamedNode(node) => PropertyPathExpression::from(node).into(), NamedNodePattern::Variable(v) => v.into(), } } } impl From for VariableOrPropertyPath { fn from(path: PropertyPathExpression) -> Self { Self::PropertyPath(path) } } fn add_to_triple_patterns( subject: TermPattern, predicate: NamedNodePattern, object: AnnotatedTerm, patterns: &mut Vec, ) -> Result<(), &'static str> { let triple = TriplePattern::new(subject, predicate, object.term); #[cfg(feature = "rdf-star")] for (p, os) in object.annotations { for o in os { add_to_triple_patterns(triple.clone().into(), p.clone(), o, patterns)? } } #[cfg(not(feature = "rdf-star"))] if !object.annotations.is_empty() { return Err("Embedded triples are only available in SPARQL-star"); } patterns.push(triple); Ok(()) } fn add_to_triple_or_path_patterns( subject: TermPattern, predicate: impl Into, object: AnnotatedTermPath, patterns: &mut Vec, ) -> Result<(), &'static str> { match predicate.into() { VariableOrPropertyPath::Variable(p) => { add_triple_to_triple_or_path_patterns(subject, p, object, patterns)?; } VariableOrPropertyPath::PropertyPath(p) => match p { PropertyPathExpression::NamedNode(p) => { add_triple_to_triple_or_path_patterns(subject, p, object, patterns)?; } PropertyPathExpression::Reverse(p) => add_to_triple_or_path_patterns( object.term, *p, AnnotatedTermPath { term: subject, annotations: object.annotations, }, patterns, )?, PropertyPathExpression::Sequence(a, b) => { if !object.annotations.is_empty() { return Err("Annotations are not allowed on property paths"); } let middle = BlankNode::default(); add_to_triple_or_path_patterns( subject, *a, AnnotatedTermPath { term: middle.clone().into(), annotations: Vec::new(), }, patterns, )?; add_to_triple_or_path_patterns( middle.into(), *b, AnnotatedTermPath { term: object.term, annotations: Vec::new(), }, patterns, )?; } path => { if !object.annotations.is_empty() { return Err("Annotations are not allowed on property paths"); } patterns.push(TripleOrPathPattern::Path { subject, path, object: object.term, }) } }, } Ok(()) } fn add_triple_to_triple_or_path_patterns( subject: TermPattern, predicate: impl Into, object: AnnotatedTermPath, patterns: &mut Vec, ) -> Result<(), &'static str> { let triple = TriplePattern::new(subject, predicate, object.term); #[cfg(feature = "rdf-star")] for (p, os) in object.annotations { for o in os { add_to_triple_or_path_patterns(triple.clone().into(), p.clone(), o, patterns)? } } #[cfg(not(feature = "rdf-star"))] if !object.annotations.is_empty() { return Err("Embedded triples are only available in SPARQL-star"); } patterns.push(triple.into()); Ok(()) } fn build_bgp(patterns: Vec) -> GraphPattern { let mut bgp = Vec::new(); let mut elements = Vec::with_capacity(patterns.len()); for pattern in patterns { match pattern { TripleOrPathPattern::Triple(t) => bgp.push(t), TripleOrPathPattern::Path { subject, path, object, } => { if !bgp.is_empty() { elements.push(GraphPattern::Bgp { patterns: take(&mut bgp), }); } elements.push(GraphPattern::Path { subject, path, object, }) } } } if !bgp.is_empty() { elements.push(GraphPattern::Bgp { patterns: bgp }); } elements.into_iter().reduce(new_join).unwrap_or_default() } #[derive(Debug)] enum TripleOrPathPattern { Triple(TriplePattern), Path { subject: TermPattern, path: PropertyPathExpression, object: TermPattern, }, } impl From for TripleOrPathPattern { fn from(tp: TriplePattern) -> Self { Self::Triple(tp) } } #[derive(Debug)] struct AnnotatedTermPath { term: TermPattern, annotations: Vec<(VariableOrPropertyPath, Vec)>, } impl From for AnnotatedTermPath { fn from(term: AnnotatedTerm) -> Self { Self { term: term.term, annotations: term .annotations .into_iter() .map(|(p, o)| (p.into(), o.into_iter().map(Self::from).collect())) .collect(), } } } #[derive(Debug, Default)] struct FocusedTripleOrPathPattern { focus: F, patterns: Vec, } impl FocusedTripleOrPathPattern { fn new(focus: F) -> Self { Self { focus, patterns: Vec::new(), } } } impl From> for FocusedTripleOrPathPattern> { fn from(input: FocusedTripleOrPathPattern) -> Self { Self { focus: vec![input.focus], patterns: input.patterns, } } } impl> From> for FocusedTripleOrPathPattern { fn from(input: FocusedTriplePattern) -> Self { Self { focus: input.focus.into(), patterns: input.patterns.into_iter().map(Into::into).collect(), } } } #[derive(Eq, PartialEq, Debug, Clone, Hash)] enum PartialGraphPattern { Optional(GraphPattern, Option), #[cfg(feature = "sep-0006")] Lateral(GraphPattern), Minus(GraphPattern), Bind(Expression, Variable), Filter(Expression), Other(GraphPattern), } fn new_join(l: GraphPattern, r: GraphPattern) -> GraphPattern { //Avoid to output empty BGPs if let GraphPattern::Bgp { patterns: pl } = &l { if pl.is_empty() { return r; } } if let GraphPattern::Bgp { patterns: pr } = &r { if pr.is_empty() { return l; } } match (l, r) { (GraphPattern::Bgp { patterns: mut pl }, GraphPattern::Bgp { patterns: pr }) => { pl.extend(pr); GraphPattern::Bgp { patterns: pl } } (GraphPattern::Bgp { patterns }, other) | (other, GraphPattern::Bgp { patterns }) if patterns.is_empty() => { other } (l, r) => GraphPattern::Join { left: Box::new(l), right: Box::new(r), }, } } fn not_empty_fold( iter: impl Iterator, combine: impl Fn(T, T) -> T, ) -> Result { iter.fold(None, |a, b| match a { Some(av) => Some(combine(av, b)), None => Some(b), }) .ok_or("The iterator should not be empty") } enum SelectionOption { Distinct, Reduced, Default, } enum SelectionMember { Variable(Variable), Expression(Expression, Variable), } enum SelectionVariables { Explicit(Vec), Star, Everything, } struct Selection { pub option: SelectionOption, pub variables: SelectionVariables, } impl Selection { fn no_op() -> Self { Self { option: SelectionOption::Default, variables: SelectionVariables::Everything, } } } fn build_select( select: Selection, r#where: GraphPattern, mut group: Option<(Vec, Vec<(Expression, Variable)>)>, having: Option, order_by: Option>, offset_limit: Option<(usize, Option)>, values: Option, state: &mut ParserState, ) -> Result { let mut p = r#where; let mut with_aggregate = false; //GROUP BY let aggregates = state.aggregates.pop().unwrap_or_default(); if group.is_none() && !aggregates.is_empty() { group = Some((vec![], vec![])); } if let Some((clauses, binds)) = group { for (expression, variable) in binds { p = GraphPattern::Extend { inner: Box::new(p), variable, expression, }; } p = GraphPattern::Group { inner: Box::new(p), variables: clauses, aggregates, }; with_aggregate = true; } //HAVING if let Some(expr) = having { p = GraphPattern::Filter { expr, inner: Box::new(p), }; } //VALUES if let Some(data) = values { p = new_join(p, data); } //SELECT let mut pv = Vec::new(); let with_project = match select.variables { SelectionVariables::Explicit(sel_items) => { let mut visible = HashSet::default(); p.on_in_scope_variable(|v| { visible.insert(v.clone()); }); for sel_item in sel_items { let v = match sel_item { SelectionMember::Variable(v) => { if with_aggregate && !visible.contains(&v) { // We validate projection variables if there is an aggregate return Err("The SELECT contains a variable that is unbound"); } v } SelectionMember::Expression(expression, variable) => { if visible.contains(&variable) { // We disallow to override an existing variable with an expression return Err( "The SELECT overrides an existing variable using an expression", ); } if with_aggregate && !are_variables_bound(&expression, &visible) { // We validate projection variables if there is an aggregate return Err( "The SELECT contains an expression with a variable that is unbound", ); } p = GraphPattern::Extend { inner: Box::new(p), variable: variable.clone(), expression, }; variable } }; if pv.contains(&v) { return Err("Duplicated variable name in SELECT"); } pv.push(v) } true } SelectionVariables::Star => { if with_aggregate { return Err("SELECT * is not authorized with GROUP BY"); } //TODO: is it really useful to do a projection? p.on_in_scope_variable(|v| { if !pv.contains(v) { pv.push(v.clone()); } }); pv.sort(); true } SelectionVariables::Everything => false, }; let mut m = p; //ORDER BY if let Some(expression) = order_by { m = GraphPattern::OrderBy { inner: Box::new(m), expression, }; } //PROJECT if with_project { m = GraphPattern::Project { inner: Box::new(m), variables: pv, }; } match select.option { SelectionOption::Distinct => m = GraphPattern::Distinct { inner: Box::new(m) }, SelectionOption::Reduced => m = GraphPattern::Reduced { inner: Box::new(m) }, SelectionOption::Default => (), } //OFFSET LIMIT if let Some((start, length)) = offset_limit { m = GraphPattern::Slice { inner: Box::new(m), start, length, } } Ok(m) } fn are_variables_bound(expression: &Expression, variables: &HashSet) -> bool { match expression { Expression::NamedNode(_) | Expression::Literal(_) | Expression::Bound(_) | Expression::Coalesce(_) | Expression::Exists(_) => true, Expression::Variable(var) => variables.contains(var), Expression::UnaryPlus(e) | Expression::UnaryMinus(e) | Expression::Not(e) => { are_variables_bound(e, variables) } Expression::Or(a, b) | Expression::And(a, b) | Expression::Equal(a, b) | Expression::SameTerm(a, b) | Expression::Greater(a, b) | Expression::GreaterOrEqual(a, b) | Expression::Less(a, b) | Expression::LessOrEqual(a, b) | Expression::Add(a, b) | Expression::Subtract(a, b) | Expression::Multiply(a, b) | Expression::Divide(a, b) => { are_variables_bound(a, variables) && are_variables_bound(b, variables) } Expression::In(a, b) => { are_variables_bound(a, variables) && b.iter().all(|b| are_variables_bound(b, variables)) } Expression::FunctionCall(_, parameters) => { parameters.iter().all(|p| are_variables_bound(p, variables)) } Expression::If(a, b, c) => { are_variables_bound(a, variables) && are_variables_bound(b, variables) && are_variables_bound(c, variables) } } } /// Called on every variable defined using "AS" or "VALUES" #[cfg(feature = "sep-0006")] fn add_defined_variables<'a>(pattern: &'a GraphPattern, set: &mut HashSet<&'a Variable>) { match pattern { GraphPattern::Bgp { .. } | GraphPattern::Path { .. } => {} GraphPattern::Join { left, right } | GraphPattern::LeftJoin { left, right, .. } | GraphPattern::Lateral { left, right } | GraphPattern::Union { left, right } | GraphPattern::Minus { left, right } => { add_defined_variables(left, set); add_defined_variables(right, set); } GraphPattern::Graph { inner, .. } => { add_defined_variables(inner, set); } GraphPattern::Extend { inner, variable, .. } => { set.insert(variable); add_defined_variables(inner, set); } GraphPattern::Group { variables, aggregates, inner, } => { for (v, _) in aggregates { set.insert(v); } let mut inner_variables = HashSet::new(); add_defined_variables(inner, &mut inner_variables); for v in inner_variables { if variables.contains(v) { set.insert(v); } } } GraphPattern::Values { variables, .. } => { for v in variables { set.insert(v); } } GraphPattern::Project { variables, inner } => { let mut inner_variables = HashSet::new(); add_defined_variables(inner, &mut inner_variables); for v in inner_variables { if variables.contains(v) { set.insert(v); } } } GraphPattern::Service { inner, .. } | GraphPattern::Filter { inner, .. } | GraphPattern::OrderBy { inner, .. } | GraphPattern::Distinct { inner } | GraphPattern::Reduced { inner } | GraphPattern::Slice { inner, .. } => add_defined_variables(inner, set), } } fn copy_graph(from: impl Into, to: impl Into) -> GraphUpdateOperation { let bgp = GraphPattern::Bgp { patterns: vec![TriplePattern::new( Variable::new_unchecked("s"), Variable::new_unchecked("p"), Variable::new_unchecked("o"), )], }; GraphUpdateOperation::DeleteInsert { delete: Vec::new(), insert: vec![QuadPattern::new( Variable::new_unchecked("s"), Variable::new_unchecked("p"), Variable::new_unchecked("o"), to, )], using: None, pattern: Box::new(match from.into() { GraphName::NamedNode(from) => GraphPattern::Graph { name: from.into(), inner: Box::new(bgp), }, GraphName::DefaultGraph => bgp, }), } } enum Either { Left(L), Right(R), } pub struct ParserState { base_iri: Option>, namespaces: HashMap, used_bnodes: HashSet, currently_used_bnodes: HashSet, aggregates: Vec>, } impl ParserState { fn parse_iri(&self, iri: String) -> Result, IriParseError> { if let Some(base_iri) = &self.base_iri { base_iri.resolve(&iri) } else { Iri::parse(iri) } } fn new_aggregation(&mut self, agg: AggregateExpression) -> Result { let aggregates = self.aggregates.last_mut().ok_or("Unexpected aggregate")?; Ok(aggregates .iter() .find_map(|(v, a)| (a == &agg).then_some(v)) .cloned() .unwrap_or_else(|| { let new_var = variable(); aggregates.push((new_var.clone(), agg)); new_var })) } } fn unescape_iriref(mut input: &str) -> Result { let mut output = String::with_capacity(input.len()); while let Some((before, after)) = input.split_once('\\') { output.push_str(before); let mut after = after.chars(); let (escape, after) = match after.next() { Some('u') => read_hex_char::<4>(after.as_str())?, Some('U') => read_hex_char::<8>(after.as_str())?, Some(_) => { return Err( "IRIs are only allowed to contain escape sequences \\uXXXX and \\UXXXXXXXX", ) } None => return Err("IRIs are not allowed to end with a '\'"), }; output.push(escape); input = after; } output.push_str(input); Ok(output) } fn unescape_string(mut input: &str) -> Result { let mut output = String::with_capacity(input.len()); while let Some((before, after)) = input.split_once('\\') { output.push_str(before); let mut after = after.chars(); let (escape, after) = match after.next() { Some('t') => ('\u{0009}', after.as_str()), Some('b') => ('\u{0008}', after.as_str()), Some('n') => ('\u{000A}', after.as_str()), Some('r') => ('\u{000D}', after.as_str()), Some('f') => ('\u{000C}', after.as_str()), Some('"') => ('\u{0022}', after.as_str()), Some('\'') => ('\u{0027}', after.as_str()), Some('\\') => ('\u{005C}', after.as_str()), Some('u') => read_hex_char::<4>(after.as_str())?, Some('U') => read_hex_char::<8>(after.as_str())?, Some(_) => return Err("The character that can be escaped in strings are tbnrf\"'\\"), None => return Err("strings are not allowed to end with a '\'"), }; output.push(escape); input = after; } output.push_str(input); Ok(output) } fn read_hex_char(input: &str) -> Result<(char, &str), &'static str> { if let Some(escape) = input.get(..SIZE) { if let Some(char) = u32::from_str_radix(escape, 16) .ok() .and_then(char::from_u32) { Ok((char, &input[SIZE..])) } else { Err("\\u escape sequence should be followed by hexadecimal digits") } } else { Err("\\u escape sequence should be followed by hexadecimal digits") } } fn variable() -> Variable { Variable::new_unchecked(format!("{:x}", random::())) } parser! { //See https://www.w3.org/TR/turtle/#sec-grammar grammar parser(state: &mut ParserState) for str { pub rule QueryUnit() -> Query = Query() rule Query() -> Query = _ Prologue() _ q:(SelectQuery() / ConstructQuery() / DescribeQuery() / AskQuery()) _ { q } pub rule UpdateInit() -> Vec = Update() rule Prologue() = (BaseDecl() _ / PrefixDecl() _)* {} rule BaseDecl() = i("BASE") _ i:IRIREF() { state.base_iri = Some(i) } rule PrefixDecl() = i("PREFIX") _ ns:PNAME_NS() _ i:IRIREF() { state.namespaces.insert(ns.into(), i.into_inner()); } rule SelectQuery() -> Query = s:SelectClause() _ d:DatasetClauses() _ w:WhereClause() _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? Ok(Query::Select { dataset: d, pattern: build_select(s, w, g, h, o, l, v, state)?, base_iri: state.base_iri.clone() }) } rule SubSelect() -> GraphPattern = s:SelectClause() _ w:WhereClause() _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? build_select(s, w, g, h, o, l, v, state) } rule SelectClause() -> Selection = i("SELECT") _ Selection_init() o:SelectClause_option() _ v:SelectClause_variables() { Selection { option: o, variables: v } } rule Selection_init() = { state.aggregates.push(Vec::new()) } rule SelectClause_option() -> SelectionOption = i("DISTINCT") { SelectionOption::Distinct } / i("REDUCED") { SelectionOption::Reduced } / { SelectionOption::Default } rule SelectClause_variables() -> SelectionVariables = "*" { SelectionVariables::Star } / p:SelectClause_member()+ { SelectionVariables::Explicit(p) } rule SelectClause_member() -> SelectionMember = v:Var() _ { SelectionMember::Variable(v) } / "(" _ e:Expression() _ i("AS") _ v:Var() _ ")" _ { SelectionMember::Expression(e, v) } rule ConstructQuery() -> Query = i("CONSTRUCT") _ c:ConstructTemplate() _ d:DatasetClauses() _ w:WhereClause() _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? Ok(Query::Construct { template: c, dataset: d, pattern: build_select(Selection::no_op(), w, g, h, o, l, v, state)?, base_iri: state.base_iri.clone() }) } / i("CONSTRUCT") _ d:DatasetClauses() _ i("WHERE") _ "{" _ c:ConstructQuery_optional_triple_template() _ "}" _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? Ok(Query::Construct { template: c.clone(), dataset: d, pattern: build_select( Selection::no_op(), GraphPattern::Bgp { patterns: c }, g, h, o, l, v, state )?, base_iri: state.base_iri.clone() }) } rule ConstructQuery_optional_triple_template() -> Vec = TriplesTemplate() / { Vec::new() } rule DescribeQuery() -> Query = i("DESCRIBE") _ "*" _ d:DatasetClauses() w:WhereClause()? _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? Ok(Query::Describe { dataset: d, pattern: build_select(Selection::no_op(), w.unwrap_or_default(), g, h, o, l, v, state)?, base_iri: state.base_iri.clone() }) } / i("DESCRIBE") _ p:DescribeQuery_item()+ _ d:DatasetClauses() w:WhereClause()? _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? Ok(Query::Describe { dataset: d, pattern: build_select(Selection { option: SelectionOption::Default, variables: SelectionVariables::Explicit(p.into_iter().map(|var_or_iri| match var_or_iri { NamedNodePattern::NamedNode(n) => SelectionMember::Expression(n.into(), variable()), NamedNodePattern::Variable(v) => SelectionMember::Variable(v) }).collect()) }, w.unwrap_or_default(), g, h, o, l, v, state)?, base_iri: state.base_iri.clone() }) } rule DescribeQuery_item() -> NamedNodePattern = i:VarOrIri() _ { i } rule AskQuery() -> Query = i("ASK") _ d:DatasetClauses() _ w:WhereClause() _ g:GroupClause()? _ h:HavingClause()? _ o:OrderClause()? _ l:LimitOffsetClauses()? _ v:ValuesClause() {? Ok(Query::Ask { dataset: d, pattern: build_select(Selection::no_op(), w, g, h, o, l, v, state)?, base_iri: state.base_iri.clone() }) } rule DatasetClause() -> (Option, Option) = i("FROM") _ d:(DefaultGraphClause() / NamedGraphClause()) { d } rule DatasetClauses() -> Option = d:DatasetClause() ** (_) { if d.is_empty() { return None; } let mut default = Vec::new(); let mut named = Vec::new(); for (d, n) in d { if let Some(d) = d { default.push(d); } if let Some(n) = n { named.push(n); } } Some(QueryDataset { default, named: Some(named) }) } rule DefaultGraphClause() -> (Option, Option) = s:SourceSelector() { (Some(s), None) } rule NamedGraphClause() -> (Option, Option) = i("NAMED") _ s:SourceSelector() { (None, Some(s)) } rule SourceSelector() -> NamedNode = iri() rule WhereClause() -> GraphPattern = i("WHERE")? _ p:GroupGraphPattern() { p } rule GroupClause() -> (Vec, Vec<(Expression,Variable)>) = i("GROUP") _ i("BY") _ c:GroupCondition_item()+ { let mut projections: Vec<(Expression,Variable)> = Vec::new(); let clauses = c.into_iter().map(|(e, vo)| { if let Expression::Variable(v) = e { v } else { let v = vo.unwrap_or_else(variable); projections.push((e, v.clone())); v } }).collect(); (clauses, projections) } rule GroupCondition_item() -> (Expression, Option) = c:GroupCondition() _ { c } rule GroupCondition() -> (Expression, Option) = e:BuiltInCall() { (e, None) } / e:FunctionCall() { (e, None) } / "(" _ e:Expression() _ v:GroupCondition_as()? ")" { (e, v) } / e:Var() { (e.into(), None) } rule GroupCondition_as() -> Variable = i("AS") _ v:Var() _ { v } rule HavingClause() -> Expression = i("HAVING") _ e:HavingCondition()+ {? not_empty_fold(e.into_iter(), |a, b| Expression::And(Box::new(a), Box::new(b))) } rule HavingCondition() -> Expression = Constraint() rule OrderClause() -> Vec = i("ORDER") _ i("BY") _ c:OrderClause_item()+ { c } rule OrderClause_item() -> OrderExpression = c:OrderCondition() _ { c } rule OrderCondition() -> OrderExpression = i("ASC") _ e: BrackettedExpression() { OrderExpression::Asc(e) } / i("DESC") _ e: BrackettedExpression() { OrderExpression::Desc(e) } / e: Constraint() { OrderExpression::Asc(e) } / v: Var() { OrderExpression::Asc(Expression::from(v)) } rule LimitOffsetClauses() -> (usize, Option) = l:LimitClause() _ o:OffsetClause()? { (o.unwrap_or(0), Some(l)) } / o:OffsetClause() _ l:LimitClause()? { (o, l) } rule LimitClause() -> usize = i("LIMIT") _ l:$(INTEGER()) {? usize::from_str(l).map_err(|_| "The query limit should be a non negative integer") } rule OffsetClause() -> usize = i("OFFSET") _ o:$(INTEGER()) {? usize::from_str(o).map_err(|_| "The query offset should be a non negative integer") } rule ValuesClause() -> Option = i("VALUES") _ p:DataBlock() { Some(p) } / { None } rule Update() -> Vec = _ Prologue() _ u:(Update1() ** (_ ";" _)) _ ( ";" _)? { u.into_iter().flatten().collect() } rule Update1() -> Vec = Load() / Clear() / Drop() / Add() / Move() / Copy() / Create() / InsertData() / DeleteData() / DeleteWhere() / Modify() rule Update1_silent() -> bool = i("SILENT") { true } / { false } rule Load() -> Vec = i("LOAD") _ silent:Update1_silent() _ source:iri() _ destination:Load_to()? { vec![GraphUpdateOperation::Load { silent, source, destination: destination.map_or(GraphName::DefaultGraph, GraphName::NamedNode) }] } rule Load_to() -> NamedNode = i("INTO") _ g: GraphRef() { g } rule Clear() -> Vec = i("CLEAR") _ silent:Update1_silent() _ graph:GraphRefAll() { vec![GraphUpdateOperation::Clear { silent, graph }] } rule Drop() -> Vec = i("DROP") _ silent:Update1_silent() _ graph:GraphRefAll() { vec![GraphUpdateOperation::Drop { silent, graph }] } rule Create() -> Vec = i("CREATE") _ silent:Update1_silent() _ graph:GraphRef() { vec![GraphUpdateOperation::Create { silent, graph }] } rule Add() -> Vec = i("ADD") _ silent:Update1_silent() _ from:GraphOrDefault() _ i("TO") _ to:GraphOrDefault() { // Rewriting defined by https://www.w3.org/TR/sparql11-update/#add if from == to { Vec::new() // identity case } else { let bgp = GraphPattern::Bgp { patterns: vec![TriplePattern::new(Variable::new_unchecked("s"), Variable::new_unchecked("p"), Variable::new_unchecked("o"))] }; vec![copy_graph(from, to)] } } rule Move() -> Vec = i("MOVE") _ silent:Update1_silent() _ from:GraphOrDefault() _ i("TO") _ to:GraphOrDefault() { // Rewriting defined by https://www.w3.org/TR/sparql11-update/#move if from == to { Vec::new() // identity case } else { let bgp = GraphPattern::Bgp { patterns: vec![TriplePattern::new(Variable::new_unchecked("s"), Variable::new_unchecked("p"), Variable::new_unchecked("o"))] }; vec![GraphUpdateOperation::Drop { silent: true, graph: to.clone().into() }, copy_graph(from.clone(), to), GraphUpdateOperation::Drop { silent, graph: from.into() }] } } rule Copy() -> Vec = i("COPY") _ silent:Update1_silent() _ from:GraphOrDefault() _ i("TO") _ to:GraphOrDefault() { // Rewriting defined by https://www.w3.org/TR/sparql11-update/#copy if from == to { Vec::new() // identity case } else { let bgp = GraphPattern::Bgp { patterns: vec![TriplePattern::new(Variable::new_unchecked("s"), Variable::new_unchecked("p"), Variable::new_unchecked("o"))] }; vec![GraphUpdateOperation::Drop { silent: true, graph: to.clone().into() }, copy_graph(from, to)] } } rule InsertData() -> Vec = i("INSERT") _ i("DATA") _ data:QuadData() { vec![GraphUpdateOperation::InsertData { data }] } rule DeleteData() -> Vec = i("DELETE") _ i("DATA") _ data:GroundQuadData() { vec![GraphUpdateOperation::DeleteData { data }] } rule DeleteWhere() -> Vec = i("DELETE") _ i("WHERE") _ d:QuadPattern() {? let pattern = d.iter().map(|q| { let bgp = GraphPattern::Bgp { patterns: vec![TriplePattern::new(q.subject.clone(), q.predicate.clone(), q.object.clone())] }; match &q.graph_name { GraphNamePattern::NamedNode(graph_name) => GraphPattern::Graph { name: graph_name.clone().into(), inner: Box::new(bgp) }, GraphNamePattern::DefaultGraph => bgp, GraphNamePattern::Variable(graph_name) => GraphPattern::Graph { name: graph_name.clone().into(), inner: Box::new(bgp) }, } }).reduce(new_join).unwrap_or_default(); let delete = d.into_iter().map(GroundQuadPattern::try_from).collect::,_>>().map_err(|()| "Blank nodes are not allowed in DELETE WHERE")?; Ok(vec![GraphUpdateOperation::DeleteInsert { delete, insert: Vec::new(), using: None, pattern: Box::new(pattern) }]) } rule Modify() -> Vec = with:Modify_with()? _ Modify_clear() c:Modify_clauses() _ u:(UsingClause() ** (_)) _ i("WHERE") _ pattern:GroupGraphPattern() { let (delete, insert) = c; let mut delete = delete.unwrap_or_default(); let mut insert = insert.unwrap_or_default(); #[allow(clippy::shadow_same)] let mut pattern = pattern; let mut using = if u.is_empty() { None } else { let mut default = Vec::new(); let mut named = Vec::new(); for (d, n) in u { if let Some(d) = d { default.push(d) } if let Some(n) = n { named.push(n) } } Some(QueryDataset { default, named: Some(named) }) }; if let Some(with) = with { // We inject WITH everywhere delete = delete.into_iter().map(|q| if q.graph_name == GraphNamePattern::DefaultGraph { GroundQuadPattern { subject: q.subject, predicate: q.predicate, object: q.object, graph_name: with.clone().into() } } else { q }).collect(); insert = insert.into_iter().map(|q| if q.graph_name == GraphNamePattern::DefaultGraph { QuadPattern { subject: q.subject, predicate: q.predicate, object: q.object, graph_name: with.clone().into() } } else { q }).collect(); if using.is_none() { using = Some(QueryDataset { default: vec![with], named: None }); } } vec![GraphUpdateOperation::DeleteInsert { delete, insert, using, pattern: Box::new(pattern) }] } rule Modify_with() -> NamedNode = i("WITH") _ i:iri() _ { i } rule Modify_clauses() -> (Option>, Option>) = d:DeleteClause() _ i:InsertClause()? { (Some(d), i) } / i:InsertClause() { (None, Some(i)) } rule Modify_clear() = { state.used_bnodes.clear(); state.currently_used_bnodes.clear(); } rule DeleteClause() -> Vec = i("DELETE") _ q:QuadPattern() {? q.into_iter().map(GroundQuadPattern::try_from).collect::,_>>().map_err(|()| "Blank nodes are not allowed in DELETE WHERE") } rule InsertClause() -> Vec = i("INSERT") _ q:QuadPattern() { q } rule UsingClause() -> (Option, Option) = i("USING") _ d:(UsingClause_default() / UsingClause_named()) { d } rule UsingClause_default() -> (Option, Option) = i:iri() { (Some(i), None) } rule UsingClause_named() -> (Option, Option) = i("NAMED") _ i:iri() { (None, Some(i)) } rule GraphOrDefault() -> GraphName = i("DEFAULT") { GraphName::DefaultGraph } / (i("GRAPH") _)? g:iri() { GraphName::NamedNode(g) } rule GraphRef() -> NamedNode = i("GRAPH") _ g:iri() { g } rule GraphRefAll() -> GraphTarget = i: GraphRef() { i.into() } / i("DEFAULT") { GraphTarget::DefaultGraph } / i("NAMED") { GraphTarget::NamedGraphs } / i("ALL") { GraphTarget::AllGraphs } rule QuadPattern() -> Vec = "{" _ q:Quads() _ "}" { q } rule QuadData() -> Vec = "{" _ q:Quads() _ "}" {? q.into_iter().map(Quad::try_from).collect::, ()>>().map_err(|()| "Variables are not allowed in INSERT DATA") } rule GroundQuadData() -> Vec = "{" _ q:Quads() _ "}" {? q.into_iter().map(|q| GroundQuad::try_from(Quad::try_from(q)?)).collect::, ()>>().map_err(|()| "Variables and blank nodes are not allowed in DELETE DATA") } rule Quads() -> Vec = q:(Quads_TriplesTemplate() / Quads_QuadsNotTriples()) ** (_) { q.into_iter().flatten().collect() } rule Quads_TriplesTemplate() -> Vec = t:TriplesTemplate() { t.into_iter().map(|t| QuadPattern::new(t.subject, t.predicate, t.object, GraphNamePattern::DefaultGraph)).collect() } //TODO: return iter? rule Quads_QuadsNotTriples() -> Vec = q:QuadsNotTriples() _ "."? { q } rule QuadsNotTriples() -> Vec = i("GRAPH") _ g:VarOrIri() _ "{" _ t:TriplesTemplate()? _ "}" { t.unwrap_or_default().into_iter().map(|t| QuadPattern::new(t.subject, t.predicate, t.object, g.clone())).collect() } rule TriplesTemplate() -> Vec = ts:TriplesTemplate_inner() ++ (".") ("." _)? { ts.into_iter().flatten().collect() } rule TriplesTemplate_inner() -> Vec = _ t:TriplesSameSubject() _ { t } rule GroupGraphPattern() -> GraphPattern = "{" _ GroupGraphPattern_clear() p:GroupGraphPatternSub() GroupGraphPattern_clear() _ "}" { p } / "{" _ GroupGraphPattern_clear() p:SubSelect() GroupGraphPattern_clear() _ "}" { p } rule GroupGraphPattern_clear() = { // We deal with blank nodes aliases rule state.used_bnodes.extend(state.currently_used_bnodes.iter().cloned()); state.currently_used_bnodes.clear(); } rule GroupGraphPatternSub() -> GraphPattern = a:TriplesBlock()? _ b:GroupGraphPatternSub_item()* {? let mut filter: Option = None; let mut g = a.map_or_else(GraphPattern::default, build_bgp); for e in b.into_iter().flatten() { match e { PartialGraphPattern::Optional(p, f) => { g = GraphPattern::LeftJoin { left: Box::new(g), right: Box::new(p), expression: f } } #[cfg(feature = "sep-0006")] PartialGraphPattern::Lateral(p) => { let mut defined_variables = HashSet::default(); add_defined_variables(&p, &mut defined_variables); let mut contains = false; g.on_in_scope_variable(|v| { if defined_variables.contains(v) { contains = true; } }); if contains { return Err("An existing variable is overridden in the right side of LATERAL"); } g = GraphPattern::Lateral { left: Box::new(g), right: Box::new(p) } } PartialGraphPattern::Minus(p) => { g = GraphPattern::Minus { left: Box::new(g), right: Box::new(p) } } PartialGraphPattern::Bind(expression, variable) => { let mut contains = false; g.on_in_scope_variable(|v| { if *v == variable { contains = true; } }); if contains { return Err("BIND is overriding an existing variable") } g = GraphPattern::Extend { inner: Box::new(g), variable, expression } } PartialGraphPattern::Filter(expr) => filter = Some(if let Some(f) = filter { Expression::And(Box::new(f), Box::new(expr)) } else { expr }), PartialGraphPattern::Other(e) => g = new_join(g, e), } } Ok(if let Some(expr) = filter { GraphPattern::Filter { expr, inner: Box::new(g) } } else { g }) } rule GroupGraphPatternSub_item() -> Vec = a:GraphPatternNotTriples() _ ("." _)? b:TriplesBlock()? _ { let mut result = vec![a]; if let Some(v) = b { result.push(PartialGraphPattern::Other(build_bgp(v))); } result } rule TriplesBlock() -> Vec = hs:TriplesBlock_inner() ++ (".") ("." _)? { hs.into_iter().flatten().collect() } rule TriplesBlock_inner() -> Vec = _ h:TriplesSameSubjectPath() _ { h } rule GraphPatternNotTriples() -> PartialGraphPattern = GroupOrUnionGraphPattern() / OptionalGraphPattern() / LateralGraphPattern() / MinusGraphPattern() / GraphGraphPattern() / ServiceGraphPattern() / Filter() / Bind() / InlineData() rule OptionalGraphPattern() -> PartialGraphPattern = i("OPTIONAL") _ p:GroupGraphPattern() { if let GraphPattern::Filter { expr, inner } = p { PartialGraphPattern::Optional(*inner, Some(expr)) } else { PartialGraphPattern::Optional(p, None) } } rule LateralGraphPattern() -> PartialGraphPattern = i("LATERAL") _ p:GroupGraphPattern() {? #[cfg(feature = "sep-0006")]{Ok(PartialGraphPattern::Lateral(p))} #[cfg(not(feature = "sep-0006"))]{Err("The LATERAL modifier is not supported")} } rule GraphGraphPattern() -> PartialGraphPattern = i("GRAPH") _ name:VarOrIri() _ p:GroupGraphPattern() { PartialGraphPattern::Other(GraphPattern::Graph { name, inner: Box::new(p) }) } rule ServiceGraphPattern() -> PartialGraphPattern = i("SERVICE") _ i("SILENT") _ name:VarOrIri() _ p:GroupGraphPattern() { PartialGraphPattern::Other(GraphPattern::Service { name, inner: Box::new(p), silent: true }) } / i("SERVICE") _ name:VarOrIri() _ p:GroupGraphPattern() { PartialGraphPattern::Other(GraphPattern::Service{ name, inner: Box::new(p), silent: false }) } rule Bind() -> PartialGraphPattern = i("BIND") _ "(" _ e:Expression() _ i("AS") _ v:Var() _ ")" { PartialGraphPattern::Bind(e, v) } rule InlineData() -> PartialGraphPattern = i("VALUES") _ p:DataBlock() { PartialGraphPattern::Other(p) } rule DataBlock() -> GraphPattern = l:(InlineDataOneVar() / InlineDataFull()) { GraphPattern::Values { variables: l.0, bindings: l.1 } } rule InlineDataOneVar() -> (Vec, Vec>>) = var:Var() _ "{" _ d:InlineDataOneVar_value()* "}" { (vec![var], d) } rule InlineDataOneVar_value() -> Vec> = t:DataBlockValue() _ { vec![t] } rule InlineDataFull() -> (Vec, Vec>>) = "(" _ vars:InlineDataFull_var()* _ ")" _ "{" _ vals:InlineDataFull_values()* "}" {? if vals.iter().all(|vs| vs.len() == vars.len()) { Ok((vars, vals)) } else { Err("The VALUES clause rows should have exactly the same number of values as there are variables. To set a value to undefined use UNDEF.") } } rule InlineDataFull_var() -> Variable = v:Var() _ { v } rule InlineDataFull_values() -> Vec> = "(" _ v:InlineDataFull_value()* _ ")" _ { v } rule InlineDataFull_value() -> Option = v:DataBlockValue() _ { v } rule DataBlockValue() -> Option = t:QuotedTripleData() {? #[cfg(feature = "rdf-star")]{Ok(Some(t.into()))} #[cfg(not(feature = "rdf-star"))]{Err("Embedded triples are only available in SPARQL-star")} } / i:iri() { Some(i.into()) } / l:RDFLiteral() { Some(l.into()) } / l:NumericLiteral() { Some(l.into()) } / l:BooleanLiteral() { Some(l.into()) } / i("UNDEF") { None } rule MinusGraphPattern() -> PartialGraphPattern = i("MINUS") _ p: GroupGraphPattern() { PartialGraphPattern::Minus(p) } rule GroupOrUnionGraphPattern() -> PartialGraphPattern = p:GroupOrUnionGraphPattern_item() **<1,> (i("UNION") _) {? not_empty_fold(p.into_iter(), |a, b| { GraphPattern::Union { left: Box::new(a), right: Box::new(b) } }).map(PartialGraphPattern::Other) } rule GroupOrUnionGraphPattern_item() -> GraphPattern = p:GroupGraphPattern() _ { p } rule Filter() -> PartialGraphPattern = i("FILTER") _ c:Constraint() { PartialGraphPattern::Filter(c) } rule Constraint() -> Expression = BrackettedExpression() / FunctionCall() / BuiltInCall() rule FunctionCall() -> Expression = f: iri() _ a: ArgList() { Expression::FunctionCall(Function::Custom(f), a) } rule ArgList() -> Vec = "(" _ e:ArgList_item() **<1,> ("," _) _ ")" { e } / NIL() { Vec::new() } rule ArgList_item() -> Expression = e:Expression() _ { e } rule ExpressionList() -> Vec = "(" _ e:ExpressionList_item() **<1,> ("," _) ")" { e } / NIL() { Vec::new() } rule ExpressionList_item() -> Expression = e:Expression() _ { e } rule ConstructTemplate() -> Vec = "{" _ t:ConstructTriples() _ "}" { t } rule ConstructTriples() -> Vec = p:ConstructTriples_item() ** ("." _) "."? { p.into_iter().flatten().collect() } rule ConstructTriples_item() -> Vec = t:TriplesSameSubject() _ { t } rule TriplesSameSubject() -> Vec = s:VarOrTerm() _ po:PropertyListNotEmpty() {? let mut patterns = po.patterns; for (p, os) in po.focus { for o in os { add_to_triple_patterns(s.clone(), p.clone(), o, &mut patterns)? } } Ok(patterns) } / s:TriplesNode() _ po:PropertyList() {? let mut patterns = s.patterns; patterns.extend(po.patterns); for (p, os) in po.focus { for o in os { add_to_triple_patterns(s.focus.clone(), p.clone(), o, &mut patterns)? } } Ok(patterns) } rule PropertyList() -> FocusedTriplePattern)>> = PropertyListNotEmpty() / { FocusedTriplePattern::default() } rule PropertyListNotEmpty() -> FocusedTriplePattern)>> = l:PropertyListNotEmpty_item() **<1,> (";" _) { l.into_iter().fold(FocusedTriplePattern::)>>::default(), |mut a, b| { a.focus.push(b.focus); a.patterns.extend(b.patterns); a }) } rule PropertyListNotEmpty_item() -> FocusedTriplePattern<(NamedNodePattern,Vec)> = p:Verb() _ o:ObjectList() _ { FocusedTriplePattern { focus: (p, o.focus), patterns: o.patterns } } rule Verb() -> NamedNodePattern = VarOrIri() / "a" { rdf::TYPE.into_owned().into() } rule ObjectList() -> FocusedTriplePattern> = o:ObjectList_item() **<1,> ("," _) { o.into_iter().fold(FocusedTriplePattern::>::default(), |mut a, b| { a.focus.push(b.focus); a.patterns.extend_from_slice(&b.patterns); a }) } rule ObjectList_item() -> FocusedTriplePattern = o:Object() _ { o } rule Object() -> FocusedTriplePattern = g:GraphNode() _ a:Annotation()? { if let Some(a) = a { let mut patterns = g.patterns; patterns.extend(a.patterns); FocusedTriplePattern { focus: AnnotatedTerm { term: g.focus, annotations: a.focus }, patterns } } else { FocusedTriplePattern { focus: AnnotatedTerm { term: g.focus, annotations: Vec::new() }, patterns: g.patterns } } } rule TriplesSameSubjectPath() -> Vec = s:VarOrTerm() _ po:PropertyListPathNotEmpty() {? let mut patterns = po.patterns; for (p, os) in po.focus { for o in os { add_to_triple_or_path_patterns(s.clone(), p.clone(), o, &mut patterns)?; } } Ok(patterns) } / s:TriplesNodePath() _ po:PropertyListPath() {? let mut patterns = s.patterns; patterns.extend(po.patterns); for (p, os) in po.focus { for o in os { add_to_triple_or_path_patterns(s.focus.clone(), p.clone(), o, &mut patterns)?; } } Ok(patterns) } rule PropertyListPath() -> FocusedTripleOrPathPattern)>> = PropertyListPathNotEmpty() / { FocusedTripleOrPathPattern::default() } rule PropertyListPathNotEmpty() -> FocusedTripleOrPathPattern)>> = hp:(VerbPath() / VerbSimple()) _ ho:ObjectListPath() _ t:PropertyListPathNotEmpty_item()* { t.into_iter().flatten().fold(FocusedTripleOrPathPattern { focus: vec![(hp, ho.focus)], patterns: ho.patterns }, |mut a, b| { a.focus.push(b.focus); a.patterns.extend(b.patterns); a }) } rule PropertyListPathNotEmpty_item() -> Option)>> = ";" _ c:PropertyListPathNotEmpty_item_content()? { c } rule PropertyListPathNotEmpty_item_content() -> FocusedTripleOrPathPattern<(VariableOrPropertyPath,Vec)> = p:(VerbPath() / VerbSimple()) _ o:ObjectListPath() _ { FocusedTripleOrPathPattern { focus: (p, o.focus.into_iter().map(AnnotatedTermPath::from).collect()), patterns: o.patterns } } rule VerbPath() -> VariableOrPropertyPath = p:Path() { p.into() } rule VerbSimple() -> VariableOrPropertyPath = v:Var() { v.into() } rule ObjectListPath() -> FocusedTripleOrPathPattern> = o:ObjectListPath_item() **<1,> ("," _) { o.into_iter().fold(FocusedTripleOrPathPattern::>::default(), |mut a, b| { a.focus.push(b.focus); a.patterns.extend(b.patterns); a }) } rule ObjectListPath_item() -> FocusedTripleOrPathPattern = o:ObjectPath() _ { o } rule ObjectPath() -> FocusedTripleOrPathPattern = g:GraphNodePath() _ a:AnnotationPath()? { if let Some(a) = a { let mut patterns = g.patterns; patterns.extend(a.patterns); FocusedTripleOrPathPattern { focus: AnnotatedTermPath { term: g.focus, annotations: a.focus }, patterns } } else { FocusedTripleOrPathPattern { focus: AnnotatedTermPath { term: g.focus, annotations: Vec::new() }, patterns: g.patterns } } } rule Path() -> PropertyPathExpression = PathAlternative() rule PathAlternative() -> PropertyPathExpression = p:PathAlternative_item() **<1,> ("|" _) {? not_empty_fold(p.into_iter(), |a, b| { PropertyPathExpression::Alternative(Box::new(a), Box::new(b)) }) } rule PathAlternative_item() -> PropertyPathExpression = p:PathSequence() _ { p } rule PathSequence() -> PropertyPathExpression = p:PathSequence_item() **<1,> ("/" _) {? not_empty_fold(p.into_iter(), |a, b| { PropertyPathExpression::Sequence(Box::new(a), Box::new(b)) }) } rule PathSequence_item() -> PropertyPathExpression = p:PathEltOrInverse() _ { p } rule PathElt() -> PropertyPathExpression = p:PathPrimary() _ o:PathElt_op()? { match o { Some('?') => PropertyPathExpression::ZeroOrOne(Box::new(p)), Some('*') => PropertyPathExpression::ZeroOrMore(Box::new(p)), Some('+') => PropertyPathExpression::OneOrMore(Box::new(p)), Some(_) => unreachable!(), None => p } } rule PathElt_op() -> char = "*" { '*' } / "+" { '+' } / "?" !(['0'..='9'] / PN_CHARS_U()) { '?' } // We mandate that this is not a variable rule PathEltOrInverse() -> PropertyPathExpression = "^" _ p:PathElt() { PropertyPathExpression::Reverse(Box::new(p)) } / PathElt() rule PathPrimary() -> PropertyPathExpression = v:iri() { v.into() } / "a" { rdf::TYPE.into_owned().into() } / "!" _ p:PathNegatedPropertySet() { p } / "(" _ p:Path() _ ")" { p } rule PathNegatedPropertySet() -> PropertyPathExpression = "(" _ p:PathNegatedPropertySet_item() **<1,> ("|" _) ")" { let mut direct = Vec::new(); let mut inverse = Vec::new(); for e in p { match e { Either::Left(a) => direct.push(a), Either::Right(b) => inverse.push(b) } } if inverse.is_empty() { PropertyPathExpression::NegatedPropertySet(direct) } else if direct.is_empty() { PropertyPathExpression::Reverse(Box::new(PropertyPathExpression::NegatedPropertySet(inverse))) } else { PropertyPathExpression::Alternative( Box::new(PropertyPathExpression::NegatedPropertySet(direct)), Box::new(PropertyPathExpression::Reverse(Box::new(PropertyPathExpression::NegatedPropertySet(inverse)))) ) } } / p:PathOneInPropertySet() { match p { Either::Left(a) => PropertyPathExpression::NegatedPropertySet(vec![a]), Either::Right(b) => PropertyPathExpression::Reverse(Box::new(PropertyPathExpression::NegatedPropertySet(vec![b]))), } } rule PathNegatedPropertySet_item() -> Either = p:PathOneInPropertySet() _ { p } rule PathOneInPropertySet() -> Either = "^" _ v:iri() { Either::Right(v) } / "^" _ "a" { Either::Right(rdf::TYPE.into()) } / v:iri() { Either::Left(v) } / "a" { Either::Left(rdf::TYPE.into()) } rule TriplesNode() -> FocusedTriplePattern = Collection() / BlankNodePropertyList() rule BlankNodePropertyList() -> FocusedTriplePattern = "[" _ po:PropertyListNotEmpty() _ "]" {? let mut patterns = po.patterns; let mut bnode = TermPattern::from(BlankNode::default()); for (p, os) in po.focus { for o in os { add_to_triple_patterns(bnode.clone(), p.clone(), o, &mut patterns)?; } } Ok(FocusedTriplePattern { focus: bnode, patterns }) } rule TriplesNodePath() -> FocusedTripleOrPathPattern = CollectionPath() / BlankNodePropertyListPath() rule BlankNodePropertyListPath() -> FocusedTripleOrPathPattern = "[" _ po:PropertyListPathNotEmpty() _ "]" {? let mut patterns = po.patterns; let mut bnode = TermPattern::from(BlankNode::default()); for (p, os) in po.focus { for o in os { add_to_triple_or_path_patterns(bnode.clone(), p.clone(), o, &mut patterns)?; } } Ok(FocusedTripleOrPathPattern { focus: bnode, patterns }) } rule Collection() -> FocusedTriplePattern = "(" _ o:Collection_item()+ ")" { let mut patterns: Vec = Vec::new(); let mut current_list_node = TermPattern::from(rdf::NIL.into_owned()); for objWithPatterns in o.into_iter().rev() { let new_blank_node = TermPattern::from(BlankNode::default()); patterns.push(TriplePattern::new(new_blank_node.clone(), rdf::FIRST.into_owned(), objWithPatterns.focus.clone())); patterns.push(TriplePattern::new(new_blank_node.clone(), rdf::REST.into_owned(), current_list_node)); current_list_node = new_blank_node; patterns.extend_from_slice(&objWithPatterns.patterns); } FocusedTriplePattern { focus: current_list_node, patterns } } rule Collection_item() -> FocusedTriplePattern = o:GraphNode() _ { o } rule CollectionPath() -> FocusedTripleOrPathPattern = "(" _ o:CollectionPath_item()+ _ ")" { let mut patterns: Vec = Vec::new(); let mut current_list_node = TermPattern::from(rdf::NIL.into_owned()); for objWithPatterns in o.into_iter().rev() { let new_blank_node = TermPattern::from(BlankNode::default()); patterns.push(TriplePattern::new(new_blank_node.clone(), rdf::FIRST.into_owned(), objWithPatterns.focus.clone()).into()); patterns.push(TriplePattern::new(new_blank_node.clone(), rdf::REST.into_owned(), current_list_node).into()); current_list_node = new_blank_node; patterns.extend(objWithPatterns.patterns); } FocusedTripleOrPathPattern { focus: current_list_node, patterns } } rule CollectionPath_item() -> FocusedTripleOrPathPattern = p:GraphNodePath() _ { p } rule Annotation() -> FocusedTriplePattern)>> = "{|" _ a:PropertyListNotEmpty() _ "|}" { a } rule AnnotationPath() -> FocusedTripleOrPathPattern)>> = "{|" _ a: PropertyListPathNotEmpty() _ "|}" { a } rule GraphNode() -> FocusedTriplePattern = t:VarOrTerm() { FocusedTriplePattern::new(t) } / TriplesNode() rule GraphNodePath() -> FocusedTripleOrPathPattern = t:VarOrTerm() { FocusedTripleOrPathPattern::new(t) } / TriplesNodePath() rule VarOrTerm() -> TermPattern = v:Var() { v.into() } / t:QuotedTriple() {? #[cfg(feature = "rdf-star")]{Ok(t.into())} #[cfg(not(feature = "rdf-star"))]{Err("Embedded triples are only available in SPARQL-star")} } / t:GraphTerm() { t.into() } rule QuotedTriple() -> TriplePattern = "<<" _ s:VarOrTerm() _ p:Verb() _ o:VarOrTerm() _ ">>" {? Ok(TriplePattern { subject: s, predicate: p, object: o }) } rule QuotedTripleData() -> GroundTriple = "<<" _ s:DataValueTerm() _ p:QuotedTripleData_p() _ o:DataValueTerm() _ ">>" {? Ok(GroundTriple { subject: s.try_into().map_err(|()| "Literals are not allowed in subject position of nested patterns")?, predicate: p, object: o }) } rule QuotedTripleData_p() -> NamedNode = i: iri() { i } / "a" { rdf::TYPE.into() } rule DataValueTerm() -> GroundTerm = i:iri() { i.into() } / l:RDFLiteral() { l.into() } / l:NumericLiteral() { l.into() } / l:BooleanLiteral() { l.into() } / t:QuotedTripleData() {? #[cfg(feature = "rdf-star")]{Ok(t.into())} #[cfg(not(feature = "rdf-star"))]{Err("Embedded triples are only available in SPARQL-star")} } rule VarOrIri() -> NamedNodePattern = v:Var() { v.into() } / i:iri() { i.into() } rule Var() -> Variable = name:(VAR1() / VAR2()) { Variable::new_unchecked(name) } rule GraphTerm() -> Term = i:iri() { i.into() } / l:RDFLiteral() { l.into() } / l:NumericLiteral() { l.into() } / l:BooleanLiteral() { l.into() } / b:BlankNode() { b.into() } / NIL() { rdf::NIL.into_owned().into() } rule Expression() -> Expression = e:ConditionalOrExpression() {e} rule ConditionalOrExpression() -> Expression = e:ConditionalOrExpression_item() **<1,> ("||" _) {? not_empty_fold(e.into_iter(), |a, b| Expression::Or(Box::new(a), Box::new(b))) } rule ConditionalOrExpression_item() -> Expression = e:ConditionalAndExpression() _ { e } rule ConditionalAndExpression() -> Expression = e:ConditionalAndExpression_item() **<1,> ("&&" _) {? not_empty_fold(e.into_iter(), |a, b| Expression::And(Box::new(a), Box::new(b))) } rule ConditionalAndExpression_item() -> Expression = e:ValueLogical() _ { e } rule ValueLogical() -> Expression = RelationalExpression() rule RelationalExpression() -> Expression = a:NumericExpression() _ o: RelationalExpression_inner()? { match o { Some(("=", Some(b), None)) => Expression::Equal(Box::new(a), Box::new(b)), Some(("!=", Some(b), None)) => Expression::Not(Box::new(Expression::Equal(Box::new(a), Box::new(b)))), Some((">", Some(b), None)) => Expression::Greater(Box::new(a), Box::new(b)), Some((">=", Some(b), None)) => Expression::GreaterOrEqual(Box::new(a), Box::new(b)), Some(("<", Some(b), None)) => Expression::Less(Box::new(a), Box::new(b)), Some(("<=", Some(b), None)) => Expression::LessOrEqual(Box::new(a), Box::new(b)), Some(("IN", None, Some(l))) => Expression::In(Box::new(a), l), Some(("NOT IN", None, Some(l))) => Expression::Not(Box::new(Expression::In(Box::new(a), l))), Some(_) => unreachable!(), None => a } } rule RelationalExpression_inner() -> (&'input str, Option, Option>) = s: $("=" / "!=" / ">=" / ">" / "<=" / "<") _ e:NumericExpression() { (s, Some(e), None) } / i("IN") _ l:ExpressionList() { ("IN", None, Some(l)) } / i("NOT") _ i("IN") _ l:ExpressionList() { ("NOT IN", None, Some(l)) } rule NumericExpression() -> Expression = AdditiveExpression() rule AdditiveExpression() -> Expression = a:MultiplicativeExpression() _ o:AdditiveExpression_inner()? { match o { Some(("+", b)) => Expression::Add(Box::new(a), Box::new(b)), Some(("-", b)) => Expression::Subtract(Box::new(a), Box::new(b)), Some(_) => unreachable!(), None => a, } } rule AdditiveExpression_inner() -> (&'input str, Expression) = s: $("+" / "-") _ e:AdditiveExpression() { (s, e) } rule MultiplicativeExpression() -> Expression = a:UnaryExpression() _ o: MultiplicativeExpression_inner()? { match o { Some(("*", b)) => Expression::Multiply(Box::new(a), Box::new(b)), Some(("/", b)) => Expression::Divide(Box::new(a), Box::new(b)), Some(_) => unreachable!(), None => a } } rule MultiplicativeExpression_inner() -> (&'input str, Expression) = s: $("*" / "/") _ e:MultiplicativeExpression() { (s, e) } rule UnaryExpression() -> Expression = s: $("!" / "+" / "-")? _ e:PrimaryExpression() { match s { Some("!") => Expression::Not(Box::new(e)), Some("+") => Expression::UnaryPlus(Box::new(e)), Some("-") => Expression::UnaryMinus(Box::new(e)), Some(_) => unreachable!(), None => e, } } rule PrimaryExpression() -> Expression = BrackettedExpression() / ExprQuotedTriple() / iriOrFunction() / v:Var() { v.into() } / l:RDFLiteral() { l.into() } / l:NumericLiteral() { l.into() } / l:BooleanLiteral() { l.into() } / BuiltInCall() rule ExprVarOrTerm() -> Expression = ExprQuotedTriple() / i:iri() { i.into() } / l:RDFLiteral() { l.into() } / l:NumericLiteral() { l.into() } / l:BooleanLiteral() { l.into() } / v:Var() { v.into() } rule ExprQuotedTriple() -> Expression = "<<" _ s:ExprVarOrTerm() _ p:Verb() _ o:ExprVarOrTerm() _ ">>" {? #[cfg(feature = "rdf-star")]{Ok(Expression::FunctionCall(Function::Triple, vec![s, p.into(), o]))} #[cfg(not(feature = "rdf-star"))]{Err("Embedded triples are only available in SPARQL-star")} } rule BrackettedExpression() -> Expression = "(" _ e:Expression() _ ")" { e } rule BuiltInCall() -> Expression = a:Aggregate() {? state.new_aggregation(a).map(Into::into) } / i("STR") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Str, vec![e]) } / i("LANG") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Lang, vec![e]) } / i("LANGMATCHES") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::LangMatches, vec![a, b]) } / i("DATATYPE") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Datatype, vec![e]) } / i("BOUND") _ "(" _ v:Var() _ ")" { Expression::Bound(v) } / (i("IRI") / i("URI")) _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Iri, vec![e]) } / i("BNODE") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::BNode, vec![e]) } / i("BNODE") NIL() { Expression::FunctionCall(Function::BNode, vec![]) } / i("RAND") _ NIL() { Expression::FunctionCall(Function::Rand, vec![]) } / i("ABS") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Abs, vec![e]) } / i("CEIL") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Ceil, vec![e]) } / i("FLOOR") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Floor, vec![e]) } / i("ROUND") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Round, vec![e]) } / i("CONCAT") e:ExpressionList() { Expression::FunctionCall(Function::Concat, e) } / SubstringExpression() / i("STRLEN") _ "(" _ e: Expression() _ ")" { Expression::FunctionCall(Function::StrLen, vec![e]) } / StrReplaceExpression() / i("UCASE") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::UCase, vec![e]) } / i("LCASE") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::LCase, vec![e]) } / i("ENCODE_FOR_URI") "(" _ e: Expression() _ ")" { Expression::FunctionCall(Function::EncodeForUri, vec![e]) } / i("CONTAINS") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::Contains, vec![a, b]) } / i("STRSTARTS") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::StrStarts, vec![a, b]) } / i("STRENDS") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::StrEnds, vec![a, b]) } / i("STRBEFORE") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::StrBefore, vec![a, b]) } / i("STRAFTER") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::StrAfter, vec![a, b]) } / i("YEAR") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Year, vec![e]) } / i("MONTH") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Month, vec![e]) } / i("DAY") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Day, vec![e]) } / i("HOURS") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Hours, vec![e]) } / i("MINUTES") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Minutes, vec![e]) } / i("SECONDS") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Seconds, vec![e]) } / i("TIMEZONE") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Timezone, vec![e]) } / i("TZ") _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Tz, vec![e]) } / i("NOW") _ NIL() { Expression::FunctionCall(Function::Now, vec![]) } / i("UUID") _ NIL() { Expression::FunctionCall(Function::Uuid, vec![]) }/ i("STRUUID") _ NIL() { Expression::FunctionCall(Function::StrUuid, vec![]) } / i("MD5") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Md5, vec![e]) } / i("SHA1") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Sha1, vec![e]) } / i("SHA256") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Sha256, vec![e]) } / i("SHA384") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Sha384, vec![e]) } / i("SHA512") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::Sha512, vec![e]) } / i("COALESCE") e:ExpressionList() { Expression::Coalesce(e) } / i("IF") _ "(" _ a:Expression() _ "," _ b:Expression() _ "," _ c:Expression() _ ")" { Expression::If(Box::new(a), Box::new(b), Box::new(c)) } / i("STRLANG") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::StrLang, vec![a, b]) } / i("STRDT") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::StrDt, vec![a, b]) } / i("sameTerm") "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::SameTerm(Box::new(a), Box::new(b)) } / (i("isIRI") / i("isURI")) _ "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::IsIri, vec![e]) } / i("isBLANK") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::IsBlank, vec![e]) } / i("isLITERAL") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::IsLiteral, vec![e]) } / i("isNUMERIC") "(" _ e:Expression() _ ")" { Expression::FunctionCall(Function::IsNumeric, vec![e]) } / RegexExpression() / ExistsFunc() / NotExistsFunc() / i("TRIPLE") "(" _ s:Expression() _ "," _ p:Expression() "," _ o:Expression() ")" {? #[cfg(feature = "rdf-star")]{Ok(Expression::FunctionCall(Function::Triple, vec![s, p, o]))} #[cfg(not(feature = "rdf-star"))]{Err("The TRIPLE function is only available in SPARQL-star")} } / i("SUBJECT") "(" _ e:Expression() _ ")" {? #[cfg(feature = "rdf-star")]{Ok(Expression::FunctionCall(Function::Subject, vec![e]))} #[cfg(not(feature = "rdf-star"))]{Err("The SUBJECT function is only available in SPARQL-star")} } / i("PREDICATE") "(" _ e:Expression() _ ")" {? #[cfg(feature = "rdf-star")]{Ok(Expression::FunctionCall(Function::Predicate, vec![e]))} #[cfg(not(feature = "rdf-star"))]{Err("The PREDICATE function is only available in SPARQL-star")} } / i("OBJECT") "(" _ e:Expression() _ ")" {? #[cfg(feature = "rdf-star")]{Ok(Expression::FunctionCall(Function::Object, vec![e]))} #[cfg(not(feature = "rdf-star"))]{Err("The OBJECT function is only available in SPARQL-star")} } / i("isTriple") "(" _ e:Expression() _ ")" {? #[cfg(feature = "rdf-star")]{Ok(Expression::FunctionCall(Function::IsTriple, vec![e]))} #[cfg(not(feature = "rdf-star"))]{Err("The isTriple function is only available in SPARQL-star")} } / i("ADJUST") "(" _ a:Expression() _ "," _ b:Expression() _ ")" {? #[cfg(feature = "sep-0002")]{Ok(Expression::FunctionCall(Function::Adjust, vec![a, b]))} #[cfg(not(feature = "sep-0002"))]{Err("The ADJUST function is only available in SPARQL 1.2 SEP 0002")} } rule RegexExpression() -> Expression = i("REGEX") _ "(" _ a:Expression() _ "," _ b:Expression() _ "," _ c:Expression() _ ")" { Expression::FunctionCall(Function::Regex, vec![a, b, c]) } / i("REGEX") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::Regex, vec![a, b]) } rule SubstringExpression() -> Expression = i("SUBSTR") _ "(" _ a:Expression() _ "," _ b:Expression() _ "," _ c:Expression() _ ")" { Expression::FunctionCall(Function::SubStr, vec![a, b, c]) } / i("SUBSTR") _ "(" _ a:Expression() _ "," _ b:Expression() _ ")" { Expression::FunctionCall(Function::SubStr, vec![a, b]) } rule StrReplaceExpression() -> Expression = i("REPLACE") _ "(" _ a:Expression() _ "," _ b:Expression() _ "," _ c:Expression() _ "," _ d:Expression() _ ")" { Expression::FunctionCall(Function::Replace, vec![a, b, c, d]) } / i("REPLACE") _ "(" _ a:Expression() _ "," _ b:Expression() _ "," _ c:Expression() _ ")" { Expression::FunctionCall(Function::Replace, vec![a, b, c]) } rule ExistsFunc() -> Expression = i("EXISTS") _ p:GroupGraphPattern() { Expression::Exists(Box::new(p)) } rule NotExistsFunc() -> Expression = i("NOT") _ i("EXISTS") _ p:GroupGraphPattern() { Expression::Not(Box::new(Expression::Exists(Box::new(p)))) } rule Aggregate() -> AggregateExpression = i("COUNT") _ "(" _ i("DISTINCT") _ "*" _ ")" { AggregateExpression::CountSolutions { distinct: true } } / i("COUNT") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Count, expr, distinct: true } } / i("COUNT") _ "(" _ "*" _ ")" { AggregateExpression::CountSolutions { distinct: false } } / i("COUNT") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Count, expr, distinct: false } } / i("SUM") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Sum, expr, distinct: true } } / i("SUM") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Sum, expr, distinct: false } } / i("MIN") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Min, expr, distinct: true } } / i("MIN") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Min, expr, distinct: false } } / i("MAX") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Max, expr, distinct: true } } / i("MAX") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Max, expr, distinct: false } } / i("AVG") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Avg, expr, distinct: true } } / i("AVG") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Avg, expr, distinct: false } } / i("SAMPLE") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Sample, expr, distinct: true } } / i("SAMPLE") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Sample, expr, distinct: false } } / i("GROUP_CONCAT") _ "(" _ i("DISTINCT") _ expr:Expression() _ ";" _ i("SEPARATOR") _ "=" _ s:String() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::GroupConcat { separator: Some(s) }, expr, distinct: true } } / i("GROUP_CONCAT") _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::GroupConcat { separator: None }, expr, distinct: true } } / i("GROUP_CONCAT") _ "(" _ expr:Expression() _ ";" _ i("SEPARATOR") _ "=" _ s:String() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::GroupConcat { separator: Some(s) }, expr, distinct: true } } / i("GROUP_CONCAT") _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::GroupConcat { separator: None }, expr, distinct: false } } / name:iri() _ "(" _ i("DISTINCT") _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Custom(name), expr, distinct: true } } / name:iri() _ "(" _ expr:Expression() _ ")" { AggregateExpression::FunctionCall { name: AggregateFunction::Custom(name), expr, distinct: false } } rule iriOrFunction() -> Expression = i: iri() _ a: ArgList()? { match a { Some(a) => Expression::FunctionCall(Function::Custom(i), a), None => i.into() } } rule RDFLiteral() -> Literal = value:String() _ "^^" _ datatype:iri() { Literal::new_typed_literal(value, datatype) } / value:String() _ language:LANGTAG() { Literal::new_language_tagged_literal_unchecked(value, language.into_inner()) } / value:String() { Literal::new_simple_literal(value) } rule NumericLiteral() -> Literal = NumericLiteralUnsigned() / NumericLiteralPositive() / NumericLiteralNegative() rule NumericLiteralUnsigned() -> Literal = d:$(DOUBLE()) { Literal::new_typed_literal(d, xsd::DOUBLE) } / d:$(DECIMAL()) { Literal::new_typed_literal(d, xsd::DECIMAL) } / i:$(INTEGER()) { Literal::new_typed_literal(i, xsd::INTEGER) } rule NumericLiteralPositive() -> Literal = d:$(DOUBLE_POSITIVE()) { Literal::new_typed_literal(d, xsd::DOUBLE) } / d:$(DECIMAL_POSITIVE()) { Literal::new_typed_literal(d, xsd::DECIMAL) } / i:$(INTEGER_POSITIVE()) { Literal::new_typed_literal(i, xsd::INTEGER) } rule NumericLiteralNegative() -> Literal = d:$(DOUBLE_NEGATIVE()) { Literal::new_typed_literal(d, xsd::DOUBLE) } / d:$(DECIMAL_NEGATIVE()) { Literal::new_typed_literal(d, xsd::DECIMAL) } / i:$(INTEGER_NEGATIVE()) { Literal::new_typed_literal(i, xsd::INTEGER) } rule BooleanLiteral() -> Literal = "true" { Literal::new_typed_literal("true", xsd::BOOLEAN) } / "false" { Literal::new_typed_literal("false", xsd::BOOLEAN) } rule String() -> String = STRING_LITERAL_LONG1() / STRING_LITERAL_LONG2() / STRING_LITERAL1() / STRING_LITERAL2() rule iri() -> NamedNode = i:(IRIREF() / PrefixedName()) { NamedNode::from(i) } rule PrefixedName() -> Iri = PNAME_LN() / ns:PNAME_NS() {? if let Some(iri) = state.namespaces.get(ns).cloned() { Iri::parse(iri).map_err(|_| "IRI parsing failed") } else { Err("Prefix not found") } } rule BlankNode() -> BlankNode = id:BLANK_NODE_LABEL() {? let node = BlankNode::new_unchecked(id); if state.used_bnodes.contains(&node) { Err("Already used blank node id") } else { state.currently_used_bnodes.insert(node.clone()); Ok(node) } } / ANON() { BlankNode::default() } rule IRIREF() -> Iri = "<" i:$((!['>'] [_])*) ">" {? state.parse_iri(unescape_iriref(i)?).map_err(|_| "IRI parsing failed") } rule PNAME_NS() -> &'input str = ns:$(PN_PREFIX()?) ":" { ns } rule PNAME_LN() -> Iri = ns:PNAME_NS() local:$(PN_LOCAL()) {? if let Some(base) = state.namespaces.get(ns) { let mut iri = String::with_capacity(base.len() + local.len()); iri.push_str(base); for chunk in local.split('\\') { // We remove \ iri.push_str(chunk); } Iri::parse(iri).map_err(|_| "IRI parsing failed") } else { Err("Prefix not found") } } rule BLANK_NODE_LABEL() -> &'input str = "_:" b:$((['0'..='9'] / PN_CHARS_U()) PN_CHARS()* ("."+ PN_CHARS()+)*) { b } rule VAR1() -> &'input str = "?" v:$(VARNAME()) { v } rule VAR2() -> &'input str = "$" v:$(VARNAME()) { v } rule LANGTAG() -> LanguageTag = "@" l:$(['a' ..= 'z' | 'A' ..= 'Z']+ ("-" ['a' ..= 'z' | 'A' ..= 'Z' | '0' ..= '9']+)*) {? LanguageTag::parse(l.to_ascii_lowercase()).map_err(|_| "language tag parsing failed") } rule INTEGER() = ['0'..='9']+ rule DECIMAL() = ['0'..='9']* "." ['0'..='9']+ rule DOUBLE() = (['0'..='9']+ "." ['0'..='9']* / "." ['0'..='9']+ / ['0'..='9']+) EXPONENT() rule INTEGER_POSITIVE() = "+" _ INTEGER() rule DECIMAL_POSITIVE() = "+" _ DECIMAL() rule DOUBLE_POSITIVE() = "+" _ DOUBLE() rule INTEGER_NEGATIVE() = "-" _ INTEGER() rule DECIMAL_NEGATIVE() = "-" _ DECIMAL() rule DOUBLE_NEGATIVE() = "-" _ DOUBLE() rule EXPONENT() = ['e' | 'E'] ['+' | '-']? ['0'..='9']+ rule STRING_LITERAL1() -> String = "'" l:$((STRING_LITERAL1_simple_char() / ECHAR() / UCHAR())*) "'" {? unescape_string(l) } rule STRING_LITERAL1_simple_char() = !['\u{27}' | '\u{5C}' | '\u{A}' | '\u{D}'] [_] rule STRING_LITERAL2() -> String = "\"" l:$((STRING_LITERAL2_simple_char() / ECHAR() / UCHAR())*) "\"" {? unescape_string(l) } rule STRING_LITERAL2_simple_char() = !['\u{22}' | '\u{5C}' | '\u{A}' | '\u{D}'] [_] rule STRING_LITERAL_LONG1() -> String = "'''" l:$(STRING_LITERAL_LONG1_inner()*) "'''" {? unescape_string(l) } rule STRING_LITERAL_LONG1_inner() = ("''" / "'")? (STRING_LITERAL_LONG1_simple_char() / ECHAR() / UCHAR()) rule STRING_LITERAL_LONG1_simple_char() = !['\'' | '\\'] [_] rule STRING_LITERAL_LONG2() -> String = "\"\"\"" l:$(STRING_LITERAL_LONG2_inner()*) "\"\"\"" {? unescape_string(l) } rule STRING_LITERAL_LONG2_inner() = ("\"\"" / "\"")? (STRING_LITERAL_LONG2_simple_char() / ECHAR() / UCHAR()) rule STRING_LITERAL_LONG2_simple_char() = !['"' | '\\'] [_] rule UCHAR() = "\\u" HEX() HEX() HEX() HEX() / "\\U" HEX() HEX() HEX() HEX() HEX() HEX() HEX() HEX() rule ECHAR() = "\\" ['t' | 'b' | 'n' | 'r' | 'f' | '"' |'\'' | '\\'] rule NIL() = "(" WS()* ")" rule WS() = quiet! { ['\u{20}' | '\u{9}' | '\u{D}' | '\u{A}'] } rule ANON() = "[" WS()* "]" rule PN_CHARS_BASE() = ['A' ..= 'Z' | 'a' ..= 'z' | '\u{00C0}'..='\u{00D6}' | '\u{00D8}'..='\u{00F6}' | '\u{00F8}'..='\u{02FF}' | '\u{0370}'..='\u{037D}' | '\u{037F}'..='\u{1FFF}' | '\u{200C}'..='\u{200D}' | '\u{2070}'..='\u{218F}' | '\u{2C00}'..='\u{2FEF}' | '\u{3001}'..='\u{D7FF}' | '\u{F900}'..='\u{FDCF}' | '\u{FDF0}'..='\u{FFFD}'] rule PN_CHARS_U() = ['_'] / PN_CHARS_BASE() rule VARNAME() = (['0'..='9'] / PN_CHARS_U()) (['0' ..= '9' | '\u{00B7}' | '\u{0300}'..='\u{036F}' | '\u{203F}'..='\u{2040}'] / PN_CHARS_U())* rule PN_CHARS() = ['-' | '0' ..= '9' | '\u{00B7}' | '\u{0300}'..='\u{036F}' | '\u{203F}'..='\u{2040}'] / PN_CHARS_U() rule PN_PREFIX() = PN_CHARS_BASE() PN_CHARS()* ("."+ PN_CHARS()+)* rule PN_LOCAL() = (PN_CHARS_U() / [':' | '0'..='9'] / PLX()) (PN_CHARS() / [':'] / PLX())* (['.']+ (PN_CHARS() / [':'] / PLX())+)? rule PLX() = PERCENT() / PN_LOCAL_ESC() rule PERCENT() = ['%'] HEX() HEX() rule HEX() = ['0' ..= '9' | 'A' ..= 'F' | 'a' ..= 'f'] rule PN_LOCAL_ESC() = ['\\'] ['_' | '~' | '.' | '-' | '!' | '$' | '&' | '\'' | '(' | ')' | '*' | '+' | ',' | ';' | '=' | '/' | '?' | '#' | '@' | '%'] //TODO: added '/' to make tests pass but is it valid? //space rule _() = quiet! { ([' ' | '\t' | '\n' | '\r'] / comment())* } //comment rule comment() = quiet! { ['#'] (!['\r' | '\n'] [_])* } rule i(literal: &'static str) = input: $([_]*<{literal.len()}>) {? if input.eq_ignore_ascii_case(literal) { Ok(()) } else { Err(literal) } } } }