//! [SPARQL 1.1 Query Algebra](https://www.w3.org/TR/sparql11-query/#sparqlQuery) representation. use crate::term::*; use oxrdf::LiteralRef; use std::fmt; /// A [property path expression](https://www.w3.org/TR/sparql11-query/#defn_PropertyPathExpr). #[derive(Eq, PartialEq, Debug, Clone, Hash)] pub enum PropertyPathExpression { NamedNode(NamedNode), Reverse(Box), Sequence(Box, Box), Alternative(Box, Box), ZeroOrMore(Box), OneOrMore(Box), ZeroOrOne(Box), NegatedPropertySet(Vec), } impl PropertyPathExpression { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::NamedNode(p) => write!(f, "{p}"), Self::Reverse(p) => { f.write_str("(reverse ")?; p.fmt_sse(f)?; f.write_str(")") } Self::Alternative(a, b) => { f.write_str("(alt ")?; a.fmt_sse(f)?; f.write_str(" ")?; b.fmt_sse(f)?; f.write_str(")") } Self::Sequence(a, b) => { f.write_str("(seq ")?; a.fmt_sse(f)?; f.write_str(" ")?; b.fmt_sse(f)?; f.write_str(")") } Self::ZeroOrMore(p) => { f.write_str("(path* ")?; p.fmt_sse(f)?; f.write_str(")") } Self::OneOrMore(p) => { f.write_str("(path+ ")?; p.fmt_sse(f)?; f.write_str(")") } Self::ZeroOrOne(p) => { f.write_str("(path? ")?; p.fmt_sse(f)?; f.write_str(")") } Self::NegatedPropertySet(p) => { f.write_str("(notoneof")?; for p in p { write!(f, " {p}")?; } f.write_str(")") } } } } impl fmt::Display for PropertyPathExpression { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { match self { Self::NamedNode(p) => p.fmt(f), Self::Reverse(p) => write!(f, "^({p})"), Self::Sequence(a, b) => write!(f, "({a} / {b})"), Self::Alternative(a, b) => write!(f, "({a} | {b})"), Self::ZeroOrMore(p) => write!(f, "({p})*"), Self::OneOrMore(p) => write!(f, "({p})+"), Self::ZeroOrOne(p) => write!(f, "({p})?"), Self::NegatedPropertySet(p) => { f.write_str("!(")?; for (i, c) in p.iter().enumerate() { if i > 0 { f.write_str(" | ")?; } write!(f, "{c}")?; } f.write_str(")") } } } } /// The `display(with = ...)` will not work until this PR lands: /// https://github.com/frozenlib/parse-display/issues/36#issuecomment-1925367731 /// #[cfg(skip)] #[derive(Eq, PartialEq, Debug, Clone, Hash, parse_display::Display)] pub enum PropertyPathExpression { #[display("{0}")] NamedNode(NamedNode), #[display("^({0})")] Reverse(Box), #[display("({0} / {1})")] Sequence(Box, Box), #[display("({0} | {1})")] Alternative(Box, Box), #[display("({0})*")] ZeroOrMore(Box), #[display("({0})+")] OneOrMore(Box), #[display("({0})?")] ZeroOrOne(Box), #[display("!({0})")] NegatedPropertySet(#[display(with = delimiter(" | "))] Vec), } impl From for PropertyPathExpression { fn from(p: NamedNode) -> Self { Self::NamedNode(p) } } /// An [expression](https://www.w3.org/TR/sparql11-query/#expressions). #[derive(Eq, PartialEq, Debug, Clone, Hash)] pub enum Expression { NamedNode(NamedNode), Literal(Literal), Variable(Variable), /// [Logical-or](https://www.w3.org/TR/sparql11-query/#func-logical-or). Or(Box, Box), /// [Logical-and](https://www.w3.org/TR/sparql11-query/#func-logical-and). And(Box, Box), /// [RDFterm-equal](https://www.w3.org/TR/sparql11-query/#func-RDFterm-equal) and all the XSD equalities. Equal(Box, Box), /// [sameTerm](https://www.w3.org/TR/sparql11-query/#func-sameTerm). SameTerm(Box, Box), /// [op:numeric-greater-than](https://www.w3.org/TR/xpath-functions-31/#func-numeric-greater-than) and other XSD greater than operators. Greater(Box, Box), GreaterOrEqual(Box, Box), /// [op:numeric-less-than](https://www.w3.org/TR/xpath-functions-31/#func-numeric-less-than) and other XSD greater than operators. Less(Box, Box), LessOrEqual(Box, Box), /// [IN](https://www.w3.org/TR/sparql11-query/#func-in) In(Box, Vec), /// [op:numeric-add](https://www.w3.org/TR/xpath-functions-31/#func-numeric-add) and other XSD additions. Add(Box, Box), /// [op:numeric-subtract](https://www.w3.org/TR/xpath-functions-31/#func-numeric-subtract) and other XSD subtractions. Subtract(Box, Box), /// [op:numeric-multiply](https://www.w3.org/TR/xpath-functions-31/#func-numeric-multiply) and other XSD multiplications. Multiply(Box, Box), /// [op:numeric-divide](https://www.w3.org/TR/xpath-functions-31/#func-numeric-divide) and other XSD divides. Divide(Box, Box), /// [op:numeric-unary-plus](https://www.w3.org/TR/xpath-functions-31/#func-numeric-unary-plus) and other XSD unary plus. UnaryPlus(Box), /// [op:numeric-unary-minus](https://www.w3.org/TR/xpath-functions-31/#func-numeric-unary-minus) and other XSD unary minus. UnaryMinus(Box), /// [fn:not](https://www.w3.org/TR/xpath-functions-31/#func-not). Not(Box), /// [EXISTS](https://www.w3.org/TR/sparql11-query/#func-filter-exists). Exists(Box), /// [BOUND](https://www.w3.org/TR/sparql11-query/#func-bound). Bound(Variable), /// [IF](https://www.w3.org/TR/sparql11-query/#func-if). If(Box, Box, Box), /// [COALESCE](https://www.w3.org/TR/sparql11-query/#func-coalesce). Coalesce(Vec), /// A regular function call. FunctionCall(Function, Vec), } impl Expression { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::NamedNode(node) => write!(f, "{node}"), Self::Literal(l) => write!(f, "{l}"), Self::Variable(var) => write!(f, "{var}"), Self::Or(a, b) => fmt_sse_binary_expression(f, "||", a, b), Self::And(a, b) => fmt_sse_binary_expression(f, "&&", a, b), Self::Equal(a, b) => fmt_sse_binary_expression(f, "=", a, b), Self::SameTerm(a, b) => fmt_sse_binary_expression(f, "sameTerm", a, b), Self::Greater(a, b) => fmt_sse_binary_expression(f, ">", a, b), Self::GreaterOrEqual(a, b) => fmt_sse_binary_expression(f, ">=", a, b), Self::Less(a, b) => fmt_sse_binary_expression(f, "<", a, b), Self::LessOrEqual(a, b) => fmt_sse_binary_expression(f, "<=", a, b), Self::In(a, b) => { f.write_str("(in ")?; a.fmt_sse(f)?; for p in b { f.write_str(" ")?; p.fmt_sse(f)?; } f.write_str(")") } Self::Add(a, b) => fmt_sse_binary_expression(f, "+", a, b), Self::Subtract(a, b) => fmt_sse_binary_expression(f, "-", a, b), Self::Multiply(a, b) => fmt_sse_binary_expression(f, "*", a, b), Self::Divide(a, b) => fmt_sse_binary_expression(f, "/", a, b), Self::UnaryPlus(e) => fmt_sse_unary_expression(f, "+", e), Self::UnaryMinus(e) => fmt_sse_unary_expression(f, "-", e), Self::Not(e) => fmt_sse_unary_expression(f, "!", e), Self::FunctionCall(function, parameters) => { f.write_str("( ")?; function.fmt_sse(f)?; for p in parameters { f.write_str(" ")?; p.fmt_sse(f)?; } f.write_str(")") } Self::Exists(p) => { f.write_str("(exists ")?; p.fmt_sse(f)?; f.write_str(")") } Self::Bound(v) => { write!(f, "(bound {v})") } Self::If(a, b, c) => { f.write_str("(if ")?; a.fmt_sse(f)?; f.write_str(" ")?; b.fmt_sse(f)?; f.write_str(" ")?; c.fmt_sse(f)?; f.write_str(")") } Self::Coalesce(parameters) => { f.write_str("(coalesce")?; for p in parameters { f.write_str(" ")?; p.fmt_sse(f)?; } f.write_str(")") } } } } impl fmt::Display for Expression { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { match self { Self::NamedNode(node) => node.fmt(f), Self::Literal(l) => l.fmt(f), Self::Variable(var) => var.fmt(f), Self::Or(a, b) => write!(f, "({a} || {b})"), Self::And(a, b) => write!(f, "({a} && {b})"), Self::Equal(a, b) => { write!(f, "({a} = {b})") } Self::SameTerm(a, b) => { write!(f, "sameTerm({a}, {b})") } Self::Greater(a, b) => { write!(f, "({a} > {b})") } Self::GreaterOrEqual(a, b) => write!(f, "({a} >= {b})"), Self::Less(a, b) => { write!(f, "({a} < {b})") } Self::LessOrEqual(a, b) => write!(f, "({a} <= {b})"), Self::In(a, b) => { write!(f, "({a} IN ")?; write_arg_list(b, f)?; f.write_str(")") } Self::Add(a, b) => { write!(f, "{a} + {b}") } Self::Subtract(a, b) => { write!(f, "{a} - {b}") } Self::Multiply(a, b) => { write!(f, "{a} * {b}") } Self::Divide(a, b) => { write!(f, "{a} / {b}") } Self::UnaryPlus(e) => write!(f, "+{e}"), Self::UnaryMinus(e) => write!(f, "-{e}"), Self::Not(e) => match e.as_ref() { Self::Exists(p) => write!(f, "NOT EXISTS {{ {p} }}"), e => write!(f, "!{e}"), }, Self::FunctionCall(function, parameters) => { write!(f, "{function}")?; write_arg_list(parameters, f) } Self::Bound(v) => write!(f, "BOUND({v})"), Self::Exists(p) => write!(f, "EXISTS {{ {p} }}"), Self::If(a, b, c) => write!(f, "IF({a}, {b}, {c})"), Self::Coalesce(parameters) => { f.write_str("COALESCE")?; write_arg_list(parameters, f) } } } } impl From for Expression { fn from(p: NamedNode) -> Self { Self::NamedNode(p) } } impl From for Expression { fn from(p: Literal) -> Self { Self::Literal(p) } } impl From for Expression { fn from(v: Variable) -> Self { Self::Variable(v) } } impl From for Expression { fn from(p: NamedNodePattern) -> Self { match p { NamedNodePattern::NamedNode(p) => p.into(), NamedNodePattern::Variable(p) => p.into(), } } } fn write_arg_list( params: impl IntoIterator, f: &mut fmt::Formatter<'_>, ) -> fmt::Result { f.write_str("(")?; let mut cont = false; for p in params { if cont { f.write_str(", ")?; } p.fmt(f)?; cont = true; } f.write_str(")") } /// A function name. #[derive(Eq, PartialEq, Debug, Clone, Hash, parse_display::Display)] #[display(style = "UPPERCASE")] pub enum Function { Str, Lang, LangMatches, Datatype, Iri, BNode, Rand, Abs, Ceil, Floor, Round, Concat, SubStr, StrLen, Replace, UCase, LCase, #[display("ENCODE_FOR_URI")] EncodeForUri, Contains, StrStarts, StrEnds, StrBefore, StrAfter, Year, Month, Day, Hours, Minutes, Seconds, Timezone, Tz, Now, Uuid, StrUuid, Md5, Sha1, Sha256, Sha384, Sha512, StrLang, StrDt, #[display("isIRI")] IsIri, #[display("isBLANK")] IsBlank, #[display("isLITERAL")] IsLiteral, #[display("isNUMERIC")] IsNumeric, Regex, #[cfg(feature = "rdf-star")] Triple, #[cfg(feature = "rdf-star")] Subject, #[cfg(feature = "rdf-star")] Predicate, #[cfg(feature = "rdf-star")] Object, #[cfg(feature = "rdf-star")] #[display("isTRIPLE")] IsTriple, #[cfg(feature = "sep-0002")] Adjust, #[display("{0}")] Custom(NamedNode), } impl Function { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::Str => f.write_str("str"), Self::Lang => f.write_str("lang"), Self::LangMatches => f.write_str("langmatches"), Self::Datatype => f.write_str("datatype"), Self::Iri => f.write_str("iri"), Self::BNode => f.write_str("bnode"), Self::Rand => f.write_str("rand"), Self::Abs => f.write_str("abs"), Self::Ceil => f.write_str("ceil"), Self::Floor => f.write_str("floor"), Self::Round => f.write_str("round"), Self::Concat => f.write_str("concat"), Self::SubStr => f.write_str("substr"), Self::StrLen => f.write_str("strlen"), Self::Replace => f.write_str("replace"), Self::UCase => f.write_str("ucase"), Self::LCase => f.write_str("lcase"), Self::EncodeForUri => f.write_str("encode_for_uri"), Self::Contains => f.write_str("contains"), Self::StrStarts => f.write_str("strstarts"), Self::StrEnds => f.write_str("strends"), Self::StrBefore => f.write_str("strbefore"), Self::StrAfter => f.write_str("strafter"), Self::Year => f.write_str("year"), Self::Month => f.write_str("month"), Self::Day => f.write_str("day"), Self::Hours => f.write_str("hours"), Self::Minutes => f.write_str("minutes"), Self::Seconds => f.write_str("seconds"), Self::Timezone => f.write_str("timezone"), Self::Tz => f.write_str("tz"), Self::Now => f.write_str("now"), Self::Uuid => f.write_str("uuid"), Self::StrUuid => f.write_str("struuid"), Self::Md5 => f.write_str("md5"), Self::Sha1 => f.write_str("sha1"), Self::Sha256 => f.write_str("sha256"), Self::Sha384 => f.write_str("sha384"), Self::Sha512 => f.write_str("sha512"), Self::StrLang => f.write_str("strlang"), Self::StrDt => f.write_str("strdt"), Self::IsIri => f.write_str("isiri"), Self::IsBlank => f.write_str("isblank"), Self::IsLiteral => f.write_str("isliteral"), Self::IsNumeric => f.write_str("isnumeric"), Self::Regex => f.write_str("regex"), #[cfg(feature = "rdf-star")] Self::Triple => f.write_str("triple"), #[cfg(feature = "rdf-star")] Self::Subject => f.write_str("subject"), #[cfg(feature = "rdf-star")] Self::Predicate => f.write_str("predicate"), #[cfg(feature = "rdf-star")] Self::Object => f.write_str("object"), #[cfg(feature = "rdf-star")] Self::IsTriple => f.write_str("istriple"), #[cfg(feature = "sep-0002")] Self::Adjust => f.write_str("adjust"), Self::Custom(iri) => write!(f, "{iri}"), } } } #[cfg(test)] mod test_func { use super::*; #[test] fn display() { // This is a temporary migration test - we can remove most of these before merging assert_eq!(Function::Str.to_string(), "STR"); assert_eq!(Function::Lang.to_string(), "LANG"); assert_eq!(Function::LangMatches.to_string(), "LANGMATCHES"); assert_eq!(Function::Datatype.to_string(), "DATATYPE"); assert_eq!(Function::Iri.to_string(), "IRI"); assert_eq!(Function::BNode.to_string(), "BNODE"); assert_eq!(Function::Rand.to_string(), "RAND"); assert_eq!(Function::Abs.to_string(), "ABS"); assert_eq!(Function::Ceil.to_string(), "CEIL"); assert_eq!(Function::Floor.to_string(), "FLOOR"); assert_eq!(Function::Round.to_string(), "ROUND"); assert_eq!(Function::Concat.to_string(), "CONCAT"); assert_eq!(Function::SubStr.to_string(), "SUBSTR"); assert_eq!(Function::StrLen.to_string(), "STRLEN"); assert_eq!(Function::Replace.to_string(), "REPLACE"); assert_eq!(Function::UCase.to_string(), "UCASE"); assert_eq!(Function::LCase.to_string(), "LCASE"); assert_eq!(Function::EncodeForUri.to_string(), "ENCODE_FOR_URI"); assert_eq!(Function::Contains.to_string(), "CONTAINS"); assert_eq!(Function::StrStarts.to_string(), "STRSTARTS"); assert_eq!(Function::StrEnds.to_string(), "STRENDS"); assert_eq!(Function::StrBefore.to_string(), "STRBEFORE"); assert_eq!(Function::StrAfter.to_string(), "STRAFTER"); assert_eq!(Function::Year.to_string(), "YEAR"); assert_eq!(Function::Month.to_string(), "MONTH"); assert_eq!(Function::Day.to_string(), "DAY"); assert_eq!(Function::Hours.to_string(), "HOURS"); assert_eq!(Function::Minutes.to_string(), "MINUTES"); assert_eq!(Function::Seconds.to_string(), "SECONDS"); assert_eq!(Function::Timezone.to_string(), "TIMEZONE"); assert_eq!(Function::Tz.to_string(), "TZ"); assert_eq!(Function::Now.to_string(), "NOW"); assert_eq!(Function::Uuid.to_string(), "UUID"); assert_eq!(Function::StrUuid.to_string(), "STRUUID"); assert_eq!(Function::Md5.to_string(), "MD5"); assert_eq!(Function::Sha1.to_string(), "SHA1"); assert_eq!(Function::Sha256.to_string(), "SHA256"); assert_eq!(Function::Sha384.to_string(), "SHA384"); assert_eq!(Function::Sha512.to_string(), "SHA512"); assert_eq!(Function::StrLang.to_string(), "STRLANG"); assert_eq!(Function::StrDt.to_string(), "STRDT"); assert_eq!(Function::IsIri.to_string(), "isIRI"); assert_eq!(Function::IsBlank.to_string(), "isBLANK"); assert_eq!(Function::IsLiteral.to_string(), "isLITERAL"); assert_eq!(Function::IsNumeric.to_string(), "isNUMERIC"); assert_eq!(Function::Regex.to_string(), "REGEX"); #[cfg(feature = "rdf-star")] assert_eq!(Function::Triple.to_string(), "TRIPLE"); #[cfg(feature = "rdf-star")] assert_eq!(Function::Subject.to_string(), "SUBJECT"); #[cfg(feature = "rdf-star")] assert_eq!(Function::Predicate.to_string(), "PREDICATE"); #[cfg(feature = "rdf-star")] assert_eq!(Function::Object.to_string(), "OBJECT"); #[cfg(feature = "rdf-star")] assert_eq!(Function::IsTriple.to_string(), "isTRIPLE"); #[cfg(feature = "sep-0002")] assert_eq!(Function::Adjust.to_string(), "ADJUST"); assert_eq!( Function::Custom(NamedNode::new("http://example.com/foo").unwrap()).to_string(), "" ); } } /// A SPARQL query [graph pattern](https://www.w3.org/TR/sparql11-query/#sparqlQuery). #[derive(Eq, PartialEq, Debug, Clone, Hash)] pub enum GraphPattern { /// A [basic graph pattern](https://www.w3.org/TR/sparql11-query/#defn_BasicGraphPattern). Bgp { patterns: Vec }, /// A [property path pattern](https://www.w3.org/TR/sparql11-query/#defn_evalPP_predicate). Path { subject: TermPattern, path: PropertyPathExpression, object: TermPattern, }, /// [Join](https://www.w3.org/TR/sparql11-query/#defn_algJoin). Join { left: Box, right: Box }, /// [LeftJoin](https://www.w3.org/TR/sparql11-query/#defn_algLeftJoin). LeftJoin { left: Box, right: Box, expression: Option, }, /// Lateral join i.e. evaluate right for all result row of left #[cfg(feature = "sep-0006")] Lateral { left: Box, right: Box }, /// [Filter](https://www.w3.org/TR/sparql11-query/#defn_algFilter). Filter { expr: Expression, inner: Box }, /// [Union](https://www.w3.org/TR/sparql11-query/#defn_algUnion). Union { left: Box, right: Box }, Graph { name: NamedNodePattern, inner: Box, }, /// [Extend](https://www.w3.org/TR/sparql11-query/#defn_extend). Extend { inner: Box, variable: Variable, expression: Expression, }, /// [Minus](https://www.w3.org/TR/sparql11-query/#defn_algMinus). Minus { left: Box, right: Box }, /// A table used to provide inline values Values { variables: Vec, bindings: Vec>>, }, /// [OrderBy](https://www.w3.org/TR/sparql11-query/#defn_algOrdered). OrderBy { inner: Box, expression: Vec, }, /// [Project](https://www.w3.org/TR/sparql11-query/#defn_algProjection). Project { inner: Box, variables: Vec, }, /// [Distinct](https://www.w3.org/TR/sparql11-query/#defn_algDistinct). Distinct { inner: Box }, /// [Reduced](https://www.w3.org/TR/sparql11-query/#defn_algReduced). Reduced { inner: Box }, /// [Slice](https://www.w3.org/TR/sparql11-query/#defn_algSlice). Slice { inner: Box, start: usize, length: Option, }, /// [Group](https://www.w3.org/TR/sparql11-query/#aggregateAlgebra). Group { inner: Box, variables: Vec, aggregates: Vec<(Variable, AggregateExpression)>, }, /// [Service](https://www.w3.org/TR/sparql11-federated-query/#defn_evalService). Service { name: NamedNodePattern, inner: Box, silent: bool, }, } impl fmt::Display for GraphPattern { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { match self { Self::Bgp { patterns } => { for pattern in patterns { write!(f, "{pattern} .")? } Ok(()) } Self::Path { subject, path, object, } => write!(f, "{subject} {path} {object} ."), Self::Join { left, right } => { #[allow(clippy::match_same_arms)] match right.as_ref() { Self::LeftJoin { .. } | Self::Minus { .. } | Self::Extend { .. } | Self::Filter { .. } => { // The second block might be considered as a modification of the first one. write!(f, "{left} {{ {right} }}") } #[cfg(feature = "sep-0006")] Self::Lateral { .. } => { write!(f, "{left} {{ {right} }}") } _ => write!(f, "{left} {right}"), } } Self::LeftJoin { left, right, expression, } => { if let Some(expr) = expression { write!(f, "{left} OPTIONAL {{ {right} FILTER({expr}) }}") } else { write!(f, "{left} OPTIONAL {{ {right} }}") } } #[cfg(feature = "sep-0006")] Self::Lateral { left, right } => { write!(f, "{left} LATERAL {{ {right} }}") } Self::Filter { expr, inner } => { write!(f, "{inner} FILTER({expr})") } Self::Union { left, right } => write!(f, "{{ {left} }} UNION {{ {right} }}"), Self::Graph { name, inner } => { write!(f, "GRAPH {name} {{ {inner} }}") } Self::Extend { inner, variable, expression, } => write!(f, "{inner} BIND({expression} AS {variable})"), Self::Minus { left, right } => write!(f, "{left} MINUS {{ {right} }}"), Self::Service { name, inner, silent, } => { if *silent { write!(f, "SERVICE SILENT {name} {{ {inner} }}") } else { write!(f, "SERVICE {name} {{ {inner} }}") } } Self::Values { variables, bindings, } => { f.write_str("VALUES ( ")?; for var in variables { write!(f, "{var} ")?; } f.write_str(") { ")?; for row in bindings { f.write_str("( ")?; for val in row { match val { Some(val) => write!(f, "{val} "), None => f.write_str("UNDEF "), }?; } f.write_str(") ")?; } f.write_str(" }") } Self::Group { inner, variables, aggregates, } => { f.write_str("{SELECT")?; for (a, v) in aggregates { write!(f, " ({v} AS {a})")?; } for b in variables { write!(f, " {b}")?; } write!(f, " WHERE {{ {inner} }}")?; if !variables.is_empty() { f.write_str(" GROUP BY")?; for v in variables { write!(f, " {v}")?; } } f.write_str("}") } p => write!( f, "{{ {} }}", SparqlGraphRootPattern { pattern: p, dataset: None } ), } } } impl Default for GraphPattern { fn default() -> Self { Self::Bgp { patterns: Vec::default(), } } } impl GraphPattern { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::Bgp { patterns } => { f.write_str("(bgp")?; for pattern in patterns { f.write_str(" ")?; pattern.fmt_sse(f)?; } f.write_str(")") } Self::Path { subject, path, object, } => { f.write_str("(path ")?; subject.fmt_sse(f)?; f.write_str(" ")?; path.fmt_sse(f)?; f.write_str(" ")?; object.fmt_sse(f)?; f.write_str(")") } Self::Join { left, right } => { f.write_str("(join ")?; left.fmt_sse(f)?; f.write_str(" ")?; right.fmt_sse(f)?; f.write_str(")") } Self::LeftJoin { left, right, expression, } => { f.write_str("(leftjoin ")?; left.fmt_sse(f)?; f.write_str(" ")?; right.fmt_sse(f)?; if let Some(expr) = expression { f.write_str(" ")?; expr.fmt_sse(f)?; } f.write_str(")") } #[cfg(feature = "sep-0006")] Self::Lateral { left, right } => { f.write_str("(lateral ")?; left.fmt_sse(f)?; f.write_str(" ")?; right.fmt_sse(f)?; f.write_str(")") } Self::Filter { expr, inner } => { f.write_str("(filter ")?; expr.fmt_sse(f)?; f.write_str(" ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Union { left, right } => { f.write_str("(union ")?; left.fmt_sse(f)?; f.write_str(" ")?; right.fmt_sse(f)?; f.write_str(")") } Self::Graph { name, inner } => { f.write_str("(graph ")?; name.fmt_sse(f)?; f.write_str(" ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Extend { inner, variable, expression, } => { write!(f, "(extend (({variable} ")?; expression.fmt_sse(f)?; f.write_str(")) ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Minus { left, right } => { f.write_str("(minus ")?; left.fmt_sse(f)?; f.write_str(" ")?; right.fmt_sse(f)?; f.write_str(")") } Self::Service { name, inner, silent, } => { f.write_str("(service ")?; if *silent { f.write_str("silent ")?; } name.fmt_sse(f)?; f.write_str(" ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Group { inner, variables, aggregates, } => { f.write_str("(group (")?; for (i, v) in variables.iter().enumerate() { if i > 0 { f.write_str(" ")?; } write!(f, "{v}")?; } f.write_str(") (")?; for (i, (v, a)) in aggregates.iter().enumerate() { if i > 0 { f.write_str(" ")?; } f.write_str("(")?; a.fmt_sse(f)?; write!(f, " {v})")?; } f.write_str(") ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Values { variables, bindings, } => { f.write_str("(table (vars")?; for var in variables { write!(f, " {var}")?; } f.write_str(")")?; for row in bindings { f.write_str(" (row")?; for (value, var) in row.iter().zip(variables) { if let Some(value) = value { write!(f, " ({var} {value})")?; } } f.write_str(")")?; } f.write_str(")") } Self::OrderBy { inner, expression } => { f.write_str("(order (")?; for (i, c) in expression.iter().enumerate() { if i > 0 { f.write_str(" ")?; } c.fmt_sse(f)?; } f.write_str(") ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Project { inner, variables } => { f.write_str("(project (")?; for (i, v) in variables.iter().enumerate() { if i > 0 { f.write_str(" ")?; } write!(f, "{v}")?; } f.write_str(") ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Distinct { inner } => { f.write_str("(distinct ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Reduced { inner } => { f.write_str("(reduced ")?; inner.fmt_sse(f)?; f.write_str(")") } Self::Slice { inner, start, length, } => { if let Some(length) = length { write!(f, "(slice {start} {length} ")?; } else { write!(f, "(slice {start} _ ")?; } inner.fmt_sse(f)?; f.write_str(")") } } } /// Calls `callback` on each [in-scope variable](https://www.w3.org/TR/sparql11-query/#variableScope) occurrence. pub fn on_in_scope_variable<'a>(&'a self, mut callback: impl FnMut(&'a Variable)) { self.lookup_in_scope_variables(&mut callback) } fn lookup_in_scope_variables<'a>(&'a self, callback: &mut impl FnMut(&'a Variable)) { #[allow(clippy::match_same_arms)] match self { Self::Bgp { patterns } => { for pattern in patterns { lookup_triple_pattern_variables(pattern, callback) } } Self::Path { subject, object, .. } => { if let TermPattern::Variable(s) = subject { callback(s); } #[cfg(feature = "rdf-star")] if let TermPattern::Triple(s) = subject { lookup_triple_pattern_variables(s, callback) } if let TermPattern::Variable(o) = object { callback(o); } #[cfg(feature = "rdf-star")] if let TermPattern::Triple(o) = object { lookup_triple_pattern_variables(o, callback) } } Self::Join { left, right } | Self::LeftJoin { left, right, .. } | Self::Union { left, right } => { left.lookup_in_scope_variables(callback); right.lookup_in_scope_variables(callback); } #[cfg(feature = "sep-0006")] Self::Lateral { left, right } => { left.lookup_in_scope_variables(callback); right.lookup_in_scope_variables(callback); } Self::Graph { name, inner } => { if let NamedNodePattern::Variable(g) = &name { callback(g); } inner.lookup_in_scope_variables(callback); } Self::Extend { inner, variable, .. } => { callback(variable); inner.lookup_in_scope_variables(callback); } Self::Minus { left, .. } => left.lookup_in_scope_variables(callback), Self::Group { variables, aggregates, .. } => { for v in variables { callback(v); } for (v, _) in aggregates { callback(v); } } Self::Values { variables, .. } | Self::Project { variables, .. } => { for v in variables { callback(v); } } Self::Service { inner, .. } | Self::Filter { inner, .. } | Self::OrderBy { inner, .. } | Self::Distinct { inner } | Self::Reduced { inner } | Self::Slice { inner, .. } => inner.lookup_in_scope_variables(callback), } } } fn lookup_triple_pattern_variables<'a>( pattern: &'a TriplePattern, callback: &mut impl FnMut(&'a Variable), ) { if let TermPattern::Variable(s) = &pattern.subject { callback(s); } #[cfg(feature = "rdf-star")] if let TermPattern::Triple(s) = &pattern.subject { lookup_triple_pattern_variables(s, callback) } if let NamedNodePattern::Variable(p) = &pattern.predicate { callback(p); } if let TermPattern::Variable(o) = &pattern.object { callback(o); } #[cfg(feature = "rdf-star")] if let TermPattern::Triple(o) = &pattern.object { lookup_triple_pattern_variables(o, callback) } } pub(crate) struct SparqlGraphRootPattern<'a> { pub(crate) pattern: &'a GraphPattern, pub(crate) dataset: Option<&'a QueryDataset>, } impl<'a> fmt::Display for SparqlGraphRootPattern<'a> { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { let mut distinct = false; let mut reduced = false; let mut order = None; let mut start = 0; let mut length = None; let mut project: &[Variable] = &[]; let mut child = self.pattern; loop { match child { GraphPattern::OrderBy { inner, expression } => { order = Some(expression); child = inner; } GraphPattern::Project { inner, variables } if project.is_empty() => { project = variables; child = inner; } GraphPattern::Distinct { inner } => { distinct = true; child = inner; } GraphPattern::Reduced { inner } => { reduced = true; child = inner; } GraphPattern::Slice { inner, start: s, length: l, } => { start = *s; length = *l; child = inner; } p => { f.write_str("SELECT")?; if distinct { f.write_str(" DISTINCT")?; } if reduced { f.write_str(" REDUCED")?; } if project.is_empty() { f.write_str(" *")?; } else { for v in project { write!(f, " {v}")?; } } if let Some(dataset) = self.dataset { write!(f, " {dataset}")?; } write!(f, " WHERE {{ {p} }}")?; if let Some(order) = order { f.write_str(" ORDER BY")?; for c in order { write!(f, " {c}")?; } } if start > 0 { write!(f, " OFFSET {start}")?; } if let Some(length) = length { write!(f, " LIMIT {length}")?; } return Ok(()); } } } } } /// A set function used in aggregates (c.f. [`GraphPattern::Group`]). #[derive(Eq, PartialEq, Debug, Clone, Hash)] pub enum AggregateExpression { /// [Count](https://www.w3.org/TR/sparql11-query/#defn_aggCount) with *. CountSolutions { distinct: bool }, FunctionCall { name: AggregateFunction, expr: Expression, distinct: bool, }, } impl AggregateExpression { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::CountSolutions { distinct } => { f.write_str("(count")?; if *distinct { f.write_str(" distinct")?; } f.write_str(")") } Self::FunctionCall { name: AggregateFunction::GroupConcat { separator: Some(separator), }, expr, distinct, } => { f.write_str("(group_concat ")?; if *distinct { f.write_str("distinct ")?; } expr.fmt_sse(f)?; write!(f, " {})", LiteralRef::new_simple_literal(separator)) } Self::FunctionCall { name, expr, distinct, } => { f.write_str("(")?; name.fmt_sse(f)?; f.write_str(" ")?; if *distinct { f.write_str("distinct ")?; } expr.fmt_sse(f)?; f.write_str(")") } } } } impl fmt::Display for AggregateExpression { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { match self { Self::CountSolutions { distinct } => { if *distinct { f.write_str("COUNT(DISTINCT *)") } else { f.write_str("COUNT(*)") } } Self::FunctionCall { name: AggregateFunction::GroupConcat { separator: Some(separator), }, expr, distinct, } => { if *distinct { write!( f, "GROUP_CONCAT(DISTINCT {}; SEPARATOR = {})", expr, LiteralRef::new_simple_literal(separator) ) } else { write!( f, "GROUP_CONCAT({}; SEPARATOR = {})", expr, LiteralRef::new_simple_literal(separator) ) } } Self::FunctionCall { name, expr, distinct, } => { if *distinct { write!(f, "{name}(DISTINCT {expr})") } else { write!(f, "{name}({expr})") } } } } } /// An aggregate function name. #[derive(Eq, PartialEq, Debug, Clone, Hash, parse_display::Display)] #[display(style = "SNAKE_CASE")] pub enum AggregateFunction { /// [Count](https://www.w3.org/TR/sparql11-query/#defn_aggCount) with *. Count, /// [Sum](https://www.w3.org/TR/sparql11-query/#defn_aggSum). Sum, /// [Avg](https://www.w3.org/TR/sparql11-query/#defn_aggAvg). Avg, /// [Min](https://www.w3.org/TR/sparql11-query/#defn_aggMin). Min, /// [Max](https://www.w3.org/TR/sparql11-query/#defn_aggMax). Max, /// [GroupConcat](https://www.w3.org/TR/sparql11-query/#defn_aggGroupConcat). #[display("{}")] GroupConcat { separator: Option }, /// [Sample](https://www.w3.org/TR/sparql11-query/#defn_aggSample). Sample, #[display("{0}")] Custom(NamedNode), } impl AggregateFunction { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::Count => f.write_str("count"), Self::Sum => f.write_str("sum"), Self::Avg => f.write_str("avg"), Self::Min => f.write_str("min"), Self::Max => f.write_str("max"), Self::GroupConcat { .. } => f.write_str("group_concat"), Self::Sample => f.write_str("sample"), Self::Custom(iri) => write!(f, "{iri}"), } } } #[cfg(test)] mod test_agg { use super::*; #[test] fn display() { // This is a temporary migration test - we can remove most of these before merging assert_eq!(AggregateFunction::Count.to_string(), "COUNT"); assert_eq!(AggregateFunction::Sum.to_string(), "SUM"); assert_eq!(AggregateFunction::Avg.to_string(), "AVG"); assert_eq!(AggregateFunction::Min.to_string(), "MIN"); assert_eq!(AggregateFunction::Max.to_string(), "MAX"); assert_eq!( AggregateFunction::GroupConcat { separator: Some("foo".to_owned()) } .to_string(), "GROUP_CONCAT" ); assert_eq!(AggregateFunction::Sample.to_string(), "SAMPLE"); assert_eq!( AggregateFunction::Custom(NamedNode::new("http://example.com/foo").unwrap()) .to_string(), "" ); } } /// An ordering comparator used by [`GraphPattern::OrderBy`]. #[derive(Eq, PartialEq, Debug, Clone, Hash, parse_display::Display)] #[display("{}({0})", style = "UPPERCASE")] pub enum OrderExpression { /// Ascending order Asc(Expression), /// Descending order Desc(Expression), } impl OrderExpression { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::Asc(e) => { f.write_str("(asc ")?; e.fmt_sse(f)?; f.write_str(")") } Self::Desc(e) => { f.write_str("(desc ")?; e.fmt_sse(f)?; f.write_str(")") } } } } #[cfg(test)] mod test_order_expr { use super::*; #[test] fn display() { // This is a temporary migration test - we can remove most of these before merging assert_eq!( OrderExpression::Asc(Expression::NamedNode( NamedNode::new("http://example.com/foo").unwrap() )) .to_string(), "ASC()" ); assert_eq!( OrderExpression::Desc(Expression::NamedNode( NamedNode::new("http://example.com/bar").unwrap() )) .to_string(), "DESC()" ); } } /// A SPARQL query [dataset specification](https://www.w3.org/TR/sparql11-query/#specifyingDataset). #[derive(Eq, PartialEq, Debug, Clone, Hash)] pub struct QueryDataset { pub default: Vec, pub named: Option>, } impl QueryDataset { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { f.write_str("(")?; for (i, graph_name) in self.default.iter().enumerate() { if i > 0 { f.write_str(" ")?; } write!(f, "{graph_name}")?; } if let Some(named) = &self.named { for (i, graph_name) in named.iter().enumerate() { if !self.default.is_empty() || i > 0 { f.write_str(" ")?; } write!(f, "(named {graph_name})")?; } } f.write_str(")") } } impl fmt::Display for QueryDataset { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { for g in &self.default { write!(f, " FROM {g}")?; } if let Some(named) = &self.named { for g in named { write!(f, " FROM NAMED {g}")?; } } Ok(()) } } /// A target RDF graph for update operations. /// /// Could be a specific graph, all named graphs or the complete dataset. #[derive(Eq, PartialEq, Debug, Clone, Hash, parse_display::Display)] pub enum GraphTarget { #[display("GRAPH {0}")] NamedNode(NamedNode), #[display("DEFAULT")] DefaultGraph, #[display("NAMED")] NamedGraphs, #[display("ALL")] AllGraphs, } impl GraphTarget { /// Formats using the [SPARQL S-Expression syntax](https://jena.apache.org/documentation/notes/sse.html). pub(crate) fn fmt_sse(&self, f: &mut impl fmt::Write) -> fmt::Result { match self { Self::NamedNode(node) => write!(f, "{node}"), Self::DefaultGraph => f.write_str("default"), Self::NamedGraphs => f.write_str("named"), Self::AllGraphs => f.write_str("all"), } } } impl From for GraphTarget { fn from(node: NamedNode) -> Self { Self::NamedNode(node) } } impl From for GraphTarget { fn from(graph_name: GraphName) -> Self { match graph_name { GraphName::NamedNode(node) => Self::NamedNode(node), GraphName::DefaultGraph => Self::DefaultGraph, } } } #[inline] fn fmt_sse_unary_expression(f: &mut impl fmt::Write, name: &str, e: &Expression) -> fmt::Result { write!(f, "({name} ")?; e.fmt_sse(f)?; f.write_str(")") } #[inline] fn fmt_sse_binary_expression( f: &mut impl fmt::Write, name: &str, a: &Expression, b: &Expression, ) -> fmt::Result { write!(f, "({name} ")?; a.fmt_sse(f)?; f.write_str(" ")?; b.fmt_sse(f)?; f.write_str(")") }