use anyhow::{anyhow, bail, Context, Result}; use oxigraph::io::{DatasetFormat, DatasetParser, GraphFormat, GraphParser}; use oxigraph::model::{Dataset, Graph}; use oxttl::n3::N3Quad; use oxttl::N3Parser; use std::fs::File; use std::io::Read; use std::path::PathBuf; pub fn read_file(url: &str) -> Result { let mut path = PathBuf::from(env!("CARGO_MANIFEST_DIR")); path.push(if url.starts_with("http://w3c.github.io/") { url.replace("http://w3c.github.io/", "") } else if url.starts_with("https://w3c.github.io/") { url.replace("https://w3c.github.io/", "") } else if url.starts_with("http://www.w3.org/2013/RDFXMLTests/") { url.replace("http://www.w3.org/2013/RDFXMLTests/", "rdf-tests/rdf-xml/") } else if url.starts_with("https://github.com/oxigraph/oxigraph/tests/") { url.replace( "https://github.com/oxigraph/oxigraph/tests/", "oxigraph-tests/", ) } else if url.starts_with("http://drobilla.net/sw/serd/test/") { url.replace("http://drobilla.net/sw/serd/test/", "serd-tests/") } else { bail!("Not supported url for file: {url}") }); File::open(&path).with_context(|| format!("Failed to read {}", path.display())) } pub fn read_file_to_string(url: &str) -> Result { let mut buf = String::new(); read_file(url)?.read_to_string(&mut buf)?; Ok(buf) } pub fn load_to_graph( url: &str, graph: &mut Graph, format: GraphFormat, ignore_errors: bool, ) -> Result<()> { let parser = GraphParser::from_format(format).with_base_iri(url)?; for t in parser.read_triples(read_file(url)?) { match t { Ok(t) => { graph.insert(&t); } Err(e) => { if !ignore_errors { return Err(e.into()); } } } } Ok(()) } pub fn load_graph(url: &str, format: GraphFormat, ignore_errors: bool) -> Result { let mut graph = Graph::new(); load_to_graph(url, &mut graph, format, ignore_errors)?; Ok(graph) } pub fn guess_graph_format(url: &str) -> Result { url.rsplit_once('.') .and_then(|(_, extension)| GraphFormat::from_extension(extension)) .ok_or_else(|| anyhow!("Serialization type not found for {url}")) } pub fn load_to_dataset( url: &str, dataset: &mut Dataset, format: DatasetFormat, ignore_errors: bool, ) -> Result<()> { let parser = DatasetParser::from_format(format).with_base_iri(url)?; for q in parser.read_quads(read_file(url)?) { match q { Ok(q) => { dataset.insert(&q); } Err(e) => { if !ignore_errors { return Err(e.into()); } } } } Ok(()) } pub fn load_dataset(url: &str, format: DatasetFormat, ignore_errors: bool) -> Result { let mut dataset = Dataset::new(); load_to_dataset(url, &mut dataset, format, ignore_errors)?; Ok(dataset) } pub fn guess_dataset_format(url: &str) -> Result { url.rsplit_once('.') .and_then(|(_, extension)| DatasetFormat::from_extension(extension)) .ok_or_else(|| anyhow!("Serialization type not found for {url}")) } pub fn load_n3(url: &str, ignore_errors: bool) -> Result> { let mut quads = Vec::new(); for q in N3Parser::new() .with_base_iri(url)? .with_prefix("", format!("{url}#"))? .parse_read(read_file(url)?) { match q { Ok(q) => quads.push(q), Err(e) => { if !ignore_errors { return Err(e.into()); } } } } Ok(quads) }