|
|
|
use anyhow::{anyhow, bail, Result};
|
|
|
|
use oxigraph::io::{DatasetFormat, DatasetParser, GraphFormat, GraphParser};
|
|
|
|
use oxigraph::model::{Dataset, Graph, GraphNameRef};
|
|
|
|
use oxigraph::store::Store;
|
|
|
|
use std::fs::File;
|
|
|
|
use std::io::{BufRead, BufReader, Read};
|
|
|
|
use std::path::PathBuf;
|
|
|
|
|
|
|
|
pub fn read_file(url: &str) -> Result<impl BufRead> {
|
|
|
|
let mut path = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
|
|
|
|
path.push(if url.starts_with("http://w3c.github.io/rdf-tests/") {
|
|
|
|
url.replace("http://w3c.github.io/rdf-tests/", "rdf-tests/")
|
|
|
|
} else if url.starts_with("http://www.w3.org/2013/RDFXMLTests/") {
|
|
|
|
url.replace("http://www.w3.org/2013/RDFXMLTests/", "rdf-tests/rdf-xml/")
|
|
|
|
} else if url.starts_with("http://www.w3.org/2001/sw/DataAccess/tests/data-r2/") {
|
|
|
|
url.replace(
|
|
|
|
"http://www.w3.org/2001/sw/DataAccess/tests/",
|
|
|
|
"rdf-tests/sparql11/",
|
|
|
|
)
|
|
|
|
} else if url.starts_with("http://www.w3.org/2009/sparql/docs/tests/data-sparql11/") {
|
|
|
|
url.replace(
|
|
|
|
"http://www.w3.org/2009/sparql/docs/tests/",
|
|
|
|
"rdf-tests/sparql11/",
|
|
|
|
)
|
|
|
|
} else if url.starts_with("https://w3c.github.io/rdf-star/") {
|
|
|
|
url.replace("https://w3c.github.io/", "")
|
|
|
|
} else if url.starts_with("https://github.com/oxigraph/oxigraph/tests/") {
|
|
|
|
url.replace(
|
|
|
|
"https://github.com/oxigraph/oxigraph/tests/",
|
|
|
|
"oxigraph-tests/",
|
|
|
|
)
|
|
|
|
} else {
|
|
|
|
bail!("Not supported url for file: {url}")
|
|
|
|
});
|
|
|
|
Ok(BufReader::new(File::open(&path)?))
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn read_file_to_string(url: &str) -> Result<String> {
|
|
|
|
let mut buf = String::new();
|
|
|
|
read_file(url)?.read_to_string(&mut buf)?;
|
|
|
|
Ok(buf)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_to_store<'a>(
|
|
|
|
url: &str,
|
|
|
|
store: &Store,
|
|
|
|
to_graph_name: impl Into<GraphNameRef<'a>>,
|
|
|
|
) -> Result<()> {
|
|
|
|
if url.ends_with(".nt") {
|
|
|
|
store.load_graph(
|
|
|
|
read_file(url)?,
|
|
|
|
GraphFormat::NTriples,
|
|
|
|
to_graph_name,
|
|
|
|
Some(url),
|
|
|
|
)?
|
|
|
|
} else if url.ends_with(".ttl") {
|
|
|
|
store.load_graph(
|
|
|
|
read_file(url)?,
|
|
|
|
GraphFormat::Turtle,
|
|
|
|
to_graph_name,
|
|
|
|
Some(url),
|
|
|
|
)?
|
|
|
|
} else if url.ends_with(".rdf") {
|
|
|
|
store.load_graph(
|
|
|
|
read_file(url)?,
|
|
|
|
GraphFormat::RdfXml,
|
|
|
|
to_graph_name,
|
|
|
|
Some(url),
|
|
|
|
)?
|
|
|
|
} else if url.ends_with(".nq") {
|
|
|
|
store.load_dataset(read_file(url)?, DatasetFormat::NQuads, Some(url))?
|
|
|
|
} else if url.ends_with(".trig") {
|
|
|
|
store.load_dataset(read_file(url)?, DatasetFormat::TriG, Some(url))?
|
|
|
|
} else {
|
|
|
|
bail!("Serialization type not found for {url}");
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_to_graph(url: &str, graph: &mut Graph) -> Result<()> {
|
|
|
|
let format = url
|
|
|
|
.rsplit_once('.')
|
|
|
|
.and_then(|(_, extension)| GraphFormat::from_extension(extension))
|
|
|
|
.ok_or_else(|| anyhow!("Serialization type not found for {url}"))?;
|
|
|
|
let parser = GraphParser::from_format(format).with_base_iri(url)?;
|
|
|
|
for t in parser.read_triples(read_file(url)?)? {
|
|
|
|
graph.insert(&t?);
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_graph(url: &str) -> Result<Graph> {
|
|
|
|
let mut graph = Graph::new();
|
|
|
|
load_to_graph(url, &mut graph)?;
|
|
|
|
Ok(graph)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_to_dataset<'a>(
|
|
|
|
url: &str,
|
|
|
|
dataset: &mut Dataset,
|
|
|
|
to_graph_name: impl Into<GraphNameRef<'a>>,
|
|
|
|
) -> Result<()> {
|
|
|
|
let to_graph_name = to_graph_name.into();
|
|
|
|
let extension = url.rsplit_once('.').map(|(_, ext)| ext);
|
|
|
|
if let Some(format) = extension.and_then(GraphFormat::from_extension) {
|
|
|
|
let parser = GraphParser::from_format(format).with_base_iri(url)?;
|
|
|
|
for t in parser.read_triples(read_file(url)?)? {
|
|
|
|
dataset.insert(&t?.in_graph(to_graph_name));
|
|
|
|
}
|
|
|
|
} else if let Some(format) = extension.and_then(DatasetFormat::from_extension) {
|
|
|
|
let parser = DatasetParser::from_format(format).with_base_iri(url)?;
|
|
|
|
for q in parser.read_quads(read_file(url)?)? {
|
|
|
|
dataset.insert(&q?);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
bail!("Serialization type not found for {url}")
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_dataset(url: &str) -> Result<Dataset> {
|
|
|
|
let mut dataset = Dataset::new();
|
|
|
|
load_to_dataset(url, &mut dataset, GraphNameRef::DefaultGraph)?;
|
|
|
|
Ok(dataset)
|
|
|
|
}
|