|
|
|
use anyhow::{anyhow, bail, Context, Result};
|
|
|
|
use oxigraph::io::{DatasetFormat, DatasetParser, GraphFormat, GraphParser};
|
|
|
|
use oxigraph::model::{Dataset, Graph};
|
|
|
|
use oxttl::n3::N3Quad;
|
|
|
|
use oxttl::N3Parser;
|
|
|
|
use std::fs::File;
|
|
|
|
use std::io::Read;
|
|
|
|
use std::path::PathBuf;
|
|
|
|
|
|
|
|
pub fn read_file(url: &str) -> Result<impl Read> {
|
|
|
|
let mut path = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
|
|
|
|
path.push(if url.starts_with("http://w3c.github.io/") {
|
|
|
|
url.replace("http://w3c.github.io/", "")
|
|
|
|
} else if url.starts_with("https://w3c.github.io/") {
|
|
|
|
url.replace("https://w3c.github.io/", "")
|
|
|
|
} else if url.starts_with("http://www.w3.org/2013/RDFXMLTests/") {
|
|
|
|
url.replace("http://www.w3.org/2013/RDFXMLTests/", "rdf-tests/rdf-xml/")
|
|
|
|
} else if url.starts_with("https://github.com/oxigraph/oxigraph/tests/") {
|
|
|
|
url.replace(
|
|
|
|
"https://github.com/oxigraph/oxigraph/tests/",
|
|
|
|
"oxigraph-tests/",
|
|
|
|
)
|
|
|
|
} else if url.starts_with("http://drobilla.net/sw/serd/test/") {
|
|
|
|
url.replace("http://drobilla.net/sw/serd/test/", "serd-tests/")
|
|
|
|
} else {
|
|
|
|
bail!("Not supported url for file: {url}")
|
|
|
|
});
|
|
|
|
File::open(&path).with_context(|| format!("Failed to read {}", path.display()))
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn read_file_to_string(url: &str) -> Result<String> {
|
|
|
|
let mut buf = String::new();
|
|
|
|
read_file(url)?.read_to_string(&mut buf)?;
|
|
|
|
Ok(buf)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_to_graph(
|
|
|
|
url: &str,
|
|
|
|
graph: &mut Graph,
|
|
|
|
format: GraphFormat,
|
|
|
|
ignore_errors: bool,
|
|
|
|
) -> Result<()> {
|
|
|
|
let parser = GraphParser::from_format(format).with_base_iri(url)?;
|
|
|
|
for t in parser.read_triples(read_file(url)?) {
|
|
|
|
match t {
|
|
|
|
Ok(t) => {
|
|
|
|
graph.insert(&t);
|
|
|
|
}
|
|
|
|
Err(e) => {
|
|
|
|
if !ignore_errors {
|
|
|
|
return Err(e.into());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_graph(url: &str, format: GraphFormat, ignore_errors: bool) -> Result<Graph> {
|
|
|
|
let mut graph = Graph::new();
|
|
|
|
load_to_graph(url, &mut graph, format, ignore_errors)?;
|
|
|
|
Ok(graph)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn guess_graph_format(url: &str) -> Result<GraphFormat> {
|
|
|
|
url.rsplit_once('.')
|
|
|
|
.and_then(|(_, extension)| GraphFormat::from_extension(extension))
|
|
|
|
.ok_or_else(|| anyhow!("Serialization type not found for {url}"))
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_to_dataset(
|
|
|
|
url: &str,
|
|
|
|
dataset: &mut Dataset,
|
|
|
|
format: DatasetFormat,
|
|
|
|
ignore_errors: bool,
|
|
|
|
) -> Result<()> {
|
|
|
|
let parser = DatasetParser::from_format(format).with_base_iri(url)?;
|
|
|
|
for q in parser.read_quads(read_file(url)?) {
|
|
|
|
match q {
|
|
|
|
Ok(q) => {
|
|
|
|
dataset.insert(&q);
|
|
|
|
}
|
|
|
|
Err(e) => {
|
|
|
|
if !ignore_errors {
|
|
|
|
return Err(e.into());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_dataset(url: &str, format: DatasetFormat, ignore_errors: bool) -> Result<Dataset> {
|
|
|
|
let mut dataset = Dataset::new();
|
|
|
|
load_to_dataset(url, &mut dataset, format, ignore_errors)?;
|
|
|
|
Ok(dataset)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn guess_dataset_format(url: &str) -> Result<DatasetFormat> {
|
|
|
|
url.rsplit_once('.')
|
|
|
|
.and_then(|(_, extension)| DatasetFormat::from_extension(extension))
|
|
|
|
.ok_or_else(|| anyhow!("Serialization type not found for {url}"))
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn load_n3(url: &str, ignore_errors: bool) -> Result<Vec<N3Quad>> {
|
|
|
|
let mut quads = Vec::new();
|
|
|
|
for q in N3Parser::new()
|
|
|
|
.with_base_iri(url)?
|
|
|
|
.with_prefix("", format!("{url}#"))?
|
|
|
|
.parse_from_read(read_file(url)?)
|
|
|
|
{
|
|
|
|
match q {
|
|
|
|
Ok(q) => quads.push(q),
|
|
|
|
Err(e) => {
|
|
|
|
if !ignore_errors {
|
|
|
|
return Err(e.into());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(quads)
|
|
|
|
}
|