#![cfg(test)] #![allow(clippy::panic_in_result_fn)] use oxigraph::io::RdfFormat; use oxigraph::model::vocab::{rdf, xsd}; use oxigraph::model::*; use oxigraph::store::Store; #[cfg(all(not(target_family = "wasm")))] use rand::random; #[cfg(all(not(target_family = "wasm")))] use std::env::temp_dir; use std::error::Error; #[cfg(all(not(target_family = "wasm")))] use std::fs::{create_dir_all, remove_dir_all, File}; #[cfg(all(not(target_family = "wasm")))] use std::io::Write; #[cfg(all(not(target_family = "wasm")))] use std::iter::empty; #[cfg(all(target_os = "linux"))] use std::iter::once; #[cfg(all(not(target_family = "wasm")))] use std::path::{Path, PathBuf}; #[cfg(all(target_os = "linux"))] use std::process::Command; #[allow(clippy::non_ascii_literal)] const DATA: &str = r#" @prefix schema: . @prefix wd: . @prefix xsd: . wd:Q90 a schema:City ; schema:name "Paris"@fr , "la ville lumière"@fr ; schema:country wd:Q142 ; schema:population 2000000 ; schema:startDate "-300"^^xsd:gYear ; schema:url "https://www.paris.fr/"^^xsd:anyURI ; schema:postalCode "75001" . "#; #[allow(clippy::non_ascii_literal)] const GRAPH_DATA: &str = r#" @prefix schema: . @prefix wd: . @prefix xsd: . GRAPH { wd:Q90 a schema:City ; schema:name "Paris"@fr , "la ville lumière"@fr ; schema:country wd:Q142 ; schema:population 2000000 ; schema:startDate "-300"^^xsd:gYear ; schema:url "https://www.paris.fr/"^^xsd:anyURI ; schema:postalCode "75001" . } "#; const NUMBER_OF_TRIPLES: usize = 8; fn quads(graph_name: impl Into>) -> Vec> { let graph_name = graph_name.into(); let paris = NamedNodeRef::new_unchecked("http://www.wikidata.org/entity/Q90"); let france = NamedNodeRef::new_unchecked("http://www.wikidata.org/entity/Q142"); let city = NamedNodeRef::new_unchecked("http://schema.org/City"); let name = NamedNodeRef::new_unchecked("http://schema.org/name"); let country = NamedNodeRef::new_unchecked("http://schema.org/country"); let population = NamedNodeRef::new_unchecked("http://schema.org/population"); let start_date = NamedNodeRef::new_unchecked("http://schema.org/startDate"); let url = NamedNodeRef::new_unchecked("http://schema.org/url"); let postal_code = NamedNodeRef::new_unchecked("http://schema.org/postalCode"); vec![ QuadRef::new(paris, rdf::TYPE, city, graph_name), QuadRef::new( paris, name, LiteralRef::new_language_tagged_literal_unchecked("Paris", "fr"), graph_name, ), QuadRef::new( paris, name, LiteralRef::new_language_tagged_literal_unchecked("la ville lumi\u{E8}re", "fr"), graph_name, ), QuadRef::new(paris, country, france, graph_name), QuadRef::new( paris, population, LiteralRef::new_typed_literal("2000000", xsd::INTEGER), graph_name, ), QuadRef::new( paris, start_date, LiteralRef::new_typed_literal("-300", xsd::G_YEAR), graph_name, ), QuadRef::new( paris, url, LiteralRef::new_typed_literal("https://www.paris.fr/", xsd::ANY_URI), graph_name, ), QuadRef::new( paris, postal_code, LiteralRef::new_simple_literal("75001"), graph_name, ), ] } #[test] fn test_load_graph() -> Result<(), Box> { let store = Store::new()?; store.load_from_read(RdfFormat::Turtle, DATA.as_bytes())?; for q in quads(GraphNameRef::DefaultGraph) { assert!(store.contains(q)?); } store.validate()?; Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_bulk_load_graph() -> Result<(), Box> { let store = Store::new()?; store .bulk_loader() .load_from_read(RdfFormat::Turtle, DATA.as_bytes())?; for q in quads(GraphNameRef::DefaultGraph) { assert!(store.contains(q)?); } store.validate()?; Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_bulk_load_graph_lenient() -> Result<(), Box> { let store = Store::new()?; store.bulk_loader().on_parse_error(|_| Ok(())).load_from_read( RdfFormat::NTriples, b" .\n .".as_slice(), )?; assert_eq!(store.len()?, 1); assert!(store.contains(QuadRef::new( NamedNodeRef::new_unchecked("http://example.com"), NamedNodeRef::new_unchecked("http://example.com"), NamedNodeRef::new_unchecked("http://example.com"), GraphNameRef::DefaultGraph ))?); store.validate()?; Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_bulk_load_empty() -> Result<(), Box> { let store = Store::new()?; store.bulk_loader().load_quads(empty::())?; assert!(store.is_empty()?); store.validate()?; Ok(()) } #[test] fn test_load_dataset() -> Result<(), Box> { let store = Store::new()?; store.load_from_read(RdfFormat::TriG, GRAPH_DATA.as_bytes())?; for q in quads(NamedNodeRef::new_unchecked( "http://www.wikidata.org/wiki/Special:EntityData/Q90", )) { assert!(store.contains(q)?); } store.validate()?; Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_bulk_load_dataset() -> Result<(), Box> { let store = Store::new()?; store .bulk_loader() .load_from_read(RdfFormat::TriG, GRAPH_DATA.as_bytes())?; let graph_name = NamedNodeRef::new_unchecked("http://www.wikidata.org/wiki/Special:EntityData/Q90"); for q in quads(graph_name) { assert!(store.contains(q)?); } assert!(store.contains_named_graph(graph_name)?); store.validate()?; Ok(()) } #[test] fn test_load_graph_generates_new_blank_nodes() -> Result<(), Box> { let store = Store::new()?; for _ in 0..2 { store.load_from_read( RdfFormat::NTriples, "_:a .".as_bytes(), )?; } assert_eq!(store.len()?, 2); Ok(()) } #[test] fn test_dump_graph() -> Result<(), Box> { let store = Store::new()?; for q in quads(GraphNameRef::DefaultGraph) { store.insert(q)?; } let mut buffer = Vec::new(); store.dump_graph_to_write(GraphNameRef::DefaultGraph, RdfFormat::NTriples, &mut buffer)?; assert_eq!( buffer.into_iter().filter(|c| *c == b'\n').count(), NUMBER_OF_TRIPLES ); Ok(()) } #[test] fn test_dump_dataset() -> Result<(), Box> { let store = Store::new()?; for q in quads(GraphNameRef::DefaultGraph) { store.insert(q)?; } let buffer = store.dump_to_write(RdfFormat::NQuads, Vec::new())?; assert_eq!( buffer.into_iter().filter(|c| *c == b'\n').count(), NUMBER_OF_TRIPLES ); Ok(()) } #[test] fn test_snapshot_isolation_iterator() -> Result<(), Box> { let quad = QuadRef::new( NamedNodeRef::new("http://example.com/s")?, NamedNodeRef::new("http://example.com/p")?, NamedNodeRef::new("http://example.com/o")?, NamedNodeRef::new("http://www.wikidata.org/wiki/Special:EntityData/Q90")?, ); let store = Store::new()?; store.insert(quad)?; let iter = store.iter(); store.remove(quad)?; assert_eq!( iter.collect::, _>>()?, vec![quad.into_owned()] ); store.validate()?; Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_bulk_load_on_existing_delete_overrides_the_delete() -> Result<(), Box> { let quad = QuadRef::new( NamedNodeRef::new_unchecked("http://example.com/s"), NamedNodeRef::new_unchecked("http://example.com/p"), NamedNodeRef::new_unchecked("http://example.com/o"), NamedNodeRef::new_unchecked("http://www.wikidata.org/wiki/Special:EntityData/Q90"), ); let store = Store::new()?; store.remove(quad)?; store.bulk_loader().load_quads([quad.into_owned()])?; assert_eq!(store.len()?, 1); Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_open_bad_dir() -> Result<(), Box> { let dir = TempDir::default(); create_dir_all(&dir.0)?; { File::create(dir.0.join("CURRENT"))?.write_all(b"foo")?; } assert!(Store::open(&dir.0).is_err()); Ok(()) } #[test] #[cfg(all(target_os = "linux"))] fn test_bad_stt_open() -> Result<(), Box> { let dir = TempDir::default(); let store = Store::open(&dir.0)?; remove_dir_all(&dir.0)?; store .bulk_loader() .load_quads(once(Quad::new( NamedNode::new_unchecked("http://example.com/s"), NamedNode::new_unchecked("http://example.com/p"), NamedNode::new_unchecked("http://example.com/o"), GraphName::DefaultGraph, ))) .unwrap_err(); Ok(()) } // #[test] // #[cfg(all(not(target_family = "wasm")))] // fn test_backup() -> Result<(), Box> { // let quad = QuadRef::new( // NamedNodeRef::new_unchecked("http://example.com/s"), // NamedNodeRef::new_unchecked("http://example.com/p"), // NamedNodeRef::new_unchecked("http://example.com/o"), // GraphNameRef::DefaultGraph, // ); // let store_dir = TempDir::default(); // let backup_from_rw_dir = TempDir::default(); // let backup_from_ro_dir = TempDir::default(); // let backup_from_secondary_dir = TempDir::default(); // let store = Store::open(&store_dir)?; // store.insert(quad)?; // let secondary_store = Store::open_secondary(&store_dir)?; // store.flush()?; // store.backup(&backup_from_rw_dir)?; // secondary_store.backup(&backup_from_secondary_dir)?; // store.remove(quad)?; // assert!(!store.contains(quad)?); // let backup_from_rw = Store::open_read_only(&backup_from_rw_dir.0)?; // backup_from_rw.validate()?; // assert!(backup_from_rw.contains(quad)?); // backup_from_rw.backup(&backup_from_ro_dir)?; // let backup_from_ro = Store::open_read_only(&backup_from_ro_dir.0)?; // backup_from_ro.validate()?; // assert!(backup_from_ro.contains(quad)?); // let backup_from_secondary = Store::open_read_only(&backup_from_secondary_dir.0)?; // backup_from_secondary.validate()?; // assert!(backup_from_secondary.contains(quad)?); // Ok(()) // } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_bad_backup() -> Result<(), Box> { let store_dir = TempDir::default(); let backup_dir = TempDir::default(); create_dir_all(&backup_dir.0)?; Store::open(&store_dir)?.backup(&backup_dir.0).unwrap_err(); Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_backup_on_in_memory() -> Result<(), Box> { let backup_dir = TempDir::default(); Store::new()?.backup(&backup_dir).unwrap_err(); Ok(()) } #[test] #[cfg(all(target_os = "linux"))] fn test_backward_compatibility() -> Result<(), Box> { // We run twice to check if data is properly saved and closed for _ in 0..2 { let store = Store::open("tests/rocksdb_bc_data")?; for q in quads(GraphNameRef::DefaultGraph) { assert!(store.contains(q)?); } let graph_name = NamedNodeRef::new_unchecked("http://www.wikidata.org/wiki/Special:EntityData/Q90"); for q in quads(graph_name) { assert!(store.contains(q)?); } assert!(store.contains_named_graph(graph_name)?); assert_eq!( vec![NamedOrBlankNode::from(graph_name)], store.named_graphs().collect::, _>>()? ); } reset_dir("tests/rocksdb_bc_data")?; Ok(()) } // #[test] // #[cfg(all(not(target_family = "wasm")))] // fn test_secondary() -> Result<(), Box> { // let quad = QuadRef::new( // NamedNodeRef::new_unchecked("http://example.com/s"), // NamedNodeRef::new_unchecked("http://example.com/p"), // NamedNodeRef::new_unchecked("http://example.com/o"), // GraphNameRef::DefaultGraph, // ); // let primary_dir = TempDir::default(); // // We open the store // let primary = Store::open(&primary_dir)?; // let secondary = Store::open_secondary(&primary_dir)?; // // We insert a quad // primary.insert(quad)?; // primary.flush()?; // // It is readable from both stores // for store in &[&primary, &secondary] { // assert!(store.contains(quad)?); // assert_eq!( // store.iter().collect::, _>>()?, // vec![quad.into_owned()] // ); // } // // We validate the states // primary.validate()?; // secondary.validate()?; // // We close the primary store and remove its content // drop(primary); // remove_dir_all(&primary_dir)?; // // We secondary store is still readable // assert!(secondary.contains(quad)?); // secondary.validate()?; // Ok(()) // } // #[test] // #[cfg(all(not(target_family = "wasm")))] // fn test_open_secondary_bad_dir() -> Result<(), Box> { // let primary_dir = TempDir::default(); // create_dir_all(&primary_dir.0)?; // { // File::create(primary_dir.0.join("CURRENT"))?.write_all(b"foo")?; // } // assert!(Store::open_secondary(&primary_dir).is_err()); // Ok(()) // } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_read_only() -> Result<(), Box> { let s = NamedNodeRef::new_unchecked("http://example.com/s"); let p = NamedNodeRef::new_unchecked("http://example.com/p"); let first_quad = QuadRef::new( s, p, NamedNodeRef::new_unchecked("http://example.com/o"), GraphNameRef::DefaultGraph, ); let second_quad = QuadRef::new( s, p, NamedNodeRef::new_unchecked("http://example.com/o2"), GraphNameRef::DefaultGraph, ); let store_dir = TempDir::default(); // We write to the store and close it { let read_write = Store::open(&store_dir)?; read_write.insert(first_quad)?; read_write.flush()?; } // We open as read-only let read_only = Store::open_read_only(&store_dir, None)?; assert!(read_only.contains(first_quad)?); assert_eq!( read_only.iter().collect::, _>>()?, vec![first_quad.into_owned()] ); read_only.validate()?; // We open as read-write again let read_write = Store::open(&store_dir)?; read_write.insert(second_quad)?; read_write.flush()?; read_write.optimize()?; // Makes sure it's well flushed // The new quad is in the read-write instance but not the read-only instance assert!(read_write.contains(second_quad)?); assert!(!read_only.contains(second_quad)?); read_only.validate()?; Ok(()) } #[test] #[cfg(all(not(target_family = "wasm")))] fn test_open_read_only_bad_dir() -> Result<(), Box> { let dir = TempDir::default(); create_dir_all(&dir.0)?; { File::create(dir.0.join("CURRENT"))?.write_all(b"foo")?; } assert!(Store::open_read_only(&dir, None).is_err()); Ok(()) } #[cfg(all(target_os = "linux"))] fn reset_dir(dir: &str) -> Result<(), Box> { assert!(Command::new("git") .args(["clean", "-fX", dir]) .status()? .success()); assert!(Command::new("git") .args(["checkout", "HEAD", "--", dir]) .status()? .success()); Ok(()) } #[cfg(all(not(target_family = "wasm")))] struct TempDir(PathBuf); #[cfg(all(not(target_family = "wasm")))] impl Default for TempDir { fn default() -> Self { Self(temp_dir().join(format!("oxigraph-test-{}", random::()))) } } #[cfg(all(not(target_family = "wasm")))] impl AsRef for TempDir { fn as_ref(&self) -> &Path { &self.0 } } #[cfg(all(not(target_family = "wasm")))] impl Drop for TempDir { fn drop(&mut self) { if self.0.is_dir() { remove_dir_all(&self.0).unwrap(); } } }