Evaluation: Adds size_hint to iterators

Removes some iterators that could be written as filter
pull/171/head
Tpt 3 years ago
parent 6d4bb36425
commit d27d62f973
  1. 129
      lib/src/sparql/eval.rs

@ -303,12 +303,15 @@ impl SimpleEvaluator {
Rc::new(move |from| { Rc::new(move |from| {
let mut errors = Vec::default(); let mut errors = Vec::default();
let mut right_values = EncodedTupleSet::new(join_keys.clone()); let mut right_values = EncodedTupleSet::new(join_keys.clone());
for result in right(from.clone()) { right_values.extend(right(from.clone()).filter_map(
match result { |result| match result {
Ok(result) => right_values.insert(result), Ok(result) => Some(result),
Err(error) => errors.push(Err(error)), Err(error) => {
} errors.push(Err(error));
None
} }
},
));
Box::new(HashJoinIterator { Box::new(HashJoinIterator {
left_iter: left(from), left_iter: left(from),
right: right_values, right: right_values,
@ -341,21 +344,30 @@ impl SimpleEvaluator {
let right: Vec<_> = right(from.clone()) let right: Vec<_> = right(from.clone())
.filter_map(std::result::Result::ok) .filter_map(std::result::Result::ok)
.collect(); .collect();
Box::new(CartesianProductAntiJoinIterator { Box::new(left(from).filter(move |left_tuple| {
left_iter: left(from), if let Ok(left_tuple) = left_tuple {
right, !right.iter().any(|right_tuple| {
are_compatible_and_not_disjointed(left_tuple, right_tuple)
}) })
} else {
true
}
}))
}) })
} else { } else {
Rc::new(move |from| { Rc::new(move |from| {
let mut right_values = EncodedTupleSet::new(join_keys.clone()); let mut right_values = EncodedTupleSet::new(join_keys.clone());
for result in right(from.clone()).filter_map(std::result::Result::ok) { right_values
right_values.insert(result); .extend(right(from.clone()).filter_map(std::result::Result::ok));
} Box::new(left(from).filter(move |left_tuple| {
Box::new(HashAntiJoinIterator { if let Ok(left_tuple) = left_tuple {
left_iter: left(from), !right_values.get(left_tuple).iter().any(|right_tuple| {
right: right_values, are_compatible_and_not_disjointed(left_tuple, right_tuple)
}) })
} else {
true
}
}))
}) })
} }
} }
@ -2974,6 +2986,11 @@ impl Iterator for CartesianProductJoinIterator {
} }
} }
} }
fn size_hint(&self) -> (usize, Option<usize>) {
let (min, max) = self.left_iter.size_hint();
(min * self.right.len(), max.map(|v| v * self.right.len()))
}
} }
struct HashJoinIterator { struct HashJoinIterator {
@ -3001,56 +3018,12 @@ impl Iterator for HashJoinIterator {
} }
} }
} }
}
struct CartesianProductAntiJoinIterator {
left_iter: EncodedTuplesIterator,
right: Vec<EncodedTuple>,
}
impl Iterator for CartesianProductAntiJoinIterator {
type Item = Result<EncodedTuple, EvaluationError>;
fn next(&mut self) -> Option<Result<EncodedTuple, EvaluationError>> {
loop {
match self.left_iter.next()? {
Ok(left_tuple) => {
let exists_compatible_right = self.right.iter().any(|right_tuple| {
are_compatible_and_not_disjointed(&left_tuple, right_tuple)
});
if !exists_compatible_right {
return Some(Ok(left_tuple));
}
}
Err(error) => return Some(Err(error)),
}
}
}
}
struct HashAntiJoinIterator {
left_iter: EncodedTuplesIterator,
right: EncodedTupleSet,
}
impl Iterator for HashAntiJoinIterator {
type Item = Result<EncodedTuple, EvaluationError>;
fn next(&mut self) -> Option<Result<EncodedTuple, EvaluationError>> { fn size_hint(&self) -> (usize, Option<usize>) {
loop { (
match self.left_iter.next()? { 0,
Ok(left_tuple) => { self.left_iter.size_hint().1.map(|v| v * self.right.len()),
let exists_compatible_right = )
self.right.get(&left_tuple).iter().any(|right_tuple| {
are_compatible_and_not_disjointed(&left_tuple, right_tuple)
});
if !exists_compatible_right {
return Some(Ok(left_tuple));
}
}
Err(error) => return Some(Err(error)),
}
}
} }
} }
@ -3187,6 +3160,11 @@ impl Iterator for ConsecutiveDeduplication {
} }
} }
} }
fn size_hint(&self) -> (usize, Option<usize>) {
let (min, max) = self.inner.size_hint();
(if min == 0 { 0 } else { 1 }, max)
}
} }
struct ConstructIterator { struct ConstructIterator {
@ -3228,6 +3206,14 @@ impl Iterator for ConstructIterator {
} }
} }
} }
fn size_hint(&self) -> (usize, Option<usize>) {
let (min, max) = self.iter.size_hint();
(
min * self.template.len(),
max.map(|v| v * self.template.len()),
)
}
} }
fn get_triple_template_value<'a>( fn get_triple_template_value<'a>(
@ -3771,6 +3757,7 @@ pub enum ComparatorFunction {
struct EncodedTupleSet { struct EncodedTupleSet {
key: Vec<usize>, key: Vec<usize>,
map: HashMap<u64, Vec<EncodedTuple>>, map: HashMap<u64, Vec<EncodedTuple>>,
len: usize,
} }
impl EncodedTupleSet { impl EncodedTupleSet {
@ -3778,6 +3765,7 @@ impl EncodedTupleSet {
Self { Self {
key, key,
map: HashMap::new(), map: HashMap::new(),
len: 0,
} }
} }
fn insert(&mut self, tuple: EncodedTuple) { fn insert(&mut self, tuple: EncodedTuple) {
@ -3785,6 +3773,7 @@ impl EncodedTupleSet {
.entry(self.tuple_key(&tuple)) .entry(self.tuple_key(&tuple))
.or_default() .or_default()
.push(tuple); .push(tuple);
self.len += 1;
} }
fn get(&self, tuple: &EncodedTuple) -> &[EncodedTuple] { fn get(&self, tuple: &EncodedTuple) -> &[EncodedTuple] {
@ -3800,6 +3789,20 @@ impl EncodedTupleSet {
} }
hasher.finish() hasher.finish()
} }
fn len(&self) -> usize {
self.len
}
}
impl Extend<EncodedTuple> for EncodedTupleSet {
fn extend<T: IntoIterator<Item = EncodedTuple>>(&mut self, iter: T) {
let iter = iter.into_iter();
self.map.reserve(iter.size_hint().0);
for tuple in iter {
self.insert(tuple);
}
}
} }
#[test] #[test]

Loading…
Cancel
Save