Skip to content

Commit

Permalink
fix LSH index not properly cleaned after tuple deletion
Browse files Browse the repository at this point in the history
  • Loading branch information
zh217 committed Jun 26, 2023
1 parent 6c07666 commit 0de57c3
Show file tree
Hide file tree
Showing 3 changed files with 29 additions and 2 deletions.
3 changes: 2 additions & 1 deletion cozo-core/src/query/stored.rs
Original file line number Diff line number Diff line change
Expand Up @@ -952,6 +952,7 @@ impl<'a> SessionTx<'a> {
let has_indices = !relation_store.indices.is_empty();
let has_hnsw_indices = !relation_store.hnsw_indices.is_empty();
let has_fts_indices = !relation_store.fts_indices.is_empty();
let has_lsh_indices = !relation_store.lsh_indices.is_empty();
let fts_processors = self.make_fts_lsh_processors(relation_store)?;
let mut new_tuples: Vec<DataValue> = vec![];
let mut old_tuples: Vec<DataValue> = vec![];
Expand All @@ -977,7 +978,7 @@ impl<'a> SessionTx<'a> {
});
}
}
if need_to_collect || has_indices || has_hnsw_indices || has_fts_indices {
if need_to_collect || has_indices || has_hnsw_indices || has_fts_indices || has_lsh_indices {
if let Some(existing) = self.store_tx.get(&key, false)? {
let mut tup = extracted.clone();
extend_tuple_from_v(&mut tup, &existing);
Expand Down
2 changes: 1 addition & 1 deletion cozo-core/src/runtime/minhash_lsh.rs
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ impl<'a> SessionTx<'a> {
) -> Result<()> {
let bytes = match bytes {
None => {
if let Some(mut found) = inv_idx_handle.get_val_only(self, tuple)? {
if let Some(mut found) = inv_idx_handle.get_val_only(self, &tuple[..inv_idx_handle.metadata.keys.len()])? {
let inv_key = inv_idx_handle.encode_key_for_store(tuple, Default::default())?;
self.store_tx.del(&inv_key)?;
match found.pop() {
Expand Down
26 changes: 26 additions & 0 deletions cozo-core/src/runtime/tests.rs
Original file line number Diff line number Diff line change
Expand Up @@ -905,6 +905,32 @@ fn test_lsh_indexing3() {
}
}


#[test]
fn test_lsh_indexing4() {
for i in 1..10 {
let f = i as f64 / 10.;
let db = DbInstance::new("mem", "", "").unwrap();
db.run_default(r":create a {k: String => v: String}")
.unwrap();
db.run_script(
r"::lsh create a:lsh {extractor: v, tokenizer: NGram, n_gram: 3, target_threshold: $t }",
BTreeMap::from([("t".into(), f.into())]),
ScriptMutability::Mutable
)
.unwrap();
db.run_default("?[k, v] <- [['a', 'ewiygfspeoighjsfcfxzdfncalsdf']] :put a {k => v}")
.unwrap();
db.run_default("?[k] <- [['a']] :rm a {k}")
.unwrap();
let res = db
.run_default("?[k] := ~a:lsh{k | query: 'ewiygfspeoighjsfcfxzdfncalsdf', k: 1}")
.unwrap();
assert!(res.rows.len() == 0);
}
}


#[test]
fn test_lsh_indexing() {
let db = DbInstance::new("mem", "", "").unwrap();
Expand Down

0 comments on commit 0de57c3

Please sign in to comment.