From 970a489dcc31c23d70478b8a595b41e2aeadd3a2 Mon Sep 17 00:00:00 2001 From: Tamo Date: Mon, 30 Dec 2024 16:21:06 +0100 Subject: [PATCH 1/4] add a test reproducing the bug --- crates/meilisearch/tests/documents/add_documents.rs | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/crates/meilisearch/tests/documents/add_documents.rs b/crates/meilisearch/tests/documents/add_documents.rs index d72b1a7a8..d164d9a27 100644 --- a/crates/meilisearch/tests/documents/add_documents.rs +++ b/crates/meilisearch/tests/documents/add_documents.rs @@ -1220,9 +1220,12 @@ async fn replace_document() { #[actix_rt::test] async fn add_no_documents() { let server = Server::new().await; - let index = server.index("test"); - let (_response, code) = index.add_documents(json!([]), None).await; + let index = server.index("kefir"); + let (task, code) = index.add_documents(json!([]), None).await; snapshot!(code, @"202 Accepted"); + let task = server.wait_task(task.uid()).await; + let task = task.succeeded(); + snapshot!(task, @""); } #[actix_rt::test] From 33921747b7d66425fc0a8b386248125a4aa25e1c Mon Sep 17 00:00:00 2001 From: Tamo Date: Mon, 30 Dec 2024 17:48:25 +0100 Subject: [PATCH 2/4] stop skipping empty tasks when adding documents --- crates/index-scheduler/src/batch.rs | 4 +--- crates/index-scheduler/src/utils.rs | 5 ++++- .../tests/documents/add_documents.rs | 20 ++++++++++++++++++- 3 files changed, 24 insertions(+), 5 deletions(-) diff --git a/crates/index-scheduler/src/batch.rs b/crates/index-scheduler/src/batch.rs index a40eac02c..e23d1c1bb 100644 --- a/crates/index-scheduler/src/batch.rs +++ b/crates/index-scheduler/src/batch.rs @@ -1312,9 +1312,7 @@ impl IndexScheduler { if let DocumentOperation::Add(content_uuid) = operation { let content_file = self.file_store.get_update(*content_uuid)?; let mmap = unsafe { memmap2::Mmap::map(&content_file)? }; - if !mmap.is_empty() { - content_files.push(mmap); - } + content_files.push(mmap); } } diff --git a/crates/index-scheduler/src/utils.rs b/crates/index-scheduler/src/utils.rs index 1fcedfddf..8bcf70f3c 100644 --- a/crates/index-scheduler/src/utils.rs +++ b/crates/index-scheduler/src/utils.rs @@ -291,7 +291,10 @@ impl IndexScheduler { debug_assert!(old_task != *task); debug_assert_eq!(old_task.uid, task.uid); - debug_assert!(old_task.batch_uid.is_none() && task.batch_uid.is_some()); + debug_assert!( + old_task.batch_uid.is_none() && task.batch_uid.is_some(), + "\n==> old: {old_task:?}\n==> new: {task:?}" + ); if old_task.status != task.status { self.update_status(wtxn, old_task.status, |bitmap| { diff --git a/crates/meilisearch/tests/documents/add_documents.rs b/crates/meilisearch/tests/documents/add_documents.rs index d164d9a27..6c9222717 100644 --- a/crates/meilisearch/tests/documents/add_documents.rs +++ b/crates/meilisearch/tests/documents/add_documents.rs @@ -1225,7 +1225,25 @@ async fn add_no_documents() { snapshot!(code, @"202 Accepted"); let task = server.wait_task(task.uid()).await; let task = task.succeeded(); - snapshot!(task, @""); + snapshot!(task, @r#" + { + "uid": "[uid]", + "batchUid": "[batch_uid]", + "indexUid": "kefir", + "status": "succeeded", + "type": "documentAdditionOrUpdate", + "canceledBy": null, + "details": { + "receivedDocuments": 0, + "indexedDocuments": 0 + }, + "error": null, + "duration": "[duration]", + "enqueuedAt": "[date]", + "startedAt": "[date]", + "finishedAt": "[date]" + } + "#); } #[actix_rt::test] From 47b484c07c6d3b66323575349ed6092f3ff1f787 Mon Sep 17 00:00:00 2001 From: Tamo Date: Tue, 31 Dec 2024 17:24:32 +0100 Subject: [PATCH 3/4] update the test to ensure it works when specifying the primary key or not: it doesn't work --- .../tests/documents/add_documents.rs | 59 +++++++++++++++++++ 1 file changed, 59 insertions(+) diff --git a/crates/meilisearch/tests/documents/add_documents.rs b/crates/meilisearch/tests/documents/add_documents.rs index 6c9222717..7eedeed3d 100644 --- a/crates/meilisearch/tests/documents/add_documents.rs +++ b/crates/meilisearch/tests/documents/add_documents.rs @@ -1244,6 +1244,65 @@ async fn add_no_documents() { "finishedAt": "[date]" } "#); + + let (task, _code) = index.add_documents(json!([]), Some("kefkef")).await; + let task = server.wait_task(task.uid()).await; + let task = task.succeeded(); + snapshot!(task, @r#" + { + "uid": "[uid]", + "batchUid": "[batch_uid]", + "indexUid": "kefir", + "status": "succeeded", + "type": "documentAdditionOrUpdate", + "canceledBy": null, + "details": { + "receivedDocuments": 0, + "indexedDocuments": 0 + }, + "error": null, + "duration": "[duration]", + "enqueuedAt": "[date]", + "startedAt": "[date]", + "finishedAt": "[date]" + } + "#); + + let (task, _code) = index.add_documents(json!([{ "kefkef": 1 }]), None).await; + let task = server.wait_task(task.uid()).await; + let task = task.succeeded(); + snapshot!(task, @r#" + { + "uid": "[uid]", + "batchUid": "[batch_uid]", + "indexUid": "kefir", + "status": "succeeded", + "type": "documentAdditionOrUpdate", + "canceledBy": null, + "details": { + "receivedDocuments": 1, + "indexedDocuments": 1 + }, + "error": null, + "duration": "[duration]", + "enqueuedAt": "[date]", + "startedAt": "[date]", + "finishedAt": "[date]" + } + "#); + let (documents, _status) = index.get_all_documents(GetAllDocumentsOptions::default()).await; + snapshot!(documents, @r#" + { + "results": [ + { + "kefkef": 1 + } + ], + "offset": 0, + "limit": 20, + "total": 1 + } + "#); } #[actix_rt::test] From 19f48c15fb24c952b605e751fa62c6ece9f2997d Mon Sep 17 00:00:00 2001 From: Tamo Date: Tue, 31 Dec 2024 18:00:14 +0100 Subject: [PATCH 4/4] Fix the addition of empty payload --- .../update/new/indexer/document_operation.rs | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) diff --git a/crates/milli/src/update/new/indexer/document_operation.rs b/crates/milli/src/update/new/indexer/document_operation.rs index 090c1eb8e..5ccac4297 100644 --- a/crates/milli/src/update/new/indexer/document_operation.rs +++ b/crates/milli/src/update/new/indexer/document_operation.rs @@ -252,6 +252,24 @@ fn extract_addition_payload_changes<'r, 'pl: 'r>( previous_offset = iter.byte_offset(); } + if payload.is_empty() { + let result = retrieve_or_guess_primary_key( + rtxn, + index, + new_fields_ids_map, + primary_key_from_op, + None, + ); + match result { + Ok(Ok((pk, _))) => { + primary_key.get_or_insert(pk); + } + Ok(Err(UserError::NoPrimaryKeyCandidateFound)) => (), + Ok(Err(user_error)) => return Err(Error::UserError(user_error)), + Err(error) => return Err(error), + }; + } + Ok(new_docids_version_offsets) }