MeiliSearch/index-scheduler/src/autobatcher.rs

292 lines
9.9 KiB
Rust
Raw Normal View History

use std::ops::ControlFlow;
use crate::{task::Kind, TaskId};
pub enum BatchKind {
2022-09-13 22:38:43 +02:00
DocumentClear {
ids: Vec<TaskId>,
},
DocumentAddition {
addition_ids: Vec<TaskId>,
},
DocumentDeletion {
deletion_ids: Vec<TaskId>,
},
2022-09-13 22:38:43 +02:00
ClearAndSettings {
other: Vec<TaskId>,
settings_ids: Vec<TaskId>,
},
SettingsAndDocumentAddition {
settings_ids: Vec<TaskId>,
addition_ids: Vec<TaskId>,
},
Settings {
settings_ids: Vec<TaskId>,
},
2022-09-13 22:38:43 +02:00
IndexDeletion {
ids: Vec<TaskId>,
},
2022-09-13 22:38:43 +02:00
IndexCreation {
id: TaskId,
},
2022-09-13 22:38:43 +02:00
IndexUpdate {
id: TaskId,
},
2022-09-13 22:38:43 +02:00
IndexRename {
id: TaskId,
},
IndexSwap {
id: TaskId,
},
}
impl BatchKind {
/// return true if you must stop right there.
pub fn new(task_id: TaskId, kind: Kind) -> (Self, bool) {
match kind {
2022-09-13 22:38:43 +02:00
Kind::IndexCreation => (BatchKind::IndexCreation { id: task_id }, true),
Kind::IndexDeletion => (BatchKind::IndexDeletion { ids: vec![task_id] }, true),
Kind::IndexUpdate => (BatchKind::IndexUpdate { id: task_id }, true),
Kind::IndexRename => (BatchKind::IndexRename { id: task_id }, true),
Kind::IndexSwap => (BatchKind::IndexSwap { id: task_id }, true),
Kind::DocumentClear => (BatchKind::DocumentClear { ids: vec![task_id] }, false),
Kind::DocumentAdditionOrUpdate => (
BatchKind::DocumentAddition {
addition_ids: vec![task_id],
},
false,
),
Kind::DocumentDeletion => (
BatchKind::DocumentDeletion {
deletion_ids: vec![task_id],
},
false,
),
Kind::Settings => (
BatchKind::Settings {
settings_ids: vec![task_id],
},
false,
),
Kind::DumpExport | Kind::Snapshot | Kind::CancelTask => unreachable!(),
}
}
/// Return true if you must stop.
fn accumulate(mut self, id: TaskId, kind: Kind) -> ControlFlow<Self, Self> {
match (self, kind) {
// We don't batch any of these operations
2022-09-13 22:38:43 +02:00
(
this,
Kind::IndexCreation | Kind::IndexRename | Kind::IndexUpdate | Kind::IndexSwap,
) => ControlFlow::Break(this),
// The index deletion can batch with everything but must stop after
(
2022-09-13 22:38:43 +02:00
BatchKind::DocumentClear { mut ids }
| BatchKind::DocumentAddition {
addition_ids: mut ids,
}
| BatchKind::DocumentDeletion {
deletion_ids: mut ids,
}
| BatchKind::Settings {
settings_ids: mut ids,
},
2022-09-13 22:38:43 +02:00
Kind::IndexDeletion,
) => {
ids.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Break(BatchKind::IndexDeletion { ids })
}
(
2022-09-13 22:38:43 +02:00
BatchKind::ClearAndSettings {
settings_ids: mut ids,
mut other,
}
| BatchKind::SettingsAndDocumentAddition {
addition_ids: mut ids,
settings_ids: mut other,
},
2022-09-13 22:38:43 +02:00
Kind::IndexDeletion,
) => {
ids.push(id);
ids.append(&mut other);
2022-09-13 22:38:43 +02:00
ControlFlow::Break(BatchKind::IndexDeletion { ids })
}
2022-09-13 22:38:43 +02:00
(
BatchKind::DocumentClear { mut ids },
Kind::DocumentClear | Kind::DocumentDeletion,
) => {
ids.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::DocumentClear { ids })
}
2022-09-13 22:38:43 +02:00
(
this @ BatchKind::DocumentClear { .. },
Kind::DocumentAdditionOrUpdate | Kind::Settings,
) => ControlFlow::Break(this),
(BatchKind::DocumentAddition { mut addition_ids }, Kind::DocumentClear) => {
addition_ids.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::DocumentClear { ids: addition_ids })
}
2022-09-13 22:38:43 +02:00
(BatchKind::DocumentAddition { mut addition_ids }, Kind::DocumentAdditionOrUpdate) => {
addition_ids.push(id);
ControlFlow::Continue(BatchKind::DocumentAddition { addition_ids })
}
(this @ BatchKind::DocumentAddition { .. }, Kind::DocumentDeletion) => {
ControlFlow::Break(this)
}
(BatchKind::DocumentAddition { addition_ids }, Kind::Settings) => {
ControlFlow::Continue(BatchKind::SettingsAndDocumentAddition {
settings_ids: vec![id],
addition_ids,
})
}
2022-09-13 22:38:43 +02:00
(BatchKind::DocumentDeletion { mut deletion_ids }, Kind::DocumentClear) => {
deletion_ids.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::DocumentClear { ids: deletion_ids })
}
2022-09-13 22:38:43 +02:00
(this @ BatchKind::DocumentDeletion { .. }, Kind::DocumentAdditionOrUpdate) => {
ControlFlow::Break(this)
}
(BatchKind::DocumentDeletion { mut deletion_ids }, Kind::DocumentDeletion) => {
deletion_ids.push(id);
ControlFlow::Continue(BatchKind::DocumentDeletion { deletion_ids })
}
(this @ BatchKind::DocumentDeletion { .. }, Kind::Settings) => ControlFlow::Break(this),
2022-09-13 22:38:43 +02:00
(BatchKind::Settings { settings_ids }, Kind::DocumentClear) => {
ControlFlow::Continue(BatchKind::ClearAndSettings {
settings_ids: settings_ids.clone(),
other: vec![id],
})
}
2022-09-13 22:38:43 +02:00
(this @ BatchKind::Settings { .. }, Kind::DocumentAdditionOrUpdate) => {
ControlFlow::Break(this)
}
(this @ BatchKind::Settings { .. }, Kind::DocumentDeletion) => ControlFlow::Break(this),
(BatchKind::Settings { mut settings_ids }, Kind::Settings) => {
settings_ids.push(id);
ControlFlow::Continue(BatchKind::Settings { settings_ids })
}
(
2022-09-13 22:38:43 +02:00
BatchKind::ClearAndSettings {
mut other,
settings_ids,
},
2022-09-13 22:38:43 +02:00
Kind::DocumentClear,
) => {
other.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::ClearAndSettings {
other,
settings_ids,
})
}
2022-09-13 22:38:43 +02:00
(this @ BatchKind::ClearAndSettings { .. }, Kind::DocumentAdditionOrUpdate) => {
ControlFlow::Break(this)
}
(
2022-09-13 22:38:43 +02:00
BatchKind::ClearAndSettings {
mut other,
settings_ids,
},
Kind::DocumentDeletion,
) => {
other.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::ClearAndSettings {
other,
settings_ids,
})
}
(
2022-09-13 22:38:43 +02:00
BatchKind::ClearAndSettings {
mut settings_ids,
other,
},
Kind::Settings,
) => {
settings_ids.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::ClearAndSettings {
other,
settings_ids,
})
}
(
BatchKind::SettingsAndDocumentAddition {
settings_ids,
mut addition_ids,
},
2022-09-13 22:38:43 +02:00
Kind::DocumentClear,
) => {
addition_ids.push(id);
2022-09-13 22:38:43 +02:00
ControlFlow::Continue(BatchKind::ClearAndSettings {
settings_ids,
other: addition_ids,
})
}
(
BatchKind::SettingsAndDocumentAddition {
mut addition_ids,
settings_ids,
},
2022-09-13 22:38:43 +02:00
Kind::DocumentAdditionOrUpdate,
) => {
addition_ids.push(id);
ControlFlow::Continue(BatchKind::SettingsAndDocumentAddition {
addition_ids,
settings_ids,
})
}
(this @ BatchKind::SettingsAndDocumentAddition { .. }, Kind::DocumentDeletion) => {
ControlFlow::Break(this)
}
(
BatchKind::SettingsAndDocumentAddition {
mut settings_ids,
addition_ids,
},
Kind::Settings,
) => {
settings_ids.push(id);
ControlFlow::Continue(BatchKind::SettingsAndDocumentAddition {
settings_ids,
addition_ids,
})
}
(_, Kind::CancelTask | Kind::DumpExport | Kind::Snapshot) => unreachable!(),
(
2022-09-13 22:38:43 +02:00
BatchKind::IndexCreation { .. }
| BatchKind::IndexDeletion { .. }
| BatchKind::IndexUpdate { .. }
| BatchKind::IndexRename { .. }
| BatchKind::IndexSwap { .. },
_,
) => {
unreachable!()
}
}
}
}
pub fn autobatch(enqueued: Vec<(TaskId, Kind)>) -> Option<BatchKind> {
let mut enqueued = enqueued.into_iter();
let (id, kind) = enqueued.next()?;
let (mut acc, is_finished) = BatchKind::new(id, kind);
if is_finished {
return Some(acc);
}
for (id, kind) in enqueued {
acc = match acc.accumulate(id, kind) {
ControlFlow::Continue(acc) => acc,
ControlFlow::Break(acc) => return Some(acc),
};
}
None
}