Introduce a new CLI flag and env var to use the old document indexer when importing dumps
2025-07-26 00:01:00 +00:00 · 2025-07-17 16:12:23 +02:00
parent fd8b2451d7
commit fe15e11c9d
4 changed files with 73 additions and 37 deletions
--- a/crates/index-scheduler/src/lib.rs
+++ b/crates/index-scheduler/src/lib.rs
@ -139,6 +139,8 @@ pub struct IndexSchedulerOptions {
    pub embedding_cache_cap: usize,
    /// Snapshot compaction status.
    pub experimental_no_snapshot_compaction: bool,
+    /// Whether dump imports use the old document indexer instead of the new one.
+    pub experimental_no_edition_2024_for_dumps: bool,
 }

 /// Structure which holds meilisearch's indexes and schedules the tasks
@ -168,6 +170,9 @@ pub struct IndexScheduler {
    /// Whether we should automatically cleanup the task queue or not.
    pub(crate) cleanup_enabled: bool,

+    /// Whether dump imports should use the old document indexer instead of the new one.
+    pub(crate) experimental_no_edition_2024_for_dumps: bool,
+
    /// The webhook url we should send tasks to after processing every batches.
    pub(crate) webhook_url: Option<String>,
    /// The Authorization header to send to the webhook URL.
@ -210,6 +215,7 @@ impl IndexScheduler {

            index_mapper: self.index_mapper.clone(),
            cleanup_enabled: self.cleanup_enabled,
+            experimental_no_edition_2024_for_dumps: self.experimental_no_edition_2024_for_dumps,
            webhook_url: self.webhook_url.clone(),
            webhook_authorization_header: self.webhook_authorization_header.clone(),
            embedders: self.embedders.clone(),
@ -296,6 +302,7 @@ impl IndexScheduler {
            index_mapper,
            env,
            cleanup_enabled: options.cleanup_enabled,
+            experimental_no_edition_2024_for_dumps: options.experimental_no_edition_2024_for_dumps,
            webhook_url: options.webhook_url,
            webhook_authorization_header: options.webhook_authorization_header,
            embedders: Default::default(),
@ -594,6 +601,11 @@ impl IndexScheduler {
        Ok(nbr_index_processing_tasks > 0)
    }

+    /// Returns whether dump imports should use the old document indexer
+    /// instead of the new one.
+    ///
+    /// This is a plain accessor for the scheduler's
+    /// `experimental_no_edition_2024_for_dumps` setting.
+    pub fn no_edition_2024_for_dumps(&self) -> bool {
+        self.experimental_no_edition_2024_for_dumps
+    }
+
    /// Return the tasks matching the query from the user's point of view along
    /// with the total number of tasks matching the query, ignoring from and limit.
    ///