Update cellulite to the latest version

This commit is contained in:
Tamo
2025-09-17 10:46:27 +02:00
parent 3dac2cf73e
commit fec10bb2d6
13 changed files with 34 additions and 37 deletions

View File

@@ -230,6 +230,7 @@ pub fn request_threads() -> &'static ThreadPoolNoAbort {
/// Extract chunked data and send it into lmdb_writer_sx sender:
/// - documents
#[allow(clippy::too_many_arguments)]
fn send_original_documents_data(
original_documents_chunk: Result<grenad::Reader<BufReader<File>>>,
indexer: GrenadParameters,

View File

@@ -523,7 +523,7 @@ where
.is_some_and(|conf| conf.is_quantized);
let is_quantizing = embedder_config.is_some_and(|action| action.is_being_quantized);
pool.install(|| {
pool.install(|| -> Result<_> {
let mut writer =
VectorStore::new(backend, vector_store, embedder_index, was_quantized);
writer.build_and_quantize(
@@ -541,7 +541,7 @@ where
.map_err(InternalError::from)??;
}
self.index.cellulite.build(self.wtxn, &Progress::default())?;
self.index.cellulite.build(self.wtxn, &self.should_abort, &Progress::default())?;
self.execute_prefix_databases(
word_docids.map(MergerBuilder::build),

View File

@@ -189,7 +189,11 @@ where
println!("Building geojson");
indexing_context.progress.update_progress(IndexingStep::BuildingGeoJson);
index.cellulite.build(wtxn, indexing_context.progress)?;
index.cellulite.build(
wtxn,
&indexing_context.must_stop_processing,
indexing_context.progress,
)?;
indexing_context.progress.update_progress(IndexingStep::Finalizing);
@@ -322,7 +326,11 @@ where
.unwrap()?;
indexing_context.progress.update_progress(IndexingStep::BuildingGeoJson);
index.cellulite.build(wtxn, indexing_context.progress)?;
index.cellulite.build(
wtxn,
&indexing_context.must_stop_processing,
indexing_context.progress,
)?;
indexing_context.progress.update_progress(IndexingStep::Finalizing);

View File

@@ -17,7 +17,6 @@ use crate::vector::db::IndexEmbeddingConfig;
use crate::vector::settings::EmbedderAction;
use crate::vector::{Embedder, Embeddings, RuntimeEmbedders, VectorStore};
use crate::{DocumentId, Error, Index, InternalError, Result, UserError};
use crate::{Error, Index, InternalError, Result, UserError};
pub fn write_to_db(
mut writer_receiver: WriterBbqueueReceiver<'_>,