mirror of
https://github.com/meilisearch/meilisearch.git
synced 2025-10-24 04:26:27 +00:00
Introduce a new way to determine the operations to perform on the fields
This commit is contained in:
committed by
ManyTheFish
parent
0f578348f1
commit
87cf8a3c94
@@ -843,29 +843,6 @@ impl<'a, 'i> Transform<'a, 'i> {
|
|||||||
// Always keep the primary key.
|
// Always keep the primary key.
|
||||||
let is_primary_key = |id: FieldId| -> bool { settings_diff.primary_key_id == Some(id) };
|
let is_primary_key = |id: FieldId| -> bool { settings_diff.primary_key_id == Some(id) };
|
||||||
|
|
||||||
// If only the `searchableAttributes` has been changed, keep only the searchable fields.
|
|
||||||
// However, if only new searchable attributes are added, this function will
|
|
||||||
// return false has fields do not need to be reindexed.
|
|
||||||
let must_reindex_searchables = settings_diff.reindex_searchable();
|
|
||||||
let must_index_only_additional_searchables = &settings_diff.only_additional_fields();
|
|
||||||
let necessary_searchable_field_to_reindex = move |id: FieldId| -> bool {
|
|
||||||
must_index_only_additional_searchables.is_none()
|
|
||||||
&& must_reindex_searchables
|
|
||||||
&& (settings_diff.old.searchable_fields_ids.contains(&id)
|
|
||||||
|| settings_diff.new.searchable_fields_ids.contains(&id))
|
|
||||||
};
|
|
||||||
|
|
||||||
// If only new `searchableAttributes` are present, keep only those ones.
|
|
||||||
let additional_searchable_field_only = move |id: FieldId| -> bool {
|
|
||||||
match must_index_only_additional_searchables {
|
|
||||||
Some(additional_fields) => {
|
|
||||||
let additional_field = settings_diff.new.fields_ids_map.name(id).unwrap();
|
|
||||||
additional_fields.contains(additional_field)
|
|
||||||
}
|
|
||||||
None => false,
|
|
||||||
}
|
|
||||||
};
|
|
||||||
|
|
||||||
// If only a faceted field has been added, keep only this field.
|
// If only a faceted field has been added, keep only this field.
|
||||||
let must_reindex_facets = settings_diff.reindex_facets();
|
let must_reindex_facets = settings_diff.reindex_facets();
|
||||||
let necessary_faceted_field = |id: FieldId| -> bool {
|
let necessary_faceted_field = |id: FieldId| -> bool {
|
||||||
@@ -880,20 +857,16 @@ impl<'a, 'i> Transform<'a, 'i> {
|
|||||||
// we need the fields for the prompt/templating.
|
// we need the fields for the prompt/templating.
|
||||||
let reindex_vectors = settings_diff.reindex_vectors();
|
let reindex_vectors = settings_diff.reindex_vectors();
|
||||||
|
|
||||||
// The set of additional searchable fields only,
|
// The operations that we must perform on the different fields.
|
||||||
// the only purpose of these fields is to be indexed from scratch.
|
let mut operations = HashMap::new();
|
||||||
let mut additional_searchables_only = HashSet::new();
|
|
||||||
|
|
||||||
let mut obkv_writer = KvWriter::<_, FieldId>::memory();
|
let mut obkv_writer = KvWriter::<_, FieldId>::memory();
|
||||||
for (id, val) in old_obkv.iter() {
|
for (id, val) in old_obkv.iter() {
|
||||||
if is_primary_key(id)
|
if is_primary_key(id) || necessary_faceted_field(id) || reindex_vectors {
|
||||||
|| necessary_searchable_field_to_reindex(id)
|
operations.insert(id, DelAddOperation::DeletionAndAddition);
|
||||||
|| necessary_faceted_field(id)
|
|
||||||
|| reindex_vectors
|
|
||||||
{
|
|
||||||
obkv_writer.insert(id, val)?;
|
obkv_writer.insert(id, val)?;
|
||||||
} else if additional_searchable_field_only(id) {
|
} else if let Some(operation) = settings_diff.reindex_searchable_id(id) {
|
||||||
additional_searchables_only.insert(id);
|
operations.insert(id, operation);
|
||||||
obkv_writer.insert(id, val)?;
|
obkv_writer.insert(id, val)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@@ -913,13 +886,7 @@ impl<'a, 'i> Transform<'a, 'i> {
|
|||||||
|
|
||||||
flattened_obkv_buffer.clear();
|
flattened_obkv_buffer.clear();
|
||||||
into_del_add_obkv_conditional_operation(flattened, flattened_obkv_buffer, |id| {
|
into_del_add_obkv_conditional_operation(flattened, flattened_obkv_buffer, |id| {
|
||||||
// If the field is only required because it is an additional
|
operations.get(&id).copied().unwrap_or(DelAddOperation::DeletionAndAddition)
|
||||||
// searchable field only define it as an DelAdd::Addition only.
|
|
||||||
if additional_searchables_only.contains(&id) {
|
|
||||||
DelAddOperation::Addition
|
|
||||||
} else {
|
|
||||||
DelAddOperation::DeletionAndAddition
|
|
||||||
}
|
|
||||||
})?;
|
})?;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@@ -9,6 +9,7 @@ use itertools::{EitherOrBoth, Itertools};
|
|||||||
use serde::{Deserialize, Deserializer, Serialize, Serializer};
|
use serde::{Deserialize, Deserializer, Serialize, Serializer};
|
||||||
use time::OffsetDateTime;
|
use time::OffsetDateTime;
|
||||||
|
|
||||||
|
use super::del_add::DelAddOperation;
|
||||||
use super::index_documents::{IndexDocumentsConfig, Transform};
|
use super::index_documents::{IndexDocumentsConfig, Transform};
|
||||||
use super::IndexerConfig;
|
use super::IndexerConfig;
|
||||||
use crate::criterion::Criterion;
|
use crate::criterion::Criterion;
|
||||||
@@ -1112,6 +1113,31 @@ impl InnerIndexSettingsDiff {
|
|||||||
|| self.old.proximity_precision != self.new.proximity_precision
|
|| self.old.proximity_precision != self.new.proximity_precision
|
||||||
}
|
}
|
||||||
|
|
||||||
|
pub fn reindex_searchable_id(&self, id: FieldId) -> Option<DelAddOperation> {
|
||||||
|
if self.old.stop_words.as_ref().map(|set| set.as_fst().as_bytes())
|
||||||
|
!= self.new.stop_words.as_ref().map(|set| set.as_fst().as_bytes())
|
||||||
|
|| self.old.allowed_separators != self.new.allowed_separators
|
||||||
|
|| self.old.dictionary != self.new.dictionary
|
||||||
|
|| self.old.exact_attributes != self.new.exact_attributes
|
||||||
|
// Here we can be much more optimal by just deleting the proximity database
|
||||||
|
|| self.old.proximity_precision != self.new.proximity_precision
|
||||||
|
{
|
||||||
|
Some(DelAddOperation::DeletionAndAddition)
|
||||||
|
} else if let Some(only_additional_fields) = self.only_additional_fields() {
|
||||||
|
let additional_field = self.new.fields_ids_map.name(id).unwrap();
|
||||||
|
if only_additional_fields.contains(additional_field) {
|
||||||
|
Some(DelAddOperation::Addition)
|
||||||
|
} else {
|
||||||
|
None
|
||||||
|
}
|
||||||
|
} else if self.old.user_defined_searchable_fields != self.new.user_defined_searchable_fields
|
||||||
|
{
|
||||||
|
Some(DelAddOperation::DeletionAndAddition)
|
||||||
|
} else {
|
||||||
|
None
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
/// Returns only the additional searchable fields.
|
/// Returns only the additional searchable fields.
|
||||||
/// If any other searchable field has been modified, returns None.
|
/// If any other searchable field has been modified, returns None.
|
||||||
pub fn only_additional_fields(&self) -> Option<HashSet<String>> {
|
pub fn only_additional_fields(&self) -> Option<HashSet<String>> {
|
||||||
@@ -1599,7 +1625,7 @@ mod tests {
|
|||||||
// When we search for something that is not in
|
// When we search for something that is not in
|
||||||
// the searchable fields it must not return any document.
|
// the searchable fields it must not return any document.
|
||||||
let result = index.search(&rtxn).query("23").execute().unwrap();
|
let result = index.search(&rtxn).query("23").execute().unwrap();
|
||||||
assert!(result.documents_ids.is_empty());
|
assert_eq!(result.documents_ids, Vec::<u32>::new());
|
||||||
|
|
||||||
// When we search for something that is in the searchable fields
|
// When we search for something that is in the searchable fields
|
||||||
// we must find the appropriate document.
|
// we must find the appropriate document.
|
||||||
|
Reference in New Issue
Block a user