Merge pull request #5592 from nnethercott/extract-geo-facets-seperately

Decouple geo facet extraction from rest of document
This commit is contained in:
Many the fish
2025-05-28 16:22:10 +00:00
committed by GitHub
2 changed files with 134 additions and 111 deletions

View File

@@ -8,7 +8,7 @@ use hashbrown::HashMap;
use serde_json::Value; use serde_json::Value;
use super::super::cache::BalancedCaches; use super::super::cache::BalancedCaches;
use super::facet_document::extract_document_facets; use super::facet_document::{extract_document_facets, extract_geo_document};
use super::FacetKind; use super::FacetKind;
use crate::fields_ids_map::metadata::Metadata; use crate::fields_ids_map::metadata::Metadata;
use crate::filterable_attributes_rules::match_faceted_field; use crate::filterable_attributes_rules::match_faceted_field;
@@ -90,17 +90,12 @@ impl FacetedDocidsExtractor {
let mut cached_sorter = context.data.borrow_mut_or_yield(); let mut cached_sorter = context.data.borrow_mut_or_yield();
let mut del_add_facet_value = DelAddFacetValue::new(&context.doc_alloc); let mut del_add_facet_value = DelAddFacetValue::new(&context.doc_alloc);
let docid = document_change.docid(); let docid = document_change.docid();
let res = match document_change {
DocumentChange::Deletion(inner) => extract_document_facets( // Using a macro avoid borrowing the parameters as mutable in both closures at
inner.current(rtxn, index, context.db_fields_ids_map)?, // the same time by postponing their creation
inner.external_document_id(), macro_rules! facet_fn {
new_fields_ids_map.deref_mut(), (del) => {
filterable_attributes, |fid: FieldId, meta: Metadata, depth: perm_json_p::Depth, value: &Value| {
sortable_fields,
asc_desc_fields,
distinct_field,
is_geo_enabled,
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options( Self::facet_fn_with_options(
&context.doc_alloc, &context.doc_alloc,
cached_sorter.deref_mut(), cached_sorter.deref_mut(),
@@ -114,10 +109,52 @@ impl FacetedDocidsExtractor {
depth, depth,
value, value,
) )
}, }
), };
(add) => {
|fid: FieldId, meta: Metadata, depth: perm_json_p::Depth, value: &Value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_add_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_add,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
}
};
}
match document_change {
DocumentChange::Deletion(inner) => {
let mut del = facet_fn!(del);
extract_document_facets(
inner.current(rtxn, index, context.db_fields_ids_map)?,
new_fields_ids_map.deref_mut(),
filterable_attributes,
sortable_fields,
asc_desc_fields,
distinct_field,
&mut del,
)?;
if is_geo_enabled {
extract_geo_document(
inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
&mut del,
)?;
}
}
DocumentChange::Update(inner) => { DocumentChange::Update(inner) => {
let has_changed = inner.has_changed_for_fields( let has_changed_for_facets = inner.has_changed_for_fields(
&mut |field_name| { &mut |field_name| {
match_faceted_field( match_faceted_field(
field_name, field_name,
@@ -131,93 +168,74 @@ impl FacetedDocidsExtractor {
index, index,
context.db_fields_ids_map, context.db_fields_ids_map,
)?; )?;
let has_changed_for_geo_fields =
inner.has_changed_for_geo_fields(rtxn, index, context.db_fields_ids_map)?;
if !has_changed && !has_changed_for_geo_fields {
return Ok(());
}
// 1. Maybe update doc
if has_changed_for_facets {
extract_document_facets( extract_document_facets(
inner.current(rtxn, index, context.db_fields_ids_map)?, inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(), new_fields_ids_map.deref_mut(),
filterable_attributes, filterable_attributes,
sortable_fields, sortable_fields,
asc_desc_fields, asc_desc_fields,
distinct_field, distinct_field,
is_geo_enabled, &mut facet_fn!(del),
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_del_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_del,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
)?; )?;
extract_document_facets( extract_document_facets(
inner.merged(rtxn, index, context.db_fields_ids_map)?, inner.merged(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(), new_fields_ids_map.deref_mut(),
filterable_attributes, filterable_attributes,
sortable_fields, sortable_fields,
asc_desc_fields, asc_desc_fields,
distinct_field, distinct_field,
is_geo_enabled, &mut facet_fn!(add),
&mut |fid, meta, depth, value| { )?;
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_add_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_add,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
)
} }
DocumentChange::Insertion(inner) => extract_document_facets(
// 2. Maybe update geo
if is_geo_enabled
&& inner.has_changed_for_geo_fields(rtxn, index, context.db_fields_ids_map)?
{
extract_geo_document(
inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
&mut facet_fn!(del),
)?;
extract_geo_document(
inner.merged(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
&mut facet_fn!(add),
)?;
}
}
DocumentChange::Insertion(inner) => {
let mut add = facet_fn!(add);
extract_document_facets(
inner.inserted(),
new_fields_ids_map.deref_mut(),
filterable_attributes,
sortable_fields,
asc_desc_fields,
distinct_field,
&mut add,
)?;
if is_geo_enabled {
extract_geo_document(
inner.inserted(), inner.inserted(),
inner.external_document_id(), inner.external_document_id(),
new_fields_ids_map.deref_mut(), new_fields_ids_map.deref_mut(),
filterable_attributes, &mut add,
sortable_fields, )?;
asc_desc_fields, }
distinct_field, }
is_geo_enabled,
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_add_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_add,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
),
}; };
del_add_facet_value.send_data(docid, sender, &context.doc_alloc).unwrap(); del_add_facet_value.send_data(docid, sender, &context.doc_alloc).unwrap();
res Ok(())
} }
#[allow(clippy::too_many_arguments)] #[allow(clippy::too_many_arguments)]

View File

@@ -16,13 +16,11 @@ use crate::filterable_attributes_rules::match_faceted_field;
#[allow(clippy::too_many_arguments)] #[allow(clippy::too_many_arguments)]
pub fn extract_document_facets<'doc>( pub fn extract_document_facets<'doc>(
document: impl Document<'doc>, document: impl Document<'doc>,
external_document_id: &str,
field_id_map: &mut GlobalFieldsIdsMap, field_id_map: &mut GlobalFieldsIdsMap,
filterable_attributes: &[FilterableAttributesRule], filterable_attributes: &[FilterableAttributesRule],
sortable_fields: &HashSet<String>, sortable_fields: &HashSet<String>,
asc_desc_fields: &HashSet<String>, asc_desc_fields: &HashSet<String>,
distinct_field: &Option<String>, distinct_field: &Option<String>,
is_geo_enabled: bool,
facet_fn: &mut impl FnMut(FieldId, Metadata, perm_json_p::Depth, &Value) -> Result<()>, facet_fn: &mut impl FnMut(FieldId, Metadata, perm_json_p::Depth, &Value) -> Result<()>,
) -> Result<()> { ) -> Result<()> {
// return the match result for the given field name. // return the match result for the given field name.
@@ -102,7 +100,15 @@ pub fn extract_document_facets<'doc>(
} }
} }
if is_geo_enabled { Ok(())
}
pub fn extract_geo_document<'doc>(
document: impl Document<'doc>,
external_document_id: &str,
field_id_map: &mut GlobalFieldsIdsMap,
facet_fn: &mut impl FnMut(FieldId, Metadata, perm_json_p::Depth, &Value) -> Result<()>,
) -> Result<()> {
if let Some(geo_value) = document.geo_field()? { if let Some(geo_value) = document.geo_field()? {
if let Some([lat, lng]) = extract_geo_coordinates(external_document_id, geo_value)? { if let Some([lat, lng]) = extract_geo_coordinates(external_document_id, geo_value)? {
let ((lat_fid, lat_meta), (lng_fid, lng_meta)) = field_id_map let ((lat_fid, lat_meta), (lng_fid, lng_meta)) = field_id_map
@@ -114,7 +120,6 @@ pub fn extract_document_facets<'doc>(
facet_fn(lng_fid, lng_meta, perm_json_p::Depth::OnBaseKey, &lng.into())?; facet_fn(lng_fid, lng_meta, perm_json_p::Depth::OnBaseKey, &lng.into())?;
} }
} }
}
Ok(()) Ok(())
} }