feat: uncouple geo extraction from full doc

This commit is contained in:
nnethercott
2025-05-26 09:22:20 +02:00
parent 97aeb6db4d
commit 24e94b28c1
2 changed files with 188 additions and 89 deletions

View File

@@ -8,7 +8,7 @@ use hashbrown::HashMap;
use serde_json::Value; use serde_json::Value;
use super::super::cache::BalancedCaches; use super::super::cache::BalancedCaches;
use super::facet_document::extract_document_facets; use super::facet_document::{extract_document_facets, extract_geo_document};
use super::FacetKind; use super::FacetKind;
use crate::fields_ids_map::metadata::Metadata; use crate::fields_ids_map::metadata::Metadata;
use crate::filterable_attributes_rules::match_faceted_field; use crate::filterable_attributes_rules::match_faceted_field;
@@ -90,8 +90,9 @@ impl FacetedDocidsExtractor {
let mut cached_sorter = context.data.borrow_mut_or_yield(); let mut cached_sorter = context.data.borrow_mut_or_yield();
let mut del_add_facet_value = DelAddFacetValue::new(&context.doc_alloc); let mut del_add_facet_value = DelAddFacetValue::new(&context.doc_alloc);
let docid = document_change.docid(); let docid = document_change.docid();
let res = match document_change { match document_change {
DocumentChange::Deletion(inner) => extract_document_facets( DocumentChange::Deletion(inner) => {
extract_document_facets(
inner.current(rtxn, index, context.db_fields_ids_map)?, inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(), inner.external_document_id(),
new_fields_ids_map.deref_mut(), new_fields_ids_map.deref_mut(),
@@ -99,7 +100,6 @@ impl FacetedDocidsExtractor {
sortable_fields, sortable_fields,
asc_desc_fields, asc_desc_fields,
distinct_field, distinct_field,
is_geo_enabled,
&mut |fid, meta, depth, value| { &mut |fid, meta, depth, value| {
Self::facet_fn_with_options( Self::facet_fn_with_options(
&context.doc_alloc, &context.doc_alloc,
@@ -115,7 +115,32 @@ impl FacetedDocidsExtractor {
value, value,
) )
}, },
), )?;
if is_geo_enabled {
extract_geo_document(
inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
asc_desc_fields,
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_del_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_del,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
)?;
}
}
DocumentChange::Update(inner) => { DocumentChange::Update(inner) => {
let has_changed = inner.has_changed_for_fields( let has_changed = inner.has_changed_for_fields(
&mut |field_name| { &mut |field_name| {
@@ -133,10 +158,8 @@ impl FacetedDocidsExtractor {
)?; )?;
let has_changed_for_geo_fields = let has_changed_for_geo_fields =
inner.has_changed_for_geo_fields(rtxn, index, context.db_fields_ids_map)?; inner.has_changed_for_geo_fields(rtxn, index, context.db_fields_ids_map)?;
if !has_changed && !has_changed_for_geo_fields {
return Ok(());
}
if has_changed {
extract_document_facets( extract_document_facets(
inner.current(rtxn, index, context.db_fields_ids_map)?, inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(), inner.external_document_id(),
@@ -145,7 +168,6 @@ impl FacetedDocidsExtractor {
sortable_fields, sortable_fields,
asc_desc_fields, asc_desc_fields,
distinct_field, distinct_field,
is_geo_enabled,
&mut |fid, meta, depth, value| { &mut |fid, meta, depth, value| {
Self::facet_fn_with_options( Self::facet_fn_with_options(
&context.doc_alloc, &context.doc_alloc,
@@ -171,7 +193,6 @@ impl FacetedDocidsExtractor {
sortable_fields, sortable_fields,
asc_desc_fields, asc_desc_fields,
distinct_field, distinct_field,
is_geo_enabled,
&mut |fid, meta, depth, value| { &mut |fid, meta, depth, value| {
Self::facet_fn_with_options( Self::facet_fn_with_options(
&context.doc_alloc, &context.doc_alloc,
@@ -187,9 +208,57 @@ impl FacetedDocidsExtractor {
value, value,
) )
}, },
) )?;
} }
DocumentChange::Insertion(inner) => extract_document_facets(
if is_geo_enabled && has_changed_for_geo_fields{
extract_geo_document(
inner.current(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
asc_desc_fields,
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_del_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_del,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
)?;
extract_geo_document(
inner.merged(rtxn, index, context.db_fields_ids_map)?,
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
asc_desc_fields,
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_add_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_add,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
)?;
}
}
DocumentChange::Insertion(inner) => {
extract_document_facets(
inner.inserted(), inner.inserted(),
inner.external_document_id(), inner.external_document_id(),
new_fields_ids_map.deref_mut(), new_fields_ids_map.deref_mut(),
@@ -197,7 +266,6 @@ impl FacetedDocidsExtractor {
sortable_fields, sortable_fields,
asc_desc_fields, asc_desc_fields,
distinct_field, distinct_field,
is_geo_enabled,
&mut |fid, meta, depth, value| { &mut |fid, meta, depth, value| {
Self::facet_fn_with_options( Self::facet_fn_with_options(
&context.doc_alloc, &context.doc_alloc,
@@ -213,11 +281,35 @@ impl FacetedDocidsExtractor {
value, value,
) )
}, },
), )?;
if is_geo_enabled {
extract_geo_document(
inner.inserted(),
inner.external_document_id(),
new_fields_ids_map.deref_mut(),
asc_desc_fields,
&mut |fid, meta, depth, value| {
Self::facet_fn_with_options(
&context.doc_alloc,
cached_sorter.deref_mut(),
BalancedCaches::insert_add_u32,
&mut del_add_facet_value,
DelAddFacetValue::insert_add,
docid,
fid,
meta,
filterable_attributes,
depth,
value,
)
},
)?;
}
}
}; };
del_add_facet_value.send_data(docid, sender, &context.doc_alloc).unwrap(); del_add_facet_value.send_data(docid, sender, &context.doc_alloc).unwrap();
res Ok(())
} }
#[allow(clippy::too_many_arguments)] #[allow(clippy::too_many_arguments)]

View File

@@ -22,7 +22,6 @@ pub fn extract_document_facets<'doc>(
sortable_fields: &HashSet<String>, sortable_fields: &HashSet<String>,
asc_desc_fields: &HashSet<String>, asc_desc_fields: &HashSet<String>,
distinct_field: &Option<String>, distinct_field: &Option<String>,
is_geo_enabled: bool,
facet_fn: &mut impl FnMut(FieldId, Metadata, perm_json_p::Depth, &Value) -> Result<()>, facet_fn: &mut impl FnMut(FieldId, Metadata, perm_json_p::Depth, &Value) -> Result<()>,
) -> Result<()> { ) -> Result<()> {
// return the match result for the given field name. // return the match result for the given field name.
@@ -102,7 +101,16 @@ pub fn extract_document_facets<'doc>(
} }
} }
if is_geo_enabled { Ok(())
}
pub fn extract_geo_document<'doc>(
document: impl Document<'doc>,
external_document_id: &str,
field_id_map: &mut GlobalFieldsIdsMap,
asc_desc_fields: &HashSet<String>,
facet_fn: &mut impl FnMut(FieldId, Metadata, perm_json_p::Depth, &Value) -> Result<()>,
) -> Result<()> {
if let Some(geo_value) = document.geo_field()? { if let Some(geo_value) = document.geo_field()? {
if let Some([lat, lng]) = extract_geo_coordinates(external_document_id, geo_value)? { if let Some([lat, lng]) = extract_geo_coordinates(external_document_id, geo_value)? {
let ((lat_fid, lat_meta), (lng_fid, lng_meta)) = field_id_map let ((lat_fid, lat_meta), (lng_fid, lng_meta)) = field_id_map
@@ -114,7 +122,6 @@ pub fn extract_document_facets<'doc>(
facet_fn(lng_fid, lng_meta, perm_json_p::Depth::OnBaseKey, &lng.into())?; facet_fn(lng_fid, lng_meta, perm_json_p::Depth::OnBaseKey, &lng.into())?;
} }
} }
}
Ok(()) Ok(())
} }