mirror of
				https://github.com/meilisearch/meilisearch.git
				synced 2025-10-25 21:16:28 +00:00 
			
		
		
		
	Compute the size of the auth-controller, index-scheduler and all update files in the global stats
This commit is contained in:
		| @@ -1,4 +1,3 @@ | ||||
| use std::collections::BTreeSet; | ||||
| use std::fs::File as StdFile; | ||||
| use std::ops::{Deref, DerefMut}; | ||||
| use std::path::{Path, PathBuf}; | ||||
| @@ -11,10 +10,14 @@ const UPDATE_FILES_PATH: &str = "updates/updates_files"; | ||||
|  | ||||
| #[derive(Debug, thiserror::Error)] | ||||
| pub enum Error { | ||||
|     #[error("Could not parse file name as utf-8")] | ||||
|     CouldNotParseFileNameAsUtf8, | ||||
|     #[error(transparent)] | ||||
|     IoError(#[from] std::io::Error), | ||||
|     #[error(transparent)] | ||||
|     PersistError(#[from] tempfile::PersistError), | ||||
|     #[error(transparent)] | ||||
|     UuidError(#[from] uuid::Error), | ||||
| } | ||||
|  | ||||
| pub type Result<T> = std::result::Result<T, Error>; | ||||
| @@ -33,13 +36,11 @@ impl DerefMut for File { | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[cfg_attr(test, faux::create)] | ||||
| #[derive(Clone, Debug)] | ||||
| pub struct FileStore { | ||||
|     path: PathBuf, | ||||
| } | ||||
|  | ||||
| #[cfg(not(test))] | ||||
| impl FileStore { | ||||
|     pub fn new(path: impl AsRef<Path>) -> Result<FileStore> { | ||||
|         let path = path.as_ref().to_path_buf(); | ||||
| @@ -48,7 +49,6 @@ impl FileStore { | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[cfg_attr(test, faux::methods)] | ||||
| impl FileStore { | ||||
|     /// Creates a new temporary update file. | ||||
|     /// A call to `persist` is needed to persist the file in the database. | ||||
| @@ -94,6 +94,14 @@ impl FileStore { | ||||
|         Ok(()) | ||||
|     } | ||||
|  | ||||
|     pub fn update_total_size(&self) -> Result<u64> { | ||||
|         let mut total = 0; | ||||
|         for uuid in self.all_uuids()? { | ||||
|             total += self.get_size(uuid?)?; | ||||
|         } | ||||
|         Ok(total) | ||||
|     } | ||||
|  | ||||
|     pub fn get_size(&self, uuid: Uuid) -> Result<u64> { | ||||
|         Ok(self.get_update(uuid)?.metadata()?.len()) | ||||
|     } | ||||
| @@ -105,17 +113,12 @@ impl FileStore { | ||||
|     } | ||||
|  | ||||
|     /// List the Uuids of the files in the FileStore | ||||
|     /// | ||||
|     /// This function is meant to be used by tests only. | ||||
|     #[doc(hidden)] | ||||
|     pub fn __all_uuids(&self) -> BTreeSet<Uuid> { | ||||
|         let mut uuids = BTreeSet::new(); | ||||
|         for entry in self.path.read_dir().unwrap() { | ||||
|             let entry = entry.unwrap(); | ||||
|             let uuid = Uuid::from_str(entry.file_name().to_str().unwrap()).unwrap(); | ||||
|             uuids.insert(uuid); | ||||
|         } | ||||
|         uuids | ||||
|     pub fn all_uuids(&self) -> Result<impl Iterator<Item = Result<Uuid>>> { | ||||
|         Ok(self.path.read_dir()?.map(|entry| { | ||||
|             Ok(Uuid::from_str( | ||||
|                 entry?.file_name().to_str().ok_or(Error::CouldNotParseFileNameAsUtf8)?, | ||||
|             )?) | ||||
|         })) | ||||
|     } | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,3 +1,4 @@ | ||||
| use std::collections::BTreeSet; | ||||
| use std::fmt::Write; | ||||
|  | ||||
| use meilisearch_types::heed::types::{OwnedType, SerdeBincode, SerdeJson, Str}; | ||||
| @@ -92,7 +93,9 @@ pub fn snapshot_index_scheduler(scheduler: &IndexScheduler) -> String { | ||||
|  | ||||
| pub fn snapshot_file_store(file_store: &file_store::FileStore) -> String { | ||||
|     let mut snap = String::new(); | ||||
|     for uuid in file_store.__all_uuids() { | ||||
|     // we store the uuid in a `BTreeSet` to keep them ordered. | ||||
|     let all_uuids = file_store.all_uuids().unwrap().collect::<Result<BTreeSet<_>, _>>().unwrap(); | ||||
|     for uuid in all_uuids { | ||||
|         snap.push_str(&format!("{uuid}\n")); | ||||
|     } | ||||
|     snap | ||||
|   | ||||
| @@ -452,6 +452,10 @@ impl IndexScheduler { | ||||
|         &self.index_mapper.indexer_config | ||||
|     } | ||||
|  | ||||
|     pub fn size(&self) -> Result<u64> { | ||||
|         Ok(self.env.real_disk_size()?) | ||||
|     } | ||||
|  | ||||
|     /// Return the index corresponding to the name. | ||||
|     /// | ||||
|     /// * If the index wasn't opened before, the index will be opened. | ||||
| @@ -898,6 +902,11 @@ impl IndexScheduler { | ||||
|         Ok(self.file_store.new_update_with_uuid(uuid)?) | ||||
|     } | ||||
|  | ||||
|     /// List the update files contained in the IndexScheduler. | ||||
|     pub fn update_file_size(&self) -> Result<u64> { | ||||
|         Ok(self.file_store.update_total_size()?) | ||||
|     } | ||||
|  | ||||
|     /// Delete a file from the index scheduler. | ||||
|     /// | ||||
|     /// Counterpart to the [`create_update_file`](IndexScheduler::create_update_file) method. | ||||
|   | ||||
| @@ -508,14 +508,23 @@ impl IndexScheduler { | ||||
|             if let KindWithContent::DocumentAdditionOrUpdate { content_file, .. } = kind { | ||||
|                 match status { | ||||
|                     Status::Enqueued | Status::Processing => { | ||||
|                         assert!( | ||||
|                             self.file_store.__all_uuids().contains(&content_file), | ||||
|                         assert!(self | ||||
|                         .file_store | ||||
|                         .all_uuids() | ||||
|                         .unwrap() | ||||
|                         .find(|uuid| uuid.as_ref().unwrap() == &content_file) | ||||
|                         .is_some(), | ||||
|                        "Could not find uuid `{content_file}` in the file_store. Available uuids are {:?}.", | ||||
|                             self.file_store.__all_uuids(), | ||||
|                         self.file_store.all_uuids().unwrap().collect::<Result<Vec<_>>>(), | ||||
|                         ); | ||||
|                     } | ||||
|                     Status::Succeeded | Status::Failed | Status::Canceled => { | ||||
|                         assert!(!self.file_store.__all_uuids().contains(&content_file)); | ||||
|                         assert!(self | ||||
|                             .file_store | ||||
|                             .all_uuids() | ||||
|                             .unwrap() | ||||
|                             .find(|uuid| uuid.as_ref().unwrap() == &content_file) | ||||
|                             .is_none()); | ||||
|                     } | ||||
|                 } | ||||
|             } | ||||
|   | ||||
| @@ -33,6 +33,11 @@ impl AuthController { | ||||
|         Ok(Self { store: Arc::new(store), master_key: master_key.clone() }) | ||||
|     } | ||||
|  | ||||
|     /// Return the size of the `AuthController` database in bytes. | ||||
|     pub fn size(&self) -> Result<u64> { | ||||
|         self.store.size() | ||||
|     } | ||||
|  | ||||
|     pub fn create_key(&self, create_key: CreateApiKey) -> Result<Key> { | ||||
|         match self.store.get_api_key(create_key.uid)? { | ||||
|             Some(_) => Err(AuthControllerError::ApiKeyAlreadyExists(create_key.uid.to_string())), | ||||
|   | ||||
| @@ -60,6 +60,11 @@ impl HeedAuthStore { | ||||
|         Ok(Self { env, keys, action_keyid_index_expiration, should_close_on_drop: true }) | ||||
|     } | ||||
|  | ||||
|     /// Return the size in bytes of database | ||||
|     pub fn size(&self) -> Result<u64> { | ||||
|         Ok(self.env.real_disk_size()?) | ||||
|     } | ||||
|  | ||||
|     pub fn set_drop_on_close(&mut self, v: bool) { | ||||
|         self.should_close_on_drop = v; | ||||
|     } | ||||
|   | ||||
| @@ -343,6 +343,7 @@ impl ErrorCode for file_store::Error { | ||||
|         match self { | ||||
|             Self::IoError(e) => e.error_code(), | ||||
|             Self::PersistError(e) => e.error_code(), | ||||
|             Self::CouldNotParseFileNameAsUtf8 | Self::UuidError(_) => Code::Internal, | ||||
|         } | ||||
|     } | ||||
| } | ||||
|   | ||||
| @@ -4,6 +4,7 @@ use actix_web::web::Data; | ||||
| use actix_web::{web, HttpRequest, HttpResponse}; | ||||
| use index_scheduler::{IndexScheduler, Query}; | ||||
| use log::debug; | ||||
| use meilisearch_auth::AuthController; | ||||
| use meilisearch_types::error::ResponseError; | ||||
| use meilisearch_types::settings::{Settings, Unchecked}; | ||||
| use meilisearch_types::tasks::{Kind, Status, Task, TaskId}; | ||||
| @@ -230,13 +231,15 @@ pub struct Stats { | ||||
|  | ||||
| async fn get_stats( | ||||
|     index_scheduler: GuardedData<ActionPolicy<{ actions::STATS_GET }>, Data<IndexScheduler>>, | ||||
|     auth_controller: GuardedData<ActionPolicy<{ actions::STATS_GET }>, AuthController>, | ||||
|     req: HttpRequest, | ||||
|     analytics: web::Data<dyn Analytics>, | ||||
| ) -> Result<HttpResponse, ResponseError> { | ||||
|     analytics.publish("Stats Seen".to_string(), json!({ "per_index_uid": false }), Some(&req)); | ||||
|     let search_rules = &index_scheduler.filters().search_rules; | ||||
|  | ||||
|     let stats = create_all_stats((*index_scheduler).clone(), search_rules)?; | ||||
|     let stats = | ||||
|         create_all_stats((*index_scheduler).clone(), (*auth_controller).clone(), search_rules)?; | ||||
|  | ||||
|     debug!("returns: {:?}", stats); | ||||
|     Ok(HttpResponse::Ok().json(stats)) | ||||
| @@ -244,6 +247,7 @@ async fn get_stats( | ||||
|  | ||||
| pub fn create_all_stats( | ||||
|     index_scheduler: Data<IndexScheduler>, | ||||
|     auth_controller: AuthController, | ||||
|     search_rules: &meilisearch_auth::SearchRules, | ||||
| ) -> Result<Stats, ResponseError> { | ||||
|     let mut last_task: Option<OffsetDateTime> = None; | ||||
| @@ -253,6 +257,7 @@ pub fn create_all_stats( | ||||
|         Query { statuses: Some(vec![Status::Processing]), limit: Some(1), ..Query::default() }, | ||||
|         search_rules.authorized_indexes(), | ||||
|     )?; | ||||
|     // accumulate the size of each indexes | ||||
|     let processing_index = processing_task.first().and_then(|task| task.index_uid()); | ||||
|     for (name, index) in index_scheduler.indexes()? { | ||||
|         if !search_rules.is_index_authorized(&name) { | ||||
| @@ -273,6 +278,11 @@ pub fn create_all_stats( | ||||
|  | ||||
|         indexes.insert(name, stats); | ||||
|     } | ||||
|  | ||||
|     database_size += index_scheduler.size()?; | ||||
|     database_size += auth_controller.size()?; | ||||
|     database_size += index_scheduler.update_file_size()?; | ||||
|  | ||||
|     let stats = Stats { database_size, last_update: last_task, indexes }; | ||||
|     Ok(stats) | ||||
| } | ||||
|   | ||||
		Reference in New Issue
	
	Block a user