mirror of
				https://github.com/meilisearch/meilisearch.git
				synced 2025-10-26 05:26:27 +00:00 
			
		
		
		
	Merge #4633
4633: Allow to mark vectors as "userProvided" r=Kerollmops a=dureuill # Pull Request ## Related issue Fixes #4606 ## What does this PR do? [See usage in PRD](https://meilisearch.notion.site/v1-9-AI-search-changes-e90d6803eca8417aa70a1ac5d0225697#deb96fb0595947bda7d4a371100326eb) - Extends the shape of the special `_vectors` field in documents. - previously, the `_vectors` field had to be an object, with each field the name of a configured embedder, and each value either `null`, an embedding (array of numbers), or an array of embeddings. - In this PR, the value of an embedder in the `_vectors` field can additionally be an object. The object has two fields: 1. `embeddings`: `null`, an embedding (array of numbers), or an array of embeddings. 2. `userProvided`: a boolean indicating if the vector was provided by the user. - The previous form `embedder_or_array_of_embedders` is semantically equivalent to: ```json { "embeddings": embedder_or_array_of_embedders, "userProvided": true } ``` - During the indexing step, the subfields and values of the `_vectors` field that have `userProvided` set to **false** are added in the vector DB, but not in the documents DB: that means that future modifications of the documents will trigger a regeneration of that particular vector using the document template. - This allows **importing** embeddings as a one-shot process, while still retaining the ability to regenerate embeddings on document change. - The dump process now uses this ability: it enriches the `_vectors` fields of documents with the embeddings that were autogenerated, marking them as not `userProvided`. This allows importing the vectors from a dump without regenerating them. ### Tests This PR adds the following tests - Long-needed hybrid search tests of a simple hf embedder - Dump test that imports vectors. Due to the difficulty of actually importing a dump in tests, we just read the dump and check it contains the expected content. - Tests in the index-scheduler: this tests that documents containing the same kind of instructions as in the dump indexes as expected Co-authored-by: Louis Dureuil <louis@meilisearch.com>
This commit is contained in:
		| @@ -197,6 +197,140 @@ pub(crate) mod test { | ||||
|     use super::*; | ||||
|     use crate::reader::v6::RuntimeTogglableFeatures; | ||||
|  | ||||
|     #[test] | ||||
|     fn import_dump_v6_with_vectors() { | ||||
|         // dump containing two indexes | ||||
|         // | ||||
|         // "vector", configured with an embedder | ||||
|         // contains: | ||||
|         // - one document with an overriden vector, | ||||
|         // - one document with a natural vector | ||||
|         // - one document with a _vectors map containing one additional embedder name and a natural vector | ||||
|         // - one document with a _vectors map containing one additional embedder name and an overriden vector | ||||
|         // | ||||
|         // "novector", no embedder | ||||
|         // contains: | ||||
|         // - a document without vector | ||||
|         // - a document with a random _vectors field | ||||
|         let dump = File::open("tests/assets/v6-with-vectors.dump").unwrap(); | ||||
|         let mut dump = DumpReader::open(dump).unwrap(); | ||||
|  | ||||
|         // top level infos | ||||
|         insta::assert_display_snapshot!(dump.date().unwrap(), @"2024-05-16 15:51:34.151044 +00:00:00"); | ||||
|         insta::assert_debug_snapshot!(dump.instance_uid().unwrap(), @"None"); | ||||
|  | ||||
|         // tasks | ||||
|         let tasks = dump.tasks().unwrap().collect::<Result<Vec<_>>>().unwrap(); | ||||
|         let (tasks, update_files): (Vec<_>, Vec<_>) = tasks.into_iter().unzip(); | ||||
|         meili_snap::snapshot_hash!(meili_snap::json_string!(tasks), @"278f63325ef06ca04d01df98d8207b94"); | ||||
|         assert_eq!(update_files.len(), 10); | ||||
|         assert!(update_files[0].is_none()); // the dump creation | ||||
|         assert!(update_files[1].is_none()); | ||||
|         assert!(update_files[2].is_none()); | ||||
|         assert!(update_files[3].is_none()); | ||||
|         assert!(update_files[4].is_none()); | ||||
|         assert!(update_files[5].is_none()); | ||||
|         assert!(update_files[6].is_none()); | ||||
|         assert!(update_files[7].is_none()); | ||||
|         assert!(update_files[8].is_none()); | ||||
|         assert!(update_files[9].is_none()); | ||||
|  | ||||
|         // indexes | ||||
|         let mut indexes = dump.indexes().unwrap().collect::<Result<Vec<_>>>().unwrap(); | ||||
|         // the index are not ordered in any way by default | ||||
|         indexes.sort_by_key(|index| index.metadata().uid.to_string()); | ||||
|  | ||||
|         let mut vector_index = indexes.pop().unwrap(); | ||||
|         let mut novector_index = indexes.pop().unwrap(); | ||||
|         assert!(indexes.is_empty()); | ||||
|  | ||||
|         // vector | ||||
|  | ||||
|         insta::assert_json_snapshot!(vector_index.metadata(), @r###" | ||||
|         { | ||||
|           "uid": "vector", | ||||
|           "primaryKey": "id", | ||||
|           "createdAt": "2024-05-16T15:33:17.240962Z", | ||||
|           "updatedAt": "2024-05-16T15:40:55.723052Z" | ||||
|         } | ||||
|         "###); | ||||
|  | ||||
|         { | ||||
|             let documents: Result<Vec<_>> = vector_index.documents().unwrap().collect(); | ||||
|             let mut documents = documents.unwrap(); | ||||
|             assert_eq!(documents.len(), 4); | ||||
|  | ||||
|             documents.sort_by_key(|doc| doc.get("id").unwrap().to_string()); | ||||
|  | ||||
|             { | ||||
|                 let document = documents.pop().unwrap(); | ||||
|                 insta::assert_json_snapshot!(document); | ||||
|             } | ||||
|  | ||||
|             { | ||||
|                 let document = documents.pop().unwrap(); | ||||
|                 insta::assert_json_snapshot!(document); | ||||
|             } | ||||
|  | ||||
|             { | ||||
|                 let document = documents.pop().unwrap(); | ||||
|                 insta::assert_json_snapshot!(document); | ||||
|             } | ||||
|  | ||||
|             { | ||||
|                 let document = documents.pop().unwrap(); | ||||
|                 insta::assert_json_snapshot!(document); | ||||
|             } | ||||
|         } | ||||
|  | ||||
|         // novector | ||||
|  | ||||
|         insta::assert_json_snapshot!(novector_index.metadata(), @r###" | ||||
|         { | ||||
|           "uid": "novector", | ||||
|           "primaryKey": "id", | ||||
|           "createdAt": "2024-05-16T15:33:03.568055Z", | ||||
|           "updatedAt": "2024-05-16T15:33:07.530217Z" | ||||
|         } | ||||
|         "###); | ||||
|  | ||||
|         insta::assert_json_snapshot!(novector_index.settings().unwrap().embedders, @"null"); | ||||
|  | ||||
|         { | ||||
|             let documents: Result<Vec<_>> = novector_index.documents().unwrap().collect(); | ||||
|             let mut documents = documents.unwrap(); | ||||
|             assert_eq!(documents.len(), 2); | ||||
|  | ||||
|             documents.sort_by_key(|doc| doc.get("id").unwrap().to_string()); | ||||
|  | ||||
|             { | ||||
|                 let document = documents.pop().unwrap(); | ||||
|                 insta::assert_json_snapshot!(document, @r###" | ||||
|                 { | ||||
|                   "id": "e1", | ||||
|                   "other": "random1", | ||||
|                   "_vectors": "toto" | ||||
|                 } | ||||
|                 "###); | ||||
|             } | ||||
|  | ||||
|             { | ||||
|                 let document = documents.pop().unwrap(); | ||||
|                 insta::assert_json_snapshot!(document, @r###" | ||||
|                 { | ||||
|                   "id": "e0", | ||||
|                   "other": "random0" | ||||
|                 } | ||||
|                 "###); | ||||
|             } | ||||
|         } | ||||
|  | ||||
|         assert_eq!( | ||||
|             dump.features().unwrap().unwrap(), | ||||
|             RuntimeTogglableFeatures { vector_store: true, ..Default::default() } | ||||
|         ); | ||||
|     } | ||||
|  | ||||
|     #[test] | ||||
|     fn import_dump_v6_experimental() { | ||||
|         let dump = File::open("tests/assets/v6-with-experimental.dump").unwrap(); | ||||
|   | ||||
| @@ -0,0 +1,783 @@ | ||||
| --- | ||||
| source: dump/src/reader/mod.rs | ||||
| expression: document | ||||
| --- | ||||
| { | ||||
|   "id": "e3", | ||||
|   "desc": "overriden vector + map", | ||||
|   "_vectors": { | ||||
|     "default": [ | ||||
|       0.2, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1 | ||||
|     ], | ||||
|     "toto": [ | ||||
|       0.1 | ||||
|     ] | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,786 @@ | ||||
| --- | ||||
| source: dump/src/reader/mod.rs | ||||
| expression: document | ||||
| --- | ||||
| { | ||||
|   "id": "e2", | ||||
|   "desc": "natural vector + map", | ||||
|   "_vectors": { | ||||
|     "toto": [], | ||||
|     "default": { | ||||
|       "embeddings": [ | ||||
|         [ | ||||
|           -0.05189208313822746, | ||||
|           -0.9273212552070618, | ||||
|           0.1443813145160675, | ||||
|           0.0932632014155388, | ||||
|           0.2665371894836426, | ||||
|           0.36266782879829407, | ||||
|           0.6402910947799683, | ||||
|           0.32014018297195435, | ||||
|           0.030915971845388412, | ||||
|           -0.9312191605567932, | ||||
|           -0.3718109726905823, | ||||
|           -0.2700554132461548, | ||||
|           -1.1014580726623535, | ||||
|           0.9154956936836244, | ||||
|           -0.3406888246536255, | ||||
|           1.0077725648880005, | ||||
|           0.6577560901641846, | ||||
|           -0.3955195546150207, | ||||
|           -0.4148270785808563, | ||||
|           0.1855088472366333, | ||||
|           0.5062315464019775, | ||||
|           -0.3632686734199524, | ||||
|           -0.2277890294790268, | ||||
|           0.2560805082321167, | ||||
|           -0.3853609561920166, | ||||
|           -0.1604762226343155, | ||||
|           -0.13947471976280212, | ||||
|           -0.20147813856601715, | ||||
|           -0.4466346800327301, | ||||
|           -0.3761846721172333, | ||||
|           0.1443382054567337, | ||||
|           0.18205296993255615, | ||||
|           0.49359792470932007, | ||||
|           -0.22538000345230105, | ||||
|           -0.4996317625045776, | ||||
|           -0.22734887897968292, | ||||
|           -0.6034309267997742, | ||||
|           -0.7857939600944519, | ||||
|           -0.34923747181892395, | ||||
|           -0.3466345965862274, | ||||
|           0.21176661550998688, | ||||
|           -0.5101462006568909, | ||||
|           -0.3403083384037018, | ||||
|           0.000315118464641273, | ||||
|           0.236465722322464, | ||||
|           -0.10246097296476364, | ||||
|           -1.3013339042663574, | ||||
|           0.3419138789176941, | ||||
|           -0.32963496446609497, | ||||
|           -0.0901619717478752, | ||||
|           -0.5426247119903564, | ||||
|           0.22656650841236117, | ||||
|           -0.44758284091949463, | ||||
|           0.14151698350906372, | ||||
|           -0.1089438870549202, | ||||
|           0.5500766634941101, | ||||
|           -0.670711100101471, | ||||
|           -0.6227269768714905, | ||||
|           0.3894464075565338, | ||||
|           -0.27609574794769287, | ||||
|           0.7028202414512634, | ||||
|           -0.19697771966457367, | ||||
|           0.328511506319046, | ||||
|           0.5063360929489136, | ||||
|           0.4065195322036743, | ||||
|           0.2614171802997589, | ||||
|           -0.30274391174316406, | ||||
|           1.0393824577331543, | ||||
|           -0.7742937207221985, | ||||
|           -0.7874112129211426, | ||||
|           -0.6749666929244995, | ||||
|           0.5190866589546204, | ||||
|           0.004123548045754433, | ||||
|           -0.28312963247299194, | ||||
|           -0.038731709122657776, | ||||
|           -1.0142987966537476, | ||||
|           -0.09519586712121964, | ||||
|           0.8755272626876831, | ||||
|           0.4876938760280609, | ||||
|           0.7811151742935181, | ||||
|           0.85174959897995, | ||||
|           0.11826585978269576, | ||||
|           0.5373436808586121, | ||||
|           0.3649002015590668, | ||||
|           0.19064077734947205, | ||||
|           -0.00287026260048151, | ||||
|           -0.7305403351783752, | ||||
|           -0.015206154435873032, | ||||
|           -0.7899249196052551, | ||||
|           0.19407285749912265, | ||||
|           0.08596625179052353, | ||||
|           -0.28976231813430786, | ||||
|           -0.1525907665491104, | ||||
|           0.3798313438892365, | ||||
|           0.050306469202041626, | ||||
|           -0.5697937607765198, | ||||
|           0.4219021201133728, | ||||
|           0.276252806186676, | ||||
|           0.1559903472661972, | ||||
|           0.10030482709407806, | ||||
|           -0.4043720066547394, | ||||
|           -0.1969818025827408, | ||||
|           0.5739826560020447, | ||||
|           0.2116064727306366, | ||||
|           -1.4620544910430908, | ||||
|           -0.7802462577819824, | ||||
|           -0.24739810824394223, | ||||
|           -0.09791352599859238, | ||||
|           -0.4413802027702331, | ||||
|           0.21549351513385773, | ||||
|           -0.9520436525344848, | ||||
|           -0.08762510865926743, | ||||
|           0.08154498040676117, | ||||
|           -0.6154940724372864, | ||||
|           -1.01079523563385, | ||||
|           0.885427713394165, | ||||
|           0.6967288851737976, | ||||
|           0.27186504006385803, | ||||
|           -0.43194177746772766, | ||||
|           -0.11248451471328735, | ||||
|           0.7576630711555481, | ||||
|           0.4998855590820313, | ||||
|           0.0264343973249197, | ||||
|           0.9872855544090272, | ||||
|           0.5634694695472717, | ||||
|           0.053698331117630005, | ||||
|           0.19410227239131927, | ||||
|           0.3570743501186371, | ||||
|           -0.23670297861099243, | ||||
|           -0.9114483594894408, | ||||
|           0.07884842902421951, | ||||
|           0.7318344116210938, | ||||
|           0.44630110263824463, | ||||
|           0.08745364099740982, | ||||
|           -0.347101628780365, | ||||
|           -0.4314247667789459, | ||||
|           -0.5060274004936218, | ||||
|           0.003706763498485088, | ||||
|           0.44320008158683777, | ||||
|           -0.00788921769708395, | ||||
|           -0.1368623524904251, | ||||
|           -0.17391923069953918, | ||||
|           0.14473655819892883, | ||||
|           0.10927865654230118, | ||||
|           0.6974599361419678, | ||||
|           0.005052129738032818, | ||||
|           -0.016953065991401672, | ||||
|           -0.1256176233291626, | ||||
|           -0.036742497235536575, | ||||
|           0.5591985583305359, | ||||
|           -0.37619709968566895, | ||||
|           0.22429119050502777, | ||||
|           0.5403043031692505, | ||||
|           -0.8603790998458862, | ||||
|           -0.3456307053565979, | ||||
|           0.9292937517166138, | ||||
|           0.5074859261512756, | ||||
|           0.6310645937919617, | ||||
|           -0.3091641068458557, | ||||
|           0.46902573108673096, | ||||
|           0.7891915440559387, | ||||
|           0.4499550759792328, | ||||
|           0.2744995653629303, | ||||
|           0.2712305784225464, | ||||
|           -0.04349074140191078, | ||||
|           -0.3638863265514374, | ||||
|           0.7839881777763367, | ||||
|           0.7352104783058167, | ||||
|           -0.19457511603832245, | ||||
|           -0.5957832932472229, | ||||
|           -0.43704694509506226, | ||||
|           -1.084769368171692, | ||||
|           0.4904985725879669, | ||||
|           0.5385226011276245, | ||||
|           0.1891629993915558, | ||||
|           0.12338479608297348, | ||||
|           0.8315675258636475, | ||||
|           -0.07830192148685455, | ||||
|           1.0916285514831543, | ||||
|           -0.28066861629486084, | ||||
|           -1.3585069179534912, | ||||
|           0.5203898549079895, | ||||
|           0.08678033947944641, | ||||
|           -0.2566044330596924, | ||||
|           0.09484415501356123, | ||||
|           -0.0180208683013916, | ||||
|           1.0264745950698853, | ||||
|           -0.023572135716676712, | ||||
|           0.5864979028701782, | ||||
|           0.7625196576118469, | ||||
|           -0.2543414533138275, | ||||
|           -0.8877770900726318, | ||||
|           0.7611982822418213, | ||||
|           -0.06220436468720436, | ||||
|           0.937336564064026, | ||||
|           0.2704363465309143, | ||||
|           -0.37733694911003113, | ||||
|           0.5076137781143188, | ||||
|           -0.30641937255859375, | ||||
|           0.6252772808074951, | ||||
|           -0.0823579877614975, | ||||
|           -0.03736555948853493, | ||||
|           0.4131673276424408, | ||||
|           -0.6514252424240112, | ||||
|           0.12918265163898468, | ||||
|           -0.4483584463596344, | ||||
|           0.6750786304473877, | ||||
|           -0.37008383870124817, | ||||
|           -0.02324833907186985, | ||||
|           0.38027650117874146, | ||||
|           -0.26374951004981995, | ||||
|           0.4346931278705597, | ||||
|           0.42882832884788513, | ||||
|           -0.48798441886901855, | ||||
|           1.1882442235946655, | ||||
|           0.5132288336753845, | ||||
|           0.5284568667411804, | ||||
|           -0.03538886830210686, | ||||
|           0.29620853066444397, | ||||
|           -1.0683696269989014, | ||||
|           0.25936177372932434, | ||||
|           0.10404160618782043, | ||||
|           -0.25796034932136536, | ||||
|           0.027896970510482788, | ||||
|           -0.09225251525640488, | ||||
|           1.4811025857925415, | ||||
|           0.641173779964447, | ||||
|           -0.13838383555412292, | ||||
|           -0.3437179923057556, | ||||
|           0.5667019486427307, | ||||
|           -0.5400741696357727, | ||||
|           0.31090837717056274, | ||||
|           0.6470608115196228, | ||||
|           -0.3747067153453827, | ||||
|           -0.7364534735679626, | ||||
|           -0.07431528717279434, | ||||
|           0.5173454880714417, | ||||
|           -0.6578747034072876, | ||||
|           0.7107478976249695, | ||||
|           -0.7918999791145325, | ||||
|           -0.0648345872759819, | ||||
|           0.609937846660614, | ||||
|           -0.7329513430595398, | ||||
|           0.9741371870040894, | ||||
|           0.17912346124649048, | ||||
|           -0.02658769302070141, | ||||
|           0.5162150859832764, | ||||
|           -0.3978803157806397, | ||||
|           -0.7833885550498962, | ||||
|           -0.6497276425361633, | ||||
|           -0.3898126780986786, | ||||
|           -0.0952848568558693, | ||||
|           0.2663288116455078, | ||||
|           -0.1604052186012268, | ||||
|           0.373076468706131, | ||||
|           -0.8357769250869751, | ||||
|           -0.05217683315277099, | ||||
|           -0.2680160701274872, | ||||
|           0.8389158248901367, | ||||
|           0.6833611130714417, | ||||
|           -0.6712407469749451, | ||||
|           0.7406917214393616, | ||||
|           -0.44522786140441895, | ||||
|           -0.34645363688468933, | ||||
|           -0.27384576201438904, | ||||
|           -0.9878405928611756, | ||||
|           -0.8166060447692871, | ||||
|           0.06268279999494553, | ||||
|           0.38567957282066345, | ||||
|           -0.3274703919887543, | ||||
|           0.5296315550804138, | ||||
|           -0.11810623109340668, | ||||
|           0.23029841482639313, | ||||
|           0.08616159111261368, | ||||
|           -0.2195747196674347, | ||||
|           0.09430307894945145, | ||||
|           0.4057176411151886, | ||||
|           0.4892159104347229, | ||||
|           -0.1636916548013687, | ||||
|           -0.6071445345878601, | ||||
|           0.41256585717201233, | ||||
|           0.622254490852356, | ||||
|           -0.41223976016044617, | ||||
|           -0.6686707139015198, | ||||
|           -0.7474371790885925, | ||||
|           -0.8509522080421448, | ||||
|           -0.16754287481307983, | ||||
|           -0.9078601002693176, | ||||
|           -0.29653599858283997, | ||||
|           -0.5020652413368225, | ||||
|           0.4692700505256653, | ||||
|           0.01281109917908907, | ||||
|           -0.16071580350399017, | ||||
|           0.03388889133930206, | ||||
|           -0.020511148497462273, | ||||
|           0.5027827024459839, | ||||
|           -0.20729811489582065, | ||||
|           0.48107290267944336, | ||||
|           0.33669769763946533, | ||||
|           -0.5275911688804626, | ||||
|           0.48271527886390686, | ||||
|           0.2738940715789795, | ||||
|           -0.033152539283037186, | ||||
|           -0.13629786670207977, | ||||
|           -0.05965912342071533, | ||||
|           -0.26200807094573975, | ||||
|           0.04002794995903969, | ||||
|           -0.34095603227615356, | ||||
|           -3.986898899078369, | ||||
|           -0.46819332242012024, | ||||
|           -0.422744482755661, | ||||
|           -0.169097900390625, | ||||
|           0.6008929014205933, | ||||
|           0.058016058057546616, | ||||
|           -0.11401277780532836, | ||||
|           -0.3077819049358368, | ||||
|           -0.09595538675785063, | ||||
|           0.6723822355270386, | ||||
|           0.19367831945419312, | ||||
|           0.28304359316825867, | ||||
|           0.1609862744808197, | ||||
|           0.7567598819732666, | ||||
|           0.6889985799789429, | ||||
|           0.06907720118761063, | ||||
|           -0.04188092052936554, | ||||
|           -0.7434936165809631, | ||||
|           0.13321782648563385, | ||||
|           0.8456063270568848, | ||||
|           -0.10364038497209548, | ||||
|           -0.45084846019744873, | ||||
|           -0.4758241474628449, | ||||
|           0.43882066011428833, | ||||
|           -0.6432598829269409, | ||||
|           0.7217311859130859, | ||||
|           -0.24189773201942444, | ||||
|           0.12737572193145752, | ||||
|           -1.1008601188659668, | ||||
|           -0.3305315673351288, | ||||
|           0.14614742994308472, | ||||
|           -0.7819333076477051, | ||||
|           0.5287120342254639, | ||||
|           -0.055538054555654526, | ||||
|           0.1877404749393463, | ||||
|           -0.6907662153244019, | ||||
|           0.5616975426673889, | ||||
|           -0.4611121714115143, | ||||
|           -0.26109233498573303, | ||||
|           -0.12898315489292145, | ||||
|           -0.3724522292613983, | ||||
|           -0.7191406488418579, | ||||
|           -0.4425233602523804, | ||||
|           -0.644108235836029, | ||||
|           0.8424481153488159, | ||||
|           0.17532426118850708, | ||||
|           -0.5121750235557556, | ||||
|           -0.6467239260673523, | ||||
|           -0.0008507720194756985, | ||||
|           0.7866212129592896, | ||||
|           -0.02644744887948036, | ||||
|           -0.005045140627771616, | ||||
|           0.015782782807946205, | ||||
|           0.16334445774555206, | ||||
|           -0.1913367658853531, | ||||
|           -0.13697923719882965, | ||||
|           -0.6684983372688293, | ||||
|           0.18346354365348816, | ||||
|           -0.341105580329895, | ||||
|           0.5427411198616028, | ||||
|           0.3779832422733307, | ||||
|           -0.6778115034103394, | ||||
|           -0.2931850254535675, | ||||
|           -0.8805161714553833, | ||||
|           -0.4212774932384491, | ||||
|           -0.5368952751159668, | ||||
|           -1.3937891721725464, | ||||
|           -1.225494146347046, | ||||
|           0.4276703894138336, | ||||
|           1.1205668449401855, | ||||
|           -0.6005299687385559, | ||||
|           0.15732505917549133, | ||||
|           -0.3914784789085388, | ||||
|           -1.357046604156494, | ||||
|           -0.4707142114639282, | ||||
|           -0.1497287154197693, | ||||
|           -0.25035548210144043, | ||||
|           -0.34328439831733704, | ||||
|           0.39083412289619446, | ||||
|           0.1623048633337021, | ||||
|           -0.9275814294815063, | ||||
|           -0.6430015563964844, | ||||
|           0.2973862886428833, | ||||
|           0.5580436587333679, | ||||
|           -0.6232585310935974, | ||||
|           -0.6611042022705078, | ||||
|           0.4015969038009643, | ||||
|           -1.0232892036437988, | ||||
|           -0.2585645020008087, | ||||
|           -0.5431421399116516, | ||||
|           0.5021264553070068, | ||||
|           -0.48601630330085754, | ||||
|           -0.010242084041237833, | ||||
|           0.5862035155296326, | ||||
|           0.7316920161247253, | ||||
|           0.4036808013916016, | ||||
|           0.4269520044326782, | ||||
|           -0.705938458442688, | ||||
|           0.7747307419776917, | ||||
|           0.10164368897676468, | ||||
|           0.7887958884239197, | ||||
|           -0.9612497091293336, | ||||
|           0.12755516171455383, | ||||
|           0.06812842190265656, | ||||
|           -0.022603651508688927, | ||||
|           0.14722754061222076, | ||||
|           -0.5588505268096924, | ||||
|           -0.20689940452575684, | ||||
|           0.3557641804218292, | ||||
|           -0.6812759637832642, | ||||
|           0.2860803008079529, | ||||
|           -0.38954633474349976, | ||||
|           0.1759403496980667, | ||||
|           -0.5678874850273132, | ||||
|           -0.1692986786365509, | ||||
|           -0.14578519761562347, | ||||
|           0.5711379051208496, | ||||
|           1.0208125114440918, | ||||
|           0.7759483456611633, | ||||
|           -0.372348427772522, | ||||
|           -0.5460885763168335, | ||||
|           0.7190321683883667, | ||||
|           -0.6914990544319153, | ||||
|           0.13365162909030914, | ||||
|           -0.4854792356491089, | ||||
|           0.4054908752441406, | ||||
|           0.4502798914909363, | ||||
|           -0.3041122555732727, | ||||
|           -0.06726965308189392, | ||||
|           -0.05570871382951737, | ||||
|           -0.0455719493329525, | ||||
|           0.4785125255584717, | ||||
|           0.8867972493171692, | ||||
|           0.4107886850833893, | ||||
|           0.6121342182159424, | ||||
|           -0.20477132499217987, | ||||
|           -0.5598517656326294, | ||||
|           -0.6443566679954529, | ||||
|           -0.5905212759971619, | ||||
|           -0.5571200251579285, | ||||
|           0.17573799192905426, | ||||
|           -0.28621870279312134, | ||||
|           0.1685224026441574, | ||||
|           0.09719007462263109, | ||||
|           -0.04223639518022537, | ||||
|           -0.28623101115226746, | ||||
|           -0.1449810117483139, | ||||
|           -0.3789580464363098, | ||||
|           -0.5227636098861694, | ||||
|           -0.049728814512491226, | ||||
|           0.7849089503288269, | ||||
|           0.16792525351047516, | ||||
|           0.9849340915679932, | ||||
|           -0.6559549570083618, | ||||
|           0.35723909735679626, | ||||
|           -0.6822739243507385, | ||||
|           1.2873116731643677, | ||||
|           0.19993330538272855, | ||||
|           0.03512010723352432, | ||||
|           -0.6972134113311768, | ||||
|           0.18453484773635864, | ||||
|           -0.2437680810689926, | ||||
|           0.2156416028738022, | ||||
|           0.5230382680892944, | ||||
|           0.22020135819911957, | ||||
|           0.8314080238342285, | ||||
|           0.15627102553844452, | ||||
|           -0.7330264449119568, | ||||
|           0.3888184726238251, | ||||
|           -0.22034703195095065, | ||||
|           0.5457669496536255, | ||||
|           -0.48084837198257446, | ||||
|           -0.45576658844947815, | ||||
|           -0.09287727624177931, | ||||
|           -0.06968110054731369, | ||||
|           0.35125672817230225, | ||||
|           -0.4278119504451752, | ||||
|           0.2038476765155792, | ||||
|           0.11392722278833388, | ||||
|           0.9433983564376832, | ||||
|           -0.4097744226455689, | ||||
|           0.035297419875860214, | ||||
|           -0.4274404048919678, | ||||
|           -0.25100165605545044, | ||||
|           1.0943366289138794, | ||||
|           -0.07634022831916809, | ||||
|           -0.2925529479980469, | ||||
|           -0.7512530088424683, | ||||
|           0.2649727463722229, | ||||
|           -0.4078235328197479, | ||||
|           -0.3372223973274231, | ||||
|           0.05190162733197212, | ||||
|           0.005654910113662481, | ||||
|           -0.0001571219472680241, | ||||
|           -0.35445958375930786, | ||||
|           -0.7837416529655457, | ||||
|           0.1500556766986847, | ||||
|           0.4383024573326111, | ||||
|           0.6099548935890198, | ||||
|           0.05951934307813645, | ||||
|           -0.21325334906578064, | ||||
|           0.0199207104742527, | ||||
|           -0.22704418003559113, | ||||
|           -0.6481077671051025, | ||||
|           0.37442275881767273, | ||||
|           -1.015955924987793, | ||||
|           0.38637226819992065, | ||||
|           -0.06489371508359909, | ||||
|           -0.494120329618454, | ||||
|           0.3469836115837097, | ||||
|           0.15402406454086304, | ||||
|           -0.7660972476005554, | ||||
|           -0.7053225040435791, | ||||
|           -0.25964751839637756, | ||||
|           0.014004424214363098, | ||||
|           -0.2860170006752014, | ||||
|           -0.17565494775772095, | ||||
|           -0.45117494463920593, | ||||
|           -0.0031954257283359766, | ||||
|           0.09676837921142578, | ||||
|           -0.514464259147644, | ||||
|           0.41698193550109863, | ||||
|           -0.21642713248729703, | ||||
|           -0.5398141145706177, | ||||
|           -0.3647628426551819, | ||||
|           0.37005379796028137, | ||||
|           0.239425927400589, | ||||
|           -0.08833975344896317, | ||||
|           0.934946596622467, | ||||
|           -0.48340797424316406, | ||||
|           0.6241437792778015, | ||||
|           -0.7253676652908325, | ||||
|           -0.04303571209311485, | ||||
|           1.1125205755233765, | ||||
|           -0.15692919492721558, | ||||
|           -0.2914651036262512, | ||||
|           -0.5117168426513672, | ||||
|           0.21365483105182648, | ||||
|           0.4924402534961701, | ||||
|           0.5269662141799927, | ||||
|           0.0352792888879776, | ||||
|           -0.149167999625206, | ||||
|           -0.6019760370254517, | ||||
|           0.08245442807674408, | ||||
|           0.4900692105293274, | ||||
|           0.518824577331543, | ||||
|           -0.00005570516441366635, | ||||
|           -0.553304135799408, | ||||
|           0.22217543423175812, | ||||
|           0.5047767758369446, | ||||
|           0.135724738240242, | ||||
|           1.1511540412902832, | ||||
|           -0.3541218340396881, | ||||
|           -0.9712511897087096, | ||||
|           0.8353699445724487, | ||||
|           -0.39227569103240967, | ||||
|           -0.9117669463157654, | ||||
|           -0.26349931955337524, | ||||
|           0.05597023293375969, | ||||
|           0.20695461332798004, | ||||
|           0.3178807199001312, | ||||
|           1.0663238763809204, | ||||
|           0.5062212347984314, | ||||
|           0.7288597822189331, | ||||
|           0.09899299591779707, | ||||
|           0.553720235824585, | ||||
|           0.675009548664093, | ||||
|           -0.20067055523395536, | ||||
|           0.3138423264026642, | ||||
|           -0.6886593103408813, | ||||
|           -0.2910398542881012, | ||||
|           -1.3186300992965698, | ||||
|           -0.4684459865093231, | ||||
|           -0.095743365585804, | ||||
|           -0.1257995069026947, | ||||
|           -0.4858281314373016, | ||||
|           -0.4935407340526581, | ||||
|           -0.3266896903514862, | ||||
|           -0.3928797245025635, | ||||
|           -0.40803104639053345, | ||||
|           -0.9975396394729614, | ||||
|           0.4229583740234375, | ||||
|           0.37309643626213074, | ||||
|           0.4431034922599793, | ||||
|           0.30364808440208435, | ||||
|           -0.3765178918838501, | ||||
|           0.5616499185562134, | ||||
|           0.16904796659946442, | ||||
|           -0.7343707084655762, | ||||
|           0.2560209631919861, | ||||
|           0.6166825294494629, | ||||
|           0.3200829327106476, | ||||
|           -0.4483652710914612, | ||||
|           0.16224201023578644, | ||||
|           -0.31495288014411926, | ||||
|           -0.42713335156440735, | ||||
|           0.7270734906196594, | ||||
|           0.7049484848976135, | ||||
|           -0.0571461021900177, | ||||
|           0.04477125033736229, | ||||
|           -0.6647796034812927, | ||||
|           1.183672308921814, | ||||
|           0.36199676990509033, | ||||
|           0.046881116926670074, | ||||
|           0.4515796303749085, | ||||
|           0.9278061985969543, | ||||
|           0.31471705436706543, | ||||
|           -0.7073333859443665, | ||||
|           -0.3443860113620758, | ||||
|           0.5440067052841187, | ||||
|           -0.15020819008350372, | ||||
|           -0.541202962398529, | ||||
|           0.5203295946121216, | ||||
|           1.2192286252975464, | ||||
|           -0.9983593225479126, | ||||
|           -0.18758884072303772, | ||||
|           0.2758221924304962, | ||||
|           -0.6511523723602295, | ||||
|           -0.1584404855966568, | ||||
|           -0.236241415143013, | ||||
|           0.2692437767982483, | ||||
|           -0.4941152036190033, | ||||
|           0.4987454116344452, | ||||
|           -0.3331359028816223, | ||||
|           0.3163745701313019, | ||||
|           0.745529294013977, | ||||
|           -0.2905873656272888, | ||||
|           0.13602906465530396, | ||||
|           0.4679684340953827, | ||||
|           1.0555986166000366, | ||||
|           1.075700044631958, | ||||
|           0.5368486046791077, | ||||
|           -0.5118206739425659, | ||||
|           0.8668332099914551, | ||||
|           -0.5726966857910156, | ||||
|           -0.7811751961708069, | ||||
|           0.1938626915216446, | ||||
|           -0.1929349899291992, | ||||
|           0.1757766306400299, | ||||
|           0.6384295225143433, | ||||
|           0.26462844014167786, | ||||
|           0.9542630314826964, | ||||
|           0.19313029944896695, | ||||
|           1.264248013496399, | ||||
|           -0.6304428577423096, | ||||
|           0.0487106591463089, | ||||
|           -0.16211535036563873, | ||||
|           -0.7894763350486755, | ||||
|           0.3582514822483063, | ||||
|           -0.04153040423989296, | ||||
|           0.635784387588501, | ||||
|           0.6554391980171204, | ||||
|           -0.47010496258735657, | ||||
|           -0.8302040696144104, | ||||
|           -0.1350124627351761, | ||||
|           0.2568812072277069, | ||||
|           0.13614831864833832, | ||||
|           -0.2563649117946625, | ||||
|           -1.0434694290161133, | ||||
|           0.3232482671737671, | ||||
|           0.47882452607154846, | ||||
|           0.4298652410507202, | ||||
|           1.0563770532608032, | ||||
|           -0.28917592763900757, | ||||
|           -0.8533256649971008, | ||||
|           0.10648339986801147, | ||||
|           0.6376127004623413, | ||||
|           -0.20832888782024384, | ||||
|           0.2370245456695557, | ||||
|           0.0018312990432605147, | ||||
|           -0.2034837007522583, | ||||
|           0.01051164511591196, | ||||
|           -1.105310082435608, | ||||
|           0.29724350571632385, | ||||
|           0.15604574978351593, | ||||
|           0.1973688006401062, | ||||
|           0.44394731521606445, | ||||
|           0.3974513411521912, | ||||
|           -0.13625948131084442, | ||||
|           0.9571986198425292, | ||||
|           0.2257384955883026, | ||||
|           0.2323588728904724, | ||||
|           -0.5583669543266296, | ||||
|           -0.7854922413825989, | ||||
|           0.1647188365459442, | ||||
|           -1.6098142862319946, | ||||
|           0.318587988615036, | ||||
|           -0.13399995863437653, | ||||
|           -0.2172701060771942, | ||||
|           -0.767514705657959, | ||||
|           -0.5813586711883545, | ||||
|           -0.3195130527019501, | ||||
|           -0.04894036799669266, | ||||
|           0.2929930090904236, | ||||
|           -0.8213384747505188, | ||||
|           0.07181350141763687, | ||||
|           0.7469993829727173, | ||||
|           0.6407455801963806, | ||||
|           0.16365697979927063, | ||||
|           0.7870153188705444, | ||||
|           0.6524736881256104, | ||||
|           0.6399973630905151, | ||||
|           -0.04992736503481865, | ||||
|           -0.03959266096353531, | ||||
|           -0.2512352466583252, | ||||
|           0.8448855876922607, | ||||
|           -0.1422702670097351, | ||||
|           0.1216789186000824, | ||||
|           -1.2647287845611572, | ||||
|           0.5931149125099182, | ||||
|           0.7186052203178406, | ||||
|           -0.06118432432413101, | ||||
|           -1.1942816972732544, | ||||
|           -0.17677085101604462, | ||||
|           0.31543800234794617, | ||||
|           -0.32252824306488037, | ||||
|           0.8255583047866821, | ||||
|           -0.14529970288276672, | ||||
|           -0.2695446312427521, | ||||
|           -0.33378756046295166, | ||||
|           -0.1653425395488739, | ||||
|           0.1454019844532013, | ||||
|           -0.3920115828514099, | ||||
|           0.912214994430542, | ||||
|           -0.7279734015464783, | ||||
|           0.7374742031097412, | ||||
|           0.933980405330658, | ||||
|           0.13429680466651917, | ||||
|           -0.514870285987854, | ||||
|           0.3989711999893189, | ||||
|           -0.11613689363002776, | ||||
|           0.4022413492202759, | ||||
|           -0.9990655779838562, | ||||
|           -0.33749932050704956, | ||||
|           -0.4334589838981629, | ||||
|           -1.376373291015625, | ||||
|           -0.2993924915790558, | ||||
|           -0.09454808384180068, | ||||
|           -0.01314175222069025, | ||||
|           -0.001090060803107917, | ||||
|           0.2137461006641388, | ||||
|           0.2938512861728668, | ||||
|           0.17508235573768616, | ||||
|           0.8260607123374939, | ||||
|           -0.7218498587608337, | ||||
|           0.2414487451314926, | ||||
|           -0.47296759486198425, | ||||
|           -0.3002610504627228, | ||||
|           -1.238540768623352, | ||||
|           0.08663805574178696, | ||||
|           0.6805586218833923, | ||||
|           0.5909030437469482, | ||||
|           -0.42807504534721375, | ||||
|           -0.22887496650218964, | ||||
|           0.47537800669670105, | ||||
|           -1.0474627017974854, | ||||
|           0.6338009238243103, | ||||
|           0.06548397243022919, | ||||
|           0.4971011281013489, | ||||
|           1.3484878540039063 | ||||
|         ] | ||||
|       ], | ||||
|       "userProvided": false | ||||
|     } | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,785 @@ | ||||
| --- | ||||
| source: dump/src/reader/mod.rs | ||||
| expression: document | ||||
| --- | ||||
| { | ||||
|   "id": "e1", | ||||
|   "desc": "natural vector", | ||||
|   "_vectors": { | ||||
|     "default": { | ||||
|       "embeddings": [ | ||||
|         [ | ||||
|           -0.2979458272457123, | ||||
|           -0.5288640856742859, | ||||
|           -0.019957859069108963, | ||||
|           -0.18495318293571472, | ||||
|           0.7429973483085632, | ||||
|           0.5238497257232666, | ||||
|           0.432366281747818, | ||||
|           0.32744166254997253, | ||||
|           0.0020762972999364138, | ||||
|           -0.9507834911346436, | ||||
|           -0.35097137093544006, | ||||
|           0.08469701558351517, | ||||
|           -1.4176613092422483, | ||||
|           0.4647577106952667, | ||||
|           -0.69340580701828, | ||||
|           1.0372896194458008, | ||||
|           0.3716741800308227, | ||||
|           0.06031008064746857, | ||||
|           -0.6152024269104004, | ||||
|           0.007914665155112743, | ||||
|           0.7954924702644348, | ||||
|           -0.20773003995418549, | ||||
|           0.09376765787601472, | ||||
|           0.04508133605122566, | ||||
|           -0.2084471583366394, | ||||
|           -0.1518009901046753, | ||||
|           0.018195509910583496, | ||||
|           -0.07044368237257004, | ||||
|           -0.18119366466999057, | ||||
|           -0.4480230510234833, | ||||
|           0.3822529911994934, | ||||
|           0.1911812424659729, | ||||
|           0.4674372375011444, | ||||
|           0.06963984668254852, | ||||
|           -0.09341949224472046, | ||||
|           0.005675444379448891, | ||||
|           -0.6774799227714539, | ||||
|           -0.7066726684570313, | ||||
|           -0.39256376028060913, | ||||
|           0.04005039855837822, | ||||
|           0.2084812968969345, | ||||
|           -0.7872875928878784, | ||||
|           -0.8205880522727966, | ||||
|           0.2919981777667999, | ||||
|           -0.06004738807678223, | ||||
|           -0.4907574355602264, | ||||
|           -1.5937862396240234, | ||||
|           0.24249385297298431, | ||||
|           -0.14709846675395966, | ||||
|           -0.11860740929841997, | ||||
|           -0.8299489617347717, | ||||
|           0.472964346408844, | ||||
|           -0.497518390417099, | ||||
|           -0.22205302119255063, | ||||
|           -0.4196169078350067, | ||||
|           0.32697558403015137, | ||||
|           -0.360930860042572, | ||||
|           -0.9789686799049376, | ||||
|           0.1887447088956833, | ||||
|           -0.403737336397171, | ||||
|           0.18524253368377688, | ||||
|           0.3768732249736786, | ||||
|           0.3666233420372009, | ||||
|           0.3511938452720642, | ||||
|           0.6985810995101929, | ||||
|           0.41721710562705994, | ||||
|           0.09754953533411026, | ||||
|           0.6204307079315186, | ||||
|           -1.0762996673583984, | ||||
|           -0.06263761967420578, | ||||
|           -0.7376511693000793, | ||||
|           0.6849768161773682, | ||||
|           -0.1745152473449707, | ||||
|           -0.40449759364128113, | ||||
|           0.20757411420345304, | ||||
|           -0.8424443006515503, | ||||
|           0.330015629529953, | ||||
|           0.3489064872264862, | ||||
|           1.0954371690750122, | ||||
|           0.8487558960914612, | ||||
|           1.1076823472976685, | ||||
|           0.61430823802948, | ||||
|           0.4155903458595276, | ||||
|           0.4111340939998626, | ||||
|           0.05753209814429283, | ||||
|           -0.06429877132177353, | ||||
|           -0.765606164932251, | ||||
|           -0.41703930497169495, | ||||
|           -0.508820652961731, | ||||
|           0.19859947264194489, | ||||
|           -0.16607828438282013, | ||||
|           -0.28112146258354187, | ||||
|           0.11032675206661224, | ||||
|           0.38809511065483093, | ||||
|           -0.36498191952705383, | ||||
|           -0.48671194911003113, | ||||
|           0.6755134463310242, | ||||
|           0.03958442434668541, | ||||
|           0.4478721618652344, | ||||
|           -0.10335399955511092, | ||||
|           -0.9546685814857484, | ||||
|           -0.6087718605995178, | ||||
|           0.17498846352100372, | ||||
|           0.08320838958024979, | ||||
|           -1.4478336572647097, | ||||
|           -0.605027437210083, | ||||
|           -0.5867993235588074, | ||||
|           -0.14711688458919525, | ||||
|           -0.5447602272033691, | ||||
|           -0.026259321719408035, | ||||
|           -0.6997418403625488, | ||||
|           -0.07349082082509995, | ||||
|           0.10638900846242905, | ||||
|           -0.7133527398109436, | ||||
|           -0.9396815299987792, | ||||
|           1.087092399597168, | ||||
|           1.1885089874267578, | ||||
|           0.4011896848678589, | ||||
|           -0.4089202582836151, | ||||
|           -0.10938972979784012, | ||||
|           0.6726722121238708, | ||||
|           0.24576938152313232, | ||||
|           -0.24247920513153076, | ||||
|           1.1499971151351929, | ||||
|           0.47813335061073303, | ||||
|           -0.05331678315997124, | ||||
|           0.32338133454322815, | ||||
|           0.4870913326740265, | ||||
|           -0.23144258558750153, | ||||
|           -1.2023426294326782, | ||||
|           0.2349330335855484, | ||||
|           1.080536961555481, | ||||
|           0.29334118962287903, | ||||
|           0.391574501991272, | ||||
|           -0.15818795561790466, | ||||
|           -0.2948290705680847, | ||||
|           -0.024689948186278343, | ||||
|           0.06602869182825089, | ||||
|           0.5937030911445618, | ||||
|           -0.047901444137096405, | ||||
|           -0.512734591960907, | ||||
|           -0.35780075192451477, | ||||
|           0.28751692175865173, | ||||
|           0.4298716187477112, | ||||
|           0.9242428541183472, | ||||
|           -0.17208744585514069, | ||||
|           0.11515070497989656, | ||||
|           -0.0335976779460907, | ||||
|           -0.3422986567020416, | ||||
|           0.5344581604003906, | ||||
|           0.19895796477794647, | ||||
|           0.33001241087913513, | ||||
|           0.6390730142593384, | ||||
|           -0.6074934005737305, | ||||
|           -0.2553696632385254, | ||||
|           0.9644920229911804, | ||||
|           0.2699219584465027, | ||||
|           0.6403993368148804, | ||||
|           -0.6380003690719604, | ||||
|           -0.027310986071825027, | ||||
|           0.638815701007843, | ||||
|           0.27719101309776306, | ||||
|           -0.13553589582443237, | ||||
|           0.750195324420929, | ||||
|           0.1224869191646576, | ||||
|           -0.20613941550254825, | ||||
|           0.8444448709487915, | ||||
|           0.16200250387191772, | ||||
|           -0.24750925600528717, | ||||
|           -0.739950954914093, | ||||
|           -0.28443849086761475, | ||||
|           -1.176282525062561, | ||||
|           0.516107976436615, | ||||
|           0.3774825632572174, | ||||
|           0.10906043648719788, | ||||
|           0.07962015271186829, | ||||
|           0.7384604215621948, | ||||
|           -0.051241904497146606, | ||||
|           1.1730090379714966, | ||||
|           -0.4828610122203827, | ||||
|           -1.404372215270996, | ||||
|           0.8811132311820984, | ||||
|           -0.3839482367038727, | ||||
|           0.022516896948218346, | ||||
|           -0.0491158664226532, | ||||
|           -0.43027013540267944, | ||||
|           1.2049334049224854, | ||||
|           -0.27309560775756836, | ||||
|           0.6883630752563477, | ||||
|           0.8264574408531189, | ||||
|           -0.5020735263824463, | ||||
|           -0.4874092042446137, | ||||
|           0.6007202863693237, | ||||
|           -0.4965405762195587, | ||||
|           1.1302915811538696, | ||||
|           0.032572727650403976, | ||||
|           -0.3731859028339386, | ||||
|           0.658271849155426, | ||||
|           -0.9023059010505676, | ||||
|           0.7400162220001221, | ||||
|           0.014550759457051754, | ||||
|           -0.19699542224407196, | ||||
|           0.2319706380367279, | ||||
|           -0.789058268070221, | ||||
|           -0.14905710518360138, | ||||
|           -0.5826214551925659, | ||||
|           0.207652747631073, | ||||
|           -0.4507439732551574, | ||||
|           -0.3163885474205017, | ||||
|           0.3604124188423157, | ||||
|           -0.45119962096214294, | ||||
|           0.3428427278995514, | ||||
|           0.3005594313144684, | ||||
|           -0.36026081442832947, | ||||
|           1.1014249324798584, | ||||
|           0.40884315967559814, | ||||
|           0.34991952776908875, | ||||
|           -0.1806638240814209, | ||||
|           0.27440476417541504, | ||||
|           -0.7118373513221741, | ||||
|           0.4645499587059021, | ||||
|           0.214790478348732, | ||||
|           -0.2343102991580963, | ||||
|           0.10500429570674896, | ||||
|           -0.28034430742263794, | ||||
|           1.2267805337905884, | ||||
|           1.0561333894729614, | ||||
|           -0.497364342212677, | ||||
|           -0.6143305897712708, | ||||
|           0.24963727593421936, | ||||
|           -0.33136463165283203, | ||||
|           -0.01473914459347725, | ||||
|           0.495918869972229, | ||||
|           -0.6985538005828857, | ||||
|           -1.0033197402954102, | ||||
|           0.35937801003456116, | ||||
|           0.6325868368148804, | ||||
|           -0.6808838844299316, | ||||
|           1.0354058742523191, | ||||
|           -0.7214401960372925, | ||||
|           -0.33318862318992615, | ||||
|           0.874398410320282, | ||||
|           -0.6594992280006409, | ||||
|           0.6830640435218811, | ||||
|           -0.18534131348133087, | ||||
|           0.024834271520376205, | ||||
|           0.19901277124881744, | ||||
|           -0.5992477536201477, | ||||
|           -1.2126628160476685, | ||||
|           -0.9245557188987732, | ||||
|           -0.3898217976093292, | ||||
|           -0.1286519467830658, | ||||
|           0.4217943847179413, | ||||
|           -0.1143646091222763, | ||||
|           0.5630772709846497, | ||||
|           -0.5240639448165894, | ||||
|           0.21152715384960177, | ||||
|           -0.3792001008987427, | ||||
|           0.8266305327415466, | ||||
|           1.170984387397766, | ||||
|           -0.8072142004966736, | ||||
|           0.11382893472909927, | ||||
|           -0.17953898012638092, | ||||
|           -0.1789460331201553, | ||||
|           -0.15078622102737427, | ||||
|           -1.2082908153533936, | ||||
|           -0.7812382578849792, | ||||
|           -0.10903695970773696, | ||||
|           0.7303897142410278, | ||||
|           -0.39054441452026367, | ||||
|           0.19511254131793976, | ||||
|           -0.09121843427419662, | ||||
|           0.22400228679180145, | ||||
|           0.30143046379089355, | ||||
|           0.1141919493675232, | ||||
|           0.48112115263938904, | ||||
|           0.7307931780815125, | ||||
|           0.09701362252235413, | ||||
|           -0.2795647978782654, | ||||
|           -0.3997688889503479, | ||||
|           0.5540812611579895, | ||||
|           0.564578115940094, | ||||
|           -0.40065160393714905, | ||||
|           -0.3629159033298493, | ||||
|           -0.3789091110229492, | ||||
|           -0.7298538088798523, | ||||
|           -0.6996853351593018, | ||||
|           -0.4477842152118683, | ||||
|           -0.289089560508728, | ||||
|           -0.6430277824401855, | ||||
|           0.2344944179058075, | ||||
|           0.3742927014827728, | ||||
|           -0.5079357028007507, | ||||
|           0.28841453790664673, | ||||
|           0.06515737622976303, | ||||
|           0.707315981388092, | ||||
|           0.09498685598373412, | ||||
|           0.8365515470504761, | ||||
|           0.10002726316452026, | ||||
|           -0.7695478200912476, | ||||
|           0.6264724135398865, | ||||
|           0.7562043070793152, | ||||
|           -0.23112858831882477, | ||||
|           -0.2871039807796478, | ||||
|           -0.25010058283805847, | ||||
|           0.2783474028110504, | ||||
|           -0.03224996477365494, | ||||
|           -0.9119359850883484, | ||||
|           -3.6940200328826904, | ||||
|           -0.5099936127662659, | ||||
|           -0.1604711413383484, | ||||
|           0.17453284561634064, | ||||
|           0.41759559512138367, | ||||
|           0.1419190913438797, | ||||
|           -0.11362407356500626, | ||||
|           -0.33312007784843445, | ||||
|           0.11511333286762238, | ||||
|           0.4667884409427643, | ||||
|           -0.0031647447030991316, | ||||
|           0.15879854559898376, | ||||
|           0.3042248487472534, | ||||
|           0.5404849052429199, | ||||
|           0.8515422344207764, | ||||
|           0.06286454200744629, | ||||
|           0.43790125846862793, | ||||
|           -0.8682025074958801, | ||||
|           -0.06363756954669952, | ||||
|           0.5547921657562256, | ||||
|           -0.01483887154608965, | ||||
|           -0.07361344993114471, | ||||
|           -0.929947018623352, | ||||
|           0.3502565622329712, | ||||
|           -0.5080993175506592, | ||||
|           1.0380364656448364, | ||||
|           -0.2017953395843506, | ||||
|           0.21319580078125, | ||||
|           -1.0763001441955566, | ||||
|           -0.556368887424469, | ||||
|           0.1949922740459442, | ||||
|           -0.6445739269256592, | ||||
|           0.6791343688964844, | ||||
|           0.21188358962535855, | ||||
|           0.3736183941364288, | ||||
|           -0.21800459921360016, | ||||
|           0.7597446441650391, | ||||
|           -0.3732394874095917, | ||||
|           -0.4710160195827484, | ||||
|           0.025146087631583217, | ||||
|           0.05341297015547752, | ||||
|           -0.9522109627723694, | ||||
|           -0.6000866889953613, | ||||
|           -0.08469046652317047, | ||||
|           0.5966026186943054, | ||||
|           0.3444081246852875, | ||||
|           -0.461188405752182, | ||||
|           -0.5279349088668823, | ||||
|           0.10296865552663804, | ||||
|           0.5175143480300903, | ||||
|           -0.20671147108078003, | ||||
|           0.13392412662506104, | ||||
|           0.4812754988670349, | ||||
|           0.2993808686733246, | ||||
|           -0.3005635440349579, | ||||
|           0.5141698122024536, | ||||
|           -0.6239235401153564, | ||||
|           0.2877119481563568, | ||||
|           -0.4452739953994751, | ||||
|           0.5621107816696167, | ||||
|           0.5047508478164673, | ||||
|           -0.4226335883140564, | ||||
|           -0.18578553199768064, | ||||
|           -1.1967322826385498, | ||||
|           0.28178197145462036, | ||||
|           -0.8692031502723694, | ||||
|           -1.1812998056411743, | ||||
|           -1.4526212215423584, | ||||
|           0.4645712077617645, | ||||
|           0.9327932000160216, | ||||
|           -0.6560136675834656, | ||||
|           0.461549699306488, | ||||
|           -0.5621527433395386, | ||||
|           -1.328449010848999, | ||||
|           -0.08676894754171371, | ||||
|           0.00021918353741057217, | ||||
|           -0.18864136934280396, | ||||
|           0.1259666532278061, | ||||
|           0.18240638077259064, | ||||
|           -0.14919660985469818, | ||||
|           -0.8965857625007629, | ||||
|           -0.7539900541305542, | ||||
|           0.013973715715110302, | ||||
|           0.504276692867279, | ||||
|           -0.704748272895813, | ||||
|           -0.6428424119949341, | ||||
|           0.6303996443748474, | ||||
|           -0.5404738187789917, | ||||
|           -0.31176653504371643, | ||||
|           -0.21262824535369873, | ||||
|           0.18736739456653595, | ||||
|           -0.7998970746994019, | ||||
|           0.039946746081113815, | ||||
|           0.7390344738960266, | ||||
|           0.4283199906349182, | ||||
|           0.3795057237148285, | ||||
|           0.07204607129096985, | ||||
|           -0.9230587482452391, | ||||
|           0.9440426230430604, | ||||
|           0.26272690296173096, | ||||
|           0.5598306655883789, | ||||
|           -1.0520871877670288, | ||||
|           -0.2677186131477356, | ||||
|           -0.1888762265443802, | ||||
|           0.30426350235939026, | ||||
|           0.4746131896972656, | ||||
|           -0.5746733546257019, | ||||
|           -0.4197768568992615, | ||||
|           0.8565112948417664, | ||||
|           -0.6767723560333252, | ||||
|           0.23448683321475983, | ||||
|           -0.2010004222393036, | ||||
|           0.4112907350063324, | ||||
|           -0.6497949957847595, | ||||
|           -0.418667733669281, | ||||
|           -0.4950824975967407, | ||||
|           0.44438859820365906, | ||||
|           1.026281714439392, | ||||
|           0.482397586107254, | ||||
|           -0.26220494508743286, | ||||
|           -0.3640787005424499, | ||||
|           0.5907743573188782, | ||||
|           -0.8771642446517944, | ||||
|           0.09708411991596222, | ||||
|           -0.3671700060367584, | ||||
|           0.4331349730491638, | ||||
|           0.619417667388916, | ||||
|           -0.2684665620326996, | ||||
|           -0.5123821496963501, | ||||
|           -0.1502324342727661, | ||||
|           -0.012190685607492924, | ||||
|           0.3580845892429352, | ||||
|           0.8617186546325684, | ||||
|           0.3493645489215851, | ||||
|           1.0270192623138428, | ||||
|           0.18297909200191495, | ||||
|           -0.5881339311599731, | ||||
|           -0.1733516901731491, | ||||
|           -0.5040576457977295, | ||||
|           -0.340370237827301, | ||||
|           -0.26767754554748535, | ||||
|           -0.28570041060447693, | ||||
|           -0.032928116619586945, | ||||
|           0.6029254794120789, | ||||
|           0.17397655546665192, | ||||
|           0.09346921741962431, | ||||
|           0.27815181016921997, | ||||
|           -0.46699589490890503, | ||||
|           -0.8148876428604126, | ||||
|           -0.3964351713657379, | ||||
|           0.3812595009803772, | ||||
|           0.13547226786613464, | ||||
|           0.7126688361167908, | ||||
|           -0.3473474085330963, | ||||
|           -0.06573959439992905, | ||||
|           -0.6483767032623291, | ||||
|           1.4808889627456665, | ||||
|           0.30924928188323975, | ||||
|           -0.5085946917533875, | ||||
|           -0.8613000512123108, | ||||
|           0.3048902451992035, | ||||
|           -0.4241599142551422, | ||||
|           0.15909206867218018, | ||||
|           0.5764641761779785, | ||||
|           -0.07879110425710678, | ||||
|           1.015336513519287, | ||||
|           0.07599356025457382, | ||||
|           -0.7025855779647827, | ||||
|           0.30047643184661865, | ||||
|           -0.35094937682151794, | ||||
|           0.2522146999835968, | ||||
|           -0.2338722199201584, | ||||
|           -0.8326804637908936, | ||||
|           -0.13695412874221802, | ||||
|           -0.03452421352267265, | ||||
|           0.47974953055381775, | ||||
|           -0.18385636806488037, | ||||
|           0.32438594102859497, | ||||
|           0.1797013282775879, | ||||
|           0.787494957447052, | ||||
|           -0.12579888105392456, | ||||
|           -0.07507286965847015, | ||||
|           -0.4389670491218567, | ||||
|           0.2720070779323578, | ||||
|           0.8138866424560547, | ||||
|           0.01974171027541161, | ||||
|           -0.3057698905467987, | ||||
|           -0.6709924936294556, | ||||
|           0.0885881632566452, | ||||
|           -0.2862754464149475, | ||||
|           0.03475658595561981, | ||||
|           -0.1285519152879715, | ||||
|           0.3838353455066681, | ||||
|           -0.2944154739379883, | ||||
|           -0.4204859137535095, | ||||
|           -0.4416137933731079, | ||||
|           0.13426260650157928, | ||||
|           0.36733248829841614, | ||||
|           0.573428750038147, | ||||
|           -0.14928072690963745, | ||||
|           -0.026076916605234143, | ||||
|           0.33286052942276, | ||||
|           -0.5340145826339722, | ||||
|           -0.17279052734375, | ||||
|           -0.01154550164937973, | ||||
|           -0.6620771884918213, | ||||
|           0.18390542268753052, | ||||
|           -0.08265615254640579, | ||||
|           -0.2489682286977768, | ||||
|           0.2429984211921692, | ||||
|           -0.044153645634651184, | ||||
|           -0.986578404903412, | ||||
|           -0.33574509620666504, | ||||
|           -0.5387663841247559, | ||||
|           0.19767941534519196, | ||||
|           0.12540718913078308, | ||||
|           -0.3403128981590271, | ||||
|           -0.4154576361179352, | ||||
|           0.17275673151016235, | ||||
|           0.09407442808151244, | ||||
|           -0.5414086580276489, | ||||
|           0.4393929839134216, | ||||
|           0.1725579798221588, | ||||
|           -0.4998118281364441, | ||||
|           -0.6926208138465881, | ||||
|           0.16552448272705078, | ||||
|           0.6659538149833679, | ||||
|           -0.10949844866991044, | ||||
|           0.986426830291748, | ||||
|           0.01748848147690296, | ||||
|           0.4003709554672241, | ||||
|           -0.5430638194084167, | ||||
|           0.35347291827201843, | ||||
|           0.6887399554252625, | ||||
|           0.08274628221988678, | ||||
|           0.13407137989997864, | ||||
|           -0.591465950012207, | ||||
|           0.3446292281150818, | ||||
|           0.6069018244743347, | ||||
|           0.1935492902994156, | ||||
|           -0.0989871397614479, | ||||
|           0.07008486241102219, | ||||
|           -0.8503749370574951, | ||||
|           -0.09507356584072112, | ||||
|           0.6259510517120361, | ||||
|           0.13934025168418884, | ||||
|           0.06392545253038406, | ||||
|           -0.4112265408039093, | ||||
|           -0.08475656062364578, | ||||
|           0.4974113404750824, | ||||
|           -0.30606114864349365, | ||||
|           1.111435890197754, | ||||
|           -0.018766529858112335, | ||||
|           -0.8422622680664063, | ||||
|           0.4325508773326874, | ||||
|           -0.2832120656967163, | ||||
|           -0.4859798848628998, | ||||
|           -0.41498348116874695, | ||||
|           0.015977520495653152, | ||||
|           0.5292825698852539, | ||||
|           0.4538311660289765, | ||||
|           1.1328668594360352, | ||||
|           0.22632671892642975, | ||||
|           0.7918671369552612, | ||||
|           0.33401933312416077, | ||||
|           0.7306135296821594, | ||||
|           0.3548600673675537, | ||||
|           0.12506209313869476, | ||||
|           0.8573207855224609, | ||||
|           -0.5818327069282532, | ||||
|           -0.6953738927841187, | ||||
|           -1.6171947717666626, | ||||
|           -0.1699674427509308, | ||||
|           0.6318262815475464, | ||||
|           -0.05671752244234085, | ||||
|           -0.28145185112953186, | ||||
|           -0.3976689279079437, | ||||
|           -0.2041076272726059, | ||||
|           -0.5495951175689697, | ||||
|           -0.5152917504310608, | ||||
|           -0.9309796094894408, | ||||
|           0.101932130753994, | ||||
|           0.1367802917957306, | ||||
|           0.1490798443555832, | ||||
|           0.5304336547851563, | ||||
|           -0.5082434415817261, | ||||
|           0.06688683480024338, | ||||
|           0.14657628536224365, | ||||
|           -0.782435953617096, | ||||
|           0.2962816655635834, | ||||
|           0.6965363621711731, | ||||
|           0.8496337532997131, | ||||
|           -0.3042965829372406, | ||||
|           0.04343798756599426, | ||||
|           0.0330701619386673, | ||||
|           -0.5662598013877869, | ||||
|           1.1086925268173218, | ||||
|           0.756072998046875, | ||||
|           -0.204134538769722, | ||||
|           0.2404300570487976, | ||||
|           -0.47848284244537354, | ||||
|           1.3659011125564575, | ||||
|           0.5645433068275452, | ||||
|           -0.15836156904697418, | ||||
|           0.43395575881004333, | ||||
|           0.5944653749465942, | ||||
|           1.0043466091156006, | ||||
|           -0.49446743726730347, | ||||
|           -0.5954391360282898, | ||||
|           0.5341240763664246, | ||||
|           0.020598189905285835, | ||||
|           -0.4036853015422821, | ||||
|           0.4473709762096405, | ||||
|           1.1998231410980225, | ||||
|           -0.9317775368690492, | ||||
|           -0.23321466147899628, | ||||
|           0.2052552700042725, | ||||
|           -0.7423108816146851, | ||||
|           -0.19917210936546328, | ||||
|           -0.1722569614648819, | ||||
|           -0.034072667360305786, | ||||
|           -0.00671181408688426, | ||||
|           0.46396249532699585, | ||||
|           -0.1372445821762085, | ||||
|           0.053376372903585434, | ||||
|           0.7392690777778625, | ||||
|           -0.38447609543800354, | ||||
|           0.07497968524694443, | ||||
|           0.5197252631187439, | ||||
|           1.3746477365493774, | ||||
|           0.9060075879096984, | ||||
|           0.20000585913658145, | ||||
|           -0.4053704142570496, | ||||
|           0.7497360110282898, | ||||
|           -0.34087055921554565, | ||||
|           -1.101803183555603, | ||||
|           0.273650586605072, | ||||
|           -0.5125769376754761, | ||||
|           0.22472351789474487, | ||||
|           0.480757474899292, | ||||
|           -0.19845178723335263, | ||||
|           0.8857700824737549, | ||||
|           0.30752456188201904, | ||||
|           1.1109285354614258, | ||||
|           -0.6768012642860413, | ||||
|           0.524367094039917, | ||||
|           -0.22495046257972717, | ||||
|           -0.4224412739276886, | ||||
|           0.40753406286239624, | ||||
|           -0.23133376240730288, | ||||
|           0.3297771215438843, | ||||
|           0.4905449151992798, | ||||
|           -0.6813114285469055, | ||||
|           -0.7543983459472656, | ||||
|           -0.5599071383476257, | ||||
|           0.14351597428321838, | ||||
|           -0.029278717935085297, | ||||
|           -0.3970443606376648, | ||||
|           -0.303079217672348, | ||||
|           0.24161772429943085, | ||||
|           0.008353390730917454, | ||||
|           -0.0062365154735744, | ||||
|           1.0824860334396362, | ||||
|           -0.3704061508178711, | ||||
|           -1.0337258577346802, | ||||
|           0.04638749733567238, | ||||
|           1.163011074066162, | ||||
|           -0.31737643480300903, | ||||
|           0.013986887410283089, | ||||
|           0.19223114848136905, | ||||
|           -0.2260770797729492, | ||||
|           -0.210910826921463, | ||||
|           -1.0191949605941772, | ||||
|           0.22356095910072327, | ||||
|           0.09353553503751756, | ||||
|           0.18096882104873657, | ||||
|           0.14867214858531952, | ||||
|           0.43408671021461487, | ||||
|           -0.33312076330184937, | ||||
|           0.8173948526382446, | ||||
|           0.6428242921829224, | ||||
|           0.20215003192424777, | ||||
|           -0.6634518504142761, | ||||
|           -0.4132290482521057, | ||||
|           0.29815030097961426, | ||||
|           -1.579406976699829, | ||||
|           -0.0981958732008934, | ||||
|           -0.03941014781594277, | ||||
|           0.1709178239107132, | ||||
|           -0.5481140613555908, | ||||
|           -0.5338194966316223, | ||||
|           -0.3528362512588501, | ||||
|           -0.11561278253793716, | ||||
|           -0.21793591976165771, | ||||
|           -1.1570470333099363, | ||||
|           0.2157980799674988, | ||||
|           0.42083489894866943, | ||||
|           0.9639263153076172, | ||||
|           0.09747201204299928, | ||||
|           0.15671424567699432, | ||||
|           0.4034591615200043, | ||||
|           0.6728067994117737, | ||||
|           -0.5216875672340393, | ||||
|           0.09657668322324751, | ||||
|           -0.2416689097881317, | ||||
|           0.747975766658783, | ||||
|           0.1021689772605896, | ||||
|           0.11652665585279463, | ||||
|           -1.0484966039657593, | ||||
|           0.8489304780960083, | ||||
|           0.7169828414916992, | ||||
|           -0.09012343734502792, | ||||
|           -1.3173753023147583, | ||||
|           0.057890523225069046, | ||||
|           -0.006231260951608419, | ||||
|           -0.1018214002251625, | ||||
|           0.936040461063385, | ||||
|           -0.0502331368625164, | ||||
|           -0.4284322261810303, | ||||
|           -0.38209280371665955, | ||||
|           -0.22668412327766416, | ||||
|           0.0782942995429039, | ||||
|           -0.4881664514541626, | ||||
|           0.9268959760665894, | ||||
|           0.001867273123934865, | ||||
|           0.42261114716529846, | ||||
|           0.8283362984657288, | ||||
|           0.4256294071674347, | ||||
|           -0.7965338826179504, | ||||
|           0.4840078353881836, | ||||
|           -0.19861412048339844, | ||||
|           0.33977967500686646, | ||||
|           -0.4604192078113556, | ||||
|           -0.3107339143753052, | ||||
|           -0.2839638590812683, | ||||
|           -1.5734281539916992, | ||||
|           0.005220232997089624, | ||||
|           0.09239906817674635, | ||||
|           -0.7828494906425476, | ||||
|           -0.1397123783826828, | ||||
|           0.2576255202293396, | ||||
|           0.21372435986995697, | ||||
|           -0.23169949650764465, | ||||
|           0.4016408920288086, | ||||
|           -0.462497353553772, | ||||
|           -0.2186472862958908, | ||||
|           -0.5617868900299072, | ||||
|           -0.3649831712245941, | ||||
|           -1.1585862636566162, | ||||
|           -0.08222806453704834, | ||||
|           0.931126832962036, | ||||
|           0.4327389597892761, | ||||
|           -0.46451422572135925, | ||||
|           -0.5430706143379211, | ||||
|           -0.27434298396110535, | ||||
|           -0.9479129314422609, | ||||
|           0.1845661848783493, | ||||
|           0.3972720205783844, | ||||
|           0.4883299469947815, | ||||
|           1.04031240940094 | ||||
|         ] | ||||
|       ], | ||||
|       "userProvided": false | ||||
|     } | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,780 @@ | ||||
| --- | ||||
| source: dump/src/reader/mod.rs | ||||
| expression: document | ||||
| --- | ||||
| { | ||||
|   "id": "e0", | ||||
|   "desc": "overriden vector", | ||||
|   "_vectors": { | ||||
|     "default": [ | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1, | ||||
|       0.1 | ||||
|     ] | ||||
|   } | ||||
| } | ||||
							
								
								
									
										
											BIN
										
									
								
								dump/tests/assets/v6-with-vectors.dump
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										
											BIN
										
									
								
								dump/tests/assets/v6-with-vectors.dump
									
									
									
									
									
										Normal file
									
								
							
										
											Binary file not shown.
										
									
								
							| @@ -31,6 +31,9 @@ use meilisearch_types::milli::heed::CompactionOption; | ||||
| use meilisearch_types::milli::update::{ | ||||
|     IndexDocumentsConfig, IndexDocumentsMethod, IndexerConfig, Settings as MilliSettings, | ||||
| }; | ||||
| use meilisearch_types::milli::vector::parsed_vectors::{ | ||||
|     ExplicitVectors, VectorOrArrayOfVectors, RESERVED_VECTORS_FIELD_NAME, | ||||
| }; | ||||
| use meilisearch_types::milli::{self, Filter}; | ||||
| use meilisearch_types::settings::{apply_settings_to_builder, Settings, Unchecked}; | ||||
| use meilisearch_types::tasks::{Details, IndexSwap, Kind, KindWithContent, Status, Task}; | ||||
| @@ -916,8 +919,55 @@ impl IndexScheduler { | ||||
|                         if self.must_stop_processing.get() { | ||||
|                             return Err(Error::AbortedTask); | ||||
|                         } | ||||
|                         let (_id, doc) = ret?; | ||||
|                         let document = milli::obkv_to_json(&all_fields, &fields_ids_map, doc)?; | ||||
|  | ||||
|                         let (id, doc) = ret?; | ||||
|  | ||||
|                         let mut document = milli::obkv_to_json(&all_fields, &fields_ids_map, doc)?; | ||||
|  | ||||
|                         'inject_vectors: { | ||||
|                             let embeddings = index.embeddings(&rtxn, id)?; | ||||
|  | ||||
|                             if embeddings.is_empty() { | ||||
|                                 break 'inject_vectors; | ||||
|                             } | ||||
|  | ||||
|                             let vectors = document | ||||
|                                 .entry(RESERVED_VECTORS_FIELD_NAME.to_owned()) | ||||
|                                 .or_insert(serde_json::Value::Object(Default::default())); | ||||
|  | ||||
|                             let serde_json::Value::Object(vectors) = vectors else { | ||||
|                                 return Err(milli::Error::UserError( | ||||
|                                     milli::UserError::InvalidVectorsMapType { | ||||
|                                         document_id: { | ||||
|                                             if let Ok(Some(Ok(index))) = index | ||||
|                                                 .external_id_of(&rtxn, std::iter::once(id)) | ||||
|                                                 .map(|it| it.into_iter().next()) | ||||
|                                             { | ||||
|                                                 index | ||||
|                                             } else { | ||||
|                                                 format!("internal docid={id}") | ||||
|                                             } | ||||
|                                         }, | ||||
|                                         value: vectors.clone(), | ||||
|                                     }, | ||||
|                                 ) | ||||
|                                 .into()); | ||||
|                             }; | ||||
|  | ||||
|                             for (embedder_name, embeddings) in embeddings { | ||||
|                                 // don't change the entry if it already exists, because it was user-provided | ||||
|                                 vectors.entry(embedder_name).or_insert_with(|| { | ||||
|                                     let embeddings = ExplicitVectors { | ||||
|                                         embeddings: VectorOrArrayOfVectors::from_array_of_vectors( | ||||
|                                             embeddings, | ||||
|                                         ), | ||||
|                                         user_provided: false, | ||||
|                                     }; | ||||
|                                     serde_json::to_value(embeddings).unwrap() | ||||
|                                 }); | ||||
|                             } | ||||
|                         } | ||||
|  | ||||
|                         index_dumper.push_document(&document)?; | ||||
|                     } | ||||
|  | ||||
|   | ||||
| @@ -1774,6 +1774,7 @@ mod tests { | ||||
|     use big_s::S; | ||||
|     use crossbeam::channel::RecvTimeoutError; | ||||
|     use file_store::File; | ||||
|     use insta::assert_json_snapshot; | ||||
|     use meili_snap::{json_string, snapshot}; | ||||
|     use meilisearch_auth::AuthFilter; | ||||
|     use meilisearch_types::document_formats::DocumentFormatError; | ||||
| @@ -1851,7 +1852,7 @@ mod tests { | ||||
|  | ||||
|             // To be 100% consistent between all test we're going to start the scheduler right now | ||||
|             // and ensure it's in the expected starting state. | ||||
|             let breakpoint = match receiver.recv_timeout(std::time::Duration::from_secs(1)) { | ||||
|             let breakpoint = match receiver.recv_timeout(std::time::Duration::from_secs(10)) { | ||||
|                 Ok(b) => b, | ||||
|                 Err(RecvTimeoutError::Timeout) => { | ||||
|                     panic!("The scheduler seems to be waiting for a new task while your test is waiting for a breakpoint.") | ||||
| @@ -1962,7 +1963,7 @@ mod tests { | ||||
|         fn advance(&mut self) -> Breakpoint { | ||||
|             let (breakpoint_1, b) = match self | ||||
|                 .test_breakpoint_rcv | ||||
|                 .recv_timeout(std::time::Duration::from_secs(5)) | ||||
|                 .recv_timeout(std::time::Duration::from_secs(50)) | ||||
|             { | ||||
|                 Ok(b) => b, | ||||
|                 Err(RecvTimeoutError::Timeout) => { | ||||
| @@ -1983,7 +1984,7 @@ mod tests { | ||||
|  | ||||
|             let (breakpoint_2, b) = match self | ||||
|                 .test_breakpoint_rcv | ||||
|                 .recv_timeout(std::time::Duration::from_secs(5)) | ||||
|                 .recv_timeout(std::time::Duration::from_secs(50)) | ||||
|             { | ||||
|                 Ok(b) => b, | ||||
|                 Err(RecvTimeoutError::Timeout) => { | ||||
| @@ -4982,4 +4983,233 @@ mod tests { | ||||
|         ---------------------------------------------------------------------- | ||||
|         "###); | ||||
|     } | ||||
|  | ||||
|     #[test] | ||||
|     fn import_vectors() { | ||||
|         use meilisearch_types::settings::{Settings, Unchecked}; | ||||
|         use milli::update::Setting; | ||||
|  | ||||
|         let (index_scheduler, mut handle) = IndexScheduler::test(true, vec![]); | ||||
|  | ||||
|         let mut new_settings: Box<Settings<Unchecked>> = Box::default(); | ||||
|         let mut embedders = BTreeMap::default(); | ||||
|         let embedding_settings = milli::vector::settings::EmbeddingSettings { | ||||
|             source: Setting::Set(milli::vector::settings::EmbedderSource::Rest), | ||||
|             api_key: Setting::Set(S("My super secret")), | ||||
|             url: Setting::Set(S("http://localhost:7777")), | ||||
|             dimensions: Setting::Set(384), | ||||
|             ..Default::default() | ||||
|         }; | ||||
|         embedders.insert(S("A_fakerest"), Setting::Set(embedding_settings)); | ||||
|  | ||||
|         let embedding_settings = milli::vector::settings::EmbeddingSettings { | ||||
|             source: Setting::Set(milli::vector::settings::EmbedderSource::HuggingFace), | ||||
|             model: Setting::Set(S("sentence-transformers/all-MiniLM-L6-v2")), | ||||
|             revision: Setting::Set(S("e4ce9877abf3edfe10b0d82785e83bdcb973e22e")), | ||||
|             document_template: Setting::Set(S("{{doc.doggo}} the {{doc.breed}} best doggo")), | ||||
|             ..Default::default() | ||||
|         }; | ||||
|         embedders.insert(S("B_small_hf"), Setting::Set(embedding_settings)); | ||||
|  | ||||
|         new_settings.embedders = Setting::Set(embedders); | ||||
|  | ||||
|         index_scheduler | ||||
|             .register( | ||||
|                 KindWithContent::SettingsUpdate { | ||||
|                     index_uid: S("doggos"), | ||||
|                     new_settings, | ||||
|                     is_deletion: false, | ||||
|                     allow_index_creation: true, | ||||
|                 }, | ||||
|                 None, | ||||
|                 false, | ||||
|             ) | ||||
|             .unwrap(); | ||||
|         index_scheduler.assert_internally_consistent(); | ||||
|  | ||||
|         snapshot!(snapshot_index_scheduler(&index_scheduler), name: "after_registering_settings_task_vectors"); | ||||
|  | ||||
|         { | ||||
|             let rtxn = index_scheduler.read_txn().unwrap(); | ||||
|             let task = index_scheduler.get_task(&rtxn, 0).unwrap().unwrap(); | ||||
|             let task = meilisearch_types::task_view::TaskView::from_task(&task); | ||||
|             insta::assert_json_snapshot!(task.details); | ||||
|         } | ||||
|  | ||||
|         handle.advance_n_successful_batches(1); | ||||
|         snapshot!(snapshot_index_scheduler(&index_scheduler), name: "settings_update_processed_vectors"); | ||||
|  | ||||
|         { | ||||
|             let rtxn = index_scheduler.read_txn().unwrap(); | ||||
|             let task = index_scheduler.get_task(&rtxn, 0).unwrap().unwrap(); | ||||
|             let task = meilisearch_types::task_view::TaskView::from_task(&task); | ||||
|             insta::assert_json_snapshot!(task.details); | ||||
|         } | ||||
|  | ||||
|         let (fakerest_name, simple_hf_name, beagle_embed, lab_embed, patou_embed) = { | ||||
|             let index = index_scheduler.index("doggos").unwrap(); | ||||
|             let rtxn = index.read_txn().unwrap(); | ||||
|  | ||||
|             let configs = index.embedding_configs(&rtxn).unwrap(); | ||||
|             // for consistency with the below | ||||
|             #[allow(clippy::get_first)] | ||||
|             let (name, fakerest_config) = configs.get(0).unwrap(); | ||||
|             insta::assert_json_snapshot!(name, @r###""A_fakerest""###); | ||||
|             insta::assert_json_snapshot!(fakerest_config.embedder_options); | ||||
|             let fakerest_name = name.clone(); | ||||
|  | ||||
|             let (name, simple_hf_config) = configs.get(1).unwrap(); | ||||
|             insta::assert_json_snapshot!(name, @r###""B_small_hf""###); | ||||
|             insta::assert_json_snapshot!(simple_hf_config.embedder_options); | ||||
|             let simple_hf_name = name.clone(); | ||||
|  | ||||
|             let configs = index_scheduler.embedders(configs).unwrap(); | ||||
|             let (hf_embedder, _) = configs.get(&simple_hf_name).unwrap(); | ||||
|             let beagle_embed = hf_embedder.embed_one(S("Intel the beagle best doggo")).unwrap(); | ||||
|             let lab_embed = hf_embedder.embed_one(S("Max the lab best doggo")).unwrap(); | ||||
|             let patou_embed = hf_embedder.embed_one(S("kefir the patou best doggo")).unwrap(); | ||||
|             (fakerest_name, simple_hf_name, beagle_embed, lab_embed, patou_embed) | ||||
|         }; | ||||
|  | ||||
|         // add one doc, specifying vectors | ||||
|  | ||||
|         let doc = serde_json::json!( | ||||
|                     { | ||||
|                         "id": 0, | ||||
|                         "doggo": "Intel", | ||||
|                         "breed": "beagle", | ||||
|                         "_vectors": { | ||||
|                             &fakerest_name: { | ||||
|                                 // this will never trigger regeneration, which is good because we can't actually generate with | ||||
|                                 // this embedder | ||||
|                                 "userProvided": true, | ||||
|                                 "embeddings": beagle_embed, | ||||
|                             }, | ||||
|                             &simple_hf_name: { | ||||
|                                 // this will be regenerated on updates | ||||
|                                 "userProvided": false, | ||||
|                                 "embeddings": lab_embed, | ||||
|                             }, | ||||
|                             "noise": [0.1, 0.2, 0.3] | ||||
|                         } | ||||
|                     } | ||||
|         ); | ||||
|  | ||||
|         let (uuid, mut file) = index_scheduler.create_update_file_with_uuid(0u128).unwrap(); | ||||
|         let documents_count = read_json(doc.to_string().as_bytes(), &mut file).unwrap(); | ||||
|         assert_eq!(documents_count, 1); | ||||
|         file.persist().unwrap(); | ||||
|  | ||||
|         index_scheduler | ||||
|             .register( | ||||
|                 KindWithContent::DocumentAdditionOrUpdate { | ||||
|                     index_uid: S("doggos"), | ||||
|                     primary_key: Some(S("id")), | ||||
|                     method: UpdateDocuments, | ||||
|                     content_file: uuid, | ||||
|                     documents_count, | ||||
|                     allow_index_creation: true, | ||||
|                 }, | ||||
|                 None, | ||||
|                 false, | ||||
|             ) | ||||
|             .unwrap(); | ||||
|         index_scheduler.assert_internally_consistent(); | ||||
|  | ||||
|         snapshot!(snapshot_index_scheduler(&index_scheduler), name: "after adding Intel"); | ||||
|  | ||||
|         handle.advance_one_successful_batch(); | ||||
|  | ||||
|         snapshot!(snapshot_index_scheduler(&index_scheduler), name: "adding Intel succeeds"); | ||||
|  | ||||
|         // check embeddings | ||||
|         { | ||||
|             let index = index_scheduler.index("doggos").unwrap(); | ||||
|             let rtxn = index.read_txn().unwrap(); | ||||
|  | ||||
|             let embeddings = index.embeddings(&rtxn, 0).unwrap(); | ||||
|  | ||||
|             assert_json_snapshot!(embeddings[&simple_hf_name][0] == lab_embed, @"true"); | ||||
|             assert_json_snapshot!(embeddings[&fakerest_name][0] == beagle_embed, @"true"); | ||||
|  | ||||
|             let doc = index.documents(&rtxn, std::iter::once(0)).unwrap()[0].1; | ||||
|             let fields_ids_map = index.fields_ids_map(&rtxn).unwrap(); | ||||
|             let doc = obkv_to_json( | ||||
|                 &[ | ||||
|                     fields_ids_map.id("doggo").unwrap(), | ||||
|                     fields_ids_map.id("breed").unwrap(), | ||||
|                     fields_ids_map.id("_vectors").unwrap(), | ||||
|                 ], | ||||
|                 &fields_ids_map, | ||||
|                 doc, | ||||
|             ) | ||||
|             .unwrap(); | ||||
|             assert_json_snapshot!(doc, {"._vectors.A_fakerest.embeddings" => "[vector]"}); | ||||
|         } | ||||
|  | ||||
|         // update the doc, specifying vectors | ||||
|  | ||||
|         let doc = serde_json::json!( | ||||
|                     { | ||||
|                         "id": 0, | ||||
|                         "doggo": "kefir", | ||||
|                         "breed": "patou", | ||||
|                     } | ||||
|         ); | ||||
|  | ||||
|         let (uuid, mut file) = index_scheduler.create_update_file_with_uuid(1u128).unwrap(); | ||||
|         let documents_count = read_json(doc.to_string().as_bytes(), &mut file).unwrap(); | ||||
|         assert_eq!(documents_count, 1); | ||||
|         file.persist().unwrap(); | ||||
|  | ||||
|         index_scheduler | ||||
|             .register( | ||||
|                 KindWithContent::DocumentAdditionOrUpdate { | ||||
|                     index_uid: S("doggos"), | ||||
|                     primary_key: None, | ||||
|                     method: UpdateDocuments, | ||||
|                     content_file: uuid, | ||||
|                     documents_count, | ||||
|                     allow_index_creation: true, | ||||
|                 }, | ||||
|                 None, | ||||
|                 false, | ||||
|             ) | ||||
|             .unwrap(); | ||||
|         index_scheduler.assert_internally_consistent(); | ||||
|  | ||||
|         snapshot!(snapshot_index_scheduler(&index_scheduler), name: "Intel to kefir"); | ||||
|  | ||||
|         handle.advance_one_successful_batch(); | ||||
|         snapshot!(snapshot_index_scheduler(&index_scheduler), name: "Intel to kefir succeeds"); | ||||
|  | ||||
|         { | ||||
|             // check embeddings | ||||
|             { | ||||
|                 let index = index_scheduler.index("doggos").unwrap(); | ||||
|                 let rtxn = index.read_txn().unwrap(); | ||||
|  | ||||
|                 let embeddings = index.embeddings(&rtxn, 0).unwrap(); | ||||
|  | ||||
|                 // automatically changed to patou | ||||
|                 assert_json_snapshot!(embeddings[&simple_hf_name][0] == patou_embed, @"true"); | ||||
|                 // remained beagle because set to userProvided | ||||
|                 assert_json_snapshot!(embeddings[&fakerest_name][0] == beagle_embed, @"true"); | ||||
|  | ||||
|                 let doc = index.documents(&rtxn, std::iter::once(0)).unwrap()[0].1; | ||||
|                 let fields_ids_map = index.fields_ids_map(&rtxn).unwrap(); | ||||
|                 let doc = obkv_to_json( | ||||
|                     &[ | ||||
|                         fields_ids_map.id("doggo").unwrap(), | ||||
|                         fields_ids_map.id("breed").unwrap(), | ||||
|                         fields_ids_map.id("_vectors").unwrap(), | ||||
|                     ], | ||||
|                     &fields_ids_map, | ||||
|                     doc, | ||||
|                 ) | ||||
|                 .unwrap(); | ||||
|                 assert_json_snapshot!(doc, {"._vectors.A_fakerest.embeddings" => "[vector]"}); | ||||
|             } | ||||
|         } | ||||
|     } | ||||
| } | ||||
|   | ||||
| @@ -0,0 +1,19 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| expression: doc | ||||
| --- | ||||
| { | ||||
|   "doggo": "kefir", | ||||
|   "breed": "patou", | ||||
|   "_vectors": { | ||||
|     "A_fakerest": { | ||||
|       "embeddings": "[vector]", | ||||
|       "userProvided": true | ||||
|     }, | ||||
|     "noise": [ | ||||
|       0.1, | ||||
|       0.2, | ||||
|       0.3 | ||||
|     ] | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,20 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| expression: task.details | ||||
| --- | ||||
| { | ||||
|   "embedders": { | ||||
|     "A_fakerest": { | ||||
|       "source": "rest", | ||||
|       "apiKey": "MyXXXX...", | ||||
|       "dimensions": 384, | ||||
|       "url": "http://localhost:7777" | ||||
|     }, | ||||
|     "B_small_hf": { | ||||
|       "source": "huggingFace", | ||||
|       "model": "sentence-transformers/all-MiniLM-L6-v2", | ||||
|       "revision": "e4ce9877abf3edfe10b0d82785e83bdcb973e22e", | ||||
|       "documentTemplate": "{{doc.doggo}} the {{doc.breed}} best doggo" | ||||
|     } | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,23 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| expression: fakerest_config.embedder_options | ||||
| --- | ||||
| { | ||||
|   "Rest": { | ||||
|     "api_key": "My super secret", | ||||
|     "distribution": null, | ||||
|     "dimensions": 384, | ||||
|     "url": "http://localhost:7777", | ||||
|     "query": null, | ||||
|     "input_field": [ | ||||
|       "input" | ||||
|     ], | ||||
|     "path_to_embeddings": [ | ||||
|       "data" | ||||
|     ], | ||||
|     "embedding_object": [ | ||||
|       "embedding" | ||||
|     ], | ||||
|     "input_type": "text" | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,11 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| expression: simple_hf_config.embedder_options | ||||
| --- | ||||
| { | ||||
|   "HuggingFace": { | ||||
|     "model": "sentence-transformers/all-MiniLM-L6-v2", | ||||
|     "revision": "e4ce9877abf3edfe10b0d82785e83bdcb973e22e", | ||||
|     "distribution": null | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,19 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| expression: doc | ||||
| --- | ||||
| { | ||||
|   "doggo": "Intel", | ||||
|   "breed": "beagle", | ||||
|   "_vectors": { | ||||
|     "A_fakerest": { | ||||
|       "embeddings": "[vector]", | ||||
|       "userProvided": true | ||||
|     }, | ||||
|     "noise": [ | ||||
|       0.1, | ||||
|       0.2, | ||||
|       0.3 | ||||
|     ] | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,20 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| expression: task.details | ||||
| --- | ||||
| { | ||||
|   "embedders": { | ||||
|     "A_fakerest": { | ||||
|       "source": "rest", | ||||
|       "apiKey": "MyXXXX...", | ||||
|       "dimensions": 384, | ||||
|       "url": "http://localhost:7777" | ||||
|     }, | ||||
|     "B_small_hf": { | ||||
|       "source": "huggingFace", | ||||
|       "model": "sentence-transformers/all-MiniLM-L6-v2", | ||||
|       "revision": "e4ce9877abf3edfe10b0d82785e83bdcb973e22e", | ||||
|       "documentTemplate": "{{doc.doggo}} the {{doc.breed}} best doggo" | ||||
|     } | ||||
|   } | ||||
| } | ||||
| @@ -0,0 +1,49 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| --- | ||||
| ### Autobatching Enabled = true | ||||
| ### Processing Tasks: | ||||
| [] | ||||
| ---------------------------------------------------------------------- | ||||
| ### All Tasks: | ||||
| 0 {uid: 0, status: succeeded, details: { settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> } }, kind: SettingsUpdate { index_uid: "doggos", new_settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> }, is_deletion: false, allow_index_creation: true }} | ||||
| 1 {uid: 1, status: succeeded, details: { received_documents: 1, indexed_documents: Some(1) }, kind: DocumentAdditionOrUpdate { index_uid: "doggos", primary_key: Some("id"), method: UpdateDocuments, content_file: 00000000-0000-0000-0000-000000000000, documents_count: 1, allow_index_creation: true }} | ||||
| 2 {uid: 2, status: succeeded, details: { received_documents: 1, indexed_documents: Some(1) }, kind: DocumentAdditionOrUpdate { index_uid: "doggos", primary_key: None, method: UpdateDocuments, content_file: 00000000-0000-0000-0000-000000000001, documents_count: 1, allow_index_creation: true }} | ||||
| ---------------------------------------------------------------------- | ||||
| ### Status: | ||||
| enqueued [] | ||||
| succeeded [0,1,2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Kind: | ||||
| "documentAdditionOrUpdate" [1,2,] | ||||
| "settingsUpdate" [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Tasks: | ||||
| doggos [0,1,2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Mapper: | ||||
| doggos: { number_of_documents: 1, field_distribution: {"_vectors": 1, "breed": 1, "doggo": 1, "id": 1} } | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Canceled By: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Enqueued At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| [timestamp] [2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Started At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| [timestamp] [2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Finished At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| [timestamp] [2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### File Store: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
|  | ||||
| @@ -0,0 +1,48 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| --- | ||||
| ### Autobatching Enabled = true | ||||
| ### Processing Tasks: | ||||
| [] | ||||
| ---------------------------------------------------------------------- | ||||
| ### All Tasks: | ||||
| 0 {uid: 0, status: succeeded, details: { settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> } }, kind: SettingsUpdate { index_uid: "doggos", new_settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> }, is_deletion: false, allow_index_creation: true }} | ||||
| 1 {uid: 1, status: succeeded, details: { received_documents: 1, indexed_documents: Some(1) }, kind: DocumentAdditionOrUpdate { index_uid: "doggos", primary_key: Some("id"), method: UpdateDocuments, content_file: 00000000-0000-0000-0000-000000000000, documents_count: 1, allow_index_creation: true }} | ||||
| 2 {uid: 2, status: enqueued, details: { received_documents: 1, indexed_documents: None }, kind: DocumentAdditionOrUpdate { index_uid: "doggos", primary_key: None, method: UpdateDocuments, content_file: 00000000-0000-0000-0000-000000000001, documents_count: 1, allow_index_creation: true }} | ||||
| ---------------------------------------------------------------------- | ||||
| ### Status: | ||||
| enqueued [2,] | ||||
| succeeded [0,1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Kind: | ||||
| "documentAdditionOrUpdate" [1,2,] | ||||
| "settingsUpdate" [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Tasks: | ||||
| doggos [0,1,2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Mapper: | ||||
| doggos: { number_of_documents: 1, field_distribution: {"_vectors": 1, "breed": 1, "doggo": 1, "id": 1} } | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Canceled By: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Enqueued At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| [timestamp] [2,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Started At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Finished At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### File Store: | ||||
| 00000000-0000-0000-0000-000000000001 | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
|  | ||||
| @@ -0,0 +1,45 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| --- | ||||
| ### Autobatching Enabled = true | ||||
| ### Processing Tasks: | ||||
| [] | ||||
| ---------------------------------------------------------------------- | ||||
| ### All Tasks: | ||||
| 0 {uid: 0, status: succeeded, details: { settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> } }, kind: SettingsUpdate { index_uid: "doggos", new_settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> }, is_deletion: false, allow_index_creation: true }} | ||||
| 1 {uid: 1, status: succeeded, details: { received_documents: 1, indexed_documents: Some(1) }, kind: DocumentAdditionOrUpdate { index_uid: "doggos", primary_key: Some("id"), method: UpdateDocuments, content_file: 00000000-0000-0000-0000-000000000000, documents_count: 1, allow_index_creation: true }} | ||||
| ---------------------------------------------------------------------- | ||||
| ### Status: | ||||
| enqueued [] | ||||
| succeeded [0,1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Kind: | ||||
| "documentAdditionOrUpdate" [1,] | ||||
| "settingsUpdate" [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Tasks: | ||||
| doggos [0,1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Mapper: | ||||
| doggos: { number_of_documents: 1, field_distribution: {"_vectors": 1, "breed": 1, "doggo": 1, "id": 1} } | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Canceled By: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Enqueued At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Started At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Finished At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### File Store: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
|  | ||||
| @@ -0,0 +1,44 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| --- | ||||
| ### Autobatching Enabled = true | ||||
| ### Processing Tasks: | ||||
| [] | ||||
| ---------------------------------------------------------------------- | ||||
| ### All Tasks: | ||||
| 0 {uid: 0, status: succeeded, details: { settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> } }, kind: SettingsUpdate { index_uid: "doggos", new_settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> }, is_deletion: false, allow_index_creation: true }} | ||||
| 1 {uid: 1, status: enqueued, details: { received_documents: 1, indexed_documents: None }, kind: DocumentAdditionOrUpdate { index_uid: "doggos", primary_key: Some("id"), method: UpdateDocuments, content_file: 00000000-0000-0000-0000-000000000000, documents_count: 1, allow_index_creation: true }} | ||||
| ---------------------------------------------------------------------- | ||||
| ### Status: | ||||
| enqueued [1,] | ||||
| succeeded [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Kind: | ||||
| "documentAdditionOrUpdate" [1,] | ||||
| "settingsUpdate" [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Tasks: | ||||
| doggos [0,1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Mapper: | ||||
| doggos: { number_of_documents: 0, field_distribution: {} } | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Canceled By: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Enqueued At: | ||||
| [timestamp] [0,] | ||||
| [timestamp] [1,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Started At: | ||||
| [timestamp] [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Finished At: | ||||
| [timestamp] [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### File Store: | ||||
| 00000000-0000-0000-0000-000000000000 | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
|  | ||||
| @@ -0,0 +1,36 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| --- | ||||
| ### Autobatching Enabled = true | ||||
| ### Processing Tasks: | ||||
| [] | ||||
| ---------------------------------------------------------------------- | ||||
| ### All Tasks: | ||||
| 0 {uid: 0, status: enqueued, details: { settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> } }, kind: SettingsUpdate { index_uid: "doggos", new_settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> }, is_deletion: false, allow_index_creation: true }} | ||||
| ---------------------------------------------------------------------- | ||||
| ### Status: | ||||
| enqueued [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Kind: | ||||
| "settingsUpdate" [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Tasks: | ||||
| doggos [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Mapper: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Canceled By: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Enqueued At: | ||||
| [timestamp] [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Started At: | ||||
| ---------------------------------------------------------------------- | ||||
| ### Finished At: | ||||
| ---------------------------------------------------------------------- | ||||
| ### File Store: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
|  | ||||
| @@ -0,0 +1,40 @@ | ||||
| --- | ||||
| source: index-scheduler/src/lib.rs | ||||
| --- | ||||
| ### Autobatching Enabled = true | ||||
| ### Processing Tasks: | ||||
| [] | ||||
| ---------------------------------------------------------------------- | ||||
| ### All Tasks: | ||||
| 0 {uid: 0, status: succeeded, details: { settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> } }, kind: SettingsUpdate { index_uid: "doggos", new_settings: Settings { displayed_attributes: WildcardSetting(NotSet), searchable_attributes: WildcardSetting(NotSet), filterable_attributes: NotSet, sortable_attributes: NotSet, ranking_rules: NotSet, stop_words: NotSet, non_separator_tokens: NotSet, separator_tokens: NotSet, dictionary: NotSet, synonyms: NotSet, distinct_attribute: NotSet, proximity_precision: NotSet, typo_tolerance: NotSet, faceting: NotSet, pagination: NotSet, embedders: Set({"A_fakerest": Set(EmbeddingSettings { source: Set(Rest), model: NotSet, revision: NotSet, api_key: Set("My super secret"), dimensions: Set(384), document_template: NotSet, url: Set("http://localhost:7777"), query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet }), "B_small_hf": Set(EmbeddingSettings { source: Set(HuggingFace), model: Set("sentence-transformers/all-MiniLM-L6-v2"), revision: Set("e4ce9877abf3edfe10b0d82785e83bdcb973e22e"), api_key: NotSet, dimensions: NotSet, document_template: Set("{{doc.doggo}} the {{doc.breed}} best doggo"), url: NotSet, query: NotSet, input_field: NotSet, path_to_embeddings: NotSet, embedding_object: NotSet, input_type: NotSet, distribution: NotSet })}), search_cutoff_ms: NotSet, _kind: PhantomData<meilisearch_types::settings::Unchecked> }, is_deletion: false, allow_index_creation: true }} | ||||
| ---------------------------------------------------------------------- | ||||
| ### Status: | ||||
| enqueued [] | ||||
| succeeded [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Kind: | ||||
| "settingsUpdate" [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Tasks: | ||||
| doggos [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Index Mapper: | ||||
| doggos: { number_of_documents: 0, field_distribution: {} } | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Canceled By: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
| ### Enqueued At: | ||||
| [timestamp] [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Started At: | ||||
| [timestamp] [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### Finished At: | ||||
| [timestamp] [0,] | ||||
| ---------------------------------------------------------------------- | ||||
| ### File Store: | ||||
|  | ||||
| ---------------------------------------------------------------------- | ||||
|  | ||||
| @@ -384,7 +384,6 @@ impl ErrorCode for milli::Error { | ||||
|                     UserError::InvalidGeoField { .. } => Code::InvalidDocumentGeoField, | ||||
|                     UserError::InvalidVectorDimensions { .. } => Code::InvalidVectorDimensions, | ||||
|                     UserError::InvalidVectorsMapType { .. } => Code::InvalidVectorsType, | ||||
|                     UserError::InvalidVectorsType { .. } => Code::InvalidVectorsType, | ||||
|                     UserError::TooManyVectors(_, _) => Code::TooManyVectors, | ||||
|                     UserError::SortError(_) => Code::InvalidSearchSort, | ||||
|                     UserError::InvalidMinTypoWordLenSetting(_, _) => { | ||||
|   | ||||
| @@ -5,7 +5,10 @@ use crate::common::index::Index; | ||||
| use crate::common::{Server, Value}; | ||||
| use crate::json; | ||||
|  | ||||
| async fn index_with_documents<'a>(server: &'a Server, documents: &Value) -> Index<'a> { | ||||
| async fn index_with_documents_user_provided<'a>( | ||||
|     server: &'a Server, | ||||
|     documents: &Value, | ||||
| ) -> Index<'a> { | ||||
|     let index = server.index("test"); | ||||
|  | ||||
|     let (response, code) = server.set_features(json!({"vectorStore": true})).await; | ||||
| @@ -34,7 +37,39 @@ async fn index_with_documents<'a>(server: &'a Server, documents: &Value) -> Inde | ||||
|     index | ||||
| } | ||||
|  | ||||
| static SIMPLE_SEARCH_DOCUMENTS: Lazy<Value> = Lazy::new(|| { | ||||
| async fn index_with_documents_hf<'a>(server: &'a Server, documents: &Value) -> Index<'a> { | ||||
|     let index = server.index("test"); | ||||
|  | ||||
|     let (response, code) = server.set_features(json!({"vectorStore": true})).await; | ||||
|  | ||||
|     meili_snap::snapshot!(code, @"200 OK"); | ||||
|     meili_snap::snapshot!(meili_snap::json_string!(response), @r###" | ||||
|     { | ||||
|       "vectorStore": true, | ||||
|       "metrics": false, | ||||
|       "logsRoute": false, | ||||
|       "exportPuffinReports": false | ||||
|     } | ||||
|     "###); | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .update_settings(json!({ "embedders": {"default": { | ||||
|             "source": "huggingFace", | ||||
|             "model": "sentence-transformers/all-MiniLM-L6-v2", | ||||
|             "revision": "e4ce9877abf3edfe10b0d82785e83bdcb973e22e", | ||||
|             "documentTemplate": "{{doc.title}}, {{doc.desc}}" | ||||
|         }}} )) | ||||
|         .await; | ||||
|     assert_eq!(202, code, "{:?}", response); | ||||
|     index.wait_task(response.uid()).await; | ||||
|  | ||||
|     let (response, code) = index.add_documents(documents.clone(), None).await; | ||||
|     assert_eq!(202, code, "{:?}", response); | ||||
|     index.wait_task(response.uid()).await; | ||||
|     index | ||||
| } | ||||
|  | ||||
| static SIMPLE_SEARCH_DOCUMENTS_VEC: Lazy<Value> = Lazy::new(|| { | ||||
|     json!([ | ||||
|     { | ||||
|         "title": "Shazam!", | ||||
| @@ -56,7 +91,7 @@ static SIMPLE_SEARCH_DOCUMENTS: Lazy<Value> = Lazy::new(|| { | ||||
|     }]) | ||||
| }); | ||||
|  | ||||
| static SINGLE_DOCUMENT: Lazy<Value> = Lazy::new(|| { | ||||
| static SINGLE_DOCUMENT_VEC: Lazy<Value> = Lazy::new(|| { | ||||
|     json!([{ | ||||
|             "title": "Shazam!", | ||||
|             "desc": "a Captain Marvel ersatz", | ||||
| @@ -65,10 +100,29 @@ static SINGLE_DOCUMENT: Lazy<Value> = Lazy::new(|| { | ||||
|     }]) | ||||
| }); | ||||
|  | ||||
| static SIMPLE_SEARCH_DOCUMENTS: Lazy<Value> = Lazy::new(|| { | ||||
|     json!([ | ||||
|     { | ||||
|         "title": "Shazam!", | ||||
|         "desc": "a Captain Marvel ersatz", | ||||
|         "id": "1", | ||||
|     }, | ||||
|     { | ||||
|         "title": "Captain Planet", | ||||
|         "desc": "He's not part of the Marvel Cinematic Universe", | ||||
|         "id": "2", | ||||
|     }, | ||||
|     { | ||||
|         "title": "Captain Marvel", | ||||
|         "desc": "a Shazam ersatz", | ||||
|         "id": "3", | ||||
|     }]) | ||||
| }); | ||||
|  | ||||
| #[actix_rt::test] | ||||
| async fn simple_search() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await; | ||||
|     let index = index_with_documents_user_provided(&server, &SIMPLE_SEARCH_DOCUMENTS_VEC).await; | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post( | ||||
| @@ -98,10 +152,59 @@ async fn simple_search() { | ||||
|     snapshot!(response["semanticHitCount"], @"3"); | ||||
| } | ||||
|  | ||||
| #[actix_rt::test] | ||||
| async fn simple_search_hf() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents_hf(&server, &SIMPLE_SEARCH_DOCUMENTS).await; | ||||
|  | ||||
|     let (response, code) = | ||||
|         index.search_post(json!({"q": "Captain", "hybrid": {"semanticRatio": 0.2}})).await; | ||||
|     snapshot!(code, @"200 OK"); | ||||
|     snapshot!(response["hits"], @r###"[{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2"},{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3"},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1"}]"###); | ||||
|     snapshot!(response["semanticHitCount"], @"0"); | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post( | ||||
|             // disable ranking score as the vectors between architectures are not equal | ||||
|             json!({"q": "Captain", "hybrid": {"semanticRatio": 0.55}, "showRankingScore": false}), | ||||
|         ) | ||||
|         .await; | ||||
|     snapshot!(code, @"200 OK"); | ||||
|     snapshot!(response["hits"], @r###"[{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2"},{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3"},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1"}]"###); | ||||
|     snapshot!(response["semanticHitCount"], @"1"); | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post( | ||||
|             json!({"q": "Captain", "hybrid": {"semanticRatio": 0.8}, "showRankingScore": false}), | ||||
|         ) | ||||
|         .await; | ||||
|     snapshot!(code, @"200 OK"); | ||||
|     snapshot!(response["hits"], @r###"[{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1"},{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3"},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2"}]"###); | ||||
|     snapshot!(response["semanticHitCount"], @"3"); | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post( | ||||
|             json!({"q": "Movie World", "hybrid": {"semanticRatio": 0.2}, "showRankingScore": false}), | ||||
|         ) | ||||
|         .await; | ||||
|     snapshot!(code, @"200 OK"); | ||||
|     snapshot!(response["hits"], @r###"[{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2"},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1"},{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3"}]"###); | ||||
|     snapshot!(response["semanticHitCount"], @"3"); | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post( | ||||
|             json!({"q": "Wonder replacement", "hybrid": {"semanticRatio": 0.2}, "showRankingScore": false}), | ||||
|         ) | ||||
|         .await; | ||||
|     snapshot!(code, @"200 OK"); | ||||
|     snapshot!(response["hits"], @r###"[{"title":"Captain Marvel","desc":"a Shazam ersatz","id":"3"},{"title":"Shazam!","desc":"a Captain Marvel ersatz","id":"1"},{"title":"Captain Planet","desc":"He's not part of the Marvel Cinematic Universe","id":"2"}]"###); | ||||
|     snapshot!(response["semanticHitCount"], @"3"); | ||||
| } | ||||
|  | ||||
| #[actix_rt::test] | ||||
| async fn distribution_shift() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await; | ||||
|     let index = index_with_documents_user_provided(&server, &SIMPLE_SEARCH_DOCUMENTS_VEC).await; | ||||
|  | ||||
|     let search = json!({"q": "Captain", "vector": [1.0, 1.0], "showRankingScore": true, "hybrid": {"semanticRatio": 1.0}}); | ||||
|     let (response, code) = index.search_post(search.clone()).await; | ||||
| @@ -133,7 +236,7 @@ async fn distribution_shift() { | ||||
| #[actix_rt::test] | ||||
| async fn highlighter() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await; | ||||
|     let index = index_with_documents_user_provided(&server, &SIMPLE_SEARCH_DOCUMENTS_VEC).await; | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post(json!({"q": "Captain Marvel", "vector": [1.0, 1.0], | ||||
| @@ -184,7 +287,7 @@ async fn highlighter() { | ||||
| #[actix_rt::test] | ||||
| async fn invalid_semantic_ratio() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await; | ||||
|     let index = index_with_documents_user_provided(&server, &SIMPLE_SEARCH_DOCUMENTS_VEC).await; | ||||
|  | ||||
|     let (response, code) = index | ||||
|         .search_post( | ||||
| @@ -256,7 +359,7 @@ async fn invalid_semantic_ratio() { | ||||
| #[actix_rt::test] | ||||
| async fn single_document() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents(&server, &SINGLE_DOCUMENT).await; | ||||
|     let index = index_with_documents_user_provided(&server, &SINGLE_DOCUMENT_VEC).await; | ||||
|  | ||||
|     let (response, code) = index | ||||
|     .search_post( | ||||
| @@ -272,7 +375,7 @@ async fn single_document() { | ||||
| #[actix_rt::test] | ||||
| async fn query_combination() { | ||||
|     let server = Server::new().await; | ||||
|     let index = index_with_documents(&server, &SIMPLE_SEARCH_DOCUMENTS).await; | ||||
|     let index = index_with_documents_user_provided(&server, &SIMPLE_SEARCH_DOCUMENTS_VEC).await; | ||||
|  | ||||
|     // search without query and vector, but with hybrid => still placeholder | ||||
|     let (response, code) = index | ||||
|   | ||||
| @@ -895,9 +895,9 @@ async fn test_score_details() { | ||||
|                     "id": "166428", | ||||
|                     "_vectors": { | ||||
|                       "manual": [ | ||||
|                         -100, | ||||
|                         231, | ||||
|                         32 | ||||
|                         -100.0, | ||||
|                         231.0, | ||||
|                         32.0 | ||||
|                       ] | ||||
|                     }, | ||||
|                     "_rankingScoreDetails": { | ||||
| @@ -1096,9 +1096,9 @@ async fn experimental_feature_vector_store() { | ||||
|         "id": "287947", | ||||
|         "_vectors": { | ||||
|           "manual": [ | ||||
|             1, | ||||
|             2, | ||||
|             3 | ||||
|             1.0, | ||||
|             2.0, | ||||
|             3.0 | ||||
|           ] | ||||
|         }, | ||||
|         "_rankingScore": 1.0 | ||||
| @@ -1108,9 +1108,9 @@ async fn experimental_feature_vector_store() { | ||||
|         "id": "299537", | ||||
|         "_vectors": { | ||||
|           "manual": [ | ||||
|             1, | ||||
|             2, | ||||
|             54 | ||||
|             1.0, | ||||
|             2.0, | ||||
|             54.0 | ||||
|           ] | ||||
|         }, | ||||
|         "_rankingScore": 0.9129111766815186 | ||||
| @@ -1120,9 +1120,9 @@ async fn experimental_feature_vector_store() { | ||||
|         "id": "450465", | ||||
|         "_vectors": { | ||||
|           "manual": [ | ||||
|             -100, | ||||
|             340, | ||||
|             90 | ||||
|             -100.0, | ||||
|             340.0, | ||||
|             90.0 | ||||
|           ] | ||||
|         }, | ||||
|         "_rankingScore": 0.8106412887573242 | ||||
| @@ -1132,9 +1132,9 @@ async fn experimental_feature_vector_store() { | ||||
|         "id": "166428", | ||||
|         "_vectors": { | ||||
|           "manual": [ | ||||
|             -100, | ||||
|             231, | ||||
|             32 | ||||
|             -100.0, | ||||
|             231.0, | ||||
|             32.0 | ||||
|           ] | ||||
|         }, | ||||
|         "_rankingScore": 0.7412010431289673 | ||||
| @@ -1144,9 +1144,9 @@ async fn experimental_feature_vector_store() { | ||||
|         "id": "522681", | ||||
|         "_vectors": { | ||||
|           "manual": [ | ||||
|             10, | ||||
|             -23, | ||||
|             32 | ||||
|             10.0, | ||||
|             -23.0, | ||||
|             32.0 | ||||
|           ] | ||||
|         }, | ||||
|         "_rankingScore": 0.6972063183784485 | ||||
| @@ -1405,9 +1405,9 @@ async fn simple_search_with_strange_synonyms() { | ||||
|                 "id": "166428", | ||||
|                 "_vectors": { | ||||
|                   "manual": [ | ||||
|                     -100, | ||||
|                     231, | ||||
|                     32 | ||||
|                     -100.0, | ||||
|                     231.0, | ||||
|                     32.0 | ||||
|                   ] | ||||
|                 } | ||||
|               } | ||||
| @@ -1426,9 +1426,9 @@ async fn simple_search_with_strange_synonyms() { | ||||
|                 "id": "166428", | ||||
|                 "_vectors": { | ||||
|                   "manual": [ | ||||
|                     -100, | ||||
|                     231, | ||||
|                     32 | ||||
|                     -100.0, | ||||
|                     231.0, | ||||
|                     32.0 | ||||
|                   ] | ||||
|                 } | ||||
|               } | ||||
| @@ -1447,9 +1447,9 @@ async fn simple_search_with_strange_synonyms() { | ||||
|                 "id": "166428", | ||||
|                 "_vectors": { | ||||
|                   "manual": [ | ||||
|                     -100, | ||||
|                     231, | ||||
|                     32 | ||||
|                     -100.0, | ||||
|                     231.0, | ||||
|                     32.0 | ||||
|                   ] | ||||
|                 } | ||||
|               } | ||||
|   | ||||
| @@ -75,9 +75,9 @@ async fn simple_search_single_index() { | ||||
|             "id": "450465", | ||||
|             "_vectors": { | ||||
|               "manual": [ | ||||
|                 -100, | ||||
|                 340, | ||||
|                 90 | ||||
|                 -100.0, | ||||
|                 340.0, | ||||
|                 90.0 | ||||
|               ] | ||||
|             } | ||||
|           } | ||||
| @@ -96,9 +96,9 @@ async fn simple_search_single_index() { | ||||
|             "id": "299537", | ||||
|             "_vectors": { | ||||
|               "manual": [ | ||||
|                 1, | ||||
|                 2, | ||||
|                 54 | ||||
|                 1.0, | ||||
|                 2.0, | ||||
|                 54.0 | ||||
|               ] | ||||
|             } | ||||
|           } | ||||
| @@ -194,9 +194,9 @@ async fn simple_search_two_indexes() { | ||||
|             "id": "450465", | ||||
|             "_vectors": { | ||||
|               "manual": [ | ||||
|                 -100, | ||||
|                 340, | ||||
|                 90 | ||||
|                 -100.0, | ||||
|                 340.0, | ||||
|                 90.0 | ||||
|               ] | ||||
|             } | ||||
|           } | ||||
| @@ -227,9 +227,9 @@ async fn simple_search_two_indexes() { | ||||
|             "cattos": "pésti", | ||||
|             "_vectors": { | ||||
|               "manual": [ | ||||
|                 1, | ||||
|                 2, | ||||
|                 3 | ||||
|                 1.0, | ||||
|                 2.0, | ||||
|                 3.0 | ||||
|               ] | ||||
|             } | ||||
|           }, | ||||
| @@ -249,9 +249,9 @@ async fn simple_search_two_indexes() { | ||||
|             ], | ||||
|             "_vectors": { | ||||
|               "manual": [ | ||||
|                 1, | ||||
|                 2, | ||||
|                 54 | ||||
|                 1.0, | ||||
|                 2.0, | ||||
|                 54.0 | ||||
|               ] | ||||
|             } | ||||
|           } | ||||
|   | ||||
| @@ -117,10 +117,8 @@ only composed of alphanumeric characters (a-z A-Z 0-9), hyphens (-) and undersco | ||||
|     InvalidGeoField(#[from] GeoError), | ||||
|     #[error("Invalid vector dimensions: expected: `{}`, found: `{}`.", .expected, .found)] | ||||
|     InvalidVectorDimensions { expected: usize, found: usize }, | ||||
|     #[error("The `_vectors.{subfield}` field in the document with id: `{document_id}` is not an array. Was expecting an array of floats or an array of arrays of floats but instead got `{value}`.")] | ||||
|     InvalidVectorsType { document_id: Value, value: Value, subfield: String }, | ||||
|     #[error("The `_vectors` field in the document with id: `{document_id}` is not an object. Was expecting an object with a key for each embedder with manually provided vectors, but instead got `{value}`")] | ||||
|     InvalidVectorsMapType { document_id: Value, value: Value }, | ||||
|     InvalidVectorsMapType { document_id: String, value: Value }, | ||||
|     #[error("{0}")] | ||||
|     InvalidFilter(String), | ||||
|     #[error("Invalid type for filter subexpression: expected: {}, found: {1}.", .0.join(", "))] | ||||
|   | ||||
| @@ -23,7 +23,7 @@ use crate::heed_codec::{ | ||||
| }; | ||||
| use crate::order_by_map::OrderByMap; | ||||
| use crate::proximity::ProximityPrecision; | ||||
| use crate::vector::EmbeddingConfig; | ||||
| use crate::vector::{Embedding, EmbeddingConfig}; | ||||
| use crate::{ | ||||
|     default_criteria, CboRoaringBitmapCodec, Criterion, DocumentId, ExternalDocumentsIds, | ||||
|     FacetDistribution, FieldDistribution, FieldId, FieldIdMapMissingEntry, FieldIdWordCountCodec, | ||||
| @@ -1606,6 +1606,44 @@ impl Index { | ||||
|     pub(crate) fn delete_search_cutoff(&self, wtxn: &mut RwTxn<'_>) -> heed::Result<bool> { | ||||
|         self.main.remap_key_type::<Str>().delete(wtxn, main_key::SEARCH_CUTOFF) | ||||
|     } | ||||
|  | ||||
|     pub fn embeddings( | ||||
|         &self, | ||||
|         rtxn: &RoTxn<'_>, | ||||
|         docid: DocumentId, | ||||
|     ) -> Result<BTreeMap<String, Vec<Embedding>>> { | ||||
|         let mut res = BTreeMap::new(); | ||||
|         for row in self.embedder_category_id.iter(rtxn)? { | ||||
|             let (embedder_name, embedder_id) = row?; | ||||
|             let embedder_id = (embedder_id as u16) << 8; | ||||
|             let mut embeddings = Vec::new(); | ||||
|             'vectors: for i in 0..=u8::MAX { | ||||
|                 let reader = arroy::Reader::open(rtxn, embedder_id | (i as u16), self.vector_arroy) | ||||
|                     .map(Some) | ||||
|                     .or_else(|e| match e { | ||||
|                         arroy::Error::MissingMetadata => Ok(None), | ||||
|                         e => Err(e), | ||||
|                     }) | ||||
|                     .transpose(); | ||||
|  | ||||
|                 let Some(reader) = reader else { | ||||
|                     break 'vectors; | ||||
|                 }; | ||||
|  | ||||
|                 let embedding = reader?.item_vector(rtxn, docid)?; | ||||
|                 if let Some(embedding) = embedding { | ||||
|                     embeddings.push(embedding) | ||||
|                 } else { | ||||
|                     break 'vectors; | ||||
|                 } | ||||
|             } | ||||
|  | ||||
|             if !embeddings.is_empty() { | ||||
|                 res.insert(embedder_name.to_owned(), embeddings); | ||||
|             } | ||||
|         } | ||||
|         Ok(res) | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[cfg(test)] | ||||
|   | ||||
| @@ -362,35 +362,6 @@ pub fn normalize_facet(original: &str) -> String { | ||||
|     CompatibilityDecompositionNormalizer.normalize_str(original.trim()).to_lowercase() | ||||
| } | ||||
|  | ||||
| /// Represents either a vector or an array of multiple vectors. | ||||
| #[derive(serde::Serialize, serde::Deserialize, Debug)] | ||||
| #[serde(transparent)] | ||||
| pub struct VectorOrArrayOfVectors { | ||||
|     #[serde(with = "either::serde_untagged_optional")] | ||||
|     inner: Option<either::Either<Vec<f32>, Vec<Vec<f32>>>>, | ||||
| } | ||||
|  | ||||
| impl VectorOrArrayOfVectors { | ||||
|     pub fn into_array_of_vectors(self) -> Option<Vec<Vec<f32>>> { | ||||
|         match self.inner? { | ||||
|             either::Either::Left(vector) => Some(vec![vector]), | ||||
|             either::Either::Right(vectors) => Some(vectors), | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| /// Normalize a vector by dividing the dimensions by the length of it. | ||||
| pub fn normalize_vector(mut vector: Vec<f32>) -> Vec<f32> { | ||||
|     let squared: f32 = vector.iter().map(|x| x * x).sum(); | ||||
|     let length = squared.sqrt(); | ||||
|     if length <= f32::EPSILON { | ||||
|         vector | ||||
|     } else { | ||||
|         vector.iter_mut().for_each(|x| *x /= length); | ||||
|         vector | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[cfg(test)] | ||||
| mod tests { | ||||
|     use serde_json::json; | ||||
|   | ||||
| @@ -10,16 +10,16 @@ use bytemuck::cast_slice; | ||||
| use grenad::Writer; | ||||
| use itertools::EitherOrBoth; | ||||
| use ordered_float::OrderedFloat; | ||||
| use serde_json::{from_slice, Value}; | ||||
| use serde_json::Value; | ||||
|  | ||||
| use super::helpers::{create_writer, writer_into_reader, GrenadParameters}; | ||||
| use crate::error::UserError; | ||||
| use crate::prompt::Prompt; | ||||
| use crate::update::del_add::{DelAdd, KvReaderDelAdd, KvWriterDelAdd}; | ||||
| use crate::update::index_documents::helpers::try_split_at; | ||||
| use crate::update::settings::InnerIndexSettingsDiff; | ||||
| use crate::vector::parsed_vectors::{ParsedVectorsDiff, RESERVED_VECTORS_FIELD_NAME}; | ||||
| use crate::vector::Embedder; | ||||
| use crate::{DocumentId, InternalError, Result, ThreadPoolNoAbort, VectorOrArrayOfVectors}; | ||||
| use crate::{DocumentId, Result, ThreadPoolNoAbort}; | ||||
|  | ||||
| /// The length of the elements that are always in the buffer when inserting new values. | ||||
| const TRUNCATE_SIZE: usize = size_of::<DocumentId>(); | ||||
| @@ -31,6 +31,10 @@ pub struct ExtractedVectorPoints { | ||||
|     pub remove_vectors: grenad::Reader<BufReader<File>>, | ||||
|     // docid -> prompt | ||||
|     pub prompts: grenad::Reader<BufReader<File>>, | ||||
|  | ||||
|     // embedder | ||||
|     pub embedder_name: String, | ||||
|     pub embedder: Arc<Embedder>, | ||||
| } | ||||
|  | ||||
| enum VectorStateDelta { | ||||
| @@ -65,6 +69,19 @@ impl VectorStateDelta { | ||||
|     } | ||||
| } | ||||
|  | ||||
| struct EmbedderVectorExtractor { | ||||
|     embedder_name: String, | ||||
|     embedder: Arc<Embedder>, | ||||
|     prompt: Arc<Prompt>, | ||||
|  | ||||
|     // (docid, _index) -> KvWriterDelAdd -> Vector | ||||
|     manual_vectors_writer: Writer<BufWriter<File>>, | ||||
|     // (docid) -> (prompt) | ||||
|     prompts_writer: Writer<BufWriter<File>>, | ||||
|     // (docid) -> () | ||||
|     remove_vectors_writer: Writer<BufWriter<File>>, | ||||
| } | ||||
|  | ||||
| /// Extracts the embedding vector contained in each document under the `_vectors` field. | ||||
| /// | ||||
| /// Returns the generated grenad reader containing the docid as key associated to the Vec<f32> | ||||
| @@ -73,34 +90,54 @@ pub fn extract_vector_points<R: io::Read + io::Seek>( | ||||
|     obkv_documents: grenad::Reader<R>, | ||||
|     indexer: GrenadParameters, | ||||
|     settings_diff: &InnerIndexSettingsDiff, | ||||
|     prompt: &Prompt, | ||||
|     embedder_name: &str, | ||||
| ) -> Result<ExtractedVectorPoints> { | ||||
| ) -> Result<Vec<ExtractedVectorPoints>> { | ||||
|     puffin::profile_function!(); | ||||
|  | ||||
|     let reindex_vectors = settings_diff.reindex_vectors(); | ||||
|  | ||||
|     let old_fields_ids_map = &settings_diff.old.fields_ids_map; | ||||
|     let new_fields_ids_map = &settings_diff.new.fields_ids_map; | ||||
|     // the vector field id may have changed | ||||
|     let old_vectors_fid = old_fields_ids_map.id(RESERVED_VECTORS_FIELD_NAME); | ||||
|     // filter the old vector fid if the settings has been changed forcing reindexing. | ||||
|     let old_vectors_fid = old_vectors_fid.filter(|_| !reindex_vectors); | ||||
|  | ||||
|     // (docid, _index) -> KvWriterDelAdd -> Vector | ||||
|     let mut manual_vectors_writer = create_writer( | ||||
|         indexer.chunk_compression_type, | ||||
|         indexer.chunk_compression_level, | ||||
|         tempfile::tempfile()?, | ||||
|     ); | ||||
|     let new_vectors_fid = new_fields_ids_map.id(RESERVED_VECTORS_FIELD_NAME); | ||||
|  | ||||
|     // (docid) -> (prompt) | ||||
|     let mut prompts_writer = create_writer( | ||||
|         indexer.chunk_compression_type, | ||||
|         indexer.chunk_compression_level, | ||||
|         tempfile::tempfile()?, | ||||
|     ); | ||||
|     let mut extractors = Vec::new(); | ||||
|     for (embedder_name, (embedder, prompt)) in | ||||
|         settings_diff.new.embedding_configs.clone().into_iter() | ||||
|     { | ||||
|         // (docid, _index) -> KvWriterDelAdd -> Vector | ||||
|         let manual_vectors_writer = create_writer( | ||||
|             indexer.chunk_compression_type, | ||||
|             indexer.chunk_compression_level, | ||||
|             tempfile::tempfile()?, | ||||
|         ); | ||||
|  | ||||
|     // (docid) -> () | ||||
|     let mut remove_vectors_writer = create_writer( | ||||
|         indexer.chunk_compression_type, | ||||
|         indexer.chunk_compression_level, | ||||
|         tempfile::tempfile()?, | ||||
|     ); | ||||
|         // (docid) -> (prompt) | ||||
|         let prompts_writer = create_writer( | ||||
|             indexer.chunk_compression_type, | ||||
|             indexer.chunk_compression_level, | ||||
|             tempfile::tempfile()?, | ||||
|         ); | ||||
|  | ||||
|         // (docid) -> () | ||||
|         let remove_vectors_writer = create_writer( | ||||
|             indexer.chunk_compression_type, | ||||
|             indexer.chunk_compression_level, | ||||
|             tempfile::tempfile()?, | ||||
|         ); | ||||
|  | ||||
|         extractors.push(EmbedderVectorExtractor { | ||||
|             embedder_name, | ||||
|             embedder, | ||||
|             prompt, | ||||
|             manual_vectors_writer, | ||||
|             prompts_writer, | ||||
|             remove_vectors_writer, | ||||
|         }); | ||||
|     } | ||||
|  | ||||
|     let mut key_buffer = Vec::new(); | ||||
|     let mut cursor = obkv_documents.into_cursor()?; | ||||
| @@ -114,152 +151,138 @@ pub fn extract_vector_points<R: io::Read + io::Seek>( | ||||
|         key_buffer.clear(); | ||||
|         key_buffer.extend_from_slice(docid_bytes); | ||||
|  | ||||
|         // since we only needs the primary key when we throw an error we create this getter to | ||||
|         // since we only need the primary key when we throw an error we create this getter to | ||||
|         // lazily get it when needed | ||||
|         let document_id = || -> Value { from_utf8(external_id_bytes).unwrap().into() }; | ||||
|  | ||||
|         // the vector field id may have changed | ||||
|         let old_vectors_fid = old_fields_ids_map.id("_vectors"); | ||||
|         // filter the old vector fid if the settings has been changed forcing reindexing. | ||||
|         let old_vectors_fid = old_vectors_fid.filter(|_| !settings_diff.reindex_vectors()); | ||||
|         let mut parsed_vectors = ParsedVectorsDiff::new(obkv, old_vectors_fid, new_vectors_fid) | ||||
|             .map_err(|error| error.to_crate_error(document_id().to_string()))?; | ||||
|  | ||||
|         let new_vectors_fid = new_fields_ids_map.id("_vectors"); | ||||
|         let vectors_field = { | ||||
|             let del = old_vectors_fid | ||||
|                 .and_then(|vectors_fid| obkv.get(vectors_fid)) | ||||
|                 .map(KvReaderDelAdd::new) | ||||
|                 .map(|obkv| to_vector_map(obkv, DelAdd::Deletion, &document_id)) | ||||
|                 .transpose()? | ||||
|                 .flatten(); | ||||
|             let add = new_vectors_fid | ||||
|                 .and_then(|vectors_fid| obkv.get(vectors_fid)) | ||||
|                 .map(KvReaderDelAdd::new) | ||||
|                 .map(|obkv| to_vector_map(obkv, DelAdd::Addition, &document_id)) | ||||
|                 .transpose()? | ||||
|                 .flatten(); | ||||
|             (del, add) | ||||
|         }; | ||||
|         for EmbedderVectorExtractor { | ||||
|             embedder_name, | ||||
|             embedder: _, | ||||
|             prompt, | ||||
|             manual_vectors_writer, | ||||
|             prompts_writer, | ||||
|             remove_vectors_writer, | ||||
|         } in extractors.iter_mut() | ||||
|         { | ||||
|             let delta = match parsed_vectors.remove(embedder_name) { | ||||
|                 (Some(old), Some(new)) => { | ||||
|                     // no autogeneration | ||||
|                     let del_vectors = old.into_array_of_vectors(); | ||||
|                     let add_vectors = new.into_array_of_vectors(); | ||||
|  | ||||
|         let (del_map, add_map) = vectors_field; | ||||
|  | ||||
|         let del_value = del_map.and_then(|mut map| map.remove(embedder_name)); | ||||
|         let add_value = add_map.and_then(|mut map| map.remove(embedder_name)); | ||||
|  | ||||
|         let delta = match (del_value, add_value) { | ||||
|             (Some(old), Some(new)) => { | ||||
|                 // no autogeneration | ||||
|                 let del_vectors = extract_vectors(old, document_id, embedder_name)?; | ||||
|                 let add_vectors = extract_vectors(new, document_id, embedder_name)?; | ||||
|  | ||||
|                 if add_vectors.len() > usize::from(u8::MAX) { | ||||
|                     return Err(crate::Error::UserError(crate::UserError::TooManyVectors( | ||||
|                         document_id().to_string(), | ||||
|                         add_vectors.len(), | ||||
|                     ))); | ||||
|                 } | ||||
|  | ||||
|                 VectorStateDelta::ManualDelta(del_vectors, add_vectors) | ||||
|             } | ||||
|             (Some(_old), None) => { | ||||
|                 // Do we keep this document? | ||||
|                 let document_is_kept = obkv | ||||
|                     .iter() | ||||
|                     .map(|(_, deladd)| KvReaderDelAdd::new(deladd)) | ||||
|                     .any(|deladd| deladd.get(DelAdd::Addition).is_some()); | ||||
|                 if document_is_kept { | ||||
|                     // becomes autogenerated | ||||
|                     VectorStateDelta::NowGenerated(prompt.render( | ||||
|                         obkv, | ||||
|                         DelAdd::Addition, | ||||
|                         new_fields_ids_map, | ||||
|                     )?) | ||||
|                 } else { | ||||
|                     VectorStateDelta::NowRemoved | ||||
|                 } | ||||
|             } | ||||
|             (None, Some(new)) => { | ||||
|                 // was possibly autogenerated, remove all vectors for that document | ||||
|                 let add_vectors = extract_vectors(new, document_id, embedder_name)?; | ||||
|                 if add_vectors.len() > usize::from(u8::MAX) { | ||||
|                     return Err(crate::Error::UserError(crate::UserError::TooManyVectors( | ||||
|                         document_id().to_string(), | ||||
|                         add_vectors.len(), | ||||
|                     ))); | ||||
|                 } | ||||
|  | ||||
|                 VectorStateDelta::WasGeneratedNowManual(add_vectors) | ||||
|             } | ||||
|             (None, None) => { | ||||
|                 // Do we keep this document? | ||||
|                 let document_is_kept = obkv | ||||
|                     .iter() | ||||
|                     .map(|(_, deladd)| KvReaderDelAdd::new(deladd)) | ||||
|                     .any(|deladd| deladd.get(DelAdd::Addition).is_some()); | ||||
|  | ||||
|                 if document_is_kept { | ||||
|                     // Don't give up if the old prompt was failing | ||||
|                     let old_prompt = Some(prompt) | ||||
|                         // TODO: this filter works because we erase the vec database when a embedding setting changes. | ||||
|                         // When vector pipeline will be optimized, this should be removed. | ||||
|                         .filter(|_| !settings_diff.reindex_vectors()) | ||||
|                         .map(|p| { | ||||
|                             p.render(obkv, DelAdd::Deletion, old_fields_ids_map).unwrap_or_default() | ||||
|                         }); | ||||
|                     let new_prompt = prompt.render(obkv, DelAdd::Addition, new_fields_ids_map)?; | ||||
|                     if old_prompt.as_ref() != Some(&new_prompt) { | ||||
|                         let old_prompt = old_prompt.unwrap_or_default(); | ||||
|                         tracing::trace!( | ||||
|                             "🚀 Changing prompt from\n{old_prompt}\n===to===\n{new_prompt}" | ||||
|                         ); | ||||
|                         VectorStateDelta::NowGenerated(new_prompt) | ||||
|                     } else { | ||||
|                         tracing::trace!("⏭️ Prompt unmodified, skipping"); | ||||
|                         VectorStateDelta::NoChange | ||||
|                     if add_vectors.len() > usize::from(u8::MAX) { | ||||
|                         return Err(crate::Error::UserError(crate::UserError::TooManyVectors( | ||||
|                             document_id().to_string(), | ||||
|                             add_vectors.len(), | ||||
|                         ))); | ||||
|                     } | ||||
|                 } else { | ||||
|                     VectorStateDelta::NowRemoved | ||||
|                 } | ||||
|             } | ||||
|         }; | ||||
|  | ||||
|         // and we finally push the unique vectors into the writer | ||||
|         push_vectors_diff( | ||||
|             &mut remove_vectors_writer, | ||||
|             &mut prompts_writer, | ||||
|             &mut manual_vectors_writer, | ||||
|             &mut key_buffer, | ||||
|             delta, | ||||
|             settings_diff, | ||||
|         )?; | ||||
|                     VectorStateDelta::ManualDelta(del_vectors, add_vectors) | ||||
|                 } | ||||
|                 (Some(_old), None) => { | ||||
|                     // Do we keep this document? | ||||
|                     let document_is_kept = obkv | ||||
|                         .iter() | ||||
|                         .map(|(_, deladd)| KvReaderDelAdd::new(deladd)) | ||||
|                         .any(|deladd| deladd.get(DelAdd::Addition).is_some()); | ||||
|                     if document_is_kept { | ||||
|                         // becomes autogenerated | ||||
|                         VectorStateDelta::NowGenerated(prompt.render( | ||||
|                             obkv, | ||||
|                             DelAdd::Addition, | ||||
|                             new_fields_ids_map, | ||||
|                         )?) | ||||
|                     } else { | ||||
|                         VectorStateDelta::NowRemoved | ||||
|                     } | ||||
|                 } | ||||
|                 (None, Some(new)) => { | ||||
|                     // was possibly autogenerated, remove all vectors for that document | ||||
|                     let add_vectors = new.into_array_of_vectors(); | ||||
|                     if add_vectors.len() > usize::from(u8::MAX) { | ||||
|                         return Err(crate::Error::UserError(crate::UserError::TooManyVectors( | ||||
|                             document_id().to_string(), | ||||
|                             add_vectors.len(), | ||||
|                         ))); | ||||
|                     } | ||||
|  | ||||
|                     VectorStateDelta::WasGeneratedNowManual(add_vectors) | ||||
|                 } | ||||
|                 (None, None) => { | ||||
|                     // Do we keep this document? | ||||
|                     let document_is_kept = obkv | ||||
|                         .iter() | ||||
|                         .map(|(_, deladd)| KvReaderDelAdd::new(deladd)) | ||||
|                         .any(|deladd| deladd.get(DelAdd::Addition).is_some()); | ||||
|  | ||||
|                     if document_is_kept { | ||||
|                         // Don't give up if the old prompt was failing | ||||
|                         let old_prompt = Some(&prompt) | ||||
|                             // TODO: this filter works because we erase the vec database when a embedding setting changes. | ||||
|                             // When vector pipeline will be optimized, this should be removed. | ||||
|                             .filter(|_| !settings_diff.reindex_vectors()) | ||||
|                             .map(|p| { | ||||
|                                 p.render(obkv, DelAdd::Deletion, old_fields_ids_map) | ||||
|                                     .unwrap_or_default() | ||||
|                             }); | ||||
|                         let new_prompt = | ||||
|                             prompt.render(obkv, DelAdd::Addition, new_fields_ids_map)?; | ||||
|                         if old_prompt.as_ref() != Some(&new_prompt) { | ||||
|                             let old_prompt = old_prompt.unwrap_or_default(); | ||||
|                             tracing::trace!( | ||||
|                                 "🚀 Changing prompt from\n{old_prompt}\n===to===\n{new_prompt}" | ||||
|                             ); | ||||
|                             VectorStateDelta::NowGenerated(new_prompt) | ||||
|                         } else { | ||||
|                             tracing::trace!("⏭️ Prompt unmodified, skipping"); | ||||
|                             VectorStateDelta::NoChange | ||||
|                         } | ||||
|                     } else { | ||||
|                         VectorStateDelta::NowRemoved | ||||
|                     } | ||||
|                 } | ||||
|             }; | ||||
|  | ||||
|             // and we finally push the unique vectors into the writer | ||||
|             push_vectors_diff( | ||||
|                 remove_vectors_writer, | ||||
|                 prompts_writer, | ||||
|                 manual_vectors_writer, | ||||
|                 &mut key_buffer, | ||||
|                 delta, | ||||
|                 reindex_vectors, | ||||
|             )?; | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     Ok(ExtractedVectorPoints { | ||||
|         // docid, _index -> KvWriterDelAdd -> Vector | ||||
|         manual_vectors: writer_into_reader(manual_vectors_writer)?, | ||||
|         // docid -> () | ||||
|         remove_vectors: writer_into_reader(remove_vectors_writer)?, | ||||
|         // docid -> prompt | ||||
|         prompts: writer_into_reader(prompts_writer)?, | ||||
|     }) | ||||
| } | ||||
|     let mut results = Vec::new(); | ||||
|  | ||||
| fn to_vector_map( | ||||
|     obkv: KvReaderDelAdd, | ||||
|     side: DelAdd, | ||||
|     document_id: &impl Fn() -> Value, | ||||
| ) -> Result<Option<serde_json::Map<String, Value>>> { | ||||
|     Ok(if let Some(value) = obkv.get(side) { | ||||
|         let Ok(value) = from_slice(value) else { | ||||
|             let value = from_slice(value).map_err(InternalError::SerdeJson)?; | ||||
|             return Err(crate::Error::UserError(UserError::InvalidVectorsMapType { | ||||
|                 document_id: document_id(), | ||||
|                 value, | ||||
|             })); | ||||
|         }; | ||||
|         Some(value) | ||||
|     } else { | ||||
|         None | ||||
|     }) | ||||
|     for EmbedderVectorExtractor { | ||||
|         embedder_name, | ||||
|         embedder, | ||||
|         prompt: _, | ||||
|         manual_vectors_writer, | ||||
|         prompts_writer, | ||||
|         remove_vectors_writer, | ||||
|     } in extractors | ||||
|     { | ||||
|         results.push(ExtractedVectorPoints { | ||||
|             // docid, _index -> KvWriterDelAdd -> Vector | ||||
|             manual_vectors: writer_into_reader(manual_vectors_writer)?, | ||||
|             // docid -> () | ||||
|             remove_vectors: writer_into_reader(remove_vectors_writer)?, | ||||
|             // docid -> prompt | ||||
|             prompts: writer_into_reader(prompts_writer)?, | ||||
|  | ||||
|             embedder, | ||||
|             embedder_name, | ||||
|         }) | ||||
|     } | ||||
|  | ||||
|     Ok(results) | ||||
| } | ||||
|  | ||||
| /// Computes the diff between both Del and Add numbers and | ||||
| @@ -270,14 +293,14 @@ fn push_vectors_diff( | ||||
|     manual_vectors_writer: &mut Writer<BufWriter<File>>, | ||||
|     key_buffer: &mut Vec<u8>, | ||||
|     delta: VectorStateDelta, | ||||
|     settings_diff: &InnerIndexSettingsDiff, | ||||
|     reindex_vectors: bool, | ||||
| ) -> Result<()> { | ||||
|     puffin::profile_function!(); | ||||
|     let (must_remove, prompt, (mut del_vectors, mut add_vectors)) = delta.into_values(); | ||||
|     if must_remove | ||||
|     // TODO: the below condition works because we erase the vec database when a embedding setting changes. | ||||
|     // When vector pipeline will be optimized, this should be removed. | ||||
|     && !settings_diff.reindex_vectors() | ||||
|     && !reindex_vectors | ||||
|     { | ||||
|         key_buffer.truncate(TRUNCATE_SIZE); | ||||
|         remove_vectors_writer.insert(&key_buffer, [])?; | ||||
| @@ -308,7 +331,7 @@ fn push_vectors_diff( | ||||
|             EitherOrBoth::Left(vector) => { | ||||
|                 // TODO: the below condition works because we erase the vec database when a embedding setting changes. | ||||
|                 // When vector pipeline will be optimized, this should be removed. | ||||
|                 if !settings_diff.reindex_vectors() { | ||||
|                 if !reindex_vectors { | ||||
|                     // We insert only the Del part of the Obkv to inform | ||||
|                     // that we only want to remove all those vectors. | ||||
|                     let mut obkv = KvWriterDelAdd::memory(); | ||||
| @@ -336,26 +359,6 @@ fn compare_vectors(a: &[f32], b: &[f32]) -> Ordering { | ||||
|     a.iter().copied().map(OrderedFloat).cmp(b.iter().copied().map(OrderedFloat)) | ||||
| } | ||||
|  | ||||
| /// Extracts the vectors from a JSON value. | ||||
| fn extract_vectors( | ||||
|     value: Value, | ||||
|     document_id: impl Fn() -> Value, | ||||
|     name: &str, | ||||
| ) -> Result<Vec<Vec<f32>>> { | ||||
|     // FIXME: ugly clone of the vectors here | ||||
|     match serde_json::from_value(value.clone()) { | ||||
|         Ok(vectors) => { | ||||
|             Ok(VectorOrArrayOfVectors::into_array_of_vectors(vectors).unwrap_or_default()) | ||||
|         } | ||||
|         Err(_) => Err(UserError::InvalidVectorsType { | ||||
|             document_id: document_id(), | ||||
|             value, | ||||
|             subfield: name.to_owned(), | ||||
|         } | ||||
|         .into()), | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[tracing::instrument(level = "trace", skip_all, target = "indexing::extract")] | ||||
| pub fn extract_embeddings<R: io::Read + io::Seek>( | ||||
|     // docid, prompt | ||||
|   | ||||
| @@ -226,27 +226,31 @@ fn send_original_documents_data( | ||||
|     let original_documents_chunk = | ||||
|         original_documents_chunk.and_then(|c| unsafe { as_cloneable_grenad(&c) })?; | ||||
|  | ||||
|     let documents_chunk_cloned = original_documents_chunk.clone(); | ||||
|     let lmdb_writer_sx_cloned = lmdb_writer_sx.clone(); | ||||
|  | ||||
|     let request_threads = ThreadPoolNoAbortBuilder::new() | ||||
|         .num_threads(crate::vector::REQUEST_PARALLELISM) | ||||
|         .thread_name(|index| format!("embedding-request-{index}")) | ||||
|         .build()?; | ||||
|  | ||||
|     if settings_diff.reindex_vectors() || !settings_diff.settings_update_only() { | ||||
|     let index_vectors = (settings_diff.reindex_vectors() || !settings_diff.settings_update_only()) | ||||
|         // no point in indexing vectors without embedders | ||||
|         && (!settings_diff.new.embedding_configs.inner_as_ref().is_empty()); | ||||
|  | ||||
|     if index_vectors { | ||||
|         let settings_diff = settings_diff.clone(); | ||||
|  | ||||
|         let original_documents_chunk = original_documents_chunk.clone(); | ||||
|         let lmdb_writer_sx = lmdb_writer_sx.clone(); | ||||
|         rayon::spawn(move || { | ||||
|             for (name, (embedder, prompt)) in settings_diff.new.embedding_configs.clone() { | ||||
|                 let result = extract_vector_points( | ||||
|                     documents_chunk_cloned.clone(), | ||||
|                     indexer, | ||||
|                     &settings_diff, | ||||
|                     &prompt, | ||||
|                     &name, | ||||
|                 ); | ||||
|                 match result { | ||||
|                     Ok(ExtractedVectorPoints { manual_vectors, remove_vectors, prompts }) => { | ||||
|             match extract_vector_points(original_documents_chunk.clone(), indexer, &settings_diff) { | ||||
|                 Ok(extracted_vectors) => { | ||||
|                     for ExtractedVectorPoints { | ||||
|                         manual_vectors, | ||||
|                         remove_vectors, | ||||
|                         prompts, | ||||
|                         embedder_name, | ||||
|                         embedder, | ||||
|                     } in extracted_vectors | ||||
|                     { | ||||
|                         let embeddings = match extract_embeddings( | ||||
|                             prompts, | ||||
|                             indexer, | ||||
| @@ -255,28 +259,26 @@ fn send_original_documents_data( | ||||
|                         ) { | ||||
|                             Ok(results) => Some(results), | ||||
|                             Err(error) => { | ||||
|                                 let _ = lmdb_writer_sx_cloned.send(Err(error)); | ||||
|                                 let _ = lmdb_writer_sx.send(Err(error)); | ||||
|                                 None | ||||
|                             } | ||||
|                         }; | ||||
|  | ||||
|                         if !(remove_vectors.is_empty() | ||||
|                             && manual_vectors.is_empty() | ||||
|                             && embeddings.as_ref().map_or(true, |e| e.is_empty())) | ||||
|                         { | ||||
|                             let _ = lmdb_writer_sx_cloned.send(Ok(TypedChunk::VectorPoints { | ||||
|                             let _ = lmdb_writer_sx.send(Ok(TypedChunk::VectorPoints { | ||||
|                                 remove_vectors, | ||||
|                                 embeddings, | ||||
|                                 expected_dimension: embedder.dimensions(), | ||||
|                                 manual_vectors, | ||||
|                                 embedder_name: name, | ||||
|                                 embedder_name, | ||||
|                             })); | ||||
|                         } | ||||
|                     } | ||||
|  | ||||
|                     Err(error) => { | ||||
|                         let _ = lmdb_writer_sx_cloned.send(Err(error)); | ||||
|                     } | ||||
|                 } | ||||
|                 Err(error) => { | ||||
|                     let _ = lmdb_writer_sx.send(Err(error)); | ||||
|                 } | ||||
|             } | ||||
|         }); | ||||
|   | ||||
| @@ -1,4 +1,4 @@ | ||||
| use std::collections::HashMap; | ||||
| use std::collections::{BTreeSet, HashMap}; | ||||
| use std::convert::TryInto; | ||||
| use std::fs::File; | ||||
| use std::io::{self, BufReader}; | ||||
| @@ -193,6 +193,10 @@ pub(crate) fn write_typed_chunk_into_index( | ||||
|             let span = tracing::trace_span!(target: "indexing::write_db", "documents"); | ||||
|             let _entered = span.enter(); | ||||
|  | ||||
|             let fields_ids_map = index.fields_ids_map(wtxn)?; | ||||
|             let vectors_fid = | ||||
|                 fields_ids_map.id(crate::vector::parsed_vectors::RESERVED_VECTORS_FIELD_NAME); | ||||
|  | ||||
|             let mut builder = MergerBuilder::new(keep_latest_obkv as MergeFn); | ||||
|             for typed_chunk in typed_chunks { | ||||
|                 let TypedChunk::Documents(chunk) = typed_chunk else { | ||||
| @@ -206,6 +210,10 @@ pub(crate) fn write_typed_chunk_into_index( | ||||
|  | ||||
|             let mut docids = index.documents_ids(wtxn)?; | ||||
|             let mut iter = merger.into_stream_merger_iter()?; | ||||
|  | ||||
|             let embedders: BTreeSet<_> = | ||||
|                 index.embedding_configs(wtxn)?.into_iter().map(|(k, _v)| k).collect(); | ||||
|             let mut vectors_buffer = Vec::new(); | ||||
|             while let Some((key, reader)) = iter.next()? { | ||||
|                 let mut writer: KvWriter<_, FieldId> = KvWriter::memory(); | ||||
|                 let reader: KvReader<FieldId> = KvReader::new(reader); | ||||
| @@ -219,7 +227,35 @@ pub(crate) fn write_typed_chunk_into_index( | ||||
|                     let del_add_reader = KvReaderDelAdd::new(value); | ||||
|  | ||||
|                     if let Some(addition) = del_add_reader.get(DelAdd::Addition) { | ||||
|                         writer.insert(field_id, addition)?; | ||||
|                         let addition = if vectors_fid == Some(field_id) { | ||||
|                             'vectors: { | ||||
|                                 vectors_buffer.clear(); | ||||
|                                 let Ok(mut vectors) = | ||||
|                                     crate::vector::parsed_vectors::ParsedVectors::from_bytes( | ||||
|                                         addition, | ||||
|                                     ) | ||||
|                                 else { | ||||
|                                     // if the `_vectors` field cannot be parsed as map of vectors, just write it as-is | ||||
|                                     break 'vectors Some(addition); | ||||
|                                 }; | ||||
|                                 vectors.retain_user_provided_vectors(&embedders); | ||||
|                                 let crate::vector::parsed_vectors::ParsedVectors(vectors) = vectors; | ||||
|                                 if vectors.is_empty() { | ||||
|                                     // skip writing empty `_vectors` map | ||||
|                                     break 'vectors None; | ||||
|                                 } | ||||
|  | ||||
|                                 serde_json::to_writer(&mut vectors_buffer, &vectors) | ||||
|                                     .map_err(InternalError::SerdeJson)?; | ||||
|                                 Some(vectors_buffer.as_slice()) | ||||
|                             } | ||||
|                         } else { | ||||
|                             Some(addition) | ||||
|                         }; | ||||
|  | ||||
|                         if let Some(addition) = addition { | ||||
|                             writer.insert(field_id, addition)?; | ||||
|                         } | ||||
|                     } | ||||
|                 } | ||||
|  | ||||
|   | ||||
| @@ -13,6 +13,7 @@ pub mod error; | ||||
| pub mod hf; | ||||
| pub mod manual; | ||||
| pub mod openai; | ||||
| pub mod parsed_vectors; | ||||
| pub mod settings; | ||||
|  | ||||
| pub mod ollama; | ||||
| @@ -147,6 +148,10 @@ impl EmbeddingConfigs { | ||||
|         self.get(self.get_default_embedder_name()) | ||||
|     } | ||||
|  | ||||
|     pub fn inner_as_ref(&self) -> &HashMap<String, (Arc<Embedder>, Arc<Prompt>)> { | ||||
|         &self.0 | ||||
|     } | ||||
|  | ||||
|     /// Get the name of the default embedder configuration. | ||||
|     /// | ||||
|     /// The default embedder is determined as follows: | ||||
|   | ||||
							
								
								
									
										207
									
								
								milli/src/vector/parsed_vectors.rs
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										207
									
								
								milli/src/vector/parsed_vectors.rs
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,207 @@ | ||||
| use std::collections::{BTreeMap, BTreeSet}; | ||||
|  | ||||
| use obkv::KvReader; | ||||
| use serde_json::{from_slice, Value}; | ||||
|  | ||||
| use super::Embedding; | ||||
| use crate::update::del_add::{DelAdd, KvReaderDelAdd}; | ||||
| use crate::{FieldId, InternalError, UserError}; | ||||
|  | ||||
| pub const RESERVED_VECTORS_FIELD_NAME: &str = "_vectors"; | ||||
|  | ||||
| #[derive(serde::Serialize, serde::Deserialize, Debug)] | ||||
| #[serde(untagged)] | ||||
| pub enum Vectors { | ||||
|     ImplicitlyUserProvided(VectorOrArrayOfVectors), | ||||
|     Explicit(ExplicitVectors), | ||||
| } | ||||
|  | ||||
| impl Vectors { | ||||
|     pub fn into_array_of_vectors(self) -> Vec<Embedding> { | ||||
|         match self { | ||||
|             Vectors::ImplicitlyUserProvided(embeddings) | ||||
|             | Vectors::Explicit(ExplicitVectors { embeddings, user_provided: _ }) => { | ||||
|                 embeddings.into_array_of_vectors().unwrap_or_default() | ||||
|             } | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[derive(serde::Serialize, serde::Deserialize, Debug)] | ||||
| #[serde(rename_all = "camelCase")] | ||||
| pub struct ExplicitVectors { | ||||
|     pub embeddings: VectorOrArrayOfVectors, | ||||
|     pub user_provided: bool, | ||||
| } | ||||
|  | ||||
| pub struct ParsedVectorsDiff { | ||||
|     pub old: Option<BTreeMap<String, Vectors>>, | ||||
|     pub new: Option<BTreeMap<String, Vectors>>, | ||||
| } | ||||
|  | ||||
| impl ParsedVectorsDiff { | ||||
|     pub fn new( | ||||
|         documents_diff: KvReader<'_, FieldId>, | ||||
|         old_vectors_fid: Option<FieldId>, | ||||
|         new_vectors_fid: Option<FieldId>, | ||||
|     ) -> Result<Self, Error> { | ||||
|         let old = match old_vectors_fid | ||||
|             .and_then(|vectors_fid| documents_diff.get(vectors_fid)) | ||||
|             .map(KvReaderDelAdd::new) | ||||
|             .map(|obkv| to_vector_map(obkv, DelAdd::Deletion)) | ||||
|             .transpose() | ||||
|         { | ||||
|             Ok(del) => del, | ||||
|             // ignore wrong shape for old version of documents, use an empty map in this case | ||||
|             Err(Error::InvalidMap(value)) => { | ||||
|                 tracing::warn!(%value, "Previous version of the `_vectors` field had a wrong shape"); | ||||
|                 Default::default() | ||||
|             } | ||||
|             Err(error) => { | ||||
|                 return Err(error); | ||||
|             } | ||||
|         } | ||||
|         .flatten(); | ||||
|         let new = new_vectors_fid | ||||
|             .and_then(|vectors_fid| documents_diff.get(vectors_fid)) | ||||
|             .map(KvReaderDelAdd::new) | ||||
|             .map(|obkv| to_vector_map(obkv, DelAdd::Addition)) | ||||
|             .transpose()? | ||||
|             .flatten(); | ||||
|         Ok(Self { old, new }) | ||||
|     } | ||||
|  | ||||
|     pub fn remove(&mut self, embedder_name: &str) -> (Option<Vectors>, Option<Vectors>) { | ||||
|         let old = self.old.as_mut().and_then(|old| old.remove(embedder_name)); | ||||
|         let new = self.new.as_mut().and_then(|new| new.remove(embedder_name)); | ||||
|         (old, new) | ||||
|     } | ||||
| } | ||||
|  | ||||
| pub struct ParsedVectors(pub BTreeMap<String, Vectors>); | ||||
|  | ||||
| impl ParsedVectors { | ||||
|     pub fn from_bytes(value: &[u8]) -> Result<Self, Error> { | ||||
|         let Ok(value) = from_slice(value) else { | ||||
|             let value = from_slice(value).map_err(Error::InternalSerdeJson)?; | ||||
|             return Err(Error::InvalidMap(value)); | ||||
|         }; | ||||
|         Ok(ParsedVectors(value)) | ||||
|     } | ||||
|  | ||||
|     pub fn retain_user_provided_vectors(&mut self, embedders: &BTreeSet<String>) { | ||||
|         self.0.retain(|k, v| match v { | ||||
|             Vectors::ImplicitlyUserProvided(_) => true, | ||||
|             Vectors::Explicit(ExplicitVectors { embeddings: _, user_provided }) => { | ||||
|                 *user_provided | ||||
|                 // if the embedder is not in the config, then never touch it | ||||
|                 || !embedders.contains(k) | ||||
|             } | ||||
|         }); | ||||
|     } | ||||
| } | ||||
|  | ||||
| pub enum Error { | ||||
|     InvalidMap(Value), | ||||
|     InternalSerdeJson(serde_json::Error), | ||||
| } | ||||
|  | ||||
| impl Error { | ||||
|     pub fn to_crate_error(self, document_id: String) -> crate::Error { | ||||
|         match self { | ||||
|             Error::InvalidMap(value) => { | ||||
|                 crate::Error::UserError(UserError::InvalidVectorsMapType { document_id, value }) | ||||
|             } | ||||
|             Error::InternalSerdeJson(error) => { | ||||
|                 crate::Error::InternalError(InternalError::SerdeJson(error)) | ||||
|             } | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| fn to_vector_map( | ||||
|     obkv: KvReaderDelAdd, | ||||
|     side: DelAdd, | ||||
| ) -> Result<Option<BTreeMap<String, Vectors>>, Error> { | ||||
|     Ok(if let Some(value) = obkv.get(side) { | ||||
|         let ParsedVectors(parsed_vectors) = ParsedVectors::from_bytes(value)?; | ||||
|         Some(parsed_vectors) | ||||
|     } else { | ||||
|         None | ||||
|     }) | ||||
| } | ||||
|  | ||||
| /// Represents either a vector or an array of multiple vectors. | ||||
| #[derive(serde::Serialize, serde::Deserialize, Debug)] | ||||
| #[serde(transparent)] | ||||
| pub struct VectorOrArrayOfVectors { | ||||
|     #[serde(with = "either::serde_untagged_optional")] | ||||
|     inner: Option<either::Either<Vec<Embedding>, Embedding>>, | ||||
| } | ||||
|  | ||||
| impl VectorOrArrayOfVectors { | ||||
|     pub fn into_array_of_vectors(self) -> Option<Vec<Embedding>> { | ||||
|         match self.inner? { | ||||
|             either::Either::Left(vectors) => Some(vectors), | ||||
|             either::Either::Right(vector) => Some(vec![vector]), | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     pub fn from_array_of_vectors(array_of_vec: Vec<Embedding>) -> Self { | ||||
|         Self { inner: Some(either::Either::Left(array_of_vec)) } | ||||
|     } | ||||
| } | ||||
|  | ||||
| #[cfg(test)] | ||||
| mod test { | ||||
|     use super::VectorOrArrayOfVectors; | ||||
|  | ||||
|     #[test] | ||||
|     fn array_of_vectors() { | ||||
|         let null: VectorOrArrayOfVectors = serde_json::from_str("null").unwrap(); | ||||
|         let empty: VectorOrArrayOfVectors = serde_json::from_str("[]").unwrap(); | ||||
|         let one: VectorOrArrayOfVectors = serde_json::from_str("[0.1]").unwrap(); | ||||
|         let two: VectorOrArrayOfVectors = serde_json::from_str("[0.1, 0.2]").unwrap(); | ||||
|         let one_vec: VectorOrArrayOfVectors = serde_json::from_str("[[0.1, 0.2]]").unwrap(); | ||||
|         let two_vecs: VectorOrArrayOfVectors = | ||||
|             serde_json::from_str("[[0.1, 0.2], [0.3, 0.4]]").unwrap(); | ||||
|  | ||||
|         insta::assert_json_snapshot!(null.into_array_of_vectors(), @"null"); | ||||
|         insta::assert_json_snapshot!(empty.into_array_of_vectors(), @"[]"); | ||||
|         insta::assert_json_snapshot!(one.into_array_of_vectors(), @r###" | ||||
|         [ | ||||
|           [ | ||||
|             0.1 | ||||
|           ] | ||||
|         ] | ||||
|         "###); | ||||
|         insta::assert_json_snapshot!(two.into_array_of_vectors(), @r###" | ||||
|         [ | ||||
|           [ | ||||
|             0.1, | ||||
|             0.2 | ||||
|           ] | ||||
|         ] | ||||
|         "###); | ||||
|         insta::assert_json_snapshot!(one_vec.into_array_of_vectors(), @r###" | ||||
|         [ | ||||
|           [ | ||||
|             0.1, | ||||
|             0.2 | ||||
|           ] | ||||
|         ] | ||||
|         "###); | ||||
|         insta::assert_json_snapshot!(two_vecs.into_array_of_vectors(), @r###" | ||||
|         [ | ||||
|           [ | ||||
|             0.1, | ||||
|             0.2 | ||||
|           ], | ||||
|           [ | ||||
|             0.3, | ||||
|             0.4 | ||||
|           ] | ||||
|         ] | ||||
|         "###); | ||||
|     } | ||||
| } | ||||
		Reference in New Issue
	
	Block a user