feature: MMR takes 2x page size such that final results may differ

devflowinc · Dec 4, 2024 · d4e9e30 · d4e9e30
1 parent a82163c
commit d4e9e30
Show file tree

Hide file tree

Showing 5 changed files with 148 additions and 59 deletions.
diff --git a/frontends/chat/src/components/Layouts/MainLayout.tsx b/frontends/chat/src/components/Layouts/MainLayout.tsx
@@ -79,6 +79,8 @@ const MainLayout = (props: LayoutProps) => {
   >(null);
 
   const [useImages, setUseImages] = createSignal<boolean | null>(null);
+  const [useMmr, setUseMmr] = createSignal<boolean | null>(false);
+  const [mmrLambda, setMmrLambda] = createSignal<number | null>(0.5);
   const [useGroupSearch, setUseGroupSearch] = createSignal<boolean | null>(
     null,
   );
@@ -232,6 +234,12 @@ const MainLayout = (props: LayoutProps) => {
               use_images: useImages(),
             },
           },
+          sort_options: {
+            mmr: {
+              use_mmr: useMmr(),
+              mmr_lambda: mmrLambda(),
+            },
+          },
           no_result_message: noResultMessage(),
           use_group_search: useGroupSearch(),
           search_type: searchType(),
@@ -344,6 +352,13 @@ const MainLayout = (props: LayoutProps) => {
                         filters: getFiltersFromStorage(dataset.dataset.id),
                         concat_user_messages_query: concatUserMessagesQuery(),
                         page_size: pageSize(),
+                        sort_options: {
+                          mmr: {
+                            use_mmr: useMmr(),
+                            mmr_lambda: mmrLambda(),
+                          },
+                        },
+                        use_group_search: useGroupSearch(),
                         search_query:
                           searchQuery() != "" ? searchQuery() : undefined,
                         score_threshold: minScore(),
@@ -514,6 +529,33 @@ const MainLayout = (props: LayoutProps) => {
                       }}
                     />
                   </div>
+                  <div class="flex w-full items-center gap-x-2">
+                    <div class="flex items-center gap-x-2">
+                      <label for="concat_user_messages">Use MMR</label>
+                    </div>
+                    <input
+                      type="checkbox"
+                      id="concat_user_messages"
+                      class="h-4 w-4 rounded-md border border-neutral-300 bg-neutral-100 p-1 dark:border-neutral-900 dark:bg-neutral-800"
+                      checked={useMmr() ?? false}
+                      onChange={(e) => {
+                        setUseMmr(e.target.checked);
+                      }}
+                    />
+                  </div>
+                  <div class="flex w-full items-center gap-x-2">
+                    <label for="search_query">MMR Lambda:</label>
+                    <input
+                      type="text"
+                      id="search_query"
+                      class="w-12 rounded-md border border-neutral-300 bg-neutral-100 p-1 dark:border-neutral-900 dark:bg-neutral-700"
+                      step={"any"}
+                      value={mmrLambda() ?? ""}
+                      onChange={(e) => {
+                        setMmrLambda(parseFloat(e.target.value));
+                      }}
+                    />
+                  </div>
                   <div class="flex w-full items-center gap-x-2">
                     <label for="page_size">Page Size:</label>
                     <input

diff --git a/server/src/data/models.rs b/server/src/data/models.rs
@@ -6667,7 +6667,7 @@ pub struct SortOptions {
 }
 
 #[derive(Serialize, Deserialize, Debug, Clone, ToSchema, Default)]
-/// MMR Options lets you specify different methods to rerank the chunks in the result set. If not specified, this defaults to the score of the chunks.
+/// MMR Options lets you specify different methods to rerank the chunks in the result set using Maximal Marginal Relevance. If not specified, this defaults to the score of the chunks.
 pub struct MmrOptions {
     /// Set use_mmr to true to use the Maximal Marginal Relevance algorithm to rerank the results.
     pub use_mmr: bool,

diff --git a/server/src/handlers/message_handler.rs b/server/src/handlers/message_handler.rs
@@ -100,10 +100,10 @@ pub struct CreateMessageReqPayload {
     pub page_size: Option<u64>,
     /// Sort Options lets you specify different methods to rerank the chunks in the result set. If not specified, this defaults to the score of the chunks.
     pub sort_options: Option<SortOptions>,
-    /// Filters is a JSON object which can be used to filter chunks. This is useful for when you want to filter chunks by arbitrary metadata. Unlike with tag filtering, there is a performance hit for filtering on metadata.
-    pub filters: Option<ChunkFilter>,
     /// Set score_threshold to a float to filter out chunks with a score below the threshold. This threshold applies before weight and bias modifications. If not specified, this defaults to 0.0.
     pub score_threshold: Option<f32>,
+    /// Filters is a JSON object which can be used to filter chunks. This is useful for when you want to filter chunks by arbitrary metadata. Unlike with tag filtering, there is a performance hit for filtering on metadata.
+    pub filters: Option<ChunkFilter>,
     /// LLM options to use for the completion. If not specified, this defaults to the dataset's LLM options.
     pub llm_options: Option<LLMOptions>,
     /// Context options to use for the completion. If not specified, all options will default to false.

diff --git a/server/src/operators/qdrant_operator.rs b/server/src/operators/qdrant_operator.rs
@@ -873,7 +873,11 @@ pub async fn search_over_groups_qdrant_query(
 
             QueryPointGroups {
                 collection_name: qdrant_collection.to_string(),
-                limit: Some(query.limit * page),
+                limit: if use_mmr && query.limit < 20 {
+                    Some(query.limit * 2)
+                } else {
+                    Some(query.limit * page)
+                },
                 prefetch,
                 using: vector_name,
                 query: Some(qdrant_query),
@@ -1101,7 +1105,11 @@ pub async fn search_qdrant_query(
 
             QueryPoints {
                 collection_name: qdrant_collection.to_string(),
-                limit: Some(query.limit),
+                limit: if use_mmr && query.limit < 20 {
+                    Some(query.limit * 2)
+                } else {
+                    Some(query.limit * page)
+                },
                 offset: Some(offset),
                 prefetch,
                 using: vector_name,