climatepolicyradar · kdutia · Dec 18, 2024 · Dec 18, 2024 · Dec 18, 2024 · Dec 18, 2024
@@ -1,5 +1,5 @@
 _MAJOR = "1"
-_MINOR = "11"
+_MINOR = "12"
 _PATCH = "0"
 _SUFFIX = ""
 

@@ -5,6 +5,15 @@ schema document_passage {
         stemming: none
     }
 
+    field language type string {
+        indexing: "en" | set_language
+    }
+
+    field text_block_bolding type string {
+        indexing: input text_block | summary | index
+        bolding: true
+    }
+
     document document_passage {
 
         field search_weights_ref type reference<search_weights> {
@@ -139,91 +148,57 @@ schema document_passage {
         summary concepts {}
     }
 
-    document-summary search_summary_with_tokens {
-        summary family_name {}
-        summary family_description {}
-        summary family_import_id {}
-        summary family_slug {}
-        summary family_category {}
-        summary family_publication_ts {}
-        summary family_geography {}
-        summary family_geographies {}
-        summary family_source {}
-        summary document_import_id {}
-        summary document_slug {}
-        summary document_languages {}
-        summary document_content_type {}
-        summary document_cdn_object {}
-        summary document_source_url {}
-        summary corpus_import_id {}
-        summary corpus_type_name {}
-        summary metadata {}
-        summary text_block {}
-        summary text_block_id {}
-        summary text_block_type {}
-        summary text_block_page {}
-        summary text_block_coords {}
-        summary concepts {}
+    document-summary search_summary_with_tokens inherits search_summary {
         summary text_block_tokens {
             source: text_block
             tokens
         }
     }
-
-    rank-profile exact inherits default {
-        function text_score() {
-            expression: attribute(passage_weight) * fieldMatch(text_block)
-        }
-        first-phase {
-            expression: text_score()
-        }
-        summary-features: text_score() fieldMatch(text_block)
-    }
 
     rank-profile exact_not_stemmed inherits default {
         function text_score() {
-            expression: attribute(passage_weight) * fieldMatch(text_block_not_stemmed)
+            expression: fieldMatch(text_block_not_stemmed)
         }
         first-phase {
-            expression: text_score()
+            expression: attribute(passage_weight) * text_score()
         }
-        summary-features: text_score() fieldMatch(text_block)
-    }
-
-    rank-profile hybrid_no_closeness inherits default {
-        function text_score() {
-            expression: attribute(passage_weight) * bm25(text_block)
-        }
-        first-phase {
-            expression: text_score()
-        }
-        summary-features: text_score() bm25(text_block)
+        summary-features: attribute(passage_weight) text_score()
     }
 
     rank-profile hybrid inherits default {
         inputs {
             query(query_embedding) tensor<float>(x[768])
+            query(passage_bm25_weight) double: 1.0
+            query(passage_closeness_weight) double: 1.0
         }
         function text_score() {
-            expression: attribute(passage_weight) * (bm25(text_block) + closeness(text_embedding))
+            expression: query(passage_bm25_weight) * bm25(text_block) + query(passage_closeness_weight) * closeness(text_embedding)
         }
         first-phase {
-            expression: text_score()
+            expression: attribute(passage_weight) * text_score()
         }
-        summary-features: text_score() bm25(text_block) closeness(text_embedding)
+        summary-features: text_score() bm25(text_block) closeness(text_embedding) attribute(passage_weight)
     }
 
-    rank-profile hybrid_custom_weight inherits default {
+    rank-profile hybrid_nativerank inherits default {
         inputs {
             query(query_embedding) tensor<float>(x[768])
-            query(bm25_weight) double
+            query(passage_nativerank_weight) double: 1.0
+            query(passage_closeness_weight) double: 1.0
         }
         function text_score() {
-            expression: attribute(passage_weight) * (query(bm25_weight) * bm25(text_block) + closeness(text_embedding))
+            expression: query(passage_nativerank_weight) * nativeRank(text_block) + query(passage_closeness_weight) * closeness(text_embedding)
         }
         first-phase {
-            expression: text_score()
+            expression: attribute(passage_weight) * text_score()
         }
-        summary-features: text_score() bm25(text_block) closeness(text_embedding)
+        summary-features: text_score() nativeRank(text_block) closeness(text_embedding) attribute(passage_weight)
     }
+
+    rank-profile hybrid_no_closeness inherits hybrid {
+        inputs {
+            query(passage_closeness_weight) double: 0.0
+        }
+    }
+
 }
@@ -10,6 +10,20 @@ schema family_document {
         stemming: none
     }
 
+    field family_name_bolding type string {
+        indexing: input family_name_index | summary | index
+        bolding: true
+    }
+
+    field family_description_bolding type string {
+        indexing: input family_description_index | summary | index
+        bolding: true
+    }
+
+    field language type string {
+        indexing: "en" | set_language
+    }
+
     document family_document {
 
         field search_weights_ref type reference<search_weights> {
@@ -168,95 +182,61 @@ schema family_document {
         fields: family_name_index, family_description_index
     }
 
-    rank-profile exact inherits default {
-        function name_score() {
-            expression: attribute(name_weight) * fieldMatch(family_name_index)
-        }
-        function description_score() {
-            expression: attribute(description_weight) * fieldMatch(family_description_index)
-        }
-        first-phase {
-            expression: name_score() + description_score()
-        }
-        summary-features: name_score() description_score()
-    }
-
     rank-profile exact_not_stemmed inherits default {
         function name_score() {
-            expression: attribute(name_weight) * fieldMatch(family_name_not_stemmed)
+            expression: fieldMatch(family_name_not_stemmed)
         }
         function description_score() {
-            expression: attribute(description_weight) * fieldMatch(family_description_not_stemmed)
+            expression: fieldMatch(family_description_not_stemmed)
         }
         first-phase {
-            expression: name_score() + description_score()
+            expression: attribute(name_weight) * name_score() + attribute(description_weight) * description_score()
         }
-        summary-features: name_score() description_score()
-    }
-
-    rank-profile hybrid_no_closeness inherits default {
-        function name_score() {
-            expression: attribute(name_weight) * bm25(family_name_index)
-        }
-        function description_score() {
-            expression: attribute(description_weight) * bm25(family_description_index)
-        }
-        first-phase {
-            expression: name_score() + description_score()
-        }
-        summary-features: name_score() description_score()
+        summary-features: name_score() description_score() attribute(name_weight) attribute(description_weight)
     }
 
     rank-profile hybrid inherits default {
         inputs {
             query(query_embedding) tensor<float>(x[768])
+            query(description_bm25_weight) double: 1.0
+            query(description_closeness_weight) double: 1.0
         }
         function name_score() {
-            expression: attribute(name_weight) * bm25(family_name_index)
+            expression: bm25(family_name_index)
         }
         function description_score() {
-            expression: attribute(description_weight) * (bm25(family_description_index) + closeness(family_description_embedding))
+            expression: query(description_bm25_weight) * bm25(family_description_index) + query(description_closeness_weight) * closeness(family_description_embedding)
         }
         first-phase {
-            expression: name_score() + description_score()
+            expression: (attribute(name_weight) * name_score()) + (attribute(description_weight) * description_score())
         }
-        summary-features: name_score() description_score()
+        summary-features: name_score() description_score() bm25(family_name_index) bm25(family_description_index) closeness(family_description_embedding)
     }
 
-    rank-profile hybrid_no_description_embedding inherits default {
+    rank-profile hybrid_nativerank inherits default {
         inputs {
             query(query_embedding) tensor<float>(x[768])
+            query(description_nativerank_weight) double: 1.0
+            query(description_closeness_weight) double: 1.0
         }
         function name_score() {
-            expression: attribute(name_weight) * bm25(family_name_index)
+            expression: nativeRank(family_name_index)
         }
         function description_score() {
-            expression: attribute(description_weight) * bm25(family_description_index)
+            expression: query(description_nativerank_weight) * nativeRank(family_description_index) + query(description_closeness_weight) * closeness(family_description_embedding)
         }
         first-phase {
-            expression: name_score() + description_score()
+            expression: (attribute(name_weight) * name_score()) + (attribute(description_weight) * description_score())
         }
-        summary-features: name_score() description_score()
+        summary-features: name_score() description_score() nativeRank(family_name_index) nativeRank(family_description_index) closeness(family_description_embedding)
     }
 
-    rank-profile hybrid_custom_weight inherits default {
+    rank-profile hybrid_no_closeness inherits hybrid {
         inputs {
-            query(query_embedding) tensor<float>(x[768])
-            query(bm25_weight) double
-        }
-        function name_score() {
-            expression: attribute(name_weight) * bm25(family_name_index)
-        }
-        function description_score() {
-            expression: attribute(description_weight) * bm25(family_description_index)
+            query(description_closeness_weight) double: 0.0
         }
-        first-phase {
-            expression: name_score() + description_score()
-        }
-        summary-features: name_score() description_score()
     }
-
-
+
     document-summary search_summary {
         summary family_name {}
         summary family_description {}
@@ -281,28 +261,7 @@ schema family_document {
         summary collection_summary {}
     }
 
-    document-summary search_summary_with_tokens {
-        summary family_name {}
-        summary family_description {}
-        summary family_import_id {}
-        summary family_slug {}
-        summary family_category {}
-        summary family_publication_ts {}
-        summary family_geography {}
-        summary family_geographies {}
-        summary family_source {}
-        summary document_import_id {}
-        summary document_title {}
-        summary document_slug {}
-        summary document_languages {}
-        summary document_content_type {}
-        summary document_cdn_object {}
-        summary document_source_url {}
-        summary metadata {}
-        summary corpus_import_id {}
-        summary corpus_type_name {}
-        summary collection_title {}
-        summary collection_summary {}
+    document-summary search_summary_with_tokens inherits search_summary {
         summary family_name_index {}
         summary family_name_index_tokens {
             source: family_name_index