Spaces:

SiddharthAK
/

TextLSRDemo

Running

App Files Files Community

SiddharthAK committed 20 days ago

Commit

f384e43

verified ·

1 Parent(s): 3e832a4

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -15

app.py CHANGED Viewed

@@ -113,7 +113,7 @@ def get_splade_cocondenser_representation(text):
     sorted_representation = sorted(meaningful_tokens.items(), key=lambda item: item[1], reverse=True)
-    formatted_output = "SPLADE-cocondenser-distil Representation (Weighting and Expansion):\n"
     if not sorted_representation:
         formatted_output += "No significant terms found for this input.\n"
     else:
@@ -237,9 +237,9 @@ def get_splade_doc_representation(text):
 def predict_representation_explorer(model_choice, text):
     if model_choice == "SPLADE-cocondenser-distil (weighting and expansion)":
         return get_splade_cocondenser_representation(text)
-    elif model_choice == "SPLADE-v3-Lexical (weighting)":
         return get_splade_lexical_representation(text)
-    elif model_choice == "SPLADE-v3-Doc (binary)":
         return get_splade_doc_representation(text)
     else:
         return "Please select a model."
@@ -357,12 +357,12 @@ def format_sparse_vector_output(splade_vector, tokenizer, is_binary=False):
 # --- NEW/MODIFIED: Helper to get the correct vector function, tokenizer, and binary flag ---
 def get_model_assets(model_choice_str):
-    if model_choice_str == "SPLADE-cocondenser-distil (weighting and expansion)":
-        return get_splade_cocondenser_vector, tokenizer_splade, False, "SPLADE-cocondenser-distil (Weighting and Expansion)"
-    elif model_choice_str == "SPLADE-v3-Lexical (weighting)":
-        return get_splade_lexical_vector, tokenizer_splade_lexical, False, "SPLADE-v3-Lexical (Weighting)"
-    elif model_choice_str == "SPLADE-v3-Doc (binary)":
-        return get_splade_doc_vector, tokenizer_splade_doc, True, "SPLADE-v3-Doc (Binary)"
     else:
         return None, None, False, "Unknown Model"
@@ -418,7 +418,7 @@ with gr.Blocks(title="SPLADE Demos") as demo:
                             "Binary Encoder"
                         ],
                         label="Choose Sparse Encoder",
-                        value="SPLADE-cocondenser-distil (weighting and expansion)"
                     ),
                     gr.Textbox(
                         lines=5,
@@ -437,9 +437,9 @@ with gr.Blocks(title="SPLADE Demos") as demo:
             # Define the common model choices for cleaner code
             model_choices = [
-                "SPLADE-cocondenser-distil (weighting and expansion)",
-                "SPLADE-v3-Lexical (weighting)",
-                "SPLADE-v3-Doc (binary)"
             ]
             gr.Interface(
@@ -448,12 +448,12 @@ with gr.Blocks(title="SPLADE Demos") as demo:
                     gr.Radio(
                         model_choices,
                         label="Choose Query Encoding Model",
-                        value="SPLADE-cocondenser-distil (weighting and expansion)" # Default value
                     ),
                     gr.Radio(
                         model_choices,
                         label="Choose Document Encoding Model",
-                        value="SPLADE-cocondenser-distil (weighting and expansion)" # Default value
                     ),
                     gr.Textbox(
                         lines=3,

     sorted_representation = sorted(meaningful_tokens.items(), key=lambda item: item[1], reverse=True)
+    formatted_output = "MLM encoder (SPLADE-cocondenser-distil):\n"
     if not sorted_representation:
         formatted_output += "No significant terms found for this input.\n"
     else:
 def predict_representation_explorer(model_choice, text):
     """Dispatch an encoder label to the matching representation formatter.

     Args:
         model_choice: Encoder label chosen by the user. Presumably this is
             the value of the "Choose Sparse Encoder" radio -- confirm
             against the Interface wiring. Non-string values (e.g. ``None``)
             are treated as "nothing selected".
         text: Input text forwarded unchanged to the selected formatter.

     Returns:
         Whatever the selected ``get_splade_*_representation`` function
         returns, or the string "Please select a model." when the label is
         not recognised.
     """
     # Compare case-insensitively: the radio option visible in this file is
     # spelled "Binary Encoder", while the renamed label is "Binary encoder".
     if isinstance(model_choice, str):
         choice = model_choice.strip().casefold()
     else:
         choice = ""
     # The radio default was renamed to "MLM encoder (SPLADE-cocondenser-distil)";
     # the pre-rename label is still accepted so existing callers keep working.
     mlm_labels = (
         "mlm encoder (splade-cocondenser-distil)",
         "splade-cocondenser-distil (weighting and expansion)",
     )
     if choice in mlm_labels:
         return get_splade_cocondenser_representation(text)
     if choice == "mlp encoder (splade-v3-lexical)":
         return get_splade_lexical_representation(text)
     if choice == "binary encoder":
         return get_splade_doc_representation(text)
     return "Please select a model."
 # --- NEW/MODIFIED: Helper to get the correct vector function, tokenizer, and binary flag ---
 def get_model_assets(model_choice_str):
     """Look up the encoding assets that belong to a model label.

     Args:
         model_choice_str: One of the labels listed in ``model_choices``.

     Returns:
         A 4-tuple ``(vector_fn, tokenizer, is_binary, display_name)``.
         For an unrecognised label the tuple is
         ``(None, None, False, "Unknown Model")``.
     """
     mlm_label = "MLM encoder (SPLADE-cocondenser-distil)"
     mlp_label = "MLP encoder (SPLADE-v3-lexical)"
     binary_label = "Binary encoder"
     # Only the matching branch touches the module-level encoder/tokenizer
     # names, so an unknown label never dereferences them.
     if model_choice_str == mlm_label:
         assets = (get_splade_cocondenser_vector, tokenizer_splade, False, mlm_label)
     elif model_choice_str == mlp_label:
         assets = (get_splade_lexical_vector, tokenizer_splade_lexical, False, mlp_label)
     elif model_choice_str == binary_label:
         # The third element flags this encoder's output as binary.
         assets = (get_splade_doc_vector, tokenizer_splade_doc, True, binary_label)
     else:
         assets = (None, None, False, "Unknown Model")
     return assets
                             "Binary Encoder"
                         ],
                         label="Choose Sparse Encoder",
+                        value="MLM encoder (SPLADE-cocondenser-distil)"
                     ),
                     gr.Textbox(
                         lines=5,
             # Define the common model choices for cleaner code
             model_choices = [
+                "MLM encoder (SPLADE-cocondenser-distil)",
+                "MLP encoder (SPLADE-v3-lexical)",
+                "Binary encoder"
             ]
             gr.Interface(
                     gr.Radio(
                         model_choices,
                         label="Choose Query Encoding Model",
+                        value="MLM encoder (SPLADE-cocondenser-distil)" # Default value
                     ),
                     gr.Radio(
                         model_choices,
                         label="Choose Document Encoding Model",
+                        value="MLM encoder (SPLADE-cocondenser-distil)" # Default value
                     ),
                     gr.Textbox(
                         lines=3,