Spaces:

AdnanElAssadi
/

MTEB-Human-Eval-Demo

Sleeping

App Files Files Community

AdnanElAssadi committed on Apr 6

Commit

bc57cf2

verified ·

1 Parent(s): 7307de0

Update app.py

Browse files

Files changed (1) hide show

app.py +20 -14

app.py CHANGED Viewed

@@ -10,24 +10,27 @@ def create_reranking_interface(task_data):
     completed_samples = {s["id"]: False for s in samples}
     def save_ranking(rankings, sample_id):
-        """Save the current set of rankings."""
         try:
             # Check if all documents have rankings
             all_ranked = all(r is not None and r != "" for r in rankings)
             if not all_ranked:
                 return "⚠️ Please assign a rank to all documents before submitting", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
-            # Convert rankings to integers with better error handling
             try:
                 processed_rankings = [int(r) for r in rankings]
-            except ValueError:
                 return "⚠️ Invalid ranking value. Please use only numbers.", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
             # Check for duplicate rankings
             if len(set(processed_rankings)) != len(processed_rankings):
                 return "⚠️ Each document must have a unique rank. Please review your rankings.", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
-            # Store this annotation in memory
             existing_idx = next((i for i, a in enumerate(results["annotations"]) if a["sample_id"] == sample_id), None)
             if existing_idx is not None:
                 results["annotations"][existing_idx] = {
@@ -40,20 +43,23 @@ def create_reranking_interface(task_data):
                     "rankings": processed_rankings
                 })
             completed_samples[sample_id] = True
-            # Try to save to file, but continue even if it fails
-            try:
-                output_path = f"{task_data['task_name']}_human_results.json"
-                with open(output_path, "w") as f:
-                    json.dump(results, f, indent=2)
-                return f"✅ Rankings saved successfully (in memory and to file)", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
-            except:
-                # If file saving fails, still mark as success since we saved in memory
-                return f"✅ Rankings saved in memory (file save failed)", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
         except Exception as e:
-            # Return specific error message
             return f"Error: {str(e)}", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
     with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown(f"# {task_data['task_name']} - Human Reranking Evaluation")

     completed_samples = {s["id"]: False for s in samples}
     def save_ranking(rankings, sample_id):
+        print("DEBUG: Rankings received:", rankings)
+        print("DEBUG: sample_id received:", sample_id, type(sample_id))
         try:
             # Check if all documents have rankings
             all_ranked = all(r is not None and r != "" for r in rankings)
             if not all_ranked:
                 return "⚠️ Please assign a rank to all documents before submitting", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
+            # Convert rankings to integers
             try:
                 processed_rankings = [int(r) for r in rankings]
+                print("DEBUG: Processed rankings:", processed_rankings)
+            except ValueError as ve:
+                print("DEBUG: ValueError in ranking conversion:", ve)
                 return "⚠️ Invalid ranking value. Please use only numbers.", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
             # Check for duplicate rankings
             if len(set(processed_rankings)) != len(processed_rankings):
                 return "⚠️ Each document must have a unique rank. Please review your rankings.", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
+            # Store annotation in memory
             existing_idx = next((i for i, a in enumerate(results["annotations"]) if a["sample_id"] == sample_id), None)
             if existing_idx is not None:
                 results["annotations"][existing_idx] = {
                     "rankings": processed_rankings
                 })
+            # Convert sample_id if necessary
+            if sample_id not in completed_samples:
+                try:
+                    sample_id = int(sample_id)
+                except:
+                    pass
+            print("DEBUG: Completed samples keys:", completed_samples.keys())
             completed_samples[sample_id] = True
+            output_path = f"{task_data['task_name']}_human_results.json"
+            with open(output_path, "w") as f:
+                json.dump(results, f, indent=2)
+            return "✅ Rankings saved successfully", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
         except Exception as e:
+            print("DEBUG: Exception occurred:", e)
             return f"Error: {str(e)}", f"Progress: {sum(completed_samples.values())}/{len(samples)}"
     with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown(f"# {task_data['task_name']} - Human Reranking Evaluation")