Spaces:

satyamr196
/

ASR-FairBench-Server

Running

satyamr196 committed on May 14

Commit

25106b9

1 Parent(s): 547836e

small bug fix

Files changed (1) hide show

ASR_Server.py CHANGED Viewed

@@ -32,10 +32,10 @@ csv_result = f"test_with_{ASR_model.replace("/","_")}_WER.csv"
 df = pd.read_csv(csv_path)
 print(f"CSV Loaded with {len(df)} rows")
-# # Load dataset without decoding audio (required!)
-# dataset = load_dataset("satyamr196/asr_fairness_audio", split="train")
-# # dataset = dataset.with_format("python", decode_audio=False)
-# dataset = dataset.cast_column("audio", Audio(decode=False))
 def generateTranscript(ASR_model):
     import os
@@ -81,7 +81,7 @@ def generateTranscript(ASR_model):
     # dataset = dataset.with_format("python", decode_audio=False)
     dataset_map = {
         os.path.basename(sample["audio"]["path"]).lower(): sample
-        # for sample in dataset #uncomment this line to use the dataset
     }
     transcripts = []

 df = pd.read_csv(csv_path)
 print(f"CSV Loaded with {len(df)} rows")
+# Load dataset without decoding audio (required!)
+dataset = load_dataset("satyamr196/asr_fairness_audio", split="train")
+# dataset = dataset.with_format("python", decode_audio=False)
+dataset = dataset.cast_column("audio", Audio(decode=False))
 def generateTranscript(ASR_model):
     import os
     # dataset = dataset.with_format("python", decode_audio=False)
     dataset_map = {
         os.path.basename(sample["audio"]["path"]).lower(): sample
+        for sample in dataset #uncomment this line to use the dataset
     }
     transcripts = []