Spaces:

tahirsher
/

ASR_Model_for_Transcription_into_Text

Sleeping

tahirsher committed on Mar 10

Commit

eda3536

verified ·

1 Parent(s): 2ff2cbe

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -83,10 +83,21 @@ if audio_file:
     # ================================
     # ✅ Preprocess Audio with Processor (Corrected)
     # ================================
     inputs = processor(adversarial_waveform.squeeze().numpy(), sampling_rate=16000, return_tensors="pt", padding=True)
-    # Ensure the input has batch dimension (even if it's one example)
-    input_features = inputs["input_features"].to("cuda" if torch.cuda.is_available() else "cpu")
     # ================================
     # ✅ Fast Transcription Processing with Conformer

     # ================================
     # ✅ Preprocess Audio with Processor (Corrected)
     # ================================
+    # Ensure the input has batch dimension (even if it's one example)
     inputs = processor(adversarial_waveform.squeeze().numpy(), sampling_rate=16000, return_tensors="pt", padding=True)
+    # Check the structure of the returned `inputs` to understand what it contains
+    st.write("Processor Output:", inputs)
+    # Extract the correct key (input_features or input_values depending on the model)
+    if "input_features" in inputs:
+        input_features = inputs["input_features"]
+    elif "input_values" in inputs:
+        input_features = inputs["input_values"]
+    else:
+        raise ValueError("❌ The processor output does not contain 'input_features' or 'input_values'.")
+    input_features = input_features.to("cuda" if torch.cuda.is_available() else "cpu")
     # ================================
     # ✅ Fast Transcription Processing with Conformer