ksang commited on
Commit
448fd25
1 Parent(s): eef135d

Upload 3 files

Browse files
Files changed (3) hide show
  1. app.py +23 -15
  2. female.mp3 +0 -0
  3. male.mp3 +0 -0
app.py CHANGED
@@ -39,24 +39,32 @@ model.load_state_dict(checkpoint)
39
 
40
  # %%
41
  def predict(input):
42
- waveform, sr = librosa.load(input)
43
- waveform = torch.from_numpy(waveform).unsqueeze(0)
44
- waveform = torchaudio.transforms.Resample(sr, 16_000)(waveform)
45
- inputs = feature_extractor(waveform, sampling_rate=feature_extractor.sampling_rate,
46
- max_length=16000, truncation=True)
47
- tensor = torch.tensor(inputs['input_values'][0])
48
- with torch.no_grad():
49
- output = model(tensor)
50
- logits = output['logits'][0]
51
- label_id = torch.argmax(logits).item()
52
- label_name = id2label[str(label_id)]
53
-
54
- return label_name
 
 
 
 
 
55
  # %%
56
  demo = gr.Interface(
57
  fn=predict,
58
- inputs=gr.Audio(source="microphone", type="filepath", label="Speak to classify your voice!"), # record audio, save in temp file to feed to inference func
59
- outputs="text"
 
 
 
60
  )
61
 
62
  # %%
 
39
 
40
  # %%
41
def predict(input):
    """Classify the gender of the speaker in an audio file.

    Parameters
    ----------
    input : str | None
        Filepath of the recorded/uploaded audio clip. Gradio passes
        ``None`` when the user submits without recording/uploading.

    Returns
    -------
    str
        The predicted label name, or a human-readable error message
        when no valid file was supplied.
    """
    # Guard clauses instead of if/elif/else pyramid; `is None` per PEP 8.
    if input is None:
        return "Please input a valid file or record yourself by clicking the microphone"
    if not input:  # falsy but non-None (e.g. empty path string)
        return "File is not valid"

    # Decode the audio, then resample to the 16 kHz rate the feature
    # extractor expects (assumes the model was trained at 16 kHz — per
    # the max_length/sampling_rate values used below).
    waveform, sr = librosa.load(input)
    waveform = torch.from_numpy(waveform).unsqueeze(0)
    waveform = torchaudio.transforms.Resample(sr, 16_000)(waveform)

    inputs = feature_extractor(waveform, sampling_rate=feature_extractor.sampling_rate,
                               max_length=16000, truncation=True)
    tensor = torch.tensor(inputs['input_values'][0])

    # Inference only — skip autograd bookkeeping.
    with torch.no_grad():
        output = model(tensor)
    logits = output['logits'][0]
    label_id = torch.argmax(logits).item()
    # id2label is keyed by *string* ids, as seen from the str() cast here.
    label_name = id2label[str(label_id)]

    return label_name
60
  # %%
61
# Gradio UI: wires the microphone/file input to predict() and renders the
# returned label (or error message) as plain text.
demo = gr.Interface(
    fn=predict,
    title="Audio Gender Classification",
    description="Record your voice or upload an audio file to see what gender our model classifies it as",
    # Records audio, saves it to a temp file, and passes its filepath to
    # predict() (type="filepath").
    # NOTE(review): `source=` and `optional=` were removed in Gradio 4.x
    # (replaced by `sources=[...]`); confirm the pinned gradio version
    # still accepts these keyword arguments.
    inputs=gr.Audio(source="microphone", type="filepath", optional=False, label="Speak to classify your voice!"), # record audio, save in temp file to feed to inference func
    outputs="text",
    # Bundled sample clips (committed alongside app.py) shown as
    # clickable examples under the input widget.
    examples= [["male.mp3"], ["female.mp3"]]
)
69
 
70
  # %%
female.mp3 ADDED
Binary file (61.7 kB). View file
 
male.mp3 ADDED
Binary file (18.7 kB). View file