Spaces:

KevinGeng
/

Laronix_Recording

Runtime error

App Files Files Community

KevinGeng committed on Nov 6, 2023

Commit

2b3114a

1 Parent(s): 5f636d7

add loose threshold/ remove speed limitation

Browse files

Files changed (5) hide show

.gitignore +2 -1
app.py +22 -6
config/Arthur.yaml +2 -5
local/check_data.py +15 -1
local/indicator_plot.py +97 -0

.gitignore CHANGED Viewed

@@ -540,4 +540,5 @@ user/
 .vscode
-!data/Patient_sil_trim_16k_normed_5_snr_40/*

 .vscode
+!data/Patient_sil_trim_16k_normed_5_snr_40/*
+downloads

app.py CHANGED Viewed

@@ -178,6 +178,13 @@ def calc_mos(_, audio_path, id, ref, pre_ppm, fig=None):
         truth_transform=transformation,
         hypothesis_transform=transformation,
     )
     # MOS
     batch = {
         "wav": out_wavs,
@@ -187,7 +194,12 @@ def calc_mos(_, audio_path, id, ref, pre_ppm, fig=None):
     with torch.no_grad():
         output = model(batch)
     predic_mos = output.mean(dim=1).squeeze().detach().numpy() * 2 + 3
     # Phonemes per minute (PPM)
     with torch.no_grad():
         logits = phoneme_model(out_wavs).logits
@@ -204,6 +216,10 @@ def calc_mos(_, audio_path, id, ref, pre_ppm, fig=None):
     fig_h = plot_UV(wav_vad.numpy().squeeze(), a_h, sr=sr)
     ppm = len(lst_phonemes) / (wav_vad.shape[-1] / sr) * 60
     error_msg = "!!! ERROR MESSAGE !!!\n"
     if audio_path == _ or audio_path == None:
         error_msg += "ERROR: Fail recording, Please start from the beginning again."
@@ -216,11 +232,11 @@ def calc_mos(_, audio_path, id, ref, pre_ppm, fig=None):
             ppm,
             error_msg,
         )
-    if ppm >= float(pre_ppm) + float(config["thre"]["maxppm"]):
-        error_msg += "ERROR: Please speak slower.\n"
-    elif ppm <= float(pre_ppm) - float(config["thre"]["minppm"]):
-        error_msg += "ERROR: Please speak faster.\n"
-    elif predic_mos <= float(config["thre"]["AUTOMOS"]):
         error_msg += "ERROR: Naturalness is too low, Please try again.\n"
     elif wer >= float(config["thre"]["WER"]):
         error_msg += "ERROR: Intelligibility is too low, Please try again\n"

         truth_transform=transformation,
         hypothesis_transform=transformation,
     )
+    # round to 1 decimal
+    wer = np.round(wer, 1)
+    # Convert WER to an Intelligibility score
+    INTELI_score = WER2INTELI(wer*100)
     # MOS
     batch = {
         "wav": out_wavs,
     with torch.no_grad():
         output = model(batch)
     predic_mos = output.mean(dim=1).squeeze().detach().numpy() * 2 + 3
+    # round to 1 decimal
+    predic_mos = np.round(predic_mos, 1)
+    # MOS to AVA MOS
+    AVA_MOS = nat2avaMOS(predic_mos)
     # Phonemes per minute (PPM)
     with torch.no_grad():
         logits = phoneme_model(out_wavs).logits
     fig_h = plot_UV(wav_vad.numpy().squeeze(), a_h, sr=sr)
     ppm = len(lst_phonemes) / (wav_vad.shape[-1] / sr) * 60
+    ppm = np.round(ppm, 1)
     error_msg = "!!! ERROR MESSAGE !!!\n"
     if audio_path == _ or audio_path == None:
         error_msg += "ERROR: Fail recording, Please start from the beginning again."
             ppm,
             error_msg,
         )
+    # if ppm >= float(pre_ppm) + float(config["thre"]["maxppm"]):
+    #     error_msg += "ERROR: Please speak slower.\n"
+    # elif ppm <= float(pre_ppm) - float(config["thre"]["minppm"]):
+    #     error_msg += "ERROR: Please speak faster.\n"
+    if predic_mos <= float(config["thre"]["AUTOMOS"]):
         error_msg += "ERROR: Naturalness is too low, Please try again.\n"
     elif wer >= float(config["thre"]["WER"]):
         error_msg += "ERROR: Intelligibility is too low, Please try again\n"

config/Arthur.yaml CHANGED Viewed

@@ -3,10 +3,7 @@ ref_txt: data/Arthur_the_rat.txt
 ref_feature: data/Patient_sil_trim_16k_normed_5_snr_40/Arthur_the_rat.csv
 ref_wavs: data/Patient_sil_trim_16k_normed_5_snr_40/Arthur_the_rat
 thre:
-  minppm: 300
-  maxppm: 300
   WER: 0.5
   AUTOMOS: 2.0
-auth:
-  username: Kath
-  password: Kath

 ref_feature: data/Patient_sil_trim_16k_normed_5_snr_40/Arthur_the_rat.csv
 ref_wavs: data/Patient_sil_trim_16k_normed_5_snr_40/Arthur_the_rat
 thre:
+  minppm: 0
+  maxppm: 1000
   WER: 0.5
   AUTOMOS: 2.0

local/check_data.py CHANGED Viewed

@@ -27,9 +27,23 @@ import io
 import sys
 file_id = sys.argv[1]
 # "1YjON2ObGM826KaaqF-sKM7CO0tAtzWGg"
 # Get the file's metadata
-file = service.files().get(fileId=file_id).execute()
 request = service.files().get_media(fileId=file_id)
 with open(file['name'], 'wb') as file_obj:

 import sys
 file_id = sys.argv[1]
+if file_id == "all":
+    results = service.files().list().execute()
+    files = results.get('files', [])
+    # download all files
+    for file in files:
+        request = service.files().get_media(fileId=file['id'])
+        with open("download/" + file['name'], 'wb') as file_obj:
+            downloader = MediaIoBaseDownload(file_obj, request)
+            done = False
+            while not done:
+                status, done = downloader.next_chunk()
+                print(f"Download {int(status.progress() * 100)}%.")
 # "1YjON2ObGM826KaaqF-sKM7CO0tAtzWGg"
 # Get the file's metadata
+else:
+    file = service.files().get(fileId=file_id).execute()
 request = service.files().get_media(fileId=file_id)
 with open(file['name'], 'wb') as file_obj:

local/indicator_plot.py ADDED Viewed

	@@ -0,0 +1,97 @@

+import plotly.graph_objects as go
+def Intelligibility_Plot(Int_Score, fair_thre=30, good_thre = 70, Upper=100, Lower=0):
+    '''
+    Int_Score: a float number between 0 and 100
+    Upper: the upper bound of the plot
+    Lower: the lower bound of the plot
+    '''
+    # Assert Nat_Score is a float number between 0 and 100
+    assert isinstance(Int_Score, float|int)
+    assert Int_Score >= Lower
+    assert Int_Score <= Upper
+    # Indicator plot with different colors, under fair_threshold the plot is red, then yellow, then green
+    # Design 1: Show bar in different colors refer to the threshold
+    color = "#75DA99"
+    if Int_Score <= fair_thre:
+        color = "#F2ADA0"
+    elif Int_Score <= good_thre:
+        color = "#e8ee89"
+    else:
+        color = "#75DA99"
+    fig = go.Figure(go.Indicator(
+        mode="number+gauge",
+        gauge={'shape': "bullet",
+               'axis':{'range': [Lower, Upper]},
+               'bgcolor': 'white',
+               'bar': {'color': color},
+               },
+        value=Int_Score,
+        domain = {'x': [0, 1], 'y': [0, 1]},
+        )
+    )
+    # # Design 2: Show all thresholds in the background
+    # fig = go.Figure(go.Indicator(
+    #     mode = "number+gauge",
+    #     gauge = {'shape': "bullet",
+    #              'axis': {'range': [Lower, Upper]},
+    #              'bgcolor': 'white',
+    #              'steps': [
+    #                 {'range': [Lower, fair_thre], 'color': "#F2ADA0"},
+    #                 {'range': [fair_thre, good_thre], 'color': "#e8ee89"},
+    #                 {'range': [good_thre, Upper], 'color': " #75DA99"}],
+    #             'bar': {'color': "grey"},
+    #             },
+    #         value = Int_Score,
+    #     domain = {'x': [0, 1], 'y': [0, 1]},
+    #     )
+    # )
+    fig.update_layout(height=300, width=1000)
+    return fig
+def Naturalness_Plot(Nat_Score, fair_thre=2, good_thre = 4, Upper=5, Lower=1.0):
+    '''
+    Int_Score: a float number between 0 and 100
+    Upper: the upper bound of the plot
+    Lower: the lower bound of the plot
+    '''
+    # Assert Nat_Score is a float number between 0 and 100
+    assert isinstance(Nat_Score, float|int)
+    assert Nat_Score >= Lower
+    assert Nat_Score <= Upper
+    # Indicator plot with different colors, under fair_threshold the plot is red, then yellow, then green
+    color = "#75DA99"
+    if Nat_Score <= fair_thre:
+        color = "#F2ADA0"
+    elif Nat_Score <= good_thre:
+        color = "#e8ee89"
+    else:
+        color = "#75DA99"
+    fig = go.Figure(go.Indicator(
+        mode="number+gauge",
+        gauge={'shape': "bullet",
+               'axis':{'range': [Lower, Upper]},
+               'bgcolor': 'white',
+               'bar': {'color': color},
+               },
+        value=Nat_Score,
+        domain = {'x': [0, 1], 'y': [0, 1]},
+        )
+    )
+    fig.update_layout(height=300, width=1000)
+    return fig
+# test case Intelligibility_Plot
+x = Intelligibility_Plot(10)
+x.show()
+x = Intelligibility_Plot(50)
+x.show()
+x = Intelligibility_Plot(90)
+x.show()