├── __init__.py ├── AR-SCR ├── __init__.py ├── __pycache__ │ └── ts_dataloader.cpython-36.pyc ├── source_target_pairing.py ├── ts_dataloader.py └── main.py ├── DM-SCR ├── __init__.py ├── source_target_pairing.py ├── ts_dataloader.py └── main.py ├── LT-SCR ├── __init__.py ├── source_target_pairing.py ├── ts_dataloader.py └── main.py ├── run_ar.sh ├── run_dm.sh ├── run_lt.sh ├── prepare_ar_data.py ├── prepare_dm_data.py ├── prepare_lt_data.py ├── illustration.png ├── weight └── pr_attRNN.h5 ├── is23-best-student-paper-candidates.png ├── .gitignore ├── Datasets ├── DM-SCR │ ├── make_data.py │ ├── test_full.csv │ └── train_full.csv ├── AR-SCR │ ├── make_data.py │ ├── dev_full.csv │ └── test_full.csv └── LT-SCR │ ├── make_data.py │ ├── dev_full.csv │ ├── test_full.csv │ ├── noise_full.csv │ └── train_limit20.csv ├── audioUtils.py ├── SpeechModels.py ├── SpeechGenerator.py ├── ts_model.py ├── README.md ├── similarity_mapping.py ├── funcs.py ├── repr-scr.yml ├── utils.py └── SpeechDownloader.py /__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /AR-SCR/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /DM-SCR/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /LT-SCR/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /run_ar.sh: -------------------------------------------------------------------------------- 1 | python AR-SCR/main.py 2 | -------------------------------------------------------------------------------- /run_dm.sh: 
-------------------------------------------------------------------------------- 1 | python DM-SCR/main.py 2 | -------------------------------------------------------------------------------- /run_lt.sh: -------------------------------------------------------------------------------- 1 | python LT-SCR/main.py 2 | -------------------------------------------------------------------------------- /prepare_ar_data.py: -------------------------------------------------------------------------------- 1 | cd Datasets/AR-SCR 2 | python make_data.py 3 | -------------------------------------------------------------------------------- /prepare_dm_data.py: -------------------------------------------------------------------------------- 1 | cd Datasets/DM-SCR 2 | python make_data.py 3 | -------------------------------------------------------------------------------- /prepare_lt_data.py: -------------------------------------------------------------------------------- 1 | cd Datasets/LT-SCR 2 | python make_data.py 3 | -------------------------------------------------------------------------------- /illustration.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dodohow1011/SpeechAdvReprogram/HEAD/illustration.png -------------------------------------------------------------------------------- /weight/pr_attRNN.h5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dodohow1011/SpeechAdvReprogram/HEAD/weight/pr_attRNN.h5 -------------------------------------------------------------------------------- /is23-best-student-paper-candidates.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dodohow1011/SpeechAdvReprogram/HEAD/is23-best-student-paper-candidates.png -------------------------------------------------------------------------------- /.gitignore: 
-------------------------------------------------------------------------------- 1 | AR-SCR/weight 2 | LT-SCR/weight 3 | DM-SCR/weight 4 | AR-SCR/__pycache__ 5 | LT-SCR/__pycache__ 6 | DM-SCR/__pycache__ 7 | __pycache__ 8 | -------------------------------------------------------------------------------- /AR-SCR/__pycache__/ts_dataloader.cpython-36.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dodohow1011/SpeechAdvReprogram/HEAD/AR-SCR/__pycache__/ts_dataloader.cpython-36.pyc -------------------------------------------------------------------------------- /AR-SCR/source_target_pairing.py: -------------------------------------------------------------------------------- 1 | import os 2 | import sys 3 | sys.path.append(os.getcwd()) 4 | 5 | import SpeechDownloader 6 | import SpeechGenerator 7 | from similarity_mapping import source_target_mapping 8 | from ts_dataloader import load_data 9 | 10 | 11 | if __name__ == "__main__": 12 | gscInfo, n_Categs = SpeechDownloader.PrepareGoogleSpeechCmd(version=2, task='35word') 13 | SourceGen = SpeechGenerator.SpeechGen(gscInfo['train']['files'], gscInfo['train']['labels'], shuffle=False) 14 | target_csv = 'Datasets/AR-SCR/train_full.csv' 15 | target_audios, target_labels = load_data(target_csv) 16 | source_target_mapping(SourceGen, target_audios, target_labels) 17 | 18 | 19 | -------------------------------------------------------------------------------- /DM-SCR/source_target_pairing.py: -------------------------------------------------------------------------------- 1 | import os 2 | import sys 3 | sys.path.append(os.getcwd()) 4 | 5 | import SpeechDownloader 6 | import SpeechGenerator 7 | from similarity_mapping import source_target_mapping 8 | from ts_dataloader import load_data 9 | 10 | 11 | if __name__ == "__main__": 12 | gscInfo, n_Categs = SpeechDownloader.PrepareGoogleSpeechCmd(version=2, task='35word') 13 | SourceGen = 
"""Pair Google Speech Commands source classes with the LT-SCR target classes.

Meant to be run as a script from the repository root: the current working
directory is appended to ``sys.path`` so the top-level helper modules
(``SpeechDownloader``, ``SpeechGenerator``, ``similarity_mapping``) resolve.
"""
import os
import sys
sys.path.append(os.getcwd())

import numpy as np

import SpeechDownloader
import SpeechGenerator
from similarity_mapping import source_target_mapping
from ts_dataloader import load_data

# Seed for the random crop offsets drawn while the target clips are loaded.
SEED = 1109


if __name__ == "__main__":
    gscInfo, n_Categs = SpeechDownloader.PrepareGoogleSpeechCmd(version=2, task='35word')
    SourceGen = SpeechGenerator.SpeechGen(gscInfo['train']['files'], gscInfo['train']['labels'], shuffle=False)
    target_csv = 'Datasets/LT-SCR/train_limit20.csv'
    # The LT-SCR loader draws crop offsets with ``rnd.choice(...)``, so it needs
    # a random-state object.  Passing the bare integer 1109 raised
    # AttributeError as soon as a clip longer than 16000 samples was met.
    # NOTE(review): presumably ``ts_dataloader`` resolves to
    # LT-SCR/ts_dataloader.py when this script is launched directly - confirm.
    target_audios, target_labels = load_data(target_csv, np.random.RandomState(SEED))
    source_target_mapping(SourceGen, target_audios, target_labels)
"""Build the DM-SCR train/test CSV file lists.

Walks the three speaker folders ``D_SPK1`` .. ``D_SPK3`` below ``data_dir``;
inside every visited directory three of the first ten ``.wav`` files are held
out for testing and the rest go to training.  The directory name is used as
the label.  Two tab-separated files, ``train_full.csv`` and ``test_full.csv``,
are written with the columns ``filename`` and ``label``.
"""
import os
import random

import pandas as pd

data_dir = "/work/dodohow1011/dysarthria_zh_command/"

SPEAKERS = (1, 2, 3)
# Three of the ten leading positions of every directory are held out.
POSITIONS_PER_DIR = 10
TEST_PER_DIR = 3
COLUMNS = ["filename", "label"]


def split_speaker_dir(spk_dir, rng=random):
    """Return ``(train_rows, test_rows)`` for one speaker directory tree.

    Args:
        spk_dir: root directory of one speaker.
        rng: object providing ``sample`` (the ``random`` module or a
            ``random.Random`` instance).

    Each row is ``[path, label]`` where ``label`` is the name of the
    directory that contains the file.
    """
    train_rows, test_rows = [], []
    for dirpath, dirnames, filenames in os.walk(spk_dir):
        dirnames.sort()  # fixed traversal order -> reproducible with a seed
        held_out = set(rng.sample(range(POSITIONS_PER_DIR), TEST_PER_DIR))
        label = os.path.basename(os.path.normpath(dirpath))
        # Filter BEFORE numbering: previously the positions were taken from
        # the unfiltered listing, so a stray non-wav file could silently use
        # up one of the three test slots.
        wavs = sorted(f for f in filenames if f.endswith(".wav"))
        for position, name in enumerate(wavs):
            row = [os.path.join(dirpath, name), label]
            if position in held_out:
                test_rows.append(row)
            else:
                train_rows.append(row)
    return train_rows, test_rows


def main(root=data_dir, out_dir=".", seed=None):
    """Collect all speakers below *root* and write both CSV files to *out_dir*.

    Args:
        root: dataset root containing the ``D_SPK<n>`` folders.
        out_dir: directory receiving ``train_full.csv`` / ``test_full.csv``.
        seed: optional seed making the split reproducible; ``None`` keeps the
            previous non-deterministic behaviour.

    Returns:
        ``(train_rows, test_rows)`` as written to disk.
    """
    rng = random.Random(seed)
    train_full, test_full = [], []
    for speaker in SPEAKERS:
        train_rows, test_rows = split_speaker_dir(
            os.path.join(root, "D_SPK{}".format(speaker)), rng)
        train_full.extend(train_rows)
        test_full.extend(test_rows)

    pd.DataFrame(train_full, columns=COLUMNS).to_csv(
        os.path.join(out_dir, "train_full.csv"), sep='\t', index=False)
    pd.DataFrame(test_full, columns=COLUMNS).to_csv(
        os.path.join(out_dir, "test_full.csv"), sep='\t', index=False)
    return train_full, test_full


if __name__ == "__main__":
    main()
"""Build the AR-SCR train/dev/test CSV file lists.

Every file in the ``commands`` and ``numbers`` folders below ``data_dir`` is
assigned at random: test with probability 0.2, otherwise dev with
probability 0.1, otherwise train.  The first character of the file name is
used as the label.  Three tab-separated files (``train_full.csv``,
``dev_full.csv``, ``test_full.csv``) with the columns ``filename`` and
``label`` are written.
"""
import os
import random

import pandas as pd

data_dir = "/work/dodohow1011/AR_SpeechCommands/"

TEST_FRACTION = 0.2
DEV_FRACTION = 0.1
SUBFOLDERS = ("commands", "numbers")
COLUMNS = ["filename", "label"]


def assign_split(rng):
    """Draw the split name (``"test"``, ``"dev"`` or ``"train"``) for one file."""
    if rng.random() <= TEST_FRACTION:
        return "test"
    # The dev draw only happens for files that were not sent to test.
    if rng.random() <= DEV_FRACTION:
        return "dev"
    return "train"


def split_directory(wav_dir, splits, rng):
    """Append a ``[path, label]`` row for every file in *wav_dir* to *splits*.

    *splits* maps split name to a list of rows and is modified in place.
    """
    # Sorted so that a fixed seed always yields the same assignment.
    for wav in sorted(os.listdir(wav_dir)):
        splits[assign_split(rng)].append([os.path.join(wav_dir, wav), wav[0]])


def main(root=data_dir, out_dir=".", seed=None):
    """Split both sub-folders of *root* and write the three CSV files.

    Args:
        root: dataset root containing ``commands`` and ``numbers``.
        out_dir: directory receiving the CSV files.
        seed: optional seed making the split reproducible; ``None`` keeps the
            previous non-deterministic behaviour.

    Returns:
        Dict mapping ``"train"`` / ``"dev"`` / ``"test"`` to the written rows.
    """
    rng = random.Random(seed)
    splits = {"train": [], "dev": [], "test": []}
    for sub in SUBFOLDERS:
        split_directory(os.path.join(root, sub), splits, rng)

    for name, rows in splits.items():
        pd.DataFrame(rows, columns=COLUMNS).to_csv(
            os.path.join(out_dir, name + "_full.csv"), sep='\t', index=False)
    return splits


if __name__ == "__main__":
    main()
"""
Utility functions for audio files
"""
import librosa
import os
from tqdm import tqdm
import numpy as np
import matplotlib.pyplot as plt
import itertools


def plot_confusion_matrix(cm, classes,
                          normalize=False,
                          title='Confusion matrix',
                          cmap=plt.cm.Blues):
    """
    Print a short banner and plot the confusion matrix to 'picConfMatrix.png'.

    cm        - square numpy array, rows = true label, columns = predicted
    classes   - tick labels, one per row/column of cm
    normalize - when True every row is divided by its sum
    title     - figure title
    cmap      - matplotlib colormap used for the cells
    """
    if normalize:
        row_sums = cm.sum(axis=1)[:, np.newaxis]
        # A class without any true sample has a zero row; dividing by 1
        # keeps that row at 0 instead of filling it with NaN.
        row_sums[row_sums == 0] = 1
        cm = cm.astype('float') / row_sums
        print("Normalized confusion matrix")
    else:
        print('Confusion matrix, without normalization')

    plt.figure(figsize=(15, 15))
    plt.imshow(cm, interpolation='nearest', cmap=cmap)
    plt.title(title, fontsize=30)
    plt.colorbar()
    tick_marks = np.arange(len(classes))
    plt.xticks(tick_marks, classes, rotation=45, fontsize=15)
    plt.yticks(tick_marks, classes, fontsize=15)

    fmt = '.3f' if normalize else 'd'
    # Cells darker than half the maximum get white text for contrast.
    thresh = cm.max() / 2.
    for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):
        plt.text(j, i, format(cm[i, j], fmt), size=11,
                 horizontalalignment="center",
                 color="white" if cm[i, j] > thresh else "black")

    plt.ylabel('True label', fontsize=30)
    plt.xlabel('Predicted label', fontsize=30)
    # Lay the figure out BEFORE saving; calling tight_layout() after
    # savefig() had no effect on the written file.
    plt.tight_layout()
    plt.savefig('picConfMatrix.png', dpi=400)


def WAV2Numpy(folder, sr=None):
    """
    Recursively converts WAV to numpy arrays.
    Deletes the WAV files in the process

    folder - folder to convert.
    sr     - target sampling rate handed to librosa.load; None (default)
             keeps each file's native rate.
    """
    wav_paths = []
    for root, dirs, files in os.walk(folder):
        wav_paths += [os.path.join(root, f) for f in files
                      if f.endswith('.wav')]

    for path in tqdm(wav_paths):
        # The sr argument used to be ignored (the load was hard-wired to
        # sr=None and the name was then overwritten by the returned rate).
        y, _ = librosa.load(path, sr=sr)

        # Saved next to the source as '<name>.wav.npy', then the WAV is removed.
        np.save(path + '.npy', y)
        os.remove(path)
"""Build the LT-SCR train/dev/test/noise CSV file lists.

Each sub-folder of ``data_dir`` is one spoken word.  Files are assigned to a
split by hashing their name (see ``which_set``); at most ``limit`` training
files are kept per folder.  Folders that are not in ``words`` are labelled
``"unknown"`` and the files of the background-noise folder are labelled
``"silence"``.  Four tab-separated CSV files with the columns ``filename``
and ``label`` are written.
"""
import os
import re
import random
import hashlib
import pandas as pd

limit = 20

data_dir = "/work/dodohow1011/lt_speech_commands/dataset"

MAX_NUM_WAVS_PER_CLASS = 2**27 - 1
words = 'ne,ačiū,stop,įjunk,išjunk,į_viršų,į_apačią,į_dešinę,į_kairę,startas,pauzė,labas,iki'
bg = '_background_noise_'

# Exact-match lookup.  Testing ``command in words`` directly is a substring
# search on the comma-joined string, so a folder such as "top" (inside "stop")
# was treated as a known word.
KNOWN_WORDS = frozenset(words.split(','))
COLUMNS = ["filename", "label"]


def which_set(fname, dev_percentage=10., test_percentage=10.):
    """
    Return "DEV", "TEST" or "TRAIN" for a file name, based on a stable hash.

    Everything from '_nohash_' onwards is ignored, so all files that share the
    part before it always land in the same split.

    See https://github.com/tensorflow/tensorflow/blob/master/tensorflow/examples/speech_commands/input_data.py#L70
    """
    hash_name = re.sub(r'_nohash_.*$', '', fname)
    hash_name_hashed = hashlib.sha1(hash_name.encode('UTF-8')).hexdigest()
    # Map the SHA-1 digest onto a value in [0, 100].
    percentage_hash = ((int(hash_name_hashed, 16) % (MAX_NUM_WAVS_PER_CLASS + 1))
                       * (100.0 / MAX_NUM_WAVS_PER_CLASS))
    if percentage_hash < dev_percentage:
        return "DEV"
    if percentage_hash < dev_percentage + test_percentage:
        return "TEST"
    return "TRAIN"


def label_for(command):
    """Return the folder name for known words, otherwise ``"unknown"``."""
    return command if command in KNOWN_WORDS else "unknown"


def collect_splits(root, train_limit):
    """Scan *root* and return ``(train, dev, test, noise)`` row lists.

    Each row is ``[path, label]``.  At most *train_limit* training files are
    kept per folder; dev and test are not limited.
    """
    train, dev, test, noise = [], [], [], []
    for command in os.listdir(root):
        command_dir = os.path.join(root, command)
        if not os.path.isdir(command_dir):
            continue  # stray files next to the word folders
        if command == bg:
            noise.extend([os.path.join(command_dir, wav), "silence"]
                         for wav in os.listdir(command_dir))
            continue

        label = label_for(command)
        kept_for_training = 0
        for wav in os.listdir(command_dir):
            row = [os.path.join(command_dir, wav), label]
            split = which_set(wav, 10., 10.)
            if split == "TEST":
                test.append(row)
            elif split == "DEV":
                dev.append(row)
            elif kept_for_training < train_limit:
                kept_for_training += 1
                train.append(row)
    return train, dev, test, noise


def main(root=data_dir, out_dir=".", train_limit=limit):
    """Write ``train_limit<N>.csv``, ``dev_full.csv``, ``test_full.csv`` and
    ``noise_full.csv`` for the dataset below *root* into *out_dir*."""
    train, dev, test, noise = collect_splits(root, train_limit)
    outputs = (
        ("train_limit{}.csv".format(train_limit), train),
        ("dev_full.csv", dev),
        ("test_full.csv", test),
        ("noise_full.csv", noise),
    )
    for name, rows in outputs:
        pd.DataFrame(rows, columns=COLUMNS).to_csv(
            os.path.join(out_dir, name), sep='\t', index=False)


if __name__ == '__main__':
    main()
"""Train and evaluate the reprogrammed speech-command model on DM-SCR.

Run from the repository root (the working directory is appended to
``sys.path`` so the top-level modules resolve).
"""
import os
import sys
sys.path.append(os.getcwd())

import argparse

import numpy as np
import tensorflow as tf
from tensorflow import keras
import tensorflow.keras.backend as K

from funcs import LR_Warmup
from ts_dataloader import load_data
from ts_model import AttRNN_Model, ARTLayer, WARTmodel, make_model

WEIGHT_DIR = 'DM-SCR/weight'


def main(args):
    """Train on the DM-SCR training list, evaluate on the test list.

    Args:
        args: namespace with ``mapping``, ``eps``, ``dropout``, ``lr`` and
            ``lr_decay`` (see the argument parser at the bottom of the file).

    Returns:
        The value of ``model.evaluate`` on the test set; element 0 is printed
        as the loss and element 1 as the accuracy.
    """
    train_csv = 'Datasets/DM-SCR/train_full.csv'
    test_csv = 'Datasets/DM-SCR/test_full.csv'

    x_train, y_train = load_data(train_csv)
    x_test, y_test = load_data(test_csv)

    # Map the raw labels onto 0..num_classes-1 (order given by np.unique).
    classes = np.unique(y_train)
    cls2label = {label: i for i, label in enumerate(classes.tolist())}
    num_classes = len(classes)

    y_train = [cls2label[y] for y in y_train]
    y_test = [cls2label[y] for y in y_test]
    y_train = keras.utils.to_categorical(y_train, num_classes=num_classes)
    y_test = keras.utils.to_categorical(y_test, num_classes=num_classes)

    print("--- X shape : ", x_train[0].shape, "--- Num of Classes : ", num_classes)  ## target class

    ## Pre-trained Model for Adv Program
    pr_model = AttRNN_Model()

    ## # of Source classes in Pre-trained Model
    source_classes = 36  ## Google Speech Commands

    target_shape = (x_train[0].shape[0], 1)

    ## Adv Program Time Series (ART)
    mapping_num = args.mapping
    # Explicit check instead of ``assert``: assertions are stripped under
    # ``python -O`` and the validation would silently disappear.
    if mapping_num * num_classes > source_classes:
        print("Error: The mapping num should be smaller than source_classes / num_classes: {}".format(source_classes//num_classes))
        sys.exit(1)

    model = WARTmodel(target_shape, pr_model, source_classes, mapping_num, num_classes, args.dropout)

    ## Loss
    # NOTE(review): the optimizer starts with its default learning rate;
    # presumably LR_Warmup overrides it from ``lr_base`` - confirm in funcs.py.
    adam = tf.keras.optimizers.Adam()
    model.compile(loss='categorical_crossentropy', optimizer=adam, metrics=['accuracy'])

    lr_scheduler = LR_Warmup(lr_base=args.lr, min_lr=0.001, decay=args.lr_decay, warmup_epochs=30)

    save_path = WEIGHT_DIR + "/" + str(args.lr) + "-" + str(args.lr_decay) + "-{epoch:02d}.h5"
    # The existence check used the misspelt path 'DN-SCR/weight', so it was
    # always true and makedirs raised FileExistsError on every run but the
    # first.  exist_ok makes the call idempotent.
    os.makedirs(WEIGHT_DIR, exist_ok=True)

    checkpoints = tf.keras.callbacks.ModelCheckpoint(save_path, save_weights_only=True)
    exp_callback = [lr_scheduler, checkpoints]

    model.summary()

    batch_size = 32
    epochs = args.eps
    model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, verbose=1, callbacks=exp_callback)

    score = model.evaluate(x_test, y_test, verbose=0)
    print('--- Test loss:', score[0])
    print('- Test accuracy:', score[1])

    return score


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument("--mapping", type=int, default=2, help="Number of multi-mapping")
    parser.add_argument("--eps", type=int, default=100, help="Epochs")
    parser.add_argument("--dropout", type=float, default=0.3, help="Dropout")
    parser.add_argument("--lr", type=float, default=0.008, help="Initial learning rate")
    parser.add_argument("--lr_decay", type=float, default=0.005, help="Learnig rate decay rate")
    args = parser.parse_args()

    main(args)
",kapre.__version__) 21 | 22 | def AttRNN_Model(): 23 | 24 | nCategs=36 25 | sr=16000 26 | #iLen=16000 27 | 28 | model = AttRNNSpeechModel(nCategs, samplingrate = sr, inputLength = None) 29 | model.compile(optimizer='adam', loss=['sparse_categorical_crossentropy'], metrics=['sparse_categorical_accuracy']) 30 | 31 | model.load_weights('weight/pr_attRNN.h5') 32 | 33 | return model 34 | 35 | 36 | # Adverserial Reprogramming layer 37 | class ARTLayer(Layer): 38 | def __init__(self, W_regularizer=0.05, **kwargs): 39 | self.init = initializers.GlorotUniform() 40 | self.W_regularizer = regularizers.l2(W_regularizer) 41 | super(ARTLayer, self).__init__(**kwargs) 42 | 43 | def build(self, input_shape): 44 | assert len(input_shape) == 3 45 | # Create a trainable weight variable for this layer. 46 | self.W = self.add_weight(name='kernel', 47 | shape=(16000,1), 48 | initializer=self.init,regularizer = self.W_regularizer, 49 | trainable=True) 50 | 51 | super(ARTLayer, self).build(input_shape) # Be sure to call this at the end 52 | 53 | def call(self, x, dropout=0.4, training=True): 54 | prog = Dropout(dropout)(self.W, training=training) # remove K.tanh 55 | out = x + prog 56 | return out 57 | 58 | def compute_output_shape(self, input_shape): 59 | return (input_shape[0],input_shape[1], input_shape[2]) 60 | 61 | 62 | # White Adversairal Reprogramming Time Series (WART) Model 63 | def WARTmodel(input_shape, pr_model, source_classes, mapping_num, target_classes, dropout=0.5): 64 | x = Input(shape=input_shape) 65 | out = ARTLayer()(x,dropout) 66 | out = Reshape([16000,])(out) 67 | probs = pr_model(out) 68 | 69 | map_probs = multi_mapping(probs, source_classes, mapping_num, target_classes) 70 | model = Model(inputs=x, outputs= map_probs) 71 | 72 | return model 73 | 74 | 75 | def make_model(input_shape, num_classes): 76 | input_layer = keras.layers.Input(input_shape) 77 | 78 | conv1 = keras.layers.Conv1D(filters=64, kernel_size=3, padding="same")(input_layer) 79 | conv1 = 
keras.layers.BatchNormalization()(conv1) 80 | conv1 = keras.layers.ReLU()(conv1) 81 | 82 | conv2 = keras.layers.Conv1D(filters=64, kernel_size=3, padding="same")(conv1) 83 | conv2 = keras.layers.BatchNormalization()(conv2) 84 | conv2 = keras.layers.ReLU()(conv2) 85 | 86 | conv3 = keras.layers.Conv1D(filters=64, kernel_size=3, padding="same")(conv2) 87 | conv3 = keras.layers.BatchNormalization()(conv3) 88 | conv3 = keras.layers.ReLU()(conv3) 89 | 90 | gap = keras.layers.GlobalAveragePooling1D()(conv3) 91 | 92 | output_layer = keras.layers.Dense(num_classes, activation="softmax")(gap) 93 | 94 | return keras.models.Model(inputs=input_layer, outputs=output_layer) 95 | -------------------------------------------------------------------------------- /AR-SCR/main.py: -------------------------------------------------------------------------------- 1 | import os 2 | import sys 3 | sys.path.append(os.getcwd()) 4 | 5 | import argparse 6 | 7 | import numpy as np 8 | import tensorflow as tf 9 | from tensorflow import keras 10 | import tensorflow.keras.backend as K 11 | 12 | from funcs import EarlyStopping 13 | from ts_dataloader import load_data 14 | from ts_model import AttRNN_Model, ARTLayer, WARTmodel, make_model 15 | 16 | # Learning phase is set to 0 since we want the network to use the pretrained moving mean/var 17 | # K.clear_session() 18 | 19 | def main(args): 20 | 21 | train_csv = 'Datasets/AR-SCR/train_full.csv' 22 | dev_csv = 'Datasets/AR-SCR/dev_full.csv' 23 | test_csv = 'Datasets/AR-SCR/test_full.csv' 24 | 25 | 26 | x_train, y_train = load_data(train_csv) 27 | x_dev, y_dev = load_data(dev_csv) 28 | x_test, y_test = load_data(test_csv) 29 | 30 | classes = np.unique(y_train) 31 | cls2label = {label: i for i, label in enumerate(classes.tolist())} 32 | num_classes = len(classes) 33 | 34 | y_train = [cls2label[y] for y in y_train] 35 | y_dev = [cls2label[y] for y in y_dev] 36 | y_test = [cls2label[y] for y in y_test] 37 | y_train = keras.utils.to_categorical(y_train, 
num_classes=num_classes) 38 | y_dev = keras.utils.to_categorical(y_dev, num_classes=num_classes) 39 | y_test = keras.utils.to_categorical(y_test, num_classes=num_classes) 40 | 41 | 42 | print("--- X shape : ", x_train[0].shape, "--- Num of Classes : ", num_classes) ## target class 43 | 44 | 45 | ## Pre-trained Model for Adv Program 46 | pr_model = AttRNN_Model() 47 | 48 | 49 | ## # of Source classes in Pre-trained Model 50 | source_classes = 36 ## Google Speech Commands 51 | 52 | target_shape = (x_train[0].shape[0], 1) 53 | 54 | ## Adv Program Time Series (ART) 55 | mapping_num = args.mapping 56 | try: 57 | assert mapping_num*num_classes <= source_classes 58 | except AssertionError: 59 | print("Error: The mapping num should be smaller than source_classes / num_classes: {}".format(source_classes//num_classes)) 60 | exit(1) 61 | 62 | model = WARTmodel(target_shape, pr_model, source_classes, mapping_num, num_classes, args.dropout) 63 | 64 | ## Loss 65 | adam = tf.keras.optimizers.Adam(lr=args.lr) 66 | model.compile(loss='categorical_crossentropy', optimizer = adam, metrics=['accuracy']) 67 | 68 | ## Checkpoints 69 | save_path = "AR-SCR/weight/" + str(args.lr) + "-{epoch:02d}-{val_accuracy:.4f}.h5" 70 | if not os.path.exists('AR-SCR/weight'): 71 | os.makedirs('AR-SCR/weight') 72 | 73 | checkpoints = tf.keras.callbacks.ModelCheckpoint(save_path,save_weights_only=True) 74 | earlystop = EarlyStopping(monitor='val_loss', patience=10, start_epoch=50, restore_best_weights=True) 75 | exp_callback = [earlystop, checkpoints] 76 | 77 | 78 | model.summary() 79 | 80 | batch_size = 32 81 | epochs = args.eps 82 | 83 | exp_history = model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, verbose=1, 84 | validation_data=(x_dev, y_dev), callbacks= exp_callback) 85 | 86 | score = model.evaluate(x_test, y_test, verbose=0) 87 | print('--- Test loss:', score[0]) 88 | print('- Test accuracy:', score[1]) 89 | 90 | return score 91 | 92 | if __name__ == '__main__': 93 | parser = 
class DataGenerator(keras.utils.Sequence):
    """Keras ``Sequence`` that re-samples a small training set every epoch.

    At construction and after every epoch, ``batch_size * 7`` examples are
    drawn with replacement. For each draw ``rnd.random()`` picks the pool:
    below 0.1 an "unknown" clip, below 0.15 a background-noise clip labelled
    ``"silence"``, otherwise a command clip. If the selected pool cannot be
    used (no unknown clips, no noise clips, or no ``"silence"`` class), a
    command clip is drawn instead.

    Args:
        datas: Iterable of waveforms. NOTE(review): ``__data_generation``
            reshapes a batch to ``(batch, samples, 1)``, so all waveforms are
            assumed to be 1-D and of equal length -- confirm with the caller.
        labels: Iterable of labels parallel to ``datas``; the literal label
            ``"unknown"`` routes a clip to the unknown pool.
        bg_audio: Sequence of background-noise waveforms used as "silence".
        classes: Mapping from label to integer class index.
        rnd: Random generator exposing ``random()``, ``choice(n)`` and
            ``shuffle(x)`` (e.g. ``numpy.random.RandomState``).
        batch_size: Number of examples per batch.
        shuffle: Whether to shuffle the example order after sampling.

    Raises:
        ValueError: If ``datas`` contains no command (non-"unknown") clip.
    """

    # Examples drawn per epoch = batch_size * _BATCHES_PER_EPOCH.
    _BATCHES_PER_EPOCH = 7
    # Cumulative thresholds applied to the per-example random draw.
    _UNKNOWN_THRESHOLD = 0.1
    _SILENCE_THRESHOLD = 0.15

    def __init__(self, datas, labels, bg_audio, classes, rnd, batch_size=32, shuffle=True):
        super().__init__()

        self.unknowns = list()
        self.commands = list()
        self._split_unknown(datas, labels)
        if not self.commands:
            raise ValueError("DataGenerator needs at least one command example.")

        self.datas = list()
        self.bg_audio = bg_audio

        self.classes = classes
        # Silence examples can only be encoded if the class table knows them.
        self.add_noise = "silence" in self.classes

        self.rnd = rnd

        self.batch_size = batch_size
        self.shuffle = shuffle
        self.epoch = 0
        # Populate self.datas / self.indexes for the first epoch.
        self.on_epoch_end()

    def _split_unknown(self, datas, labels):
        """Sort ``(wav, label)`` pairs into the unknown and command pools."""
        for wav, label in zip(datas, labels):
            pool = self.unknowns if label == "unknown" else self.commands
            pool.append((wav, label))

    def __len__(self):
        """Return the number of full batches available in the current epoch."""
        return len(self.datas) // self.batch_size

    def __getitem__(self, index):
        """Return batch number ``index`` as an ``(X, y)`` pair."""
        start = index * self.batch_size
        picked = self.indexes[start:start + self.batch_size]
        batch = [self.datas[k] for k in picked]
        return self.__data_generation(batch)

    def on_epoch_end(self):
        """Draw a fresh random set of examples for the next epoch."""
        has_unknowns = len(self.unknowns) > 0
        # len() rather than truthiness: bg_audio may be a NumPy array.
        has_silence = self.add_noise and len(self.bg_audio) > 0

        self.datas = list()
        for _ in range(self.batch_size * self._BATCHES_PER_EPOCH):
            coin = self.rnd.random()
            if coin < self._UNKNOWN_THRESHOLD and has_unknowns:
                example = self.unknowns[self.rnd.choice(len(self.unknowns))]
            elif (self._UNKNOWN_THRESHOLD <= coin < self._SILENCE_THRESHOLD
                  and has_silence):
                noise = self.bg_audio[self.rnd.choice(len(self.bg_audio))]
                example = (noise, "silence")
            else:
                # Regular case, and fallback when the chosen pool is unusable.
                example = self.commands[self.rnd.choice(len(self.commands))]
            self.datas.append(example)

        self.indexes = np.arange(len(self.datas))
        if self.shuffle:
            self.rnd.shuffle(self.indexes)

    def __data_generation(self, batch):
        """Stack a list of ``(wav, label)`` pairs into model inputs/targets.

        Returns:
            tuple: ``(X, y)`` where ``X`` has a trailing channel axis of size 1
            and ``y`` is the one-hot encoding of the class indices.
        """
        X = np.array([wav for wav, _ in batch])
        y = [self.classes[label] for _, label in batch]

        # Add the channel axis: (batch, samples) -> (batch, samples, 1).
        X = X.reshape((X.shape[0], X.shape[1], 1))

        return X, keras.utils.to_categorical(y, num_classes=len(self.classes))
-------------------------------------------------------------------------------- 1 | ## Adversarial Reprogramming on Speech Command Recognition 2 | 3 | 4 | 5 | ### Environment 6 | 7 | TensorFlow 2.2 (CUDA=10.0) and Kapre 0.2.0. 8 | 9 | - option 1 (from yml) 10 | 11 | ```shell 12 | conda env create -f repr-scr.yml 13 | source activate repr-scr 14 | ``` 15 | 16 | - option 2 (from clean python 3.6) 17 | 18 | ```shell 19 | pip install tensorflow-gpu==2.1.0 20 | pip install kapre==0.2.0 21 | pip install h5py==2.10.0 22 | ``` 23 | 24 | ### Dataset 25 | 26 | Arabic Speech Commands dataset 27 | 28 | - Please download the Arabic Speech Commands dataset [here](https://github.com/ltkbenamer/AR_Speech_Database.git). 29 | 30 | ```shell 31 | ./prepare_ar_data.sh 32 | ``` 33 | 34 | Lithuanian Speech Commands dataset 35 | 36 | - Please download the Lithuanian Speech Commands dataset [here](https://github.com/kolesov93/lt_speech_commands). 37 | 38 | ```shell 39 | ./prepare_lt_data.sh 40 | ``` 41 | 42 | Dysarthric Speech Commands dataset 43 | 44 | - Please download the Dysarthric Speech Commands dataset [here](https://reurl.cc/a5vAG4). 45 | 46 | ```shell 47 | ./prepare_dm_data.sh 48 | ``` 49 | 50 | ### Training 51 | 52 | To train and evaluate the models for the three speech command recognition tasks, run: 53 | 54 | ```shell 55 | ./run_ar.sh 56 | ./run_lt.sh 57 | ./run_dm.sh 58 | ``` 59 | For more details, please refer to [AR-SCR](https://github.com/dodohow1011/SpeechAdvReprogram/blob/main/AR-SCR/main.py), [LT-SCR](https://github.com/dodohow1011/SpeechAdvReprogram/blob/main/LT-SCR/main.py) and [DM-SCR](https://github.com/dodohow1011/SpeechAdvReprogram/blob/main/DM-SCR/main.py). 60 | 61 | (**Optional**) Note that in our default setting we use the random mapping strategy. 
To enable the similarity mapping, 62 | please modify the code at [utils.py](https://github.com/dodohow1011/SpeechAdvReprogram/blob/main/utils.py#L19) as follows: 63 | ```python 64 | def multi_mapping(prob, source_num, mapping_num, target_num): 65 | 66 | similarity_mapping = True 67 | ``` 68 | Then choose the [label_map](https://github.com/dodohow1011/SpeechAdvReprogram/blob/27db34e75f048903f296981d5c6e9a2d7a32f742/utils.py#L31-L33) according to your task. You can also inspect the mapping results for each task by running the following commands: 69 | ```sh 70 | python AR-SCR/source_target_pairing.py 71 | python LT-SCR/source_target_pairing.py 72 | python DM-SCR/source_target_pairing.py 73 | ``` 74 | 75 | 76 | #### Please consider citing this work if you use the provided code or find the idea related to your research. Thank you! 77 | 78 | - A Study of Low-Resource Speech Commands Recognition Based on Adversarial Reprogramming [Paper](https://arxiv.org/pdf/2110.03894.pdf) 79 | 80 | ```bib 81 | 82 | @article{yen2023neural, 83 | title={Neural model reprogramming with similarity based mapping for low-resource spoken command classification}, 84 | author={Yen, Hao and Ku, Pin-Jui and Yang, Chao-Han Huck and Hu, Hu and Siniscalchi, Sabato Marco and Chen, Pin-Yu and Tsao, Yu}, 85 | journal={Proc. 
def main(args, rnd):
    """Train and evaluate the reprogrammed model on the LT-SCR task.

    Loads the train/dev/test CSV listings and the background-noise clips,
    adds a "silence" class (10 noise clips each go to the test and dev sets,
    the rest feed the training generator), builds the ``WARTmodel`` on top of
    the pre-trained ``AttRNN_Model``, trains it and evaluates on the test set.

    Args:
        args: Parsed command-line arguments; ``mapping``, ``dropout``, ``lr``,
            ``lr_decay`` and ``eps`` are read.
        rnd: Random generator shared by data loading, noise scaling,
            shuffling and the training generator (``random()``, ``shuffle()``
            are used here).

    Returns:
        The value of ``model.evaluate`` on the test set; index 0 is printed
        as the loss and index 1 as the accuracy.

    Exits:
        Terminates the process with status 1 when
        ``args.mapping * num_classes`` exceeds the number of source classes.
    """
    train_csv = 'Datasets/LT-SCR/train_limit20.csv'
    dev_csv = 'Datasets/LT-SCR/dev_full.csv'
    test_csv = 'Datasets/LT-SCR/test_full.csv'

    noise_csv = 'Datasets/LT-SCR/noise_full.csv'

    x_train, y_train = load_data(train_csv, rnd)
    x_dev, y_dev = load_data(dev_csv, rnd)
    x_test, y_test = load_data(test_csv, rnd)

    classes = np.unique(y_train)

    # Background noise, randomly attenuated, serves as the "silence" class.
    bg_audio = load_data(noise_csv, rnd)[0]
    bg_audio = [noise * rnd.random() * 0.1 for noise in bg_audio]

    rnd.shuffle(bg_audio)
    # Disjoint noise slices: [:10] -> test, [10:20] -> dev, [20:] -> training.
    x_test = np.concatenate((x_test, bg_audio[:10]), axis=0)
    x_dev = np.concatenate((x_dev, bg_audio[10:20]), axis=0)
    y_test.extend(["silence"]*10)
    y_dev.extend(["silence"]*10)

    classes = np.append(classes, ["silence"])

    cls2label = {label: i for i, label in enumerate(classes.tolist())}
    num_classes = len(classes)

    batch_size = 32
    epochs = args.eps

    # The generator produces the batches, so it owns the batch size.
    train_generator = DataGenerator(x_train, y_train, bg_audio[20:], cls2label, rnd,
                                    batch_size=batch_size)
    y_dev = [cls2label[y] for y in y_dev]
    y_test = [cls2label[y] for y in y_test]
    y_dev = keras.utils.to_categorical(y_dev, num_classes=num_classes)
    y_test = keras.utils.to_categorical(y_test, num_classes=num_classes)

    print("--- X shape : ", x_train[0].shape, "--- Num of Classes : ", num_classes) ## target class

    ## Pre-trained Model for Adv Program
    pr_model = AttRNN_Model()

    ## # of Source classes in Pre-trained Model
    source_classes = 36 ## Google Speech Commands

    target_shape = (x_train[0].shape[0], 1)

    ## Adv Program Time Series (ART)
    mapping_num = args.mapping
    # Explicit check instead of `assert`, which is removed under `python -O`.
    if mapping_num * num_classes > source_classes:
        print("Error: The mapping num should be smaller than source_classes / num_classes: {}".format(source_classes//num_classes))
        sys.exit(1)

    model = WARTmodel(target_shape, pr_model, source_classes, mapping_num, num_classes, args.dropout)

    ## Loss
    adam = tf.keras.optimizers.Adam()
    model.compile(loss='categorical_crossentropy', optimizer=adam, metrics=['accuracy'])

    # The learning rate is driven per batch by the warm-up/decay callback.
    lr_scheduler = LR_Warmup(lr_base=args.lr, decay=args.lr_decay, warmup_epochs=20)

    ## Checkpoints
    save_path = "LT-SCR/weight/" + str(args.lr) + "-" + str(args.lr_decay) + "-{epoch:02d}-{val_loss:.4f}-{val_accuracy:.4f}.h5"
    if not os.path.exists('LT-SCR/weight'):
        os.makedirs('LT-SCR/weight')

    checkpoints = tf.keras.callbacks.ModelCheckpoint(save_path, monitor='val_accuracy', save_weights_only=True, save_best_only=True)
    earlystop = EarlyStopping(monitor='val_accuracy', patience=10, start_epoch=70, restore_best_weights=True)
    exp_callback = [earlystop, lr_scheduler, checkpoints]

    model.summary()

    # `batch_size` is not passed to fit(): it must not be specified when the
    # input is a keras.utils.Sequence, which yields ready-made batches.
    model.fit(train_generator, epochs=epochs, verbose=1,
              validation_data=(x_dev, y_dev), callbacks=exp_callback)

    score = model.evaluate(x_test, y_test, verbose=0)
    print('--- Test loss:', score[0])
    print('- Test accuracy:', score[1])

    return score
def _class_means(features_per_class, kind):
    """Average the feature rows collected for each class into one vector."""
    centers = []
    for cls, feats in enumerate(features_per_class):
        if not feats:
            # np.concatenate([]) would fail with an unhelpful message.
            raise ValueError(
                "No samples found for {} class {}; cannot compute its center.".format(kind, cls))
        centers.append(np.concatenate(feats, axis=0).mean(axis=0))
    return centers


def source_target_mapping(sourceGen, target_audios, target_labels):
    """Pair source classes with target classes by representation similarity.

    Every target and source clip is passed through the pre-trained
    ``AttRNN_Model`` and the output of its second-to-last layer is averaged
    per class. Each source class (in index order) is then assigned to the
    target class with the highest cosine similarity that still has capacity:
    first at most two sources per target, then at most three. A source class
    is left unassigned when every target already holds three. The pairing is
    printed and returned.

    Args:
        sourceGen: Indexable batch generator; ``sourceGen[i]`` must return
            ``(audios, labels)`` with ``audios`` a 2-D array and ``labels``
            integer source-class indices.
        target_audios: Iterable of target waveforms (NumPy arrays); each is
            reshaped to a single-row batch before being fed to the model.
        target_labels: Target labels parallel to ``target_audios``.

    Returns:
        list: ``pairing[t]`` is the list of source-class indices assigned to
        target class ``t`` (targets ordered as returned by ``np.unique``).

    Raises:
        ValueError: If a source or target class has no samples.
    """
    target_classes = np.unique(target_labels, axis=0)
    target_cls2label = {label: i for i, label in enumerate(target_classes.tolist())}
    target_label2cls = {i: label for label, i in target_cls2label.items()}
    target_ids = [target_cls2label[cls] for cls in target_labels]

    # We want the last hidden output (layer before the classifier) for clustering.
    gsm_model = AttRNN_Model()
    gsm_model.summary()
    embed = K.function([gsm_model.input], [gsm_model.layers[-2].output])

    target_feats = [[] for _ in target_classes]
    for audio, label in zip(target_audios, target_ids):
        target_feats[label].append(embed([audio.reshape((1, -1))])[0])
    target_centers = _class_means(target_feats, "target")

    # One bucket per source class listed in the index-to-word table.
    source_feats = [[] for _ in Gsm_n2wMapping]
    for i in range(len(sourceGen)):
        audios, labels = sourceGen[i]
        batch_size, _ = audios.shape
        batch_center = embed([audios])[0]
        for j in range(batch_size):
            source_feats[labels[j]].append(batch_center[j].reshape(1, -1))
    source_centers = _class_means(source_feats, "source")

    # Now we have a representative vector for each target and source class.
    # Next we need to pair them.
    num_targets = len(target_centers)
    counter = [0] * num_targets
    pair_result = {t: [] for t in range(num_targets)}

    for s, s_center in enumerate(source_centers):
        s_norm = np.linalg.norm(s_center)
        sims = [np.dot(s_center, t_center) / (s_norm * np.linalg.norm(t_center))
                for t_center in target_centers]
        # Most similar target first; the stable sort keeps index order on ties.
        ranked = sorted(range(num_targets), key=lambda t: sims[t], reverse=True)

        # First fill every target up to two sources, then allow a third.
        for capacity in (2, 3):
            chosen = next((t for t in ranked if counter[t] < capacity), None)
            if chosen is not None:
                pair_result[chosen].append(s)
                counter[chosen] += 1
                break

    pairing = []
    for t, ss in pair_result.items():
        print("source class: {} is paired with target class: {}".format([Gsm_n2wMapping[s] for s in ss], target_label2cls[t]))
        pairing.append(ss)

    print("The label_map result is {}".format(pairing))

    return pairing
class EarlyStopping(keras.callbacks.Callback):
    """Early-stopping callback that only becomes active at ``start_epoch``.

    Epochs with index below ``start_epoch`` are ignored entirely: no best
    value is tracked and the patience counter does not advance. From
    ``start_epoch`` on, training stops once the monitored value has failed to
    improve for ``patience`` consecutive epochs.

    Args:
        monitor: Key in the epoch ``logs`` dict to watch.
        min_delta: Minimum change that counts as an improvement (its absolute
            value is used).
        patience: Number of non-improving epochs tolerated before stopping.
        verbose: Values above 0 print messages when stopping/restoring.
        start_epoch: First (0-based) epoch index at which monitoring begins.
        mode: ``'min'``, ``'max'`` or ``'auto'``. In ``'auto'`` mode the
            value is maximised when ``'acc'`` occurs in ``monitor`` and
            minimised otherwise. Unknown modes fall back to ``'auto'``.
        baseline: Optional value the metric must also beat for the patience
            counter to be reset.
        restore_best_weights: If true, the weights from the best monitored
            epoch are restored when training is stopped by this callback.
    """

    def __init__(self,
                 monitor='val_loss',
                 min_delta=0,
                 patience=0,
                 verbose=0,
                 start_epoch=0,
                 mode='auto',
                 baseline=None,
                 restore_best_weights=False):
        super(EarlyStopping, self).__init__()

        self.monitor = monitor
        self.patience = patience
        self.verbose = verbose
        self.baseline = baseline
        self.min_delta = abs(min_delta)
        self.wait = 0
        self.stopped_epoch = 0
        self.start_epoch = start_epoch
        self.restore_best_weights = restore_best_weights
        self.best_weights = None

        if mode not in ['auto', 'min', 'max']:
            # Local import: this module has no top-level `import logging`.
            import logging
            logging.warning('EarlyStopping mode %s is unknown, '
                            'fallback to auto mode.', mode)
            mode = 'auto'

        if mode == 'min':
            self.monitor_op = np.less
        elif mode == 'max':
            self.monitor_op = np.greater
        elif 'acc' in self.monitor:
            self.monitor_op = np.greater
        else:
            self.monitor_op = np.less

        # When minimising, an improvement is a *decrease*, so flip the sign
        # of the margin used in _is_improvement.
        if self.monitor_op is not np.greater:
            self.min_delta *= -1

    def on_train_begin(self, logs=None):
        """Reset the state so the same instance can be reused across fits."""
        self.wait = 0
        self.stopped_epoch = 0
        # np.inf (lower case): the np.Inf alias no longer exists in NumPy 2.
        self.best = np.inf if self.monitor_op is np.less else -np.inf
        self.best_weights = None

    def on_epoch_end(self, epoch, logs=None):
        """Update the best value / patience counter and stop if exhausted."""
        current = self.get_monitor_value(logs)
        if current is None or epoch < self.start_epoch:
            return
        if self.restore_best_weights and self.best_weights is None:
            # Keep the first monitored epoch's weights in case no progress
            # is ever made afterwards.
            self.best_weights = self.model.get_weights()

        self.wait += 1
        if self._is_improvement(current, self.best):
            self.best = current
            if self.restore_best_weights:
                self.best_weights = self.model.get_weights()
            # Only restart wait if we beat both the baseline and our previous best.
            if self.baseline is None or self._is_improvement(current, self.baseline):
                self.wait = 0

        if self.wait >= self.patience:
            self.stopped_epoch = epoch
            self.model.stop_training = True
            if self.restore_best_weights and self.best_weights is not None:
                if self.verbose > 0:
                    print('Restoring model weights from the end of the best epoch.')
                self.model.set_weights(self.best_weights)

    def on_train_end(self, logs=None):
        """Report the stopping epoch (1-based) when verbose."""
        if self.stopped_epoch > 0 and self.verbose > 0:
            print('Epoch %05d: early stopping' % (self.stopped_epoch + 1))

    def get_monitor_value(self, logs):
        """Return ``logs[self.monitor]``, or ``None`` (with a warning) if absent."""
        logs = logs or {}
        monitor_value = logs.get(self.monitor)
        if monitor_value is None:
            # Local import: this module has no top-level `import logging`.
            import logging
            logging.warning('Early stopping conditioned on metric `%s` '
                            'which is not available. Available metrics are: %s',
                            self.monitor, ','.join(list(logs.keys())))
        return monitor_value

    def _is_improvement(self, monitor_value, reference_value):
        """Return whether ``monitor_value`` beats ``reference_value`` by the margin."""
        return self.monitor_op(monitor_value - self.min_delta, reference_value)
/work/dodohow1011/lt_speech_commands/dataset/taip/07_nohash_0.wav unknown 22 | /work/dodohow1011/lt_speech_commands/dataset/taip/22_nohash_0.wav unknown 23 | /work/dodohow1011/lt_speech_commands/dataset/labas/20_nohash_0.wav labas 24 | /work/dodohow1011/lt_speech_commands/dataset/labas/04_nohash_0.wav labas 25 | /work/dodohow1011/lt_speech_commands/dataset/labas/11_nohash_0.wav labas 26 | /work/dodohow1011/lt_speech_commands/dataset/labas/07_nohash_0.wav labas 27 | /work/dodohow1011/lt_speech_commands/dataset/labas/22_nohash_0.wav labas 28 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/11_nohash_0.wav į_viršų 29 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/07_nohash_0.wav į_viršų 30 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/22_nohash_0.wav į_viršų 31 | /work/dodohow1011/lt_speech_commands/dataset/stop/20_nohash_0.wav stop 32 | /work/dodohow1011/lt_speech_commands/dataset/stop/04_nohash_0.wav stop 33 | /work/dodohow1011/lt_speech_commands/dataset/stop/11_nohash_0.wav stop 34 | /work/dodohow1011/lt_speech_commands/dataset/stop/07_nohash_0.wav stop 35 | /work/dodohow1011/lt_speech_commands/dataset/stop/22_nohash_0.wav stop 36 | /work/dodohow1011/lt_speech_commands/dataset/vienas/20_nohash_0.wav unknown 37 | /work/dodohow1011/lt_speech_commands/dataset/vienas/11_nohash_0.wav unknown 38 | /work/dodohow1011/lt_speech_commands/dataset/vienas/07_nohash_0.wav unknown 39 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/22_nohash_0.wav į_apačią 40 | /work/dodohow1011/lt_speech_commands/dataset/ne/20_nohash_0.wav ne 41 | /work/dodohow1011/lt_speech_commands/dataset/ne/04_nohash_0.wav ne 42 | /work/dodohow1011/lt_speech_commands/dataset/ne/11_nohash_0.wav ne 43 | /work/dodohow1011/lt_speech_commands/dataset/ne/07_nohash_0.wav ne 44 | /work/dodohow1011/lt_speech_commands/dataset/ne/22_nohash_0.wav ne 45 | /work/dodohow1011/lt_speech_commands/dataset/nulis/20_nohash_0.wav unknown 46 | 
/work/dodohow1011/lt_speech_commands/dataset/nulis/11_nohash_0.wav unknown 47 | /work/dodohow1011/lt_speech_commands/dataset/nulis/07_nohash_0.wav unknown 48 | /work/dodohow1011/lt_speech_commands/dataset/penki/20_nohash_0.wav unknown 49 | /work/dodohow1011/lt_speech_commands/dataset/penki/04_nohash_0.wav unknown 50 | /work/dodohow1011/lt_speech_commands/dataset/penki/11_nohash_0.wav unknown 51 | /work/dodohow1011/lt_speech_commands/dataset/penki/07_nohash_0.wav unknown 52 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/20_nohash_0.wav pauzė 53 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/04_nohash_0.wav pauzė 54 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/11_nohash_0.wav pauzė 55 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/07_nohash_0.wav pauzė 56 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/22_nohash_0.wav pauzė 57 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/11_nohash_0.wav į_kairę 58 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/07_nohash_0.wav į_kairę 59 | /work/dodohow1011/lt_speech_commands/dataset/iki/20_nohash_0.wav iki 60 | /work/dodohow1011/lt_speech_commands/dataset/iki/04_nohash_0.wav iki 61 | /work/dodohow1011/lt_speech_commands/dataset/iki/11_nohash_0.wav iki 62 | /work/dodohow1011/lt_speech_commands/dataset/iki/07_nohash_0.wav iki 63 | /work/dodohow1011/lt_speech_commands/dataset/iki/22_nohash_0.wav iki 64 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/20_nohash_0.wav įjunk 65 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/04_nohash_0.wav įjunk 66 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/11_nohash_0.wav įjunk 67 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/07_nohash_0.wav įjunk 68 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/22_nohash_0.wav įjunk 69 | /work/dodohow1011/lt_speech_commands/dataset/startas/20_nohash_0.wav startas 70 | /work/dodohow1011/lt_speech_commands/dataset/startas/07_nohash_0.wav startas 71 | 
/work/dodohow1011/lt_speech_commands/dataset/startas/22_nohash_0.wav startas 72 | /work/dodohow1011/lt_speech_commands/dataset/trys/20_nohash_0.wav unknown 73 | /work/dodohow1011/lt_speech_commands/dataset/trys/04_nohash_0.wav unknown 74 | /work/dodohow1011/lt_speech_commands/dataset/trys/11_nohash_0.wav unknown 75 | /work/dodohow1011/lt_speech_commands/dataset/trys/07_nohash_0.wav unknown 76 | /work/dodohow1011/lt_speech_commands/dataset/trys/22_nohash_0.wav unknown 77 | -------------------------------------------------------------------------------- /Datasets/LT-SCR/test_full.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | /work/dodohow1011/lt_speech_commands/dataset/du/13_nohash_0.wav unknown 3 | /work/dodohow1011/lt_speech_commands/dataset/du/12_nohash_0.wav unknown 4 | /work/dodohow1011/lt_speech_commands/dataset/du/02_nohash_0.wav unknown 5 | /work/dodohow1011/lt_speech_commands/dataset/du/17_nohash_0.wav unknown 6 | /work/dodohow1011/lt_speech_commands/dataset/du/28_nohash_0.wav unknown 7 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/13_nohash_0.wav išjunk 8 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/12_nohash_0.wav išjunk 9 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/02_nohash_0.wav išjunk 10 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/28_nohash_0.wav išjunk 11 | /work/dodohow1011/lt_speech_commands/dataset/keturi/13_nohash_0.wav unknown 12 | /work/dodohow1011/lt_speech_commands/dataset/keturi/12_nohash_0.wav unknown 13 | /work/dodohow1011/lt_speech_commands/dataset/keturi/02_nohash_0.wav unknown 14 | /work/dodohow1011/lt_speech_commands/dataset/keturi/17_nohash_0.wav unknown 15 | /work/dodohow1011/lt_speech_commands/dataset/keturi/28_nohash_0.wav unknown 16 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/13_nohash_0.wav į_dešinę 17 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/12_nohash_0.wav į_dešinę 18 | 
/work/dodohow1011/lt_speech_commands/dataset/į_dešinę/02_nohash_0.wav į_dešinę 19 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/28_nohash_0.wav į_dešinę 20 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/13_nohash_0.wav ačiū 21 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/12_nohash_0.wav ačiū 22 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/02_nohash_0.wav ačiū 23 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/28_nohash_0.wav ačiū 24 | /work/dodohow1011/lt_speech_commands/dataset/taip/13_nohash_0.wav unknown 25 | /work/dodohow1011/lt_speech_commands/dataset/taip/12_nohash_0.wav unknown 26 | /work/dodohow1011/lt_speech_commands/dataset/taip/02_nohash_0.wav unknown 27 | /work/dodohow1011/lt_speech_commands/dataset/taip/17_nohash_0.wav unknown 28 | /work/dodohow1011/lt_speech_commands/dataset/taip/28_nohash_0.wav unknown 29 | /work/dodohow1011/lt_speech_commands/dataset/labas/13_nohash_0.wav labas 30 | /work/dodohow1011/lt_speech_commands/dataset/labas/12_nohash_0.wav labas 31 | /work/dodohow1011/lt_speech_commands/dataset/labas/02_nohash_0.wav labas 32 | /work/dodohow1011/lt_speech_commands/dataset/labas/28_nohash_0.wav labas 33 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/13_nohash_0.wav į_viršų 34 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/12_nohash_0.wav į_viršų 35 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/02_nohash_0.wav į_viršų 36 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/28_nohash_0.wav į_viršų 37 | /work/dodohow1011/lt_speech_commands/dataset/stop/13_nohash_0.wav stop 38 | /work/dodohow1011/lt_speech_commands/dataset/stop/12_nohash_0.wav stop 39 | /work/dodohow1011/lt_speech_commands/dataset/stop/02_nohash_0.wav stop 40 | /work/dodohow1011/lt_speech_commands/dataset/stop/17_nohash_0.wav stop 41 | /work/dodohow1011/lt_speech_commands/dataset/stop/28_nohash_0.wav stop 42 | /work/dodohow1011/lt_speech_commands/dataset/vienas/13_nohash_0.wav unknown 43 | 
/work/dodohow1011/lt_speech_commands/dataset/vienas/12_nohash_0.wav unknown 44 | /work/dodohow1011/lt_speech_commands/dataset/vienas/02_nohash_0.wav unknown 45 | /work/dodohow1011/lt_speech_commands/dataset/vienas/28_nohash_0.wav unknown 46 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/13_nohash_0.wav į_apačią 47 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/12_nohash_0.wav į_apačią 48 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/02_nohash_0.wav į_apačią 49 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/28_nohash_0.wav į_apačią 50 | /work/dodohow1011/lt_speech_commands/dataset/ne/13_nohash_0.wav ne 51 | /work/dodohow1011/lt_speech_commands/dataset/ne/12_nohash_0.wav ne 52 | /work/dodohow1011/lt_speech_commands/dataset/ne/02_nohash_0.wav ne 53 | /work/dodohow1011/lt_speech_commands/dataset/ne/17_nohash_0.wav ne 54 | /work/dodohow1011/lt_speech_commands/dataset/ne/28_nohash_0.wav ne 55 | /work/dodohow1011/lt_speech_commands/dataset/nulis/13_nohash_0.wav unknown 56 | /work/dodohow1011/lt_speech_commands/dataset/nulis/12_nohash_0.wav unknown 57 | /work/dodohow1011/lt_speech_commands/dataset/nulis/02_nohash_0.wav unknown 58 | /work/dodohow1011/lt_speech_commands/dataset/nulis/17_nohash_0.wav unknown 59 | /work/dodohow1011/lt_speech_commands/dataset/nulis/28_nohash_0.wav unknown 60 | /work/dodohow1011/lt_speech_commands/dataset/penki/13_nohash_0.wav unknown 61 | /work/dodohow1011/lt_speech_commands/dataset/penki/12_nohash_0.wav unknown 62 | /work/dodohow1011/lt_speech_commands/dataset/penki/02_nohash_0.wav unknown 63 | /work/dodohow1011/lt_speech_commands/dataset/penki/28_nohash_0.wav unknown 64 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/13_nohash_0.wav pauzė 65 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/12_nohash_0.wav pauzė 66 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/02_nohash_0.wav pauzė 67 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/28_nohash_0.wav pauzė 68 | 
/work/dodohow1011/lt_speech_commands/dataset/į_kairę/13_nohash_0.wav į_kairę 69 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/12_nohash_0.wav į_kairę 70 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/02_nohash_0.wav į_kairę 71 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/28_nohash_0.wav į_kairę 72 | /work/dodohow1011/lt_speech_commands/dataset/iki/13_nohash_0.wav iki 73 | /work/dodohow1011/lt_speech_commands/dataset/iki/12_nohash_0.wav iki 74 | /work/dodohow1011/lt_speech_commands/dataset/iki/02_nohash_0.wav iki 75 | /work/dodohow1011/lt_speech_commands/dataset/iki/28_nohash_0.wav iki 76 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/13_nohash_0.wav įjunk 77 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/12_nohash_0.wav įjunk 78 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/02_nohash_0.wav įjunk 79 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/17_nohash_0.wav įjunk 80 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/28_nohash_0.wav įjunk 81 | /work/dodohow1011/lt_speech_commands/dataset/startas/13_nohash_0.wav startas 82 | /work/dodohow1011/lt_speech_commands/dataset/startas/12_nohash_0.wav startas 83 | /work/dodohow1011/lt_speech_commands/dataset/startas/02_nohash_0.wav startas 84 | /work/dodohow1011/lt_speech_commands/dataset/startas/28_nohash_0.wav startas 85 | /work/dodohow1011/lt_speech_commands/dataset/trys/13_nohash_0.wav unknown 86 | /work/dodohow1011/lt_speech_commands/dataset/trys/12_nohash_0.wav unknown 87 | /work/dodohow1011/lt_speech_commands/dataset/trys/02_nohash_0.wav unknown 88 | /work/dodohow1011/lt_speech_commands/dataset/trys/17_nohash_0.wav unknown 89 | /work/dodohow1011/lt_speech_commands/dataset/trys/28_nohash_0.wav unknown 90 | -------------------------------------------------------------------------------- /repr-scr.yml: -------------------------------------------------------------------------------- 1 | name: repr-scr 2 | channels: 3 | - conda-forge 4 | - anaconda 5 | - defaults 6 | 
dependencies: 7 | - _tflow_select=2.1.0=gpu 8 | - absl-py=0.10.0=py36_0 9 | - aiohttp=3.6.3=py36h7b6447c_0 10 | - astunparse=1.6.3=py_0 11 | - async-timeout=3.0.1=py36_0 12 | - attrs=20.2.0=py_0 13 | - blinker=1.4=py36_0 14 | - brotlipy=0.7.0=py36h7b6447c_1000 15 | - c-ares=1.16.1=h7b6447c_0 16 | - ca-certificates=2020.10.14=0 17 | - cachetools=4.1.1=py_0 18 | - certifi=2020.6.20=py36_0 19 | - chardet=3.0.4=py36_1003 20 | - click=7.1.2=py_0 21 | - cryptography=3.1.1=py36h1ba5d50_0 22 | - cudatoolkit=10.1.243=h6bb024c_0 23 | - cudnn=7.6.5=cuda10.1_0 24 | - cupti=10.1.168=0 25 | - cython=0.29.21=py36he6710b0_0 26 | - gast=0.3.3=py_0 27 | - google-auth=1.22.1=py_0 28 | - google-auth-oauthlib=0.4.1=py_2 29 | - google-pasta=0.2.0=py_0 30 | - grpcio=1.31.0=py36hf8bcb03_0 31 | - h5py=2.10.0=py36hd6299e0_1 32 | - hdf5=1.10.6=hb1b8bf9_0 33 | - idna=2.10=py_0 34 | - idna_ssl=1.1.0=py36_0 35 | - importlib-metadata=2.0.0=py_1 36 | - intel-openmp=2020.2=254 37 | - keras-preprocessing=1.1.0=py_1 38 | - lcms2=2.11=h396b838_0 39 | - libgfortran-ng=7.3.0=hdf63c60_0 40 | - libprotobuf=3.13.0.1=hd408876_0 41 | - markdown=3.3.2=py36_0 42 | - mkl=2019.4=243 43 | - mkl-service=2.3.0=py36he904b0f_0 44 | - mkl_random=1.1.0=py36hd6b4f25_0 45 | - multidict=4.7.6=py36h7b6447c_1 46 | - oauthlib=3.1.0=py_0 47 | - olefile=0.46=py_0 48 | - openssl=1.1.1h=h7b6447c_0 49 | - opt_einsum=3.1.0=py_0 50 | - pandas=1.1.3=py36he6710b0_0 51 | - pillow=8.0.0=py36h9a89aac_0 52 | - protobuf=3.13.0.1=py36he6710b0_1 53 | - pyasn1=0.4.8=py_0 54 | - pyasn1-modules=0.2.8=py_0 55 | - pycparser=2.20=py_2 56 | - pyjwt=1.7.1=py36_0 57 | - pyopenssl=19.1.0=py_1 58 | - pysocks=1.7.1=py36_0 59 | - python-dateutil=2.8.1=py_0 60 | - pytz=2020.1=py_0 61 | - requests=2.24.0=py_0 62 | - requests-oauthlib=1.3.0=py_0 63 | - rsa=4.6=py_0 64 | - seaborn=0.11.0=py_0 65 | - six=1.15.0=py_0 66 | - tensorboard=2.2.1=pyh532a8cf_0 67 | - tensorboard-plugin-wit=1.6.0=py_0 68 | - tensorflow=2.2.0=gpu_py36hf933387_0 69 | - 
tensorflow-base=2.2.0=gpu_py36h8a81be8_0 70 | - tensorflow-estimator=2.2.0=pyh208ff02_0 71 | - tensorflow-gpu=2.2.0=h0d30ee6_0 72 | - termcolor=1.1.0=py36_1 73 | - typing_extensions=3.7.4.3=py_0 74 | - urllib3=1.25.11=py_0 75 | - werkzeug=1.0.1=py_0 76 | - wrapt=1.12.1=py36h7b6447c_1 77 | - yarl=1.6.2=py36h7b6447c_0 78 | - zipp=3.3.1=py_0 79 | - _libgcc_mutex=0.1=conda_forge 80 | - _openmp_mutex=4.5=1_gnu 81 | - blas=2.14=openblas 82 | - bzip2=1.0.8=h516909a_3 83 | - cairo=1.16.0=h9f066cc_1006 84 | - cffi=1.14.4=py36h211aa47_0 85 | - cycler=0.10.0=py_2 86 | - dbus=1.13.6=hfdff14a_1 87 | - expat=2.2.9=he1b5a44_2 88 | - ffmpeg=4.3.1=h3215721_1 89 | - fontconfig=2.13.1=h7e3eb15_1002 90 | - freetype=2.10.4=h7ca028e_0 91 | - gettext=0.19.8.1=hf34092f_1004 92 | - glib=2.66.3=h58526e2_0 93 | - gmp=6.2.1=h58526e2_0 94 | - gnutls=3.6.13=h85f3911_1 95 | - graphite2=1.3.13=h58526e2_1001 96 | - gst-plugins-base=1.14.5=h0935bb2_2 97 | - gstreamer=1.14.5=h36ae1b5_2 98 | - harfbuzz=2.7.2=ha5b49bf_1 99 | - icu=67.1=he1b5a44_0 100 | - jasper=1.900.1=h07fcdf6_1006 101 | - jpeg=9d=h36c2ea0_0 102 | - kiwisolver=1.3.1=py36h51d7077_0 103 | - krb5=1.17.2=h926e7f8_0 104 | - lame=3.100=h14c3975_1001 105 | - libblas=3.8.0=14_openblas 106 | - libcblas=3.8.0=14_openblas 107 | - libclang=10.0.1=default_hde54327_1 108 | - libevent=2.1.10=hcdb4288_3 109 | - libffi=3.2.1=he1b5a44_1007 110 | - libflac=1.3.3=he1b5a44_0 111 | - libgcc-ng=9.3.0=h5dbcf3e_17 112 | - libglib=2.66.3=hbe7bbb4_0 113 | - libgomp=9.3.0=h5dbcf3e_17 114 | - libiconv=1.16=h516909a_0 115 | - liblapack=3.8.0=14_openblas 116 | - liblapacke=3.8.0=14_openblas 117 | - libllvm10=10.0.1=he513fc3_3 118 | - libogg=1.3.2=h516909a_1002 119 | - libopenblas=0.3.7=h5ec1e0e_6 120 | - libopencv=4.5.0=py36_2 121 | - libpng=1.6.37=h21135ba_2 122 | - libpq=12.3=h5513abc_2 123 | - libsndfile=1.0.29=he1b5a44_0 124 | - libtiff=4.1.0=h4f3a223_6 125 | - libuuid=2.32.1=h14c3975_1000 126 | - libvorbis=1.3.7=he1b5a44_0 127 | - 
libwebp-base=1.1.0=h36c2ea0_3 128 | - libxcb=1.13=h14c3975_1002 129 | - libxkbcommon=0.10.0=he1b5a44_0 130 | - libxml2=2.9.10=h68273f3_2 131 | - llvmlite=0.34.0=py36hfa65bc7_2 132 | - lz4-c=1.9.2=he1b5a44_3 133 | - matplotlib=3.3.3=py36h5fab9bb_0 134 | - matplotlib-base=3.3.3=py36he12231b_0 135 | - mkl_fft=1.1.0=py36hc1659b7_1 136 | - mysql-common=8.0.21=2 137 | - mysql-libs=8.0.21=hf3661c5_2 138 | - nettle=3.6=he412f7d_0 139 | - nspr=4.29=he1b5a44_1 140 | - nss=3.59=h2c00c37_0 141 | - numba=0.51.2=py36h7c3b610_0 142 | - numpy=1.19.4=py36h8732dcd_1 143 | - opencv=4.5.0=py36_2 144 | - openh264=2.1.1=h8b12597_0 145 | - pcre=8.44=he1b5a44_0 146 | - pixman=0.40.0=h36c2ea0_0 147 | - pot=0.6.0=py36hb3f55d8_1 148 | - pthread-stubs=0.4=h36c2ea0_1001 149 | - py-opencv=4.5.0=py36hac0dd68_2 150 | - pyparsing=2.4.7=pyh9f0ad1d_0 151 | - pyqt=5.12.3=py36haa643ae_4 152 | - pysoundfile=0.10.3.post1=pyhd3deb0d_0 153 | - python=3.6.11=h425cb1d_0_cpython 154 | - python_abi=3.6=1_cp36m 155 | - qt=5.12.9=h1f2b2cb_0 156 | - resampy=0.2.2=py_0 157 | - scipy=1.5.2=py36h3a855aa_0 158 | - tornado=6.1=py36h1d69622_0 159 | - tqdm=4.54.1=pyhd8ed1ab_0 160 | - x264=1!152.20180806=h14c3975_0 161 | - xorg-kbproto=1.0.7=h14c3975_1002 162 | - xorg-libice=1.0.10=h516909a_0 163 | - xorg-libsm=1.2.3=h84519dc_1000 164 | - xorg-libx11=1.6.12=h516909a_0 165 | - xorg-libxau=1.0.9=h14c3975_0 166 | - xorg-libxdmcp=1.1.3=h516909a_0 167 | - xorg-libxext=1.3.4=h516909a_0 168 | - xorg-libxrender=0.9.10=h516909a_1002 169 | - xorg-renderproto=0.11.1=h14c3975_1002 170 | - xorg-xextproto=7.3.0=h14c3975_1002 171 | - xorg-xproto=7.0.31=h14c3975_1007 172 | - zstd=1.4.5=h6597ccf_2 173 | - joblib=1.0.0=pyhd3eb1b0_0 174 | - ld_impl_linux-64=2.33.1=h53a641e_7 175 | - libedit=3.1.20191231=h14c3975_1 176 | - libstdcxx-ng=9.1.0=hdf63c60_0 177 | - ncurses=6.2=he6710b0_1 178 | - numpy-base=1.18.5=py36h2f8d375_0 179 | - pip=20.3.1=py36h06a4308_0 180 | - readline=8.0=h7b6447c_0 181 | - scikit-learn=0.21.3=py36h22eb022_0 182 | - 
setuptools=51.0.0=py36h06a4308_2 183 | - sqlite=3.33.0=h62c20be_0 184 | - tk=8.6.10=hbc83047_0 185 | - wheel=0.36.1=pyhd3eb1b0_0 186 | - xz=5.2.5=h7b6447c_0 187 | - zlib=1.2.11=h7b6447c_3 188 | - pip: 189 | - appdirs==1.4.4 190 | - audioread==2.1.9 191 | - decorator==4.4.2 192 | - filelock==3.0.12 193 | - future==0.18.2 194 | - gdown==3.12.2 195 | - jams==0.3.4 196 | - jsonschema==3.2.0 197 | - kapre==0.2.0 198 | - librosa==0.8.0 199 | - mir-eval==0.6 200 | - packaging==20.7 201 | - pooch==1.3.0 202 | - pumpp==0.5.0 203 | - pyqt5==5.12.3 204 | - pyqt5-sip==4.19.18 205 | - pyqtchart==5.12 206 | - pyqtwebengine==5.12.1 207 | - pyrsistent==0.17.3 208 | - pyts==0.11.0 209 | - sortedcontainers==2.3.0 210 | - soundfile==0.10.3.post1 211 | - threadpoolctl==2.1.0 212 | prefix: /home/ma-prof/anaconda3/envs/repr-adv 213 | 214 | -------------------------------------------------------------------------------- /Datasets/AR-SCR/dev_full.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete5.wav D 3 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm100.wav E 4 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add25.wav A 5 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back56.wav B 6 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete65.wav D 7 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue67.wav F 8 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue65.wav F 9 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back41.wav B 10 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back3.wav B 11 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back13.wav B 12 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back28.wav B 13 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm7.wav E 14 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel76.wav C 15 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm75.wav E 16 | 
/work/dodohow1011/AR_SpeechCommands/commands/E_Confirm63.wav E 17 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add40.wav A 18 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm14.wav E 19 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel4.wav C 20 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete94.wav D 21 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel89.wav C 22 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete98.wav D 23 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete24.wav D 24 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel97.wav C 25 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add28.wav A 26 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel1.wav C 27 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add86.wav A 28 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm11.wav E 29 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel49.wav C 30 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm10.wav E 31 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete32.wav D 32 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue51.wav F 33 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back27.wav B 34 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue6.wav F 35 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back32.wav B 36 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back35.wav B 37 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete69.wav D 38 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel83.wav C 39 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm22.wav E 40 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue43.wav F 41 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue25.wav F 42 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add83.wav A 43 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add72.wav A 44 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel21.wav C 45 | /work/dodohow1011/AR_SpeechCommands/numbers/7_100.wav 7 46 | 
/work/dodohow1011/AR_SpeechCommands/numbers/7_89.wav 7 47 | /work/dodohow1011/AR_SpeechCommands/numbers/1_92.wav 1 48 | /work/dodohow1011/AR_SpeechCommands/numbers/1_46.wav 1 49 | /work/dodohow1011/AR_SpeechCommands/numbers/3_29.wav 3 50 | /work/dodohow1011/AR_SpeechCommands/numbers/2_49.wav 2 51 | /work/dodohow1011/AR_SpeechCommands/numbers/6_27.wav 6 52 | /work/dodohow1011/AR_SpeechCommands/numbers/4_95.wav 4 53 | /work/dodohow1011/AR_SpeechCommands/numbers/9_58.wav 9 54 | /work/dodohow1011/AR_SpeechCommands/numbers/7_16.wav 7 55 | /work/dodohow1011/AR_SpeechCommands/numbers/0_68.wav 0 56 | /work/dodohow1011/AR_SpeechCommands/numbers/2_45.wav 2 57 | /work/dodohow1011/AR_SpeechCommands/numbers/4_79.wav 4 58 | /work/dodohow1011/AR_SpeechCommands/numbers/0_31.wav 0 59 | /work/dodohow1011/AR_SpeechCommands/numbers/5_35.wav 5 60 | /work/dodohow1011/AR_SpeechCommands/numbers/3_80.wav 3 61 | /work/dodohow1011/AR_SpeechCommands/numbers/0_64.wav 0 62 | /work/dodohow1011/AR_SpeechCommands/numbers/3_44.wav 3 63 | /work/dodohow1011/AR_SpeechCommands/numbers/4_93.wav 4 64 | /work/dodohow1011/AR_SpeechCommands/numbers/3_72.wav 3 65 | /work/dodohow1011/AR_SpeechCommands/numbers/1_77.wav 1 66 | /work/dodohow1011/AR_SpeechCommands/numbers/0_56.wav 0 67 | /work/dodohow1011/AR_SpeechCommands/numbers/8_76.wav 8 68 | /work/dodohow1011/AR_SpeechCommands/numbers/1_81.wav 1 69 | /work/dodohow1011/AR_SpeechCommands/numbers/1_2.wav 1 70 | /work/dodohow1011/AR_SpeechCommands/numbers/2_43.wav 2 71 | /work/dodohow1011/AR_SpeechCommands/numbers/2_66.wav 2 72 | /work/dodohow1011/AR_SpeechCommands/numbers/9_65.wav 9 73 | /work/dodohow1011/AR_SpeechCommands/numbers/6_49.wav 6 74 | /work/dodohow1011/AR_SpeechCommands/numbers/9_93.wav 9 75 | /work/dodohow1011/AR_SpeechCommands/numbers/1_37.wav 1 76 | /work/dodohow1011/AR_SpeechCommands/numbers/4_17.wav 4 77 | /work/dodohow1011/AR_SpeechCommands/numbers/9_10.wav 9 78 | /work/dodohow1011/AR_SpeechCommands/numbers/7_15.wav 7 79 | 
/work/dodohow1011/AR_SpeechCommands/numbers/1_29.wav 1 80 | /work/dodohow1011/AR_SpeechCommands/numbers/1_6.wav 1 81 | /work/dodohow1011/AR_SpeechCommands/numbers/7_48.wav 7 82 | /work/dodohow1011/AR_SpeechCommands/numbers/8_50.wav 8 83 | /work/dodohow1011/AR_SpeechCommands/numbers/6_3.wav 6 84 | /work/dodohow1011/AR_SpeechCommands/numbers/3_10.wav 3 85 | /work/dodohow1011/AR_SpeechCommands/numbers/6_37.wav 6 86 | /work/dodohow1011/AR_SpeechCommands/numbers/7_11.wav 7 87 | /work/dodohow1011/AR_SpeechCommands/numbers/0_63.wav 0 88 | /work/dodohow1011/AR_SpeechCommands/numbers/3_61.wav 3 89 | /work/dodohow1011/AR_SpeechCommands/numbers/0_45.wav 0 90 | /work/dodohow1011/AR_SpeechCommands/numbers/9_86.wav 9 91 | /work/dodohow1011/AR_SpeechCommands/numbers/1_94.wav 1 92 | /work/dodohow1011/AR_SpeechCommands/numbers/9_68.wav 9 93 | /work/dodohow1011/AR_SpeechCommands/numbers/0_55.wav 0 94 | /work/dodohow1011/AR_SpeechCommands/numbers/7_54.wav 7 95 | /work/dodohow1011/AR_SpeechCommands/numbers/5_30.wav 5 96 | /work/dodohow1011/AR_SpeechCommands/numbers/7_36.wav 7 97 | /work/dodohow1011/AR_SpeechCommands/numbers/5_45.wav 5 98 | /work/dodohow1011/AR_SpeechCommands/numbers/4_70.wav 4 99 | /work/dodohow1011/AR_SpeechCommands/numbers/8_71.wav 8 100 | /work/dodohow1011/AR_SpeechCommands/numbers/5_96.wav 5 101 | /work/dodohow1011/AR_SpeechCommands/numbers/2_39.wav 2 102 | /work/dodohow1011/AR_SpeechCommands/numbers/1_18.wav 1 103 | /work/dodohow1011/AR_SpeechCommands/numbers/1_87.wav 1 104 | /work/dodohow1011/AR_SpeechCommands/numbers/3_92.wav 3 105 | /work/dodohow1011/AR_SpeechCommands/numbers/1_50.wav 1 106 | /work/dodohow1011/AR_SpeechCommands/numbers/4_77.wav 4 107 | /work/dodohow1011/AR_SpeechCommands/numbers/5_7.wav 5 108 | /work/dodohow1011/AR_SpeechCommands/numbers/5_48.wav 5 109 | /work/dodohow1011/AR_SpeechCommands/numbers/1_10.wav 1 110 | /work/dodohow1011/AR_SpeechCommands/numbers/1_20.wav 1 111 | /work/dodohow1011/AR_SpeechCommands/numbers/7_86.wav 7 112 | 
def multi_mapping(prob, source_num, mapping_num, target_num,
                  similarity_mapping=False, label_map=None):
    """Aggregate source-class scores into target-class scores.

    Two strategies are available:

    * Default (``similarity_mapping=False``): the first
      ``mapping_num * target_num`` source classes are taken in order, split
      into ``target_num`` consecutive groups of ``mapping_num`` classes, and
      the scores inside each group are averaged.
    * ``similarity_mapping=True``: the scores of the source classes listed in
      ``label_map[i]`` are summed to give the score of target class ``i``.

    Args:
        prob: 2-D tensor whose last dimension is ``source_num``; it is
            right-multiplied by a ``[source_num, ...]`` matrix.
        source_num: number of classes produced by the source model.
        mapping_num: number of source classes averaged per target class
            (only used by the default strategy).
        target_num: number of target classes.
        similarity_mapping: select the similarity-based strategy.
        label_map: list of lists of source-class indices, one inner list per
            target class. Defaults to the AR-SCR mapping shipped with the
            original code; pass the mapping that matches your dataset.

    Returns:
        Tensor with one row per input row and ``target_num`` columns.

    Raises:
        ValueError: if ``mapping_num * target_num`` exceeds ``source_num``.
    """
    if not similarity_mapping:
        mt = mapping_num * target_num
        if mt > source_num:
            raise ValueError(
                "mapping_num * target_num ({}) must not exceed source_num ({})"
                .format(mt, source_num))
        # [source_num, mt] selector: identity on the first mt source classes,
        # zeros for every remaining source class.
        selector = np.zeros([source_num, mt])
        selector[0:mt, 0:mt] = np.eye(mt)
        # [batch, source_num] x [source_num, mt] -> [batch, mt]
        map_prob = tf.matmul(prob, tf.constant(selector, dtype=tf.float32))
        # Group the mt columns as [target_num, mapping_num] and average each group.
        grouped = tf.reshape(
            map_prob, shape=[tf.shape(map_prob)[0], target_num, mapping_num])
        return tf.reduce_mean(grouped, axis=-1)

    if label_map is None:
        # AR-SCR mapping (default of the original code).
        # NOTE(review): index 23 appears in two groups and 33 in none -
        # possibly a typo in the original table; confirm against the
        # similarity-mapping output before relying on it.
        label_map = [[14, 18], [2, 13, 35], [15, 22, 23], [6, 21], [4, 8],
                     [26, 27], [10, 24], [19, 29], [1, 3], [30, 31],
                     [0, 25, 34], [12, 16, 32], [9, 23], [17, 28], [7, 20],
                     [5, 11]]
        # Alternatives kept from the original source:
        # LT-SCR: [[4,7], [20,24], [16,26,32], [6,13,31], [1,3,30], [9,19], [0,8], [17,18], [10,25], [5,11], [2,23], [21,27,35], [15,22,33], [28,29,34], [12,14]]
        # DM-SCR: [[20,22,28], [4,8], [10,13], [14,23,27], [0,21], [12,18,29], [2,15,33], [6,7,31], [11,25,26], [1,5,30], [17,19,35], [9,16,32], [3,24,34]]

    # weight[s, t] == 1 when source class s contributes to target class t.
    weight = np.zeros([source_num, target_num])
    for target_idx, source_ids in enumerate(label_map):
        for source_idx in source_ids:
            weight[source_idx][target_idx] = 1
    return tf.matmul(prob, tf.constant(weight, dtype=tf.float32))
def layer_output(in_feats, model, ly_name = "batch_normalization_6 ", n = 7):
    """Compute a gradient-weighted activation map for one input sample.

    The score of the top predicted class for sample ``n`` is differentiated
    with respect to the output of layer ``ly_name``; the gradients are
    averaged over axes (0, 1, 2) and used to weight that layer's output.

    Args:
        in_feats: batch of model inputs; only ``in_feats[n:n+1]`` is used.
        model: Keras model that contains a layer named ``ly_name``.
        ly_name: name of the layer to inspect. Surrounding whitespace is
            ignored (the historical default carries a trailing space).
        n: index of the sample inside ``in_feats``.

    Returns:
        ``(heatmap, conv_output)`` where ``heatmap`` is the mean over the last
        axis of the gradient-weighted layer output.
    """
    # Strip so that the historical default (with its trailing space) resolves
    # to the layer's actual name.
    conv_layer = model.get_layer(ly_name.strip())
    heatmap_model = models.Model([model.inputs], [conv_layer.output, model.output])

    with tf.GradientTape() as gtape:
        conv_output, predictions = heatmap_model(in_feats[n:n+1])
        # Score of the class the model is most confident about.
        loss = predictions[:, np.argmax(predictions[0])]
    # The gradient is requested after recording has stopped.
    grads = gtape.gradient(loss, conv_output)
    pooled_grads = K.mean(grads, axis=(0, 1, 2))

    heatmap = tf.reduce_mean(tf.multiply(pooled_grads, conv_output), axis=-1)
    return heatmap, conv_output


def vis_map(heatmap):
    """Clip negatives to zero and scale so the maximum becomes 1.

    The input is never modified. Non-floating inputs (e.g. integer arrays)
    are converted to float64 first so the division is well defined; floating
    inputs keep their dtype. An all-zero map is returned as zeros.
    """
    clipped = np.maximum(heatmap, 0)
    if not np.issubdtype(clipped.dtype, np.floating):
        clipped = clipped.astype(np.float64)
    max_heat = np.max(clipped)
    if max_heat == 0:
        # Avoid 0/0; the result stays all zeros.
        max_heat = 1e-10
    return clipped / max_heat


def to_rgb(heatmap, h_x, w_x):
    """Render ``heatmap[0]`` as a jet-coloured image of size ``w_x`` x ``h_x``.

    Args:
        heatmap: batched heatmap; only the first element is rendered.
        h_x: output image height in pixels.
        w_x: output image width in pixels.

    Returns:
        The image object produced by ``keras.preprocessing.image.array_to_img``.
    """
    # Normalise to [0, 1] and quantise to the 256 colormap indices.
    indices = np.uint8(255 * vis_map((heatmap[0])))

    # RGB (alpha dropped) lookup table of the jet colormap.
    jet = cm.get_cmap("jet")
    jet_colors = jet(np.arange(256))[:, :3]

    # Transpose and flip vertically before the colour lookup.
    jet_heatmap = jet_colors[np.flipud(np.transpose(indices))]

    jet_heatmap = keras.preprocessing.image.array_to_img(jet_heatmap)
    jet_heatmap = jet_heatmap.resize(( w_x, h_x))
    jet_heatmap = keras.preprocessing.image.img_to_array(jet_heatmap)

    # The array -> image round trip is kept from the original code.
    superimposed_img = keras.preprocessing.image.array_to_img(jet_heatmap)
    return superimposed_img
def ts_CAM(model, x_test, y_test):
    """Plot a class-activation map for the first test sample and save it.

    Uses at most the first 100 samples of ``x_test``. The output of the
    second-to-last layer is multiplied by the second-to-last weight array of
    the model, min-max normalised along axis 1, passed through a softmax along
    axis 1, and used to colour the points of sample 0. The figure is written
    to ``cam.pdf`` in the current directory.

    Args:
        model: Keras model.
        x_test: test inputs.
        y_test: labels; ``int(y_test[0])`` selects the class to visualise.
    """
    # Both backend functions are evaluated with learning phase 1, as in the
    # original code.
    get_last_conv = K.function([model.layers[0].input, K.learning_phase()], [model.layers[-2].output])
    last_conv = get_last_conv([x_test[:100], 1])[0]
    get_softmax = keras.backend.function([model.layers[0].input, keras.backend.learning_phase()], [model.layers[-1].output])
    softmax = get_softmax(([x_test[:100], 1]))[0]
    # presumably the kernel of the final layer - confirm against the model
    softmax_weight = model.get_weights()[-2]
    CAM = np.dot(last_conv, softmax_weight)

    k = 0  # index of the sample that is plotted
    cam_min = CAM.min(axis=1, keepdims=True)
    cam_span = CAM.max(axis=1, keepdims=True) - cam_min
    # A constant slice would divide by zero; map it to 0 instead of NaN.
    cam_span = np.where(cam_span == 0, 1, cam_span)
    CAM = (CAM - cam_min) / cam_span
    exp_cam = np.exp(CAM)
    c = exp_cam / np.sum(exp_cam, axis=1, keepdims=True)

    label = y_test[k]
    plt.figure(figsize=(13, 7))
    plt.plot(x_test[k].squeeze())
    plt.scatter(np.arange(len(x_test[k])), x_test[k].squeeze(), cmap='hot_r', c=c[k, :, :, int(label)].squeeze(), s=100)
    plt.title('True label:' + str(label) + ' likelihood of label ' + str(label) + ': ' + str(softmax[k][int(label)]))
    plt.colorbar()
    plt.savefig("cam.pdf")


def plot_acc_loss(x_history, eps, map_num):
    """Plot training/validation accuracy and loss curves and save them.

    Args:
        x_history: object whose ``history`` mapping has the keys
            ``accuracy``, ``val_accuracy``, ``loss`` and ``val_loss``.
        eps: value embedded in the file name (converted with ``str``).
        map_num: value embedded in the file name (converted with ``str``).

    The figure is saved as
    ``results/AR-SpeechCommands_eps<eps>_map<map_num>_.png``; the ``results``
    directory is created when missing.
    """
    plt.style.use("seaborn")
    # Only one figure is created; the original also opened an empty one.
    fig, (ax1, ax2) = plt.subplots(2, 1, figsize=(6, 9))
    history = x_history.history

    ax1.plot(history["val_accuracy"], label="Val. acc")
    ax1.plot(history["accuracy"], label="Training acc")
    ax1.set_ylabel("Accuracy")
    ax1.set_ylim([0, 1])
    ax1.set_xlabel("Epoch")
    ax1.legend()

    ax2.plot(history["val_loss"], label="Val. loss")
    ax2.plot(history["loss"], label="Training loss")
    ax2.set_ylabel("Loss")
    ax2.set_xlabel("Epoch")
    ax2.legend()
    plt.tight_layout()

    os.makedirs("results", exist_ok=True)
    # str() lets callers pass numbers as well as strings.
    plt.savefig("results/AR-SpeechCommands" + "_eps" + str(eps) + "_map" + str(map_num) + "_.png")
def plot_confusion_matrix(cm, classes,
                          normalize=False,
                          title='Confusion matrix',
                          cmap=plt.cm.Blues):
    """Print and plot a confusion matrix.

    Args:
        cm: 2-D array; it is indexed as ``cm[i, j]`` and row ``i`` is labelled
            "True label", column ``j`` "Predicted label".
        classes: tick labels, one per row/column.
        normalize: when true, each row is divided by its sum. Rows whose sum
            is zero are left as zeros instead of producing NaN.
        title: axes title.
        cmap: colormap passed to ``imshow``.
    """
    if normalize:
        row_totals = cm.sum(axis=1)[:, np.newaxis]
        # Skip the division for empty rows; NaN there would also turn the
        # text-colour threshold below into NaN.
        cm = np.divide(cm.astype('float'), row_totals,
                       out=np.zeros(cm.shape, dtype='float'),
                       where=row_totals != 0)
        print("Normalized confusion matrix")
    else:
        print('Confusion matrix, without normalization')

    print(cm)

    fig = plt.figure(figsize=(10,10))
    ax = fig.add_subplot(1, 1, 1)
    im = ax.imshow(cm, interpolation='nearest', cmap=cmap)

    # Colour bar in a slim axis to the right of the matrix.
    divider = make_axes_locatable(ax)
    cax = divider.append_axes("right", size="5%", pad=0.05)
    plt.colorbar(im,cax=cax)

    ax.set_title(title, fontsize='large')

    tick_marks = np.arange(len(classes))
    ax.set_xticks(tick_marks)
    ax.set_yticks(tick_marks)

    ax.set_xticklabels(classes)
    ax.set_yticklabels(classes)
    plt.setp(ax.get_xticklabels(), rotation=45, ha="right", rotation_mode="anchor")

    fmt = '.2f' if normalize else 'd'
    # Cells above half of the maximum get white text, the rest black.
    thresh = cm.max() / 2.
    for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):
        ax.text(j, i, format(cm[i, j], fmt),
                horizontalalignment="center",
                color="white" if cm[i, j] > thresh else "black")

    ax.set_ylabel('True label')
    ax.set_xlabel('Predicted label')
    plt.tight_layout()
# ##################
# Google Speech Commands Dataset V2
# ##################

# Word lists used to build the label tables. Labels are assigned in order.
_GSC_COMMANDS = ('yes', 'no', 'up', 'down', 'left', 'right', 'on', 'off',
                 'stop', 'go')                                  # labels 2..11
_GSC_DIGITS = ('zero', 'one', 'two', 'three', 'four', 'five', 'six', 'seven',
               'eight')                                         # labels 12..20
_GSC_EXTRA_WORDS = ('backward', 'bed', 'bird', 'cat', 'dog', 'follow',
                    'forward', 'happy', 'house', 'learn', 'marvin', 'sheila',
                    'tree', 'visual', 'wow')                    # labels 21..35


def _buildGSCmdCategs(task):
    """Return ``(word -> label dict, number of labels)`` for one task name."""
    # Only the 12-command task keeps silence as its own class (label 1);
    # every other task folds silence/background noise into label 0.
    silence = 1 if task == '12cmd' else 0
    categs = {
        'unknown': 0,
        'silence': silence,
        '_unknown_': 0,
        '_silence_': silence,
        '_background_noise_': silence}

    if task == 'leftright':
        categs['left'] = 1
        categs['right'] = 2
        return categs, 3

    withDigits = task in ('20cmd', '35word')
    words = list(_GSC_COMMANDS)
    if withDigits:
        words += _GSC_DIGITS
    for label, word in enumerate(words, start=2):
        categs[word] = label
    if withDigits:
        # Label 1 is free when silence is folded into 0, so 'nine' uses it.
        categs['nine'] = 1
    if task == '35word':
        for label, word in enumerate(_GSC_EXTRA_WORDS, start=21):
            categs[word] = label
    return categs, max(categs.values()) + 1


# Module-level defaults: the 20-command label table.
GSCmdV2Categs, numGSCmdV2Categs = _buildGSCmdCategs('20cmd')


def PrepareGoogleSpeechCmd(version=2, forceDownload=False, task='20cmd'):
    """
    Prepares the Google Speech commands dataset for use.

    Downloads/extracts the dataset when needed, converts the WAV files to
    numpy files and builds the file lists and label dictionaries.

    Args:
        version: dataset version, 1 or 2.
        forceDownload: passed through to the download helper.
        task: one of '20cmd', '12cmd', 'leftright' or '35word'.

    Returns:
        ``(gscInfo, numCategs)``. ``gscInfo`` has the keys 'train', 'val',
        'test' (files named in ``train/testing_list.txt``) and 'testREAL'
        (files found under ``test/``); each value is a dict with 'files'
        (list of ``.npy`` paths) and 'labels' (path -> integer label).

    Raises:
        Exception: for an unknown ``task`` or ``version``.
    """
    allowedTasks = ['12cmd', 'leftright', '35word', '20cmd']
    if task not in allowedTasks:
        raise Exception('Task must be one of: {}'.format(allowedTasks))

    if version == 2:
        _DownloadGoogleSpeechCmdV2(forceDownload)
        basePath = '/home/kuray107/sd_GSCmdV2'
        if not os.path.isdir(basePath):
            # The downloader stores the data in the working directory; use it
            # when the historical absolute location is absent.
            basePath = 'sd_GSCmdV2'
    elif version == 1:
        _DownloadGoogleSpeechCmdV1(forceDownload)
        basePath = 'sd_GSCmdV1'
    else:
        raise Exception('Version must be 1 or 2')

    categs, numCategs = _buildGSCmdCategs(task)
    trainDir = basePath + '/train/'
    testDir = basePath + '/test/'

    print('Converting test set WAVs to numpy files')
    audioUtils.WAV2Numpy(testDir)
    print('Converting training set WAVs to numpy files')
    audioUtils.WAV2Numpy(trainDir)

    def listedFiles(listName):
        # Paths from a split list, rewritten to the converted .npy files.
        names = pd.read_csv(trainDir + listName,
                            sep=" ", header=None)[0].tolist()
        return [os.path.join(trainDir, f + '.npy')
                for f in names if f.endswith('.wav')]

    def convertedFilesUnder(folder):
        # Same path format as the original (root + '/' + name) so that the
        # set difference below matches the paths built by listedFiles.
        found = []
        for root, dirs, files in os.walk(folder):
            found += [root + '/' + f for f in files if f.endswith('.wav.npy')]
        return found

    # read split from files and all files in folders
    testWAVs = listedFiles('testing_list.txt')
    valWAVs = listedFiles('validation_list.txt')
    allWAVs = convertedFilesUnder(trainDir)
    trainWAVs = list(set(allWAVs) - set(valWAVs) - set(testWAVs))
    testWAVsREAL = convertedFilesUnder(testDir)

    # get categories
    testWAVlabels = [_getFileCategory(f, categs) for f in testWAVs]
    valWAVlabels = [_getFileCategory(f, categs) for f in valWAVs]
    trainWAVlabels = [_getFileCategory(f, categs) for f in trainWAVs]
    testWAVREALlabels = [_getFileCategory(f, categs) for f in testWAVsREAL]

    # background noise should be used for validation as well
    # (only in the 12-class task, where silence has its own label)
    if numCategs == 12:
        silence = categs['silence']
        backNoiseFiles = [f for f, label in zip(trainWAVs, trainWAVlabels)
                          if label == silence]
        valWAVs += backNoiseFiles
        valWAVlabels += [silence] * len(backNoiseFiles)

    # build dictionaries
    testWAVlabelsDict = dict(zip(testWAVs, testWAVlabels))
    valWAVlabelsDict = dict(zip(valWAVs, valWAVlabels))
    trainWAVlabelsDict = dict(zip(trainWAVs, trainWAVlabels))
    testWAVREALlabelsDict = dict(zip(testWAVsREAL, testWAVREALlabels))

    # info dictionary
    gscInfo = {'train': {'files': trainWAVs, 'labels': trainWAVlabelsDict},
               'test': {'files': testWAVs, 'labels': testWAVlabelsDict},
               'val': {'files': valWAVs, 'labels': valWAVlabelsDict},
               'testREAL': {'files': testWAVsREAL,
                            'labels': testWAVREALlabelsDict}}

    print('Done preparing Google Speech commands dataset version {}'.format(version))

    return gscInfo, numCategs
def _getFileCategory(file, catDict):
    """
    Return the integer label of a file based on the folder that contains it.

    The name of the file's parent directory (e.g. ``yes`` for
    ``sd_GSCmdV2/train/yes/abc.wav.npy``) is looked up in ``catDict``;
    names that are not in the dictionary map to 0.
    """
    parentDir, _ = os.path.split(file)
    _, categ = os.path.split(parentDir)
    if categ in catDict:
        return catDict[categ]
    return 0
def _fetchGoogleSpeechCmd(baseDir, releaseTag, version, forceDownload):
    """Download (when needed) and extract one dataset release into baseDir.

    ``baseDir`` must end with a slash. The archives are downloaded when the
    directory is missing or ``forceDownload`` is true; each of ``test/`` and
    ``train/`` is extracted only when that sub-directory does not exist yet.
    """
    if os.path.isdir(baseDir) and not forceDownload:
        print('Google Speech commands dataset version {} already exists. Skipping download.'.format(version))
    else:
        os.makedirs(baseDir, exist_ok=True)
        trainFiles = 'http://download.tensorflow.org/data/speech_commands_{}.tar.gz'.format(releaseTag)
        testFiles = 'http://download.tensorflow.org/data/speech_commands_test_set_{}.tar.gz'.format(releaseTag)
        _downloadFile(testFiles, baseDir + 'test.tar.gz')
        _downloadFile(trainFiles, baseDir + 'train.tar.gz')

    # extract files
    for split in ('test', 'train'):
        if not os.path.isdir(baseDir + split + '/'):
            _extractTar(baseDir + split + '.tar.gz', baseDir + split + '/')


def _DownloadGoogleSpeechCmdV2(forceDownload=False):
    """
    Downloads Google Speech commands dataset version 2

    The historical absolute location is used when it exists; otherwise the
    dataset lives in ``sd_GSCmdV2/`` under the working directory, and an
    existing copy there is reused instead of being downloaded again.
    """
    legacyDir = "/home/kuray107/sd_GSCmdV2/"
    baseDir = legacyDir if os.path.isdir(legacyDir) else "sd_GSCmdV2/"
    _fetchGoogleSpeechCmd(baseDir, 'v0.02', 2, forceDownload)


def _DownloadGoogleSpeechCmdV1(forceDownload=False):
    """
    Downloads Google Speech commands dataset version 1 into ``sd_GSCmdV1/``
    """
    _fetchGoogleSpeechCmd("sd_GSCmdV1/", 'v0.01', 1, forceDownload)
Skipping download.') 286 | else: 287 | if not os.path.exists("sd_GSCmdV1/"): 288 | os.makedirs("sd_GSCmdV1/") 289 | trainFiles = 'http://download.tensorflow.org/data/speech_commands_v0.01.tar.gz' 290 | testFiles = 'http://download.tensorflow.org/data/speech_commands_test_set_v0.01.tar.gz' 291 | _downloadFile(testFiles, 'sd_GSCmdV1/test.tar.gz') 292 | _downloadFile(trainFiles, 'sd_GSCmdV1/train.tar.gz') 293 | 294 | # extract files 295 | if not os.path.isdir("sd_GSCmdV1/test/"): 296 | _extractTar('sd_GSCmdV1/test.tar.gz', 'sd_GSCmdV1/test/') 297 | 298 | if not os.path.isdir("sd_GSCmdV1/train/"): 299 | _extractTar('sd_GSCmdV1/train.tar.gz', 'sd_GSCmdV1/train/') 300 | 301 | ############## 302 | # Utilities 303 | ############## 304 | 305 | 306 | def _downloadFile(url, fName): 307 | # Streaming, so we can iterate over the response. 308 | r = requests.get(url, stream=True) 309 | 310 | # Total size in bytes. 311 | total_size = int(r.headers.get('content-length', 0)) 312 | block_size = 1024 313 | wrote = 0 314 | print('Downloading {} into {}'.format(url, fName)) 315 | with open(fName, 'wb') as f: 316 | for data in tqdm(r.iter_content(block_size), 317 | total=math.ceil(total_size // block_size), 318 | unit='KB', 319 | unit_scale=True): 320 | wrote = wrote + len(data) 321 | f.write(data) 322 | if total_size != 0 and wrote != total_size: 323 | print("ERROR, something went wrong") 324 | 325 | 326 | def _extractTar(fname, folder): 327 | print('Extracting {} into {}'.format(fname, folder)) 328 | if (fname.endswith("tar.gz")): 329 | tar = tarfile.open(fname, "r:gz") 330 | tar.extractall(path=folder) 331 | tar.close() 332 | elif (fname.endswith("tar")): 333 | tar = tarfile.open(fname, "r:") 334 | tar.extractall(path=folder) 335 | tar.close() 336 | -------------------------------------------------------------------------------- /Datasets/DM-SCR/test_full.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (7).wav 02 3 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (6).wav 02 4 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (5).wav 02 5 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (8).wav 05 6 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (3).wav 05 7 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (7).wav 05 8 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (2).wav 08 9 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (5).wav 08 10 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (10).wav 08 11 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (6).wav 11 12 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (5).wav 11 13 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (1).wav 11 14 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (9).wav 19 15 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (8).wav 19 16 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (7).wav 19 17 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (6).wav 14 18 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (4).wav 14 19 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (1).wav 14 20 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (9).wav 17 21 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (1).wav 17 22 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (5).wav 17 23 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (10).wav 01 24 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (9).wav 01 25 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (7).wav 01 26 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (1).wav 09 27 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (4).wav 09 28 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (10).wav 09 29 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (8).wav 04 30 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (6).wav 04 31 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (9).wav 04 32 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (1).wav 07 33 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (8).wav 07 34 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (5).wav 07 35 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (3).wav 13 36 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (5).wav 13 37 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (1).wav 13 38 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (5).wav 16 39 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (10).wav 16 40 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (3).wav 16 41 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (10).wav 03 42 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (2).wav 03 43 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (5).wav 03 44 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (3).wav 06 45 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (10).wav 06 46 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (1).wav 06 47 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (7).wav 12 48 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (9).wav 12 49 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (2).wav 12 50 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (2).wav 15 51 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (10).wav 15 52 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (9).wav 15 53 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (10).wav 10 54 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (2).wav 10 55 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (6).wav 10 56 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (6).wav 18 57 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (3).wav 18 58 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (10).wav 18 59 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (10).wav 02 60 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (7).wav 02 61 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (8).wav 02 62 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (10).wav 05 63 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (7).wav 05 64 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (4).wav 05 65 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (10).wav 08 66 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (6).wav 08 67 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (8).wav 08 68 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (1).wav 11 69 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (8).wav 11 70 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (5).wav 11 71 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (2).wav 19 72 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (10).wav 19 73 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (9).wav 19 74 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (4).wav 14 75 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (5).wav 14 76 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (7).wav 14 77 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (10).wav 17 78 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (1).wav 17 79 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (7).wav 17 80 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (4).wav 01 81 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (10).wav 01 82 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (8).wav 01 83 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (2).wav 09 84 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (3).wav 09 85 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (7).wav 09 86 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (7).wav 04 87 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (6).wav 04 88 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (5).wav 04 89 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (1).wav 07 90 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (6).wav 07 91 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (7).wav 07 92 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (7).wav 13 93 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (4).wav 13 94 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (3).wav 13 95 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (1).wav 16 96 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (6).wav 16 97 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (8).wav 16 98 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (3).wav 03 99 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (10).wav 03 100 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (1).wav 03 101 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (6).wav 06 102 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (1).wav 06 103 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (8).wav 06 104 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (5).wav 12 105 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (7).wav 12 106 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (9).wav 12 107 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (7).wav 15 108 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (10).wav 15 109 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (3).wav 15 110 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (8).wav 10 111 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (9).wav 10 112 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (5).wav 10 113 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (7).wav 18 114 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (9).wav 18 115 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (4).wav 18 116 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (9).wav 02 117 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (8).wav 02 118 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (6).wav 02 119 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (7).wav 05 120 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (9).wav 05 121 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (8).wav 05 122 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (7).wav 08 123 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (4).wav 08 124 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (6).wav 08 125 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (10).wav 11 126 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (7).wav 11 127 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (9).wav 11 128 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (8).wav 19 129 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (5).wav 19 130 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (4).wav 19 131 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (2).wav 14 132 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (8).wav 14 133 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (4).wav 14 134 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (4).wav 17 135 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (7).wav 17 136 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (1).wav 17 137 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (10).wav 01 138 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (1).wav 01 139 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (7).wav 01 140 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (6).wav 09 141 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (3).wav 09 142 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (9).wav 09 143 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (6).wav 04 144 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (3).wav 04 145 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (2).wav 04 146 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (3).wav 07 147 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (10).wav 07 148 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (9).wav 07 149 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (5).wav 13 150 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (6).wav 13 151 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (8).wav 13 152 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (6).wav 16 153 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (2).wav 16 154 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (9).wav 16 155 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (2).wav 03 156 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 
(7).wav 03 157 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (6).wav 03 158 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (9).wav 06 159 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (8).wav 06 160 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (5).wav 06 161 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (3).wav 12 162 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (10).wav 12 163 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (2).wav 12 164 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (1).wav 15 165 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (4).wav 15 166 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (3).wav 15 167 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (1).wav 10 168 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (9).wav 10 169 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (8).wav 10 170 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (3).wav 18 171 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (2).wav 18 172 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (4).wav 18 173 | -------------------------------------------------------------------------------- /Datasets/AR-SCR/test_full.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete82.wav D 3 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back66.wav B 4 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel55.wav C 5 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add51.wav A 6 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add44.wav A 7 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel90.wav C 8 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel88.wav C 9 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add61.wav A 10 | 
/work/dodohow1011/AR_SpeechCommands/commands/F_Continue78.wav F 11 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add91.wav A 12 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete44.wav D 13 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel78.wav C 14 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue68.wav F 15 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add21.wav A 16 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel65.wav C 17 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add60.wav A 18 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back78.wav B 19 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add56.wav A 20 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm29.wav E 21 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add81.wav A 22 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back84.wav B 23 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel60.wav C 24 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm69.wav E 25 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue32.wav F 26 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel99.wav C 27 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete9.wav D 28 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back4.wav B 29 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back57.wav B 30 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue72.wav F 31 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue92.wav F 32 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add73.wav A 33 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete28.wav D 34 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel10.wav C 35 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm39.wav E 36 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete91.wav D 37 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue23.wav F 38 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue55.wav F 39 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel30.wav C 40 | 
/work/dodohow1011/AR_SpeechCommands/commands/A_Add11.wav A 41 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete1.wav D 42 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back31.wav B 43 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue85.wav F 44 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back51.wav B 45 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete74.wav D 46 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue63.wav F 47 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete30.wav D 48 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back1.wav B 49 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm44.wav E 50 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel45.wav C 51 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete56.wav D 52 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back65.wav B 53 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm23.wav E 54 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add93.wav A 55 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete53.wav D 56 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm20.wav E 57 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add29.wav A 58 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue70.wav F 59 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm43.wav E 60 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel64.wav C 61 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete95.wav D 62 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back71.wav B 63 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete29.wav D 64 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back43.wav B 65 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm76.wav E 66 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue73.wav F 67 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add53.wav A 68 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm6.wav E 69 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add97.wav A 70 | 
/work/dodohow1011/AR_SpeechCommands/commands/F_Continue12.wav F 71 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm99.wav E 72 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm46.wav E 73 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm5.wav E 74 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete22.wav D 75 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete66.wav D 76 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete54.wav D 77 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel75.wav C 78 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel74.wav C 79 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue53.wav F 80 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back7.wav B 81 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue86.wav F 82 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add82.wav A 83 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete43.wav D 84 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel11.wav C 85 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back54.wav B 86 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm82.wav E 87 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm92.wav E 88 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue19.wav F 89 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add71.wav A 90 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add9.wav A 91 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete4.wav D 92 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm70.wav E 93 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm26.wav E 94 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel92.wav C 95 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue38.wav F 96 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add12.wav A 97 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete61.wav D 98 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add70.wav A 99 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue2.wav F 
100 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel66.wav C 101 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm1.wav E 102 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue69.wav F 103 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add54.wav A 104 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete15.wav D 105 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm98.wav E 106 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm32.wav E 107 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm68.wav E 108 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete26.wav D 109 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back36.wav B 110 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete96.wav D 111 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue97.wav F 112 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back67.wav B 113 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete20.wav D 114 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel32.wav C 115 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue14.wav F 116 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete68.wav D 117 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel22.wav C 118 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back61.wav B 119 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete49.wav D 120 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back58.wav B 121 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel35.wav C 122 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue91.wav F 123 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel77.wav C 124 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm79.wav E 125 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue15.wav F 126 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel86.wav C 127 | /work/dodohow1011/AR_SpeechCommands/commands/C_Cancel26.wav C 128 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back55.wav B 129 | 
/work/dodohow1011/AR_SpeechCommands/commands/C_Cancel39.wav C 130 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm90.wav E 131 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm31.wav E 132 | /work/dodohow1011/AR_SpeechCommands/commands/F_Continue30.wav F 133 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add87.wav A 134 | /work/dodohow1011/AR_SpeechCommands/commands/D_Delete47.wav D 135 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add30.wav A 136 | /work/dodohow1011/AR_SpeechCommands/commands/B_Back39.wav B 137 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm53.wav E 138 | /work/dodohow1011/AR_SpeechCommands/commands/A_Add31.wav A 139 | /work/dodohow1011/AR_SpeechCommands/commands/E_Confirm89.wav E 140 | /work/dodohow1011/AR_SpeechCommands/numbers/8_81.wav 8 141 | /work/dodohow1011/AR_SpeechCommands/numbers/9_43.wav 9 142 | /work/dodohow1011/AR_SpeechCommands/numbers/8_22.wav 8 143 | /work/dodohow1011/AR_SpeechCommands/numbers/1_74.wav 1 144 | /work/dodohow1011/AR_SpeechCommands/numbers/9_25.wav 9 145 | /work/dodohow1011/AR_SpeechCommands/numbers/1_97.wav 1 146 | /work/dodohow1011/AR_SpeechCommands/numbers/7_70.wav 7 147 | /work/dodohow1011/AR_SpeechCommands/numbers/3_51.wav 3 148 | /work/dodohow1011/AR_SpeechCommands/numbers/8_9.wav 8 149 | /work/dodohow1011/AR_SpeechCommands/numbers/6_78.wav 6 150 | /work/dodohow1011/AR_SpeechCommands/numbers/2_59.wav 2 151 | /work/dodohow1011/AR_SpeechCommands/numbers/9_76.wav 9 152 | /work/dodohow1011/AR_SpeechCommands/numbers/6_31.wav 6 153 | /work/dodohow1011/AR_SpeechCommands/numbers/4_8.wav 4 154 | /work/dodohow1011/AR_SpeechCommands/numbers/3_15.wav 3 155 | /work/dodohow1011/AR_SpeechCommands/numbers/2_40.wav 2 156 | /work/dodohow1011/AR_SpeechCommands/numbers/1_60.wav 1 157 | /work/dodohow1011/AR_SpeechCommands/numbers/6_82.wav 6 158 | /work/dodohow1011/AR_SpeechCommands/numbers/2_63.wav 2 159 | /work/dodohow1011/AR_SpeechCommands/numbers/5_100.wav 5 160 | 
/work/dodohow1011/AR_SpeechCommands/numbers/5_20.wav 5 161 | /work/dodohow1011/AR_SpeechCommands/numbers/1_70.wav 1 162 | /work/dodohow1011/AR_SpeechCommands/numbers/0_78.wav 0 163 | /work/dodohow1011/AR_SpeechCommands/numbers/3_76.wav 3 164 | /work/dodohow1011/AR_SpeechCommands/numbers/3_99.wav 3 165 | /work/dodohow1011/AR_SpeechCommands/numbers/3_7.wav 3 166 | /work/dodohow1011/AR_SpeechCommands/numbers/7_77.wav 7 167 | /work/dodohow1011/AR_SpeechCommands/numbers/7_30.wav 7 168 | /work/dodohow1011/AR_SpeechCommands/numbers/0_82.wav 0 169 | /work/dodohow1011/AR_SpeechCommands/numbers/6_1.wav 6 170 | /work/dodohow1011/AR_SpeechCommands/numbers/4_14.wav 4 171 | /work/dodohow1011/AR_SpeechCommands/numbers/6_4.wav 6 172 | /work/dodohow1011/AR_SpeechCommands/numbers/3_62.wav 3 173 | /work/dodohow1011/AR_SpeechCommands/numbers/7_40.wav 7 174 | /work/dodohow1011/AR_SpeechCommands/numbers/6_89.wav 6 175 | /work/dodohow1011/AR_SpeechCommands/numbers/4_24.wav 4 176 | /work/dodohow1011/AR_SpeechCommands/numbers/0_74.wav 0 177 | /work/dodohow1011/AR_SpeechCommands/numbers/8_25.wav 8 178 | /work/dodohow1011/AR_SpeechCommands/numbers/7_91.wav 7 179 | /work/dodohow1011/AR_SpeechCommands/numbers/4_75.wav 4 180 | /work/dodohow1011/AR_SpeechCommands/numbers/5_78.wav 5 181 | /work/dodohow1011/AR_SpeechCommands/numbers/3_54.wav 3 182 | /work/dodohow1011/AR_SpeechCommands/numbers/1_30.wav 1 183 | /work/dodohow1011/AR_SpeechCommands/numbers/7_96.wav 7 184 | /work/dodohow1011/AR_SpeechCommands/numbers/6_52.wav 6 185 | /work/dodohow1011/AR_SpeechCommands/numbers/4_57.wav 4 186 | /work/dodohow1011/AR_SpeechCommands/numbers/7_9.wav 7 187 | /work/dodohow1011/AR_SpeechCommands/numbers/9_50.wav 9 188 | /work/dodohow1011/AR_SpeechCommands/numbers/5_31.wav 5 189 | /work/dodohow1011/AR_SpeechCommands/numbers/4_10.wav 4 190 | /work/dodohow1011/AR_SpeechCommands/numbers/9_32.wav 9 191 | /work/dodohow1011/AR_SpeechCommands/numbers/1_40.wav 1 192 | 
/work/dodohow1011/AR_SpeechCommands/numbers/0_60.wav 0 193 | /work/dodohow1011/AR_SpeechCommands/numbers/8_11.wav 8 194 | /work/dodohow1011/AR_SpeechCommands/numbers/6_16.wav 6 195 | /work/dodohow1011/AR_SpeechCommands/numbers/5_82.wav 5 196 | /work/dodohow1011/AR_SpeechCommands/numbers/1_5.wav 1 197 | /work/dodohow1011/AR_SpeechCommands/numbers/9_14.wav 9 198 | /work/dodohow1011/AR_SpeechCommands/numbers/7_19.wav 7 199 | /work/dodohow1011/AR_SpeechCommands/numbers/7_88.wav 7 200 | /work/dodohow1011/AR_SpeechCommands/numbers/1_91.wav 1 201 | /work/dodohow1011/AR_SpeechCommands/numbers/5_23.wav 5 202 | /work/dodohow1011/AR_SpeechCommands/numbers/8_21.wav 8 203 | /work/dodohow1011/AR_SpeechCommands/numbers/1_73.wav 1 204 | /work/dodohow1011/AR_SpeechCommands/numbers/8_90.wav 8 205 | /work/dodohow1011/AR_SpeechCommands/numbers/8_44.wav 8 206 | /work/dodohow1011/AR_SpeechCommands/numbers/2_76.wav 2 207 | /work/dodohow1011/AR_SpeechCommands/numbers/5_74.wav 5 208 | /work/dodohow1011/AR_SpeechCommands/numbers/3_79.wav 3 209 | /work/dodohow1011/AR_SpeechCommands/numbers/1_55.wav 1 210 | /work/dodohow1011/AR_SpeechCommands/numbers/6_77.wav 6 211 | /work/dodohow1011/AR_SpeechCommands/numbers/2_4.wav 2 212 | /work/dodohow1011/AR_SpeechCommands/numbers/3_32.wav 3 213 | /work/dodohow1011/AR_SpeechCommands/numbers/2_7.wav 2 214 | /work/dodohow1011/AR_SpeechCommands/numbers/9_98.wav 9 215 | /work/dodohow1011/AR_SpeechCommands/numbers/0_16.wav 0 216 | /work/dodohow1011/AR_SpeechCommands/numbers/3_14.wav 3 217 | /work/dodohow1011/AR_SpeechCommands/numbers/1_88.wav 1 218 | /work/dodohow1011/AR_SpeechCommands/numbers/9_39.wav 9 219 | /work/dodohow1011/AR_SpeechCommands/numbers/4_86.wav 4 220 | /work/dodohow1011/AR_SpeechCommands/numbers/3_42.wav 3 221 | /work/dodohow1011/AR_SpeechCommands/numbers/0_67.wav 0 222 | /work/dodohow1011/AR_SpeechCommands/numbers/7_43.wav 7 223 | /work/dodohow1011/AR_SpeechCommands/numbers/3_24.wav 3 224 | 
/work/dodohow1011/AR_SpeechCommands/numbers/6_22.wav 6 225 | /work/dodohow1011/AR_SpeechCommands/numbers/7_25.wav 7 226 | /work/dodohow1011/AR_SpeechCommands/numbers/1_3.wav 1 227 | /work/dodohow1011/AR_SpeechCommands/numbers/8_100.wav 8 228 | /work/dodohow1011/AR_SpeechCommands/numbers/3_75.wav 3 229 | /work/dodohow1011/AR_SpeechCommands/numbers/2_95.wav 2 230 | /work/dodohow1011/AR_SpeechCommands/numbers/1_51.wav 1 231 | /work/dodohow1011/AR_SpeechCommands/numbers/3_98.wav 3 232 | /work/dodohow1011/AR_SpeechCommands/numbers/0_30.wav 0 233 | /work/dodohow1011/AR_SpeechCommands/numbers/7_76.wav 7 234 | /work/dodohow1011/AR_SpeechCommands/numbers/5_52.wav 5 235 | /work/dodohow1011/AR_SpeechCommands/numbers/3_57.wav 3 236 | /work/dodohow1011/AR_SpeechCommands/numbers/9_53.wav 9 237 | /work/dodohow1011/AR_SpeechCommands/numbers/7_58.wav 7 238 | /work/dodohow1011/AR_SpeechCommands/numbers/2_18.wav 2 239 | /work/dodohow1011/AR_SpeechCommands/numbers/8_14.wav 8 240 | /work/dodohow1011/AR_SpeechCommands/numbers/6_19.wav 6 241 | /work/dodohow1011/AR_SpeechCommands/numbers/4_64.wav 4 242 | /work/dodohow1011/AR_SpeechCommands/numbers/2_28.wav 2 243 | /work/dodohow1011/AR_SpeechCommands/numbers/1_48.wav 1 244 | /work/dodohow1011/AR_SpeechCommands/numbers/8_65.wav 8 245 | /work/dodohow1011/AR_SpeechCommands/numbers/7_21.wav 7 246 | /work/dodohow1011/AR_SpeechCommands/numbers/4_46.wav 4 247 | /work/dodohow1011/AR_SpeechCommands/numbers/8_24.wav 8 248 | /work/dodohow1011/AR_SpeechCommands/numbers/7_90.wav 7 249 | /work/dodohow1011/AR_SpeechCommands/numbers/5_2.wav 5 250 | /work/dodohow1011/AR_SpeechCommands/numbers/8_47.wav 8 251 | /work/dodohow1011/AR_SpeechCommands/numbers/1_99.wav 1 252 | /work/dodohow1011/AR_SpeechCommands/numbers/7_72.wav 7 253 | /work/dodohow1011/AR_SpeechCommands/numbers/5_77.wav 5 254 | /work/dodohow1011/AR_SpeechCommands/numbers/7_95.wav 7 255 | /work/dodohow1011/AR_SpeechCommands/numbers/4_56.wav 4 256 | 
/work/dodohow1011/AR_SpeechCommands/numbers/2_32.wav 2 257 | /work/dodohow1011/AR_SpeechCommands/numbers/9_78.wav 9 258 | /work/dodohow1011/AR_SpeechCommands/numbers/3_35.wav 3 259 | /work/dodohow1011/AR_SpeechCommands/numbers/8_57.wav 8 260 | /work/dodohow1011/AR_SpeechCommands/numbers/4_38.wav 4 261 | /work/dodohow1011/AR_SpeechCommands/numbers/0_19.wav 0 262 | /work/dodohow1011/AR_SpeechCommands/numbers/1_7.wav 1 263 | /work/dodohow1011/AR_SpeechCommands/numbers/9_31.wav 9 264 | /work/dodohow1011/AR_SpeechCommands/numbers/5_81.wav 5 265 | /work/dodohow1011/AR_SpeechCommands/numbers/1_21.wav 1 266 | /work/dodohow1011/AR_SpeechCommands/numbers/5_63.wav 5 267 | /work/dodohow1011/AR_SpeechCommands/numbers/0_29.wav 0 268 | /work/dodohow1011/AR_SpeechCommands/numbers/1_44.wav 1 269 | /work/dodohow1011/AR_SpeechCommands/numbers/8_61.wav 8 270 | /work/dodohow1011/AR_SpeechCommands/numbers/5_22.wav 5 271 | /work/dodohow1011/AR_SpeechCommands/numbers/8_20.wav 8 272 | /work/dodohow1011/AR_SpeechCommands/numbers/6_25.wav 6 273 | /work/dodohow1011/AR_SpeechCommands/numbers/6_94.wav 6 274 | /work/dodohow1011/AR_SpeechCommands/numbers/9_92.wav 9 275 | /work/dodohow1011/AR_SpeechCommands/numbers/5_73.wav 5 276 | /work/dodohow1011/AR_SpeechCommands/numbers/1_54.wav 1 277 | /work/dodohow1011/AR_SpeechCommands/numbers/6_76.wav 6 278 | /work/dodohow1011/AR_SpeechCommands/numbers/7_79.wav 7 279 | /work/dodohow1011/AR_SpeechCommands/numbers/5_55.wav 5 280 | /work/dodohow1011/AR_SpeechCommands/numbers/3_31.wav 3 281 | /work/dodohow1011/AR_SpeechCommands/numbers/6_58.wav 6 282 | /work/dodohow1011/AR_SpeechCommands/numbers/7_32.wav 7 283 | /work/dodohow1011/AR_SpeechCommands/numbers/5_3.wav 5 284 | /work/dodohow1011/AR_SpeechCommands/numbers/3_13.wav 3 285 | /work/dodohow1011/AR_SpeechCommands/numbers/6_11.wav 6 286 | /work/dodohow1011/AR_SpeechCommands/numbers/6_80.wav 6 287 | /work/dodohow1011/AR_SpeechCommands/numbers/4_85.wav 4 288 | 
/work/dodohow1011/AR_SpeechCommands/numbers/3_41.wav 3 289 | /work/dodohow1011/AR_SpeechCommands/numbers/2_20.wav 2 290 | /work/dodohow1011/AR_SpeechCommands/numbers/1_69.wav 1 291 | /work/dodohow1011/AR_SpeechCommands/numbers/3_23.wav 3 292 | /work/dodohow1011/AR_SpeechCommands/numbers/9_89.wav 9 293 | /work/dodohow1011/AR_SpeechCommands/numbers/1_8.wav 1 294 | /work/dodohow1011/AR_SpeechCommands/numbers/3_46.wav 3 295 | /work/dodohow1011/AR_SpeechCommands/numbers/6_44.wav 6 296 | /work/dodohow1011/AR_SpeechCommands/numbers/0_58.wav 0 297 | /work/dodohow1011/AR_SpeechCommands/numbers/8_78.wav 8 298 | /work/dodohow1011/AR_SpeechCommands/numbers/4_59.wav 4 299 | /work/dodohow1011/AR_SpeechCommands/numbers/7_57.wav 7 300 | /work/dodohow1011/AR_SpeechCommands/numbers/0_80.wav 0 301 | /work/dodohow1011/AR_SpeechCommands/numbers/6_36.wav 6 302 | /work/dodohow1011/AR_SpeechCommands/numbers/0_4.wav 0 303 | /work/dodohow1011/AR_SpeechCommands/numbers/7_39.wav 7 304 | /work/dodohow1011/AR_SpeechCommands/numbers/7_10.wav 7 305 | /work/dodohow1011/AR_SpeechCommands/numbers/4_81.wav 4 306 | /work/dodohow1011/AR_SpeechCommands/numbers/0_62.wav 0 307 | /work/dodohow1011/AR_SpeechCommands/numbers/6_18.wav 6 308 | /work/dodohow1011/AR_SpeechCommands/numbers/5_84.wav 5 309 | /work/dodohow1011/AR_SpeechCommands/numbers/4_40.wav 4 310 | /work/dodohow1011/AR_SpeechCommands/numbers/2_68.wav 2 311 | /work/dodohow1011/AR_SpeechCommands/numbers/1_24.wav 1 312 | /work/dodohow1011/AR_SpeechCommands/numbers/0_90.wav 0 313 | /work/dodohow1011/AR_SpeechCommands/numbers/7_61.wav 7 314 | /work/dodohow1011/AR_SpeechCommands/numbers/9_67.wav 9 315 | /work/dodohow1011/AR_SpeechCommands/numbers/5_94.wav 5 316 | /work/dodohow1011/AR_SpeechCommands/numbers/1_75.wav 1 317 | /work/dodohow1011/AR_SpeechCommands/numbers/0_95.wav 0 318 | /work/dodohow1011/AR_SpeechCommands/numbers/1_98.wav 1 319 | /work/dodohow1011/AR_SpeechCommands/numbers/0_54.wav 0 320 | 
/work/dodohow1011/AR_SpeechCommands/numbers/3_52.wav 3 321 | /work/dodohow1011/AR_SpeechCommands/numbers/1_57.wav 1 322 | /work/dodohow1011/AR_SpeechCommands/numbers/6_50.wav 6 323 | /work/dodohow1011/AR_SpeechCommands/numbers/4_55.wav 4 324 | /work/dodohow1011/AR_SpeechCommands/numbers/0_36.wav 0 325 | /work/dodohow1011/AR_SpeechCommands/numbers/8_4.wav 8 326 | /work/dodohow1011/AR_SpeechCommands/numbers/8_97.wav 8 327 | /work/dodohow1011/AR_SpeechCommands/numbers/8_7.wav 8 328 | /work/dodohow1011/AR_SpeechCommands/numbers/0_18.wav 0 329 | /work/dodohow1011/AR_SpeechCommands/numbers/9_30.wav 9 330 | /work/dodohow1011/AR_SpeechCommands/numbers/2_82.wav 2 331 | /work/dodohow1011/AR_SpeechCommands/numbers/0_87.wav 0 332 | /work/dodohow1011/AR_SpeechCommands/numbers/6_14.wav 6 333 | /work/dodohow1011/AR_SpeechCommands/numbers/2_41.wav 2 334 | /work/dodohow1011/AR_SpeechCommands/numbers/4_6.wav 4 335 | /work/dodohow1011/AR_SpeechCommands/numbers/6_83.wav 6 336 | /work/dodohow1011/AR_SpeechCommands/numbers/6_42.wav 6 337 | /work/dodohow1011/AR_SpeechCommands/numbers/3_67.wav 3 338 | /work/dodohow1011/AR_SpeechCommands/numbers/0_28.wav 0 339 | /work/dodohow1011/AR_SpeechCommands/numbers/5_21.wav 5 340 | /work/dodohow1011/AR_SpeechCommands/numbers/6_24.wav 6 341 | /work/dodohow1011/AR_SpeechCommands/numbers/4_29.wav 4 342 | /work/dodohow1011/AR_SpeechCommands/numbers/5_90.wav 5 343 | /work/dodohow1011/AR_SpeechCommands/numbers/3_49.wav 3 344 | /work/dodohow1011/AR_SpeechCommands/numbers/0_5.wav 0 345 | /work/dodohow1011/AR_SpeechCommands/numbers/0_8.wav 0 346 | /work/dodohow1011/AR_SpeechCommands/numbers/0_50.wav 0 347 | /work/dodohow1011/AR_SpeechCommands/numbers/6_98.wav 6 348 | /work/dodohow1011/AR_SpeechCommands/numbers/3_30.wav 3 349 | /work/dodohow1011/AR_SpeechCommands/numbers/1_35.wav 1 350 | /work/dodohow1011/AR_SpeechCommands/numbers/3_5.wav 3 351 | /work/dodohow1011/AR_SpeechCommands/numbers/2_38.wav 2 352 | /work/dodohow1011/AR_SpeechCommands/numbers/7_31.wav 
7 353 | /work/dodohow1011/AR_SpeechCommands/numbers/0_42.wav 0 354 | /work/dodohow1011/AR_SpeechCommands/numbers/5_87.wav 5 355 | /work/dodohow1011/AR_SpeechCommands/numbers/0_24.wav 0 356 | /work/dodohow1011/AR_SpeechCommands/numbers/7_41.wav 7 357 | /work/dodohow1011/AR_SpeechCommands/numbers/6_61.wav 6 358 | /work/dodohow1011/AR_SpeechCommands/numbers/0_93.wav 0 359 | /work/dodohow1011/AR_SpeechCommands/numbers/4_94.wav 4 360 | /work/dodohow1011/AR_SpeechCommands/numbers/4_48.wav 4 361 | /work/dodohow1011/AR_SpeechCommands/numbers/8_26.wav 8 362 | /work/dodohow1011/AR_SpeechCommands/numbers/7_46.wav 7 363 | /work/dodohow1011/AR_SpeechCommands/numbers/6_71.wav 6 364 | /work/dodohow1011/AR_SpeechCommands/numbers/3_55.wav 3 365 | /work/dodohow1011/AR_SpeechCommands/numbers/7_56.wav 7 366 | /work/dodohow1011/AR_SpeechCommands/numbers/1_13.wav 1 367 | /work/dodohow1011/AR_SpeechCommands/numbers/0_9.wav 0 368 | /work/dodohow1011/AR_SpeechCommands/numbers/2_16.wav 2 369 | /work/dodohow1011/AR_SpeechCommands/numbers/3_100.wav 3 370 | /work/dodohow1011/AR_SpeechCommands/numbers/9_33.wav 9 371 | /work/dodohow1011/AR_SpeechCommands/numbers/2_85.wav 2 372 | -------------------------------------------------------------------------------- /Datasets/LT-SCR/noise_full.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/55.wav silence 3 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/136.wav silence 4 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/139.wav silence 5 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/201.wav silence 6 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/204.wav silence 7 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/162.wav silence 8 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/34.wav silence 9 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/156.wav silence 10 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/159.wav silence 11 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/221.wav silence 12 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/30.wav silence 13 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/224.wav silence 14 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/227.wav silence 15 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/13.wav silence 16 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/182.wav silence 17 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/37.wav silence 18 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/179.wav silence 19 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/241.wav silence 20 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/244.wav silence 21 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/247.wav silence 22 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/100.wav silence 23 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/16.wav silence 24 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/199.wav silence 25 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/261.wav silence 26 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/81.wav silence 27 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/264.wav silence 28 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/267.wav silence 29 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/120.wav silence 30 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/88.wav silence 31 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/123.wav silence 32 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/19.wav silence 33 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/60.wav silence 34 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/117.wav silence 35 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/84.wav silence 36 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/284.wav silence 37 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/287.wav silence 38 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/140.wav silence 39 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/67.wav silence 40 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/143.wav silence 41 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/63.wav silence 42 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/202.wav silence 43 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/205.wav silence 44 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/160.wav silence 45 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/208.wav silence 46 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/163.wav silence 47 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/42.wav silence 48 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/166.wav silence 49 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/222.wav silence 50 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/66.wav silence 51 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/225.wav silence 52 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/180.wav silence 53 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/228.wav silence 54 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/49.wav silence 55 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/183.wav silence 56 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/1.wav silence 57 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/186.wav silence 58 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/45.wav silence 59 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/245.wav silence 60 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/248.wav silence 61 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/101.wav silence 62 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/24.wav silence 63 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/104.wav silence 64 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/20.wav silence 65 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/265.wav silence 66 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/268.wav silence 67 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/121.wav silence 68 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/124.wav silence 69 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/96.wav silence 70 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/27.wav silence 71 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/291.wav silence 72 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/127.wav silence 73 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/285.wav silence 74 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/92.wav silence 75 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/288.wav silence 76 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/141.wav silence 77 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/144.wav silence 78 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/3.wav silence 79 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/99.wav silence 80 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/147.wav silence 81 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/71.wav silence 82 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/206.wav silence 83 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/161.wav silence 84 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/209.wav silence 85 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/164.wav silence 86 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/78.wav silence 87 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/167.wav silence 88 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/50.wav silence 89 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/74.wav silence 90 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/226.wav silence 91 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/181.wav silence 92 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/229.wav silence 93 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/57.wav silence 94 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/184.wav silence 95 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/187.wav silence 96 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/53.wav silence 97 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/252.wav silence 98 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/246.wav silence 99 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/249.wav silence 100 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/102.wav silence 101 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/105.wav silence 102 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/32.wav silence 103 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/5.wav silence 104 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/272.wav silence 105 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/108.wav silence 106 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/56.wav silence 107 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/269.wav silence 108 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/122.wav silence 109 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/39.wav silence 110 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/125.wav silence 111 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/292.wav silence 112 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/35.wav silence 113 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/128.wav silence 114 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/289.wav silence 115 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/142.wav silence 116 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/145.wav silence 117 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/14.wav silence 118 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/148.wav silence 119 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/210.wav silence 120 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/38.wav silence 121 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/213.wav silence 122 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/10.wav silence 123 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/207.wav silence 124 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/165.wav silence 125 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/86.wav silence 126 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/168.wav silence 127 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/230.wav silence 128 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/17.wav silence 129 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/7.wav silence 130 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/233.wav silence 131 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/82.wav silence 132 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/191.wav silence 133 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/185.wav silence 134 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/188.wav silence 135 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/250.wav silence 136 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/89.wav silence 137 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/253.wav silence 138 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/61.wav silence 139 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/256.wav silence 140 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/85.wav silence 141 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/103.wav silence 142 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/270.wav silence 143 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/106.wav silence 144 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/68.wav silence 145 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/40.wav silence 146 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/273.wav silence 147 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/109.wav silence 148 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/276.wav silence 149 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/64.wav silence 150 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/290.wav silence 151 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/126.wav silence 152 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/9.wav silence 153 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/129.wav silence 154 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/43.wav silence 155 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/152.wav silence 156 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/146.wav silence 157 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/22.wav silence 158 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/149.wav silence 159 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/211.wav silence 160 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/214.wav silence 161 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/46.wav silence 162 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/217.wav silence 163 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/172.wav silence 164 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/29.wav silence 165 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/169.wav silence 166 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/231.wav silence 167 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/25.wav silence 168 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/234.wav silence 169 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/237.wav silence 170 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/90.wav silence 171 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/21.wav silence 172 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/192.wav silence 173 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/189.wav silence 174 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/251.wav silence 175 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/254.wav silence 176 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/97.wav silence 177 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/28.wav silence 178 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/257.wav silence 179 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/110.wav silence 180 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/93.wav silence 181 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/113.wav silence 182 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/271.wav silence 183 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/107.wav silence 184 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/76.wav silence 185 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/274.wav silence 186 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/277.wav silence 187 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/72.wav silence 188 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/130.wav silence 189 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/133.wav silence 190 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/79.wav silence 191 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/51.wav silence 192 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/150.wav silence 193 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/75.wav silence 194 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/153.wav silence 195 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/58.wav silence 196 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/212.wav silence 197 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/215.wav silence 198 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/54.wav silence 199 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/170.wav silence 200 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/218.wav silence 201 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/173.wav silence 202 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/176.wav silence 203 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/232.wav silence 204 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/235.wav silence 205 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/33.wav silence 206 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/190.wav silence 207 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/238.wav silence 208 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/193.wav silence 209 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/196.wav silence 210 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/12.wav silence 211 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/255.wav silence 212 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/36.wav silence 213 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/258.wav silence 214 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/111.wav silence 215 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/114.wav silence 216 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/2.wav silence 217 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/281.wav silence 218 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/275.wav silence 219 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/15.wav silence 220 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/278.wav silence 221 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/131.wav silence 222 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/80.wav silence 223 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/11.wav silence 224 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/134.wav silence 225 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/137.wav silence 226 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/87.wav silence 227 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/18.wav silence 228 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/151.wav silence 229 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/83.wav silence 230 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/154.wav silence 231 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/157.wav silence 232 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/216.wav silence 233 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/171.wav silence 234 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/219.wav silence 235 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/62.wav silence 236 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/174.wav silence 237 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/177.wav silence 238 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/4.wav silence 239 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/242.wav silence 240 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/236.wav silence 241 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/69.wav silence 242 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/41.wav silence 243 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/239.wav silence 244 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/194.wav silence 245 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/65.wav silence 246 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/197.wav silence 247 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/262.wav silence 248 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/48.wav silence 249 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/259.wav silence 250 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/44.wav silence 251 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/112.wav silence 252 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/115.wav silence 253 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/282.wav silence 254 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/118.wav silence 255 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/23.wav silence 256 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/279.wav silence 257 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/132.wav silence 258 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/47.wav silence 259 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/135.wav silence 260 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/6.wav silence 261 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/138.wav silence 262 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/200.wav silence 263 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/203.wav silence 264 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/95.wav silence 265 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/26.wav silence 266 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/155.wav silence 267 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/91.wav silence 268 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/158.wav silence 269 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/220.wav silence 270 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/223.wav silence 271 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/98.wav silence 272 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/70.wav silence 273 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/175.wav silence 274 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/178.wav silence 275 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/240.wav silence 276 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/94.wav silence 277 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/243.wav silence 278 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/77.wav silence 279 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/195.wav silence 280 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/73.wav silence 281 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/198.wav silence 282 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/260.wav silence 283 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/8.wav silence 284 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/263.wav silence 285 | 
/work/dodohow1011/lt_speech_commands/dataset/_background_noise_/266.wav silence 286 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/52.wav silence 287 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/280.wav silence 288 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/116.wav silence 289 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/283.wav silence 290 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/119.wav silence 291 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/286.wav silence 292 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/59.wav silence 293 | /work/dodohow1011/lt_speech_commands/dataset/_background_noise_/31.wav silence 294 | -------------------------------------------------------------------------------- /Datasets/LT-SCR/train_limit20.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | /work/dodohow1011/lt_speech_commands/dataset/du/27_nohash_0.wav unknown 3 | /work/dodohow1011/lt_speech_commands/dataset/du/24_nohash_0.wav unknown 4 | /work/dodohow1011/lt_speech_commands/dataset/du/25_nohash_0.wav unknown 5 | /work/dodohow1011/lt_speech_commands/dataset/du/23_nohash_0.wav unknown 6 | /work/dodohow1011/lt_speech_commands/dataset/du/08_nohash_0.wav unknown 7 | /work/dodohow1011/lt_speech_commands/dataset/du/03_nohash_0.wav unknown 8 | /work/dodohow1011/lt_speech_commands/dataset/du/29_nohash_0.wav unknown 9 | /work/dodohow1011/lt_speech_commands/dataset/du/30_nohash_0.wav unknown 10 | /work/dodohow1011/lt_speech_commands/dataset/du/06_nohash_0.wav unknown 11 | /work/dodohow1011/lt_speech_commands/dataset/du/18_nohash_0.wav unknown 12 | /work/dodohow1011/lt_speech_commands/dataset/du/05_nohash_0.wav unknown 13 | /work/dodohow1011/lt_speech_commands/dataset/du/26_nohash_0.wav unknown 14 | /work/dodohow1011/lt_speech_commands/dataset/du/09_nohash_0.wav unknown 15 | 
/work/dodohow1011/lt_speech_commands/dataset/du/21_nohash_0.wav unknown 16 | /work/dodohow1011/lt_speech_commands/dataset/du/01_nohash_0.wav unknown 17 | /work/dodohow1011/lt_speech_commands/dataset/du/19_nohash_0.wav unknown 18 | /work/dodohow1011/lt_speech_commands/dataset/du/10_nohash_0.wav unknown 19 | /work/dodohow1011/lt_speech_commands/dataset/du/16_nohash_0.wav unknown 20 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/27_nohash_0.wav išjunk 21 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/24_nohash_0.wav išjunk 22 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/23_nohash_0.wav išjunk 23 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/08_nohash_0.wav išjunk 24 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/03_nohash_0.wav išjunk 25 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/29_nohash_0.wav išjunk 26 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/30_nohash_0.wav išjunk 27 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/06_nohash_0.wav išjunk 28 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/18_nohash_0.wav išjunk 29 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/05_nohash_0.wav išjunk 30 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/26_nohash_0.wav išjunk 31 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/09_nohash_0.wav išjunk 32 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/21_nohash_0.wav išjunk 33 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/01_nohash_0.wav išjunk 34 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/19_nohash_0.wav išjunk 35 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/10_nohash_0.wav išjunk 36 | /work/dodohow1011/lt_speech_commands/dataset/išjunk/16_nohash_0.wav išjunk 37 | /work/dodohow1011/lt_speech_commands/dataset/keturi/27_nohash_0.wav unknown 38 | /work/dodohow1011/lt_speech_commands/dataset/keturi/24_nohash_0.wav unknown 39 | /work/dodohow1011/lt_speech_commands/dataset/keturi/25_nohash_0.wav unknown 40 | 
/work/dodohow1011/lt_speech_commands/dataset/keturi/23_nohash_0.wav unknown 41 | /work/dodohow1011/lt_speech_commands/dataset/keturi/08_nohash_0.wav unknown 42 | /work/dodohow1011/lt_speech_commands/dataset/keturi/03_nohash_0.wav unknown 43 | /work/dodohow1011/lt_speech_commands/dataset/keturi/29_nohash_0.wav unknown 44 | /work/dodohow1011/lt_speech_commands/dataset/keturi/30_nohash_0.wav unknown 45 | /work/dodohow1011/lt_speech_commands/dataset/keturi/06_nohash_0.wav unknown 46 | /work/dodohow1011/lt_speech_commands/dataset/keturi/18_nohash_0.wav unknown 47 | /work/dodohow1011/lt_speech_commands/dataset/keturi/05_nohash_0.wav unknown 48 | /work/dodohow1011/lt_speech_commands/dataset/keturi/26_nohash_0.wav unknown 49 | /work/dodohow1011/lt_speech_commands/dataset/keturi/21_nohash_0.wav unknown 50 | /work/dodohow1011/lt_speech_commands/dataset/keturi/01_nohash_0.wav unknown 51 | /work/dodohow1011/lt_speech_commands/dataset/keturi/19_nohash_0.wav unknown 52 | /work/dodohow1011/lt_speech_commands/dataset/keturi/10_nohash_0.wav unknown 53 | /work/dodohow1011/lt_speech_commands/dataset/keturi/16_nohash_0.wav unknown 54 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/23_nohash_0.wav į_dešinę 55 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/08_nohash_0.wav į_dešinę 56 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/03_nohash_0.wav į_dešinę 57 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/29_nohash_0.wav į_dešinę 58 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/30_nohash_0.wav į_dešinę 59 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/06_nohash_0.wav į_dešinę 60 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/18_nohash_0.wav į_dešinę 61 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/09_nohash_0.wav į_dešinę 62 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/19_nohash_0.wav į_dešinę 63 | /work/dodohow1011/lt_speech_commands/dataset/į_dešinę/16_nohash_0.wav į_dešinę 64 | 
/work/dodohow1011/lt_speech_commands/dataset/ačiū/27_nohash_0.wav ačiū 65 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/24_nohash_0.wav ačiū 66 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/25_nohash_0.wav ačiū 67 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/23_nohash_0.wav ačiū 68 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/08_nohash_0.wav ačiū 69 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/03_nohash_0.wav ačiū 70 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/29_nohash_0.wav ačiū 71 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/30_nohash_0.wav ačiū 72 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/06_nohash_0.wav ačiū 73 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/18_nohash_0.wav ačiū 74 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/05_nohash_0.wav ačiū 75 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/26_nohash_0.wav ačiū 76 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/09_nohash_0.wav ačiū 77 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/21_nohash_0.wav ačiū 78 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/01_nohash_0.wav ačiū 79 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/19_nohash_0.wav ačiū 80 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/10_nohash_0.wav ačiū 81 | /work/dodohow1011/lt_speech_commands/dataset/ačiū/16_nohash_0.wav ačiū 82 | /work/dodohow1011/lt_speech_commands/dataset/taip/27_nohash_0.wav unknown 83 | /work/dodohow1011/lt_speech_commands/dataset/taip/24_nohash_0.wav unknown 84 | /work/dodohow1011/lt_speech_commands/dataset/taip/25_nohash_0.wav unknown 85 | /work/dodohow1011/lt_speech_commands/dataset/taip/23_nohash_0.wav unknown 86 | /work/dodohow1011/lt_speech_commands/dataset/taip/08_nohash_0.wav unknown 87 | /work/dodohow1011/lt_speech_commands/dataset/taip/03_nohash_0.wav unknown 88 | /work/dodohow1011/lt_speech_commands/dataset/taip/29_nohash_0.wav unknown 89 | /work/dodohow1011/lt_speech_commands/dataset/taip/30_nohash_0.wav unknown 90 | 
/work/dodohow1011/lt_speech_commands/dataset/taip/06_nohash_0.wav unknown 91 | /work/dodohow1011/lt_speech_commands/dataset/taip/18_nohash_0.wav unknown 92 | /work/dodohow1011/lt_speech_commands/dataset/taip/05_nohash_0.wav unknown 93 | /work/dodohow1011/lt_speech_commands/dataset/taip/26_nohash_0.wav unknown 94 | /work/dodohow1011/lt_speech_commands/dataset/taip/09_nohash_0.wav unknown 95 | /work/dodohow1011/lt_speech_commands/dataset/taip/21_nohash_0.wav unknown 96 | /work/dodohow1011/lt_speech_commands/dataset/taip/01_nohash_0.wav unknown 97 | /work/dodohow1011/lt_speech_commands/dataset/taip/19_nohash_0.wav unknown 98 | /work/dodohow1011/lt_speech_commands/dataset/taip/10_nohash_0.wav unknown 99 | /work/dodohow1011/lt_speech_commands/dataset/taip/16_nohash_0.wav unknown 100 | /work/dodohow1011/lt_speech_commands/dataset/labas/27_nohash_0.wav labas 101 | /work/dodohow1011/lt_speech_commands/dataset/labas/24_nohash_0.wav labas 102 | /work/dodohow1011/lt_speech_commands/dataset/labas/25_nohash_0.wav labas 103 | /work/dodohow1011/lt_speech_commands/dataset/labas/23_nohash_0.wav labas 104 | /work/dodohow1011/lt_speech_commands/dataset/labas/08_nohash_0.wav labas 105 | /work/dodohow1011/lt_speech_commands/dataset/labas/03_nohash_0.wav labas 106 | /work/dodohow1011/lt_speech_commands/dataset/labas/29_nohash_0.wav labas 107 | /work/dodohow1011/lt_speech_commands/dataset/labas/30_nohash_0.wav labas 108 | /work/dodohow1011/lt_speech_commands/dataset/labas/06_nohash_0.wav labas 109 | /work/dodohow1011/lt_speech_commands/dataset/labas/18_nohash_0.wav labas 110 | /work/dodohow1011/lt_speech_commands/dataset/labas/05_nohash_0.wav labas 111 | /work/dodohow1011/lt_speech_commands/dataset/labas/26_nohash_0.wav labas 112 | /work/dodohow1011/lt_speech_commands/dataset/labas/09_nohash_0.wav labas 113 | /work/dodohow1011/lt_speech_commands/dataset/labas/21_nohash_0.wav labas 114 | /work/dodohow1011/lt_speech_commands/dataset/labas/01_nohash_0.wav labas 115 | 
/work/dodohow1011/lt_speech_commands/dataset/labas/19_nohash_0.wav labas 116 | /work/dodohow1011/lt_speech_commands/dataset/labas/10_nohash_0.wav labas 117 | /work/dodohow1011/lt_speech_commands/dataset/labas/16_nohash_0.wav labas 118 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/27_nohash_0.wav į_viršų 119 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/24_nohash_0.wav į_viršų 120 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/25_nohash_0.wav į_viršų 121 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/23_nohash_0.wav į_viršų 122 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/08_nohash_0.wav į_viršų 123 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/29_nohash_0.wav į_viršų 124 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/30_nohash_0.wav į_viršų 125 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/06_nohash_0.wav į_viršų 126 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/18_nohash_0.wav į_viršų 127 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/05_nohash_0.wav į_viršų 128 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/26_nohash_0.wav į_viršų 129 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/09_nohash_0.wav į_viršų 130 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/01_nohash_0.wav į_viršų 131 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/19_nohash_0.wav į_viršų 132 | /work/dodohow1011/lt_speech_commands/dataset/į_viršų/16_nohash_0.wav į_viršų 133 | /work/dodohow1011/lt_speech_commands/dataset/stop/27_nohash_0.wav stop 134 | /work/dodohow1011/lt_speech_commands/dataset/stop/24_nohash_0.wav stop 135 | /work/dodohow1011/lt_speech_commands/dataset/stop/25_nohash_0.wav stop 136 | /work/dodohow1011/lt_speech_commands/dataset/stop/23_nohash_0.wav stop 137 | /work/dodohow1011/lt_speech_commands/dataset/stop/08_nohash_0.wav stop 138 | /work/dodohow1011/lt_speech_commands/dataset/stop/03_nohash_0.wav stop 139 | 
/work/dodohow1011/lt_speech_commands/dataset/stop/29_nohash_0.wav stop 140 | /work/dodohow1011/lt_speech_commands/dataset/stop/30_nohash_0.wav stop 141 | /work/dodohow1011/lt_speech_commands/dataset/stop/06_nohash_0.wav stop 142 | /work/dodohow1011/lt_speech_commands/dataset/stop/18_nohash_0.wav stop 143 | /work/dodohow1011/lt_speech_commands/dataset/stop/05_nohash_0.wav stop 144 | /work/dodohow1011/lt_speech_commands/dataset/stop/26_nohash_0.wav stop 145 | /work/dodohow1011/lt_speech_commands/dataset/stop/09_nohash_0.wav stop 146 | /work/dodohow1011/lt_speech_commands/dataset/stop/21_nohash_0.wav stop 147 | /work/dodohow1011/lt_speech_commands/dataset/stop/01_nohash_0.wav stop 148 | /work/dodohow1011/lt_speech_commands/dataset/stop/19_nohash_0.wav stop 149 | /work/dodohow1011/lt_speech_commands/dataset/stop/10_nohash_0.wav stop 150 | /work/dodohow1011/lt_speech_commands/dataset/stop/16_nohash_0.wav stop 151 | /work/dodohow1011/lt_speech_commands/dataset/vienas/27_nohash_0.wav unknown 152 | /work/dodohow1011/lt_speech_commands/dataset/vienas/24_nohash_0.wav unknown 153 | /work/dodohow1011/lt_speech_commands/dataset/vienas/23_nohash_0.wav unknown 154 | /work/dodohow1011/lt_speech_commands/dataset/vienas/08_nohash_0.wav unknown 155 | /work/dodohow1011/lt_speech_commands/dataset/vienas/03_nohash_0.wav unknown 156 | /work/dodohow1011/lt_speech_commands/dataset/vienas/29_nohash_0.wav unknown 157 | /work/dodohow1011/lt_speech_commands/dataset/vienas/30_nohash_0.wav unknown 158 | /work/dodohow1011/lt_speech_commands/dataset/vienas/06_nohash_0.wav unknown 159 | /work/dodohow1011/lt_speech_commands/dataset/vienas/18_nohash_0.wav unknown 160 | /work/dodohow1011/lt_speech_commands/dataset/vienas/05_nohash_0.wav unknown 161 | /work/dodohow1011/lt_speech_commands/dataset/vienas/26_nohash_0.wav unknown 162 | /work/dodohow1011/lt_speech_commands/dataset/vienas/09_nohash_0.wav unknown 163 | /work/dodohow1011/lt_speech_commands/dataset/vienas/21_nohash_0.wav unknown 164 | 
/work/dodohow1011/lt_speech_commands/dataset/vienas/01_nohash_0.wav unknown 165 | /work/dodohow1011/lt_speech_commands/dataset/vienas/19_nohash_0.wav unknown 166 | /work/dodohow1011/lt_speech_commands/dataset/vienas/16_nohash_0.wav unknown 167 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/24_nohash_0.wav į_apačią 168 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/23_nohash_0.wav į_apačią 169 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/08_nohash_0.wav į_apačią 170 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/03_nohash_0.wav į_apačią 171 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/29_nohash_0.wav į_apačią 172 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/06_nohash_0.wav į_apačią 173 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/18_nohash_0.wav į_apačią 174 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/05_nohash_0.wav į_apačią 175 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/26_nohash_0.wav į_apačią 176 | /work/dodohow1011/lt_speech_commands/dataset/į_apačią/19_nohash_0.wav į_apačią 177 | /work/dodohow1011/lt_speech_commands/dataset/ne/27_nohash_0.wav ne 178 | /work/dodohow1011/lt_speech_commands/dataset/ne/24_nohash_0.wav ne 179 | /work/dodohow1011/lt_speech_commands/dataset/ne/25_nohash_0.wav ne 180 | /work/dodohow1011/lt_speech_commands/dataset/ne/23_nohash_0.wav ne 181 | /work/dodohow1011/lt_speech_commands/dataset/ne/08_nohash_0.wav ne 182 | /work/dodohow1011/lt_speech_commands/dataset/ne/03_nohash_0.wav ne 183 | /work/dodohow1011/lt_speech_commands/dataset/ne/29_nohash_0.wav ne 184 | /work/dodohow1011/lt_speech_commands/dataset/ne/30_nohash_0.wav ne 185 | /work/dodohow1011/lt_speech_commands/dataset/ne/06_nohash_0.wav ne 186 | /work/dodohow1011/lt_speech_commands/dataset/ne/18_nohash_0.wav ne 187 | /work/dodohow1011/lt_speech_commands/dataset/ne/05_nohash_0.wav ne 188 | /work/dodohow1011/lt_speech_commands/dataset/ne/26_nohash_0.wav ne 189 | 
/work/dodohow1011/lt_speech_commands/dataset/ne/09_nohash_0.wav ne 190 | /work/dodohow1011/lt_speech_commands/dataset/ne/21_nohash_0.wav ne 191 | /work/dodohow1011/lt_speech_commands/dataset/ne/01_nohash_0.wav ne 192 | /work/dodohow1011/lt_speech_commands/dataset/ne/19_nohash_0.wav ne 193 | /work/dodohow1011/lt_speech_commands/dataset/ne/10_nohash_0.wav ne 194 | /work/dodohow1011/lt_speech_commands/dataset/ne/16_nohash_0.wav ne 195 | /work/dodohow1011/lt_speech_commands/dataset/nulis/27_nohash_0.wav unknown 196 | /work/dodohow1011/lt_speech_commands/dataset/nulis/24_nohash_0.wav unknown 197 | /work/dodohow1011/lt_speech_commands/dataset/nulis/25_nohash_0.wav unknown 198 | /work/dodohow1011/lt_speech_commands/dataset/nulis/23_nohash_0.wav unknown 199 | /work/dodohow1011/lt_speech_commands/dataset/nulis/03_nohash_0.wav unknown 200 | /work/dodohow1011/lt_speech_commands/dataset/nulis/29_nohash_0.wav unknown 201 | /work/dodohow1011/lt_speech_commands/dataset/nulis/30_nohash_0.wav unknown 202 | /work/dodohow1011/lt_speech_commands/dataset/nulis/06_nohash_0.wav unknown 203 | /work/dodohow1011/lt_speech_commands/dataset/nulis/18_nohash_0.wav unknown 204 | /work/dodohow1011/lt_speech_commands/dataset/nulis/05_nohash_0.wav unknown 205 | /work/dodohow1011/lt_speech_commands/dataset/nulis/26_nohash_0.wav unknown 206 | /work/dodohow1011/lt_speech_commands/dataset/nulis/09_nohash_0.wav unknown 207 | /work/dodohow1011/lt_speech_commands/dataset/nulis/21_nohash_0.wav unknown 208 | /work/dodohow1011/lt_speech_commands/dataset/nulis/01_nohash_0.wav unknown 209 | /work/dodohow1011/lt_speech_commands/dataset/nulis/19_nohash_0.wav unknown 210 | /work/dodohow1011/lt_speech_commands/dataset/nulis/10_nohash_0.wav unknown 211 | /work/dodohow1011/lt_speech_commands/dataset/nulis/16_nohash_0.wav unknown 212 | /work/dodohow1011/lt_speech_commands/dataset/penki/27_nohash_0.wav unknown 213 | /work/dodohow1011/lt_speech_commands/dataset/penki/24_nohash_0.wav unknown 214 | 
/work/dodohow1011/lt_speech_commands/dataset/penki/25_nohash_0.wav unknown 215 | /work/dodohow1011/lt_speech_commands/dataset/penki/23_nohash_0.wav unknown 216 | /work/dodohow1011/lt_speech_commands/dataset/penki/08_nohash_0.wav unknown 217 | /work/dodohow1011/lt_speech_commands/dataset/penki/03_nohash_0.wav unknown 218 | /work/dodohow1011/lt_speech_commands/dataset/penki/29_nohash_0.wav unknown 219 | /work/dodohow1011/lt_speech_commands/dataset/penki/30_nohash_0.wav unknown 220 | /work/dodohow1011/lt_speech_commands/dataset/penki/06_nohash_0.wav unknown 221 | /work/dodohow1011/lt_speech_commands/dataset/penki/18_nohash_0.wav unknown 222 | /work/dodohow1011/lt_speech_commands/dataset/penki/05_nohash_0.wav unknown 223 | /work/dodohow1011/lt_speech_commands/dataset/penki/26_nohash_0.wav unknown 224 | /work/dodohow1011/lt_speech_commands/dataset/penki/09_nohash_0.wav unknown 225 | /work/dodohow1011/lt_speech_commands/dataset/penki/21_nohash_0.wav unknown 226 | /work/dodohow1011/lt_speech_commands/dataset/penki/01_nohash_0.wav unknown 227 | /work/dodohow1011/lt_speech_commands/dataset/penki/19_nohash_0.wav unknown 228 | /work/dodohow1011/lt_speech_commands/dataset/penki/10_nohash_0.wav unknown 229 | /work/dodohow1011/lt_speech_commands/dataset/penki/16_nohash_0.wav unknown 230 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/27_nohash_0.wav pauzė 231 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/24_nohash_0.wav pauzė 232 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/25_nohash_0.wav pauzė 233 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/23_nohash_0.wav pauzė 234 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/08_nohash_0.wav pauzė 235 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/03_nohash_0.wav pauzė 236 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/29_nohash_0.wav pauzė 237 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/30_nohash_0.wav pauzė 238 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/06_nohash_0.wav 
pauzė 239 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/18_nohash_0.wav pauzė 240 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/05_nohash_0.wav pauzė 241 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/26_nohash_0.wav pauzė 242 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/09_nohash_0.wav pauzė 243 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/21_nohash_0.wav pauzė 244 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/01_nohash_0.wav pauzė 245 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/19_nohash_0.wav pauzė 246 | /work/dodohow1011/lt_speech_commands/dataset/pauzė/16_nohash_0.wav pauzė 247 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/27_nohash_0.wav į_kairę 248 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/25_nohash_0.wav į_kairę 249 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/23_nohash_0.wav į_kairę 250 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/08_nohash_0.wav į_kairę 251 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/03_nohash_0.wav į_kairę 252 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/29_nohash_0.wav į_kairę 253 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/30_nohash_0.wav į_kairę 254 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/06_nohash_0.wav į_kairę 255 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/18_nohash_0.wav į_kairę 256 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/05_nohash_0.wav į_kairę 257 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/26_nohash_0.wav į_kairę 258 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/09_nohash_0.wav į_kairę 259 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/21_nohash_0.wav į_kairę 260 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/19_nohash_0.wav į_kairę 261 | /work/dodohow1011/lt_speech_commands/dataset/į_kairę/16_nohash_0.wav į_kairę 262 | /work/dodohow1011/lt_speech_commands/dataset/iki/27_nohash_0.wav iki 263 | 
/work/dodohow1011/lt_speech_commands/dataset/iki/24_nohash_0.wav iki 264 | /work/dodohow1011/lt_speech_commands/dataset/iki/25_nohash_0.wav iki 265 | /work/dodohow1011/lt_speech_commands/dataset/iki/23_nohash_0.wav iki 266 | /work/dodohow1011/lt_speech_commands/dataset/iki/08_nohash_0.wav iki 267 | /work/dodohow1011/lt_speech_commands/dataset/iki/03_nohash_0.wav iki 268 | /work/dodohow1011/lt_speech_commands/dataset/iki/29_nohash_0.wav iki 269 | /work/dodohow1011/lt_speech_commands/dataset/iki/30_nohash_0.wav iki 270 | /work/dodohow1011/lt_speech_commands/dataset/iki/06_nohash_0.wav iki 271 | /work/dodohow1011/lt_speech_commands/dataset/iki/18_nohash_0.wav iki 272 | /work/dodohow1011/lt_speech_commands/dataset/iki/05_nohash_0.wav iki 273 | /work/dodohow1011/lt_speech_commands/dataset/iki/26_nohash_0.wav iki 274 | /work/dodohow1011/lt_speech_commands/dataset/iki/09_nohash_0.wav iki 275 | /work/dodohow1011/lt_speech_commands/dataset/iki/21_nohash_0.wav iki 276 | /work/dodohow1011/lt_speech_commands/dataset/iki/19_nohash_0.wav iki 277 | /work/dodohow1011/lt_speech_commands/dataset/iki/10_nohash_0.wav iki 278 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/27_nohash_0.wav įjunk 279 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/24_nohash_0.wav įjunk 280 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/25_nohash_0.wav įjunk 281 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/23_nohash_0.wav įjunk 282 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/08_nohash_0.wav įjunk 283 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/03_nohash_0.wav įjunk 284 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/29_nohash_0.wav įjunk 285 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/30_nohash_0.wav įjunk 286 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/06_nohash_0.wav įjunk 287 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/18_nohash_0.wav įjunk 288 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/05_nohash_0.wav įjunk 289 | 
/work/dodohow1011/lt_speech_commands/dataset/įjunk/26_nohash_0.wav įjunk 290 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/09_nohash_0.wav įjunk 291 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/21_nohash_0.wav įjunk 292 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/01_nohash_0.wav įjunk 293 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/19_nohash_0.wav įjunk 294 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/10_nohash_0.wav įjunk 295 | /work/dodohow1011/lt_speech_commands/dataset/įjunk/16_nohash_0.wav įjunk 296 | /work/dodohow1011/lt_speech_commands/dataset/startas/27_nohash_0.wav startas 297 | /work/dodohow1011/lt_speech_commands/dataset/startas/24_nohash_0.wav startas 298 | /work/dodohow1011/lt_speech_commands/dataset/startas/23_nohash_0.wav startas 299 | /work/dodohow1011/lt_speech_commands/dataset/startas/08_nohash_0.wav startas 300 | /work/dodohow1011/lt_speech_commands/dataset/startas/03_nohash_0.wav startas 301 | /work/dodohow1011/lt_speech_commands/dataset/startas/29_nohash_0.wav startas 302 | /work/dodohow1011/lt_speech_commands/dataset/startas/30_nohash_0.wav startas 303 | /work/dodohow1011/lt_speech_commands/dataset/startas/06_nohash_0.wav startas 304 | /work/dodohow1011/lt_speech_commands/dataset/startas/18_nohash_0.wav startas 305 | /work/dodohow1011/lt_speech_commands/dataset/startas/26_nohash_0.wav startas 306 | /work/dodohow1011/lt_speech_commands/dataset/startas/21_nohash_0.wav startas 307 | /work/dodohow1011/lt_speech_commands/dataset/startas/01_nohash_0.wav startas 308 | /work/dodohow1011/lt_speech_commands/dataset/startas/19_nohash_0.wav startas 309 | /work/dodohow1011/lt_speech_commands/dataset/startas/16_nohash_0.wav startas 310 | /work/dodohow1011/lt_speech_commands/dataset/trys/27_nohash_0.wav unknown 311 | /work/dodohow1011/lt_speech_commands/dataset/trys/24_nohash_0.wav unknown 312 | /work/dodohow1011/lt_speech_commands/dataset/trys/25_nohash_0.wav unknown 313 | 
/work/dodohow1011/lt_speech_commands/dataset/trys/23_nohash_0.wav unknown 314 | /work/dodohow1011/lt_speech_commands/dataset/trys/08_nohash_0.wav unknown 315 | /work/dodohow1011/lt_speech_commands/dataset/trys/03_nohash_0.wav unknown 316 | /work/dodohow1011/lt_speech_commands/dataset/trys/29_nohash_0.wav unknown 317 | /work/dodohow1011/lt_speech_commands/dataset/trys/30_nohash_0.wav unknown 318 | /work/dodohow1011/lt_speech_commands/dataset/trys/06_nohash_0.wav unknown 319 | /work/dodohow1011/lt_speech_commands/dataset/trys/18_nohash_0.wav unknown 320 | /work/dodohow1011/lt_speech_commands/dataset/trys/05_nohash_0.wav unknown 321 | /work/dodohow1011/lt_speech_commands/dataset/trys/26_nohash_0.wav unknown 322 | /work/dodohow1011/lt_speech_commands/dataset/trys/09_nohash_0.wav unknown 323 | /work/dodohow1011/lt_speech_commands/dataset/trys/21_nohash_0.wav unknown 324 | /work/dodohow1011/lt_speech_commands/dataset/trys/01_nohash_0.wav unknown 325 | /work/dodohow1011/lt_speech_commands/dataset/trys/19_nohash_0.wav unknown 326 | /work/dodohow1011/lt_speech_commands/dataset/trys/10_nohash_0.wav unknown 327 | /work/dodohow1011/lt_speech_commands/dataset/trys/16_nohash_0.wav unknown 328 | -------------------------------------------------------------------------------- /Datasets/DM-SCR/train_full.csv: -------------------------------------------------------------------------------- 1 | filename label 2 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (4).wav 02 3 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (8).wav 02 4 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (3).wav 02 5 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (9).wav 02 6 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (10).wav 02 7 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (2).wav 02 8 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/02/D_SPK1_c2 (1).wav 02 9 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (4).wav 05 10 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (10).wav 05 11 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (9).wav 05 12 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (1).wav 05 13 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (5).wav 05 14 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (6).wav 05 15 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/05/D_SPK1_c5 (2).wav 05 16 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (1).wav 08 17 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (4).wav 08 18 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (3).wav 08 19 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (9).wav 08 20 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (7).wav 08 21 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (6).wav 08 22 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/08/D_SPK1_c8 (8).wav 08 23 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (3).wav 11 24 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (9).wav 11 25 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (4).wav 11 26 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (7).wav 11 27 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (10).wav 11 28 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (2).wav 11 29 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/11/D_SPK1_c11 (8).wav 11 30 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (10).wav 19 31 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (4).wav 19 32 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (1).wav 19 33 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (3).wav 19 34 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (5).wav 19 35 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (2).wav 19 36 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/19/D_SPK1_c19 (6).wav 19 37 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (2).wav 14 38 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (5).wav 14 39 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (3).wav 14 40 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (9).wav 14 41 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (7).wav 14 42 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (8).wav 14 43 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/14/D_SPK1_c14 (10).wav 14 44 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (8).wav 17 45 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (2).wav 17 46 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (3).wav 17 47 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (4).wav 17 48 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (6).wav 17 49 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (10).wav 17 50 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/17/D_SPK1_c17 (7).wav 17 51 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (2).wav 01 52 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (8).wav 01 53 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (4).wav 01 54 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (6).wav 01 55 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (5).wav 01 56 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (1).wav 01 57 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/01/D_SPK1_c (3).wav 01 58 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (2).wav 09 59 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (5).wav 09 60 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (8).wav 09 61 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (3).wav 09 62 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (9).wav 09 63 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (6).wav 09 64 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/09/D_SPK1_c9 (7).wav 09 65 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (3).wav 04 66 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (2).wav 04 67 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (1).wav 04 68 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (4).wav 04 69 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (5).wav 04 70 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (10).wav 04 71 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/04/D_SPK1_c4 (7).wav 04 72 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (4).wav 07 73 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (10).wav 07 74 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (9).wav 07 75 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (3).wav 07 76 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (7).wav 07 77 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (2).wav 07 78 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/07/D_SPK1_c7 (6).wav 07 79 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (10).wav 13 80 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (7).wav 13 81 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (9).wav 13 82 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (8).wav 13 83 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (2).wav 13 84 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (4).wav 13 85 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/13/D_SPK1_c13 (6).wav 13 86 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (2).wav 16 87 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (4).wav 16 88 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (6).wav 16 89 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (8).wav 16 90 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (1).wav 16 91 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (7).wav 16 92 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/16/D_SPK1_c16 (9).wav 16 93 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (6).wav 03 94 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (8).wav 03 95 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (3).wav 03 96 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (9).wav 03 97 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (7).wav 03 98 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (4).wav 03 99 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/03/D_SPK1_c3 (1).wav 03 100 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (9).wav 06 101 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (4).wav 06 102 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (2).wav 06 103 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (5).wav 06 104 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (7).wav 06 105 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (6).wav 06 106 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/06/D_SPK1_c6 (8).wav 06 107 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (8).wav 12 108 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (10).wav 12 109 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (1).wav 12 110 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (3).wav 12 111 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (4).wav 12 112 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (6).wav 12 
113 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/12/D_SPK1_c12 (5).wav 12 114 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (3).wav 15 115 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (6).wav 15 116 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (4).wav 15 117 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (7).wav 15 118 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (8).wav 15 119 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (5).wav 15 120 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/15/D_SPK1_c15 (1).wav 15 121 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (7).wav 10 122 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (5).wav 10 123 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (4).wav 10 124 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (9).wav 10 125 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (3).wav 10 126 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (1).wav 10 127 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/10/D_SPK1_c10 (8).wav 10 128 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (8).wav 18 129 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (2).wav 18 130 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (7).wav 18 131 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (5).wav 18 132 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (4).wav 18 133 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (9).wav 18 134 | /work/dodohow1011/dysarthria_zh_command/D_SPK1/18/D_SPK1_c18 (1).wav 18 135 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (9).wav 02 136 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (2).wav 02 137 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (5).wav 02 138 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (4).wav 02 139 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (3).wav 02 140 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (1).wav 02 141 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/02/D_SPK2_c2 (6).wav 02 142 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (1).wav 05 143 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (2).wav 05 144 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (6).wav 05 145 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (5).wav 05 146 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (3).wav 05 147 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (8).wav 05 148 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/05/D_SPK2_c5 (9).wav 05 149 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (9).wav 08 150 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (4).wav 08 151 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (2).wav 08 152 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (1).wav 08 153 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (7).wav 08 154 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (5).wav 08 155 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/08/D_SPK2_c8 (3).wav 08 156 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (10).wav 11 157 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (2).wav 11 158 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (7).wav 11 159 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (3).wav 11 160 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (4).wav 11 161 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (6).wav 11 162 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/11/D_SPK2_c11 (9).wav 11 163 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 
(5).wav 19 164 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (4).wav 19 165 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (8).wav 19 166 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (6).wav 19 167 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (7).wav 19 168 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (1).wav 19 169 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/19/D_SPK2_c19 (3).wav 19 170 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (3).wav 14 171 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (8).wav 14 172 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (9).wav 14 173 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (10).wav 14 174 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (2).wav 14 175 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (6).wav 14 176 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/14/D_SPK2_c14 (1).wav 14 177 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (4).wav 17 178 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (5).wav 17 179 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (3).wav 17 180 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (2).wav 17 181 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (9).wav 17 182 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (8).wav 17 183 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/17/D_SPK2_c17 (6).wav 17 184 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (5).wav 01 185 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (3).wav 01 186 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (6).wav 01 187 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (2).wav 01 188 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (9).wav 01 189 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (1).wav 01 190 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/01/D_SPK2_c1 (7).wav 01 191 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (8).wav 09 192 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (5).wav 09 193 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (4).wav 09 194 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (9).wav 09 195 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (6).wav 09 196 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (1).wav 09 197 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/09/D_SPK2_c9 (10).wav 09 198 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (3).wav 04 199 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (10).wav 04 200 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (8).wav 04 201 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (4).wav 04 202 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (9).wav 04 203 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (1).wav 04 204 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/04/D_SPK2_c4 (2).wav 04 205 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (8).wav 07 206 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (3).wav 07 207 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (5).wav 07 208 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (10).wav 07 209 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (2).wav 07 210 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (9).wav 07 211 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/07/D_SPK2_c7 (4).wav 07 212 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (6).wav 13 213 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (5).wav 13 214 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (9).wav 
13 215 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (8).wav 13 216 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (10).wav 13 217 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (1).wav 13 218 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/13/D_SPK2_c13 (2).wav 13 219 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (10).wav 16 220 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (7).wav 16 221 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (2).wav 16 222 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (3).wav 16 223 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (5).wav 16 224 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (9).wav 16 225 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/16/D_SPK2_c16 (4).wav 16 226 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (9).wav 03 227 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (2).wav 03 228 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (8).wav 03 229 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (7).wav 03 230 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (6).wav 03 231 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (5).wav 03 232 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/03/D_SPK2_c3 (4).wav 03 233 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (10).wav 06 234 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (4).wav 06 235 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (2).wav 06 236 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (9).wav 06 237 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (7).wav 06 238 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (3).wav 06 239 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/06/D_SPK2_c6 (5).wav 06 240 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (10).wav 12 241 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (1).wav 12 242 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (2).wav 12 243 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (4).wav 12 244 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (6).wav 12 245 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (8).wav 12 246 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/12/D_SPK2_c12 (3).wav 12 247 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (2).wav 15 248 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (8).wav 15 249 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (9).wav 15 250 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (1).wav 15 251 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (6).wav 15 252 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (5).wav 15 253 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/15/D_SPK2_c15 (4).wav 15 254 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (6).wav 10 255 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (10).wav 10 256 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (3).wav 10 257 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (2).wav 10 258 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (4).wav 10 259 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (1).wav 10 260 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/10/D_SPK2_c10 (7).wav 10 261 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (8).wav 18 262 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (3).wav 18 263 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (10).wav 18 264 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (2).wav 18 265 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (1).wav 18 266 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (6).wav 18 267 | /work/dodohow1011/dysarthria_zh_command/D_SPK2/18/D_SPK2_c18 (5).wav 18 268 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (3).wav 02 269 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (10).wav 02 270 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (1).wav 02 271 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (5).wav 02 272 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (4).wav 02 273 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (7).wav 02 274 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/02/D_SPK3_c2 (2).wav 02 275 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (4).wav 05 276 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (3).wav 05 277 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (1).wav 05 278 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (2).wav 05 279 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (10).wav 05 280 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (5).wav 05 281 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/05/D_SPK3_c5 (6).wav 05 282 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (9).wav 08 283 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (3).wav 08 284 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (10).wav 08 285 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (1).wav 08 286 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (8).wav 08 287 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (5).wav 08 288 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/08/D_SPK3_c8 (2).wav 08 289 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (4).wav 11 290 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 
(5).wav 11 291 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (1).wav 11 292 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (2).wav 11 293 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (3).wav 11 294 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (6).wav 11 295 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/11/D_SPK3_c11 (8).wav 11 296 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (1).wav 19 297 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (2).wav 19 298 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (3).wav 19 299 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (10).wav 19 300 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (9).wav 19 301 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (7).wav 19 302 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/19/D_SPK3_c19 (6).wav 19 303 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (7).wav 14 304 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (9).wav 14 305 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (10).wav 14 306 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (6).wav 14 307 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (3).wav 14 308 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (5).wav 14 309 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/14/D_SPK3_c14 (1).wav 14 310 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (10).wav 17 311 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (5).wav 17 312 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (2).wav 17 313 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (6).wav 17 314 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (9).wav 17 315 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (3).wav 17 316 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK3/17/D_SPK3_c17 (8).wav 17 317 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (5).wav 01 318 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (4).wav 01 319 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (8).wav 01 320 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (6).wav 01 321 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (3).wav 01 322 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (2).wav 01 323 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/01/D_SPK3_c1 (9).wav 01 324 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (1).wav 09 325 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (7).wav 09 326 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (4).wav 09 327 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (10).wav 09 328 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (8).wav 09 329 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (5).wav 09 330 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/09/D_SPK3_c9 (2).wav 09 331 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (7).wav 04 332 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (9).wav 04 333 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (5).wav 04 334 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (4).wav 04 335 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (10).wav 04 336 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (8).wav 04 337 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/04/D_SPK3_c4 (1).wav 04 338 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (5).wav 07 339 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (4).wav 07 340 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (6).wav 07 341 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (2).wav 07 
342 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (8).wav 07 343 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (1).wav 07 344 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/07/D_SPK3_c7 (7).wav 07 345 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (2).wav 13 346 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (4).wav 13 347 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (9).wav 13 348 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (1).wav 13 349 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (10).wav 13 350 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (3).wav 13 351 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/13/D_SPK3_c13 (7).wav 13 352 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (5).wav 16 353 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (7).wav 16 354 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (1).wav 16 355 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (3).wav 16 356 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (10).wav 16 357 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (8).wav 16 358 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/16/D_SPK3_c16 (4).wav 16 359 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (8).wav 03 360 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (1).wav 03 361 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (3).wav 03 362 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (9).wav 03 363 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (10).wav 03 364 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (4).wav 03 365 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/03/D_SPK3_c3 (5).wav 03 366 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (6).wav 06 367 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (3).wav 06 368 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (10).wav 06 369 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (7).wav 06 370 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (4).wav 06 371 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (1).wav 06 372 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/06/D_SPK3_c6 (2).wav 06 373 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (1).wav 12 374 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (4).wav 12 375 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (9).wav 12 376 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (7).wav 12 377 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (6).wav 12 378 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (8).wav 12 379 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/12/D_SPK3_c12 (5).wav 12 380 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (5).wav 15 381 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (2).wav 15 382 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (9).wav 15 383 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (7).wav 15 384 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (8).wav 15 385 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (6).wav 15 386 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/15/D_SPK3_c15 (10).wav 15 387 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (7).wav 10 388 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (10).wav 10 389 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (4).wav 10 390 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (3).wav 10 391 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (5).wav 10 392 | 
/work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (6).wav 10 393 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/10/D_SPK3_c10 (2).wav 10 394 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (1).wav 18 395 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (7).wav 18 396 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (8).wav 18 397 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (6).wav 18 398 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (5).wav 18 399 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (10).wav 18 400 | /work/dodohow1011/dysarthria_zh_command/D_SPK3/18/D_SPK3_c18 (9).wav 18 401 | --------------------------------------------------------------------------------