# Run-level settings, followed by one YAML document per section
# (data, model, train, test). Documents are separated by `---`.
# NOTE(review): presumably the consumer reads every document in this
# stream; confirm before collapsing them into a single document.
---
training: false
device: 'mps'
unprocessed_data: './DATA_DIR/*/*.wav'
---
data:
  train_path: './train_tisv'
  train_path_unprocessed: './TIMIT/TRAIN/*/*/*.wav'
  test_path: './test_tisv'
  test_path_unprocessed: './TIMIT/TEST/*/*/*.wav'
  data_preprocessed: true
  sr: 16000
  nfft: 512  # For mel spectrogram preprocess
  window: 0.025  # (s)
  hop: 0.01  # (s)
  nmels: 40  # Number of mel energies
  tisv_frame: 180  # Max number of time steps in input after preprocess
---
model:
  hidden: 768  # Number of LSTM hidden layer units
  num_layer: 3  # Number of LSTM layers
  proj: 256  # Embedding size
  # Model path for testing, inference, or resuming training
  model_path: './speech_id_checkpoint/ckpt_epoch_840_batch_id_6.pth'
---
train:
  N: 4  # Number of speakers in batch
  M: 6  # Number of utterances per speaker
  num_workers: 0  # Number of workers for dataloader
  lr: 0.01
  epochs: 1000  # Max training speaker epoch
  log_interval: 30  # Epochs before printing progress
  log_file: './speech_id_checkpoint/Stats'
  checkpoint_interval: 100  # Save model after x speaker epochs
  checkpoint_dir: './speech_id_checkpoint'
  restore: true  # Resume training from previous model path
---
test:
  N: 4  # Number of speakers in batch
  M: 6  # Number of utterances per speaker
  num_workers: 8  # Number of workers for data loader
  epochs: 10  # Testing speaker epochs