diff options
author | Pherkel | 2023-09-12 14:19:15 +0200 |
---|---|---|
committer | GitHub | 2023-09-12 14:19:15 +0200 |
commit | 7a9a6c783e69b5a537a3d3f5bfe8d5fdc656c807 (patch) | |
tree | 0725631b9b68aeb65b292420a15941dcfa3fc04f /config.yaml | |
parent | f9846193289c81d89342b6a36e951605c2cfa189 (diff) | |
parent | 7b71dab87591e04d874cd636614450b0e65e3f2b (diff) |
Merge pull request #37 from Algo-Boys/fix/ultimate
Fix/ultimate
Diffstat (limited to 'config.yaml')
-rw-r--r-- | config.yaml | 34 |
1 file changed, 34 insertions, 0 deletions
diff --git a/config.yaml b/config.yaml
new file mode 100644
index 0000000..e5ff43a
--- /dev/null
+++ b/config.yaml
@@ -0,0 +1,34 @@
+model:
+  n_cnn_layers: 3
+  n_rnn_layers: 5
+  rnn_dim: 512
+  n_feats: 128  # number of mel features
+  stride: 2
+  dropout: 0.3  # recommended to be around 0.4 for smaller datasets, 0.1 for really large datasets
+
+training:
+  learning_rate: 5.0e-4  # keep the decimal point: YAML 1.1 loaders (e.g. PyYAML) read "5e-4" as a string
+  batch_size: 8  # recommended: the largest batch that fits on the GPU (a batch size of 32 fits on a 12GB GPU)
+  epochs: 3
+  eval_every_n: 3  # evaluate every n epochs
+  num_workers: 8  # number of workers for dataloader
+
+dataset:
+  download: true
+  dataset_root_path: "YOUR/PATH"  # files will be downloaded into this dir
+  language_name: "mls_german_opus"
+  limited_supervision: false  # set to true if you want to use limited supervision
+  dataset_percentage: 1.0  # fraction of the dataset to use (1.0 = 100%)
+  shuffle: true
+
+tokenizer:
+  tokenizer_path: "data/tokenizers/char_tokenizer_german.yaml"
+
+checkpoints:
+  model_load_path: "YOUR/PATH"  # path to load model from
+  model_save_path: "YOUR/PATH"  # path to save model to
+
+inference:
+  model_load_path: "YOUR/PATH"  # path to load model from
+  beam_width: 10  # beam width for beam search
+  device: "cuda"  # device to run inference on if a GPU is available; otherwise "cpu" is set automatically
\ No newline at end of file |