diff options
author | Philipp Merkel | 2023-09-04 14:07:54 +0000 |
---|---|---|
committer | Philipp Merkel | 2023-09-04 14:07:54 +0000 |
commit | cd15a49ccee83c21ada481d6815d004f134147fe (patch) | |
tree | 19b8872940527986d2d97ea24965bc14e7a27eb2 /swr2_asr/train.py | |
parent | acafe88a1a360832b727651b713806ce0404db3f (diff) |
applied fixes to download and tokenizers
Diffstat (limited to 'swr2_asr/train.py')
-rw-r--r-- | swr2_asr/train.py | 3 |
1 file changed, 1 insertion, 2 deletions
diff --git a/swr2_asr/train.py b/swr2_asr/train.py
index 8fc0b78..aea99e0 100644
--- a/swr2_asr/train.py
+++ b/swr2_asr/train.py
@@ -173,7 +173,6 @@ def run(
             split="all",
             download=False,
             out_path="data/tokenizers/char_tokenizer_german.json",
-            vocab_size=3000,
         )
 
     tokenizer = CharTokenizer.from_file("data/tokenizers/char_tokenizer_german.json")
@@ -305,4 +304,4 @@ def run_cli(
 
 
 if __name__ == "__main__":
-    run(1e-3, 10, 1, False, "", "/Volumes/pherkel/SWR2-ASR", "mls_german_opus")
+    run_cli()