aboutsummaryrefslogtreecommitdiff
path: root/swr2_asr/train.py
diff options
context:
space:
mode:
author: Philipp Merkel, 2023-09-04 14:07:54 +0000
committer: Philipp Merkel, 2023-09-04 14:07:54 +0000
commit: cd15a49ccee83c21ada481d6815d004f134147fe (patch)
tree: 19b8872940527986d2d97ea24965bc14e7a27eb2 /swr2_asr/train.py
parent: acafe88a1a360832b727651b713806ce0404db3f (diff)
applied fixes to download and tokenizers
Diffstat (limited to 'swr2_asr/train.py')
-rw-r--r-- swr2_asr/train.py 3
1 files changed, 1 insertions, 2 deletions
diff --git a/swr2_asr/train.py b/swr2_asr/train.py
index 8fc0b78..aea99e0 100644
--- a/swr2_asr/train.py
+++ b/swr2_asr/train.py
@@ -173,7 +173,6 @@ def run(
split="all",
download=False,
out_path="data/tokenizers/char_tokenizer_german.json",
- vocab_size=3000,
)
tokenizer = CharTokenizer.from_file("data/tokenizers/char_tokenizer_german.json")
@@ -305,4 +304,4 @@ def run_cli(
if __name__ == "__main__":
- run(1e-3, 10, 1, False, "", "/Volumes/pherkel/SWR2-ASR", "mls_german_opus")
+ run_cli()