diff options
Diffstat (limited to 'swr2_asr/utils/data.py')
-rw-r--r-- | swr2_asr/utils/data.py | 6 |
1 files changed, 4 insertions, 2 deletions
diff --git a/swr2_asr/utils/data.py b/swr2_asr/utils/data.py index f484bdd..19605f6 100644 --- a/swr2_asr/utils/data.py +++ b/swr2_asr/utils/data.py @@ -344,7 +344,7 @@ class MLSDataset(Dataset): idx, ) # type: ignore - def create_lexicon(vocab_counts_path, lexicon_path): +def create_lexicon(vocab_counts_path, lexicon_path): words_list = [] with open(vocab_counts_path, 'r') as file: @@ -361,6 +361,8 @@ class MLSDataset(Dataset): file.write(f"{word} ") for char in word: file.write(char + ' ') - file.write("|") + file.write("<SPACE>") + +
\ No newline at end of file |