aboutsummaryrefslogtreecommitdiff
path: root/swr2_asr/utils/data.py
diff options
context:
space:
mode:
author JoJoBarthold2 2023-09-18 12:19:31 +0200
committer JoJoBarthold2 2023-09-18 12:19:31 +0200
commit 0f14789f1c33d55dc270bcd154201cce2c4d516e (patch)
tree 7d3e80fc80233eba2005399dc85afaa52452a854 /swr2_asr/utils/data.py
parent ec8bfe9df205608282e5297635363fc8fc8fe55b (diff)
reset commit history
Diffstat (limited to 'swr2_asr/utils/data.py')
-rw-r--r-- swr2_asr/utils/data.py 6
1 files changed, 4 insertions, 2 deletions
diff --git a/swr2_asr/utils/data.py b/swr2_asr/utils/data.py
index f484bdd..19605f6 100644
--- a/swr2_asr/utils/data.py
+++ b/swr2_asr/utils/data.py
@@ -344,7 +344,7 @@ class MLSDataset(Dataset):
idx,
) # type: ignore
- def create_lexicon(vocab_counts_path, lexicon_path):
+def create_lexicon(vocab_counts_path, lexicon_path):
words_list = []
with open(vocab_counts_path, 'r') as file:
@@ -361,6 +361,8 @@ class MLSDataset(Dataset):
file.write(f"{word} ")
for char in word:
file.write(char + ' ')
- file.write("|")
+ file.write("<SPACE>")
+
+
\ No newline at end of file