marinone94
committed on
Commit
•
bf11fb8
1
Parent(s):
57ad2fb
fix column removal issue
Browse files
run_speech_recognition_ctc.py
CHANGED
@@ -331,7 +331,7 @@ def create_vocabulary_from_data(
|
|
331 |
batched=True,
|
332 |
batch_size=10000,
|
333 |
keep_in_memory=False,
|
334 |
-
remove_columns=datasets["train"].column_names,
|
335 |
)
|
336 |
|
337 |
# take union of all unique characters in each dataset
|
|
|
331 |
batched=True,
|
332 |
batch_size=10000,
|
333 |
keep_in_memory=False,
|
334 |
+
remove_columns=[col for col in datasets["train"].column_names if col in datasets["eval"].column_names],
|
335 |
)
|
336 |
|
337 |
# take union of all unique characters in each dataset
|