marinone94 committed on
Commit
bf11fb8
1 Parent(s): 57ad2fb

fix column removal issue

Browse files
Files changed (1) hide show
  1. run_speech_recognition_ctc.py +1 -1
run_speech_recognition_ctc.py CHANGED
@@ -331,7 +331,7 @@ def create_vocabulary_from_data(
331
  batched=True,
332
  batch_size=10000,
333
  keep_in_memory=False,
334
- remove_columns=datasets["train"].column_names,
335
  )
336
 
337
  # take union of all unique characters in each dataset
 
331
  batched=True,
332
  batch_size=10000,
333
  keep_in_memory=False,
334
+ remove_columns=[col for col in datasets["train"].column_names if col in datasets["eval"].column_names],
335
  )
336
 
337
  # take union of all unique characters in each dataset