Merge pull request #3380 from piraka9011/patch-1

Convert channels for CV2 dataset
2020-10-17 00:43:08 +02:00 · 2020-10-17 00:43:08 +02:00 · 0798698e97
commit 0798698e97
parent e508cd30b7 521842deea
1 changed file with 2 additions and 1 deletion
--- a/bin/import_cv2.py
+++ b/bin/import_cv2.py
@@ -27,6 +27,7 @@ from ds_ctcdecoder import Alphabet

 FIELDNAMES = ["wav_filename", "wav_filesize", "transcript"]
 SAMPLE_RATE = 16000
+CHANNELS = 1
 MAX_SECS = 10
 PARAMS = None
 FILTER_OBJ = None
@@ -179,7 +180,7 @@ def _preprocess_data(tsv_dir, audio_dir, space_after_every_character=False):
 def _maybe_convert_wav(mp3_filename, wav_filename):
    if not os.path.exists(wav_filename):
        transformer = sox.Transformer()
-        transformer.convert(samplerate=SAMPLE_RATE)
+        transformer.convert(samplerate=SAMPLE_RATE, n_channels=CHANNELS)
        try:
            transformer.build(mp3_filename, wav_filename)
        except sox.core.SoxError: