From afbcc01369664dfc298f84b1b91666b9833c9a21 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Tue, 20 Jul 2021 08:13:07 -0400
Subject: [PATCH 01/17] Break out config instantiation and setting

---
 training/coqui_stt_training/train.py       |  7 +++++--
 training/coqui_stt_training/util/config.py | 17 +++++++++++------
 2 files changed, 16 insertions(+), 8 deletions(-)

diff --git a/training/coqui_stt_training/train.py b/training/coqui_stt_training/train.py
index 2cf02397..2abb5226 100644
--- a/training/coqui_stt_training/train.py
+++ b/training/coqui_stt_training/train.py
@@ -45,7 +45,7 @@ from .util.checkpoints import (
 from .util.config import (
     Config,
     create_progressbar,
-    initialize_globals,
+    initialize_config_globals,
     log_debug,
     log_error,
     log_info,
@@ -1249,7 +1249,10 @@ def early_training_checks():
 
 
 def main():
-    initialize_globals()
+    Config = _SttConfig()
+    Config.parse_args(arg_prefix="")  # parse CLI args
+    initialize_config_globals(Config)
+
     early_training_checks()
 
     if Config.train_files:
diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index e0c925b9..969866c3 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -546,9 +546,10 @@ class _SttConfig(Coqpit):
         check_argument("one_shot_infer", c, is_path=True)
 
 
-def initialize_globals():
-    c = _SttConfig()
-    c.parse_args(arg_prefix="")
+def initialize_config_globals(c):
+    """
+    input: config class object (i.e. coqpit.Coqpit)
+    """
 
     # Augmentations
     c.augmentations = parse_augmentations(c.augment)
@@ -617,7 +618,7 @@ def initialize_globals():
 
     if c.bytes_output_mode:
         c.alphabet = UTF8Alphabet()
-    else:
+    elif c.alphabet_config_path:
         c.alphabet = Alphabet(os.path.abspath(c.alphabet_config_path))
 
     # Geometric Constants
@@ -647,8 +648,12 @@ def initialize_globals():
     # The number of units in the third layer, which feeds in to the LSTM
     c.n_hidden_3 = c.n_cell_dim
 
-    # Units in the sixth layer = number of characters in the target language plus one
-    c.n_hidden_6 = c.alphabet.GetSize() + 1  # +1 for CTC blank label
+    # Units in the last layer = number of characters in the alphabet plus one
+    try:
+        # +1 for CTC blank label
+        c.n_hidden_6 = c.alphabet.GetSize() + 1
+    except AttributeError:
+        pass
 
     # Size of audio window in samples
     if (c.feature_win_len * c.audio_sample_rate) % 1000 != 0:

From 848a612efebad3704f49f483d1ee301442c85385 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Tue, 20 Jul 2021 08:41:22 -0400
Subject: [PATCH 02/17] Import _SttConfig

---
 lm_optimizer.py                         | 5 +++--
 training/coqui_stt_training/evaluate.py | 6 ++++--
 training/coqui_stt_training/train.py    | 1 +
 transcribe.py                           | 5 +++--
 4 files changed, 11 insertions(+), 6 deletions(-)

diff --git a/lm_optimizer.py b/lm_optimizer.py
index 86100ec4..d4787137 100644
--- a/lm_optimizer.py
+++ b/lm_optimizer.py
@@ -10,7 +10,7 @@ import tensorflow.compat.v1 as tfv1
 from coqui_stt_ctcdecoder import Scorer
 from coqui_stt_training.evaluate import evaluate
 from coqui_stt_training.train import create_model
-from coqui_stt_training.util.config import Config, initialize_globals
+from coqui_stt_training.util.config import Config, _SttConfig, initialize_config_globals
 from coqui_stt_training.util.evaluate_tools import wer_cer_batch
 from coqui_stt_training.util.flags import FLAGS, create_flags
 from coqui_stt_training.util.logging import log_error
@@ -52,7 +52,8 @@ def objective(trial):
 
 
 def main(_):
-    initialize_globals()
+    Config = _SttConfig()
+    initialize_config_globals(Config)
 
     if not FLAGS.test_files:
         log_error(
diff --git a/training/coqui_stt_training/evaluate.py b/training/coqui_stt_training/evaluate.py
index ecff4502..cff3dc1e 100755
--- a/training/coqui_stt_training/evaluate.py
+++ b/training/coqui_stt_training/evaluate.py
@@ -17,8 +17,9 @@ from .util.augmentations import NormalizeSampleRate
 from .util.checkpoints import load_graph_for_evaluation
 from .util.config import (
     Config,
+    _SttConfig,
     create_progressbar,
-    initialize_globals,
+    initialize_config_globals,
     log_error,
     log_progress,
 )
@@ -169,7 +170,8 @@ def evaluate(test_csvs, create_model):
 
 
 def main():
-    initialize_globals()
+    Config = _SttConfig()
+    initialize_config_globals(Config)
 
     if not Config.test_files:
         log_error(
diff --git a/training/coqui_stt_training/train.py b/training/coqui_stt_training/train.py
index 2abb5226..619b2d1d 100644
--- a/training/coqui_stt_training/train.py
+++ b/training/coqui_stt_training/train.py
@@ -44,6 +44,7 @@ from .util.checkpoints import (
 )
 from .util.config import (
     Config,
+    _SttConfig,
     create_progressbar,
     initialize_config_globals,
     log_debug,
diff --git a/transcribe.py b/transcribe.py
index b0492c87..b6f5af9a 100755
--- a/transcribe.py
+++ b/transcribe.py
@@ -20,7 +20,7 @@ from multiprocessing import Process, cpu_count
 
 from coqui_stt_ctcdecoder import Scorer, ctc_beam_search_decoder_batch
 from coqui_stt_training.util.audio import AudioFile
-from coqui_stt_training.util.config import Config, initialize_globals
+from coqui_stt_training.util.config import Config, _SttConfig, initialize_config_globals
 from coqui_stt_training.util.feeding import split_audio_file
 from coqui_stt_training.util.flags import FLAGS, create_flags
 from coqui_stt_training.util.logging import (
@@ -42,7 +42,8 @@ def transcribe_file(audio_path, tlog_path):
     )
     from coqui_stt_training.util.checkpoints import load_graph_for_evaluation
 
-    initialize_globals()
+    Config = _SttConfig()
+    initialize_config_globals(Config)
     scorer = Scorer(FLAGS.lm_alpha, FLAGS.lm_beta, FLAGS.scorer_path, Config.alphabet)
     try:
         num_processes = cpu_count()

From 920e92d68a96382017a82ea09459b240e2018203 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Tue, 20 Jul 2021 09:34:44 -0400
Subject: [PATCH 03/17] Remove check_values and default alphabet

---
 training/coqui_stt_training/util/config.py | 7 +------
 1 file changed, 1 insertion(+), 6 deletions(-)

diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index 969866c3..1896eb7c 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -472,7 +472,7 @@ class _SttConfig(Coqpit):
         ),
     )
     alphabet_config_path: str = field(
-        default="data/alphabet.txt",
+        default="",
         metadata=dict(
            help="path to the configuration file specifying the alphabet used by the network. See the comment in data/alphabet.txt for a description of the format."
         ),
     )
@@ -540,11 +540,6 @@ class _SttConfig(Coqpit):
         ),
     )
 
-    def check_values(self):
-        c = asdict(self)
-        check_argument("alphabet_config_path", c, is_path=True)
-        check_argument("one_shot_infer", c, is_path=True)
-
 
 def initialize_config_globals(c):
     """

From 5b4fa274670726e12cb5557269cedbde18968d20 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Tue, 20 Jul 2021 09:50:47 -0400
Subject: [PATCH 04/17] Add required alphabet path to CI tests

---
 bin/run-ci-graph_augmentations.sh         | 2 +-
 bin/run-ci-ldc93s1_checkpoint.sh          | 2 +-
 bin/run-ci-ldc93s1_checkpoint_bytes.sh    | 2 +-
 bin/run-ci-ldc93s1_checkpoint_sdb.sh      | 2 +-
 bin/run-ci-ldc93s1_new.sh                 | 2 +-
 bin/run-ci-ldc93s1_new_bytes.sh           | 2 +-
 bin/run-ci-ldc93s1_new_bytes_tflite.sh    | 2 +-
 bin/run-ci-ldc93s1_new_metrics.sh         | 2 +-
 bin/run-ci-ldc93s1_new_sdb.sh             | 2 +-
 bin/run-ci-ldc93s1_new_sdb_csv.sh         | 2 +-
 bin/run-ci-ldc93s1_singleshotinference.sh | 4 ++--
 bin/run-ci-ldc93s1_tflite.sh              | 4 ++--
 bin/run-ldc93s1.sh                        | 2 +-
 13 files changed, 15 insertions(+), 15 deletions(-)

diff --git a/bin/run-ci-graph_augmentations.sh b/bin/run-ci-graph_augmentations.sh
index ed01ccb7..bd4855b9 100755
--- a/bin/run-ci-graph_augmentations.sh
+++ b/bin/run-ci-graph_augmentations.sh
@@ -14,7 +14,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --scorer "" \
   --augment dropout \
diff --git a/bin/run-ci-ldc93s1_checkpoint.sh b/bin/run-ci-ldc93s1_checkpoint.sh
index 68ebc8bd..80aeea5d 100755
--- a/bin/run-ci-ldc93s1_checkpoint.sh
+++ b/bin/run-ci-ldc93s1_checkpoint.sh
@@ -14,7 +14,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_checkpoint_bytes.sh b/bin/run-ci-ldc93s1_checkpoint_bytes.sh
index 6c068eee..96cf5998 100755
--- a/bin/run-ci-ldc93s1_checkpoint_bytes.sh
+++ b/bin/run-ci-ldc93s1_checkpoint_bytes.sh
@@ -14,7 +14,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_checkpoint_sdb.sh b/bin/run-ci-ldc93s1_checkpoint_sdb.sh
index 30708451..02d87b66 100755
--- a/bin/run-ci-ldc93s1_checkpoint_sdb.sh
+++ b/bin/run-ci-ldc93s1_checkpoint_sdb.sh
@@ -20,7 +20,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_sdb} --train_batch_size 1 \
   --dev_files ${ldc93s1_sdb} --dev_batch_size 1 \
   --test_files ${ldc93s1_sdb} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new.sh b/bin/run-ci-ldc93s1_new.sh
index f67f2765..ff7d7d25 100755
--- a/bin/run-ci-ldc93s1_new.sh
+++ b/bin/run-ci-ldc93s1_new.sh
@@ -17,7 +17,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --feature_cache '/tmp/ldc93s1_cache' \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new_bytes.sh b/bin/run-ci-ldc93s1_new_bytes.sh
index 5dec1fed..17c65af4 100755
--- a/bin/run-ci-ldc93s1_new_bytes.sh
+++ b/bin/run-ci-ldc93s1_new_bytes.sh
@@ -17,7 +17,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --feature_cache '/tmp/ldc93s1_cache' \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new_bytes_tflite.sh b/bin/run-ci-ldc93s1_new_bytes_tflite.sh
index 22558942..eb74eac1 100755
--- a/bin/run-ci-ldc93s1_new_bytes_tflite.sh
+++ b/bin/run-ci-ldc93s1_new_bytes_tflite.sh
@@ -16,7 +16,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt_bytes' \
   --export_dir '/tmp/train_bytes_tflite' \
diff --git a/bin/run-ci-ldc93s1_new_metrics.sh b/bin/run-ci-ldc93s1_new_metrics.sh
index ee87c6b5..d0fd8ccc 100755
--- a/bin/run-ci-ldc93s1_new_metrics.sh
+++ b/bin/run-ci-ldc93s1_new_metrics.sh
@@ -17,7 +17,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new_sdb.sh b/bin/run-ci-ldc93s1_new_sdb.sh
index 0e9a5293..e3b26937 100755
--- a/bin/run-ci-ldc93s1_new_sdb.sh
+++ b/bin/run-ci-ldc93s1_new_sdb.sh
@@ -23,7 +23,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_sdb} --train_batch_size 1 \
   --dev_files ${ldc93s1_sdb} --dev_batch_size 1 \
   --test_files ${ldc93s1_sdb} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new_sdb_csv.sh b/bin/run-ci-ldc93s1_new_sdb_csv.sh
index ca8cd388..cacd880a 100755
--- a/bin/run-ci-ldc93s1_new_sdb_csv.sh
+++ b/bin/run-ci-ldc93s1_new_sdb_csv.sh
@@ -23,7 +23,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_sdb} ${ldc93s1_csv} --train_batch_size 1 \
   --feature_cache '/tmp/ldc93s1_cache_sdb_csv' \
   --dev_files ${ldc93s1_sdb} ${ldc93s1_csv} --dev_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_singleshotinference.sh b/bin/run-ci-ldc93s1_singleshotinference.sh
index 8aaced54..c8e3839b 100755
--- a/bin/run-ci-ldc93s1_singleshotinference.sh
+++ b/bin/run-ci-ldc93s1_singleshotinference.sh
@@ -14,7 +14,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
@@ -23,7 +23,7 @@ python -u train.py --show_progressbar false --early_stop false \
   --learning_rate 0.001 --dropout_rate 0.05 \
   --scorer_path 'data/smoke_test/pruned_lm.scorer'
 
-python -u train.py \
+python -u train.py --alphabet_config_path "data/alphabet.txt" \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt' \
   --scorer_path 'data/smoke_test/pruned_lm.scorer' \
diff --git a/bin/run-ci-ldc93s1_tflite.sh b/bin/run-ci-ldc93s1_tflite.sh
index 0156d969..6d79313f 100755
--- a/bin/run-ci-ldc93s1_tflite.sh
+++ b/bin/run-ci-ldc93s1_tflite.sh
@@ -16,7 +16,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt' \
   --export_dir '/tmp/train_tflite' \
@@ -26,7 +26,7 @@ python -u train.py --show_progressbar false \
 
 mkdir /tmp/train_tflite/en-us
 
-python -u train.py --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt' \
   --export_dir '/tmp/train_tflite/en-us' \
diff --git a/bin/run-ldc93s1.sh b/bin/run-ldc93s1.sh
index fdf34609..46efa667 100755
--- a/bin/run-ldc93s1.sh
+++ b/bin/run-ldc93s1.sh
@@ -20,7 +20,7 @@ fi
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
   --train_files data/ldc93s1/ldc93s1.csv \
   --test_files data/ldc93s1/ldc93s1.csv \
   --train_batch_size 1 \

From 4dc565beca8b0ef7d1d54115dff2f73c298f9897 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 05:00:05 -0400
Subject: [PATCH 05/17] Move checking logic into __post_init__()

---
 lm_optimizer.py                            |   5 +++--
 training/coqui_stt_training/evaluate.py    |   6 ++++--
 training/coqui_stt_training/train.py       |   8 +-
 training/coqui_stt_training/util/config.py | 323 +++++++++++----------
 transcribe.py                              |   6 ++++--
 5 files changed, 174 insertions(+), 174 deletions(-)

diff --git a/lm_optimizer.py b/lm_optimizer.py
index d4787137..85ca1fd5 100644
--- a/lm_optimizer.py
+++ b/lm_optimizer.py
@@ -10,7 +10,7 @@ import tensorflow.compat.v1 as tfv1
 from coqui_stt_ctcdecoder import Scorer
 from coqui_stt_training.evaluate import evaluate
 from coqui_stt_training.train import create_model
-from coqui_stt_training.util.config import Config, _SttConfig, initialize_config_globals
+from coqui_stt_training.util.config import Config, initialize_globals_from_cli
 from coqui_stt_training.util.evaluate_tools import wer_cer_batch
 from coqui_stt_training.util.flags import FLAGS, create_flags
 from coqui_stt_training.util.logging import log_error
@@ -52,8 +52,7 @@ def objective(trial):
 
 
 def main(_):
-    Config = _SttConfig()
-    initialize_config_globals(Config)
+    initialize_globals_from_cli()
 
     if not FLAGS.test_files:
         log_error(
diff --git a/training/coqui_stt_training/evaluate.py b/training/coqui_stt_training/evaluate.py
index cff3dc1e..4425582b 100755
--- a/training/coqui_stt_training/evaluate.py
+++ b/training/coqui_stt_training/evaluate.py
@@ -17,9 +17,8 @@ from .util.augmentations import NormalizeSampleRate
 from .util.checkpoints import load_graph_for_evaluation
 from .util.config import (
     Config,
-    _SttConfig,
     create_progressbar,
-    initialize_config_globals,
+    initialize_globals_from_cli,
     log_error,
     log_progress,
 )
@@ -170,8 +169,7 @@ def evaluate(test_csvs, create_model):
 
 
 def main():
-    Config = _SttConfig()
-    initialize_config_globals(Config)
+    initialize_globals_from_cli()
 
     if not Config.test_files:
         log_error(
diff --git a/training/coqui_stt_training/train.py b/training/coqui_stt_training/train.py
index 619b2d1d..b6cfaec9 100644
--- a/training/coqui_stt_training/train.py
+++ b/training/coqui_stt_training/train.py
@@ -44,9 +44,8 @@ from .util.checkpoints import (
 )
 from .util.config import (
     Config,
-    _SttConfig,
     create_progressbar,
-    initialize_config_globals,
+    initialize_globals_from_cli,
     log_debug,
     log_error,
     log_info,
@@ -1250,10 +1249,7 @@ def early_training_checks():
 
 
 def main():
-    Config = _SttConfig()
-    Config.parse_args(arg_prefix="")  # parse CLI args
-    initialize_config_globals(Config)
-
+    initialize_globals_from_cli()
     early_training_checks()
 
     if Config.train_files:
diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index 1896eb7c..0a04ad77 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -36,6 +36,163 @@ Config = _ConfigSingleton()  # pylint: disable=invalid-name
 
 @dataclass
 class _SttConfig(Coqpit):
+    def __post_init__(self):
+        # Augmentations
+        self.augmentations = parse_augmentations(self.augment)
+        if self.augmentations:
+            print(f"Parsed augmentations: {self.augmentations}")
+        if self.augmentations and self.feature_cache and self.cache_for_epochs == 0:
+            print(
+                "Due to current feature-cache settings the exact same sample augmentations of the first "
+                "epoch will be repeated on all following epochs. This could lead to unintended over-fitting. "
+                "You could use --cache_for_epochs to invalidate the cache after a given number of epochs."
+            )
+
+        if self.normalize_sample_rate:
+            self.augmentations = [NormalizeSampleRate(self.audio_sample_rate)] + self[
+                "augmentations"
+            ]
+
+        # Caching
+        if self.cache_for_epochs == 1:
+            print(
+                "--cache_for_epochs == 1 is (re-)creating the feature cache on every epoch but will never use it."
+                "You can either set --cache_for_epochs > 1, or not use feature caching at all."
+            )
+
+        # Read-buffer
+        self.read_buffer = parse_file_size(self.read_buffer)
+
+        # Set default dropout rates
+        if self.dropout_rate2 < 0:
+            self.dropout_rate2 = self.dropout_rate
+        if self.dropout_rate3 < 0:
+            self.dropout_rate3 = self.dropout_rate
+        if self.dropout_rate6 < 0:
+            self.dropout_rate6 = self.dropout_rate
+
+        # Set default checkpoint dir
+        if not self.checkpoint_dir:
+            self.checkpoint_dir = xdg.save_data_path(os.path.join("stt", "checkpoints"))
+
+        if self.load_train not in ["last", "best", "init", "auto"]:
+            self.load_train = "auto"
+
+        if self.load_evaluate not in ["last", "best", "auto"]:
+            self.load_evaluate = "auto"
+
+        # Set default summary dir
+        if not self.summary_dir:
+            self.summary_dir = xdg.save_data_path(os.path.join("stt", "summaries"))
+
+        # Standard session configuration that'll be used for all new sessions.
+        self.session_config = tfv1.ConfigProto(
+            allow_soft_placement=True,
+            log_device_placement=self.log_placement,
+            inter_op_parallelism_threads=self.inter_op_parallelism_threads,
+            intra_op_parallelism_threads=self.intra_op_parallelism_threads,
+            gpu_options=tfv1.GPUOptions(allow_growth=self.use_allow_growth),
+        )
+
+        # CPU device
+        self.cpu_device = "/cpu:0"
+
+        # Available GPU devices
+        self.available_devices = get_available_gpus(self.session_config)
+
+        # If there is no GPU available, we fall back to CPU based operation
+        if not self.available_devices:
+            self.available_devices = [self.cpu_device]
+
+        if self.bytes_output_mode:
+            self.alphabet = UTF8Alphabet()
+        elif self.alphabet_config_path:
+            self.alphabet = Alphabet(os.path.abspath(self.alphabet_config_path))
+
+        # Geometric Constants
+        # ===================
+
+        # For an explanation of the meaning of the geometric constants
+        # please refer to doc/Geometry.md
+
+        # Number of MFCC features
+        self.n_input = 26 # TODO: Determine this programmatically from the sample rate
+
+        # The number of frames in the context
+        self.n_context = 9 # TODO: Determine the optimal value using a validation data set
+
+        # Number of units in hidden layers
+        self.n_hidden = self.n_hidden
+
+        self.n_hidden_1 = self.n_hidden
+
+        self.n_hidden_2 = self.n_hidden
+
+        self.n_hidden_5 = self.n_hidden
+
+        # LSTM cell state dimension
+        self.n_cell_dim = self.n_hidden
+
+        # The number of units in the third layer, which feeds in to the LSTM
+        self.n_hidden_3 = self.n_cell_dim
+
+        # Dims in last layer = number of characters in alphabet plus one
+        try:
+            # +1 for CTC blank label
+            self.n_hidden_6 = self.alphabet.GetSize() + 1
+        except AttributeError:
+            pass
+
+        # Size of audio window in samples
+        if (self.feature_win_len * self.audio_sample_rate) % 1000 != 0:
+            log_error(
+                "--feature_win_len value ({}) in milliseconds ({}) multiplied "
+                "by --audio_sample_rate value ({}) must be an integer value. Adjust "
+                "your --feature_win_len value or resample your audio accordingly."
+                "".format(self.feature_win_len, self.feature_win_len / 1000, self.audio_sample_rate)
+            )
+            sys.exit(1)
+
+        self.audio_window_samples = self.audio_sample_rate * (self.feature_win_len / 1000)
+
+        # Stride for feature computations in samples
+        if (self.feature_win_step * self.audio_sample_rate) % 1000 != 0:
+            log_error(
+                "--feature_win_step value ({}) in milliseconds ({}) multiplied "
+                "by --audio_sample_rate value ({}) must be an integer value. Adjust "
+                "your --feature_win_step value or resample your audio accordingly."
+                "".format(
+                    self.feature_win_step, self.feature_win_step / 1000, self.audio_sample_rate
+                )
+            )
+            sys.exit(1)
+
+        self.audio_step_samples = self.audio_sample_rate * (self.feature_win_step / 1000)
+
+        if self.one_shot_infer:
+            if not path_exists_remote(self.one_shot_infer):
+                log_error("Path specified in --one_shot_infer is not a valid file.")
+                sys.exit(1)
+
+        if self.train_cudnn and self.load_cudnn:
+            log_error(
+                "Trying to use --train_cudnn, but --load_cudnn "
+                "was also specified. The --load_cudnn flag is only "
+                "needed when converting a CuDNN RNN checkpoint to "
+                "a CPU-capable graph. If your system is capable of "
+                "using CuDNN RNN, you can just specify the CuDNN RNN "
+                "checkpoint normally with --save_checkpoint_dir."
+            )
+            sys.exit(1)
+
+        # If separate save and load flags were not specified, default to load and save
+        # from the same dir.
+        if not self.save_checkpoint_dir:
+            self.save_checkpoint_dir = self.checkpoint_dir
+
+        if not self.load_checkpoint_dir:
+            self.load_checkpoint_dir = self.checkpoint_dir
+
     train_files: List[str] = field(
         default_factory=list,
         metadata=dict(
@@ -541,165 +698,15 @@ class _SttConfig(Coqpit):
     )
 
 
-def initialize_config_globals(c):
-    """
-    input: config class object (i.e. coqpit.Coqpit)
-    """
-
-    # Augmentations
-    c.augmentations = parse_augmentations(c.augment)
-    print(f"Parsed augmentations from flags: {c.augmentations}")
-    if c.augmentations and c.feature_cache and c.cache_for_epochs == 0:
-        print(
-            "Due to current feature-cache settings the exact same sample augmentations of the first "
-            "epoch will be repeated on all following epochs. This could lead to unintended over-fitting. "
-            "You could use --cache_for_epochs to invalidate the cache after a given number of epochs."
-        )
-
-    if c.normalize_sample_rate:
-        c.augmentations = [NormalizeSampleRate(c.audio_sample_rate)] + c[
-            "augmentations"
-        ]
-
-    # Caching
-    if c.cache_for_epochs == 1:
-        print(
-            "--cache_for_epochs == 1 is (re-)creating the feature cache on every epoch but will never use it."
-        )
-
-    # Read-buffer
-    c.read_buffer = parse_file_size(c.read_buffer)
-
-    # Set default dropout rates
-    if c.dropout_rate2 < 0:
-        c.dropout_rate2 = c.dropout_rate
-    if c.dropout_rate3 < 0:
-        c.dropout_rate3 = c.dropout_rate
-    if c.dropout_rate6 < 0:
-        c.dropout_rate6 = c.dropout_rate
-
-    # Set default checkpoint dir
-    if not c.checkpoint_dir:
-        c.checkpoint_dir = xdg.save_data_path(os.path.join("stt", "checkpoints"))
-
-    if c.load_train not in ["last", "best", "init", "auto"]:
-        c.load_train = "auto"
-
-    if c.load_evaluate not in ["last", "best", "auto"]:
-        c.load_evaluate = "auto"
-
-    # Set default summary dir
-    if not c.summary_dir:
-        c.summary_dir = xdg.save_data_path(os.path.join("stt", "summaries"))
-
-    # Standard session configuration that'll be used for all new sessions.
-    c.session_config = tfv1.ConfigProto(
-        allow_soft_placement=True,
-        log_device_placement=c.log_placement,
-        inter_op_parallelism_threads=c.inter_op_parallelism_threads,
-        intra_op_parallelism_threads=c.intra_op_parallelism_threads,
-        gpu_options=tfv1.GPUOptions(allow_growth=c.use_allow_growth),
-    )
-
-    # CPU device
-    c.cpu_device = "/cpu:0"
-
-    # Available GPU devices
-    c.available_devices = get_available_gpus(c.session_config)
-
-    # If there is no GPU available, we fall back to CPU based operation
-    if not c.available_devices:
-        c.available_devices = [c.cpu_device]
-
-    if c.bytes_output_mode:
-        c.alphabet = UTF8Alphabet()
-    elif c.alphabet_config_path:
-        c.alphabet = Alphabet(os.path.abspath(c.alphabet_config_path))
-
-    # Geometric Constants
-    # ===================
-
-    # For an explanation of the meaning of the geometric constants, please refer to
-    # doc/Geometry.md
-
-    # Number of MFCC features
-    c.n_input = 26  # TODO: Determine this programmatically from the sample rate
-
-    # The number of frames in the context
-    c.n_context = 9  # TODO: Determine the optimal value using a validation data set
-
-    # Number of units in hidden layers
-    c.n_hidden = c.n_hidden
-
-    c.n_hidden_1 = c.n_hidden
-
-    c.n_hidden_2 = c.n_hidden
-
-    c.n_hidden_5 = c.n_hidden
-
-    # LSTM cell state dimension
-    c.n_cell_dim = c.n_hidden
-
-    # The number of units in the third layer, which feeds in to the LSTM
-    c.n_hidden_3 = c.n_cell_dim
-
-    # Units in the last layer = number of characters in the alphabet plus one
-    try:
-        # +1 for CTC blank label
-        c.n_hidden_6 = c.alphabet.GetSize() + 1
-    except AttributeError:
-        pass
-
-    # Size of audio window in samples
-    if (c.feature_win_len * c.audio_sample_rate) % 1000 != 0:
-        log_error(
-            "--feature_win_len value ({}) in milliseconds ({}) multiplied "
-            "by --audio_sample_rate value ({}) must be an integer value. Adjust "
-            "your --feature_win_len value or resample your audio accordingly."
-            "".format(c.feature_win_len, c.feature_win_len / 1000, c.audio_sample_rate)
-        )
-        sys.exit(1)
-
-    c.audio_window_samples = c.audio_sample_rate * (c.feature_win_len / 1000)
-
-    # Stride for feature computations in samples
-    if (c.feature_win_step * c.audio_sample_rate) % 1000 != 0:
-        log_error(
-            "--feature_win_step value ({}) in milliseconds ({}) multiplied "
-            "by --audio_sample_rate value ({}) must be an integer value. Adjust "
-            "your --feature_win_step value or resample your audio accordingly."
-            "".format(
-                c.feature_win_step, c.feature_win_step / 1000, c.audio_sample_rate
-            )
-        )
-        sys.exit(1)
-
-    c.audio_step_samples = c.audio_sample_rate * (c.feature_win_step / 1000)
-
-    if c.one_shot_infer:
-        if not path_exists_remote(c.one_shot_infer):
-            log_error("Path specified in --one_shot_infer is not a valid file.")
-            sys.exit(1)
-
-    if c.train_cudnn and c.load_cudnn:
-        log_error(
-            "Trying to use --train_cudnn, but --load_cudnn "
-            "was also specified. The --load_cudnn flag is only "
-            "needed when converting a CuDNN RNN checkpoint to "
-            "a CPU-capable graph. If your system is capable of "
-            "using CuDNN RNN, you can just specify the CuDNN RNN "
-            "checkpoint normally with --save_checkpoint_dir."
-        )
-        sys.exit(1)
-
-    # If separate save and load flags were not specified, default to load and save
-    # from the same dir.
-    if not c.save_checkpoint_dir:
-        c.save_checkpoint_dir = c.checkpoint_dir
-
-    if not c.load_checkpoint_dir:
-        c.load_checkpoint_dir = c.checkpoint_dir
+def initialize_globals_from_cli():
+    c = _SttConfig()
+    c.parse_args(arg_prefix="")
+    c.__post_init__()
+    _ConfigSingleton._config = c  # pylint: disable=protected-access
+
+def initialize_globals_from_args(**override_args):
+    # Update Config with new args
+    c = _SttConfig(**override_args)
+    _ConfigSingleton._config = c  # pylint: disable=protected-access
diff --git a/transcribe.py b/transcribe.py
index b6f5af9a..2792ae2f 100755
--- a/transcribe.py
+++ b/transcribe.py
@@ -20,7 +20,7 @@ from multiprocessing import Process, cpu_count
 
 from coqui_stt_ctcdecoder import Scorer, ctc_beam_search_decoder_batch
 from coqui_stt_training.util.audio import AudioFile
-from coqui_stt_training.util.config import Config, _SttConfig, initialize_config_globals
+from coqui_stt_training.util.config import Config, initialize_globals_from_cli
 from coqui_stt_training.util.feeding import split_audio_file
 from coqui_stt_training.util.flags import FLAGS, create_flags
 from coqui_stt_training.util.logging import (
@@ -42,8 +42,8 @@ def transcribe_file(audio_path, tlog_path):
     )
     from coqui_stt_training.util.checkpoints import load_graph_for_evaluation
 
-    Config = _SttConfig()
-    initialize_config_globals(Config)
+    initialize_globals_from_cli()
+
     scorer = Scorer(FLAGS.lm_alpha, FLAGS.lm_beta, FLAGS.scorer_path, Config.alphabet)
     try:
         num_processes = cpu_count()

From f6bd7bcf7dbdbeddd4645c06f25f539162cb246c Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 06:23:19 -0400
Subject: [PATCH 06/17] Handle file_size passed as int

---
 training/coqui_stt_training/util/helpers.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/training/coqui_stt_training/util/helpers.py b/training/coqui_stt_training/util/helpers.py
index c8aa788a..6e386125 100644
--- a/training/coqui_stt_training/util/helpers.py
+++ b/training/coqui_stt_training/util/helpers.py
@@ -19,7 +19,8 @@ ValueRange = namedtuple("ValueRange", "start end r")
 
 
 def parse_file_size(file_size):
-    file_size = file_size.lower().strip()
+    if type(file_size) is str:
+        file_size = file_size.lower().strip()
     if len(file_size) == 0:
         return 0
     n = int(keep_only_digits(file_size))

From 4342906c50e43c593a2d8d5a223b50f73dc87d71 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 06:37:25 -0400
Subject: [PATCH 07/17] Better file_size handling

---
 training/coqui_stt_training/util/helpers.py | 18 +++++++++++-------
 1 file changed, 11 insertions(+), 7 deletions(-)

diff --git a/training/coqui_stt_training/util/helpers.py b/training/coqui_stt_training/util/helpers.py
index 6e386125..b897e4a9 100644
--- a/training/coqui_stt_training/util/helpers.py
+++ b/training/coqui_stt_training/util/helpers.py
@@ -21,13 +21,17 @@ ValueRange = namedtuple("ValueRange", "start end r")
 def parse_file_size(file_size):
     if type(file_size) is str:
         file_size = file_size.lower().strip()
-    if len(file_size) == 0:
-        return 0
-    n = int(keep_only_digits(file_size))
-    if file_size[-1] == "b":
-        file_size = file_size[:-1]
-    e = file_size[-1]
-    return SIZE_PREFIX_LOOKUP[e] * n if e in SIZE_PREFIX_LOOKUP else n
+        if len(file_size) == 0:
+            return 0
+        n = int(keep_only_digits(file_size))
+        if file_size[-1] == "b":
+            file_size = file_size[:-1]
+        e = file_size[-1]
+        return SIZE_PREFIX_LOOKUP[e] * n if e in SIZE_PREFIX_LOOKUP else n
+    elif type(file_size) is int:
+        return file_size
+    else:
+        raise ValueError("file_size not of type 'int' or 'str'")
 
 
 def keep_only_digits(txt):

From 0389560a927a5c692e3747e7f4beac27e7069bb6 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 07:16:58 -0400
Subject: [PATCH 08/17] Remove alphabet.txt from CI tests with bytes_output_mode

---
 bin/run-ci-ldc93s1_checkpoint_bytes.sh | 2 +-
 bin/run-ci-ldc93s1_new_bytes.sh        | 2 +-
 bin/run-ci-ldc93s1_new_bytes_tflite.sh | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/bin/run-ci-ldc93s1_checkpoint_bytes.sh b/bin/run-ci-ldc93s1_checkpoint_bytes.sh
index 96cf5998..6c068eee 100755
--- a/bin/run-ci-ldc93s1_checkpoint_bytes.sh
+++ b/bin/run-ci-ldc93s1_checkpoint_bytes.sh
@@ -14,7 +14,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
+python -u train.py --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new_bytes.sh b/bin/run-ci-ldc93s1_new_bytes.sh
index 17c65af4..5dec1fed 100755
--- a/bin/run-ci-ldc93s1_new_bytes.sh
+++ b/bin/run-ci-ldc93s1_new_bytes.sh
@@ -17,7 +17,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
+python -u train.py --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --feature_cache '/tmp/ldc93s1_cache' \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_new_bytes_tflite.sh b/bin/run-ci-ldc93s1_new_bytes_tflite.sh
index eb74eac1..22558942 100755
--- a/bin/run-ci-ldc93s1_new_bytes_tflite.sh
+++ b/bin/run-ci-ldc93s1_new_bytes_tflite.sh
@@ -16,7 +16,7 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
+python -u train.py --show_progressbar false \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt_bytes' \
   --export_dir '/tmp/train_bytes_tflite' \

From 6da7b5fc269c9b01a6bbbc65e19027b522608e03 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 08:44:57 -0400
Subject: [PATCH 09/17] Raise error when alphabet and bytes_mode both specified

---
 training/coqui_stt_training/util/config.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index 0a04ad77..6bb35f3a 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -104,7 +104,11 @@ class _SttConfig(Coqpit):
         if not self.available_devices:
             self.available_devices = [self.cpu_device]
 
-        if self.bytes_output_mode:
+        if self.bytes_output_mode and self.alphabet_config_path:
+            raise RuntimeError(
+                "You cannot set --alphabet_config_path *and* --bytes_output_mode"
+            )
+        elif self.bytes_output_mode:
             self.alphabet = UTF8Alphabet()
         elif self.alphabet_config_path:
             self.alphabet = Alphabet(os.path.abspath(self.alphabet_config_path))

From 90ce16fa152a168990fa62196f9025e99a338d9a Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 09:37:32 -0400
Subject: [PATCH 10/17] Shortening some print statements

---
 training/coqui_stt_training/util/config.py | 15 +++++++++------
 1 file changed, 9 insertions(+), 6 deletions(-)

diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index 6bb35f3a..4698e254 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -43,9 +43,11 @@ class _SttConfig(Coqpit):
             print(f"Parsed augmentations: {self.augmentations}")
         if self.augmentations and self.feature_cache and self.cache_for_epochs == 0:
             print(
-                "Due to current feature-cache settings the exact same sample augmentations of the first "
-                "epoch will be repeated on all following epochs. This could lead to unintended over-fitting. "
-                "You could use --cache_for_epochs to invalidate the cache after a given number of epochs."
+                "Due to your feature-cache settings, augmentations of "
+                "the first epoch will be repeated on all following epochs. "
+                "This may lead to unintended over-fitting. "
+                "You can use --cache_for_epochs to invalidate "
+                "the cache after a given number of epochs."
             )
 
         if self.normalize_sample_rate:
@@ -56,8 +58,9 @@ class _SttConfig(Coqpit):
         # Caching
         if self.cache_for_epochs == 1:
             print(
-                "--cache_for_epochs == 1 is (re-)creating the feature cache on every epoch but will never use it."
-                "You can either set --cache_for_epochs > 1, or not use feature caching at all."
+                "--cache_for_epochs == 1 is (re-)creating the feature cache "
+                "on every epoch but will never use it. You can either set "
+                "--cache_for_epochs > 1, or not use feature caching at all."
             )
 
         # Read-buffer
@@ -200,7 +203,7 @@ class _SttConfig(Coqpit):
     train_files: List[str] = field(
         default_factory=list,
         metadata=dict(
-            help="space-separated list of files specifying the dataset used for training. Multiple files will get merged. If empty, training will not be run."
+            help="space-separated list of files specifying the datasets used for training. Multiple files will get merged. If empty, training will not be run."
         ),
     )
     dev_files: List[str] = field(

From 3438dd2beb116bae49d4778a673f14e476592723 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 11:53:11 -0400
Subject: [PATCH 11/17] Fix checkpoint setting logic

---
 training/coqui_stt_training/util/config.py | 27 ++++++++++++++--------
 1 file changed, 17 insertions(+), 10 deletions(-)

diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index 4698e254..d7a19ffa 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -75,8 +75,23 @@ class _SttConfig(Coqpit):
             self.dropout_rate6 = self.dropout_rate
 
         # Set default checkpoint dir
-        if not self.checkpoint_dir:
-            self.checkpoint_dir = xdg.save_data_path(os.path.join("stt", "checkpoints"))
+        # If separate save and load flags were not specified, default to load and save
+        # from the same dir.
+
+        # if save_checkpoint_dir hasn't been set, or checkpoint_dir is new
+        if (not self.save_checkpoint_dir) or (self.save_checkpoint_dir is not self.checkpoint_dir):
+            if not self.checkpoint_dir:
+                self.checkpoint_dir = xdg.save_data_path(os.path.join("stt", "checkpoints"))
+                self.save_checkpoint_dir = self.checkpoint_dir
+            else:
+                self.save_checkpoint_dir = self.checkpoint_dir
+        # if load_checkpoint_dir hasn't been set, or checkpoint_dir is new
+        if (not self.load_checkpoint_dir) or (self.load_checkpoint_dir is not self.checkpoint_dir):
+            if not self.checkpoint_dir:
+                self.checkpoint_dir = xdg.load_data_path(os.path.join("stt", "checkpoints"))
+                self.load_checkpoint_dir = self.checkpoint_dir
+            else:
+                self.load_checkpoint_dir = self.checkpoint_dir
 
         if self.load_train not in ["last", "best", "init", "auto"]:
             self.load_train = "auto"
@@ -192,14 +207,6 @@ class _SttConfig(Coqpit):
             )
             sys.exit(1)
 
-        # If separate save and load flags were not specified, default to load and save
-        # from the same dir.
-        if not self.save_checkpoint_dir:
-            self.save_checkpoint_dir = self.checkpoint_dir
-
-        if not self.load_checkpoint_dir:
-            self.load_checkpoint_dir = self.checkpoint_dir
-
     train_files: List[str] = field(
         default_factory=list,
         metadata=dict(

From a050b076cba271a0fe189fe1e552601b8aabb0fe Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 12:07:24 -0400
Subject: [PATCH 12/17] Cleaner lines for CI args

---
 bin/run-ci-graph_augmentations.sh         | 3 ++-
 bin/run-ci-ldc93s1_checkpoint.sh          | 3 ++-
 bin/run-ci-ldc93s1_checkpoint_sdb.sh      | 3 ++-
 bin/run-ci-ldc93s1_new.sh                 | 3 ++-
 bin/run-ci-ldc93s1_new_metrics.sh         | 3 ++-
 bin/run-ci-ldc93s1_new_sdb.sh             | 3 ++-
 bin/run-ci-ldc93s1_new_sdb_csv.sh         | 3 ++-
 bin/run-ci-ldc93s1_singleshotinference.sh | 3 ++-
 bin/run-ci-ldc93s1_tflite.sh              | 6 ++++--
 9 files changed, 20 insertions(+), 10 deletions(-)

diff --git a/bin/run-ci-graph_augmentations.sh b/bin/run-ci-graph_augmentations.sh
index bd4855b9..85b5661c 100755
--- a/bin/run-ci-graph_augmentations.sh
+++ b/bin/run-ci-graph_augmentations.sh
@@ -14,7 +14,8 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" \
+  --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --scorer "" \
   --augment dropout \
diff --git a/bin/run-ci-ldc93s1_checkpoint.sh b/bin/run-ci-ldc93s1_checkpoint.sh
index 80aeea5d..a4591215 100755
--- a/bin/run-ci-ldc93s1_checkpoint.sh
+++ b/bin/run-ci-ldc93s1_checkpoint.sh
@@ -14,7 +14,8 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" \
+  --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_checkpoint_sdb.sh b/bin/run-ci-ldc93s1_checkpoint_sdb.sh
index 02d87b66..81126575 100755
--- a/bin/run-ci-ldc93s1_checkpoint_sdb.sh
+++ b/bin/run-ci-ldc93s1_checkpoint_sdb.sh
@@ -20,7 +20,8 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \
"data/alphabet.txt" --show_progressbar false --early_stop false \ +python -u train.py --alphabet_config_path "data/alphabet.txt" \ + --show_progressbar false --early_stop false \ --train_files ${ldc93s1_sdb} --train_batch_size 1 \ --dev_files ${ldc93s1_sdb} --dev_batch_size 1 \ --test_files ${ldc93s1_sdb} --test_batch_size 1 \ diff --git a/bin/run-ci-ldc93s1_new.sh b/bin/run-ci-ldc93s1_new.sh index ff7d7d25..a0261257 100755 --- a/bin/run-ci-ldc93s1_new.sh +++ b/bin/run-ci-ldc93s1_new.sh @@ -17,7 +17,8 @@ fi; # and when trying to run on multiple devices (like GPUs), this will break export CUDA_VISIBLE_DEVICES=0 -python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \ +python -u train.py --alphabet_config_path "data/alphabet.txt" \ + --show_progressbar false --early_stop false \ --train_files ${ldc93s1_csv} --train_batch_size 1 \ --feature_cache '/tmp/ldc93s1_cache' \ --dev_files ${ldc93s1_csv} --dev_batch_size 1 \ diff --git a/bin/run-ci-ldc93s1_new_metrics.sh b/bin/run-ci-ldc93s1_new_metrics.sh index d0fd8ccc..cf31bf22 100755 --- a/bin/run-ci-ldc93s1_new_metrics.sh +++ b/bin/run-ci-ldc93s1_new_metrics.sh @@ -17,7 +17,8 @@ fi; # and when trying to run on multiple devices (like GPUs), this will break export CUDA_VISIBLE_DEVICES=0 -python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \ +python -u train.py --alphabet_config_path "data/alphabet.txt" \ + --show_progressbar false --early_stop false \ --train_files ${ldc93s1_csv} --train_batch_size 1 \ --dev_files ${ldc93s1_csv} --dev_batch_size 1 \ --test_files ${ldc93s1_csv} --test_batch_size 1 \ diff --git a/bin/run-ci-ldc93s1_new_sdb.sh b/bin/run-ci-ldc93s1_new_sdb.sh index e3b26937..aa26e2c8 100755 --- a/bin/run-ci-ldc93s1_new_sdb.sh +++ b/bin/run-ci-ldc93s1_new_sdb.sh @@ -23,7 +23,8 @@ fi; # and when trying to run on multiple devices (like GPUs), this will break export CUDA_VISIBLE_DEVICES=0 -python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \ +python -u train.py --alphabet_config_path "data/alphabet.txt" \ + --show_progressbar false --early_stop false \ --train_files ${ldc93s1_sdb} --train_batch_size 1 \ --dev_files ${ldc93s1_sdb} --dev_batch_size 1 \ --test_files ${ldc93s1_sdb} --test_batch_size 1 \ diff --git a/bin/run-ci-ldc93s1_new_sdb_csv.sh b/bin/run-ci-ldc93s1_new_sdb_csv.sh index cacd880a..9f9a185b 100755 --- a/bin/run-ci-ldc93s1_new_sdb_csv.sh +++ b/bin/run-ci-ldc93s1_new_sdb_csv.sh @@ -23,7 +23,8 @@ fi; # and when trying to run on multiple devices (like GPUs), this will break export CUDA_VISIBLE_DEVICES=0 -python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \ +python -u train.py --alphabet_config_path "data/alphabet.txt" \ + --show_progressbar false --early_stop false \ --train_files ${ldc93s1_sdb} ${ldc93s1_csv} --train_batch_size 1 \ --feature_cache '/tmp/ldc93s1_cache_sdb_csv' \ --dev_files ${ldc93s1_sdb} ${ldc93s1_csv} --dev_batch_size 1 \ diff --git a/bin/run-ci-ldc93s1_singleshotinference.sh b/bin/run-ci-ldc93s1_singleshotinference.sh index c8e3839b..699b09cb 100755 --- a/bin/run-ci-ldc93s1_singleshotinference.sh +++ b/bin/run-ci-ldc93s1_singleshotinference.sh @@ -14,7 +14,8 @@ fi; # and when trying to run on multiple devices (like GPUs), this will break export CUDA_VISIBLE_DEVICES=0 -python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false --early_stop false \ +python -u train.py 
+  --show_progressbar false --early_stop false \
   --train_files ${ldc93s1_csv} --train_batch_size 1 \
   --dev_files ${ldc93s1_csv} --dev_batch_size 1 \
   --test_files ${ldc93s1_csv} --test_batch_size 1 \
diff --git a/bin/run-ci-ldc93s1_tflite.sh b/bin/run-ci-ldc93s1_tflite.sh
index 6d79313f..66342472 100755
--- a/bin/run-ci-ldc93s1_tflite.sh
+++ b/bin/run-ci-ldc93s1_tflite.sh
@@ -16,7 +16,8 @@ fi;
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" \
+  --show_progressbar false \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt' \
   --export_dir '/tmp/train_tflite' \
@@ -26,7 +27,8 @@ python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar
 
 mkdir /tmp/train_tflite/en-us
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" \
+  --show_progressbar false \
   --n_hidden 100 \
   --checkpoint_dir '/tmp/ckpt' \
   --export_dir '/tmp/train_tflite/en-us' \

From ae9280ef1a716525f3815012b5c737d038af422c Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 12:09:43 -0400
Subject: [PATCH 13/17] Cleaner lines for CI args

---
 bin/run-ldc93s1.sh | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/bin/run-ldc93s1.sh b/bin/run-ldc93s1.sh
index 46efa667..8fe87e87 100755
--- a/bin/run-ldc93s1.sh
+++ b/bin/run-ldc93s1.sh
@@ -20,7 +20,8 @@ fi
 # and when trying to run on multiple devices (like GPUs), this will break
 export CUDA_VISIBLE_DEVICES=0
 
-python -u train.py --alphabet_config_path "data/alphabet.txt" --show_progressbar false \
+python -u train.py --alphabet_config_path "data/alphabet.txt" \
+  --show_progressbar false \
   --train_files data/ldc93s1/ldc93s1.csv \
   --test_files data/ldc93s1/ldc93s1.csv \
   --train_batch_size 1 \

From ec37b3324a64d473590607e906dfb144b4792c93 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 15:13:39 -0400
Subject: [PATCH 14/17] Add example python script with initialize_globals_from_args()

---
 bin/run-ldc93s1.py | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100755 bin/run-ldc93s1.py

diff --git a/bin/run-ldc93s1.py b/bin/run-ldc93s1.py
new file mode 100755
index 00000000..ac81ff66
--- /dev/null
+++ b/bin/run-ldc93s1.py
@@ -0,0 +1,27 @@
+#!/usr/bin/env python
+import os
+from import_ldc93s1 import _download_and_preprocess_data as download_ldc
+from coqui_stt_training.util.config import Config, initialize_globals_from_args
+from coqui_stt_training.train import train, test, early_training_checks
+from coqui_stt_ctcdecoder import Alphabet
+import tensorflow.compat.v1 as tfv1
+
+# only one GPU for only one training sample
+os.environ['CUDA_VISIBLE_DEVICES']='0'
+
+download_ldc("data/ldc93s1")
+
+initialize_globals_from_args(
+    alphabet_config_path="data/alphabet.txt",
+    train_files=["data/ldc93s1/ldc93s1.csv"],
+    dev_files=["data/ldc93s1/ldc93s1.csv"],
+    test_files=["data/ldc93s1/ldc93s1.csv"],
+    n_hidden=100,
+    epochs=200
+)
+
+early_training_checks()
+
+train()
+tfv1.reset_default_graph()
+test()

From 414748f1fe7b611d4f11918afe44114fd6e4a7b5 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 15:23:56 -0400
Subject: [PATCH 15/17] Remove extra imports

---
 bin/run-ldc93s1.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)
diff --git a/bin/run-ldc93s1.py b/bin/run-ldc93s1.py
index ac81ff66..d6103128 100755
--- a/bin/run-ldc93s1.py
+++ b/bin/run-ldc93s1.py
@@ -1,9 +1,8 @@
 #!/usr/bin/env python
 import os
 from import_ldc93s1 import _download_and_preprocess_data as download_ldc
-from coqui_stt_training.util.config import Config, initialize_globals_from_args
+from coqui_stt_training.util.config import initialize_globals_from_args
 from coqui_stt_training.train import train, test, early_training_checks
-from coqui_stt_ctcdecoder import Alphabet
 import tensorflow.compat.v1 as tfv1
 
 # only one GPU for only one training sample
@@ -16,8 +15,9 @@ initialize_globals_from_args(
     train_files=["data/ldc93s1/ldc93s1.csv"],
     dev_files=["data/ldc93s1/ldc93s1.csv"],
     test_files=["data/ldc93s1/ldc93s1.csv"],
+    augment=["time_mask"],
     n_hidden=100,
-    epochs=200
+    epochs=100
 )
 
 early_training_checks()

From b6d40a34516b5441561340179c1d93e0370dd734 Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Wed, 21 Jul 2021 15:35:33 -0400
Subject: [PATCH 16/17] Add CI test for in-script variable setting

---
 bin/run-ldc93s1.py              | 3 ++-
 ci_scripts/train-extra-tests.sh | 3 +++
 2 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/bin/run-ldc93s1.py b/bin/run-ldc93s1.py
index d6103128..610d20ba 100755
--- a/bin/run-ldc93s1.py
+++ b/bin/run-ldc93s1.py
@@ -11,13 +11,14 @@ os.environ['CUDA_VISIBLE_DEVICES']='0'
 download_ldc("data/ldc93s1")
 
 initialize_globals_from_args(
+    load_train="init",
     alphabet_config_path="data/alphabet.txt",
     train_files=["data/ldc93s1/ldc93s1.csv"],
     dev_files=["data/ldc93s1/ldc93s1.csv"],
     test_files=["data/ldc93s1/ldc93s1.csv"],
     augment=["time_mask"],
     n_hidden=100,
-    epochs=100
+    epochs=200
 )
 
 early_training_checks()
diff --git a/ci_scripts/train-extra-tests.sh b/ci_scripts/train-extra-tests.sh
index 1f76a0ed..50265afc 100755
--- a/ci_scripts/train-extra-tests.sh
+++ b/ci_scripts/train-extra-tests.sh
@@ -66,3 +66,6 @@ time ./bin/run-ci-ldc93s1_checkpoint_sdb.sh
 
 # Bytes output mode, resuming from checkpoint
 time ./bin/run-ci-ldc93s1_checkpoint_bytes.sh
+
+# Training with args set via initialize_globals_from_args()
+time python ./bin/run-ldc93s1.py

From b4827fa4623baa7b2d8a76f2c8c00a20086e00dd Mon Sep 17 00:00:00 2001
From: Josh Meyer
Date: Thu, 22 Jul 2021 05:39:45 -0400
Subject: [PATCH 17/17] Formatting changes from pre-commit

---
 bin/run-ldc93s1.py                         |  4 +--
 training/coqui_stt_training/util/config.py | 41 ++++++++++++++++------
 2 files changed, 33 insertions(+), 12 deletions(-)

diff --git a/bin/run-ldc93s1.py b/bin/run-ldc93s1.py
index 610d20ba..e266b7a4 100755
--- a/bin/run-ldc93s1.py
+++ b/bin/run-ldc93s1.py
@@ -6,7 +6,7 @@ from coqui_stt_training.train import train, test, early_training_checks
 import tensorflow.compat.v1 as tfv1
 
 # only one GPU for only one training sample
-os.environ['CUDA_VISIBLE_DEVICES']='0'
+os.environ["CUDA_VISIBLE_DEVICES"] = "0"
 
 download_ldc("data/ldc93s1")
 
@@ -18,7 +18,7 @@ initialize_globals_from_args(
     test_files=["data/ldc93s1/ldc93s1.csv"],
     augment=["time_mask"],
     n_hidden=100,
-    epochs=200
+    epochs=200,
 )
 
 early_training_checks()
diff --git a/training/coqui_stt_training/util/config.py b/training/coqui_stt_training/util/config.py
index d7a19ffa..9427c382 100755
--- a/training/coqui_stt_training/util/config.py
+++ b/training/coqui_stt_training/util/config.py
@@ -79,16 +79,24 @@ class _SttConfig(Coqpit):
         # If separate save and load flags were not specified, default to load and save
         # from the same dir.
 
         # if save_checkpoint_dir hasn't been set, or checkpoint_dir is new
-        if (not self.save_checkpoint_dir) or (self.save_checkpoint_dir is not self.checkpoint_dir):
+        if (not self.save_checkpoint_dir) or (
+            self.save_checkpoint_dir is not self.checkpoint_dir
+        ):
             if not self.checkpoint_dir:
-                self.checkpoint_dir = xdg.save_data_path(os.path.join("stt", "checkpoints"))
+                self.checkpoint_dir = xdg.save_data_path(
+                    os.path.join("stt", "checkpoints")
+                )
                 self.save_checkpoint_dir = self.checkpoint_dir
             else:
                 self.save_checkpoint_dir = self.checkpoint_dir
         # if load_checkpoint_dir hasn't been set, or checkpoint_dir is new
-        if (not self.load_checkpoint_dir) or (self.load_checkpoint_dir is not self.checkpoint_dir):
+        if (not self.load_checkpoint_dir) or (
+            self.load_checkpoint_dir is not self.checkpoint_dir
+        ):
             if not self.checkpoint_dir:
-                self.checkpoint_dir = xdg.load_data_path(os.path.join("stt", "checkpoints"))
+                self.checkpoint_dir = xdg.load_data_path(
+                    os.path.join("stt", "checkpoints")
+                )
                 self.load_checkpoint_dir = self.checkpoint_dir
             else:
                 self.load_checkpoint_dir = self.checkpoint_dir
@@ -138,10 +146,12 @@ class _SttConfig(Coqpit):
         # please refer to doc/Geometry.md
 
         # Number of MFCC features
-        self.n_input = 26 # TODO: Determine this programmatically from the sample rate
+        self.n_input = 26  # TODO: Determine this programmatically from the sample rate
 
         # The number of frames in the context
-        self.n_context = 9 # TODO: Determine the optimal value using a validation data set
+        self.n_context = (
+            9  # TODO: Determine the optimal value using a validation data set
+        )
 
         # Number of units in hidden layers
         self.n_hidden = self.n_hidden
@@ -171,11 +181,17 @@ class _SttConfig(Coqpit):
                 "--feature_win_len value ({}) in milliseconds ({}) multiplied "
                 "by --audio_sample_rate value ({}) must be an integer value. Adjust "
                 "your --feature_win_len value or resample your audio accordingly."
-                "".format(self.feature_win_len, self.feature_win_len / 1000, self.audio_sample_rate)
+                "".format(
+                    self.feature_win_len,
+                    self.feature_win_len / 1000,
+                    self.audio_sample_rate,
+                )
             )
             sys.exit(1)
 
-        self.audio_window_samples = self.audio_sample_rate * (self.feature_win_len / 1000)
+        self.audio_window_samples = self.audio_sample_rate * (
+            self.feature_win_len / 1000
+        )
 
         # Stride for feature computations in samples
         if (self.feature_win_step * self.audio_sample_rate) % 1000 != 0:
@@ -184,12 +200,16 @@ class _SttConfig(Coqpit):
                 "by --audio_sample_rate value ({}) must be an integer value. Adjust "
                 "your --feature_win_step value or resample your audio accordingly."
                 "".format(
-                    self.feature_win_step, self.feature_win_step / 1000, self.audio_sample_rate
+                    self.feature_win_step,
+                    self.feature_win_step / 1000,
+                    self.audio_sample_rate,
                 )
             )
             sys.exit(1)
 
-        self.audio_step_samples = self.audio_sample_rate * (self.feature_win_step / 1000)
+        self.audio_step_samples = self.audio_sample_rate * (
+            self.feature_win_step / 1000
+        )
 
         if self.one_shot_infer:
             if not path_exists_remote(self.one_shot_infer):
@@ -718,6 +738,7 @@ def initialize_globals_from_cli():
     c.__post_init__()
     _ConfigSingleton._config = c  # pylint: disable=protected-access
 
+
 def initialize_globals_from_args(**override_args):
     # Update Config with new args
     c = _SttConfig(**override_args)
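
The series leaves downstream code with two configuration entry points: initialize_globals_from_cli() (used by train.py, evaluate.py, transcribe.py, and lm_optimizer.py) and initialize_globals_from_args() (used by bin/run-ldc93s1.py). A minimal sketch of the programmatic path, reusing the alphabet and LDC93S1 paths from the CI scripts above (the n_hidden value is purely illustrative):

    from coqui_stt_training.util.config import Config, initialize_globals_from_args

    # _SttConfig is a dataclass, so constructing it runs __post_init__ and with
    # it the same validation and derived-value setup as the CLI path: alphabet
    # loading, checkpoint-dir defaults, geometry constants, and so on.
    initialize_globals_from_args(
        alphabet_config_path="data/alphabet.txt",
        train_files=["data/ldc93s1/ldc93s1.csv"],
        n_hidden=100,
    )

    # Derived values are then visible on the Config singleton:
    assert Config.n_hidden_6 == Config.alphabet.GetSize() + 1  # includes CTC blank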