Merge pull request #177 from TensorSpeech/fix/refactor

Refactor repository
TensorSpeech · Apr 17, 2021 · 0143857
2 parents ac06a8b + 11d6afc
commit 0143857
Show file tree

Hide file tree

Showing 136 changed files with 3,508 additions and 7,975 deletions.
diff --git a/README.md b/README.md
@@ -21,6 +21,7 @@ TensorFlowASR implements some automatic speech recognition architectures such as
 
 ## What's New?
 
+- (04/17/2021) Refactor repository with new version 1.x
 - (02/16/2021) Supported for TPU training
 - (12/27/2020) Supported _naive_ token level timestamp, see [demo](./examples/demonstration/conformer.py) with flag `--timestamp`
 - (12/17/2020) Supported ContextNet [http://arxiv.org/abs/2005.03191](http://arxiv.org/abs/2005.03191)

diff --git a/examples/conformer/config.yml b/examples/conformer/config.yml
@@ -24,14 +24,14 @@ speech_config:
   normalize_per_feature: False
 
 decoder_config:
-  vocabulary: null
+  vocabulary: ./vocabularies/librispeech/librispeech_train_10_1008.subwords
   target_vocab_size: 1000
   max_subword_length: 10
   blank_at_zero: True
-  beam_width: 5
+  beam_width: 0
   norm_score: True
   corpus_files:
-    - /media/nlhuy/Data/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
+    - /mnt/h/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
 
 model_config:
   name: conformer
@@ -40,7 +40,7 @@ model_config:
     filters: 144
     kernel_size: 3
     strides: 2
-  encoder_positional_encoding: sinusoid_concat_v2
+  encoder_positional_encoding: sinusoid_concat
   encoder_dmodel: 144
   encoder_num_blocks: 16
   encoder_head_size: 36
@@ -66,7 +66,7 @@ learning_config:
   train_dataset_config:
     use_tf: True
     augmentation_config:
-      after:
+      feature_augment:
         time_masking:
           num_masks: 10
           mask_factor: 100
@@ -75,19 +75,18 @@ learning_config:
           num_masks: 1
           mask_factor: 27
     data_paths:
-      - /mnt/Data/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
-    tfrecords_dir: /mnt/Miscellanea/Datasets/Speech/LibriSpeech/tfrecords
+      - /mnt/h/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
+    tfrecords_dir: null
     shuffle: True
     cache: True
-    cache_percent: 0.2
     buffer_size: 100
     drop_remainder: True
     stage: train
 
   eval_dataset_config:
     use_tf: True
     data_paths: null
-    tfrecords_dir: /mnt/Miscellanea/Datasets/Speech/LibriSpeech/tfrecords
+    tfrecords_dir: null
     shuffle: False
     cache: True
     buffer_size: 100
@@ -97,7 +96,7 @@ learning_config:
   test_dataset_config:
     use_tf: True
     data_paths: null
-    tfrecords_dir: /mnt/Miscellanea/Datasets/Speech/LibriSpeech/tfrecords
+    tfrecords_dir: null
     shuffle: False
     cache: True
     buffer_size: 100
@@ -106,26 +105,21 @@ learning_config:
 
   optimizer_config:
     warmup_steps: 40000
-    beta1: 0.9
-    beta2: 0.98
+    beta_1: 0.9
+    beta_2: 0.98
     epsilon: 1e-9
 
   running_config:
     batch_size: 2
-    accumulation_steps: 4
     num_epochs: 50
-    outdir: /mnt/Miscellanea/Models/local/conformer
-    log_interval_steps: 300
-    eval_interval_steps: 500
-    save_interval_steps: 1000
     checkpoint:
-      filepath: /mnt/Miscellanea/Models/local/conformer/checkpoints/{epoch:02d}.h5
+      filepath: /mnt/e/Models/local/conformer/checkpoints/{epoch:02d}.h5
       save_best_only: True
-      save_weights_only: False
+      save_weights_only: True
       save_freq: epoch
-    states_dir: /mnt/Miscellanea/Models/local/conformer/states
+    states_dir: /mnt/e/Models/local/conformer/states
     tensorboard:
-      log_dir: /mnt/Miscellanea/Models/local/conformer/tensorboard
+      log_dir: /mnt/e/Models/local/conformer/tensorboard
       histogram_freq: 1
       write_graph: True
       write_images: True

diff --git a/examples/conformer/masking/README.md b/examples/conformer/masking/README.md
diff --git a/examples/conformer/masking/masking.py b/examples/conformer/masking/masking.py
diff --git a/examples/conformer/masking/train_ga_masking_conformer.py b/examples/conformer/masking/train_ga_masking_conformer.py