Skip to content

Commit

Permalink
Merge pull request #177 from TensorSpeech/fix/refactor
Browse files (browse the repository at this point in the history)
Refactor repository
  • Loading branch information
nglehuy authored Apr 17, 2021
2 parents ac06a8b + 11d6afc commit 0143857
Show file tree
Hide file tree
Showing 136 changed files with 3,508 additions and 7,975 deletions.
1 change: 1 addition & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,7 @@ TensorFlowASR implements some automatic speech recognition architectures such as

## What's New?

- (04/17/2021) Refactored the repository for the new 1.x version
- (02/16/2021) Added support for TPU training
- (12/27/2020) Added support for _naive_ token-level timestamps; see the [demo](./examples/demonstration/conformer.py) with the `--timestamp` flag
- (12/17/2020) Added support for ContextNet [http://arxiv.org/abs/2005.03191](http://arxiv.org/abs/2005.03191)
Expand Down
36 changes: 15 additions & 21 deletions examples/conformer/config.yml
Original file line number Diff line number Diff line change
Expand Up @@ -24,14 +24,14 @@ speech_config:
normalize_per_feature: False

decoder_config:
vocabulary: null
vocabulary: ./vocabularies/librispeech/librispeech_train_10_1008.subwords
target_vocab_size: 1000
max_subword_length: 10
blank_at_zero: True
beam_width: 5
beam_width: 0
norm_score: True
corpus_files:
- /media/nlhuy/Data/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
- /mnt/h/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv

model_config:
name: conformer
Expand All @@ -40,7 +40,7 @@ model_config:
filters: 144
kernel_size: 3
strides: 2
encoder_positional_encoding: sinusoid_concat_v2
encoder_positional_encoding: sinusoid_concat
encoder_dmodel: 144
encoder_num_blocks: 16
encoder_head_size: 36
Expand All @@ -66,7 +66,7 @@ learning_config:
train_dataset_config:
use_tf: True
augmentation_config:
after:
feature_augment:
time_masking:
num_masks: 10
mask_factor: 100
Expand All @@ -75,19 +75,18 @@ learning_config:
num_masks: 1
mask_factor: 27
data_paths:
- /mnt/Data/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
tfrecords_dir: /mnt/Miscellanea/Datasets/Speech/LibriSpeech/tfrecords
- /mnt/h/ML/Datasets/ASR/Raw/LibriSpeech/train-clean-100/transcripts.tsv
tfrecords_dir: null
shuffle: True
cache: True
cache_percent: 0.2
buffer_size: 100
drop_remainder: True
stage: train

eval_dataset_config:
use_tf: True
data_paths: null
tfrecords_dir: /mnt/Miscellanea/Datasets/Speech/LibriSpeech/tfrecords
tfrecords_dir: null
shuffle: False
cache: True
buffer_size: 100
Expand All @@ -97,7 +96,7 @@ learning_config:
test_dataset_config:
use_tf: True
data_paths: null
tfrecords_dir: /mnt/Miscellanea/Datasets/Speech/LibriSpeech/tfrecords
tfrecords_dir: null
shuffle: False
cache: True
buffer_size: 100
Expand All @@ -106,26 +105,21 @@ learning_config:

optimizer_config:
warmup_steps: 40000
beta1: 0.9
beta2: 0.98
beta_1: 0.9
beta_2: 0.98
epsilon: 1e-9

running_config:
batch_size: 2
accumulation_steps: 4
num_epochs: 50
outdir: /mnt/Miscellanea/Models/local/conformer
log_interval_steps: 300
eval_interval_steps: 500
save_interval_steps: 1000
checkpoint:
filepath: /mnt/Miscellanea/Models/local/conformer/checkpoints/{epoch:02d}.h5
filepath: /mnt/e/Models/local/conformer/checkpoints/{epoch:02d}.h5
save_best_only: True
save_weights_only: False
save_weights_only: True
save_freq: epoch
states_dir: /mnt/Miscellanea/Models/local/conformer/states
states_dir: /mnt/e/Models/local/conformer/states
tensorboard:
log_dir: /mnt/Miscellanea/Models/local/conformer/tensorboard
log_dir: /mnt/e/Models/local/conformer/tensorboard
histogram_freq: 1
write_graph: True
write_images: True
Expand Down
5 changes: 0 additions & 5 deletions examples/conformer/masking/README.md

This file was deleted.

32 changes: 0 additions & 32 deletions examples/conformer/masking/masking.py

This file was deleted.

131 changes: 0 additions & 131 deletions examples/conformer/masking/train_ga_masking_conformer.py

This file was deleted.

Loading

0 comments on commit 0143857

Please sign in to comment.