Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 6 additions & 0 deletions examples/asr/conf/carnelinet/carnelinet_384.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,8 @@ model:
use_start_end_token: false
max_duration: 16.7
shuffle: true
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -50,13 +52,17 @@ model:
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: 16000
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

model_defaults:
repeat: 5
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/citrinet/citrinet_1024.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,8 @@ model:
max_duration: 20.0
shuffle: true
use_start_end_token: false
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -39,13 +41,17 @@ model:
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: 16000
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

model_defaults:
repeat: 5
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/citrinet/citrinet_384.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,8 @@ model:
max_duration: 16.7
shuffle: true
use_start_end_token: false
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -39,13 +41,17 @@ model:
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: 16000
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

model_defaults:
repeat: 5
Expand Down
4 changes: 4 additions & 0 deletions examples/asr/conf/citrinet/config_bpe.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@ model:
trim_silence: True
max_duration: 16.7
shuffle: True
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -26,6 +28,8 @@ model:
sample_rate: 16000
batch_size: 32
shuffle: False
num_workers: 8
pin_memory: true

tokenizer:
dir: ??? # path to directory which contains either tokenizer.model (bpe) or vocab.txt (for wpe)
Expand Down
4 changes: 4 additions & 0 deletions examples/asr/conf/config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,8 @@ model:
trim_silence: True
max_duration: 16.7
shuffle: True
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -29,6 +31,8 @@ model:
labels: *labels
batch_size: 32
shuffle: False
num_workers: 8
pin_memory: true

preprocessor:
_target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/contextnet_rnnt/config_rnnt.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,8 @@ model:
max_duration: 16.7
labels: ${model.labels}
shuffle: true
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -30,13 +32,17 @@ model:
batch_size: 32
shuffle: false
labels: ${model.labels}
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: ${model.sample_rate}
batch_size: 32
shuffle: false
labels: ${model.labels}
num_workers: 8
pin_memory: true

model_defaults:
repeat: 5
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/contextnet_rnnt/config_rnnt_bpe.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,8 @@ model:
max_duration: 16.7
labels: []
shuffle: true
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -30,13 +32,17 @@ model:
batch_size: 32
shuffle: false
labels: []
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: ${model.sample_rate}
batch_size: 32
shuffle: false
labels: []
num_workers: 8
pin_memory: true

model_defaults:
repeat: 5
Expand Down
4 changes: 4 additions & 0 deletions examples/asr/conf/jasper/jasper_10x5dr.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,8 @@ model:
trim_silence: True
max_duration: 16.7
shuffle: True
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -28,6 +30,8 @@ model:
labels: *labels
batch_size: 32
shuffle: False
num_workers: 8
pin_memory: true

preprocessor:
_target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/marblenet/marblenet_3x2x64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,8 @@ model:
tarred_audio_filepaths: null
tarred_shard_strategy: "scatter"
shuffle_n: 2048
num_workers: 8
pin_memory: true
# bucketing params
bucketing_strategy: "synced_randomized"
bucketing_batch_size: null
Expand All @@ -38,6 +40,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: False
num_workers: 8
pin_memory: true
val_loss_idx: 0

test_ds:
Expand All @@ -46,6 +50,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: False
num_workers: 8
pin_memory: true
test_loss_idx: 0

preprocessor:
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/matchboxnet/matchboxnet_3x1x64_v1.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: True
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -44,6 +46,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: False
num_workers: 8
pin_memory: true
val_loss_idx: 0

test_ds:
Expand All @@ -52,6 +56,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: False
num_workers: 8
pin_memory: true
test_loss_idx: 0

preprocessor:
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/matchboxnet/matchboxnet_3x1x64_v2.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: True
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -44,6 +46,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: False
num_workers: 8
pin_memory: true
val_loss_idx: 0

test_ds:
Expand All @@ -52,6 +56,8 @@ model:
labels: ${model.labels}
batch_size: 128
shuffle: False
num_workers: 8
pin_memory: true
test_loss_idx: 0

preprocessor:
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/quartznet/quartznet_15x5.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,8 @@ model:
trim_silence: True
max_duration: 16.7
shuffle: True
num_workers: 8
pin_memory: true
# tarred datasets
is_tarred: false
tarred_audio_filepaths: null
Expand All @@ -30,13 +32,17 @@ model:
labels: *labels
batch_size: 32
shuffle: False
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: 16000
labels: *labels
batch_size: 32
shuffle: False
num_workers: 8
pin_memory: true

preprocessor:
_target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor
Expand Down
4 changes: 4 additions & 0 deletions examples/asr/conf/ssl/citrinet/citrinet_ssl_1024.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -28,6 +28,8 @@ model:
tarred_audio_filepaths: null
shuffle_n: 2048
use_start_end_token: false
num_workers: 8
pin_memory: true
# bucketing params
bucketing_strategy: "synced_randomized"
bucketing_batch_size: null
Expand All @@ -38,6 +40,8 @@ model:
batch_size: 32
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true
max_duration: 35.0
min_duration: 8.0

Expand Down
2 changes: 2 additions & 0 deletions examples/asr/conf/ssl/citrinet/citrinet_ssl_ci.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,8 @@ model:
is_tarred: false
tarred_audio_filepaths: null
use_start_end_token: false
num_workers: 8
pin_memory: true
# bucketing params
bucketing_strategy: "synced_randomized"
bucketing_batch_size: null
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/wav2vec/wav2vecCTC.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -19,20 +19,26 @@ model:
is_tarred: false
tarred_audio_filepaths: null
use_start_end_token: false
num_workers: 8
pin_memory: true

validation_ds:
manifest_filepath: ???
sample_rate: *sample_rate
batch_size: ???
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: *sample_rate
batch_size: null
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

tokenizer:
dir: ??? # path to directory which contains either tokenizer.model (bpe) or vocab.txt (for wpe)
Expand Down
6 changes: 6 additions & 0 deletions examples/asr/conf/wav2vec/wav2vecCTC_large.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -18,20 +18,26 @@ model:
is_tarred: false
tarred_audio_filepaths: null
use_start_end_token: false
num_workers: 8
pin_memory: true

validation_ds:
manifest_filepath: ???
sample_rate: *sample_rate
batch_size: 4
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

test_ds:
manifest_filepath: null
sample_rate: *sample_rate
batch_size: null
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

tokenizer:
dir: ??? # path to directory which contains either tokenizer.model (bpe) or vocab.txt (for wpe)
Expand Down
4 changes: 4 additions & 0 deletions examples/asr/conf/wav2vec/wav2vec_pretrain.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -24,13 +24,17 @@ model:
is_tarred: false
tarred_audio_filepaths: null
use_start_end_token: false
num_workers: 8
pin_memory: true

validation_ds:
manifest_filepath: ???
sample_rate: *sample_rate
batch_size: ???
shuffle: false
use_start_end_token: false
num_workers: 8
pin_memory: true

preprocessor:
_target_: nemo.collections.asr.modules.wav2vec_modules.ConvFeatureEncoder
Expand Down
Loading