NVIDIA-NeMo · titu1994 · May 26, 2022 · May 26, 2022
diff --git a/examples/asr/conf/carnelinet/carnelinet_384.yaml b/examples/asr/conf/carnelinet/carnelinet_384.yaml
@@ -35,6 +35,8 @@ model:
     use_start_end_token: false
     max_duration: 16.7
     shuffle: true
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -50,13 +52,17 @@ model:
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: 16000
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   model_defaults:
     repeat: 5

diff --git a/examples/asr/conf/citrinet/citrinet_1024.yaml b/examples/asr/conf/citrinet/citrinet_1024.yaml
@@ -25,6 +25,8 @@ model:
     max_duration: 20.0
     shuffle: true
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -39,13 +41,17 @@ model:
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: 16000
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   model_defaults:
     repeat: 5

diff --git a/examples/asr/conf/citrinet/citrinet_384.yaml b/examples/asr/conf/citrinet/citrinet_384.yaml
@@ -24,6 +24,8 @@ model:
     max_duration: 16.7
     shuffle: true
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -39,13 +41,17 @@ model:
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: 16000
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   model_defaults:
     repeat: 5

diff --git a/examples/asr/conf/citrinet/config_bpe.yaml b/examples/asr/conf/citrinet/config_bpe.yaml
@@ -12,6 +12,8 @@ model:
     trim_silence: True
     max_duration: 16.7
     shuffle: True
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -26,6 +28,8 @@ model:
     sample_rate: 16000
     batch_size: 32
     shuffle: False
+    num_workers: 8
+    pin_memory: true
 
   tokenizer:
     dir: ???  # path to directory which contains either tokenizer.model (bpe) or vocab.txt (for wpe)

diff --git a/examples/asr/conf/config.yaml b/examples/asr/conf/config.yaml
@@ -15,6 +15,8 @@ model:
     trim_silence: True
     max_duration: 16.7
     shuffle: True
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -29,6 +31,8 @@ model:
     labels: *labels
     batch_size: 32
     shuffle: False
+    num_workers: 8
+    pin_memory: true
 
   preprocessor:
     _target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor

diff --git a/examples/asr/conf/contextnet_rnnt/config_rnnt.yaml b/examples/asr/conf/contextnet_rnnt/config_rnnt.yaml
@@ -15,6 +15,8 @@ model:
     max_duration: 16.7
     labels: ${model.labels}
     shuffle: true
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -30,13 +32,17 @@ model:
     batch_size: 32
     shuffle: false
     labels: ${model.labels}
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: ${model.sample_rate}
     batch_size: 32
     shuffle: false
     labels: ${model.labels}
+    num_workers: 8
+    pin_memory: true
 
   model_defaults:
     repeat: 5

diff --git a/examples/asr/conf/contextnet_rnnt/config_rnnt_bpe.yaml b/examples/asr/conf/contextnet_rnnt/config_rnnt_bpe.yaml
@@ -16,6 +16,8 @@ model:
     max_duration: 16.7
     labels: []
     shuffle: true
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -30,13 +32,17 @@ model:
     batch_size: 32
     shuffle: false
     labels: []
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: ${model.sample_rate}
     batch_size: 32
     shuffle: false
     labels: []
+    num_workers: 8
+    pin_memory: true
 
   model_defaults:
     repeat: 5

diff --git a/examples/asr/conf/jasper/jasper_10x5dr.yaml b/examples/asr/conf/jasper/jasper_10x5dr.yaml
@@ -13,6 +13,8 @@ model:
     trim_silence: True
     max_duration: 16.7
     shuffle: True
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -28,6 +30,8 @@ model:
     labels: *labels
     batch_size: 32
     shuffle: False
+    num_workers: 8
+    pin_memory: true
 
   preprocessor:
     _target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor

diff --git a/examples/asr/conf/marblenet/marblenet_3x2x64.yaml b/examples/asr/conf/marblenet/marblenet_3x2x64.yaml
@@ -19,6 +19,8 @@ model:
     tarred_audio_filepaths: null
     tarred_shard_strategy: "scatter"
     shuffle_n: 2048
+    num_workers: 8
+    pin_memory: true
     # bucketing params
     bucketing_strategy: "synced_randomized"
     bucketing_batch_size: null
@@ -38,6 +40,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: False
+    num_workers: 8
+    pin_memory: true
     val_loss_idx: 0
 
   test_ds:
@@ -46,6 +50,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: False
+    num_workers: 8
+    pin_memory: true
     test_loss_idx: 0
 
   preprocessor:

diff --git a/examples/asr/conf/matchboxnet/matchboxnet_3x1x64_v1.yaml b/examples/asr/conf/matchboxnet/matchboxnet_3x1x64_v1.yaml
@@ -21,6 +21,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: True
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -44,6 +46,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: False
+    num_workers: 8
+    pin_memory: true
     val_loss_idx: 0
 
   test_ds:
@@ -52,6 +56,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: False
+    num_workers: 8
+    pin_memory: true
     test_loss_idx: 0
 
   preprocessor:

diff --git a/examples/asr/conf/matchboxnet/matchboxnet_3x1x64_v2.yaml b/examples/asr/conf/matchboxnet/matchboxnet_3x1x64_v2.yaml
@@ -21,6 +21,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: True
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -44,6 +46,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: False
+    num_workers: 8
+    pin_memory: true
     val_loss_idx: 0
 
   test_ds:
@@ -52,6 +56,8 @@ model:
     labels: ${model.labels}
     batch_size: 128
     shuffle: False
+    num_workers: 8
+    pin_memory: true
     test_loss_idx: 0
 
   preprocessor:

diff --git a/examples/asr/conf/quartznet/quartznet_15x5.yaml b/examples/asr/conf/quartznet/quartznet_15x5.yaml
@@ -16,6 +16,8 @@ model:
     trim_silence: True
     max_duration: 16.7
     shuffle: True
+    num_workers: 8
+    pin_memory: true
     # tarred datasets
     is_tarred: false
     tarred_audio_filepaths: null
@@ -30,13 +32,17 @@ model:
     labels: *labels
     batch_size: 32
     shuffle: False
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: 16000
     labels: *labels
     batch_size: 32
     shuffle: False
+    num_workers: 8
+    pin_memory: true
 
   preprocessor:
     _target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor

diff --git a/examples/asr/conf/ssl/citrinet/citrinet_ssl_1024.yaml b/examples/asr/conf/ssl/citrinet/citrinet_ssl_1024.yaml
@@ -28,6 +28,8 @@ model:
     tarred_audio_filepaths: null
     shuffle_n: 2048
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
     # bucketing params
     bucketing_strategy: "synced_randomized"
     bucketing_batch_size: null
@@ -38,6 +40,8 @@ model:
     batch_size: 32
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
     max_duration: 35.0
     min_duration: 8.0
 

diff --git a/examples/asr/conf/ssl/citrinet/citrinet_ssl_ci.yaml b/examples/asr/conf/ssl/citrinet/citrinet_ssl_ci.yaml
@@ -16,6 +16,8 @@ model:
     is_tarred: false
     tarred_audio_filepaths: null
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
     # bucketing params
     bucketing_strategy: "synced_randomized"
     bucketing_batch_size: null

diff --git a/examples/asr/conf/wav2vec/wav2vecCTC.yaml b/examples/asr/conf/wav2vec/wav2vecCTC.yaml
@@ -19,20 +19,26 @@ model:
     is_tarred: false
     tarred_audio_filepaths: null
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   validation_ds:
     manifest_filepath: ???
     sample_rate: *sample_rate
     batch_size: ???
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: *sample_rate
     batch_size: null
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   tokenizer:
     dir: ??? # path to directory which contains either tokenizer.model (bpe) or vocab.txt (for wpe)

diff --git a/examples/asr/conf/wav2vec/wav2vecCTC_large.yaml b/examples/asr/conf/wav2vec/wav2vecCTC_large.yaml
@@ -18,20 +18,26 @@ model:
     is_tarred: false
     tarred_audio_filepaths: null
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   validation_ds:
     manifest_filepath: ???
     sample_rate: *sample_rate
     batch_size: 4
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   test_ds:
     manifest_filepath: null
     sample_rate: *sample_rate
     batch_size: null
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   tokenizer:
     dir: ??? # path to directory which contains either tokenizer.model (bpe) or vocab.txt (for wpe)

diff --git a/examples/asr/conf/wav2vec/wav2vec_pretrain.yaml b/examples/asr/conf/wav2vec/wav2vec_pretrain.yaml
@@ -24,13 +24,17 @@ model:
     is_tarred: false
     tarred_audio_filepaths: null
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   validation_ds:
     manifest_filepath: ???
     sample_rate: *sample_rate
     batch_size: ???
     shuffle: false
     use_start_end_token: false
+    num_workers: 8
+    pin_memory: true
 
   preprocessor:
     _target_: nemo.collections.asr.modules.wav2vec_modules.ConvFeatureEncoder