Skip to content

Commit 3d2cb42

Browse files
committed
Typo fixes and add cspell ignores
1 parent a253500 commit 3d2cb42

84 files changed

Lines changed: 185 additions & 180 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

recipes/AISHELL-1/ASR/transformer/train.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -256,7 +256,7 @@ def on_fit_start(self):
256256
self.checkpointer.recover_if_possible()
257257

258258
def on_evaluate_start(self, max_key=None, min_key=None):
259-
"""perform checkpoint averge if needed"""
259+
"""perform checkpoint average if needed"""
260260
super().on_evaluate_start()
261261

262262
ckpts = self.checkpointer.find_checkpoints(

recipes/AISHELL-1/ASR/transformer/train_with_wav2vect.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -241,7 +241,7 @@ def on_fit_start(self):
241241
)
242242

243243
def on_evaluate_start(self, max_key=None, min_key=None):
244-
"""perform checkpoint averge if needed"""
244+
"""perform checkpoint average if needed"""
245245
super().on_evaluate_start()
246246

247247
ckpts = self.checkpointer.find_checkpoints(

recipes/AMI/Diarization/experiment.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -109,7 +109,7 @@ def embedding_computation_loop(split, set_loader, stat_file):
109109
modelset = np.array(modelset, dtype="|O")
110110
segset = np.array(segset, dtype="|O")
111111

112-
# Intialize variables for start, stop and stat0.
112+
# Initialize variables for start, stop and stat0.
113113
s = np.array([None] * embeddings.shape[0])
114114
b = np.array([[1.0]] * embeddings.shape[0])
115115

@@ -397,7 +397,7 @@ def dev_nn_tuner(full_meta, split_type):
397397
DER_list = []
398398
pval = None
399399

400-
# Now assumming oracle num of speakers.
400+
# Now assuming oracle num of speakers.
401401
n_lambdas = 4
402402

403403
for nn in range(5, 15):
@@ -511,7 +511,7 @@ def audio_pipeline(wav):
511511
with open(params_file) as fin:
512512
params = load_hyperpyyaml(fin, overrides)
513513

514-
# Dataset prep (peparing metadata files)
514+
# Dataset prep (preparing metadata files)
515515
from ami_prepare import prepare_ami # noqa
516516

517517
if not params["skip_prep"]:

recipes/Aishell1Mix/separation/scripts/create_wham_metadata.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@ def create_wham_noise_metadata(wham_noise_dir, md_dir):
5252
dir_metadata = dir_metadata[dir_metadata["length"] >= num_samples]
5353
# Create save path
5454
save_path = os.path.join(md_dir, name + ".csv")
55-
print(f"Medatada file created in {save_path}")
55+
print(f"Metadata file created in {save_path}")
5656
dir_metadata.to_csv(save_path, index=False)
5757

5858

recipes/CommonLanguage/common_language_prepare.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -80,7 +80,7 @@ def prepare_common_language(data_folder, save_folder, skip_prep=False):
8080
save_folder : str
8181
The directory where to store the csv files.
8282
max_duration : int, optional
83-
Max duration (in seconds) of training uterances.
83+
Max duration (in seconds) of training utterances.
8484
skip_prep: bool
8585
If True, skip data preparation.
8686
@@ -102,7 +102,7 @@ def prepare_common_language(data_folder, save_folder, skip_prep=False):
102102
# Setting the save folder
103103
os.makedirs(save_folder, exist_ok=True)
104104

105-
# Setting ouput files
105+
# Setting output files
106106
save_csv_train = os.path.join(save_folder, "train.csv")
107107
save_csv_dev = os.path.join(save_folder, "dev.csv")
108108
save_csv_test = os.path.join(save_folder, "test.csv")
@@ -246,7 +246,7 @@ def create_csv(wav_list, csv_file):
246246
# Actual name of the language
247247
language = path_parts[-4]
248248

249-
# Create a row with whole utterences
249+
# Create a row with whole utterances
250250
csv_line = [
251251
idx, # ID
252252
wav_file, # File name
@@ -264,7 +264,7 @@ def create_csv(wav_list, csv_file):
264264
# CSV column titles
265265
csv_header = ["ID", "wav", "wav_format", "duration", "language"]
266266

267-
# Add titles to the list at indexx 0
267+
# Add titles to the list at index 0
268268
csv_lines.insert(0, csv_header)
269269

270270
# Writing the csv lines
@@ -277,7 +277,7 @@ def create_csv(wav_list, csv_file):
277277
csv_writer.writerow(line)
278278

279279
# Final prints
280-
msg = f"{csv_file} sucessfully created!"
280+
msg = f"{csv_file} successfully created!"
281281
logger.info(msg)
282282
msg = f"Number of samples: {len(wav_list)}."
283283
logger.info(msg)

recipes/CommonLanguage/lang_id/README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@ Similar to the X-Vector a bigger and more powerful ECAPA-TDNN model can be used.
99
The experiment is also fine-tuning of the trained speaker embeddings done for Speaker Identification task on VoxCeleb, and can be accessed on [HuggingFace](https://huggingface.co/speechbrain/spkrec-ecapa-voxceleb). Therefore, most of the architecture choices come from that task.
1010

1111
Data augmentation and environmental corruption are done by concatenating waveforms, dropout, speed change, reverberation, noise, and noise+rev. The batch is double size of the original one. This may lead to
12-
better performance, at the cost of longer training time and higher compute resourses.
12+
better performance, at the cost of longer training time and higher compute resources.
1313

1414
# Performance
1515
| Release | hyperparams file | Val. Err | Test Err | Model link | GPUs |

recipes/CommonLanguage/lang_id/hparams/train_ecapa_tdnn.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -136,7 +136,7 @@ embedding_model: !new:speechbrain.lobes.models.ECAPA_TDNN.ECAPA_TDNN
136136
attention_channels: !ref <emb_attention_channels>
137137
lin_neurons: !ref <emb_dim>
138138

139-
# Classifier baseed on cosine distance
139+
# Classifier based on cosine distance
140140
classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
141141
input_size: !ref <emb_dim>
142142
out_neurons: !ref <n_languages>

recipes/CommonLanguage/lang_id/train.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -193,7 +193,7 @@ def dataio_prep(hparams):
193193
to the appropriate DynamicItemDataset object.
194194
"""
195195

196-
# Initialization of the label encoder. The label encoder assignes to each
196+
# Initialization of the label encoder. The label encoder assigns to each
197197
# of the observed label a unique index (e.g, 'lang01': 0, 'lang02': 1, ..)
198198
language_encoder = sb.dataio.encoder.CategoricalEncoder()
199199

@@ -229,7 +229,7 @@ def label_pipeline(language):
229229

230230
# Load or compute the label encoder (with multi-GPU DDP support)
231231
# Please, take a look into the lab_enc_file to see the label to index
232-
# mappinng.
232+
# mapping.
233233
language_encoder_file = os.path.join(
234234
hparams["save_folder"], "language_encoder.txt"
235235
)
@@ -278,7 +278,7 @@ def label_pipeline(language):
278278
# Create dataset objects "train", "dev", and "test" and language_encoder
279279
datasets, language_encoder = dataio_prep(hparams)
280280

281-
# Fetch and laod pretrained modules
281+
# Fetch and load pretrained modules
282282
sb.utils.distributed.run_on_main(hparams["pretrainer"].collect_files)
283283
hparams["pretrainer"].load_collected()
284284

recipes/CommonVoice/ASR/CTC/train_with_wav2vec.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@
77
> python train_with_wav2vec2.py hparams/train_with_wav2vec2.yaml
88
99
With the default hyperparameters, the system employs a pretrained wav2vec2 encoder.
10-
The wav2vec2 model is pretrained following the model given in the hprams file.
10+
The wav2vec2 model is pretrained following the model given in the hparams file.
1111
It may be dependent on the language.
1212
1313
The neural network is trained with CTC on sub-word units estimated with

recipes/CommonVoice/ASR/seq2seq/train_with_wav2vec.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@
77
> python train_with_wav2vec2.py hparams/train_with_wav2vec2.yaml
88
99
With the default hyperparameters, the system employs a pretrained wav2vec2 encoder.
10-
The wav2vec2 model is pretrained following the XSLR French HuggingFace model:
10+
The wav2vec2 model is pretrained following the XLSR French HuggingFace model:
1111
facebook/wav2vec2-large-xlsr-53-french
1212
1313
The decoder is based on a standard GRU and BeamSearch (no LM).

0 commit comments

Comments (0)