diff --git a/README.md b/README.md index 328035f..2cb1eb8 100644 --- a/README.md +++ b/README.md @@ -104,7 +104,7 @@ Train AudioSep from scratch: python train.py --workspace workspace/AudioSep --config_yaml config/audiosep_base.yaml --resume_checkpoint_path checkpoint/ '' ``` -Finetune AudioSep from pretrained checkpoint: +Finetune AudioSep from pre-trained checkpoint: ```python python train.py --workspace workspace/AudioSep --config_yaml config/audiosep_base.yaml --resume_checkpoint_path path_to_checkpoint ``` diff --git a/data/datamodules.py b/data/datamodules.py index 73136ad..3327e5d 100644 --- a/data/datamodules.py +++ b/data/datamodules.py @@ -47,7 +47,7 @@ def setup(self, stage: Optional[str] = None) -> NoReturn: # called on every process in DDP # SegmentSampler is used for selecting segments for training. - # On multiple devices, each SegmentSampler samples a part of mini-batch + # On multiple devices, each SegmentSampler samples a part of a mini-batch # data. self.train_dataset = self._train_dataset @@ -119,4 +119,4 @@ def collate_fn(list_data_dict): 'audio_text': at_data_dict } - return data_dict \ No newline at end of file + return data_dict diff --git a/data/waveform_mixers.py b/data/waveform_mixers.py index 3b3f4df..4543d24 100644 --- a/data/waveform_mixers.py +++ b/data/waveform_mixers.py @@ -43,10 +43,10 @@ def __call__(self, waveforms): # randomly normalize background noise noise = dynamic_loudnorm(audio=noise, reference=segment, **self.loudness_param) - # create audio mixyure + # create an audio mixture mixture = segment + noise - # declipping if need be + # Declipping if need be max_value = torch.max(torch.abs(mixture)) if max_value > 1: segment *= 0.9 / max_value diff --git a/evaluation/evaluate_audiocaps.py b/evaluation/evaluate_audiocaps.py index a3a3d21..628db0e 100644 --- a/evaluation/evaluate_audiocaps.py +++ b/evaluation/evaluate_audiocaps.py @@ -51,7 +51,7 @@ def __call__( self, pl_model: pl.LightningModule ) -> Dict: - r"""Evalute.""" + r"""Evaluate.""" print(f'Evaluation on AudioCaps with [{self.query}] queries.') @@ -107,4 +107,4 @@ def __call__( mean_sisdr = np.mean(sisdrs_list) mean_sdri = np.mean(sdris_list) - return mean_sisdr, mean_sdri \ No newline at end of file + return mean_sisdr, mean_sdri diff --git a/evaluation/evaluate_audioset.py b/evaluation/evaluate_audioset.py index 21128bd..fd1e878 100644 --- a/evaluation/evaluate_audioset.py +++ b/evaluation/evaluate_audioset.py @@ -62,7 +62,7 @@ def __call__( self, pl_model: pl.LightningModule ) -> Dict: - r"""Evalute.""" + r"""Evaluate.""" pl_model.eval() diff --git a/evaluation/evaluate_clotho.py b/evaluation/evaluate_clotho.py index c552986..2284fb0 100644 --- a/evaluation/evaluate_clotho.py +++ b/evaluation/evaluate_clotho.py @@ -46,7 +46,7 @@ def __call__( self, pl_model: pl.LightningModule ) -> Dict: - r"""Evalute.""" + r"""Evaluate.""" print(f'Evaluation on Clotho Evaluation with [caption] queries.') @@ -99,4 +99,4 @@ def __call__( mean_sisdr = np.mean(sisdrs_list) mean_sdri = np.mean(sdris_list) - return mean_sisdr, mean_sdri \ No newline at end of file + return mean_sisdr, mean_sdri diff --git a/evaluation/evaluate_esc50.py b/evaluation/evaluate_esc50.py index bc71111..8e7f638 100644 --- a/evaluation/evaluate_esc50.py +++ b/evaluation/evaluate_esc50.py @@ -47,7 +47,7 @@ def __call__( self, pl_model: pl.LightningModule ) -> Dict: - r"""Evalute.""" + r"""Evaluate.""" print(f'Evaluation on ESC-50 with [text label] queries.') diff --git a/evaluation/evaluate_music.py b/evaluation/evaluate_music.py index 40c03d8..ffbd75d 100644 --- a/evaluation/evaluate_music.py +++ b/evaluation/evaluate_music.py @@ -54,7 +54,7 @@ def __call__( self, pl_model: pl.LightningModule ) -> Dict: - r"""Evalute.""" + r"""Evaluate.""" print(f'Evaluation on MUSIC Test with [text label] queries.') @@ -115,4 +115,4 @@ def __call__( mean_sdri = np.mean(mean_sdri_list) mean_sisdr = np.mean(mean_sisdr_list) - return mean_sisdr, mean_sdri \ No newline at end of file + return mean_sisdr, mean_sdri diff --git a/evaluation/evaluate_vggsound.py b/evaluation/evaluate_vggsound.py index 5000e03..01bdb02 100644 --- a/evaluation/evaluate_vggsound.py +++ b/evaluation/evaluate_vggsound.py @@ -49,7 +49,7 @@ def __call__( self, pl_model: pl.LightningModule ) -> Dict: - r"""Evalute.""" + r"""Evaluate.""" print(f'Evaluation on VGGSound+ with [text label] queries.') @@ -111,4 +111,4 @@ def __call__( mean_sisdr = np.mean(sisdrs_list) mean_sdri = np.mean(sdris_list) - return mean_sisdr, mean_sdri \ No newline at end of file + return mean_sisdr, mean_sdri