diff --git a/examples/expresso/dataset.py b/examples/expresso/dataset.py index 9f2deef..d96da37 100644 --- a/examples/expresso/dataset.py +++ b/examples/expresso/dataset.py @@ -304,6 +304,7 @@ def __init__( # Output filename if name_parts: + # Take the last 3 parts in the path parts = Path(audio).parts fname_out_name = os.path.splitext("_".join(parts[-3:]))[0] else: diff --git a/examples/expresso/models.py b/examples/expresso/models.py index 23303e9..1cc8908 100644 --- a/examples/expresso/models.py +++ b/examples/expresso/models.py @@ -42,14 +42,15 @@ def _upsample(signal, max_frames): signal = signal.unsqueeze(2) bsz, channels, cond_length = signal.size() else: + assert signal.dim() == 1, signal.dim() signal = signal.view(-1, 1, 1) bsz, channels, cond_length = signal.size() signal = signal.unsqueeze(3).repeat(1, 1, 1, max_frames // cond_length) # pad zeros as needed (if signal's shape does not divide completely with max_frames) - reminder = (max_frames - signal.shape[2] * signal.shape[3]) // signal.shape[3] - if reminder > 0: + remainder = (max_frames - signal.shape[2] * signal.shape[3]) // signal.shape[3] + if remainder > 0: raise NotImplementedError( "Padding condition signal - misalignment between condition features." )