facebookresearch · tuanh208 · Aug 29, 2023
diff --git a/examples/expresso/dataset.py b/examples/expresso/dataset.py
@@ -304,6 +304,7 @@ def __init__(
 
                 # Output filename
                 if name_parts:
+                    # Use the last 3 path components, joined with "_" (extension dropped)
                     parts = Path(audio).parts
                     fname_out_name = os.path.splitext("_".join(parts[-3:]))[0]
                 else:

diff --git a/examples/expresso/models.py b/examples/expresso/models.py
@@ -42,14 +42,15 @@ def _upsample(signal, max_frames):
             signal = signal.unsqueeze(2)
             bsz, channels, cond_length = signal.size()
         else:
+            assert signal.dim() == 1, signal.dim()
             signal = signal.view(-1, 1, 1)
             bsz, channels, cond_length = signal.size()
 
         signal = signal.unsqueeze(3).repeat(1, 1, 1, max_frames // cond_length)
 
         # pad zeros as needed (if signal's shape does not divide completely with max_frames)
-        reminder = (max_frames - signal.shape[2] * signal.shape[3]) // signal.shape[3]
-        if reminder > 0:
+        remainder = (max_frames - signal.shape[2] * signal.shape[3]) // signal.shape[3]
+        if remainder > 0:
             raise NotImplementedError(
                 "Padding condition signal - misalignment between condition features."
             )