Merge pull request #27 from ktonal/develop

v0.2.6
ktonal · Jun 29, 2021 · commit a05b34e
2 parents: 3194581 + 545c115
Show file tree

Hide file tree

Showing 5 changed files with 15 additions and 13 deletions.
diff --git a/mimikit/__init__.py b/mimikit/__init__.py
@@ -1,4 +1,4 @@
-__version__ = '0.2.5'
+__version__ = '0.2.6'
 
 from . import audios
 from . import connectors

diff --git a/mimikit/audios/features.py b/mimikit/audios/features.py
@@ -15,7 +15,7 @@
 ]
 
 
-@dtc.dataclass
+@dtc.dataclass(unsafe_hash=True)
 class AudioSignal(Feature):
     """
     audio signal managers

diff --git a/mimikit/audios/fmodules.py b/mimikit/audios/fmodules.py
@@ -103,7 +103,7 @@ def __call__(self, inputs):
 
 @dtc.dataclass
 class Normalize(FModule):
-    p: int = 1
+    p: int = float('inf')
     dim: int = -1
 
     @property
@@ -209,14 +209,15 @@ class STFT(FModule):
     def functions(self):
         def np_func(inputs):
             # returned shape is (time x freq)
-            return librosa.stft(inputs, n_fft=self.n_fft, hop_length=self.hop_length).T
+            S =librosa.stft(inputs, n_fft=self.n_fft, hop_length=self.hop_length).T
+            S = np.stack((abs(S), np.angle(S)), axis=-1)
+            return S
 
         def torch_func(inputs):
             mod = T.Spectrogram(self.n_fft, hop_length=self.hop_length, power=1.,
                                 wkwargs=dict(device=inputs.device))
             # returned shape is (..., time x freq)
             return mod(inputs).transpose(-1, -2).contiguous()
-
         return {
             np.ndarray: np_func,
             torch.Tensor: torch_func
@@ -235,8 +236,8 @@ def np_func(inputs):
             return librosa.istft(inputs.T, n_fft=self.n_fft, hop_length=self.hop_length, )
 
         def torch_func(inputs):
-            # inputs is of shape (time x freq)
-            y = torch.istft(inputs.transpose(-1, -2).contiguous(),
+            inputs = inputs[..., 0] * torch.exp(1j * inputs[..., 1])
+            y = torch.istft(inputs.transpose(1, 2).contiguous(),
                             n_fft=self.n_fft, hop_length=self.hop_length,
                             window=torch.hann_window(self.n_fft, device=inputs.device))
             return y
@@ -256,8 +257,8 @@ def functions(self):
         # dict comprehension would result in a single function for
         # all types, so we declare the dict manually...
         return {
-            np.ndarray: lambda x: abs(sup_f[np.ndarray](x)),
-            torch.Tensor: lambda x: abs(sup_f[torch.Tensor](x))
+            np.ndarray: lambda x: abs(sup_f[np.ndarray](x)[..., 0]),
+            torch.Tensor: lambda x: abs(sup_f[torch.Tensor](x)[..., 0])
         }
 
 

diff --git a/mimikit/data/feature.py b/mimikit/data/feature.py
@@ -89,8 +89,8 @@ def encode(self, inputs):
         -------
 
         """
-        if hasattr(super(type(self), self), 'encoders'):
-            inputs = super(type(self), self).encoders[type(inputs)](inputs)
+        if hasattr(super(), 'encoders'):
+            inputs = super().encoders[type(inputs)](inputs)
         return self.encoders[type(inputs)](inputs)
 
     def decode(self, inputs):
@@ -106,8 +106,8 @@ def decode(self, inputs):
 
         """
         inputs = self.decoders[type(inputs)](inputs)
-        if hasattr(super(type(self), self), 'decoders'):
-            inputs = super(type(self), self).decoders[type(inputs)](inputs)
+        if hasattr(super(), 'decoders'):
+            inputs = super().decoders[type(inputs)](inputs)
         return inputs
 
     def load(self, path):

diff --git a/mimikit/networks/__init__.py b/mimikit/networks/__init__.py
@@ -1,4 +1,5 @@
 from .freqnet import *
+from .generating_net import *
 from .parametrized_gaussian import *
 from .sample_rnn import *
 from .s2s_lstm import *