Spaces:
Sleeping
Sleeping
| from models.frame_passt.fpasst import get_model | |
| from models.frame_passt.preprocess import AugmentMelSTFT | |
| from models.transformer_wrapper import BaseModelWrapper | |
| class FPaSSTWrapper(BaseModelWrapper): | |
| def __init__(self): | |
| super().__init__() | |
| self.mel = AugmentMelSTFT( | |
| n_mels=128, | |
| sr=16_000, | |
| win_length=400, | |
| hopsize=160, | |
| n_fft=512, | |
| freqm=0, | |
| timem=0, | |
| htk=False, | |
| fmin=0.0, | |
| fmax=None, | |
| norm=1, | |
| fmin_aug_range=10, | |
| fmax_aug_range=2000, | |
| fast_norm=True, | |
| preamp=True, | |
| ) | |
| self.fpasst = get_model( | |
| arch="passt_deit_bd_p16_384", | |
| n_classes=527, | |
| pos_embed_length=250, | |
| frame_patchout=0, | |
| in_channels=16 | |
| ) | |
| def mel_forward(self, x): | |
| return self.mel(x) | |
| def forward(self, x): | |
| return self.fpasst(x) | |
| def separate_params(self): | |
| pt_params = [[], [], [], [], [], [], [], [], [], [], [], []] | |
| for k, p in self.fpasst.named_parameters(): | |
| if k in ['cls_token', | |
| 'dist_token', | |
| 'new_pos_embed', | |
| 'freq_new_pos_embed', | |
| 'time_new_pos_embed', | |
| 'conv_in_1.weight', | |
| 'conv_in_1.bias', | |
| 'conv_in_2.weight', | |
| 'conv_in_2.bias', | |
| 'conv_in_3.weight', | |
| 'conv_in_3.bias', | |
| 'patch_embed.proj.weight', | |
| 'patch_embed.proj.bias', | |
| ]: | |
| pt_params[0].append(p) | |
| elif 'blocks.0.' in k: | |
| pt_params[0].append(p) | |
| elif 'blocks.1.' in k: | |
| pt_params[1].append(p) | |
| elif 'blocks.2.' in k: | |
| pt_params[2].append(p) | |
| elif 'blocks.3.' in k: | |
| pt_params[3].append(p) | |
| elif 'blocks.4.' in k: | |
| pt_params[4].append(p) | |
| elif 'blocks.5.' in k: | |
| pt_params[5].append(p) | |
| elif 'blocks.6.' in k: | |
| pt_params[6].append(p) | |
| elif 'blocks.7.' in k: | |
| pt_params[7].append(p) | |
| elif 'blocks.8.' in k: | |
| pt_params[8].append(p) | |
| elif 'blocks.9.' in k: | |
| pt_params[9].append(p) | |
| elif 'blocks.10.' in k: | |
| pt_params[10].append(p) | |
| elif 'blocks.11.' in k: | |
| pt_params[11].append(p) | |
| elif k in ['norm.weight', 'norm.bias']: | |
| pt_params[11].append(p) | |
| else: | |
| raise ValueError(f"Check separate params for frame-passt! Unexpected key: {k}") | |
| return list(reversed(pt_params)) | |