diff --git a/utils.py b/utils.py index fb60150..960b8f8 100644 --- a/utils.py +++ b/utils.py @@ -232,7 +232,7 @@ def get_hubert_content(hmodel, wav_16k_tensor): inputs = { "source": feats.to(wav_16k_tensor.device), "padding_mask": padding_mask.to(wav_16k_tensor.device), - "output_layer": 9, # layer 9 + "output_layer": 12, # layer 12 } with torch.no_grad(): logits = hmodel.extract_features(**inputs)