2023-05-13 15:45:56 +00:00
|
|
|
class SpeechEncoder(object):
    """Skeleton speech encoder holding a model handle and its feature width.

    As written here the class loads nothing and encodes nothing: ``model``
    starts as ``None`` and ``encoder`` returns ``None``. Presumably concrete
    encoders subclass this and fill both in -- confirm against the callers.
    """

    def __init__(self, vec_path="pretrain/checkpoint_best_legacy_500.pt", device=None):
        """Set the placeholder attributes.

        Args:
            vec_path: Checkpoint path. Accepted for interface compatibility;
                this implementation does not read it.
            device: Target device. Accepted for interface compatibility;
                this implementation does not read it.
        """
        self.model = None  # This is Model
        self.hidden_dim = 768

    def encoder(self, wav):
        """Encode a waveform into an embedding (no-op in this class).

        The documented contract is:

        input: wav:[signal_length]
        output: embedding:[batchsize,hidden_dim,wav_frame]

        This implementation performs no work and returns ``None``.
        """
        pass
|