U qsd@sHddlmZddlZddlmZmZddlmZmZGdddeZ dS)) SpeechEncoderN)WhisperModelDimensions) pad_or_trimlog_mel_spectrogramc@seZdZdddZddZdS) WhisperPPGpretrain/medium.ptNcCsz|dkr$ttjrdnd|_n t||_tj||d}tf|d}t|}||d||_ | |j|_ dS)Ncudacpu) map_locationdimsZmodel_state_dict) torchdevicer is_availabledevloadrrload_state_dict hidden_dimtomodel)selfZvec_pathr checkpointr rr,D:\sovits更新测试\vencoder\WhisperPPG.py__init__ s zWhisperPPG.__init__c Cs|}|jd}|d}t|}t||j}tl|j| d j }t|d|f|j}|dddddfddW5QRSQRXdS)Nri@)shaperrrrr no_gradrencoder unsqueezesqueezedatar floatnumpy FloatTensor transpose)rwavaudioZaudlnZppglnmelZppgrrrrs  $zWhisperPPG.encoder)rN)__name__ __module__ __qualname__rrrrrrrs r) Zvencoder.encoderrr Zvencoder.whisper.modelrrZvencoder.whisper.audiorrrrrrrs