This commit is contained in:
comfyanonymous
2025-09-12 18:57:04 -07:00
committed by GitHub
parent 2559dee492
commit 29bf807b0e
2 changed files with 2 additions and 2 deletions

View File

@@ -31,7 +31,7 @@ class AudioEncoderModel():
def encode_audio(self, audio, sample_rate): def encode_audio(self, audio, sample_rate):
comfy.model_management.load_model_gpu(self.patcher) comfy.model_management.load_model_gpu(self.patcher)
audio = torchaudio.functional.resample(audio, sample_rate, self.model_sample_rate) audio = torchaudio.functional.resample(audio, sample_rate, self.model_sample_rate)
out, all_layers = self.model(audio.to(self.load_device), sr=self.model_sample_rate) out, all_layers = self.model(audio.to(self.load_device))
outputs = {} outputs = {}
outputs["encoded_audio"] = out outputs["encoded_audio"] = out
outputs["encoded_audio_all_layers"] = all_layers outputs["encoded_audio_all_layers"] = all_layers

View File

@@ -238,7 +238,7 @@ class Wav2Vec2Model(nn.Module):
device=device, dtype=dtype, operations=operations device=device, dtype=dtype, operations=operations
) )
def forward(self, x, sr=16000, mask_time_indices=None, return_dict=False): def forward(self, x, mask_time_indices=None, return_dict=False):
x = torch.mean(x, dim=1) x = torch.mean(x, dim=1)
if self.do_normalize: if self.do_normalize: