coreml : fix ANE optimized encoder (#1716)

This commit is contained in:
Yajing Tang
2024-01-04 06:28:30 -08:00
committed by GitHub
parent ab0a8593c5
commit ba5bcde874
3 changed files with 4 additions and 17 deletions

View File

@ -143,20 +143,7 @@ class AudioEncoderANE(AudioEncoder):
x = block(x)
x = self.ln_post(x)
# """
# TODO:
# I think we need to transpose the result here to make it fit whisper.cpp memory order.
# However, even doing this, the results are still wrong. Kind of less wrong compared to
# not transposing, but still wrong.
# Also, I don't know why the original OpenAI implementation does not need to transpose.
# Transpose to (batch_size, n_ctx, n_state).
# x : torch.Tensor, shape = (batch_size, n_state, 1, n_ctx)
# """
# x = x.transpose(1,3)
x = x.squeeze(2).transpose(1, 2)
return x