mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2024-12-23 06:22:22 +00:00
e08c62149b
* CUDA: refactor mmq, dmmv, mmvq * fix out-of-bounds write * struct for qk, qr, qi * fix cmake build * mmq_type_traits
10 lines
325 B
Plaintext
10 lines
325 B
Plaintext
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
|
|
|
|
#include "../fattn-wmma-f16.cuh"
|
|
|
|
// Invocations of DECL_FATTN_WMMA_F16_CASE, one per first-argument value
// (64, 80, 96, 112, 128), all with second argument 32 and type `float`.
// The macro is not defined in this file; presumably it comes from
// "../fattn-wmma-f16.cuh" -- confirm.
// NOTE(review): the arguments look like (head size, columns per block,
// accumulator type) -- verify against the macro definition before relying on it.
// This file is autogenerated: make lasting changes in generate_cu_files.py,
// not here.
DECL_FATTN_WMMA_F16_CASE(64, 32, float);
|
|
DECL_FATTN_WMMA_F16_CASE(80, 32, float);
|
|
DECL_FATTN_WMMA_F16_CASE(96, 32, float);
|
|
DECL_FATTN_WMMA_F16_CASE(112, 32, float);
|
|
DECL_FATTN_WMMA_F16_CASE(128, 32, float);
|