ggml_flash_attn_back method
Pointer<ggml_tensor> ggml_flash_attn_back(
  Pointer<ggml_context> ctx,
  Pointer<ggml_tensor> q,
  Pointer<ggml_tensor> k,
  Pointer<ggml_tensor> v,
  Pointer<ggml_tensor> d,
  bool masked,
)
TODO: needs to be adapted to ggml_flash_attn_ext
Implementation
/// Thin wrapper that forwards [ctx], [q], [k], [v], [d] and [masked],
/// unchanged and in that order, to `_ggml_flash_attn_back` and returns the
/// tensor pointer it produces.
///
/// TODO: needs to be adapted to ggml_flash_attn_ext
ffi.Pointer<ggml_tensor> ggml_flash_attn_back(
  ffi.Pointer<ggml_context> ctx,
  ffi.Pointer<ggml_tensor> q,
  ffi.Pointer<ggml_tensor> k,
  ffi.Pointer<ggml_tensor> v,
  ffi.Pointer<ggml_tensor> d,
  bool masked,
) =>
    _ggml_flash_attn_back(ctx, q, k, v, d, masked);