ggml_flash_attn_back method

TODO: this function still needs to be adapted to ggml_flash_attn_ext.

Implementation

/// Pass-through binding: hands [ctx], [q], [k], [v], [d] and [masked] to the
/// private `_ggml_flash_attn_back` callable (defined outside this view),
/// unchanged and in that order, and returns whatever pointer it yields.
///
/// No validation, conversion or null-checking is done here; the arguments
/// reach the callee exactly as supplied.
///
/// NOTE(review): the parameter names suggest query/key/value tensors plus an
/// incoming gradient tensor and a masking switch, but nothing in this block
/// establishes that. Confirm against the native ggml header before relying
/// on it.
///
/// TODO: needs to be adapted to ggml_flash_attn_ext.
ffi.Pointer<ggml_tensor> ggml_flash_attn_back(
  ffi.Pointer<ggml_context> ctx,
  ffi.Pointer<ggml_tensor> q,
  ffi.Pointer<ggml_tensor> k,
  ffi.Pointer<ggml_tensor> v,
  ffi.Pointer<ggml_tensor> d,
  bool masked,
) =>
    _ggml_flash_attn_back(ctx, q, k, v, d, masked);