Split mode graph for Minimax-M2 (#1195)

* Split mode graph for Minimax-M2

* Cleanup

* Forgotten ffn_exp_probs_b
This commit is contained in:
Kawrakow
2026-01-29 07:27:06 +02:00
committed by GitHub
parent 68cd52e583
commit 68ed62447c
4 changed files with 238 additions and 60 deletions

View File

@@ -3570,6 +3570,13 @@ static bool ggml_cuda_compute_forward(ggml_backend_cuda_context & ctx, struct gg
return false;
}
#if 0
if (auto err = cudaStreamSynchronize(ctx.stream()); err != cudaSuccess) {
GGML_CUDA_LOG_ERROR("%s: %s failed\n", __func__, ggml_op_desc(dst));
CUDA_CHECK(err);
}
#endif
cudaError_t err = cudaGetLastError();
if (err != cudaSuccess) {
GGML_CUDA_LOG_ERROR("%s: %s failed\n", __func__, ggml_op_desc(dst));