mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-30 11:21:56 +00:00
Split mode graph for Minimax-M2 (#1195)
* Split mode graph for Minimax-M2
* Cleanup
* Forgotten ffn_exp_probs_b
This commit is contained in:
@@ -3570,6 +3570,13 @@ static bool ggml_cuda_compute_forward(ggml_backend_cuda_context & ctx, struct gg
|
||||
return false;
|
||||
}
|
||||
|
||||
#if 0
|
||||
if (auto err = cudaStreamSynchronize(ctx.stream()); err != cudaSuccess) {
|
||||
GGML_CUDA_LOG_ERROR("%s: %s failed\n", __func__, ggml_op_desc(dst));
|
||||
CUDA_CHECK(err);
|
||||
}
|
||||
#endif
|
||||
|
||||
cudaError_t err = cudaGetLastError();
|
||||
if (err != cudaSuccess) {
|
||||
GGML_CUDA_LOG_ERROR("%s: %s failed\n", __func__, ggml_op_desc(dst));
|
||||
|
||||
Reference in New Issue
Block a user