mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-30 19:31:48 +00:00
Minor
This commit is contained in:
@@ -2206,7 +2206,6 @@ std::string fs_get_cache_file(const std::string & filename) {
|
|||||||
// Model utils
|
// Model utils
|
||||||
//
|
//
|
||||||
struct llama_init_result llama_init_from_gpt_params(gpt_params & params) {
|
struct llama_init_result llama_init_from_gpt_params(gpt_params & params) {
|
||||||
printf("================================================== %s\n", __func__);
|
|
||||||
llama_init_result iparams;
|
llama_init_result iparams;
|
||||||
auto mparams = llama_model_params_from_gpt_params(params);
|
auto mparams = llama_model_params_from_gpt_params(params);
|
||||||
|
|
||||||
@@ -2234,7 +2233,6 @@ struct llama_init_result llama_init_from_gpt_params(gpt_params & params) {
|
|||||||
return iparams;
|
return iparams;
|
||||||
}
|
}
|
||||||
|
|
||||||
printf("%d entries in params.offload_policy\n", (int)params.offload_policy.size());
|
|
||||||
for (auto [op, on_off] : params.offload_policy) {
|
for (auto [op, on_off] : params.offload_policy) {
|
||||||
llama_set_offload_policy(lctx, op, on_off);
|
llama_set_offload_policy(lctx, op, on_off);
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -23239,6 +23239,7 @@ void llama_log_callback_default(ggml_log_level level, const char * text, void *
|
|||||||
|
|
||||||
void llama_set_offload_policy(struct llama_context * lctx, int op, bool on_or_off) {
|
void llama_set_offload_policy(struct llama_context * lctx, int op, bool on_or_off) {
|
||||||
if (!lctx || !lctx->sched) return;
|
if (!lctx || !lctx->sched) return;
|
||||||
printf("XXXXXXXXXXXXXXXXXXXXXXXXXXXX offload(%s) = %d\n", ggml_op_name(ggml_op(op)), on_or_off);
|
const char * op_name = op < 0 || op >= int(GGML_OP_COUNT) ? "all ops" : ggml_op_name(ggml_op(op));
|
||||||
|
printf("XXXXXXXXXXXXXXXXXXXXXXXXXXXX offload(%s) = %d\n", op_name, on_or_off);
|
||||||
ggml_backend_sched_set_op_offload(lctx->sched, ggml_op(op), on_or_off);
|
ggml_backend_sched_set_op_offload(lctx->sched, ggml_op(op), on_or_off);
|
||||||
}
|
}
|
||||||
|
|||||||
Reference in New Issue
Block a user