mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-30 19:31:48 +00:00
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
This commit is contained in:
@@ -5733,10 +5733,10 @@ struct llama_data_read {
|
|||||||
std::vector<uint8_t> aux;
|
std::vector<uint8_t> aux;
|
||||||
for (int id = 0; id < extra->n_device; ++id) {
|
for (int id = 0; id < extra->n_device; ++id) {
|
||||||
auto split = extra->splits[id];
|
auto split = extra->splits[id];
|
||||||
GGML_ASSERT(split->type == tensor->type);
|
|
||||||
auto kv_split = kv_extra->splits[id];
|
auto kv_split = kv_extra->splits[id];
|
||||||
GGML_ASSERT((split && kv_split) || (!split && !kv_split));
|
GGML_ASSERT((split && kv_split) || (!split && !kv_split));
|
||||||
if (!split) continue;
|
if (!split) continue;
|
||||||
|
GGML_ASSERT(split->type == tensor->type);
|
||||||
auto split_row_size = ggml_row_size(tensor->type, kv_split->ne[1]);
|
auto split_row_size = ggml_row_size(tensor->type, kv_split->ne[1]);
|
||||||
aux.resize(split_row_size*nrows);
|
aux.resize(split_row_size*nrows);
|
||||||
auto src = data + sum_split_row_size;
|
auto src = data + sum_split_row_size;
|
||||||
|
|||||||
Reference in New Issue
Block a user