Merging mainline - WIP

2026-04-29 19:01:47 +00:00 · 2024-07-26 16:32:40 +03:00
parent 0684c3e9c7
commit 6b2b52d2fe
613 changed files with 50831 additions and 165912 deletions
--- a/examples/lookup/lookup-stats.cpp
+++ b/examples/lookup/lookup-stats.cpp
@@ -31,7 +31,6 @@ int main(int argc, char ** argv){

    // load the model
    std::tie(model, ctx) = llama_init_from_gpt_params(params);
-    GGML_ASSERT(llama_n_vocab(model) < (1 << 16));

    // tokenize the prompt
    std::vector<llama_token> inp;
@@ -65,7 +64,7 @@ int main(int argc, char ** argv){
    }

    const int n_input = inp.size();
-    const int n_ctx = params.n_ctx;
+    const int n_ctx = llama_n_ctx(ctx);

    int n_drafted = 0;
    int n_accept  = 0;