llama : add option to override model tensor buffers (#11397)

* llama : add option to override tensor buffers
* ggml : fix possible underflow in ggml_nbytes
2025-04-02 14:52:01 +02:00
parent a10b36c91a
commit e0e912f49b
12 changed files with 108 additions and 9 deletions
--- a/src/llama-model.h
+++ b/src/llama-model.h
@@ -382,6 +382,8 @@ struct llama_model {

    ggml_backend_buffer_type_t select_buft(int il) const;

+    bool has_tensor_overrides() const;
+
    const struct ggml_tensor * get_tensor(const char * name) const;

    // TODO: move this to new llm_arch_model_i interface