model : print tensor size during load (#12711)

* model : print tensor size during load

* cont : fix units MB -> MiB

Co-authored-by: Diego Devesa <slarengh@gmail.com>

---------

Co-authored-by: Diego Devesa <slarengh@gmail.com>
2025-04-16 03:26:08 +00:00 · 2025-04-02 16:38:54 +03:00 · 2025-04-02 16:38:54 +03:00 · 833e2b7409
commit 833e2b7409
parent e0e912f49b
1 changed file with 3 additions and 1 deletion
--- a/src/llama-model-loader.cpp
+++ b/src/llama-model-loader.cpp
@@ -603,7 +603,9 @@ llama_model_loader::llama_model_loader(

            if (trace > 0) {
                const uint16_t sid = w.idx;
-                LLAMA_LOG_INFO("%s: - tensor split %2d: %32s %-8s [ %s ]\n", __func__, sid, ggml_get_name(tensor), ggml_type_name(type), llama_format_tensor_shape(tensor).c_str());
+                LLAMA_LOG_INFO("%s: - tensor split %2d: %32s %-8s [ %s ] %8.2f MiB\n", __func__,
+                        sid, ggml_get_name(tensor), ggml_type_name(type), llama_format_tensor_shape(tensor).c_str(),
+                        ggml_nbytes(tensor)/1024.0f/1024.0f);
            }
        }