0020-ollama-debug-tensor.patch 1.1 KB

123456789101112131415161718192021222324252627282930313233
  1. From 0000000000000000000000000000000000000000 Mon Sep 17 00:00:00 2001
  2. From: Michael Yang <mxyng@pm.me>
  3. Date: Sun, 9 Mar 2025 14:44:16 -0700
  4. Subject: [PATCH] ollama debug tensor
  5. ---
  6. ggml/src/ggml-cpu/ggml-cpu.c | 6 ++++++
  7. 1 file changed, 6 insertions(+)
  8. diff --git a/ggml/src/ggml-cpu/ggml-cpu.c b/ggml/src/ggml-cpu/ggml-cpu.c
  9. index 2f606d82..ec60e8fc 100644
  10. --- a/ggml/src/ggml-cpu/ggml-cpu.c
  11. +++ b/ggml/src/ggml-cpu/ggml-cpu.c
  12. @@ -11,6 +11,8 @@
  13. #include "ggml-threading.h"
  14. #include "ggml.h"
  15. +#include "ollama-debug.h"
  16. +
  17. #if defined(_MSC_VER) || defined(__MINGW32__)
  18. #include <malloc.h> // using malloc.h with MSC/MINGW
  19. #elif !defined(__FreeBSD__) && !defined(__NetBSD__) && !defined(__OpenBSD__)
  20. @@ -14103,6 +14105,10 @@ static thread_ret_t ggml_graph_compute_thread(void * data) {
  21. ggml_compute_forward(&params, node);
  22. +#ifdef OLLAMA_DEBUG
  23. + ollama_debug(node, true);
  24. +#endif
  25. +
  26. if (state->ith == 0 && cplan->abort_callback &&
  27. cplan->abort_callback(cplan->abort_callback_data)) {
  28. atomic_store_explicit(&tp->abort, node_n + 1, memory_order_relaxed);