ggml : improve graph build time via hash table lookup (#2329)

* improve graph build time
* ggml_tensor : use 1 bit per flag
* use a hash table instead
author: slaren <slarengh@gmail.com> 2023-07-25 14:32:20 +0200
committer: GitHub <noreply@github.com> 2023-07-25 15:32:20 +0300
commit: da1889834a036a63ead2b0ca5c9ed8967712568c (patch)
tree: 0cdebeac93a7ff69bfc8b4cec1307d74d984f79c /llama.cpp
parent: 82552b7f5403ca13957ac9a2cdc1732470057b62 (diff)
1 files changed, 2 insertions, 0 deletions
diff --git a/llama.cpp b/llama.cpp
index 2d737bb..febefba 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1714,6 +1714,8 @@ static bool llama_eval_internal(
     // run the computation
     ggml_build_forward_expand(&gf, cur);
 
+    // fprintf(stderr, "graph build time: %.3f ms (%d nodes, %d leafs)\n", (ggml_time_us() - t_start_us)/1000.0, gf.n_nodes, gf.n_leafs);
+
 #if GGML_USE_MPI
     ggml_mpi_graph_compute_pre(lctx.ctx_mpi, &gf, n_layer);
 #endif
author	slaren <slarengh@gmail.com>	2023-07-25 14:32:20 +0200
committer	GitHub <noreply@github.com>	2023-07-25 15:32:20 +0300
commit	da1889834a036a63ead2b0ca5c9ed8967712568c (patch)
tree	0cdebeac93a7ff69bfc8b4cec1307d74d984f79c /llama.cpp
parent	82552b7f5403ca13957ac9a2cdc1732470057b62 (diff)