about | summary | refs | log | tree | commit | diff
path: root/llama.cpp
diff options
context:
space:
mode:
author: slaren <slarengh@gmail.com> 2023-07-25 14:32:20 +0200
committer: GitHub <noreply@github.com> 2023-07-25 15:32:20 +0300
commit: da1889834a036a63ead2b0ca5c9ed8967712568c (patch)
tree: 0cdebeac93a7ff69bfc8b4cec1307d74d984f79c /llama.cpp
parent: 82552b7f5403ca13957ac9a2cdc1732470057b62 (diff)
ggml : improve graph build time via hash table lookup (#2329)
* improve graph build time
* ggml_tensor : use 1 bit per flag
* use a hash table instead
Diffstat (limited to 'llama.cpp')
-rw-r--r-- llama.cpp 2
1 files changed, 2 insertions, 0 deletions
diff --git a/llama.cpp b/llama.cpp
index 2d737bb..febefba 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1714,6 +1714,8 @@ static bool llama_eval_internal(
// run the computation
ggml_build_forward_expand(&gf, cur);
+ // fprintf(stderr, "graph build time: %.3f ms (%d nodes, %d leafs)\n", (ggml_time_us() - t_start_us)/1000.0, gf.n_nodes, gf.n_leafs);
+
#if GGML_USE_MPI
ggml_mpi_graph_compute_pre(lctx.ctx_mpi, &gf, n_layer);
#endif