From ec9cdb6752dd96b3cc74d90ad1adeba5b4fa2b0e Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Sun, 23 Apr 2023 18:32:52 +0300
Subject: [PATCH] ggml : do not print perf ops that have not been used at all

---
 ggml.c | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/ggml.c b/ggml.c
index 23dae2d..f8f73af 100644
--- a/ggml.c
+++ b/ggml.c
@@ -11237,7 +11237,7 @@ void ggml_graph_print(const struct ggml_cgraph * cgraph) {
     for (int i = 0; i < cgraph->n_nodes; i++) {
         struct ggml_tensor * node = cgraph->nodes[i];
 
-        perf_total_per_op_us[node->op] += node->perf_time_us;
+        perf_total_per_op_us[node->op] += MAX(1, node->perf_time_us);
 
         GGML_PRINT(" - %3d: [ %5" PRId64 ", %5" PRId64 ", %5" PRId64 "] %16s %s (%3d) cpu = %7.3f / %7.3f ms, wall = %7.3f / %7.3f ms\n",
                 i,
@@ -11260,6 +11260,10 @@ void ggml_graph_print(const struct ggml_cgraph * cgraph) {
     }
 
     for (int i = 0; i < GGML_OP_COUNT; i++) {
+        if (perf_total_per_op_us[i] == 0) {
+            continue;
+        }
+
         GGML_PRINT("perf_total_per_op_us[%16s] = %7.3f ms\n", GGML_OP_LABEL[i], (double) perf_total_per_op_us[i] / 1000.0);
     }
 