Name | Module | Max Thread Time / Walltime gcc_0 (%) | Coverage gcc_0 (%) | Coverage Excluding Loops gcc_0 (%) | Max Inclusive Time Over Threads gcc_0 (s) | Max Exclusive Time Over Threads gcc_0 (s) | Inclusive Time w.r.t. Wall Time gcc_0 (s) | Exclusive Time w.r.t. Wall Time gcc_0 (s) | Nb Threads gcc_0 | Deviation (coverage) gcc_0 | Deviation (walltime) gcc_0 | Categories gcc_0 | GFLOPS gcc_0 | Compilation Options |
○gomp_team_barrier_wait_end | libgomp.so.1.0.0 | 3.48 | 48.51 | 48.51 | 5.20 | 5.20 | 3.64 | 3.64 | 192 | 4.95 | 0.32 | OMP (%): 100.00 | 0.00 | |
►void (anonymous namespace)::tinygemm_kernel_amx<block_q8_0, block_q8_0, float, 32, 0>(int, int, int, void const*, void const*, float*, int) [clone .constprop.0]+ | libggml-cpu.so | 1.41 | 25.44 | 25.41 | 2.11 | 2.11 | 1.91 | 1.91 | 189 | 2.09 | 0.15 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 683.76 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
○Loop 516 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 515 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 521 - mmq.cpp:520-2194 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 519 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 520 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 511 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.01 | 0.01 | 0.01 | 0.01 | 0.01 | 0.00 | 0.00 | 116 | 0.04 | 0.00 | | 1772.60 | |
○Loop 518 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 523 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 525 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 513 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.01 | 0.00 | 0.00 | 0.01 | 0.01 | 0.00 | 0.00 | 141 | 0.02 | 0.00 | | 5672.31 | |
○Loop 512 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.01 | 0.01 | 0.01 | 0.01 | 0.00 | 0.00 | 139 | 0.02 | 0.00 | | 3171.62 | |
○Loop 514 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.01 | 0.01 | 0.01 | 0.01 | 0.01 | 0.00 | 0.00 | 144 | 0.03 | 0.00 | | 3122.06 | |
○Loop 522 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 517 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 524 - mmq.cpp:1140-1140 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○gomp_barrier_wait_end | libgomp.so.1.0.0 | 0.40 | 7.28 | 7.28 | 0.59 | 0.59 | 0.55 | 0.55 | 191 | 0.34 | 0.02 | OMP (%): 100.00 | 0.00 | |
►ggml_cpu_fp32_to_fp16+ | libggml-cpu.so | 0.46 | 4.10 | 4.06 | 0.68 | 0.68 | 0.31 | 0.30 | 183 | 2.85 | 0.21 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 0.76 | GNU C11 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma -m... |
○Loop 5 - ggml-cpu.c:3204-3204 - libggml-cpu.so [...] | | 0.01 | 0.04 | 0.04 | 0.02 | 0.02 | 0.00 | 0.00 | 86 | 0.05 | 0.00 | | 0.00 | |
○ggml_threadpool_chunk_add | libggml-cpu.so | 0.30 | 3.96 | 3.96 | 0.45 | 0.45 | 0.30 | 0.30 | 192 | 0.70 | 0.05 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 0.73 | GNU C11 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma -m... |
○gomp_team_barrier_wait | libgomp.so.1.0.0 | 0.25 | 2.99 | 2.99 | 0.38 | 0.38 | 0.22 | 0.22 | 192 | 0.98 | 0.07 | OMP (%): 100.00 | 0.18 | |
►void (anonymous namespace)::tinyBLAS<16, float __vector(16), float __vector(16), unsigned short, unsigned short, float>::gemm_bloc<4, 6>(long, long)+ | libggml-cpu.so | 0.14 | 1.87 | 0.18 | 0.21 | 0.05 | 0.14 | 0.01 | 192 | 0.42 | 0.03 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 1997.48 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
○Loop 1842 - sgemm.cpp:425-427 - libggml-cpu.so [...] | | 0.02 | 0.11 | 0.11 | 0.03 | 0.03 | 0.01 | 0.01 | 192 | 0.09 | 0.01 | | 4816.60 | |
○Loop 1843 - sgemm.cpp:399-399 - libggml-cpu.so [...] | | 0.12 | 1.58 | 1.58 | 0.18 | 0.18 | 0.12 | 0.12 | 192 | 0.37 | 0.03 | | 1943.42 | |
►ggml_compute_forward_soft_max+ | libggml-cpu.so | 0.07 | 0.90 | 0.01 | 0.11 | 0.02 | 0.07 | 0.00 | 192 | 0.25 | 0.02 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 88.87 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►Loop 1399 - ops.cpp:5889-5944 - libggml-cpu.so [...]+ | | 0.00 | 0.89 | 0.00 | 0.19 | 0.01 | 0.07 | 0.00 | 2 | 0.05 | 0.00 | | 297.34 | |
►Loop 1398 - ops.cpp:5890-5944 - libggml-cpu.so [...]+ | | 0.00 | 0.89 | 0.00 | 0.19 | 0.00 | 0.07 | 0.00 | 7 | 0.00 | 0.00 | | 0.00 | |
►Loop 1397 - ops.cpp:5891-5944 - libggml-cpu.so [...]+ | | 0.01 | 0.89 | 0.01 | 0.19 | 0.01 | 0.07 | 0.00 | 100 | 0.03 | 0.00 | | 1314.98 | |
○Loop 1403 - ops.cpp:5915-5916 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 1404 - ops.cpp:5915-5916 - libggml-cpu.so | | 0.01 | 0.03 | 0.03 | 0.01 | 0.01 | 0.00 | 0.00 | 174 | 0.05 | 0.00 | | 726.26 | |
○Loop 1395 - vec.h:89-89 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 1401 - vec.h:677-677 - libggml-cpu.so [...] | | 0.01 | 0.01 | 0.01 | 0.01 | 0.01 | 0.00 | 0.00 | 40 | 0.04 | 0.00 | | 634.32 | |
○Loop 1396 - vec.h:1444-1445 - libggml-cpu.so | | 0.02 | 0.11 | 0.11 | 0.03 | 0.03 | 0.01 | 0.01 | 192 | 0.09 | 0.01 | | 234.94 | |
○Loop 1407 - vec.h:89-89 - libggml-cpu.so | | 0.06 | 0.59 | 0.59 | 0.09 | 0.09 | 0.04 | 0.04 | 192 | 0.20 | 0.01 | | 14.24 | |
○Loop 1405 - vec.h:687-688 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 1402 - ops.cpp:5911-5912 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 1400 - vec.h:687-688 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 1406 - vec.h:677-677 - libggml-cpu.so [...] | | 0.03 | 0.14 | 0.14 | 0.04 | 0.04 | 0.01 | 0.01 | 165 | 0.11 | 0.01 | | 46.04 | |
►ggml_compute_forward_set_rows+ | libggml-cpu.so | 0.07 | 0.70 | 0.00 | 0.10 | 0.00 | 0.05 | 0.00 | 192 | 0.24 | 0.02 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 3.32 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►Loop 1386 - ops.cpp:5550-5563 - libggml-cpu.so+ | | 0.00 | 0.70 | 0.00 | 0.11 | 0.00 | 0.05 | 0.00 | 1 | 0.00 | 0.00 | | 0.00 | |
►Loop 1385 - ops.cpp:5551-5563 - libggml-cpu.so+ | | 0.00 | 0.70 | 0.00 | 0.10 | 0.00 | 0.05 | 0.00 | 1 | 0.00 | 0.00 | | 0.00 | |
○Loop 1387 - ops.cpp:5552-5563 - libggml-cpu.so | | 0.07 | 0.70 | 0.70 | 0.10 | 0.10 | 0.05 | 0.05 | 192 | 0.23 | 0.02 | | 3.31 | |
►ggml_compute_forward_rope_f32(ggml_compute_params const*, ggml_tensor*, bool)+ | libggml-cpu.so | 0.04 | 0.47 | 0.00 | 0.07 | 0.01 | 0.04 | 0.00 | 192 | 0.18 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 658.01 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►Loop 985 - ops.cpp:6210-6484 - libggml-cpu.so [...]+ | | 0.00 | 0.46 | 0.00 | 0.11 | 0.00 | 0.03 | 0.00 | 1 | 0.00 | 0.00 | | 0.00 | |
►Loop 984 - ops.cpp:6210-6484 - libggml-cpu.so [...]+ | | 0.01 | 0.46 | 0.01 | 0.11 | 0.01 | 0.03 | 0.00 | 139 | 0.03 | 0.00 | | 196.99 | |
○Loop 994 - ops.cpp:6210-6245 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 986 - ops.cpp:6407-6484 - libggml-cpu.so [...]+ | | 0.01 | 0.08 | 0.03 | 0.04 | 0.02 | 0.01 | 0.00 | 159 | 0.06 | 0.00 | | 96.96 | |
○Loop 989 - ops.cpp:6446-6456 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 993 - ops.cpp:6429-6442 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 991 - ops.cpp:6462-6475 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 990 - ops.cpp:6446-6456 - libggml-cpu.so [...] | | 0.01 | 0.04 | 0.04 | 0.02 | 0.02 | 0.00 | 0.00 | 159 | 0.06 | 0.00 | | 252.08 | |
○Loop 988 - ops.cpp:6479-6484 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 987 - ops.cpp:6479-6484 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 992 - ops.cpp:6413-6426 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 996 - ops.cpp:6210-6245 - libggml-cpu.so [...] | | 0.04 | 0.38 | 0.38 | 0.06 | 0.06 | 0.03 | 0.03 | 192 | 0.16 | 0.01 | | 773.26 | |
○Loop 995 - ops.cpp:6220-6245 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 997 - ops.cpp:6368-6372 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○f64xsubf128 | libm.so.6 | 0.05 | 0.45 | 0.45 | 0.08 | 0.08 | 0.03 | 0.03 | 192 | 0.18 | 0.01 | Math (%): 100.00 | 447.22 | |
○mkl_blas_avx512_sgemm_kernel_nocopy_TN_b0 | libmkl_avx512.so.2 | 0.06 | 0.30 | 0.30 | 0.09 | 0.09 | 0.02 | 0.02 | 192 | 14.28 | 0.01 | Math (%): 100.00 | 5944.28 | |
►ggml_compute_forward_rms_norm+ | libggml-cpu.so | 0.03 | 0.29 | 0.00 | 0.05 | 0.00 | 0.02 | 0.00 | 192 | 0.13 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 79.68 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►Loop 1317 - ops.cpp:4319-4365 - libggml-cpu.so [...]+ | | 0.00 | 0.29 | 0.00 | 0.07 | 0.00 | 0.02 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 1318 - ops.cpp:4320-4365 - libggml-cpu.so [...]+ | | 0.00 | 0.29 | 0.00 | 0.07 | 0.00 | 0.02 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 1319 - ops.cpp:4321-4365 - libggml-cpu.so [...]+ | | 0.01 | 0.29 | 0.01 | 0.07 | 0.01 | 0.02 | 0.00 | 19 | 0.03 | 0.00 | | 74.33 | |
○Loop 1321 - vec.h:677-677 - libggml-cpu.so [...] | | 0.01 | 0.04 | 0.04 | 0.02 | 0.02 | 0.00 | 0.00 | 125 | 0.06 | 0.00 | | 219.66 | |
○Loop 1322 - ops.cpp:4325-4326 - libggml-cpu.so | | 0.03 | 0.25 | 0.25 | 0.04 | 0.04 | 0.02 | 0.02 | 192 | 0.12 | 0.01 | | 57.80 | |
○Loop 1320 - vec.h:687-688 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►ggml_compute_forward_mul_mat+ | libggml-cpu.so | 0.04 | 0.29 | 0.00 | 0.06 | 0.01 | 0.02 | 0.00 | 191 | 0.14 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 27.77 | GNU C11 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma -m... |
►Loop 69 - ggml-cpu.c:1248-1260 - libggml-cpu.so+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 70 - ggml-cpu.c:1249-1260 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 68 - ggml-cpu.c:1289-1297 - libggml-cpu.so+ | | 0.00 | 0.29 | 0.00 | 0.07 | 0.00 | 0.02 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 67 - ggml-cpu.c:1290-1297 - libggml-cpu.so+ | | 0.01 | 0.29 | 0.01 | 0.07 | 0.01 | 0.02 | 0.00 | 17 | 0.03 | 0.00 | | 2.06 | |
○Loop 66 - ggml-cpu.c:1291-1297 - libggml-cpu.so | | 0.04 | 0.28 | 0.28 | 0.06 | 0.06 | 0.02 | 0.02 | 191 | 0.14 | 0.01 | | 28.71 | |
►Loop 56 - ggml-cpu.c:1125-1397 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 59 - ggml-cpu.c:1162-1397 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 60 - ggml-cpu.c:1163-1198 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 61 - ggml-cpu.c:1164-1198 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 62 - ggml-cpu.c:1197-1198 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 58 - ggml-cpu.c:1163-1397 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 63 - ggml-cpu.c:1164-1397 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 64 - ggml-cpu.c:1193-1194 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 65 - ggml-cpu.c:1193-1194 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 57 - ggml-cpu.c:1197-1198 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 54 - ggml-cpu.c:1316-1328 - libggml-cpu.so+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 55 - ggml-cpu.c:1317-1328 - libggml-cpu.so | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 3 | 0.00 | 0.00 | | 0.00 | |
○__GI___sched_yield | libc.so.6 | 0.04 | 0.28 | 0.28 | 0.06 | 0.06 | 0.02 | 0.02 | 190 | 14.40 | 0.01 | System (%): 100.00 | 0.00 | |
○ggml_barrier | libggml-cpu.so | 0.05 | 0.24 | 0.24 | 0.08 | 0.08 | 0.02 | 0.02 | 166 | 0.20 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 0.22 | GNU C11 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma -m... |
○mkl_blas_avx512_sgemm_kernel_nocopy_TN_b1 | libmkl_avx512.so.2 | 0.04 | 0.20 | 0.20 | 0.05 | 0.05 | 0.01 | 0.01 | 192 | 11.95 | 0.01 | Math (%): 100.00 | 8857.04 | |
○void (anonymous namespace)::pack_qs<block_q8_0>(void*, block_q8_0 const*, int) | libggml-cpu.so | 0.02 | 0.17 | 0.17 | 0.04 | 0.04 | 0.01 | 0.01 | 182 | 0.10 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 0.00 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►ggml_vec_swiglu_f32+ | libggml-cpu.so | 0.03 | 0.16 | 0.00 | 0.05 | 0.01 | 0.01 | 0.00 | 171 | 0.13 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 1571.28 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
○Loop 962 - vec.cpp:402-403 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 963 - vec.cpp:372-372 - libggml-cpu.so [...] | | 0.03 | 0.16 | 0.16 | 0.05 | 0.05 | 0.01 | 0.01 | 171 | 0.13 | 0.01 | | 1581.66 | |
►ggml_compute_forward_mul+ | libggml-cpu.so | 0.03 | 0.16 | 0.00 | 0.04 | 0.01 | 0.01 | 0.00 | 165 | 0.11 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 46.97 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►Loop 678 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 680 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 681 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 682 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 679 - binary-ops.cpp:18-31 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 683 - binary-ops.cpp:18-44 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 677 - binary-ops.cpp:126-139 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 690 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 693 - binary-ops.cpp:18-45 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 692 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 691 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 706 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 708 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 707 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 711 - binary-ops.cpp:18-45 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 709 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 710 - binary-ops.cpp:18-101 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 694 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 696 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 697 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 698 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 695 - binary-ops.cpp:31-31 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 699 - binary-ops.cpp:42-44 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 712 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.15 | 0.00 | 0.05 | 0.01 | 0.01 | 0.00 | 13 | 0.02 | 0.00 | | 12.39 | |
►Loop 714 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.15 | 0.00 | 0.04 | 0.00 | 0.01 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 713 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 715 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.15 | 0.00 | 0.04 | 0.00 | 0.01 | 0.00 | 2 | 0.00 | 0.00 | | 74.33 | |
○Loop 716 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.03 | 0.15 | 0.15 | 0.04 | 0.04 | 0.01 | 0.01 | 160 | 0.11 | 0.01 | | 48.96 | |
○Loop 717 - binary-ops.cpp:18-45 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 684 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 689 - binary-ops.cpp:18-44 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 686 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 685 - binary-ops.cpp:18-31 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 687 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 688 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 700 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 702 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►Loop 703 - binary-ops.cpp:18-101 - libggml-cpu.so [...]+ | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 704 - binary-ops.cpp:18-32 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 701 - binary-ops.cpp:31-31 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 705 - binary-ops.cpp:42-44 - libggml-cpu.so [...] | | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
►void parallel_for<(anonymous namespace)::convert_B_packed_format<block_q8_0, 32>(void*, block_q8_0 const*, int, int)::{lambda(int, int)#1}>(int, (anonymous namespace)::convert_B_packed_format<block_q8_0, 32>(void*, block_q8_0 const*, int,...+ | libggml-cpu.so | 0.03 | 0.14 | 0.00 | 0.04 | 0.01 | 0.01 | 0.00 | 145 | 0.12 | 0.01 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 0.00 | GNU C++17 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma ... |
►Loop 456 - mmq.cpp:822-1392 - libggml-cpu.so [...]+ | | 0.00 | 0.14 | 0.00 | 0.04 | 0.00 | 0.01 | 0.00 | 0 | 0.00 | 0.00 | | 0.00 | |
○Loop 455 - mmq.cpp:822-1392 - libggml-cpu.so [...] | | 0.03 | 0.14 | 0.14 | 0.04 | 0.04 | 0.01 | 0.01 | 145 | 0.12 | 0.01 | | 0.00 | |
►quantize_row_q8_0+ | libggml-cpu.so | 0.96 | 0.10 | 0.00 | 1.43 | 0.00 | 0.01 | 0.00 | 1 | 0.00 | 0.00 | /beegfs/hackathon/users/eoseret/qaas_runs_test/176-060-7658/intel/llama.cpp/build/llama.cpp/../gcc/bin/libggml-blas.so (%): 100.00 | 707.15 | GNU C11 14.2.0 -march=graniterapids -mmmx -mpopcnt -msse -msse2 -msse3 -mssse3 -msse4.1 -msse4.2 -mavx -mavx2 -mno-sse4a -mno-fma4 -mno-xop -mfma -mavx512f -mbmi -mbmi2 -maes -mpclmul -mavx512vl -mavx512bw -mavx512dq -mavx512cd -mavx512vbmi -mavx512ifma -m... |
○Loop 2214 - quants.c:298-321 - libggml-cpu.so [...] | | 0.96 | 0.10 | 0.10 | 1.43 | 1.43 | 0.01 | 0.01 | 1 | 0.00 | 0.00 | | 707.09 | |