options

Profiling node o404 - process 189318 - thread 189318

NameModuleCoverage (%)Time (s)
kmp_flag_64::wait(kmp_info*, int, void*)libiomp5.so19.412.91
hypre_ParCSRRelaxThreads.extracted.57+exec19.372.91
Loop 3038 - ams.c:3664-3684 - exec+15.542.32
Loop 3042 - ams.c:3672-3675 - exec13.281.99
Loop 3041 - ams.c:3672-3675 - exec2.230.33
Loop 3040 - ams.c:3677-3680 - exec0.030
hypre_BoomerAMGBuildMultipass+exec19.172.88
Loop 832 - par_multi_interp.c:488-514 - exec+6.290.94
Loop 834 - par_multi_interp.c:491-498 - exec6.290.94
Loop 812 - par_multi_interp.c:646-661 - exec+5.690.85
Loop 814 - par_multi_interp.c:651-655 - exec5.660.85
Loop 813 - par_multi_interp.c:657-661 - exec0.030
Loop 815 - par_multi_interp.c:205-600 - exec+4.030.61
Loop 822 - par_multi_interp.c:205-571 - exec+4.030.61
Loop 824 - par_multi_interp.c:554-557 - exec4.030.61
Loop 845 - par_multi_interp.c:385-399 - exec1.20.18
Loop 791 - par_multi_interp.c:1158-1161 - exec0.40.06
Loop 794 - par_multi_interp.c:205-891 - exec+0.030
Loop 804 - par_multi_interp.c:205-758 - exec+0.030
Loop 805 - par_multi_interp.c:205-758 - exec+0.030
Loop 808 - par_multi_interp.c:742-745 - exec0.030
hypre_CSRMatrixMatvecOutOfPlace.extracted+exec10.691.61
Loop 4040 - csr_matvec.c:248-314 - exec+4.030.6
Loop 4042 - csr_matvec.c:310-312 - exec3.360.5
Loop 4041 - csr_matvec.c:310-312 - exec0.670.1
Loop 4052 - csr_matvec.c:248-263 - exec+3.730.56
Loop 4054 - csr_matvec.c:259-261 - exec3.230.48
Loop 4053 - csr_matvec.c:259-261 - exec0.50.08
Loop 4034 - csr_matvec.c:248-341 - exec+0.460.07
Loop 4035 - csr_matvec.c:337-339 - exec0.330.05
Loop 4036 - csr_matvec.c:337-339 - exec0.130.02
hypre_CSRMatrixMatvecOutOfPlace+exec6.160.93
Loop 4007 - csr_matvec.c:166-167 - exec6.160.93
hypre_CSRMatrixMatvecT.extracted.49+exec2.30.34
Loop 4080 - csr_matvec.c:560-569 - exec+0.630.09
Loop 4081 - csr_matvec.c:564-567 - exec0.530.08
Loop 4082 - csr_matvec.c:564-567 - exec0.10.01
Loop 4076 - csr_matvec.c:560-582 - exec+0.10.01
Loop 4077 - csr_matvec.c:577-579 - exec0.10.01
hypre_BoomerAMGBuildMultipass.extracted.34+exec2.060.31
Loop 940 - par_multi_interp.c:917-1124 - exec+0.20.03
Loop 943 - par_multi_interp.c:917-1099 - exec+0.20.03
Loop 946 - par_multi_interp.c:1082-1088 - exec0.20.03
Loop 951 - par_multi_interp.c:917-997 - exec+0.20.03
Loop 954 - par_multi_interp.c:917-970 - exec+0.20.03
Loop 957 - par_multi_interp.c:951-958 - exec0.20.03
unknown_kernel_regionkernel1.660.25
hypre_BoomerAMGBuildMultipass.extracted.28+exec1.630.25
Loop 916 - par_multi_interp.c:1747-1876 - exec+0.630.1
Loop 929 - par_multi_interp.c:1799-1803 - exec0.40.06
Loop 923 - par_multi_interp.c:1747-1865 - exec+0.230.04
Loop 927 - par_multi_interp.c:1816-1822 - exec0.230.04
Loop 937 - par_multi_interp.c:1760-1761 - exec0.170.03
hypre_BoomerAMGCreate2ndS.extracted.17+exec1.60.24
Loop 2368 - par_strength.c:1998-2083 - exec+0.80.12
Loop 2372 - par_strength.c:2011-2048 - exec+0.80.12
Loop 2374 - par_strength.c:2024-2034 - exec0.80.12
Loop 2391 - par_strength.c:1714-1797 - exec+0.70.11
Loop 2395 - par_strength.c:1731-1765 - exec+0.70.11
Loop 2397 - par_strength.c:1743-1752 - exec0.70.11
hypre_Randexec1.60.24
hypre_ParMatmul.extracted.12+exec1.360.21
Loop 3393 - par_csr_matop.c:865-989 - exec+1.030.15
Loop 3394 - par_csr_matop.c:937-989 - exec+1.030.15
Loop 3396 - par_csr_matop.c:946-965 - exec10.15
Loop 3395 - par_csr_matop.c:970-989 - exec0.030
hypre_ParMatmul_RowSizes.extracted+exec1.230.19
Loop 3372 - par_csr_matop.c:127-242 - exec+0.640.1
Loop 3373 - par_csr_matop.c:187-231 - exec+0.640.1
Loop 3375 - par_csr_matop.c:195-208 - exec0.570.09
Loop 3374 - par_csr_matop.c:218-231 - exec0.070.01
hypre_BoomerAMGCoarsenPMIS.extracted.35+exec0.730.11
Loop 263 - par_coarsen.c:2133-2137 - exec0.730.11
hypre_BoomerAMGCoarsenPMIS.extracted.15+exec0.730.11
Loop 254 - par_coarsen.c:2356-2385 - exec+0.60.09
Loop 256 - par_coarsen.c:2361-2381 - exec0.60.09
BuildIJLaplacian27pt.extracted+exec0.670.1
Loop 11 - amg.c:794-1367 - exec+0.40.06
Loop 12 - amg.c:796-1367 - exec+0.40.06
Loop 13 - amg.c:798-1367 - exec0.40.06
Loop 7 - amg.c:1402-2344 - exec+0.270.04
Loop 8 - amg.c:1404-2344 - exec+0.270.04
Loop 9 - amg.c:1406-2344 - exec0.270.04
hypre_CSRMatrixMultiply.extracted+exec0.60.09
Loop 3927 - csr_matop.c:271-298 - exec+0.30.04
Loop 3928 - csr_matop.c:282-298 - exec+0.30.04
Loop 3929 - csr_matop.c:286-298 - exec0.30.04
Loop 3937 - csr_matop.c:214-231 - exec+0.130.02
Loop 3938 - csr_matop.c:222-231 - exec+0.130.02
Loop 3939 - csr_matop.c:225-231 - exec0.130.02
__intel_avx_rep_memcpyexec0.50.07
hypre_CSRMatrixSetRownnz+exec0.50.07
Loop 3956 - csr_matrix.c:145-148 - exec0.30.04
Loop 3955 - csr_matrix.c:161-164 - exec0.20.03
hypre_SeqVectorAxpy.extracted+exec0.470.07
Loop 4113 - vector.c:451-452 - exec0.470.07
hypre_IJMatrixSetDiagOffdSizesParCSR+exec0.430.06
Loop 3652 - IJMatrix_parcsr.c:199-200 - exec0.30.04
Loop 3650 - IJMatrix_parcsr.c:207-208 - exec0.130.02
hypre_BoomerAMGCreateS.extracted+exec0.370.06
Loop 2309 - par_strength.c:253-472 - exec+0.20.03
Loop 2311 - par_strength.c:451-460 - exec0.170.03
Loop 2310 - par_strength.c:463-472 - exec0.030
Loop 2306 - par_strength.c:492-513 - exec+0.170.02
Loop 2308 - par_strength.c:498-503 - exec0.170.02
hypre_BoomerAMGCorrectCFMarker+exec0.370.05
Loop 2303 - par_strength.c:2311-2316 - exec0.370.05
hypre_BoomerAMGIndepSetInit+exec0.370.05
Loop 389 - par_indepset.c:65-67 - exec0.370.05
hypre_BoomerAMGCoarsenPMIS.extracted.10+exec0.370.05
Loop 251 - par_coarsen.c:2437-2481 - exec+0.330.05
Loop 253 - par_coarsen.c:2465-2470 - exec0.330.05
hypre_BoomerAMGCoarsenPMIS+exec0.370.05
Loop 236 - par_coarsen.c:2232-2243 - exec0.230.04
Loop 221 - par_coarsen.c:2159-2589 - exec+0.10.01
Loop 222 - par_coarsen.c:2492-2497 - exec+0.070.01
Loop 223 - par_coarsen.c:2495-2497 - exec0.070.01
Loop 229 - par_coarsen.c:2405-2415 - exec0.030
Loop 233 - par_coarsen.c:2058-2268 - exec+0.030
Loop 235 - par_coarsen.c:2265-2268 - exec0.030
hypre_BoomerAMGBuildMultipass.extracted.27+exec0.330.05
Loop 903 - par_multi_interp.c:1585-1660 - exec+0.230.03
Loop 911 - par_multi_interp.c:1618-1628 - exec0.20.03
Loop 912 - par_multi_interp.c:1612-1615 - exec0.030
Loop 915 - par_multi_interp.c:1590-1591 - exec0.10.01
hypre_SeqVectorInnerProd.extracted+exec0.30.04
Loop 4116 - vector.c:485-486 - exec0.30.04
I_MPI_memcpy_multipage_avx512libmpi.so.12.0.00.270.04
hypre_qsort0+exec0.270.04
Loop 4166 - hypre_qsort.c:31-186 - exec+0.270.04
Loop 4168 - hypre_qsort.c:31-182 - exec0.270.04
hypre_BoomerAMGCoarseParms+exec0.270.04
Loop 301 - par_coarse_parms.c:94-96 - exec0.270.04
hypre_IJMatrixAssembleParCSR.extracted.25+exec0.230.04
Loop 3778 - IJMatrix_parcsr.c:2800-2815 - exec+0.230.03
Loop 3780 - IJMatrix_parcsr.c:2803-2812 - exec0.130.02
Loop 3779 - IJMatrix_parcsr.c:2803-2812 - exec0.10.01
hypre_IJMatrixSetValuesOMPParCSR.extracted.28exec0.230.04
kmp_flag_native::notdone_check()libiomp5.so0.20.03
hypre_CSRMatrixMatvecOutOfPlace.extracted.24+exec0.20.03
Loop 4069 - csr_matvec.c:160-161 - exec0.20.03
unknown_functionUnknown module0.20.03
MPL_gpu_cuda_finalizelibmpi.so.12.0.00.170.02
hypre_BoomerAMGBuildExtPIInterp.extracted+exec0.170.02
Loop 1238 - par_lr_interp.c:1221-1757 - exec+0.060
Loop 1242 - par_lr_interp.c:1221-1743 - exec0.030
Loop 1256 - par_lr_interp.c:1494-1545 - exec+0.030
Loop 1258 - par_lr_interp.c:1516-1526 - exec0.030
Loop 1276 - par_lr_interp.c:1244-1350 - exec+0.030
Loop 1279 - par_lr_interp.c:1264-1303 - exec+0.030
Loop 1281 - par_lr_interp.c:1277-1285 - exec0.030
Loop 1264 - par_lr_interp.c:1444-1445 - exec0.030
hypre_BoomerAMGCoarsenPMIS.extracted+exec0.170.02
Loop 246 - par_coarsen.c:2562-2567 - exec0.130.02
Loop 250 - par_coarsen.c:2528-2540 - exec0.030
__GI___pthread_mutex_locklibpthread-2.28.so0.170.02
hypre_BinarySearch+exec0.130.02
Loop 4145 - binsearch.c:35-44 - exec0.130.02
hypre_ParCSRComputeL1NormsThreads.extracted+exec0.130.02
Loop 2956 - ams.c:3365-3544 - exec+0.070.01
Loop 2959 - ams.c:3532-3534 - exec0.070.01
Loop 2990 - ams.c:3382-3517 - exec+0.060
Loop 2994 - ams.c:3388-3389 - exec0.030
Loop 2995 - ams.c:3388-3389 - exec0.030
I_MPI_memcpy_stream_nontemporal_avx512libmpi.so.12.0.00.10.01
hypre_ParTMatmul.extracted+exec0.10.01
Loop 3451 - par_csr_matop.c:3467-3640 - exec+0.070.01
Loop 3452 - par_csr_matop.c:3467-3634 - exec+0.070.01
Loop 3456 - par_csr_matop.c:3505-3608 - exec0.070.01
Loop 3465 - par_csr_matop.c:3467-3528 - exec+0.030
Loop 3466 - par_csr_matop.c:3467-3522 - exec+0.030
Loop 3470 - par_csr_matop.c:3504-3505 - exec0.030
hypre_ParCSRRelaxThreadsexec0.10.01
pthread_mutex_unlock@pltlibmlx-fi.so0.10.01
MPIDI_OFI_progresslibmpi.so.12.0.00.070.01
__kmp_invoke_microtasklibiomp5.so0.070.01
MPIR_Progress_hook_exec_on_vcilibmpi.so.12.0.00.070.01
inflate_fastlibmpi.so.12.0.00.070.01
__intel_avx_rep_memsetexec0.070.01
hypre_SeqVectorScale.extracted+exec0.070.01
Loop 4111 - vector.c:415-416 - exec0.070.01
hypre_SeqVectorSetConstantValues.extracted+exec0.070.01
Loop 4106 - vector.c:270-271 - exec0.070.01
hypre_CSRMatrixTranspose.extracted+exec0.070.01
Loop 3944 - csr_matop.c:540-548 - exec+0.030
Loop 3945 - csr_matop.c:541-548 - exec0.030
ofi_mutex_lock_nooplibmlx-fi.so0.070.01
hypre_BoomerAMGCoarsenPMIS.extracted.25+exec0.070.01
Loop 260 - par_coarsen.c:2329-2336 - exec0.070.01
__pthread_mutex_unlock_usercntlibpthread-2.28.so0.070.01
MPID_Progress_completion_count_getlibmpi.so.12.0.00.030
MPIR_Waitalllibmpi.so.12.0.00.030
__kmp_hardware_timestamplibiomp5.so0.030
MPIDU_Init_shm_barrierlibmpi.so.12.0.00.030
__kmp_task_team_synclibiomp5.so0.030
I_MPI_memcpy_nontemporal_avx512libmpi.so.12.0.00.030
impi_malloclibmpi.so.12.0.00.030
MPID_Progress_waitlibmpi.so.12.0.00.030
MPIDI_Progress_testlibmpi.so.12.0.00.030
hypre_UnorderedIntSetCreate.extractedexec0.030
kmp_flag_native::done_check()libiomp5.so0.030
hypre_qsort2iexec0.030
ofi_cq_readfromlibmlx-fi.so0.030
ofi_cq_readlibmlx-fi.so0.030
hypre_CSRMatrixMatvecOutOfPlace.extracted.9+exec0.030
Loop 4056 - csr_matvec.c:236-237 - exec0.030
adler32_zlibmpi.so.12.0.00.030
ucp_worker_progresslibucp.so.0.0.00.030
hypre_BoomerAMGCreate2ndSexec0.030
hypre_BoomerAMGBuildMultipass.extracted.85+exec0.030
Loop 964 - par_multi_interp.c:274-276 - exec0.030
ofi_mutex_unlock_nooplibmlx-fi.so0.030
ucs_mpool_getlibucs.so.0.0.00.030
mainexec0.030
×