********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on
********************************************************************************
MAQAO 2026.0.0 - 25769f03a52addf00a8c34d7a506d855fd8fb167::20260225-140255 || 2026/02/25
/home/mlkaps_org/kevin/maqao oneview -R1 -WS -WC --replace -c=config.json -dbg=1 -xp=test_m1-128_o1_perf009_allowextra_scala_kptr -lprof-params=--allow-extra-threads -- /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
CPY: [true] /home/mlkaps_org/kevin/spack/opt/spack/linux-sapphirerapids/mumps-parametrable-launcher-0.1.0-x5qsule44eio2cizekgf4n4mtlhxpzf6/bin/mumps-parametrable-launcher --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libmumps_common.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libmumps_common.so
CPY: [true] /home/mlkaps_org/kevin/MUMPS_5.8.2/lib/libdmumps.so --> /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/libs/libdmumps.so
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_0" --mpi-command="mpirun -np 1 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_0: At cluster level, discarded 90 functions cumulating 0.6% of application profiled time
Run run_0: At cluster level, discarded 104 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_1" --mpi-command="mpirun -np 2 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_1: At cluster level, discarded 164 functions cumulating 0.6% of application profiled time
Run run_1: At cluster level, discarded 155 loops cumulating 0.6% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_2" --mpi-command="mpirun -np 4 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_2: At cluster level, discarded 190 functions cumulating 0.6% of application profiled time
Run run_2: At cluster level, discarded 163 loops cumulating 0.5% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_3" --mpi-command="mpirun -np 8 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_3: At cluster level, discarded 208 functions cumulating 0.5% of application profiled time
Run run_3: At cluster level, discarded 171 loops cumulating 0.4% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_4" --mpi-command="mpirun -np 16 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_4: At cluster level, discarded 254 functions cumulating 0.5% of application profiled time
Run run_4: At cluster level, discarded 177 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_5" --mpi-command="mpirun -np 32 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_5: At cluster level, discarded 308 functions cumulating 0.4% of application profiled time
Run run_5: At cluster level, discarded 184 loops cumulating 0.3% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_6" --mpi-command="mpirun -np 64 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_6: At cluster level, discarded 401 functions cumulating 0.4% of application profiled time
Run run_6: At cluster level, discarded 209 loops cumulating 0.2% of application profiled time
CMD: OMP_NUM_THREADS=1 /home/mlkaps_org/kevin/maqao lprof _caller=oneview --allow-extra-threads --xp="/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/tools/lprof_run_7" --mpi-command="mpirun -np 128 --bind-to core --map-by numa" --collect-CPU-time-intervals --collect-topology tpp=1 -ldi=libmumps_common.so,libdmumps.so -- /home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/binaries/mumps-parametrable-launcher -i perf009araff.mtx 1 0 0 0
Run run_7: At cluster level, discarded 547 functions cumulating 0.4% of application profiled time
Run run_7: At cluster level, discarded 235 loops cumulating 0.2% of application profiled time
CMD: /home/mlkaps_org/kevin/maqao otter -input=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/input_manifest.csv -output=/home/mlkaps_org/kevin/matrices/test_m1-128_o1_perf009_allowextra_scala_kptr/OTTER/output_manifest.csv -dbg=1 --reduce-threads-files=on