[goodhel] rerun 102 tput tests on itscrd90 - all ok

STARTED AT Mon Sep 2 12:36:25 PM CEST 2024
./tput/teeThroughputX.sh -mix -hrd -makej -eemumu -ggtt -ggttg -ggttgg -gqttq -ggttggg -makeclean
ENDED(1) AT Mon Sep 2 12:59:35 PM CEST 2024 [Status=0]
./tput/teeThroughputX.sh -flt -hrd -makej -eemumu -ggtt -ggttgg -inlonly -makeclean
ENDED(2) AT Mon Sep 2 01:08:27 PM CEST 2024 [Status=0]
./tput/teeThroughputX.sh -makej -eemumu -ggtt -ggttg -gqttq -ggttgg -ggttggg -flt -bridge -makeclean
ENDED(3) AT Mon Sep 2 01:16:51 PM CEST 2024 [Status=0]
./tput/teeThroughputX.sh -eemumu -ggtt -ggttgg -flt -rmbhst
ENDED(4) AT Mon Sep 2 01:19:36 PM CEST 2024 [Status=0]
./tput/teeThroughputX.sh -eemumu -ggtt -ggttgg -flt -curhst
ENDED(5) AT Mon Sep 2 01:22:18 PM CEST 2024 [Status=0]
./tput/teeThroughputX.sh -eemumu -ggtt -ggttgg -flt -common
ENDED(6) AT Mon Sep 2 01:25:06 PM CEST 2024 [Status=0]
./tput/teeThroughputX.sh -mix -hrd -makej -susyggtt -susyggt1t1 -smeftggtttt -heftggbb -makeclean
ENDED(7) AT Mon Sep 2 01:36:00 PM CEST 2024 [Status=0]
valassi · Sep 2, 2024 · 48fa9bf · 48fa9bf
1 parent 016433b
commit 48fa9bf
Show file tree

Hide file tree

Showing 102 changed files with 4,722 additions and 4,722 deletions.
diff --git a/epochX/cudacpp/tput/logs_eemumu_mad/log_eemumu_mad_d_inl0_hrd0.txt b/epochX/cudacpp/tput/logs_eemumu_mad/log_eemumu_mad_d_inl0_hrd0.txt
@@ -40,7 +40,7 @@ make[1]: Entering directory '/data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp
 make[1]: Nothing to be done for 'all'.
 make[1]: Leaving directory '/data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum'
 
-DATE: 2024-08-08_19:47:50
+DATE: 2024-09-02_12:41:34
 
 On itscrd90.cern.ch [CPU: Intel(R) Xeon(R) Silver 4216 CPU] [GPU: 1x Tesla V100S-PCIE-32GB]:
 =========================================================================
@@ -49,15 +49,15 @@ INFO: The following Floating Point Exceptions will cause SIGFPE program aborts:
 Process                     = SIGMA_SM_EPEM_MUPMUM_CUDA [nvcc 12.0.140 (gcc 11.3.1)] [inlineHel=0] [hardcodePARAM=0]
 Workflow summary            = CUD:DBL+THX:CURDEV+RMBDEV+MESDEV/none+NAVBRK
 FP precision                = DOUBLE (NaN/abnormal=0, zero=0)
-EvtsPerSec[Rmb+ME]     (23) = ( 6.598959e+07                 )  sec^-1
-EvtsPerSec[MatrixElems] (3) = ( 4.638501e+08                 )  sec^-1
-EvtsPerSec[MECalcOnly] (3a) = ( 7.177835e+08                 )  sec^-1
+EvtsPerSec[Rmb+ME]     (23) = ( 7.315961e+07                 )  sec^-1
+EvtsPerSec[MatrixElems] (3) = ( 4.832584e+08                 )  sec^-1
+EvtsPerSec[MECalcOnly] (3a) = ( 7.179479e+08                 )  sec^-1
 MeanMatrixElemValue         = ( 1.371706e-02 +- 3.270315e-06 )  GeV^0
-TOTAL       :     0.698559 sec
+TOTAL       :     0.672014 sec
 INFO: No Floating Point Exceptions have been reported
-     2,601,897,002      cycles                           #    2.808 GHz                    
-     4,040,507,104      instructions                     #    1.55  insn per cycle         
-       0.999350103 seconds time elapsed
+     2,648,088,093      cycles                           #    2.915 GHz                    
+     4,076,818,915      instructions                     #    1.54  insn per cycle         
+       0.971331198 seconds time elapsed
 runNcu /data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/build.cuda_d_inl0_hrd0/check_cuda.exe -p 2048 256 1
 ==PROF== Profiling "sigmaKin": launch__registers_per_thread 166
 ==PROF== Profiling "sigmaKin": sm__sass_average_branch_targets_threads_uniform.pct 100%
@@ -82,15 +82,15 @@ Process                     = SIGMA_SM_EPEM_MUPMUM_CPP [gcc 11.3.1] [inlineHel=0
 Workflow summary            = CPP:DBL+CXS:CURHST+RMBHST+MESHST/none+NAVBRK
 FP precision                = DOUBLE (NaN/abnormal=0, zero=0)
 Internal loops fptype_sv    = SCALAR ('none': ~vector[1], no SIMD)
-EvtsPerSec[Rmb+ME]     (23) = ( 1.054108e+06                 )  sec^-1
-EvtsPerSec[MatrixElems] (3) = ( 1.229313e+06                 )  sec^-1
-EvtsPerSec[MECalcOnly] (3a) = ( 1.229313e+06                 )  sec^-1
+EvtsPerSec[Rmb+ME]     (23) = ( 1.056764e+06                 )  sec^-1
+EvtsPerSec[MatrixElems] (3) = ( 1.230740e+06                 )  sec^-1
+EvtsPerSec[MECalcOnly] (3a) = ( 1.230740e+06                 )  sec^-1
 MeanMatrixElemValue         = ( 1.371706e-02 +- 3.270315e-06 )  GeV^0
-TOTAL       :     6.402837 sec
+TOTAL       :     6.351497 sec
 INFO: No Floating Point Exceptions have been reported
-    19,233,855,272      cycles                           #    3.000 GHz                    
-    46,180,507,769      instructions                     #    2.40  insn per cycle         
-       6.412153445 seconds time elapsed
+    19,058,066,313      cycles                           #    2.999 GHz                    
+    46,075,424,260      instructions                     #    2.42  insn per cycle         
+       6.356657261 seconds time elapsed
 =Symbols in CPPProcess_cpp.o= (~sse4:  463) (avx2:    0) (512y:    0) (512z:    0)
 -------------------------------------------------------------------------
 runTest /data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/build.none_d_inl0_hrd0/runTest_cpp.exe
@@ -111,15 +111,15 @@ Process                     = SIGMA_SM_EPEM_MUPMUM_CPP [gcc 11.3.1] [inlineHel=0
 Workflow summary            = CPP:DBL+CXS:CURHST+RMBHST+MESHST/sse4+CXVBRK
 FP precision                = DOUBLE (NaN/abnormal=0, zero=0)
 Internal loops fptype_sv    = VECTOR[2] ('sse4': SSE4.2, 128bit) [cxtype_ref=YES]
-EvtsPerSec[Rmb+ME]     (23) = ( 1.601848e+06                 )  sec^-1
-EvtsPerSec[MatrixElems] (3) = ( 2.093713e+06                 )  sec^-1
-EvtsPerSec[MECalcOnly] (3a) = ( 2.093713e+06                 )  sec^-1
+EvtsPerSec[Rmb+ME]     (23) = ( 1.583618e+06                 )  sec^-1
+EvtsPerSec[MatrixElems] (3) = ( 2.054185e+06                 )  sec^-1
+EvtsPerSec[MECalcOnly] (3a) = ( 2.054185e+06                 )  sec^-1
 MeanMatrixElemValue         = ( 1.371706e-02 +- 3.270315e-06 )  GeV^0
-TOTAL       :     4.363298 sec
+TOTAL       :     4.384026 sec
 INFO: No Floating Point Exceptions have been reported
-    13,100,720,322      cycles                           #    2.997 GHz                    
-    31,716,075,564      instructions                     #    2.42  insn per cycle         
-       4.372588931 seconds time elapsed
+    12,908,939,930      cycles                           #    2.942 GHz                    
+    31,610,854,085      instructions                     #    2.45  insn per cycle         
+       4.389237812 seconds time elapsed
 =Symbols in CPPProcess_cpp.o= (~sse4: 1664) (avx2:    0) (512y:    0) (512z:    0)
 -------------------------------------------------------------------------
 runTest /data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/build.sse4_d_inl0_hrd0/runTest_cpp.exe
@@ -140,15 +140,15 @@ Process                     = SIGMA_SM_EPEM_MUPMUM_CPP [gcc 11.3.1] [inlineHel=0
 Workflow summary            = CPP:DBL+CXS:CURHST+RMBHST+MESHST/avx2+CXVBRK
 FP precision                = DOUBLE (NaN/abnormal=0, zero=0)
 Internal loops fptype_sv    = VECTOR[4] ('avx2': AVX2, 256bit) [cxtype_ref=YES]
-EvtsPerSec[Rmb+ME]     (23) = ( 2.042973e+06                 )  sec^-1
-EvtsPerSec[MatrixElems] (3) = ( 2.858628e+06                 )  sec^-1
-EvtsPerSec[MECalcOnly] (3a) = ( 2.858628e+06                 )  sec^-1
+EvtsPerSec[Rmb+ME]     (23) = ( 2.043196e+06                 )  sec^-1
+EvtsPerSec[MatrixElems] (3) = ( 2.835712e+06                 )  sec^-1
+EvtsPerSec[MECalcOnly] (3a) = ( 2.835712e+06                 )  sec^-1
 MeanMatrixElemValue         = ( 1.371706e-02 +- 3.270315e-06 )  GeV^0
-TOTAL       :     3.509207 sec
+TOTAL       :     3.479638 sec
 INFO: No Floating Point Exceptions have been reported
-    10,205,028,097      cycles                           #    2.901 GHz                    
-    19,707,283,623      instructions                     #    1.93  insn per cycle         
-       3.518316321 seconds time elapsed
+    10,002,988,331      cycles                           #    2.871 GHz                    
+    19,601,442,945      instructions                     #    1.96  insn per cycle         
+       3.484968912 seconds time elapsed
 =Symbols in CPPProcess_cpp.o= (~sse4:    0) (avx2: 1946) (512y:    0) (512z:    0)
 -------------------------------------------------------------------------
 runTest /data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/build.avx2_d_inl0_hrd0/runTest_cpp.exe
@@ -169,15 +169,15 @@ Process                     = SIGMA_SM_EPEM_MUPMUM_CPP [gcc 11.3.1] [inlineHel=0
 Workflow summary            = CPP:DBL+CXS:CURHST+RMBHST+MESHST/512y+CXVBRK
 FP precision                = DOUBLE (NaN/abnormal=0, zero=0)
 Internal loops fptype_sv    = VECTOR[4] ('512y': AVX512, 256bit) [cxtype_ref=YES]
-EvtsPerSec[Rmb+ME]     (23) = ( 2.068954e+06                 )  sec^-1
-EvtsPerSec[MatrixElems] (3) = ( 2.924439e+06                 )  sec^-1
-EvtsPerSec[MECalcOnly] (3a) = ( 2.924439e+06                 )  sec^-1
+EvtsPerSec[Rmb+ME]     (23) = ( 2.065045e+06                 )  sec^-1
+EvtsPerSec[MatrixElems] (3) = ( 2.908107e+06                 )  sec^-1
+EvtsPerSec[MECalcOnly] (3a) = ( 2.908107e+06                 )  sec^-1
 MeanMatrixElemValue         = ( 1.371706e-02 +- 3.270315e-06 )  GeV^0
-TOTAL       :     3.473859 sec
+TOTAL       :     3.447676 sec
 INFO: No Floating Point Exceptions have been reported
-    10,004,130,884      cycles                           #    2.873 GHz                    
-    19,357,111,804      instructions                     #    1.93  insn per cycle         
-       3.483068816 seconds time elapsed
+     9,813,749,852      cycles                           #    2.843 GHz                    
+    19,249,476,875      instructions                     #    1.96  insn per cycle         
+       3.452987591 seconds time elapsed
 =Symbols in CPPProcess_cpp.o= (~sse4:    0) (avx2: 1685) (512y:  178) (512z:    0)
 -------------------------------------------------------------------------
 runTest /data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/build.512y_d_inl0_hrd0/runTest_cpp.exe
@@ -198,15 +198,15 @@ Process                     = SIGMA_SM_EPEM_MUPMUM_CPP [gcc 11.3.1] [inlineHel=0
 Workflow summary            = CPP:DBL+CXS:CURHST+RMBHST+MESHST/512z+CXVBRK
 FP precision                = DOUBLE (NaN/abnormal=0, zero=0)
 Internal loops fptype_sv    = VECTOR[8] ('512z': AVX512, 512bit) [cxtype_ref=YES]
-EvtsPerSec[Rmb+ME]     (23) = ( 1.804457e+06                 )  sec^-1
-EvtsPerSec[MatrixElems] (3) = ( 2.421604e+06                 )  sec^-1
-EvtsPerSec[MECalcOnly] (3a) = ( 2.421604e+06                 )  sec^-1
+EvtsPerSec[Rmb+ME]     (23) = ( 1.786232e+06                 )  sec^-1
+EvtsPerSec[MatrixElems] (3) = ( 2.368079e+06                 )  sec^-1
+EvtsPerSec[MECalcOnly] (3a) = ( 2.368079e+06                 )  sec^-1
 MeanMatrixElemValue         = ( 1.371706e-02 +- 3.270315e-06 )  GeV^0
-TOTAL       :     3.921670 sec
+TOTAL       :     3.926479 sec
 INFO: No Floating Point Exceptions have been reported
-     8,766,336,363      cycles                           #    2.231 GHz                    
-    15,830,799,810      instructions                     #    1.81  insn per cycle         
-       3.930866073 seconds time elapsed
+     8,570,213,038      cycles                           #    2.180 GHz                    
+    15,723,160,890      instructions                     #    1.83  insn per cycle         
+       3.931625600 seconds time elapsed
 =Symbols in CPPProcess_cpp.o= (~sse4:    0) (avx2:  880) (512y:  156) (512z: 1257)
 -------------------------------------------------------------------------
 runTest /data/avalassi/GPU2023/madgraph4gpuX/epochX/cudacpp/ee_mumu.mad/SubProcesses/P1_epem_mupmum/build.512z_d_inl0_hrd0/runTest_cpp.exe