diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..938c81f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +405,12.0974,8.79032,12.8804 +1566,46.2209,9.0806,49.3488 +6183,181.159,9.20569,189.324 +12339,342.937,9.06822,356.197 +24678,626.709,8.08964,656.577 +49329,971.099,7.8621,1058.14 +98631,1417.29,8.33524,1371.79 +197262,1662.67,7.19463,1655.15 +394524,1623.27,5.15081,1670.4 +577935,1724.22,5.04846,1773.47 +1155843,1887.69,4.83564,1913.84 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..e015e2b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +405,46.2209,9.0806,49.3488 +1566,113.68995,9.07441,119.3364 +6183,181.159,9.06822,189.324 +12339,342.937,9.06822,356.197 +24678,626.709,8.33524,656.577 +49329,971.099,8.08964,1058.14 +98631,1417.29,7.8621,1371.79 +197262,1623.27,7.19463,1655.15 +394524,1662.67,5.15081,1670.4 +577935,1693.4450000000002,5.099635,1721.935 +1155843,1724.22,5.04846,1773.47 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_flops_raw.csv new file mode 100644 index 0000000..a04b9a4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_flops_raw.csv @@ -0,0 +1,12 @@ +Problem 
size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +405,18.0915,13.1459,19.2625 +1566,69.2993,13.6146,73.989 +6183,271.794,13.8113,284.043 +12339,514.567,13.6066,534.463 +24678,940.413,12.139,985.231 +49329,1457.23,11.7979,1587.84 +98631,2126.82,12.508,2058.54 +197262,2495.05,10.7965,2483.77 +394524,2435.93,7.72949,2506.66 +577935,2587.42,7.57591,2661.33 +1155843,2832.74,7.25656,2871.99 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_flops_smoothed.csv new file mode 100644 index 0000000..edaf351 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_DIFFUSION3DPA_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +405,69.2993,13.6146,73.989 +1566,170.54665,13.6106,179.01600000000002 +6183,271.794,13.6066,284.043 +12339,514.567,13.6066,534.463 +24678,940.413,12.508,985.231 +49329,1457.23,12.139,1587.84 +98631,2126.82,11.7979,2058.54 +197262,2435.93,10.7965,2483.77 +394524,2495.05,7.72949,2506.66 +577935,2541.235,7.6527,2583.995 +1155843,2587.42,7.57591,2661.33 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_bandwidth_raw.csv new file mode 100644 index 0000000..8b54d46 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,0.197104,0.0229243,0.196309 +3375,0.802097,0.0221669,0.801571 +17576,2.64385,0.0217854,2.65177 +35937,2.7385,0.021533,2.74046 +79507,3.30983,0.021455,3.29378 +166375,3.43745,0.0213676,3.42995 +343000,3.568,0.0213174,3.55459 +704969,3.6228,0.0213042,3.60819 +1442897,3.65749,0.0211735,3.64609 +2146689,3.67155,0.0212504,3.66075 +4410944,3.67202,0.0211402,3.65886 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..384c5f5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,0.802097,0.0221669,0.801571 +3375,1.7229735,0.02197615,1.7266705 +17576,2.64385,0.0217854,2.65177 +35937,2.7385,0.021533,2.74046 +79507,3.30983,0.021455,3.29378 +166375,3.43745,0.0213676,3.42995 +343000,3.568,0.0213174,3.55459 +704969,3.6228,0.0213042,3.60819 +1442897,3.65749,0.0212504,3.64609 +2146689,3.66452,0.02121195,3.652475 +4410944,3.67155,0.0211735,3.65886 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_flops_raw.csv new file mode 100644 index 0000000..c62dbf2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,80.6755,9.38302,80.35 +3375,339.719,9.38853,339.496 +17576,1140.57,9.39835,1143.99 +35937,1188.01,9.34143,1188.86 +79507,1442.95,9.35348,1435.95 +166375,1503.98,9.34894,1500.7 +343000,1565.47,9.35308,1559.59 +704969,1593.03,9.36795,1586.61 +1442897,1611.09,9.32671,1606.07 +2146689,1618.58,9.36815,1613.82 +4410944,1620.76,9.33091,1614.96 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_flops_smoothed.csv new file mode 100644 index 0000000..8bcd8d8 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_EDGE3D_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,339.719,9.38853,339.496 
+3375,740.1445,9.385774999999999,741.7429999999999 +17576,1140.57,9.38302,1143.99 +35937,1188.01,9.35348,1188.86 +79507,1442.95,9.35308,1435.95 +166375,1503.98,9.35308,1500.7 +343000,1565.47,9.35308,1559.59 +704969,1593.03,9.35308,1586.61 +1442897,1611.09,9.35308,1606.07 +2146689,1614.835,9.34943,1609.945 +4410944,1618.58,9.33091,1613.82 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_bandwidth_raw.csv new file mode 100644 index 0000000..de0283f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +417,6.49675,48.7956,6.50062 +1667,25.3733,47.0544,25.255 +6667,100.275,47.0702,99.7526 +13334,199.931,47.2522,199.262 +26667,391.454,48.6333,390.714 +53334,727.103,37.0917,724.576 +106667,1325.45,33.7378,1326.25 +213334,2240.46,32.8315,2251.23 +426667,3105.64,30.7464,3097.01 +625000,2943.18,26.281,2934.85 +1250000,2643.02,18.7451,2646.71 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_bandwidth_smoothed.csv new file mode 100644 index 0000000..2b5d700 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +417,25.3733,47.0702,25.255 +1667,62.82415,47.1612,62.5038 +6667,100.275,47.2522,99.7526 +13334,199.931,47.0702,199.262 +26667,391.454,47.0702,390.714 +53334,727.103,37.0917,724.576 +106667,1325.45,33.7378,1326.25 +213334,2240.46,32.8315,2251.23 +426667,2643.02,30.7464,2646.71 +625000,2793.1,28.5137,2790.7799999999997 +1250000,2943.18,26.281,2934.85 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_flops_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_flops_raw.csv new file mode 100644 index 0000000..e4fc7cd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +417,1.77625,13.341,1.77731 +1667,6.93723,12.865,6.90487 +6667,27.4158,12.8693,27.273 +13334,54.6624,12.9191,54.4796 +26667,107.026,13.2967,106.824 +53334,198.795,10.1411,198.104 +106667,362.386,9.22412,362.606 +213334,612.557,8.97634,615.5 +426667,849.103,8.40628,846.742 +625000,804.683,7.18539,802.407 +1250000,722.619,5.12504,723.629 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_flops_smoothed.csv new file mode 100644 index 0000000..d6f6d65 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_ENERGY_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +417,6.93723,12.8693,6.90487 +1667,17.176515000000002,12.894200000000001,17.088935 +6667,27.4158,12.9191,27.273 +13334,54.6624,12.8693,54.4796 +26667,107.026,12.8693,106.824 +53334,198.795,10.1411,198.104 +106667,362.386,9.22412,362.606 +213334,612.557,8.97634,615.5 +426667,722.619,8.40628,723.629 +625000,763.6510000000001,7.795835,763.018 +1250000,804.683,7.18539,802.407 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_bandwidth_raw.csv new file mode 100644 index 0000000..99e4c87 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_CUDA-block_128,Base_Seq-default,RAJA_CUDA-block_128 +31104,14.928049999999999,0.6055889999999999,10.06305 +73728,24.5073,0.5725,16.3838 +144000,34.1906,0.578163,23.3096 
+248832,44.7641,0.599649,30.9269 +395136,46.0821,0.602929,36.1339 +589824,53.0155,0.594489,42.4744 +1152000,58.4488,0.566533,48.8716 +1533312,61.8105,0.521593,52.502 +1990656,65.9083,0.509787,55.1352 +2530944,66.4358,0.498932,57.3794 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_bandwidth_smoothed.csv new file mode 100644 index 0000000..da72393 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_CUDA-block_128,Base_Seq-default,RAJA_CUDA-block_128 +31104,19.745,0.586811,13.2291 +73728,24.5073,0.595459,16.3838 +144000,34.1906,0.599649,23.3096 +248832,44.7641,0.594489,30.9269 +395136,46.0821,0.594489,36.1339 +589824,53.0155,0.594489,42.4744 +1152000,58.4488,0.566533,48.8716 +1533312,61.8105,0.521593,52.502 +1990656,63.859399999999994,0.51569,53.8186 +2530944,65.9083,0.509787,55.1352 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_flops_raw.csv new file mode 100644 index 0000000..7722ab4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_CUDA-block_128,Base_Seq-default,RAJA_CUDA-block_128 +31104,83.12595,3.37219,56.03545 +73728,132.791,3.10205,88.7746 +144000,182.372,3.08391,124.333 +248832,236.347,3.16604,163.289 +395136,241.569,3.16064,189.419 +589824,276.445,3.09991,221.479 +1152000,302.549,2.93255,252.975 +1533312,319.107,2.69281,271.05 +1990656,339.519,2.62611,284.022 +2530944,341.606,2.56545,295.038 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_flops_smoothed.csv new file mode 100644 index 0000000..9f306fb --- /dev/null 
+++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_FEMSWEEP_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_CUDA-block_128,Base_Seq-default,RAJA_CUDA-block_128 +31104,108.1106,3.208915,72.43655000000001 +73728,132.791,3.16604,88.7746 +144000,182.372,3.16064,124.333 +248832,236.347,3.10205,163.289 +395136,241.569,3.09991,189.419 +589824,276.445,3.09991,221.479 +1152000,302.549,2.93255,252.975 +1533312,319.107,2.69281,271.05 +1990656,329.313,2.65946,277.536 +2530944,339.519,2.62611,284.022 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_bandwidth_raw.csv new file mode 100644 index 0000000..ca12900 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +1728,0.511948,0.0515405,0.517215 +5832,1.71116,0.0532159,1.72196 +17576,4.83834,0.0532582,4.94421 +39304,9.85649,0.0530228,10.1052 +74088,15.1717,0.0530315,11.2695 +140608,15.8649,0.0529853,13.8482 +287496,17.2826,0.0527919,14.9171 +551368,18.8845,0.0527725,15.7543 +1124864,19.8885,0.0527279,16.5051 +1643032,20.0555,0.0526587,16.6066 +3241792,20.4644,0.0526191,16.9192 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv new file mode 100644 index 0000000..33eca74 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +1728,1.71116,0.0532159,1.72196 +5832,3.27475,0.053119349999999996,3.333085 +17576,4.83834,0.0530315,4.94421 +39304,9.85649,0.0530315,10.1052 +74088,15.1717,0.0530228,11.2695 +140608,15.8649,0.0529853,13.8482 
+287496,17.2826,0.0527919,14.9171 +551368,18.8845,0.0527725,15.7543 +1124864,19.8885,0.0527279,16.5051 +1643032,19.972,0.0526933,16.55585 +3241792,20.0555,0.0526587,16.6066 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_flops_raw.csv new file mode 100644 index 0000000..2c6328d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +1728,40.5816,4.08557,40.9991 +5832,137.471,4.27525,138.338 +17576,391.7,4.31165,400.271 +39304,801.073,4.30936,821.286 +74088,1235.97,4.32023,918.07 +140608,1294.89,4.32463,1130.28 +287496,1412.94,4.31601,1219.55 +551368,1545.74,4.31956,1289.52 +1124864,1629.6,4.32034,1352.37 +1643032,1644.02,4.31662,1361.3 +3241792,1678.67,4.31628,1387.86 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_flops_smoothed.csv new file mode 100644 index 0000000..3480b0e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_INTSC_HEXRECT_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +1728,137.471,4.27525,138.338 +5832,264.5855,4.292305,269.3045 +17576,391.7,4.30936,400.271 +39304,801.073,4.31165,821.286 +74088,1235.97,4.31601,918.07 +140608,1294.89,4.31956,1130.28 +287496,1412.94,4.32023,1219.55 +551368,1545.74,4.31956,1289.52 +1124864,1629.6,4.31662,1352.37 +1643032,1636.81,4.31809,1356.835 +3241792,1644.02,4.31662,1361.3 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_bandwidth_raw.csv new file mode 100644 index 0000000..4b2db93 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-compile_time_block_stride_loop_64 +196608,13.5704,0.189198,19.1632,20.2873 +389120,26.8231,0.189853,38.096,40.0042 +778240,53.0688,0.192069,75.3143,79.797 +1556480,94.9269,0.191844,108.856,117.855 +3108864,162.839,0.187071,152.047,164.577 +6213632,179.945,0.186147,175.507,192.851 +9101312,188.677,0.185918,180.851,198.776 +18198528,218.752,0.185614,201.752,224.806 +24260608,220.49,0.184607,201.658,224.953 +30326784,222.162,0.186821,202.225,225.791 +36392960,228.994,0.184956,208.098,214.629 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_bandwidth_smoothed.csv new file mode 100644 index 0000000..0c271f7 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-compile_time_block_stride_loop_64 +196608,26.8231,0.189853,38.096,40.0042 +389120,39.94595,0.19084849999999998,56.70515,59.9006 +778240,53.0688,0.189853,75.3143,79.797 +1556480,94.9269,0.189853,108.856,117.855 +3108864,162.839,0.187071,152.047,164.577 +6213632,179.945,0.186147,175.507,192.851 +9101312,188.677,0.185918,180.851,198.776 +18198528,218.752,0.185918,201.658,224.806 +24260608,220.49,0.185614,201.752,224.806 +30326784,221.32600000000002,0.185285,201.9885,224.8795 +36392960,222.162,0.184956,202.225,224.953 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_flops_raw.csv new file mode 100644 index 0000000..141b654 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-compile_time_block_stride_loop_64 +196608,12.371,0.172475,17.4694,18.4941 +389120,24.4534,0.173081,34.7305,36.4701 +778240,48.3817,0.175105,68.6625,72.7492 +1556480,86.5439,0.174902,99.2427,107.447 +3108864,148.459,0.170552,138.621,150.044 +6213632,164.056,0.16971,160.009,175.822 +9101312,172.016,0.169502,164.882,181.224 +18198528,199.437,0.169224,183.938,204.956 +24260608,201.02,0.168307,183.852,205.09 +30326784,202.545,0.170325,184.368,205.854 +36392960,208.774,0.168625,189.723,195.678 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_flops_smoothed.csv new file mode 100644 index 0000000..dac9ea2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DEA_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-compile_time_block_stride_loop_64 +196608,24.4534,0.173081,34.7305,36.4701 +389120,36.41755,0.17399150000000002,51.6965,54.60965 +778240,48.3817,0.173081,68.6625,72.7492 +1556480,86.5439,0.173081,99.2427,107.447 +3108864,148.459,0.170552,138.621,150.044 +6213632,164.056,0.16971,160.009,175.822 +9101312,172.016,0.169502,164.882,181.224 +18198528,199.437,0.169502,183.852,204.956 +24260608,201.02,0.169224,183.938,204.956 +30326784,201.7825,0.1689245,184.153,205.023 +36392960,202.545,0.168625,184.368,205.09 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv new file mode 100644 index 0000000..205c707 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +729,15.994,5.63123,15.9327 +3375,78.6741,5.57301,78.0764 +9261,195.668,5.48866,198.452 +19683,342.273,5.42675,339.859 +35937,493.318,5.50448,492.121 +68921,646.287,5.32245,641.236 +132651,753.564,5.48991,756.865 +250047,788.718,5.13006,788.566 +531441,823.891,4.66743,823.152 +753571,852.829,5.21751,852.44 +1442897,854.982,4.43834,854.334 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv new file mode 100644 index 0000000..61bfc3f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +729,78.6741,5.57301,78.0764 +3375,137.17105,5.530835,138.26420000000002 +9261,195.668,5.50448,198.452 +19683,342.273,5.48866,339.859 +35937,493.318,5.48866,492.121 +68921,646.287,5.42675,641.236 +132651,753.564,5.32245,756.865 +250047,788.718,5.21751,788.566 +531441,823.891,5.13006,823.152 +753571,838.3599999999999,4.898745,837.796 +1442897,852.829,4.66743,852.44 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_flops_raw.csv new file mode 100644 index 0000000..cbdceb6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +729,31.9709,11.2564,31.8483 +3375,163.533,11.5841,162.29 +9261,412.739,11.5777,418.612 +19683,727.574,11.5357,722.443 +35937,1053.65,11.7567,1051.09 +68921,1386.0,11.4143,1375.17 +132651,1621.29,11.8115,1628.39 
+250047,1701.15,11.0648,1700.82 +531441,1781.14,10.0903,1779.54 +753571,1845.33,11.2895,1844.49 +1442897,1852.55,9.61689,1851.15 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv new file mode 100644 index 0000000..d2030fc --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +729,163.533,11.5777,162.29 +3375,288.13599999999997,11.5567,290.451 +9261,412.739,11.5777,418.612 +19683,727.574,11.5777,722.443 +35937,1053.65,11.5777,1051.09 +68921,1386.0,11.5357,1375.17 +132651,1621.29,11.4143,1628.39 +250047,1701.15,11.2895,1700.82 +531441,1781.14,11.0648,1779.54 +753571,1813.2350000000001,10.577549999999999,1812.0149999999999 +1442897,1845.33,10.0903,1844.49 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..ca39381 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_64,Base_CUDA-runtime_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-direct_64,RAJA_CUDA-runtime_block_stride_loop_64 +5376,10.3695,6.36613,3.89184,6.69729,10.9591,6.75047 +21312,40.5998,25.2277,3.97645,26.1748,41.7224,26.2766 +85056,159.182,96.3617,4.09511,101.046,166.765,101.436 +169920,279.378,178.801,4.1078,186.69,291.695,187.242 +339840,430.166,304.323,4.06186,312.599,446.023,312.635 +679680,568.529,380.403,4.04509,380.057,557.927,379.635 +1359360,681.084,458.687,4.14675,454.106,672.94,453.847 +2718720,729.4,500.232,4.08355,488.989,724.725,489.954 
+5437248,758.443,521.457,3.72476,492.28,749.481,492.59 +7964736,776.721,533.27,3.74583,502.632,767.326,502.798 +15929280,797.352,547.173,3.68644,514.449,788.629,514.867 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..37756c6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_64,Base_CUDA-runtime_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-direct_64,RAJA_CUDA-runtime_block_stride_loop_64 +5376,40.5998,25.2277,3.97645,26.1748,41.7224,26.2766 +21312,99.89089999999999,60.7947,4.03578,63.610400000000006,104.24369999999999,63.856300000000005 +85056,159.182,96.3617,4.06186,101.046,166.765,101.436 +169920,279.378,178.801,4.06186,186.69,291.695,187.242 +339840,430.166,304.323,4.09511,312.599,446.023,312.635 +679680,568.529,380.403,4.08355,380.057,557.927,379.635 +1359360,681.084,458.687,4.06186,454.106,672.94,453.847 +2718720,729.4,500.232,4.04509,488.989,724.725,489.954 +5437248,758.443,521.457,3.74583,492.28,749.481,492.59 +7964736,767.582,527.3634999999999,3.735295,497.456,758.4035,497.69399999999996 +15929280,776.721,533.27,3.72476,502.632,767.326,502.798 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_flops_raw.csv new file mode 100644 index 0000000..9483ffc --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_64,Base_CUDA-runtime_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-direct_64,RAJA_CUDA-runtime_block_stride_loop_64 
+5376,33.9294,20.8302,12.7342,21.9138,35.8586,22.0878 +21312,133.032,82.6628,13.0295,85.7661,136.71,86.0997 +85056,521.775,315.859,13.4231,331.214,546.63,332.491 +169920,915.812,586.117,13.4656,611.976,956.187,613.788 +339840,1410.14,997.613,13.3154,1024.74,1462.13,1024.86 +679680,1863.74,1247.03,13.2606,1245.9,1828.99,1244.51 +1359360,2232.74,1503.67,13.5939,1488.66,2206.04,1487.81 +2718720,2391.14,1639.87,13.3868,1603.02,2375.81,1606.18 +5437248,2486.35,1709.46,12.2106,1613.81,2456.97,1614.83 +7964736,2546.27,1748.18,12.2797,1647.75,2515.47,1648.29 +15929280,2613.91,1793.76,12.085,1686.48,2585.31,1687.86 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_flops_smoothed.csv new file mode 100644 index 0000000..f095778 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_MASSVEC3DPA_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_64,Base_CUDA-runtime_block_stride_loop_64,Base_Seq-default,RAJA_CUDA-cached_block_stride_loop_64,RAJA_CUDA-direct_64,RAJA_CUDA-runtime_block_stride_loop_64 +5376,133.032,82.6628,13.0295,85.7661,136.71,86.0997 +21312,327.4035,199.2609,13.2263,208.49005,341.67,209.29534999999998 +85056,521.775,315.859,13.3154,331.214,546.63,332.491 +169920,915.812,586.117,13.3154,611.976,956.187,613.788 +339840,1410.14,997.613,13.4231,1024.74,1462.13,1024.86 +679680,1863.74,1247.03,13.3868,1245.9,1828.99,1244.51 +1359360,2232.74,1503.67,13.3154,1488.66,2206.04,1487.81 +2718720,2391.14,1639.87,13.2606,1603.02,2375.81,1606.18 +5437248,2486.35,1709.46,12.2797,1613.81,2456.97,1614.83 +7964736,2516.31,1728.8200000000002,12.245149999999999,1630.78,2486.22,1631.56 +15929280,2546.27,1748.18,12.2106,1647.75,2515.47,1648.29 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv new file mode 100644 index 0000000..6a4e355 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +1000,12.2151,16.4161,12.3837 +5832,67.436,15.1809,68.5372 +27000,270.556,14.9014,271.53 +54872,429.436,14.3179,428.486 +117649,621.341,13.8423,621.106 +238328,725.36,15.265,725.675 +493039,835.056,15.2577,832.406 +1000000,892.939,14.9065,891.696 +2048383,871.264,10.7769,870.975 +2985984,883.048,9.88076,883.978 +6028568,912.551,9.65281,912.545 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..ad663fc --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +1000,67.436,15.1809,68.5372 +5832,168.99599999999998,15.04115,170.03359999999998 +27000,270.556,14.9014,271.53 +54872,429.436,14.9014,428.486 +117649,621.341,14.9014,621.106 +238328,725.36,14.9065,725.675 +493039,835.056,14.9065,832.406 +1000000,871.264,14.9065,870.975 +2048383,883.048,10.7769,883.978 +2985984,887.9935,10.32883,887.837 +6028568,883.048,9.88076,883.978 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv new file mode 100644 index 0000000..2c5503e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv @@ -0,0 +1,12 @@ +Problem 
size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +1000,3.16501,4.25353,3.20872 +5832,18.717,4.21348,19.0226 +27000,77.6896,4.27892,77.9693 +54872,124.635,4.15548,124.359 +117649,181.954,4.05361,181.886 +238328,213.795,4.49925,213.888 +493039,247.421,4.52073,246.636 +1000000,265.634,4.43443,265.264 +2048383,260.018,3.21622,259.931 +2985984,263.904,2.95292,264.181 +6028568,273.316,2.89109,273.314 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv new file mode 100644 index 0000000..0a371cb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +1000,18.717,4.25353,19.0226 +5832,48.2033,4.233504999999999,48.49595 +27000,77.6896,4.21348,77.9693 +54872,124.635,4.21348,124.359 +117649,181.954,4.27892,181.886 +238328,213.795,4.43443,213.888 +493039,247.421,4.43443,246.636 +1000000,260.018,4.43443,259.931 +2048383,263.904,3.21622,264.181 +2985984,264.769,3.0845700000000003,264.72249999999997 +6028568,263.904,2.95292,264.181 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_bandwidth_raw.csv new file mode 100644 index 0000000..69efd20 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,16.812,4.748,17.1316 +3375,66.2827,4.63757,69.0584 +17576,236.888,4.47421,282.851 +35937,438.487,4.4415,456.743 +79507,801.284,4.36589,843.566 +166375,1161.75,4.4135,1359.29 +343000,1425.42,4.48746,1946.07 +704969,2057.77,4.37656,2367.49 +1442897,1902.98,4.06895,1987.7 +2146689,1944.11,4.01726,2091.45 
+4410944,2036.84,3.88335,2212.54 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..396bc52 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,66.2827,4.63757,69.0584 +3375,151.58535,4.55589,175.9547 +17576,236.888,4.47421,282.851 +35937,438.487,4.4415,456.743 +79507,801.284,4.4415,843.566 +166375,1161.75,4.4135,1359.29 +343000,1425.42,4.37656,1946.07 +704969,1902.98,4.37656,1987.7 +1442897,1944.11,4.06895,2091.45 +2146689,1990.475,4.043105000000001,2151.995 +4410944,1944.11,4.01726,2091.45 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_flops_raw.csv new file mode 100644 index 0000000..a85bfa5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +512,37.4941,10.589,38.2069 +3375,152.965,10.7024,159.37 +17576,556.835,10.5172,664.877 +35937,1036.49,10.4987,1079.64 +79507,1903.39,10.3709,2003.83 +166375,2769.61,10.5217,3240.53 +343000,3407.7,10.728,4652.4 +704969,4930.32,10.486,5672.4 +1442897,4567.41,9.76601,4770.74 +2146689,4669.88,9.64971,5023.79 +4410944,4898.57,9.33941,5321.13 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_flops_smoothed.csv new file mode 100644 index 0000000..4ce9ee2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/Apps_VOL3D_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 
+512,152.965,10.589,159.37 +3375,354.90000000000003,10.5531,412.1235 +17576,556.835,10.5172,664.877 +35937,1036.49,10.5172,1079.64 +79507,1903.39,10.5172,2003.83 +166375,2769.61,10.4987,3240.53 +343000,3407.7,10.486,4652.4 +704969,4567.41,10.486,4770.74 +1442897,4669.88,9.76601,5023.79 +2146689,4784.225,9.70786,5172.46 +4410944,4669.88,9.64971,5023.79 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_DIFFUSION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_DIFFUSION3DPA.csv new file mode 100644 index 0000000..a5ca480 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_DIFFUSION3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DIFFUSION3DPA-Base_Seq-default,405.0,13.1459,8.79032 +Apps_DIFFUSION3DPA-Base_CUDA-block_64,197262.0,2495.05,1662.67 +Apps_DIFFUSION3DPA-RAJA_CUDA-block_64,197262.0,2483.77,1655.15 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_EDGE3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_EDGE3D.csv new file mode 100644 index 0000000..aae5034 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_EDGE3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_EDGE3D-Base_Seq-default,512.0,9.38302,0.0229243 +Apps_EDGE3D-Base_CUDA-block_256,166375.0,1503.98,3.43745 +Apps_EDGE3D-RAJA_CUDA-block_256,166375.0,1500.7,3.42995 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_ENERGY.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_ENERGY.csv new file mode 100644 index 0000000..add0c02 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_ENERGY.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_ENERGY-Base_Seq-default,417.0,13.341,48.7956 +Apps_ENERGY-Base_CUDA-block_256,625000.0,804.683,2943.18 +Apps_ENERGY-RAJA_CUDA-block_256,426667.0,846.742,3097.01 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_FEMSWEEP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_FEMSWEEP.csv new file mode 100644 index 0000000..dbf40c9 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_FEMSWEEP.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_FEMSWEEP-Base_Seq-default,31104.0,3.31578,0.595459 +Apps_FEMSWEEP-Base_CUDA-block_128,1533312.0,319.107,61.8105 +Apps_FEMSWEEP-RAJA_CUDA-block_128,1533312.0,271.05,52.502 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_INTSC_HEXRECT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_INTSC_HEXRECT.csv new file mode 100644 index 0000000..7c83aa5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_INTSC_HEXRECT.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_INTSC_HEXRECT-Base_Seq-default,1728.0,4.08557,0.0515405 +Apps_INTSC_HEXRECT-Base_CUDA-block_64,551368.0,1545.74,18.8845 +Apps_INTSC_HEXRECT-RAJA_CUDA-block_64,551368.0,1289.52,15.7543 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASS3DEA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASS3DEA.csv new file mode 100644 index 0000000..8b1ba38 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASS3DEA.csv @@ -0,0 +1,5 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MASS3DEA-Base_Seq-default,196608.0,0.172475,0.189198 +Apps_MASS3DEA-Base_CUDA-compile_time_block_stride_loop_64,18198528.0,199.437,218.752 +Apps_MASS3DEA-RAJA_CUDA-compile_time_block_stride_loop_64,18198528.0,204.956,224.806 +Apps_MASS3DEA-RAJA_CUDA-cached_block_stride_loop_64,18198528.0,183.938,201.752 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASS3DPA_ATOMIC.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASS3DPA_ATOMIC.csv new file mode 100644 index 0000000..503371e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASS3DPA_ATOMIC.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MASS3DPA_ATOMIC-Base_Seq-default,729.0,11.2564,5.63123 +Apps_MASS3DPA_ATOMIC-Base_CUDA-block_64,250047.0,1701.15,788.718 +Apps_MASS3DPA_ATOMIC-RAJA_CUDA-block_64,250047.0,1700.82,788.566 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASSVEC3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASSVEC3DPA.csv new file mode 100644 index 0000000..4941eaa --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_MASSVEC3DPA.csv @@ -0,0 +1,7 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MASSVEC3DPA-Base_Seq-default,5376.0,12.7342,3.89184 +Apps_MASSVEC3DPA-Base_CUDA-runtime_block_stride_loop_64,2718720.0,1639.87,500.232 +Apps_MASSVEC3DPA-Base_CUDA-direct_64,2718720.0,2391.14,729.4 +Apps_MASSVEC3DPA-RAJA_CUDA-runtime_block_stride_loop_64,1359360.0,1487.81,453.847 +Apps_MASSVEC3DPA-RAJA_CUDA-direct_64,2718720.0,2375.81,724.725 +Apps_MASSVEC3DPA-RAJA_CUDA-cached_block_stride_loop_64,1359360.0,1488.66,454.106 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_NODAL_ACCUMULATION_3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_NODAL_ACCUMULATION_3D.csv new file mode 100644 index 0000000..01186d7 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_NODAL_ACCUMULATION_3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_NODAL_ACCUMULATION_3D-Base_Seq-default,1000.0,4.25353,16.4161 +Apps_NODAL_ACCUMULATION_3D-Base_CUDA-block_256,493039.0,247.421,835.056 +Apps_NODAL_ACCUMULATION_3D-RAJA_CUDA-block_256,493039.0,246.636,832.406 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_VOL3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_VOL3D.csv new file mode 100644 index 0000000..e13b272 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/Apps_VOL3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_VOL3D-Base_Seq-default,512.0,10.589,4.748 +Apps_VOL3D-Base_CUDA-block_256,704969.0,4930.32,2057.77 +Apps_VOL3D-RAJA_CUDA-block_256,343000.0,4652.4,1946.07 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/combined_fom.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/combined_fom.csv new file mode 100644 index 0000000..db12ccb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/FOM/combined_fom.csv @@ -0,0 +1,35 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_DIFFUSION3DPA-Base_CUDA-block_64,197262.0,2495.05,1662.67 +Apps_DIFFUSION3DPA-Base_Seq-default,405.0,13.1459,8.79032 +Apps_DIFFUSION3DPA-RAJA_CUDA-block_64,197262.0,2483.77,1655.15 +Apps_EDGE3D-Base_CUDA-block_256,166375.0,1503.98,3.43745 +Apps_EDGE3D-Base_Seq-default,512.0,9.38302,0.0229243 +Apps_EDGE3D-RAJA_CUDA-block_256,166375.0,1500.7,3.42995 +Apps_ENERGY-Base_CUDA-block_256,625000.0,804.683,2943.18 +Apps_ENERGY-Base_Seq-default,417.0,13.341,48.7956 +Apps_ENERGY-RAJA_CUDA-block_256,426667.0,846.742,3097.01 +Apps_FEMSWEEP-Base_CUDA-block_128,1533312.0,319.107,61.8105 +Apps_FEMSWEEP-Base_Seq-default,31104.0,3.31578,0.595459 +Apps_FEMSWEEP-RAJA_CUDA-block_128,1533312.0,271.05,52.502 +Apps_INTSC_HEXRECT-Base_CUDA-block_64,551368.0,1545.74,18.8845 +Apps_INTSC_HEXRECT-Base_Seq-default,1728.0,4.08557,0.0515405 +Apps_INTSC_HEXRECT-RAJA_CUDA-block_64,551368.0,1289.52,15.7543 +Apps_MASS3DEA-Base_CUDA-compile_time_block_stride_loop_64,18198528.0,199.437,218.752 +Apps_MASS3DEA-Base_Seq-default,196608.0,0.172475,0.189198 +Apps_MASS3DEA-RAJA_CUDA-cached_block_stride_loop_64,18198528.0,183.938,201.752 +Apps_MASS3DEA-RAJA_CUDA-compile_time_block_stride_loop_64,18198528.0,204.956,224.806 +Apps_MASS3DPA_ATOMIC-Base_CUDA-block_64,250047.0,1701.15,788.718 +Apps_MASS3DPA_ATOMIC-Base_Seq-default,729.0,11.2564,5.63123 +Apps_MASS3DPA_ATOMIC-RAJA_CUDA-block_64,250047.0,1700.82,788.566 +Apps_MASSVEC3DPA-Base_CUDA-direct_64,2718720.0,2391.14,729.4 +Apps_MASSVEC3DPA-Base_CUDA-runtime_block_stride_loop_64,2718720.0,1639.87,500.232 +Apps_MASSVEC3DPA-Base_Seq-default,5376.0,12.7342,3.89184 +Apps_MASSVEC3DPA-RAJA_CUDA-cached_block_stride_loop_64,1359360.0,1488.66,454.106 +Apps_MASSVEC3DPA-RAJA_CUDA-direct_64,2718720.0,2375.81,724.725 +Apps_MASSVEC3DPA-RAJA_CUDA-runtime_block_stride_loop_64,1359360.0,1487.81,453.847 +Apps_NODAL_ACCUMULATION_3D-Base_CUDA-block_256,493039.0,247.421,835.056 +Apps_NODAL_ACCUMULATION_3D-Base_Seq-default,1000.0,4.25353,16.4161 
+Apps_NODAL_ACCUMULATION_3D-RAJA_CUDA-block_256,493039.0,246.636,832.406 +Apps_VOL3D-Base_CUDA-block_256,704969.0,4930.32,2057.77 +Apps_VOL3D-Base_Seq-default,512.0,10.589,4.748 +Apps_VOL3D-RAJA_CUDA-block_256,343000.0,4652.4,1946.07 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/combined_table.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/combined_table.csv new file mode 100644 index 0000000..997f8ae --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/combined_table.csv @@ -0,0 +1,375 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning +Apps_DIFFUSION3DPA,Base_Seq,default,405, PASSED ,5.93228e-06,8.79032,13.1459,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,405, PASSED ,4.31058e-06,12.0974,18.0915,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,405, PASSED ,4.04854e-06,12.8804,19.2625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,394524, PASSED ,0.00982831,5.15081,7.72949,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,394524, PASSED ,3.11863e-05,1623.27,2435.93,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,394524, PASSED 
,3.03064e-05,1670.4,2506.66,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,49329, PASSED ,0.00080511,7.8621,11.7979,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,49329, PASSED ,6.51824e-06,971.099,1457.23,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,49329, PASSED ,5.98208e-06,1058.14,1587.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,577935, PASSED ,0.0146893,5.04846,7.57591,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,577935, PASSED ,4.30098e-05,1724.22,2587.42,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,577935, PASSED ,4.18154e-05,1773.47,2661.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,6183, PASSED ,8.62026e-05,9.20569,13.8113,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,6183, PASSED ,4.38042e-06,181.159,271.794,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64 
+Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,6183, PASSED ,4.19152e-06,189.324,284.043,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,98631, PASSED ,0.00151838,8.33524,12.508,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,98631, PASSED ,8.92974e-06,1417.29,2126.82,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,98631, PASSED ,9.22594e-06,1371.79,2058.54,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,1155843, PASSED ,0.0306708,4.83564,7.25656,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,1155843, PASSED ,7.85685e-05,1887.69,2832.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,1155843, PASSED ,7.74947e-05,1913.84,2871.99,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,12339, PASSED ,0.000174617,9.06822,13.6066,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,12339, PASSED 
,4.61736e-06,342.937,514.567,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,12339, PASSED ,4.44548e-06,356.197,534.463,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,1566, PASSED ,2.21484e-05,9.0806,13.6146,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,1566, PASSED ,4.3513e-06,46.2209,69.2993,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,1566, PASSED ,4.0755e-06,49.3488,73.989,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,197262, PASSED ,0.00351817,7.19463,10.7965,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_CUDA,block_64,197262, PASSED ,1.52237e-05,1662.67,2495.05,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,197262, PASSED ,1.52928e-05,1655.15,2483.77,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,24678, PASSED ,0.000391458,8.08964,12.139,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_DIFFUSION3DPA,Base_CUDA,block_64,24678, PASSED ,5.05298e-06,626.709,940.413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,24678, PASSED ,4.82312e-06,656.577,985.231,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_EDGE3D,Base_Seq,default,512, PASSED ,0.00199132,0.0229243,9.38302,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,512, PASSED ,0.000231602,0.197104,80.6755,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,512, PASSED ,0.00023254,0.196309,80.35,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,1442897, PASSED ,2.23003,0.0211735,9.32671,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,1442897, PASSED ,0.0129098,3.65749,1611.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,1442897, PASSED ,0.0129501,3.64609,1606.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,166375, PASSED ,0.280277,0.0213676,9.34894,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,166375, 
PASSED ,0.00174224,3.43745,1503.98,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,166375, PASSED ,0.00174605,3.42995,1500.7,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,2146689, PASSED ,3.26817,0.0212504,9.36815,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,2146689, PASSED ,0.0189157,3.67155,1618.58,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,2146689, PASSED ,0.0189716,3.66075,1613.82,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,17576, PASSED ,0.0353438,0.0217854,9.39835,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,17576, PASSED ,0.000291234,2.64385,1140.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,17576, PASSED ,0.000290364,2.65177,1143.99,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,343000, PASSED ,0.556814,0.0213174,9.35308,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,343000, PASSED 
,0.00332675,3.568,1565.47,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,343000, PASSED ,0.0033393,3.55459,1559.59,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,4410944, PASSED ,6.63446,0.0211402,9.33091,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,4410944, PASSED ,0.0381953,3.67202,1620.76,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,4410944, PASSED ,0.0383327,3.65886,1614.96,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,35937, PASSED ,0.0676711,0.021533,9.34143,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,35937, PASSED ,0.000532102,2.7385,1188.01,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,35937, PASSED ,0.000531721,2.74046,1188.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,3375, PASSED ,0.0085813,0.0221669,9.38853,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,3375, PASSED 
,0.000237154,0.802097,339.719,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,3375, PASSED ,0.00023731,0.801571,339.496,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,704969, PASSED ,1.10992,0.0213042,9.36795,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,704969, PASSED ,0.00652701,3.6228,1593.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,704969, PASSED ,0.00655342,3.60819,1586.61,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_EDGE3D,Base_Seq,default,79507, PASSED ,0.140297,0.021455,9.35348,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_CUDA,block_256,79507, PASSED ,0.000909437,3.30983,1442.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_EDGE3D,RAJA_CUDA,block_256,79507, PASSED ,0.000913869,3.29378,1435.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,417, PASSED ,1.71913e-06,48.7956,13.341,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,417, PASSED 
,1.2912e-05,6.49675,1.77625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,417, PASSED ,1.29043e-05,6.50062,1.77731,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,426667, PASSED ,0.00279157,30.7464,8.40628,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,426667, PASSED ,2.7637e-05,3105.64,849.103,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,426667, PASSED ,2.77141e-05,3097.01,846.742,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,53334, PASSED ,0.000289255,37.0917,10.1411,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,53334, PASSED ,1.47558e-05,727.103,198.795,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,53334, PASSED ,1.48072e-05,724.576,198.104,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,625000, PASSED ,0.00478401,26.281,7.18539,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,625000, PASSED 
,4.27187e-05,2943.18,804.683,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,625000, PASSED ,4.28399e-05,2934.85,802.407,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,6667, PASSED ,2.8493e-05,47.0702,12.8693,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,6667, PASSED ,1.3375e-05,100.275,27.4158,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,6667, PASSED ,1.3445e-05,99.7526,27.273,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,106667, PASSED ,0.000636015,33.7378,9.22412,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,106667, PASSED ,1.6189e-05,1325.45,362.386,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,106667, PASSED ,1.61792e-05,1326.25,362.606,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,1250000, PASSED ,0.0134145,18.7451,5.12504,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,1250000, PASSED 
,9.514e-05,2643.02,722.619,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,1250000, PASSED ,9.50073e-05,2646.71,723.629,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,13334, PASSED ,5.67665e-05,47.2522,12.9191,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,13334, PASSED ,1.34163e-05,199.931,54.6624,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,13334, PASSED ,1.34614e-05,199.262,54.4796,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,1667, PASSED ,7.12671e-06,47.0544,12.865,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,1667, PASSED ,1.32164e-05,25.3733,6.93723,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,1667, PASSED ,1.32783e-05,25.255,6.90487,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,213334, PASSED ,0.00130714,32.8315,8.97634,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,213334, PASSED 
,1.91547e-05,2240.46,612.557,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,213334, PASSED ,1.90631e-05,2251.23,615.5,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_ENERGY,Base_Seq,default,26667, PASSED ,0.000110305,48.6333,13.2967,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_CUDA,block_256,26667, PASSED ,1.3704e-05,391.454,107.026,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_ENERGY,RAJA_CUDA,block_256,26667, PASSED ,1.373e-05,390.714,106.824,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_FEMSWEEP,Base_Seq,default,395136, PASSED ,0.10823,0.602929,3.16064,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,395136, PASSED ,0.00141605,46.0821,241.569,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,395136, PASSED ,0.00180592,36.1339,189.419,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,73728, PASSED ,0.0201786,0.5725,3.10205,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,73728, PASSED 
,0.000471381,24.5073,132.791,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,73728, PASSED ,0.000705101,16.3838,88.7746,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,589824, PASSED ,0.165251,0.594489,3.09991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,589824, PASSED ,0.00185304,53.0155,276.445,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,589824, PASSED ,0.00231291,42.4744,221.479,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,144000, PASSED ,0.0400073,0.578163,3.08391,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,144000, PASSED ,0.000676525,34.1906,182.372,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,144000, PASSED ,0.000992328,23.3096,124.333,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,1152000, PASSED ,0.342707,0.566533,2.93255,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,1152000, PASSED 
,0.00332179,58.4488,302.549,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,1152000, PASSED ,0.00397275,48.8716,252.975,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00784217,0.595459,3.31578,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,31104, PASSED ,0.000313963,14.8734,82.8217,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,31104, PASSED ,0.000463523,10.0744,56.0985,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,1533312, PASSED ,0.49756,0.521593,2.69281,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,1533312, PASSED ,0.0041987,61.8105,319.107,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,1533312, PASSED ,0.00494313,52.502,271.05,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,1990656, PASSED ,0.663273,0.509787,2.62611,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,1990656, PASSED 
,0.00513028,65.9083,339.519,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,1990656, PASSED ,0.0061327,55.1352,284.022,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,248832, PASSED ,0.067748,0.599649,3.16604,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,248832, PASSED ,0.000907535,44.7641,236.347,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,248832, PASSED ,0.00131358,30.9269,163.289,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,2530944, PASSED ,0.864216,0.498932,2.56545,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,2530944, PASSED ,0.00649025,66.4358,341.606,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,2530944, PASSED ,0.00751464,57.3794,295.038,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00758414,0.615719,3.4286,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_CUDA,block_128,31104, PASSED 
,0.000311673,14.9827,83.4302,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_128 +Apps_FEMSWEEP,RAJA_CUDA,block_128,31104, PASSED ,0.000464567,10.0517,55.9724,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128 +Apps_INTSC_HEXRECT,Base_Seq,default,1728, PASSED ,0.00152263,0.0515405,4.08557,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,1728, PASSED ,0.000153291,0.511948,40.5816,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,1728, PASSED ,0.00015173,0.517215,40.9991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,1124864, PASSED ,0.937313,0.0527279,4.32034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,1124864, PASSED ,0.00248498,19.8885,1629.6,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,1124864, PASSED ,0.00299439,16.5051,1352.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,140608, PASSED ,0.117048,0.0529853,4.32463,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_INTSC_HEXRECT,Base_CUDA,block_64,140608, PASSED ,0.000390914,15.8649,1294.89,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,140608, PASSED ,0.000447843,13.8482,1130.28,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,1643032, PASSED ,1.37027,0.0526587,4.31662,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,1643032, PASSED ,0.00359784,20.0555,1644.02,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,1643032, PASSED ,0.00434504,16.6066,1361.3,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,17576, PASSED ,0.014675,0.0532582,4.31165,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,17576, PASSED ,0.000161536,4.83834,391.7,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,17576, PASSED ,0.000158077,4.94421,400.271,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,287496, PASSED 
,0.239802,0.0527919,4.31601,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,287496, PASSED ,0.000732505,17.2826,1412.94,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,287496, PASSED ,0.000848664,14.9171,1219.55,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,3241792, PASSED ,2.70382,0.0526191,4.31628,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,3241792, PASSED ,0.0069522,20.4644,1678.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,3241792, PASSED ,0.00840893,16.9192,1387.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,39304, PASSED ,0.0328342,0.0530228,4.30936,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,39304, PASSED ,0.000176631,9.85649,801.073,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,39304, PASSED 
,0.000172284,10.1052,821.286,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,5832, PASSED ,0.00491087,0.0532159,4.27525,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,5832, PASSED ,0.000152725,1.71116,137.471,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,5832, PASSED ,0.000151767,1.72196,138.338,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,551368, PASSED ,0.459521,0.0527725,4.31956,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,551368, PASSED ,0.00128413,18.8845,1545.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,551368, PASSED ,0.00153927,15.7543,1289.52,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,74088, PASSED ,0.0617367,0.0530315,4.32023,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_CUDA,block_64,74088, PASSED ,0.000215796,15.1717,1235.97,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64 
+Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,74088, PASSED ,0.000290519,11.2695,918.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DEA,Base_Seq,default,6213632, PASSED ,0.256293,0.186147,0.16971,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,6213632, PASSED ,0.000265126,179.945,164.056,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,6213632, PASSED ,0.000247383,192.851,175.822,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,6213632, PASSED ,0.000271831,175.507,160.009,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,778240, PASSED ,0.0311109,0.192069,0.175105,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,778240, PASSED ,0.000112598,53.0688,48.3817,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,778240, PASSED 
,7.4883e-05,79.797,72.7492,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,778240, PASSED ,7.934e-05,75.3143,68.6625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,9101312, PASSED ,0.375862,0.185918,0.169502,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,9101312, PASSED ,0.000370367,188.677,172.016,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,9101312, PASSED ,0.000351549,198.776,181.224,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,9101312, PASSED ,0.000386393,180.851,164.882,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,1556480, PASSED ,0.062294,0.191844,0.174902,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,1556480, PASSED ,0.000125894,94.9269,86.5439,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 
+Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,1556480, PASSED ,0.000101402,117.855,107.447,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,1556480, PASSED ,0.000109785,108.856,99.2427,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,18198528, PASSED ,0.752786,0.185614,0.169224,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,18198528, PASSED ,0.000638748,218.752,199.437,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,18198528, PASSED ,0.000621548,224.806,204.956,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,18198528, PASSED ,0.00069257,201.752,183.938,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,196608, PASSED ,0.00797947,0.189198,0.172475,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,196608, PASSED 
,0.000111249,13.5704,12.371,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,196608, PASSED ,7.4416e-05,20.2873,18.4941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,196608, PASSED ,7.8781e-05,19.1632,17.4694,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,24260608, PASSED ,1.00902,0.184607,0.168307,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,24260608, PASSED ,0.000844811,220.49,201.02,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,24260608, PASSED ,0.000828049,224.953,205.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,24260608, PASSED ,0.000923702,201.658,183.852,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,30326784, PASSED ,1.24637,0.186821,0.170325,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,30326784, PASSED ,0.0010481,222.162,202.545,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,30326784, PASSED ,0.00103125,225.791,205.854,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,30326784, PASSED ,0.00115143,202.225,184.368,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,3108864, PASSED ,0.127598,0.187071,0.170552,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,3108864, PASSED ,0.000146586,162.839,148.459,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,3108864, PASSED ,0.000145038,164.577,150.044,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,3108864, PASSED ,0.00015699,152.047,138.621,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,36392960, PASSED 
,1.51075,0.184956,0.168625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,36392960, PASSED ,0.00122022,228.994,208.774,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,36392960, PASSED ,0.00130189,214.629,195.678,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,36392960, PASSED ,0.00134275,208.098,189.723,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,389120, PASSED ,0.0157374,0.189853,0.173081,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,389120, PASSED ,0.000111389,26.8231,24.4534,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,389120, PASSED ,7.4687e-05,40.0042,36.4701,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,389120, PASSED ,7.8428e-05,38.096,34.7305,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 
+Apps_MASS3DPA_ATOMIC,Base_Seq,default,729, PASSED ,1.06151e-05,5.63123,11.2564,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,729, PASSED ,3.7374e-06,15.994,31.9709,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,729, PASSED ,3.75178e-06,15.9327,31.8483,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,531441, PASSED ,0.0118418,4.66743,10.0903,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,531441, PASSED ,6.70852e-05,823.891,1781.14,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,531441, PASSED ,6.71454e-05,823.152,1779.54,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,68921, PASSED ,0.00130854,5.32245,11.4143,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,68921, PASSED ,1.07764e-05,646.287,1386.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,68921, PASSED 
,1.08612e-05,641.236,1375.17,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,753571, PASSED ,0.0150698,5.21751,11.2895,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,753571, PASSED ,9.21952e-05,852.829,1845.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,753571, PASSED ,9.22373e-05,852.44,1844.49,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,9261, PASSED ,0.000161258,5.48866,11.5777,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,9261, PASSED ,4.52344e-06,195.668,412.739,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,9261, PASSED ,4.45998e-06,198.452,418.612,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,132651, PASSED ,0.00246978,5.48991,11.8115,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,132651, PASSED 
,1.7993e-05,753.564,1621.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,132651, PASSED ,1.79145e-05,756.865,1628.39,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1442897, PASSED ,0.0340937,4.43834,9.61689,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,1442897, PASSED ,0.000176986,854.982,1852.55,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,1442897, PASSED ,0.00017712,854.334,1851.15,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,19683, PASSED ,0.000355574,5.42675,11.5357,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,19683, PASSED ,5.63764e-06,342.273,727.574,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,19683, PASSED ,5.67768e-06,339.859,722.443,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,3375, PASSED 
,5.5281e-05,5.57301,11.5841,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,3375, PASSED ,3.91592e-06,78.6741,163.533,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,3375, PASSED ,3.9459e-06,78.0764,162.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,250047, PASSED ,0.00502674,5.13006,11.0648,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,250047, PASSED ,3.26954e-05,788.718,1701.15,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,250047, PASSED ,3.27017e-05,788.566,1700.82,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,35937, PASSED ,0.00065046,5.50448,11.7567,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,35937, PASSED ,7.25788e-06,493.318,1053.65,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,35937, PASSED 
,7.27554e-06,492.121,1051.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_MASSVEC3DPA,Base_Seq,default,5376, PASSED ,1.21374e-05,3.89184,12.7342,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,5376, PASSED ,7.42e-06,6.36613,20.8302,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,5376, PASSED ,4.55534e-06,10.3695,33.9294,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,5376, PASSED ,6.99754e-06,6.75047,22.0878,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,5376, PASSED ,4.31026e-06,10.9591,35.8586,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,5376, PASSED ,7.0531e-06,6.69729,21.9138,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,5437248, PASSED ,0.012802,3.72476,12.2106,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,5437248, PASSED 
,9.14447e-05,521.457,1709.46,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,5437248, PASSED ,6.28716e-05,758.443,2486.35,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,5437248, PASSED ,9.68036e-05,492.59,1614.83,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,5437248, PASSED ,6.36234e-05,749.481,2456.97,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,5437248, PASSED ,9.68645e-05,492.28,1613.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,679680, PASSED ,0.0014736,4.04509,13.2606,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,679680, PASSED ,1.56698e-05,380.403,1247.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,679680, PASSED ,1.04847e-05,568.529,1863.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,679680, PASSED 
,1.57015e-05,379.635,1244.51,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,679680, PASSED ,1.06839e-05,557.927,1828.99,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,679680, PASSED ,1.56841e-05,380.057,1245.9,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,7964736, PASSED ,0.0186475,3.74583,12.2797,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,7964736, PASSED ,0.000130985,533.27,1748.18,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,7964736, PASSED ,8.993e-05,776.721,2546.27,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,7964736, PASSED ,0.000138923,502.798,1648.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,7964736, PASSED ,9.1031e-05,767.326,2515.47,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,7964736, PASSED 
,0.000138969,502.632,1647.75,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,85056, PASSED ,0.000182175,4.09511,13.4231,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,85056, PASSED ,7.74194e-06,96.3617,315.859,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,85056, PASSED ,4.68662e-06,159.182,521.775,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,85056, PASSED ,7.35466e-06,101.436,332.491,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,85056, PASSED ,4.47352e-06,166.765,546.63,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,85056, PASSED ,7.38302e-06,101.046,331.214,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,1359360, PASSED ,0.00287493,4.14675,13.5939,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,1359360, PASSED 
,2.59907e-05,458.687,1503.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,1359360, PASSED ,1.75039e-05,681.084,2232.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,1359360, PASSED ,2.62679e-05,453.847,1487.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,1359360, PASSED ,1.77157e-05,672.94,2206.04,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,1359360, PASSED ,2.62529e-05,454.106,1488.66,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,15929280, PASSED ,0.0378954,3.68644,12.085,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,15929280, PASSED ,0.000255311,547.173,1793.76,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,15929280, PASSED ,0.000175204,797.352,2613.91,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,15929280, PASSED 
,0.00027133,514.867,1687.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,15929280, PASSED ,0.000177142,788.629,2585.31,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,15929280, PASSED ,0.000271551,514.449,1686.48,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,169920, PASSED ,0.000362792,4.1078,13.4656,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,169920, PASSED ,8.33486e-06,178.801,586.117,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,169920, PASSED ,5.33428e-06,279.378,915.812,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,169920, PASSED ,7.9591e-06,187.242,613.788,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,169920, PASSED ,5.10904e-06,291.695,956.187,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,169920, PASSED 
,7.98266e-06,186.69,611.976,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,21312, PASSED ,4.70255e-05,3.97645,13.0295,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,21312, PASSED ,7.41228e-06,25.2277,82.6628,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,21312, PASSED ,4.6058e-06,40.5998,133.032,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,21312, PASSED ,7.1164e-06,26.2766,86.0997,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,21312, PASSED ,4.48188e-06,41.7224,136.71,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,21312, PASSED ,7.14408e-06,26.1748,85.7661,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,2718720, PASSED ,0.00583883,4.08355,13.3868,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,2718720, PASSED 
,4.76641e-05,500.232,1639.87,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,2718720, PASSED ,3.26887e-05,729.4,2391.14,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,2718720, PASSED ,4.8664e-05,489.954,1606.18,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,2718720, PASSED ,3.28996e-05,724.725,2375.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,2718720, PASSED ,4.87601e-05,488.989,1603.02,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,339840, PASSED ,0.000733769,4.06186,13.3154,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,339840, PASSED ,9.79378e-06,304.323,997.613,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,339840, PASSED ,6.92866e-06,430.166,1410.14,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,339840, PASSED 
,9.53338e-06,312.635,1024.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,339840, PASSED ,6.68232e-06,446.023,1462.13,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,339840, PASSED ,9.53448e-06,312.599,1024.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000, PASSED ,2.11589e-06,16.4161,4.25353,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,1000, PASSED ,2.84359e-06,12.2151,3.16501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,1000, PASSED ,2.80486e-06,12.3837,3.20872,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2048383, PASSED ,0.00573203,10.7769,3.21622,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,2048383, PASSED ,7.09007e-05,871.264,260.018,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,2048383, PASSED 
,7.09243e-05,870.975,259.931,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,238328, PASSED ,0.000476735,15.265,4.49925,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,238328, PASSED ,1.00328e-05,725.36,213.795,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,238328, PASSED ,1.00284e-05,725.675,213.888,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2985984, PASSED ,0.00910079,9.88076,2.95292,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,2985984, PASSED ,0.000101832,883.048,263.904,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,2985984, PASSED ,0.000101725,883.978,264.181,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,27000, PASSED ,5.67901e-05,14.9014,4.27892,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,27000, PASSED 
,3.12783e-06,270.556,77.6896,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,27000, PASSED ,3.11661e-06,271.53,77.9693,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,493039, PASSED ,0.000981555,15.2577,4.52073,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,493039, PASSED ,1.79344e-05,835.056,247.421,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,493039, PASSED ,1.79915e-05,832.406,246.636,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,6028568, PASSED ,0.018767,9.65281,2.89109,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,6028568, PASSED ,0.000198514,912.551,273.316,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,6028568, PASSED ,0.000198515,912.545,273.314,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,54872, PASSED 
,0.000118843,14.3179,4.15548,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,54872, PASSED ,3.96236e-06,429.436,124.635,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,54872, PASSED ,3.97114e-06,428.486,124.359,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,5832, PASSED ,1.24572e-05,15.1809,4.21348,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,5832, PASSED ,2.8043e-06,67.436,18.717,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,5832, PASSED ,2.75924e-06,68.5372,19.0226,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000000, PASSED ,0.00202957,14.9065,4.43443,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,1000000, PASSED ,3.38812e-05,892.939,265.634,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,1000000, PASSED 
,3.39284e-05,891.696,265.264,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,117649, PASSED ,0.00026121,13.8423,4.05361,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,117649, PASSED ,5.81927e-06,621.341,181.954,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,117649, PASSED ,5.82147e-06,621.106,181.886,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,512, PASSED ,9.61451e-06,4.748,10.589,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,512, PASSED ,2.71531e-06,16.812,37.4941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,512, PASSED ,2.66465e-06,17.1316,38.2069,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,1442897, PASSED ,0.0116043,4.06895,9.76601,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,1442897, PASSED ,2.48123e-05,1902.98,4567.41,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 
+Apps_VOL3D,RAJA_CUDA,block_256,1442897, PASSED ,2.37548e-05,1987.7,4770.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,166375, PASSED ,0.00135694,4.4135,10.5217,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,166375, PASSED ,5.15502e-06,1161.75,2769.61,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,166375, PASSED ,4.40588e-06,1359.29,3240.53,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,2146689, PASSED ,0.0172879,4.01726,9.64971,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,2146689, PASSED ,3.57233e-05,1944.11,4669.88,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,2146689, PASSED ,3.32067e-05,2091.45,5023.79,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,17576, PASSED ,0.000172093,4.47421,10.5172,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,17576, PASSED ,3.2504e-06,236.888,556.835,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,17576, PASSED 
,2.72221e-06,282.851,664.877,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,343000, PASSED ,0.00264511,4.48746,10.728,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,343000, PASSED ,8.32725e-06,1425.42,3407.7,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,343000, PASSED ,6.09938e-06,1946.07,4652.4,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,4410944, PASSED ,0.0361167,3.88335,9.33941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,4410944, PASSED ,6.88587e-05,2036.84,4898.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,4410944, PASSED ,6.33905e-05,2212.54,5321.13,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,35937, PASSED ,0.000328079,4.4415,10.4987,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,35937, PASSED ,3.32316e-06,438.487,1036.49,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,35937, PASSED 
,3.19033e-06,456.743,1079.64,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,3375, PASSED ,4.10173e-05,4.63757,10.7024,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,3375, PASSED ,2.86984e-06,66.2827,152.965,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,3375, PASSED ,2.75449e-06,69.0584,159.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,704969, PASSED ,0.00540288,4.37656,10.486,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,704969, PASSED ,1.14911e-05,2057.77,4930.32,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,704969, PASSED ,9.98778e-06,2367.49,5672.4,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_VOL3D,Base_Seq,default,79507, PASSED ,0.000689456,4.36589,10.3709,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_CUDA,block_256,79507, PASSED ,3.75658e-06,801.284,1903.39,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_VOL3D,RAJA_CUDA,block_256,79507, PASSED 
,3.56829e-06,843.566,2003.83,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_DIFFUSION3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_DIFFUSION3DPA_bandwidth.png new file mode 100644 index 0000000..9b87854 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_DIFFUSION3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_DIFFUSION3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_DIFFUSION3DPA_flops.png new file mode 100644 index 0000000..7c99724 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_DIFFUSION3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_EDGE3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_EDGE3D_bandwidth.png new file mode 100644 index 0000000..2ba0b9f Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_EDGE3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_EDGE3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_EDGE3D_flops.png new file mode 100644 index 0000000..bf065ae Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_EDGE3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_ENERGY_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_ENERGY_bandwidth.png new file mode 100644 index 0000000..b72238a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_ENERGY_bandwidth.png differ diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_ENERGY_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_ENERGY_flops.png new file mode 100644 index 0000000..cdf3e27 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_ENERGY_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_FEMSWEEP_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_FEMSWEEP_bandwidth.png new file mode 100644 index 0000000..f790e14 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_FEMSWEEP_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_FEMSWEEP_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_FEMSWEEP_flops.png new file mode 100644 index 0000000..3745c84 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_FEMSWEEP_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_INTSC_HEXRECT_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_INTSC_HEXRECT_bandwidth.png new file mode 100644 index 0000000..0015928 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_INTSC_HEXRECT_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_INTSC_HEXRECT_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_INTSC_HEXRECT_flops.png new file mode 100644 index 0000000..ee594a8 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_INTSC_HEXRECT_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DEA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DEA_bandwidth.png 
new file mode 100644 index 0000000..2ac4f31 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DEA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DEA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DEA_flops.png new file mode 100644 index 0000000..94ce57c Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DEA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png new file mode 100644 index 0000000..34aca57 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DPA_ATOMIC_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DPA_ATOMIC_flops.png new file mode 100644 index 0000000..512929c Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASS3DPA_ATOMIC_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASSVEC3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASSVEC3DPA_bandwidth.png new file mode 100644 index 0000000..41270ff Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASSVEC3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASSVEC3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASSVEC3DPA_flops.png new file mode 100644 index 0000000..2e8b786 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_MASSVEC3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png new file mode 100644 index 0000000..9118d47 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_NODAL_ACCUMULATION_3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_NODAL_ACCUMULATION_3D_flops.png new file mode 100644 index 0000000..1e5984a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_NODAL_ACCUMULATION_3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_VOL3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_VOL3D_bandwidth.png new file mode 100644 index 0000000..69bd3fd Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_VOL3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_VOL3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_VOL3D_flops.png new file mode 100644 index 0000000..f8fe1d6 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/figures/Apps_VOL3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/output_with_variant_tuning.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/output_with_variant_tuning.csv new file mode 100644 index 0000000..eb8f9b3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/output_with_variant_tuning.csv @@ -0,0 +1,375 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean 
time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning,Smoothed Mean flops (gigaFLOP per sec.),Smoothed Bandwidth (GiB per sec.) +Apps_DIFFUSION3DPA,Base_Seq,default,405, PASSED ,5.93228e-06,8.79032,13.1459,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,13.6146,9.0806 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,405, PASSED ,4.31058e-06,12.0974,18.0915,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64,69.2993,46.2209 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,405, PASSED ,4.04854e-06,12.8804,19.2625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,73.989,49.3488 +Apps_DIFFUSION3DPA,Base_Seq,default,394524, PASSED ,0.00982831,5.15081,7.72949,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,7.72949,5.15081 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,394524, PASSED ,3.11863e-05,1623.27,2435.93,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2495.05,1662.67 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,394524, PASSED ,3.03064e-05,1670.4,2506.66,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2506.66,1670.4 +Apps_DIFFUSION3DPA,Base_Seq,default,49329, PASSED ,0.00080511,7.8621,11.7979,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,12.139,8.08964 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,49329, PASSED 
,6.51824e-06,971.099,1457.23,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1457.23,971.099 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,49329, PASSED ,5.98208e-06,1058.14,1587.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1587.84,1058.14 +Apps_DIFFUSION3DPA,Base_Seq,default,577935, PASSED ,0.0146893,5.04846,7.57591,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,7.6527,5.099635 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,577935, PASSED ,4.30098e-05,1724.22,2587.42,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2541.235,1693.4450000000002 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,577935, PASSED ,4.18154e-05,1773.47,2661.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2583.995,1721.935 +Apps_DIFFUSION3DPA,Base_Seq,default,6183, PASSED ,8.62026e-05,9.20569,13.8113,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,13.6066,9.06822 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,6183, PASSED ,4.38042e-06,181.159,271.794,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64,271.794,181.159 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,6183, PASSED ,4.19152e-06,189.324,284.043,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,284.043,189.324 +Apps_DIFFUSION3DPA,Base_Seq,default,98631, PASSED 
,0.00151838,8.33524,12.508,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,11.7979,7.8621 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,98631, PASSED ,8.92974e-06,1417.29,2126.82,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2126.82,1417.29 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,98631, PASSED ,9.22594e-06,1371.79,2058.54,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2058.54,1371.79 +Apps_DIFFUSION3DPA,Base_Seq,default,1155843, PASSED ,0.0306708,4.83564,7.25656,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,7.57591,5.04846 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,1155843, PASSED ,7.85685e-05,1887.69,2832.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2587.42,1724.22 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,1155843, PASSED ,7.74947e-05,1913.84,2871.99,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2661.33,1773.47 +Apps_DIFFUSION3DPA,Base_Seq,default,12339, PASSED ,0.000174617,9.06822,13.6066,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,13.6066,9.06822 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,12339, PASSED ,4.61736e-06,342.937,514.567,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64,514.567,342.937 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,12339, PASSED 
,4.44548e-06,356.197,534.463,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,534.463,356.197 +Apps_DIFFUSION3DPA,Base_Seq,default,1566, PASSED ,2.21484e-05,9.0806,13.6146,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,13.6106,9.07441 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,1566, PASSED ,4.3513e-06,46.2209,69.2993,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64,170.54665,113.68995 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,1566, PASSED ,4.0755e-06,49.3488,73.989,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,179.01600000000002,119.3364 +Apps_DIFFUSION3DPA,Base_Seq,default,197262, PASSED ,0.00351817,7.19463,10.7965,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,10.7965,7.19463 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,197262, PASSED ,1.52237e-05,1662.67,2495.05,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2435.93,1623.27 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,197262, PASSED ,1.52928e-05,1655.15,2483.77,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2483.77,1655.15 +Apps_DIFFUSION3DPA,Base_Seq,default,24678, PASSED ,0.000391458,8.08964,12.139,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,12.508,8.33524 +Apps_DIFFUSION3DPA,Base_CUDA,block_64,24678, PASSED 
,5.05298e-06,626.709,940.413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64,940.413,626.709 +Apps_DIFFUSION3DPA,RAJA_CUDA,block_64,24678, PASSED ,4.82312e-06,656.577,985.231,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/DIFFUSION3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,985.231,656.577 +Apps_EDGE3D,Base_Seq,default,512, PASSED ,0.00199132,0.0229243,9.38302,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,9.38853,0.0221669 +Apps_EDGE3D,Base_CUDA,block_256,512, PASSED ,0.000231602,0.197104,80.6755,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,339.719,0.802097 +Apps_EDGE3D,RAJA_CUDA,block_256,512, PASSED ,0.00023254,0.196309,80.35,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,339.496,0.801571 +Apps_EDGE3D,Base_Seq,default,1442897, PASSED ,2.23003,0.0211735,9.32671,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,9.35308,0.0212504 +Apps_EDGE3D,Base_CUDA,block_256,1442897, PASSED ,0.0129098,3.65749,1611.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1611.09,3.65749 +Apps_EDGE3D,RAJA_CUDA,block_256,1442897, PASSED ,0.0129501,3.64609,1606.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1606.07,3.64609 +Apps_EDGE3D,Base_Seq,default,166375, PASSED 
,0.280277,0.0213676,9.34894,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,9.35308,0.0213676 +Apps_EDGE3D,Base_CUDA,block_256,166375, PASSED ,0.00174224,3.43745,1503.98,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1503.98,3.43745 +Apps_EDGE3D,RAJA_CUDA,block_256,166375, PASSED ,0.00174605,3.42995,1500.7,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1500.7,3.42995 +Apps_EDGE3D,Base_Seq,default,2146689, PASSED ,3.26817,0.0212504,9.36815,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,9.34943,0.02121195 +Apps_EDGE3D,Base_CUDA,block_256,2146689, PASSED ,0.0189157,3.67155,1618.58,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1614.835,3.66452 +Apps_EDGE3D,RAJA_CUDA,block_256,2146689, PASSED ,0.0189716,3.66075,1613.82,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1609.945,3.652475 +Apps_EDGE3D,Base_Seq,default,17576, PASSED ,0.0353438,0.0217854,9.39835,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,9.38302,0.0217854 +Apps_EDGE3D,Base_CUDA,block_256,17576, PASSED ,0.000291234,2.64385,1140.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1140.57,2.64385 +Apps_EDGE3D,RAJA_CUDA,block_256,17576, PASSED 
,0.000290364,2.65177,1143.99,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1143.99,2.65177 +Apps_EDGE3D,Base_Seq,default,343000, PASSED ,0.556814,0.0213174,9.35308,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,9.35308,0.0213174 +Apps_EDGE3D,Base_CUDA,block_256,343000, PASSED ,0.00332675,3.568,1565.47,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1565.47,3.568 +Apps_EDGE3D,RAJA_CUDA,block_256,343000, PASSED ,0.0033393,3.55459,1559.59,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1559.59,3.55459 +Apps_EDGE3D,Base_Seq,default,4410944, PASSED ,6.63446,0.0211402,9.33091,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,9.33091,0.0211735 +Apps_EDGE3D,Base_CUDA,block_256,4410944, PASSED ,0.0381953,3.67202,1620.76,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1618.58,3.67155 +Apps_EDGE3D,RAJA_CUDA,block_256,4410944, PASSED ,0.0383327,3.65886,1614.96,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1613.82,3.65886 +Apps_EDGE3D,Base_Seq,default,35937, PASSED ,0.0676711,0.021533,9.34143,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,9.35348,0.021533 +Apps_EDGE3D,Base_CUDA,block_256,35937, PASSED 
,0.000532102,2.7385,1188.01,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1188.01,2.7385 +Apps_EDGE3D,RAJA_CUDA,block_256,35937, PASSED ,0.000531721,2.74046,1188.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1188.86,2.74046 +Apps_EDGE3D,Base_Seq,default,3375, PASSED ,0.0085813,0.0221669,9.38853,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,9.385774999999999,0.02197615 +Apps_EDGE3D,Base_CUDA,block_256,3375, PASSED ,0.000237154,0.802097,339.719,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,740.1445,1.7229735 +Apps_EDGE3D,RAJA_CUDA,block_256,3375, PASSED ,0.00023731,0.801571,339.496,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,741.7429999999999,1.7266705 +Apps_EDGE3D,Base_Seq,default,704969, PASSED ,1.10992,0.0213042,9.36795,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,9.35308,0.0213042 +Apps_EDGE3D,Base_CUDA,block_256,704969, PASSED ,0.00652701,3.6228,1593.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1593.03,3.6228 +Apps_EDGE3D,RAJA_CUDA,block_256,704969, PASSED ,0.00655342,3.60819,1586.61,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1586.61,3.60819 +Apps_EDGE3D,Base_Seq,default,79507, PASSED 
,0.140297,0.021455,9.35348,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,9.35308,0.021455 +Apps_EDGE3D,Base_CUDA,block_256,79507, PASSED ,0.000909437,3.30983,1442.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1442.95,3.30983 +Apps_EDGE3D,RAJA_CUDA,block_256,79507, PASSED ,0.000913869,3.29378,1435.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/EDGE3D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1435.95,3.29378 +Apps_ENERGY,Base_Seq,default,417, PASSED ,1.71913e-06,48.7956,13.341,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,12.8693,47.0702 +Apps_ENERGY,Base_CUDA,block_256,417, PASSED ,1.2912e-05,6.49675,1.77625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,6.93723,25.3733 +Apps_ENERGY,RAJA_CUDA,block_256,417, PASSED ,1.29043e-05,6.50062,1.77731,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,6.90487,25.255 +Apps_ENERGY,Base_Seq,default,426667, PASSED ,0.00279157,30.7464,8.40628,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,8.40628,30.7464 +Apps_ENERGY,Base_CUDA,block_256,426667, PASSED ,2.7637e-05,3105.64,849.103,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,722.619,2643.02 +Apps_ENERGY,RAJA_CUDA,block_256,426667, PASSED 
,2.77141e-05,3097.01,846.742,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,723.629,2646.71 +Apps_ENERGY,Base_Seq,default,53334, PASSED ,0.000289255,37.0917,10.1411,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.1411,37.0917 +Apps_ENERGY,Base_CUDA,block_256,53334, PASSED ,1.47558e-05,727.103,198.795,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,198.795,727.103 +Apps_ENERGY,RAJA_CUDA,block_256,53334, PASSED ,1.48072e-05,724.576,198.104,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,198.104,724.576 +Apps_ENERGY,Base_Seq,default,625000, PASSED ,0.00478401,26.281,7.18539,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,7.795835,28.5137 +Apps_ENERGY,Base_CUDA,block_256,625000, PASSED ,4.27187e-05,2943.18,804.683,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,763.6510000000001,2793.1 +Apps_ENERGY,RAJA_CUDA,block_256,625000, PASSED ,4.28399e-05,2934.85,802.407,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,763.018,2790.7799999999997 +Apps_ENERGY,Base_Seq,default,6667, PASSED ,2.8493e-05,47.0702,12.8693,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,12.9191,47.2522 +Apps_ENERGY,Base_CUDA,block_256,6667, PASSED 
,1.3375e-05,100.275,27.4158,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,27.4158,100.275 +Apps_ENERGY,RAJA_CUDA,block_256,6667, PASSED ,1.3445e-05,99.7526,27.273,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,27.273,99.7526 +Apps_ENERGY,Base_Seq,default,106667, PASSED ,0.000636015,33.7378,9.22412,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,9.22412,33.7378 +Apps_ENERGY,Base_CUDA,block_256,106667, PASSED ,1.6189e-05,1325.45,362.386,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,362.386,1325.45 +Apps_ENERGY,RAJA_CUDA,block_256,106667, PASSED ,1.61792e-05,1326.25,362.606,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,362.606,1326.25 +Apps_ENERGY,Base_Seq,default,1250000, PASSED ,0.0134145,18.7451,5.12504,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,7.18539,26.281 +Apps_ENERGY,Base_CUDA,block_256,1250000, PASSED ,9.514e-05,2643.02,722.619,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,804.683,2943.18 +Apps_ENERGY,RAJA_CUDA,block_256,1250000, PASSED ,9.50073e-05,2646.71,723.629,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,802.407,2934.85 +Apps_ENERGY,Base_Seq,default,13334, PASSED 
,5.67665e-05,47.2522,12.9191,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,12.8693,47.0702 +Apps_ENERGY,Base_CUDA,block_256,13334, PASSED ,1.34163e-05,199.931,54.6624,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,54.6624,199.931 +Apps_ENERGY,RAJA_CUDA,block_256,13334, PASSED ,1.34614e-05,199.262,54.4796,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,54.4796,199.262 +Apps_ENERGY,Base_Seq,default,1667, PASSED ,7.12671e-06,47.0544,12.865,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,12.894200000000001,47.1612 +Apps_ENERGY,Base_CUDA,block_256,1667, PASSED ,1.32164e-05,25.3733,6.93723,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,17.176515000000002,62.82415 +Apps_ENERGY,RAJA_CUDA,block_256,1667, PASSED ,1.32783e-05,25.255,6.90487,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,17.088935,62.5038 +Apps_ENERGY,Base_Seq,default,213334, PASSED ,0.00130714,32.8315,8.97634,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,8.97634,32.8315 +Apps_ENERGY,Base_CUDA,block_256,213334, PASSED ,1.91547e-05,2240.46,612.557,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,612.557,2240.46 +Apps_ENERGY,RAJA_CUDA,block_256,213334, PASSED 
,1.90631e-05,2251.23,615.5,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,615.5,2251.23 +Apps_ENERGY,Base_Seq,default,26667, PASSED ,0.000110305,48.6333,13.2967,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,12.8693,47.0702 +Apps_ENERGY,Base_CUDA,block_256,26667, PASSED ,1.3704e-05,391.454,107.026,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,107.026,391.454 +Apps_ENERGY,RAJA_CUDA,block_256,26667, PASSED ,1.373e-05,390.714,106.824,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/ENERGY_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,106.824,390.714 +Apps_FEMSWEEP,Base_Seq,default,395136, PASSED ,0.10823,0.602929,3.16064,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,3.09991,0.594489 +Apps_FEMSWEEP,Base_CUDA,block_128,395136, PASSED ,0.00141605,46.0821,241.569,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_128,241.569,46.0821 +Apps_FEMSWEEP,RAJA_CUDA,block_128,395136, PASSED ,0.00180592,36.1339,189.419,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,189.419,36.1339 +Apps_FEMSWEEP,Base_Seq,default,73728, PASSED ,0.0201786,0.5725,3.10205,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,3.16604,0.595459 +Apps_FEMSWEEP,Base_CUDA,block_128,73728, PASSED 
,0.000471381,24.5073,132.791,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_128,132.791,24.5073 +Apps_FEMSWEEP,RAJA_CUDA,block_128,73728, PASSED ,0.000705101,16.3838,88.7746,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,88.7746,16.3838 +Apps_FEMSWEEP,Base_Seq,default,589824, PASSED ,0.165251,0.594489,3.09991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,3.09991,0.594489 +Apps_FEMSWEEP,Base_CUDA,block_128,589824, PASSED ,0.00185304,53.0155,276.445,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_128,276.445,53.0155 +Apps_FEMSWEEP,RAJA_CUDA,block_128,589824, PASSED ,0.00231291,42.4744,221.479,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,221.479,42.4744 +Apps_FEMSWEEP,Base_Seq,default,144000, PASSED ,0.0400073,0.578163,3.08391,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,3.16064,0.599649 +Apps_FEMSWEEP,Base_CUDA,block_128,144000, PASSED ,0.000676525,34.1906,182.372,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_128,182.372,34.1906 +Apps_FEMSWEEP,RAJA_CUDA,block_128,144000, PASSED ,0.000992328,23.3096,124.333,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,124.333,23.3096 +Apps_FEMSWEEP,Base_Seq,default,1152000, PASSED 
,0.342707,0.566533,2.93255,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,2.93255,0.566533 +Apps_FEMSWEEP,Base_CUDA,block_128,1152000, PASSED ,0.00332179,58.4488,302.549,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_128,302.549,58.4488 +Apps_FEMSWEEP,RAJA_CUDA,block_128,1152000, PASSED ,0.00397275,48.8716,252.975,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,252.975,48.8716 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00784217,0.595459,3.31578,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,3.208915,0.586811 +Apps_FEMSWEEP,Base_CUDA,block_128,31104, PASSED ,0.000313963,14.8734,82.8217,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_128,108.1106,19.745 +Apps_FEMSWEEP,RAJA_CUDA,block_128,31104, PASSED ,0.000463523,10.0744,56.0985,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,72.43655000000001,13.2291 +Apps_FEMSWEEP,Base_Seq,default,1533312, PASSED ,0.49756,0.521593,2.69281,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,2.69281,0.521593 +Apps_FEMSWEEP,Base_CUDA,block_128,1533312, PASSED ,0.0041987,61.8105,319.107,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-block_128,319.107,61.8105 +Apps_FEMSWEEP,RAJA_CUDA,block_128,1533312, PASSED 
,0.00494313,52.502,271.05,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,271.05,52.502 +Apps_FEMSWEEP,Base_Seq,default,1990656, PASSED ,0.663273,0.509787,2.62611,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,2.65946,0.51569 +Apps_FEMSWEEP,Base_CUDA,block_128,1990656, PASSED ,0.00513028,65.9083,339.519,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-block_128,329.313,63.859399999999994 +Apps_FEMSWEEP,RAJA_CUDA,block_128,1990656, PASSED ,0.0061327,55.1352,284.022,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,277.536,53.8186 +Apps_FEMSWEEP,Base_Seq,default,248832, PASSED ,0.067748,0.599649,3.16604,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,3.10205,0.594489 +Apps_FEMSWEEP,Base_CUDA,block_128,248832, PASSED ,0.000907535,44.7641,236.347,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_128,236.347,44.7641 +Apps_FEMSWEEP,RAJA_CUDA,block_128,248832, PASSED ,0.00131358,30.9269,163.289,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,163.289,30.9269 +Apps_FEMSWEEP,Base_Seq,default,2530944, PASSED ,0.864216,0.498932,2.56545,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,2.62611,0.509787 +Apps_FEMSWEEP,Base_CUDA,block_128,2530944, PASSED 
,0.00649025,66.4358,341.606,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-block_128,339.519,65.9083 +Apps_FEMSWEEP,RAJA_CUDA,block_128,2530944, PASSED ,0.00751464,57.3794,295.038,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,284.022,55.1352 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00758414,0.615719,3.4286,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,3.208915,0.586811 +Apps_FEMSWEEP,Base_CUDA,block_128,31104, PASSED ,0.000311673,14.9827,83.4302,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_128,108.1106,19.745 +Apps_FEMSWEEP,RAJA_CUDA,block_128,31104, PASSED ,0.000464567,10.0517,55.9724,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/FEMSWEEP_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_128,72.43655000000001,13.2291 +Apps_INTSC_HEXRECT,Base_Seq,default,1728, PASSED ,0.00152263,0.0515405,4.08557,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.27525,0.0532159 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,1728, PASSED ,0.000153291,0.511948,40.5816,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64,137.471,1.71116 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,1728, PASSED ,0.00015173,0.517215,40.9991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,138.338,1.72196 +Apps_INTSC_HEXRECT,Base_Seq,default,1124864, PASSED 
,0.937313,0.0527279,4.32034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.31662,0.0527279 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,1124864, PASSED ,0.00248498,19.8885,1629.6,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1629.6,19.8885 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,1124864, PASSED ,0.00299439,16.5051,1352.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1352.37,16.5051 +Apps_INTSC_HEXRECT,Base_Seq,default,140608, PASSED ,0.117048,0.0529853,4.32463,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.31956,0.0529853 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,140608, PASSED ,0.000390914,15.8649,1294.89,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1294.89,15.8649 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,140608, PASSED ,0.000447843,13.8482,1130.28,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1130.28,13.8482 +Apps_INTSC_HEXRECT,Base_Seq,default,1643032, PASSED ,1.37027,0.0526587,4.31662,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,4.31809,0.0526933 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,1643032, PASSED ,0.00359784,20.0555,1644.02,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1636.81,19.972 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,1643032, PASSED 
,0.00434504,16.6066,1361.3,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1356.835,16.55585 +Apps_INTSC_HEXRECT,Base_Seq,default,17576, PASSED ,0.014675,0.0532582,4.31165,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.30936,0.0530315 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,17576, PASSED ,0.000161536,4.83834,391.7,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64,391.7,4.83834 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,17576, PASSED ,0.000158077,4.94421,400.271,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,400.271,4.94421 +Apps_INTSC_HEXRECT,Base_Seq,default,287496, PASSED ,0.239802,0.0527919,4.31601,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.32023,0.0527919 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,287496, PASSED ,0.000732505,17.2826,1412.94,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1412.94,17.2826 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,287496, PASSED ,0.000848664,14.9171,1219.55,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1219.55,14.9171 +Apps_INTSC_HEXRECT,Base_Seq,default,3241792, PASSED ,2.70382,0.0526191,4.31628,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,4.31662,0.0526587 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,3241792, PASSED 
,0.0069522,20.4644,1678.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1644.02,20.0555 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,3241792, PASSED ,0.00840893,16.9192,1387.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1361.3,16.6066 +Apps_INTSC_HEXRECT,Base_Seq,default,39304, PASSED ,0.0328342,0.0530228,4.30936,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.31165,0.0530315 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,39304, PASSED ,0.000176631,9.85649,801.073,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64,801.073,9.85649 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,39304, PASSED ,0.000172284,10.1052,821.286,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,821.286,10.1052 +Apps_INTSC_HEXRECT,Base_Seq,default,5832, PASSED ,0.00491087,0.0532159,4.27525,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.292305,0.053119349999999996 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,5832, PASSED ,0.000152725,1.71116,137.471,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64,264.5855,3.27475 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,5832, PASSED ,0.000151767,1.72196,138.338,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,269.3045,3.333085 +Apps_INTSC_HEXRECT,Base_Seq,default,551368, PASSED 
,0.459521,0.0527725,4.31956,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.31956,0.0527725 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,551368, PASSED ,0.00128413,18.8845,1545.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1545.74,18.8845 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,551368, PASSED ,0.00153927,15.7543,1289.52,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1289.52,15.7543 +Apps_INTSC_HEXRECT,Base_Seq,default,74088, PASSED ,0.0617367,0.0530315,4.32023,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.31601,0.0530228 +Apps_INTSC_HEXRECT,Base_CUDA,block_64,74088, PASSED ,0.000215796,15.1717,1235.97,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1235.97,15.1717 +Apps_INTSC_HEXRECT,RAJA_CUDA,block_64,74088, PASSED ,0.000290519,11.2695,918.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/INTSC_HEXRECT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,918.07,11.2695 +Apps_MASS3DEA,Base_Seq,default,6213632, PASSED ,0.256293,0.186147,0.16971,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.16971,0.186147 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,6213632, PASSED ,0.000265126,179.945,164.056,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,164.056,179.945 
+Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,6213632, PASSED ,0.000247383,192.851,175.822,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,175.822,192.851 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,6213632, PASSED ,0.000271831,175.507,160.009,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,160.009,175.507 +Apps_MASS3DEA,Base_Seq,default,778240, PASSED ,0.0311109,0.192069,0.175105,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.173081,0.189853 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,778240, PASSED ,0.000112598,53.0688,48.3817,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,48.3817,53.0688 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,778240, PASSED ,7.4883e-05,79.797,72.7492,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,72.7492,79.797 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,778240, PASSED ,7.934e-05,75.3143,68.6625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,68.6625,75.3143 +Apps_MASS3DEA,Base_Seq,default,9101312, PASSED ,0.375862,0.185918,0.169502,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.169502,0.185918 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,9101312, PASSED 
,0.000370367,188.677,172.016,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,172.016,188.677 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,9101312, PASSED ,0.000351549,198.776,181.224,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,181.224,198.776 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,9101312, PASSED ,0.000386393,180.851,164.882,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,164.882,180.851 +Apps_MASS3DEA,Base_Seq,default,1556480, PASSED ,0.062294,0.191844,0.174902,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.173081,0.189853 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,1556480, PASSED ,0.000125894,94.9269,86.5439,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,86.5439,94.9269 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,1556480, PASSED ,0.000101402,117.855,107.447,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,107.447,117.855 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,1556480, PASSED ,0.000109785,108.856,99.2427,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,99.2427,108.856 +Apps_MASS3DEA,Base_Seq,default,18198528, PASSED 
,0.752786,0.185614,0.169224,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.169502,0.185918 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,18198528, PASSED ,0.000638748,218.752,199.437,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,199.437,218.752 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,18198528, PASSED ,0.000621548,224.806,204.956,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,204.956,224.806 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,18198528, PASSED ,0.00069257,201.752,183.938,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,183.852,201.658 +Apps_MASS3DEA,Base_Seq,default,196608, PASSED ,0.00797947,0.189198,0.172475,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.173081,0.189853 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,196608, PASSED ,0.000111249,13.5704,12.371,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,24.4534,26.8231 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,196608, PASSED ,7.4416e-05,20.2873,18.4941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,36.4701,40.0042 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,196608, PASSED 
,7.8781e-05,19.1632,17.4694,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,34.7305,38.096 +Apps_MASS3DEA,Base_Seq,default,24260608, PASSED ,1.00902,0.184607,0.168307,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.169224,0.185614 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,24260608, PASSED ,0.000844811,220.49,201.02,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,201.02,220.49 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,24260608, PASSED ,0.000828049,224.953,205.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,204.956,224.806 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,24260608, PASSED ,0.000923702,201.658,183.852,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,183.938,201.752 +Apps_MASS3DEA,Base_Seq,default,30326784, PASSED ,1.24637,0.186821,0.170325,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,0.1689245,0.185285 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,30326784, PASSED ,0.0010481,222.162,202.545,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,201.7825,221.32600000000002 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,30326784, PASSED 
,0.00103125,225.791,205.854,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,205.023,224.8795 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,30326784, PASSED ,0.00115143,202.225,184.368,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,184.153,201.9885 +Apps_MASS3DEA,Base_Seq,default,3108864, PASSED ,0.127598,0.187071,0.170552,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.170552,0.187071 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,3108864, PASSED ,0.000146586,162.839,148.459,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,148.459,162.839 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,3108864, PASSED ,0.000145038,164.577,150.044,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,150.044,164.577 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,3108864, PASSED ,0.00015699,152.047,138.621,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,138.621,152.047 +Apps_MASS3DEA,Base_Seq,default,36392960, PASSED ,1.51075,0.184956,0.168625,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,0.168625,0.184956 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,36392960, PASSED 
,0.00122022,228.994,208.774,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,202.545,222.162 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,36392960, PASSED ,0.00130189,214.629,195.678,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,205.09,224.953 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,36392960, PASSED ,0.00134275,208.098,189.723,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,184.368,202.225 +Apps_MASS3DEA,Base_Seq,default,389120, PASSED ,0.0157374,0.189853,0.173081,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.17399150000000002,0.19084849999999998 +Apps_MASS3DEA,Base_CUDA,compile_time_block_stride_loop_64,389120, PASSED ,0.000111389,26.8231,24.4534,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-compile_time_block_stride_loop_64,36.41755,39.94595 +Apps_MASS3DEA,RAJA_CUDA,compile_time_block_stride_loop_64,389120, PASSED ,7.4687e-05,40.0042,36.4701,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-compile_time_block_stride_loop_64,54.60965,59.9006 +Apps_MASS3DEA,RAJA_CUDA,cached_block_stride_loop_64,389120, PASSED ,7.8428e-05,38.096,34.7305,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DEA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,51.6965,56.70515 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,729, PASSED 
,1.06151e-05,5.63123,11.2564,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,11.5777,5.57301 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,729, PASSED ,3.7374e-06,15.994,31.9709,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64,163.533,78.6741 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,729, PASSED ,3.75178e-06,15.9327,31.8483,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,162.29,78.0764 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,531441, PASSED ,0.0118418,4.66743,10.0903,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,11.0648,5.13006 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,531441, PASSED ,6.70852e-05,823.891,1781.14,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1781.14,823.891 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,531441, PASSED ,6.71454e-05,823.152,1779.54,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1779.54,823.152 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,68921, PASSED ,0.00130854,5.32245,11.4143,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,11.5357,5.42675 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,68921, PASSED ,1.07764e-05,646.287,1386.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1386.0,646.287 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,68921, PASSED 
,1.08612e-05,641.236,1375.17,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1375.17,641.236 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,753571, PASSED ,0.0150698,5.21751,11.2895,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,10.577549999999999,4.898745 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,753571, PASSED ,9.21952e-05,852.829,1845.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1813.2350000000001,838.3599999999999 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,753571, PASSED ,9.22373e-05,852.44,1844.49,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1812.0149999999999,837.796 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,9261, PASSED ,0.000161258,5.48866,11.5777,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,11.5777,5.50448 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,9261, PASSED ,4.52344e-06,195.668,412.739,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64,412.739,195.668 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,9261, PASSED ,4.45998e-06,198.452,418.612,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,418.612,198.452 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,132651, PASSED ,0.00246978,5.48991,11.8115,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,11.4143,5.32245 
+Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,132651, PASSED ,1.7993e-05,753.564,1621.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1621.29,753.564 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,132651, PASSED ,1.79145e-05,756.865,1628.39,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1628.39,756.865 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1442897, PASSED ,0.0340937,4.43834,9.61689,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,10.0903,4.66743 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,1442897, PASSED ,0.000176986,854.982,1852.55,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1845.33,852.829 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,1442897, PASSED ,0.00017712,854.334,1851.15,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1844.49,852.44 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,19683, PASSED ,0.000355574,5.42675,11.5357,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,11.5777,5.48866 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,19683, PASSED ,5.63764e-06,342.273,727.574,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64,727.574,342.273 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,19683, PASSED ,5.67768e-06,339.859,722.443,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,722.443,339.859 
+Apps_MASS3DPA_ATOMIC,Base_Seq,default,3375, PASSED ,5.5281e-05,5.57301,11.5841,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,11.5567,5.530835 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,3375, PASSED ,3.91592e-06,78.6741,163.533,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64,288.13599999999997,137.17105 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,3375, PASSED ,3.9459e-06,78.0764,162.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,290.451,138.26420000000002 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,250047, PASSED ,0.00502674,5.13006,11.0648,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,11.2895,5.21751 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,250047, PASSED ,3.26954e-05,788.718,1701.15,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1701.15,788.718 +Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,250047, PASSED ,3.27017e-05,788.566,1700.82,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1700.82,788.566 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,35937, PASSED ,0.00065046,5.50448,11.7567,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,11.5777,5.48866 +Apps_MASS3DPA_ATOMIC,Base_CUDA,block_64,35937, PASSED ,7.25788e-06,493.318,1053.65,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1053.65,493.318 
+Apps_MASS3DPA_ATOMIC,RAJA_CUDA,block_64,35937, PASSED ,7.27554e-06,492.121,1051.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1051.09,492.121 +Apps_MASSVEC3DPA,Base_Seq,default,5376, PASSED ,1.21374e-05,3.89184,12.7342,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,13.0295,3.97645 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,5376, PASSED ,7.42e-06,6.36613,20.8302,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,82.6628,25.2277 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,5376, PASSED ,4.55534e-06,10.3695,33.9294,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,133.032,40.5998 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,5376, PASSED ,6.99754e-06,6.75047,22.0878,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,86.0997,26.2766 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,5376, PASSED ,4.31026e-06,10.9591,35.8586,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,136.71,41.7224 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,5376, PASSED ,7.0531e-06,6.69729,21.9138,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,85.7661,26.1748 +Apps_MASSVEC3DPA,Base_Seq,default,5437248, PASSED 
,0.012802,3.72476,12.2106,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,12.2797,3.74583 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,5437248, PASSED ,9.14447e-05,521.457,1709.46,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,1709.46,521.457 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,5437248, PASSED ,6.28716e-05,758.443,2486.35,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,2486.35,758.443 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,5437248, PASSED ,9.68036e-05,492.59,1614.83,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1614.83,492.59 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,5437248, PASSED ,6.36234e-05,749.481,2456.97,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,2456.97,749.481 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,5437248, PASSED ,9.68645e-05,492.28,1613.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1613.81,492.28 +Apps_MASSVEC3DPA,Base_Seq,default,679680, PASSED ,0.0014736,4.04509,13.2606,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,13.3868,4.08355 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,679680, PASSED 
,1.56698e-05,380.403,1247.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,1247.03,380.403 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,679680, PASSED ,1.04847e-05,568.529,1863.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,1863.74,568.529 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,679680, PASSED ,1.57015e-05,379.635,1244.51,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1244.51,379.635 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,679680, PASSED ,1.06839e-05,557.927,1828.99,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,1828.99,557.927 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,679680, PASSED ,1.56841e-05,380.057,1245.9,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1245.9,380.057 +Apps_MASSVEC3DPA,Base_Seq,default,7964736, PASSED ,0.0186475,3.74583,12.2797,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,12.245149999999999,3.735295 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,7964736, PASSED ,0.000130985,533.27,1748.18,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,1728.8200000000002,527.3634999999999 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,7964736, PASSED 
,8.993e-05,776.721,2546.27,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,2516.31,767.582 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,7964736, PASSED ,0.000138923,502.798,1648.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1631.56,497.69399999999996 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,7964736, PASSED ,9.1031e-05,767.326,2515.47,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,2486.22,758.4035 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,7964736, PASSED ,0.000138969,502.632,1647.75,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1630.78,497.456 +Apps_MASSVEC3DPA,Base_Seq,default,85056, PASSED ,0.000182175,4.09511,13.4231,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,13.3154,4.06186 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,85056, PASSED ,7.74194e-06,96.3617,315.859,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,315.859,96.3617 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,85056, PASSED ,4.68662e-06,159.182,521.775,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,521.775,159.182 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,85056, PASSED 
,7.35466e-06,101.436,332.491,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,332.491,101.436 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,85056, PASSED ,4.47352e-06,166.765,546.63,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,546.63,166.765 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,85056, PASSED ,7.38302e-06,101.046,331.214,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,331.214,101.046 +Apps_MASSVEC3DPA,Base_Seq,default,1359360, PASSED ,0.00287493,4.14675,13.5939,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,13.3154,4.06186 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,1359360, PASSED ,2.59907e-05,458.687,1503.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,1503.67,458.687 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,1359360, PASSED ,1.75039e-05,681.084,2232.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,2232.74,681.084 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,1359360, PASSED ,2.62679e-05,453.847,1487.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1487.81,453.847 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,1359360, PASSED 
,1.77157e-05,672.94,2206.04,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,2206.04,672.94 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,1359360, PASSED ,2.62529e-05,454.106,1488.66,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1488.66,454.106 +Apps_MASSVEC3DPA,Base_Seq,default,15929280, PASSED ,0.0378954,3.68644,12.085,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,12.2106,3.72476 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,15929280, PASSED ,0.000255311,547.173,1793.76,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,1748.18,533.27 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,15929280, PASSED ,0.000175204,797.352,2613.91,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,2546.27,776.721 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,15929280, PASSED ,0.00027133,514.867,1687.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1648.29,502.798 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,15929280, PASSED ,0.000177142,788.629,2585.31,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,2515.47,767.326 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,15929280, PASSED 
,0.000271551,514.449,1686.48,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1647.75,502.632 +Apps_MASSVEC3DPA,Base_Seq,default,169920, PASSED ,0.000362792,4.1078,13.4656,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,13.3154,4.06186 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,169920, PASSED ,8.33486e-06,178.801,586.117,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,586.117,178.801 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,169920, PASSED ,5.33428e-06,279.378,915.812,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,915.812,279.378 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,169920, PASSED ,7.9591e-06,187.242,613.788,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,613.788,187.242 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,169920, PASSED ,5.10904e-06,291.695,956.187,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,956.187,291.695 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,169920, PASSED ,7.98266e-06,186.69,611.976,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,611.976,186.69 +Apps_MASSVEC3DPA,Base_Seq,default,21312, PASSED 
,4.70255e-05,3.97645,13.0295,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,13.2263,4.03578 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,21312, PASSED ,7.41228e-06,25.2277,82.6628,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,199.2609,60.7947 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,21312, PASSED ,4.6058e-06,40.5998,133.032,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,327.4035,99.89089999999999 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,21312, PASSED ,7.1164e-06,26.2766,86.0997,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,209.29534999999998,63.856300000000005 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,21312, PASSED ,4.48188e-06,41.7224,136.71,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,341.67,104.24369999999999 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,21312, PASSED ,7.14408e-06,26.1748,85.7661,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,208.49005,63.610400000000006 +Apps_MASSVEC3DPA,Base_Seq,default,2718720, PASSED ,0.00583883,4.08355,13.3868,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,13.2606,4.04509 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,2718720, PASSED 
,4.76641e-05,500.232,1639.87,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,1639.87,500.232 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,2718720, PASSED ,3.26887e-05,729.4,2391.14,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,2391.14,729.4 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,2718720, PASSED ,4.8664e-05,489.954,1606.18,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1606.18,489.954 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,2718720, PASSED ,3.28996e-05,724.725,2375.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,2375.81,724.725 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,2718720, PASSED ,4.87601e-05,488.989,1603.02,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1603.02,488.989 +Apps_MASSVEC3DPA,Base_Seq,default,339840, PASSED ,0.000733769,4.06186,13.3154,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,13.4231,4.09511 +Apps_MASSVEC3DPA,Base_CUDA,runtime_block_stride_loop_64,339840, PASSED ,9.79378e-06,304.323,997.613,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-runtime_block_stride_loop_64,997.613,304.323 +Apps_MASSVEC3DPA,Base_CUDA,direct_64,339840, PASSED 
,6.92866e-06,430.166,1410.14,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-direct_64,1410.14,430.166 +Apps_MASSVEC3DPA,RAJA_CUDA,runtime_block_stride_loop_64,339840, PASSED ,9.53338e-06,312.635,1024.86,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-runtime_block_stride_loop_64,1024.86,312.635 +Apps_MASSVEC3DPA,RAJA_CUDA,direct_64,339840, PASSED ,6.68232e-06,446.023,1462.13,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_64,1462.13,446.023 +Apps_MASSVEC3DPA,RAJA_CUDA,cached_block_stride_loop_64,339840, PASSED ,9.53448e-06,312.599,1024.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/MASSVEC3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-cached_block_stride_loop_64,1024.74,312.599 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000, PASSED ,2.11589e-06,16.4161,4.25353,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.25353,15.1809 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,1000, PASSED ,2.84359e-06,12.2151,3.16501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,18.717,67.436 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,1000, PASSED ,2.80486e-06,12.3837,3.20872,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,19.0226,68.5372 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2048383, PASSED 
,0.00573203,10.7769,3.21622,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,3.21622,10.7769 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,2048383, PASSED ,7.09007e-05,871.264,260.018,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,263.904,883.048 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,2048383, PASSED ,7.09243e-05,870.975,259.931,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,264.181,883.978 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,238328, PASSED ,0.000476735,15.265,4.49925,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.43443,14.9065 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,238328, PASSED ,1.00328e-05,725.36,213.795,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,213.795,725.36 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,238328, PASSED ,1.00284e-05,725.675,213.888,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,213.888,725.675 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2985984, PASSED ,0.00910079,9.88076,2.95292,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,3.0845700000000003,10.32883 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,2985984, PASSED 
,0.000101832,883.048,263.904,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,264.769,887.9935 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,2985984, PASSED ,0.000101725,883.978,264.181,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,264.72249999999997,887.837 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,27000, PASSED ,5.67901e-05,14.9014,4.27892,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.21348,14.9014 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,27000, PASSED ,3.12783e-06,270.556,77.6896,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,77.6896,270.556 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,27000, PASSED ,3.11661e-06,271.53,77.9693,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,77.9693,271.53 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,493039, PASSED ,0.000981555,15.2577,4.52073,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.43443,14.9065 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,493039, PASSED ,1.79344e-05,835.056,247.421,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,247.421,835.056 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,493039, PASSED 
,1.79915e-05,832.406,246.636,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,246.636,832.406 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,6028568, PASSED ,0.018767,9.65281,2.89109,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,2.95292,9.88076 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,6028568, PASSED ,0.000198514,912.551,273.316,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,263.904,883.048 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,6028568, PASSED ,0.000198515,912.545,273.314,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,264.181,883.978 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,54872, PASSED ,0.000118843,14.3179,4.15548,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.21348,14.9014 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,54872, PASSED ,3.96236e-06,429.436,124.635,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,124.635,429.436 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,54872, PASSED ,3.97114e-06,428.486,124.359,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,124.359,428.486 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,5832, PASSED 
,1.24572e-05,15.1809,4.21348,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.233504999999999,15.04115 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,5832, PASSED ,2.8043e-06,67.436,18.717,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,48.2033,168.99599999999998 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,5832, PASSED ,2.75924e-06,68.5372,19.0226,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,48.49595,170.03359999999998 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000000, PASSED ,0.00202957,14.9065,4.43443,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.43443,14.9065 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,1000000, PASSED ,3.38812e-05,892.939,265.634,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,260.018,871.264 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,1000000, PASSED ,3.39284e-05,891.696,265.264,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,259.931,870.975 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,117649, PASSED ,0.00026121,13.8423,4.05361,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.27892,14.9014 +Apps_NODAL_ACCUMULATION_3D,Base_CUDA,block_256,117649, PASSED 
,5.81927e-06,621.341,181.954,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,181.954,621.341 +Apps_NODAL_ACCUMULATION_3D,RAJA_CUDA,block_256,117649, PASSED ,5.82147e-06,621.106,181.886,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,181.886,621.106 +Apps_VOL3D,Base_Seq,default,512, PASSED ,9.61451e-06,4.748,10.589,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,10.589,4.63757 +Apps_VOL3D,Base_CUDA,block_256,512, PASSED ,2.71531e-06,16.812,37.4941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,152.965,66.2827 +Apps_VOL3D,RAJA_CUDA,block_256,512, PASSED ,2.66465e-06,17.1316,38.2069,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,159.37,69.0584 +Apps_VOL3D,Base_Seq,default,1442897, PASSED ,0.0116043,4.06895,9.76601,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,9.76601,4.06895 +Apps_VOL3D,Base_CUDA,block_256,1442897, PASSED ,2.48123e-05,1902.98,4567.41,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,4669.88,1944.11 +Apps_VOL3D,RAJA_CUDA,block_256,1442897, PASSED ,2.37548e-05,1987.7,4770.74,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,5023.79,2091.45 +Apps_VOL3D,Base_Seq,default,166375, PASSED 
,0.00135694,4.4135,10.5217,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.4987,4.4135 +Apps_VOL3D,Base_CUDA,block_256,166375, PASSED ,5.15502e-06,1161.75,2769.61,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,2769.61,1161.75 +Apps_VOL3D,RAJA_CUDA,block_256,166375, PASSED ,4.40588e-06,1359.29,3240.53,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,3240.53,1359.29 +Apps_VOL3D,Base_Seq,default,2146689, PASSED ,0.0172879,4.01726,9.64971,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,9.70786,4.043105000000001 +Apps_VOL3D,Base_CUDA,block_256,2146689, PASSED ,3.57233e-05,1944.11,4669.88,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,4784.225,1990.475 +Apps_VOL3D,RAJA_CUDA,block_256,2146689, PASSED ,3.32067e-05,2091.45,5023.79,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,5172.46,2151.995 +Apps_VOL3D,Base_Seq,default,17576, PASSED ,0.000172093,4.47421,10.5172,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.5172,4.47421 +Apps_VOL3D,Base_CUDA,block_256,17576, PASSED ,3.2504e-06,236.888,556.835,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,556.835,236.888 +Apps_VOL3D,RAJA_CUDA,block_256,17576, PASSED 
,2.72221e-06,282.851,664.877,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,664.877,282.851 +Apps_VOL3D,Base_Seq,default,343000, PASSED ,0.00264511,4.48746,10.728,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.486,4.37656 +Apps_VOL3D,Base_CUDA,block_256,343000, PASSED ,8.32725e-06,1425.42,3407.7,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,3407.7,1425.42 +Apps_VOL3D,RAJA_CUDA,block_256,343000, PASSED ,6.09938e-06,1946.07,4652.4,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,4652.4,1946.07 +Apps_VOL3D,Base_Seq,default,4410944, PASSED ,0.0361167,3.88335,9.33941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,9.64971,4.01726 +Apps_VOL3D,Base_CUDA,block_256,4410944, PASSED ,6.88587e-05,2036.84,4898.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,4669.88,1944.11 +Apps_VOL3D,RAJA_CUDA,block_256,4410944, PASSED ,6.33905e-05,2212.54,5321.13,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,5023.79,2091.45 +Apps_VOL3D,Base_Seq,default,35937, PASSED ,0.000328079,4.4415,10.4987,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.5172,4.4415 +Apps_VOL3D,Base_CUDA,block_256,35937, PASSED 
,3.32316e-06,438.487,1036.49,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1036.49,438.487 +Apps_VOL3D,RAJA_CUDA,block_256,35937, PASSED ,3.19033e-06,456.743,1079.64,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1079.64,456.743 +Apps_VOL3D,Base_Seq,default,3375, PASSED ,4.10173e-05,4.63757,10.7024,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.5531,4.55589 +Apps_VOL3D,Base_CUDA,block_256,3375, PASSED ,2.86984e-06,66.2827,152.965,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,354.90000000000003,151.58535 +Apps_VOL3D,RAJA_CUDA,block_256,3375, PASSED ,2.75449e-06,69.0584,159.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,412.1235,175.9547 +Apps_VOL3D,Base_Seq,default,704969, PASSED ,0.00540288,4.37656,10.486,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,10.486,4.37656 +Apps_VOL3D,Base_CUDA,block_256,704969, PASSED ,1.14911e-05,2057.77,4930.32,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,4567.41,1902.98 +Apps_VOL3D,RAJA_CUDA,block_256,704969, PASSED ,9.98778e-06,2367.49,5672.4,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,4770.74,1987.7 +Apps_VOL3D,Base_Seq,default,79507, PASSED 
,0.000689456,4.36589,10.3709,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.5172,4.4415 +Apps_VOL3D,Base_CUDA,block_256,79507, PASSED ,3.75658e-06,801.284,1903.39,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1903.39,801.284 +Apps_VOL3D,RAJA_CUDA,block_256,79507, PASSED ,3.56829e-06,843.566,2003.83,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier1/VOL3D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,2003.83,843.566 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_DIFFUSION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_DIFFUSION3DPA.csv new file mode 100644 index 0000000..d379592 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_DIFFUSION3DPA.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64 (raw),Base_CUDA-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_64 (raw),RAJA_CUDA-block_64 (smoothed),Base_CUDA-block_64 (raw B/W),Base_CUDA-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_64 (raw B/W),RAJA_CUDA-block_64 (smoothed B/W) +405,18.0915,69.2993,13.1459,13.6146,19.2625,73.989,12.0974,46.2209,8.79032,9.0806,12.8804,49.3488 +1566,69.2993,170.54665,13.6146,13.6106,73.989,179.01600000000002,46.2209,113.68995,9.0806,9.07441,49.3488,119.3364 +6183,271.794,271.794,13.8113,13.6066,284.043,284.043,181.159,181.159,9.20569,9.06822,189.324,189.324 +12339,514.567,514.567,13.6066,13.6066,534.463,534.463,342.937,342.937,9.06822,9.06822,356.197,356.197 +24678,940.413,940.413,12.139,12.508,985.231,985.231,626.709,626.709,8.08964,8.33524,656.577,656.577 
+49329,1457.23,1457.23,11.7979,12.139,1587.84,1587.84,971.099,971.099,7.8621,8.08964,1058.14,1058.14 +98631,2126.82,2126.82,12.508,11.7979,2058.54,2058.54,1417.29,1417.29,8.33524,7.8621,1371.79,1371.79 +197262,2495.05,2435.93,10.7965,10.7965,2483.77,2483.77,1662.67,1623.27,7.19463,7.19463,1655.15,1655.15 +394524,2435.93,2495.05,7.72949,7.72949,2506.66,2506.66,1623.27,1662.67,5.15081,5.15081,1670.4,1670.4 +577935,2587.42,2541.235,7.57591,7.6527,2661.33,2583.995,1724.22,1693.4450000000002,5.04846,5.099635,1773.47,1721.935 +1155843,2832.74,2587.42,7.25656,7.57591,2871.99,2661.33,1887.69,1724.22,4.83564,5.04846,1913.84,1773.47 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_EDGE3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_EDGE3D.csv new file mode 100644 index 0000000..ed7498a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_EDGE3D.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +512,80.6755,339.719,9.38302,9.38853,80.35,339.496,0.197104,0.802097,0.0229243,0.0221669,0.196309,0.801571 +3375,339.719,740.1445,9.38853,9.385774999999999,339.496,741.7429999999999,0.802097,1.7229735,0.0221669,0.02197615,0.801571,1.7266705 +17576,1140.57,1140.57,9.39835,9.38302,1143.99,1143.99,2.64385,2.64385,0.0217854,0.0217854,2.65177,2.65177 +35937,1188.01,1188.01,9.34143,9.35348,1188.86,1188.86,2.7385,2.7385,0.021533,0.021533,2.74046,2.74046 +79507,1442.95,1442.95,9.35348,9.35308,1435.95,1435.95,3.30983,3.30983,0.021455,0.021455,3.29378,3.29378 
+166375,1503.98,1503.98,9.34894,9.35308,1500.7,1500.7,3.43745,3.43745,0.0213676,0.0213676,3.42995,3.42995 +343000,1565.47,1565.47,9.35308,9.35308,1559.59,1559.59,3.568,3.568,0.0213174,0.0213174,3.55459,3.55459 +704969,1593.03,1593.03,9.36795,9.35308,1586.61,1586.61,3.6228,3.6228,0.0213042,0.0213042,3.60819,3.60819 +1442897,1611.09,1611.09,9.32671,9.35308,1606.07,1606.07,3.65749,3.65749,0.0211735,0.0212504,3.64609,3.64609 +2146689,1618.58,1614.835,9.36815,9.34943,1613.82,1609.945,3.67155,3.66452,0.0212504,0.02121195,3.66075,3.652475 +4410944,1620.76,1618.58,9.33091,9.33091,1614.96,1613.82,3.67202,3.67155,0.0211402,0.0211735,3.65886,3.65886 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_ENERGY.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_ENERGY.csv new file mode 100644 index 0000000..bf898db --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_ENERGY.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +417,1.77625,6.93723,13.341,12.8693,1.77731,6.90487,6.49675,25.3733,48.7956,47.0702,6.50062,25.255 +1667,6.93723,17.176515000000002,12.865,12.894200000000001,6.90487,17.088935,25.3733,62.82415,47.0544,47.1612,25.255,62.5038 +6667,27.4158,27.4158,12.8693,12.9191,27.273,27.273,100.275,100.275,47.0702,47.2522,99.7526,99.7526 +13334,54.6624,54.6624,12.9191,12.8693,54.4796,54.4796,199.931,199.931,47.2522,47.0702,199.262,199.262 +26667,107.026,107.026,13.2967,12.8693,106.824,106.824,391.454,391.454,48.6333,47.0702,390.714,390.714 
+53334,198.795,198.795,10.1411,10.1411,198.104,198.104,727.103,727.103,37.0917,37.0917,724.576,724.576 +106667,362.386,362.386,9.22412,9.22412,362.606,362.606,1325.45,1325.45,33.7378,33.7378,1326.25,1326.25 +213334,612.557,612.557,8.97634,8.97634,615.5,615.5,2240.46,2240.46,32.8315,32.8315,2251.23,2251.23 +426667,849.103,722.619,8.40628,8.40628,846.742,723.629,3105.64,2643.02,30.7464,30.7464,3097.01,2646.71 +625000,804.683,763.6510000000001,7.18539,7.795835,802.407,763.018,2943.18,2793.1,26.281,28.5137,2934.85,2790.7799999999997 +1250000,722.619,804.683,5.12504,7.18539,723.629,802.407,2643.02,2943.18,18.7451,26.281,2646.71,2934.85 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_FEMSWEEP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_FEMSWEEP.csv new file mode 100644 index 0000000..e16d398 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_FEMSWEEP.csv @@ -0,0 +1,11 @@ +Problem size,Base_CUDA-block_128 (raw),Base_CUDA-block_128 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_128 (raw),RAJA_CUDA-block_128 (smoothed),Base_CUDA-block_128 (raw B/W),Base_CUDA-block_128 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_128 (raw B/W),RAJA_CUDA-block_128 (smoothed B/W) +31104,83.12595,108.1106,3.37219,3.208915,56.03545,72.43655000000001,14.928049999999999,19.745,0.6055889999999999,0.586811,10.06305,13.2291 +73728,132.791,132.791,3.10205,3.16604,88.7746,88.7746,24.5073,24.5073,0.5725,0.595459,16.3838,16.3838 +144000,182.372,182.372,3.08391,3.16064,124.333,124.333,34.1906,34.1906,0.578163,0.599649,23.3096,23.3096 +248832,236.347,236.347,3.16604,3.10205,163.289,163.289,44.7641,44.7641,0.599649,0.594489,30.9269,30.9269 +395136,241.569,241.569,3.16064,3.09991,189.419,189.419,46.0821,46.0821,0.602929,0.594489,36.1339,36.1339 
+589824,276.445,276.445,3.09991,3.09991,221.479,221.479,53.0155,53.0155,0.594489,0.594489,42.4744,42.4744 +1152000,302.549,302.549,2.93255,2.93255,252.975,252.975,58.4488,58.4488,0.566533,0.566533,48.8716,48.8716 +1533312,319.107,319.107,2.69281,2.69281,271.05,271.05,61.8105,61.8105,0.521593,0.521593,52.502,52.502 +1990656,339.519,329.313,2.62611,2.65946,284.022,277.536,65.9083,63.859399999999994,0.509787,0.51569,55.1352,53.8186 +2530944,341.606,339.519,2.56545,2.62611,295.038,284.022,66.4358,65.9083,0.498932,0.509787,57.3794,55.1352 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_INTSC_HEXRECT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_INTSC_HEXRECT.csv new file mode 100644 index 0000000..0f86b40 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_INTSC_HEXRECT.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64 (raw),Base_CUDA-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_64 (raw),RAJA_CUDA-block_64 (smoothed),Base_CUDA-block_64 (raw B/W),Base_CUDA-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_64 (raw B/W),RAJA_CUDA-block_64 (smoothed B/W) +1728,40.5816,137.471,4.08557,4.27525,40.9991,138.338,0.511948,1.71116,0.0515405,0.0532159,0.517215,1.72196 +5832,137.471,264.5855,4.27525,4.292305,138.338,269.3045,1.71116,3.27475,0.0532159,0.053119349999999996,1.72196,3.333085 +17576,391.7,391.7,4.31165,4.30936,400.271,400.271,4.83834,4.83834,0.0532582,0.0530315,4.94421,4.94421 +39304,801.073,801.073,4.30936,4.31165,821.286,821.286,9.85649,9.85649,0.0530228,0.0530315,10.1052,10.1052 +74088,1235.97,1235.97,4.32023,4.31601,918.07,918.07,15.1717,15.1717,0.0530315,0.0530228,11.2695,11.2695 +140608,1294.89,1294.89,4.32463,4.31956,1130.28,1130.28,15.8649,15.8649,0.0529853,0.0529853,13.8482,13.8482 
+287496,1412.94,1412.94,4.31601,4.32023,1219.55,1219.55,17.2826,17.2826,0.0527919,0.0527919,14.9171,14.9171 +551368,1545.74,1545.74,4.31956,4.31956,1289.52,1289.52,18.8845,18.8845,0.0527725,0.0527725,15.7543,15.7543 +1124864,1629.6,1629.6,4.32034,4.31662,1352.37,1352.37,19.8885,19.8885,0.0527279,0.0527279,16.5051,16.5051 +1643032,1644.02,1636.81,4.31662,4.31809,1361.3,1356.835,20.0555,19.972,0.0526587,0.0526933,16.6066,16.55585 +3241792,1678.67,1644.02,4.31628,4.31662,1387.86,1361.3,20.4644,20.0555,0.0526191,0.0526587,16.9192,16.6066 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASS3DEA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASS3DEA.csv new file mode 100644 index 0000000..47a2359 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASS3DEA.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-compile_time_block_stride_loop_64 (raw),Base_CUDA-compile_time_block_stride_loop_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-cached_block_stride_loop_64 (raw),RAJA_CUDA-cached_block_stride_loop_64 (smoothed),RAJA_CUDA-compile_time_block_stride_loop_64 (raw),RAJA_CUDA-compile_time_block_stride_loop_64 (smoothed),Base_CUDA-compile_time_block_stride_loop_64 (raw B/W),Base_CUDA-compile_time_block_stride_loop_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-cached_block_stride_loop_64 (raw B/W),RAJA_CUDA-cached_block_stride_loop_64 (smoothed B/W),RAJA_CUDA-compile_time_block_stride_loop_64 (raw B/W),RAJA_CUDA-compile_time_block_stride_loop_64 (smoothed B/W) +196608,12.371,24.4534,0.172475,0.173081,17.4694,34.7305,18.4941,36.4701,13.5704,26.8231,0.189198,0.189853,19.1632,38.096,20.2873,40.0042 +389120,24.4534,36.41755,0.173081,0.17399150000000002,34.7305,51.6965,36.4701,54.60965,26.8231,39.94595,0.189853,0.19084849999999998,38.096,56.70515,40.0042,59.9006 
+778240,48.3817,48.3817,0.175105,0.173081,68.6625,68.6625,72.7492,72.7492,53.0688,53.0688,0.192069,0.189853,75.3143,75.3143,79.797,79.797 +1556480,86.5439,86.5439,0.174902,0.173081,99.2427,99.2427,107.447,107.447,94.9269,94.9269,0.191844,0.189853,108.856,108.856,117.855,117.855 +3108864,148.459,148.459,0.170552,0.170552,138.621,138.621,150.044,150.044,162.839,162.839,0.187071,0.187071,152.047,152.047,164.577,164.577 +6213632,164.056,164.056,0.16971,0.16971,160.009,160.009,175.822,175.822,179.945,179.945,0.186147,0.186147,175.507,175.507,192.851,192.851 +9101312,172.016,172.016,0.169502,0.169502,164.882,164.882,181.224,181.224,188.677,188.677,0.185918,0.185918,180.851,180.851,198.776,198.776 +18198528,199.437,199.437,0.169224,0.169502,183.938,183.852,204.956,204.956,218.752,218.752,0.185614,0.185918,201.752,201.658,224.806,224.806 +24260608,201.02,201.02,0.168307,0.169224,183.852,183.938,205.09,204.956,220.49,220.49,0.184607,0.185614,201.658,201.752,224.953,224.806 +30326784,202.545,201.7825,0.170325,0.1689245,184.368,184.153,205.854,205.023,222.162,221.32600000000002,0.186821,0.185285,202.225,201.9885,225.791,224.8795 +36392960,208.774,202.545,0.168625,0.168625,189.723,184.368,195.678,205.09,228.994,222.162,0.184956,0.184956,208.098,202.225,214.629,224.953 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv new file mode 100644 index 0000000..b6a46fd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64 (raw),Base_CUDA-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_64 (raw),RAJA_CUDA-block_64 (smoothed),Base_CUDA-block_64 (raw B/W),Base_CUDA-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_64 (raw 
B/W),RAJA_CUDA-block_64 (smoothed B/W) +729,31.9709,163.533,11.2564,11.5777,31.8483,162.29,15.994,78.6741,5.63123,5.57301,15.9327,78.0764 +3375,163.533,288.13599999999997,11.5841,11.5567,162.29,290.451,78.6741,137.17105,5.57301,5.530835,78.0764,138.26420000000002 +9261,412.739,412.739,11.5777,11.5777,418.612,418.612,195.668,195.668,5.48866,5.50448,198.452,198.452 +19683,727.574,727.574,11.5357,11.5777,722.443,722.443,342.273,342.273,5.42675,5.48866,339.859,339.859 +35937,1053.65,1053.65,11.7567,11.5777,1051.09,1051.09,493.318,493.318,5.50448,5.48866,492.121,492.121 +68921,1386.0,1386.0,11.4143,11.5357,1375.17,1375.17,646.287,646.287,5.32245,5.42675,641.236,641.236 +132651,1621.29,1621.29,11.8115,11.4143,1628.39,1628.39,753.564,753.564,5.48991,5.32245,756.865,756.865 +250047,1701.15,1701.15,11.0648,11.2895,1700.82,1700.82,788.718,788.718,5.13006,5.21751,788.566,788.566 +531441,1781.14,1781.14,10.0903,11.0648,1779.54,1779.54,823.891,823.891,4.66743,5.13006,823.152,823.152 +753571,1845.33,1813.2350000000001,11.2895,10.577549999999999,1844.49,1812.0149999999999,852.829,838.3599999999999,5.21751,4.898745,852.44,837.796 +1442897,1852.55,1845.33,9.61689,10.0903,1851.15,1844.49,854.982,852.829,4.43834,4.66743,854.334,852.44 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASSVEC3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASSVEC3DPA.csv new file mode 100644 index 0000000..3b137b5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_MASSVEC3DPA.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_64 (raw),Base_CUDA-direct_64 (smoothed),Base_CUDA-runtime_block_stride_loop_64 (raw),Base_CUDA-runtime_block_stride_loop_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-cached_block_stride_loop_64 (raw),RAJA_CUDA-cached_block_stride_loop_64 (smoothed),RAJA_CUDA-direct_64 (raw),RAJA_CUDA-direct_64 
(smoothed),RAJA_CUDA-runtime_block_stride_loop_64 (raw),RAJA_CUDA-runtime_block_stride_loop_64 (smoothed),Base_CUDA-direct_64 (raw B/W),Base_CUDA-direct_64 (smoothed B/W),Base_CUDA-runtime_block_stride_loop_64 (raw B/W),Base_CUDA-runtime_block_stride_loop_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-cached_block_stride_loop_64 (raw B/W),RAJA_CUDA-cached_block_stride_loop_64 (smoothed B/W),RAJA_CUDA-direct_64 (raw B/W),RAJA_CUDA-direct_64 (smoothed B/W),RAJA_CUDA-runtime_block_stride_loop_64 (raw B/W),RAJA_CUDA-runtime_block_stride_loop_64 (smoothed B/W) +5376,33.9294,133.032,20.8302,82.6628,12.7342,13.0295,21.9138,85.7661,35.8586,136.71,22.0878,86.0997,10.3695,40.5998,6.36613,25.2277,3.89184,3.97645,6.69729,26.1748,10.9591,41.7224,6.75047,26.2766 +21312,133.032,327.4035,82.6628,199.2609,13.0295,13.2263,85.7661,208.49005,136.71,341.67,86.0997,209.29534999999998,40.5998,99.89089999999999,25.2277,60.7947,3.97645,4.03578,26.1748,63.610400000000006,41.7224,104.24369999999999,26.2766,63.856300000000005 +85056,521.775,521.775,315.859,315.859,13.4231,13.3154,331.214,331.214,546.63,546.63,332.491,332.491,159.182,159.182,96.3617,96.3617,4.09511,4.06186,101.046,101.046,166.765,166.765,101.436,101.436 +169920,915.812,915.812,586.117,586.117,13.4656,13.3154,611.976,611.976,956.187,956.187,613.788,613.788,279.378,279.378,178.801,178.801,4.1078,4.06186,186.69,186.69,291.695,291.695,187.242,187.242 +339840,1410.14,1410.14,997.613,997.613,13.3154,13.4231,1024.74,1024.74,1462.13,1462.13,1024.86,1024.86,430.166,430.166,304.323,304.323,4.06186,4.09511,312.599,312.599,446.023,446.023,312.635,312.635 +679680,1863.74,1863.74,1247.03,1247.03,13.2606,13.3868,1245.9,1245.9,1828.99,1828.99,1244.51,1244.51,568.529,568.529,380.403,380.403,4.04509,4.08355,380.057,380.057,557.927,557.927,379.635,379.635 
+1359360,2232.74,2232.74,1503.67,1503.67,13.5939,13.3154,1488.66,1488.66,2206.04,2206.04,1487.81,1487.81,681.084,681.084,458.687,458.687,4.14675,4.06186,454.106,454.106,672.94,672.94,453.847,453.847 +2718720,2391.14,2391.14,1639.87,1639.87,13.3868,13.2606,1603.02,1603.02,2375.81,2375.81,1606.18,1606.18,729.4,729.4,500.232,500.232,4.08355,4.04509,488.989,488.989,724.725,724.725,489.954,489.954 +5437248,2486.35,2486.35,1709.46,1709.46,12.2106,12.2797,1613.81,1613.81,2456.97,2456.97,1614.83,1614.83,758.443,758.443,521.457,521.457,3.72476,3.74583,492.28,492.28,749.481,749.481,492.59,492.59 +7964736,2546.27,2516.31,1748.18,1728.8200000000002,12.2797,12.245149999999999,1647.75,1630.78,2515.47,2486.22,1648.29,1631.56,776.721,767.582,533.27,527.3634999999999,3.74583,3.735295,502.632,497.456,767.326,758.4035,502.798,497.69399999999996 +15929280,2613.91,2546.27,1793.76,1748.18,12.085,12.2106,1686.48,1647.75,2585.31,2515.47,1687.86,1648.29,797.352,776.721,547.173,533.27,3.68644,3.72476,514.449,502.632,788.629,767.326,514.867,502.798 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv new file mode 100644 index 0000000..c3c0780 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +1000,3.16501,18.717,4.25353,4.25353,3.20872,19.0226,12.2151,67.436,16.4161,15.1809,12.3837,68.5372 
+5832,18.717,48.2033,4.21348,4.233504999999999,19.0226,48.49595,67.436,168.99599999999998,15.1809,15.04115,68.5372,170.03359999999998 +27000,77.6896,77.6896,4.27892,4.21348,77.9693,77.9693,270.556,270.556,14.9014,14.9014,271.53,271.53 +54872,124.635,124.635,4.15548,4.21348,124.359,124.359,429.436,429.436,14.3179,14.9014,428.486,428.486 +117649,181.954,181.954,4.05361,4.27892,181.886,181.886,621.341,621.341,13.8423,14.9014,621.106,621.106 +238328,213.795,213.795,4.49925,4.43443,213.888,213.888,725.36,725.36,15.265,14.9065,725.675,725.675 +493039,247.421,247.421,4.52073,4.43443,246.636,246.636,835.056,835.056,15.2577,14.9065,832.406,832.406 +1000000,265.634,260.018,4.43443,4.43443,265.264,259.931,892.939,871.264,14.9065,14.9065,891.696,870.975 +2048383,260.018,263.904,3.21622,3.21622,259.931,264.181,871.264,883.048,10.7769,10.7769,870.975,883.978 +2985984,263.904,264.769,2.95292,3.0845700000000003,264.181,264.72249999999997,883.048,887.9935,9.88076,10.32883,883.978,887.837 +6028568,273.316,263.904,2.89109,2.95292,273.314,264.181,912.551,883.048,9.65281,9.88076,912.545,883.978 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_VOL3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_VOL3D.csv new file mode 100644 index 0000000..89e7ff1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier1/saturation-curve-data/Apps_VOL3D.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +512,37.4941,152.965,10.589,10.589,38.2069,159.37,16.812,66.2827,4.748,4.63757,17.1316,69.0584 
+3375,152.965,354.90000000000003,10.7024,10.5531,159.37,412.1235,66.2827,151.58535,4.63757,4.55589,69.0584,175.9547 +17576,556.835,556.835,10.5172,10.5172,664.877,664.877,236.888,236.888,4.47421,4.47421,282.851,282.851 +35937,1036.49,1036.49,10.4987,10.5172,1079.64,1079.64,438.487,438.487,4.4415,4.4415,456.743,456.743 +79507,1903.39,1903.39,10.3709,10.5172,2003.83,2003.83,801.284,801.284,4.36589,4.4415,843.566,843.566 +166375,2769.61,2769.61,10.5217,10.4987,3240.53,3240.53,1161.75,1161.75,4.4135,4.4135,1359.29,1359.29 +343000,3407.7,3407.7,10.728,10.486,4652.4,4652.4,1425.42,1425.42,4.48746,4.37656,1946.07,1946.07 +704969,4930.32,4567.41,10.486,10.486,5672.4,4770.74,2057.77,1902.98,4.37656,4.37656,2367.49,1987.7 +1442897,4567.41,4669.88,9.76601,9.76601,4770.74,5023.79,1902.98,1944.11,4.06895,4.06895,1987.7,2091.45 +2146689,4669.88,4784.225,9.64971,9.70786,5023.79,5172.46,1944.11,1990.475,4.01726,4.043105000000001,2091.45,2151.995 +4410944,4898.57,4669.88,9.33941,9.64971,5321.13,5023.79,2036.84,1944.11,3.88335,4.01726,2212.54,2091.45 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..d80dda6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +702,13.0808,8.99998,12.8703 +2754,51.003,9.58193,50.311 +10989,195.584,9.833,195.773 +21951,352.724,9.68897,352.946 +43902,580.97,9.23949,589.277 +87804,902.974,8.59976,846.664 +175608,1139.85,9.40624,1121.27 +351216,1299.59,8.95436,1294.09 +702459,1372.29,8.36122,1332.77 +1028970,1429.44,6.95626,1388.59 +2057940,1512.12,6.7363,1470.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_bandwidth_smoothed.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..29f70d2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +702,51.003,9.58193,50.311 +2754,123.2935,9.635449999999999,123.042 +10989,195.584,9.58193,195.773 +21951,352.724,9.58193,352.946 +43902,580.97,9.40624,589.277 +87804,902.974,9.23949,846.664 +175608,1139.85,8.95436,1121.27 +351216,1299.59,8.59976,1294.09 +702459,1372.29,8.36122,1332.77 +1028970,1400.865,7.65874,1360.6799999999998 +2057940,1429.44,6.95626,1388.59 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_flops_raw.csv new file mode 100644 index 0000000..8575ec4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +702,23.566,16.2141,23.1867 +2754,92.2323,17.3277,90.981 +10989,354.031,17.799,354.374 +21951,638.578,17.5411,638.979 +43902,1051.88,16.7287,1066.92 +87804,1634.96,15.571,1533.0 +175608,2063.9,17.0316,2030.26 +351216,2353.16,16.2136,2343.2 +702459,2484.81,15.1397,2413.24 +1028970,2588.29,12.5957,2514.33 +2057940,2738.0,12.1975,2661.73 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_flops_smoothed.csv new file mode 100644 index 0000000..2527e93 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_CONVECTION3DPA_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +702,92.2323,17.3277,90.981 +2754,223.13165,17.4344,222.6775 
+10989,354.031,17.3277,354.374 +21951,638.578,17.3277,638.979 +43902,1051.88,17.0316,1066.92 +87804,1634.96,16.7287,1533.0 +175608,2063.9,16.2136,2030.26 +351216,2353.16,15.571,2343.2 +702459,2484.81,15.1397,2413.24 +1028970,2536.55,13.8677,2463.785 +2057940,2588.29,12.5957,2514.33 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv new file mode 100644 index 0000000..b0d8e35 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +841,14.1366,9.00417,14.0566 +3844,62.6523,8.87021,62.6087 +15876,252.507,8.7674,254.62 +32400,487.276,8.77331,484.718 +65025,871.018,8.46653,880.787 +131044,1449.86,8.92438,1458.49 +264196,2284.61,8.45538,2284.84 +528529,2750.66,8.14447,2764.07 +1060900,2197.32,7.43151,2197.41 +1555009,2312.22,7.15839,2314.53 +3115225,2453.4,7.14469,2456.31 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv new file mode 100644 index 0000000..e42b1f5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +841,62.6523,8.87021,62.6087 +3844,157.57965000000002,8.821760000000001,158.61435 +15876,252.507,8.77331,254.62 +32400,487.276,8.77331,484.718 +65025,871.018,8.7674,880.787 +131044,1449.86,8.46653,1458.49 +264196,2197.32,8.45538,2197.41 +528529,2284.61,8.14447,2284.84 +1060900,2312.22,7.43151,2314.53 +1555009,2382.81,7.29495,2385.42 +3115225,2312.22,7.15839,2314.53 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_flops_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_flops_raw.csv new file mode 100644 index 0000000..6dbd464 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +841,16.3134,10.3907,16.2211 +3844,74.0756,10.4875,74.024 +15876,301.812,10.4793,304.338 +32400,584.269,10.5197,581.203 +65025,1046.67,10.1739,1058.41 +131044,1744.94,10.7407,1755.33 +264196,2752.57,10.1873,2752.84 +528529,3316.6,9.82016,3332.77 +1060900,2650.84,8.96536,2650.95 +1555009,2790.09,8.63781,2792.87 +3115225,2961.37,8.62398,2964.89 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv new file mode 100644 index 0000000..24a3b4f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +841,74.0756,10.4793,74.024 +3844,187.9438,10.4834,189.181 +15876,301.812,10.4793,304.338 +32400,584.269,10.4875,581.203 +65025,1046.67,10.4793,1058.41 +131044,1744.94,10.1873,1755.33 +264196,2650.84,10.1739,2650.95 +528529,2752.57,9.82016,2752.84 +1060900,2790.09,8.96536,2792.87 +1555009,2875.73,8.801585,2878.88 +3115225,2790.09,8.63781,2792.87 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_bandwidth_raw.csv new file mode 100644 index 0000000..790fd40 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +27,3.69148,0.0989909,3.63502 +64,6.3289,0.0997673,7.04729 +216,13.3653,0.100273,13.4897 
+512,18.409,0.100642,18.1464 +1000,21.4014,0.100583,21.0388 +1728,22.7549,0.100606,22.7431 +3375,24.0204,0.100667,23.9383 +6859,24.7604,0.100644,24.7607 +13824,25.1391,0.100584,25.1178 +19683,25.1981,0.100496,25.2033 +39304,25.3024,0.100719,25.3391 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv new file mode 100644 index 0000000..f2adee3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +27,6.3289,0.0997673,7.04729 +64,9.8471,0.10002015,10.268495 +216,13.3653,0.100273,13.4897 +512,18.409,0.100583,18.1464 +1000,21.4014,0.100606,21.0388 +1728,22.7549,0.100642,22.7431 +3375,24.0204,0.100606,23.9383 +6859,24.7604,0.100606,24.7607 +13824,25.1391,0.100644,25.1178 +19683,25.168599999999998,0.10061400000000001,25.16055 +39304,25.1981,0.100584,25.2033 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_flops_raw.csv new file mode 100644 index 0000000..6d8c8df --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +27,171.232,4.59175,168.613 +64,293.57,4.62777,326.893 +216,619.958,4.65123,625.73 +512,853.911,4.66836,841.732 +1000,992.716,4.66559,975.897 +1728,1055.5,4.66666,1054.95 +3375,1114.2,4.66949,1110.39 +6859,1148.53,4.66843,1148.54 +13824,1166.1,4.66566,1165.1 +19683,1168.83,4.66159,1169.07 +39304,1173.67,4.67192,1175.37 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_flops_smoothed.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_flops_smoothed.csv new file mode 100644 index 0000000..7ba6227 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_INTSC_HEXHEX_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64,Base_Seq-default,RAJA_CUDA-block_64 +27,293.57,4.62777,326.893 +64,456.764,4.6395,476.3115 +216,619.958,4.65123,625.73 +512,853.911,4.66559,841.732 +1000,992.716,4.66666,975.897 +1728,1055.5,4.66836,1054.95 +3375,1114.2,4.66666,1110.39 +6859,1148.53,4.66666,1148.54 +13824,1166.1,4.66843,1165.1 +19683,1167.465,4.667045,1167.085 +39304,1168.83,4.66566,1169.07 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_bandwidth_raw.csv new file mode 100644 index 0000000..7165526 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-kernel_256,RAJA_CUDA-launch_256 +1344,28.1899,7.18731,27.6239,27.5332 +4992,102.646,7.10145,97.9681,101.627 +19392,313.487,7.10468,297.509,303.501 +38784,444.111,7.10163,426.672,445.238 +77568,634.204,7.11226,620.637,617.555 +154944,773.189,7.02907,763.865,783.746 +309696,894.303,6.9884,885.243,914.464 +619392,966.655,6.86713,960.322,995.561 +1238784,953.226,7.0928,928.741,937.816 +1814592,969.049,6.32401,943.198,952.809 +3629184,987.865,6.24426,961.381,971.802 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_bandwidth_smoothed.csv new file mode 100644 index 0000000..5b6f626 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-kernel_256,RAJA_CUDA-launch_256 
+1344,102.646,7.10468,97.9681,101.627 +4992,208.06650000000002,7.103155,197.73855,202.564 +19392,313.487,7.10468,297.509,303.501 +38784,444.111,7.10163,426.672,445.238 +77568,634.204,7.10163,620.637,617.555 +154944,773.189,7.02907,763.865,783.746 +309696,894.303,7.02907,885.243,914.464 +619392,953.226,6.9884,928.741,937.816 +1238784,966.655,6.86713,943.198,952.809 +1814592,967.852,6.59557,951.76,962.3054999999999 +3629184,969.049,6.32401,943.198,952.809 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_flops_raw.csv new file mode 100644 index 0000000..e89e96c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-kernel_256,RAJA_CUDA-launch_256 +1344,20.0297,5.10678,19.6275,19.5631 +4992,73.568,5.08973,70.2153,72.8381 +19392,225.218,5.1042,213.739,218.043 +38784,319.194,5.10412,306.66,320.004 +77568,455.913,5.11283,446.16,443.945 +154944,555.883,5.05354,549.18,563.474 +309696,642.991,5.02456,636.478,657.487 +619392,695.03,4.9375,690.477,715.813 +1238784,685.383,5.09983,667.778,674.303 +1814592,696.763,4.54707,678.176,685.086 +3629184,710.295,4.48975,691.252,698.745 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_flops_smoothed.csv new file mode 100644 index 0000000..d5ccad4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_LTIMES_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-kernel_256,RAJA_CUDA-launch_256 +1344,73.568,5.1042,70.2153,72.8381 +4992,149.393,5.10416,141.97715,145.44055 +19392,225.218,5.1042,213.739,218.043 +38784,319.194,5.10412,306.66,320.004 +77568,455.913,5.10412,446.16,443.945 +154944,555.883,5.05354,549.18,563.474 
+309696,642.991,5.05354,636.478,657.487 +619392,685.383,5.02456,667.778,674.303 +1238784,695.03,4.9375,678.176,685.086 +1814592,695.8965000000001,4.742285,684.3265,691.9155000000001 +3629184,696.763,4.54707,678.176,685.086 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..0d113d5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_25,Base_Seq-default,RAJA_CUDA-block_25 +1600,15.285,6.5807,15.3135 +6336,61.5,6.95157,60.989 +25344,236.56,7.01696,236.652 +50624,422.384,7.02056,422.768 +101184,667.038,6.83109,667.937 +202368,1033.94,6.88576,1032.6 +404736,1270.66,6.77938,1264.16 +809536,1432.49,6.86773,1425.82 +1619008,1489.37,6.4805,1479.04 +2371584,1545.07,5.83072,1536.46 +4743104,1606.41,5.71091,1599.49 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..55b74ef --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_25,Base_Seq-default,RAJA_CUDA-block_25 +1600,61.5,6.95157,60.989 +6336,149.03,6.984265000000001,148.82049999999998 +25344,236.56,6.95157,236.652 +50624,422.384,6.95157,422.768 +101184,667.038,6.88576,667.937 +202368,1033.94,6.86773,1032.6 +404736,1270.66,6.83109,1264.16 +809536,1432.49,6.77938,1425.82 +1619008,1489.37,6.4805,1479.04 +2371584,1517.2199999999998,6.15561,1507.75 +4743104,1545.07,5.83072,1536.46 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_flops_raw.csv new file mode 100644 
index 0000000..8d78788 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_25,Base_Seq-default,RAJA_CUDA-block_25 +1600,32.6401,14.0527,32.701 +6336,131.824,14.9006,130.729 +25344,507.546,15.0551,507.744 +50624,906.382,15.0652,907.206 +101184,1431.49,14.6598,1433.42 +202368,2218.97,14.7777,2216.09 +404736,2727.06,14.5497,2713.09 +809536,3074.41,14.7395,3060.07 +1619008,3196.5,13.9085,3174.31 +2371584,3316.03,12.5139,3297.56 +4743104,3447.69,12.2568,3432.84 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_flops_smoothed.csv new file mode 100644 index 0000000..50db2e2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MASS3DPA_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_25,Base_Seq-default,RAJA_CUDA-block_25 +1600,131.824,14.9006,130.729 +6336,319.685,14.97785,319.23650000000004 +25344,507.546,14.9006,507.744 +50624,906.382,14.9006,907.206 +101184,1431.49,14.7777,1433.42 +202368,2218.97,14.7395,2216.09 +404736,2727.06,14.6598,2713.09 +809536,3074.41,14.5497,3060.07 +1619008,3196.5,13.9085,3174.31 +2371584,3256.2650000000003,13.2112,3235.935 +4743104,3316.03,12.5139,3297.56 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv new file mode 100644 index 0000000..295da51 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +64,3.64713,17.6762,4.39112 +512,22.4171,15.6634,23.7695 +3375,132.972,14.2103,141.771 +8000,305.958,13.6766,324.241 +17576,646.562,12.4379,688.457 +35937,1091.71,12.2524,1098.45 
+79507,1932.98,12.054,1877.56 +157464,2620.58,12.5233,2325.58 +328509,2057.35,12.4101,2108.48 +493039,1910.98,12.3707,2213.75 +1000000,2116.18,12.2002,2417.72 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv new file mode 100644 index 0000000..4578b7c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +64,22.4171,15.6634,23.7695 +512,77.69455,14.93685,82.77024999999999 +3375,132.972,14.2103,141.771 +8000,305.958,13.6766,324.241 +17576,646.562,12.4379,688.457 +35937,1091.71,12.4379,1098.45 +79507,1932.98,12.4101,1877.56 +157464,1932.98,12.3707,2108.48 +328509,2057.35,12.3707,2213.75 +493039,2086.765,12.3904,2269.665 +1000000,2057.35,12.3707,2213.75 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_flops_raw.csv new file mode 100644 index 0000000..91cdb84 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +64,1.03517,5.01708,1.24634 +512,7.57386,5.29204,8.03078 +3375,49.3251,5.27123,52.5889 +8000,116.784,5.22034,123.763 +17576,251.866,4.84513,268.187 +35937,431.565,4.84351,434.228 +79507,774.039,4.82689,751.847 +157464,1058.63,5.05904,939.463 +328509,837.387,5.05119,858.197 +493039,780.501,5.05256,904.162 +1000000,868.668,5.00806,992.449 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv new file mode 100644 index 
0000000..5bea1e1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +64,7.57386,5.27123,8.03078 +512,28.44948,5.245785,30.30984 +3375,49.3251,5.22034,52.5889 +8000,116.784,5.22034,123.763 +17576,251.866,4.84513,268.187 +35937,431.565,4.84513,434.228 +79507,774.039,4.84513,751.847 +157464,780.501,5.05119,858.197 +328509,837.387,5.05119,904.162 +493039,853.0274999999999,5.051875,921.8125 +1000000,837.387,5.05119,904.162 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv new file mode 100644 index 0000000..86d73b6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +80000,185.245,6.21439,182.04 +160000,345.609,8.07202,346.669 +320000,638.26,7.95189,628.902 +640000,1113.95,7.98527,1109.59 +1280000,1798.43,7.7401,1793.54 +2560000,2126.15,7.04253,2115.35 +3750000,2188.95,6.62487,2192.44 +7500000,2115.68,6.50583,2113.59 +10000000,2191.86,6.51347,2192.79 +12500000,2239.48,6.59158,2238.9 +15000000,2265.99,6.56119,2261.96 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv new file mode 100644 index 0000000..2a19690 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +80000,345.609,7.95189,346.669 +160000,491.93449999999996,7.968579999999999,487.7855 +320000,638.26,7.95189,628.902 +640000,1113.95,7.95189,1109.59 
+1280000,1798.43,7.7401,1793.54 +2560000,2115.68,7.04253,2113.59 +3750000,2126.15,6.62487,2115.35 +7500000,2188.95,6.59158,2192.44 +10000000,2191.86,6.56119,2192.79 +12500000,2215.67,6.53733,2215.8450000000003 +15000000,2239.48,6.56119,2238.9 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_flops_raw.csv new file mode 100644 index 0000000..e15dc6c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +80000,0.0,0.0,0.0 +160000,0.0,0.0,0.0 +320000,0.0,0.0,0.0 +640000,0.0,0.0,0.0 +1280000,0.0,0.0,0.0 +2560000,0.0,0.0,0.0 +3750000,0.0,0.0,0.0 +7500000,0.0,0.0,0.0 +10000000,0.0,0.0,0.0 +12500000,0.0,0.0,0.0 +15000000,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_flops_smoothed.csv new file mode 100644 index 0000000..e15dc6c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_INDEXLIST_3LOOP_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256,Base_Seq-default,RAJA_CUDA-block_256 +80000,0.0,0.0,0.0 +160000,0.0,0.0,0.0 +320000,0.0,0.0,0.0 +640000,0.0,0.0,0.0 +1280000,0.0,0.0,0.0 +2560000,0.0,0.0,0.0 +3750000,0.0,0.0,0.0 +7500000,0.0,0.0,0.0 +10000000,0.0,0.0,0.0 +12500000,0.0,0.0,0.0 +15000000,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_bandwidth_raw.csv new file mode 100644 index 0000000..15f0259 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem 
size,Base_CUDA-atomic_direct_256,Base_CUDA-atomic_occgs_256,Base_Seq-default,RAJA_CUDA-atomic_direct_256,RAJA_CUDA-atomic_occgs_256 +99995,1.25844,1.26529,6.96569,1.22664,1.20025 +199995,2.50913,2.51178,6.92973,2.44485,2.40478 +399995,5.02467,5.03756,6.94815,4.86807,4.79058 +799995,10.0437,10.0659,6.94406,9.76294,9.58923 +1599995,20.155,20.0771,6.77215,19.5602,19.1352 +3199995,41.679,40.2205,6.38419,40.8481,39.8695 +4687495,60.9197,58.8195,6.05978,59.7946,58.5048 +9374995,122.225,117.632,5.88666,119.573,116.216 +12499995,163.402,157.554,5.95966,162.901,155.161 +15624995,208.178,196.703,5.8877,204.578,193.607 +18749995,249.995,234.088,5.98091,249.162,233.146 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_bandwidth_smoothed.csv new file mode 100644 index 0000000..f066226 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-atomic_direct_256,Base_CUDA-atomic_occgs_256,Base_Seq-default,RAJA_CUDA-atomic_direct_256,RAJA_CUDA-atomic_occgs_256 +99995,2.50913,2.51178,6.94815,2.44485,2.40478 +199995,3.7669,3.77467,6.946105,3.65646,3.5976800000000004 +399995,5.02467,5.03756,6.94406,4.86807,4.79058 +799995,10.0437,10.0659,6.92973,9.76294,9.58923 +1599995,20.155,20.0771,6.77215,19.5602,19.1352 +3199995,41.679,40.2205,6.38419,40.8481,39.8695 +4687495,60.9197,58.8195,6.05978,59.7946,58.5048 +9374995,122.225,117.632,5.95966,119.573,116.216 +12499995,163.402,157.554,5.95966,162.901,155.161 +15624995,185.79,177.1285,5.92368,183.73950000000002,174.38400000000001 +18749995,208.178,196.703,5.95966,204.578,193.607 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_flops_raw.csv new file mode 100644 index 0000000..81a5dfc --- 
/dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_flops_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-atomic_direct_256,Base_CUDA-atomic_occgs_256,Base_Seq-default,RAJA_CUDA-atomic_direct_256,RAJA_CUDA-atomic_occgs_256 +99995,0.0844437,0.0849038,0.467413,0.08231,0.0805395 +199995,0.168376,0.168555,0.465023,0.164063,0.161374 +399995,0.337191,0.338056,0.466271,0.326683,0.321482 +799995,0.674012,0.675501,0.466002,0.655172,0.643515 +1599995,1.35257,1.34734,0.454468,1.31265,1.28413 +3199995,2.79702,2.69914,0.428434,2.74126,2.67559 +4687495,4.08824,3.9473,0.406664,4.01274,3.92618 +9374995,8.20238,7.89413,0.395046,8.02441,7.7991 +12499995,10.9657,10.5733,0.399946,10.9321,10.4127 +15624995,13.9706,13.2005,0.395117,13.729,12.9928 +18749995,16.7769,15.7094,0.401372,16.721,15.6462 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_flops_smoothed.csv new file mode 100644 index 0000000..d869c1b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_MULTI_REDUCE_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-atomic_direct_256,Base_CUDA-atomic_occgs_256,Base_Seq-default,RAJA_CUDA-atomic_direct_256,RAJA_CUDA-atomic_occgs_256 +99995,0.168376,0.168555,0.466271,0.164063,0.161374 +199995,0.2527835,0.2533055,0.4661365,0.245373,0.24142799999999998 +399995,0.337191,0.338056,0.466002,0.326683,0.321482 +799995,0.674012,0.675501,0.465023,0.655172,0.643515 +1599995,1.35257,1.34734,0.454468,1.31265,1.28413 +3199995,2.79702,2.69914,0.428434,2.74126,2.67559 +4687495,4.08824,3.9473,0.406664,4.01274,3.92618 +9374995,8.20238,7.89413,0.399946,8.02441,7.7991 +12499995,10.9657,10.5733,0.399946,10.9321,10.4127 +15624995,12.46815,11.8869,0.39753150000000004,12.330549999999999,11.70275 +18749995,13.9706,13.2005,0.399946,13.729,12.9928 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_bandwidth_raw.csv new file mode 100644 index 0000000..bafb44c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-blkatm_direct_256,Base_CUDA-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_CUDA-blkatm_direct_256,RAJA_CUDA-blkatm_occgs_256,RAJA_CUDA-blkdev_direct_256,RAJA_CUDA-blkdev_direct_new_256,RAJA_CUDA-blkdev_occgs_256,RAJA_CUDA-blkdev_occgs_new_256 +100000,1.25739,1.26096,6.73416,14.0414,7.0409,1.23939,1.20995,59.1779,49.4085,58.9502,49.4196 +200000,2.51246,2.52978,6.71082,13.8645,7.01505,2.46425,2.39066,103.558,75.9507,102.736,94.4849 +400000,5.07893,5.04064,6.69086,13.9127,7.0069,5.01342,4.79053,145.453,128.384,203.545,184.567 +800000,10.2266,10.0696,6.71957,13.7919,6.97953,10.1306,9.6226,181.31,182.255,401.047,360.348 +1600000,20.7473,20.1229,6.59678,12.3329,6.74481,20.4721,20.222,208.444,226.96,743.831,677.05 +3200000,41.6873,40.3235,5.85546,10.7532,6.05561,41.8405,39.8752,203.23,246.047,1057.18,994.144 +4687500,62.3578,58.8472,5.88288,9.63741,5.76193,62.5251,58.897,199.728,253.014,1333.73,1258.16 +9375000,131.759,117.655,5.67759,9.16486,5.79071,133.842,117.597,194.678,268.242,1828.09,1609.17 +12500000,183.904,156.884,6.60337,9.42505,5.83336,179.502,155.879,193.53,273.398,2031.56,1965.21 +15625000,322.379,309.88,6.57882,9.2715,5.92925,200.018,194.536,192.364,274.404,2183.43,2113.4 +18750000,321.197,351.804,6.59273,9.37161,6.81255,217.55,232.102,192.16,277.96,2229.94,2180.61 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv new file mode 100644 index 0000000..d636801 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-blkatm_direct_256,Base_CUDA-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_CUDA-blkatm_direct_256,RAJA_CUDA-blkatm_occgs_256,RAJA_CUDA-blkdev_direct_256,RAJA_CUDA-blkdev_direct_new_256,RAJA_CUDA-blkdev_occgs_256,RAJA_CUDA-blkdev_occgs_new_256 +100000,2.51246,2.52978,6.71082,13.9127,7.01505,2.46425,2.39066,103.558,75.9507,102.736,94.4849 +200000,3.795695,3.78521,6.715195,13.8886,7.010975,3.738835,3.5905950000000004,124.50550000000001,102.16735,153.1405,139.52595 +400000,5.07893,5.04064,6.71082,13.8645,7.0069,5.01342,4.79053,145.453,128.384,203.545,184.567 +800000,10.2266,10.0696,6.69086,13.7919,6.97953,10.1306,9.6226,181.31,182.255,401.047,360.348 +1600000,20.7473,20.1229,6.59678,12.3329,6.74481,20.4721,20.222,199.728,226.96,743.831,677.05 +3200000,41.6873,40.3235,5.88288,10.7532,6.05561,41.8405,39.8752,199.728,246.047,1057.18,994.144 +4687500,62.3578,58.8472,5.88288,9.63741,5.83336,62.5251,58.897,199.728,253.014,1333.73,1258.16 +9375000,131.759,117.655,5.88288,9.42505,5.83336,133.842,117.597,194.678,268.242,1828.09,1609.17 +12500000,183.904,156.884,6.57882,9.37161,5.83336,179.502,155.879,193.53,273.398,2031.56,1965.21 +15625000,252.5505,233.382,6.585775,9.321555,5.881304999999999,189.76,175.20749999999998,192.947,273.901,2107.495,2039.305 +18750000,321.197,309.88,6.59273,9.37161,5.92925,200.018,194.536,192.364,274.404,2183.43,2113.4 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_flops_raw.csv new file mode 100644 index 0000000..0acfb24 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_flops_raw.csv @@ -0,0 +1,12 @@ +Problem 
size,Base_CUDA-blkatm_direct_256,Base_CUDA-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_CUDA-blkatm_direct_256,RAJA_CUDA-blkatm_occgs_256,RAJA_CUDA-blkdev_direct_256,RAJA_CUDA-blkdev_direct_new_256,RAJA_CUDA-blkdev_occgs_256,RAJA_CUDA-blkdev_occgs_new_256 +100000,0.168766,0.169245,0.903853,1.88462,0.945023,0.166349,0.162398,7.9428,6.63156,7.91224,6.63305 +200000,0.337219,0.339543,0.900716,1.86087,0.941549,0.330747,0.320871,13.8994,10.194,13.789,12.6816 +400000,0.681684,0.676545,0.898034,1.86734,0.940453,0.672891,0.642976,19.5225,17.2315,27.3195,24.7722 +800000,1.3726,1.35152,0.901887,1.85112,0.936778,1.35971,1.29153,24.3351,24.4619,53.8276,48.3652 +1600000,2.78466,2.70085,0.885405,1.65529,0.905274,2.74772,2.71416,27.9768,30.4621,99.8353,90.8721 +3200000,5.59518,5.41213,0.785907,1.44327,0.81277,5.61573,5.35196,27.2771,33.0238,141.892,133.432 +4687500,8.36953,7.89834,0.789586,1.29351,0.773354,8.39197,7.90503,26.8071,33.959,179.011,168.868 +9375000,17.6844,15.7914,0.762034,1.23009,0.777216,17.964,15.7837,26.1292,36.0028,245.362,215.979 +12500000,24.6832,21.0566,0.886289,1.26501,0.782941,24.0924,20.9218,25.9751,36.6949,272.671,263.766 +15625000,43.2689,41.5914,0.882995,1.2444,0.79581,26.846,26.1101,25.8187,36.8299,293.055,283.656 +18750000,43.1103,47.2183,0.884861,1.25784,0.914365,29.1991,31.1522,25.7913,37.3071,299.298,292.677 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_flops_smoothed.csv new file mode 100644 index 0000000..0c80cad --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Basic_REDUCE_STRUCT_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem 
size,Base_CUDA-blkatm_direct_256,Base_CUDA-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_CUDA-blkatm_direct_256,RAJA_CUDA-blkatm_occgs_256,RAJA_CUDA-blkdev_direct_256,RAJA_CUDA-blkdev_direct_new_256,RAJA_CUDA-blkdev_occgs_256,RAJA_CUDA-blkdev_occgs_new_256 +100000,0.337219,0.339543,0.900716,1.86734,0.941549,0.330747,0.320871,13.8994,10.194,13.789,12.6816 +200000,0.5094515,0.5080439999999999,0.9013015,1.864105,0.941001,0.501819,0.4819235,16.71095,13.71275,20.55425,18.7269 +400000,0.681684,0.676545,0.900716,1.86087,0.940453,0.672891,0.642976,19.5225,17.2315,27.3195,24.7722 +800000,1.3726,1.35152,0.898034,1.85112,0.936778,1.35971,1.29153,24.3351,24.4619,53.8276,48.3652 +1600000,2.78466,2.70085,0.885405,1.65529,0.905274,2.74772,2.71416,26.8071,30.4621,99.8353,90.8721 +3200000,5.59518,5.41213,0.789586,1.44327,0.81277,5.61573,5.35196,26.8071,33.0238,141.892,133.432 +4687500,8.36953,7.89834,0.789586,1.29351,0.782941,8.39197,7.90503,26.8071,33.959,179.011,168.868 +9375000,17.6844,15.7914,0.789586,1.26501,0.782941,17.964,15.7837,26.1292,36.0028,245.362,215.979 +12500000,24.6832,21.0566,0.882995,1.25784,0.782941,24.0924,20.9218,25.9751,36.6949,272.671,263.766 +15625000,33.89675,31.323999999999998,0.883928,1.25112,0.7893755,25.4692,23.51595,25.896900000000002,36.7624,282.863,273.711 +18750000,43.1103,41.5914,0.884861,1.25784,0.79581,26.846,26.1101,25.8187,36.8299,293.055,283.656 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv new file mode 100644 index 0000000..ea9c7cb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_1024,Base_Seq-direct,RAJA_CUDA-direct_1024,RAJA_CUDA-funcptr_1024,RAJA_CUDA-virtfunc_1024 +42875,27.8679,37.5249,24.3736,22.4841,22.6106 
+91125,38.7235,35.4562,35.0238,32.7541,32.4712 +205379,51.5063,25.7731,40.2678,43.7553,43.5118 +421875,60.5788,19.5101,58.8854,55.7691,55.5149 +884736,78.1177,15.2354,74.6275,69.6403,70.7258 +1860867,73.5342,14.1839,75.5354,72.6788,72.5391 +2744000,88.3422,13.453,87.001,82.5619,82.1592 +5639752,83.8245,11.488,84.1051,79.0234,78.0234 +7645373,83.5172,11.4005,83.7469,79.2586,78.8235 +9528128,93.1066,10.815,93.3876,87.1422,87.6568 +11543176,83.9146,8.71324,83.4915,78.9519,78.465 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv new file mode 100644 index 0000000..c702c62 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_1024,Base_Seq-direct,RAJA_CUDA-direct_1024,RAJA_CUDA-funcptr_1024,RAJA_CUDA-virtfunc_1024 +42875,38.7235,35.4562,35.0238,32.7541,32.4712 +91125,45.114900000000006,30.61465,37.6458,38.2547,37.9915 +205379,51.5063,25.7731,40.2678,43.7553,43.5118 +421875,60.5788,19.5101,58.8854,55.7691,55.5149 +884736,73.5342,15.2354,74.6275,69.6403,70.7258 +1860867,78.1177,14.1839,75.5354,72.6788,72.5391 +2744000,83.5172,13.453,83.7469,79.0234,78.0234 +5639752,83.8245,11.488,84.1051,79.2586,78.8235 +7645373,83.9146,11.4005,84.1051,79.2586,78.8235 +9528128,83.86955,11.10775,83.92599999999999,79.14099999999999,78.64425 +11543176,83.9146,10.815,83.7469,79.2586,78.8235 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_flops_raw.csv new file mode 100644 index 0000000..f9837e4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_flops_raw.csv @@ -0,0 +1,12 @@ +Problem 
size,Base_CUDA-direct_1024,Base_Seq-direct,RAJA_CUDA-direct_1024,RAJA_CUDA-funcptr_1024,RAJA_CUDA-virtfunc_1024 +42875,0.0,0.0,0.0,0.0,0.0 +91125,0.0,0.0,0.0,0.0,0.0 +205379,0.0,0.0,0.0,0.0,0.0 +421875,0.0,0.0,0.0,0.0,0.0 +884736,0.0,0.0,0.0,0.0,0.0 +1860867,0.0,0.0,0.0,0.0,0.0 +2744000,0.0,0.0,0.0,0.0,0.0 +5639752,0.0,0.0,0.0,0.0,0.0 +7645373,0.0,0.0,0.0,0.0,0.0 +9528128,0.0,0.0,0.0,0.0,0.0 +11543176,0.0,0.0,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_flops_smoothed.csv new file mode 100644 index 0000000..f9837e4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/Comm_HALO_PACKING_FUSED_flops_smoothed.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_1024,Base_Seq-direct,RAJA_CUDA-direct_1024,RAJA_CUDA-funcptr_1024,RAJA_CUDA-virtfunc_1024 +42875,0.0,0.0,0.0,0.0,0.0 +91125,0.0,0.0,0.0,0.0,0.0 +205379,0.0,0.0,0.0,0.0,0.0 +421875,0.0,0.0,0.0,0.0,0.0 +884736,0.0,0.0,0.0,0.0,0.0 +1860867,0.0,0.0,0.0,0.0,0.0 +2744000,0.0,0.0,0.0,0.0,0.0 +5639752,0.0,0.0,0.0,0.0,0.0 +7645373,0.0,0.0,0.0,0.0,0.0 +9528128,0.0,0.0,0.0,0.0,0.0 +11543176,0.0,0.0,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_CONVECTION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_CONVECTION3DPA.csv new file mode 100644 index 0000000..fb97c48 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_CONVECTION3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_CONVECTION3DPA-Base_Seq-default,702.0,16.2141,8.99998 +Apps_CONVECTION3DPA-Base_CUDA-block_64,351216.0,2353.16,1299.59 +Apps_CONVECTION3DPA-RAJA_CUDA-block_64,351216.0,2343.2,1294.09 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_DEL_DOT_VEC_2D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_DEL_DOT_VEC_2D.csv new file mode 100644 index 0000000..9b75eb8 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_DEL_DOT_VEC_2D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DEL_DOT_VEC_2D-Base_Seq-default,841.0,10.3907,9.00417 +Apps_DEL_DOT_VEC_2D-Base_CUDA-block_256,264196.0,2752.57,2284.61 +Apps_DEL_DOT_VEC_2D-RAJA_CUDA-block_256,264196.0,2752.84,2284.84 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_INTSC_HEXHEX.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_INTSC_HEXHEX.csv new file mode 100644 index 0000000..35fc6e9 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_INTSC_HEXHEX.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_INTSC_HEXHEX-Base_Seq-default,27.0,4.59175,0.0989909 +Apps_INTSC_HEXHEX-Base_CUDA-block_64,1728.0,1055.5,22.7549 +Apps_INTSC_HEXHEX-RAJA_CUDA-block_64,1728.0,1054.95,22.7431 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_LTIMES.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_LTIMES.csv new file mode 100644 index 0000000..2a2248d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_LTIMES.csv @@ -0,0 +1,5 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_LTIMES-Base_Seq-default,1344.0,5.10678,7.18731 +Apps_LTIMES-Base_CUDA-block_256,309696.0,642.991,894.303 +Apps_LTIMES-RAJA_CUDA-kernel_256,309696.0,636.478,885.243 +Apps_LTIMES-RAJA_CUDA-launch_256,309696.0,657.487,914.464 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_MASS3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_MASS3DPA.csv new file mode 100644 index 0000000..c4de6ac --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_MASS3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MASS3DPA-Base_Seq-default,1600.0,14.0527,6.5807 +Apps_MASS3DPA-Base_CUDA-block_25,809536.0,3074.41,1432.49 +Apps_MASS3DPA-RAJA_CUDA-block_25,809536.0,3060.07,1425.82 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_MATVEC_3D_STENCIL.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_MATVEC_3D_STENCIL.csv new file mode 100644 index 0000000..4115a60 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Apps_MATVEC_3D_STENCIL.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MATVEC_3D_STENCIL-Base_Seq-default,64.0,5.01708,17.6762 +Apps_MATVEC_3D_STENCIL-Base_CUDA-block_256,79507.0,774.039,1932.98 +Apps_MATVEC_3D_STENCIL-RAJA_CUDA-block_256,157464.0,939.463,2325.58 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_INDEXLIST_3LOOP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_INDEXLIST_3LOOP.csv new file mode 100644 index 0000000..9824743 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_INDEXLIST_3LOOP.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Basic_INDEXLIST_3LOOP-Base_Seq-default,80000.0,0.0,6.21439 +Basic_INDEXLIST_3LOOP-Base_CUDA-block_256,80000.0,0.0,185.245 +Basic_INDEXLIST_3LOOP-RAJA_CUDA-block_256,80000.0,0.0,182.04 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_MULTI_REDUCE.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_MULTI_REDUCE.csv new file mode 100644 index 0000000..8151b8e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_MULTI_REDUCE.csv @@ -0,0 +1,6 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Basic_MULTI_REDUCE-Base_Seq-default,99995.0,0.467413,6.96569 +Basic_MULTI_REDUCE-Base_CUDA-atomic_direct_256,18749995.0,16.7769,249.995 +Basic_MULTI_REDUCE-Base_CUDA-atomic_occgs_256,15624995.0,13.2005,196.703 +Basic_MULTI_REDUCE-RAJA_CUDA-atomic_direct_256,18749995.0,16.721,249.162 +Basic_MULTI_REDUCE-RAJA_CUDA-atomic_occgs_256,15624995.0,12.9928,193.607 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_REDUCE_STRUCT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_REDUCE_STRUCT.csv new file mode 100644 index 0000000..daddffb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Basic_REDUCE_STRUCT.csv @@ -0,0 +1,12 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Basic_REDUCE_STRUCT-Base_Seq-default,100000.0,1.88462,14.0414 +Basic_REDUCE_STRUCT-Base_Seq-kahan,100000.0,0.945023,7.0409 +Basic_REDUCE_STRUCT-Base_Seq-cascade,100000.0,0.903853,6.73416 +Basic_REDUCE_STRUCT-Base_CUDA-blkatm_direct_256,18750000.0,43.1103,321.197 +Basic_REDUCE_STRUCT-Base_CUDA-blkatm_occgs_256,18750000.0,47.2183,351.804 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkatm_direct_256,15625000.0,26.846,200.018 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_direct_256,800000.0,24.3351,181.31 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_direct_new_256,4687500.0,33.959,253.014 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkatm_occgs_256,15625000.0,26.1101,194.536 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_occgs_256,12500000.0,272.671,2031.56 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_occgs_new_256,12500000.0,263.766,1965.21 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Comm_HALO_PACKING_FUSED.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Comm_HALO_PACKING_FUSED.csv new file mode 100644 index 0000000..8b939c5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/Comm_HALO_PACKING_FUSED.csv @@ -0,0 +1,6 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Comm_HALO_PACKING_FUSED-Base_Seq-direct,42875.0,0.0,37.5249 +Comm_HALO_PACKING_FUSED-Base_CUDA-direct_1024,42875.0,0.0,27.8679 +Comm_HALO_PACKING_FUSED-RAJA_CUDA-direct_1024,42875.0,0.0,24.3736 +Comm_HALO_PACKING_FUSED-RAJA_CUDA-funcptr_1024,42875.0,0.0,22.4841 +Comm_HALO_PACKING_FUSED-RAJA_CUDA-virtfunc_1024,42875.0,0.0,22.6106 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/combined_fom.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/combined_fom.csv new file mode 100644 index 0000000..4959099 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/FOM/combined_fom.csv @@ -0,0 +1,44 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_CONVECTION3DPA-Base_CUDA-block_64,351216.0,2353.16,1299.59 +Apps_CONVECTION3DPA-Base_Seq-default,702.0,16.2141,8.99998 +Apps_CONVECTION3DPA-RAJA_CUDA-block_64,351216.0,2343.2,1294.09 +Apps_DEL_DOT_VEC_2D-Base_CUDA-block_256,264196.0,2752.57,2284.61 +Apps_DEL_DOT_VEC_2D-Base_Seq-default,841.0,10.3907,9.00417 +Apps_DEL_DOT_VEC_2D-RAJA_CUDA-block_256,264196.0,2752.84,2284.84 +Apps_INTSC_HEXHEX-Base_CUDA-block_64,1728.0,1055.5,22.7549 +Apps_INTSC_HEXHEX-Base_Seq-default,27.0,4.59175,0.0989909 +Apps_INTSC_HEXHEX-RAJA_CUDA-block_64,1728.0,1054.95,22.7431 +Apps_LTIMES-Base_CUDA-block_256,309696.0,642.991,894.303 +Apps_LTIMES-Base_Seq-default,1344.0,5.10678,7.18731 +Apps_LTIMES-RAJA_CUDA-kernel_256,309696.0,636.478,885.243 +Apps_LTIMES-RAJA_CUDA-launch_256,309696.0,657.487,914.464 +Apps_MASS3DPA-Base_CUDA-block_25,809536.0,3074.41,1432.49 +Apps_MASS3DPA-Base_Seq-default,1600.0,14.0527,6.5807 +Apps_MASS3DPA-RAJA_CUDA-block_25,809536.0,3060.07,1425.82 +Apps_MATVEC_3D_STENCIL-Base_CUDA-block_256,79507.0,774.039,1932.98 +Apps_MATVEC_3D_STENCIL-Base_Seq-default,64.0,5.01708,17.6762 +Apps_MATVEC_3D_STENCIL-RAJA_CUDA-block_256,157464.0,939.463,2325.58 +Basic_INDEXLIST_3LOOP-Base_CUDA-block_256,80000.0,0.0,185.245 +Basic_INDEXLIST_3LOOP-Base_Seq-default,80000.0,0.0,6.21439 +Basic_INDEXLIST_3LOOP-RAJA_CUDA-block_256,80000.0,0.0,182.04 +Basic_MULTI_REDUCE-Base_CUDA-atomic_direct_256,18749995.0,16.7769,249.995 +Basic_MULTI_REDUCE-Base_CUDA-atomic_occgs_256,15624995.0,13.2005,196.703 +Basic_MULTI_REDUCE-Base_Seq-default,99995.0,0.467413,6.96569 +Basic_MULTI_REDUCE-RAJA_CUDA-atomic_direct_256,18749995.0,16.721,249.162 +Basic_MULTI_REDUCE-RAJA_CUDA-atomic_occgs_256,15624995.0,12.9928,193.607 +Basic_REDUCE_STRUCT-Base_CUDA-blkatm_direct_256,18750000.0,43.1103,321.197 +Basic_REDUCE_STRUCT-Base_CUDA-blkatm_occgs_256,18750000.0,47.2183,351.804 +Basic_REDUCE_STRUCT-Base_Seq-cascade,100000.0,0.903853,6.73416 +Basic_REDUCE_STRUCT-Base_Seq-default,100000.0,1.88462,14.0414 
+Basic_REDUCE_STRUCT-Base_Seq-kahan,100000.0,0.945023,7.0409 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkatm_direct_256,15625000.0,26.846,200.018 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkatm_occgs_256,15625000.0,26.1101,194.536 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_direct_256,800000.0,24.3351,181.31 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_direct_new_256,4687500.0,33.959,253.014 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_occgs_256,12500000.0,272.671,2031.56 +Basic_REDUCE_STRUCT-RAJA_CUDA-blkdev_occgs_new_256,12500000.0,263.766,1965.21 +Comm_HALO_PACKING_FUSED-Base_CUDA-direct_1024,42875.0,0.0,27.8679 +Comm_HALO_PACKING_FUSED-Base_Seq-direct,42875.0,0.0,37.5249 +Comm_HALO_PACKING_FUSED-RAJA_CUDA-direct_1024,42875.0,0.0,24.3736 +Comm_HALO_PACKING_FUSED-RAJA_CUDA-funcptr_1024,42875.0,0.0,22.4841 +Comm_HALO_PACKING_FUSED-RAJA_CUDA-virtfunc_1024,42875.0,0.0,22.6106 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/combined_table.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/combined_table.csv new file mode 100644 index 0000000..05d0744 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/combined_table.csv @@ -0,0 +1,474 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning +Apps_CONVECTION3DPA,Base_Seq,default,702, PASSED ,5.90584e-06,8.99998,16.2141,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,702, PASSED ,4.0634e-06,13.0808,23.566,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,702, PASSED 
,4.12986e-06,12.8703,23.1867,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,702459, PASSED ,0.00632911,8.36122,15.1397,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,702459, PASSED ,3.85625e-05,1372.29,2484.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,702459, PASSED ,3.97062e-05,1332.77,2413.24,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,87804, PASSED ,0.000769192,8.59976,15.571,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,87804, PASSED ,7.32564e-06,902.974,1634.96,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,87804, PASSED ,7.81286e-06,846.664,1533.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,1028970, PASSED ,0.0111434,6.95626,12.5957,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,1028970, PASSED 
,5.42286e-05,1429.44,2588.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,1028970, PASSED ,5.58236e-05,1388.59,2514.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,10989, PASSED ,8.42174e-05,9.833,17.799,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,10989, PASSED ,4.23404e-06,195.584,354.031,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,10989, PASSED ,4.22994e-06,195.773,354.374,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,175608, PASSED ,0.00140646,9.40624,17.0316,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,175608, PASSED ,1.16063e-05,1139.85,2063.9,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,175608, PASSED ,1.17986e-05,1121.27,2030.26,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,2057940, PASSED 
,0.0230145,6.7363,12.1975,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,2057940, PASSED ,0.000102527,1512.12,2738.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,2057940, PASSED ,0.000105465,1470.0,2661.73,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,21951, PASSED ,0.000170701,9.68897,17.5411,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,21951, PASSED ,4.68898e-06,352.724,638.578,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,21951, PASSED ,4.68604e-06,352.946,638.979,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,2754, PASSED ,2.16801e-05,9.58193,17.3277,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,2754, PASSED ,4.07304e-06,51.003,92.2323,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,2754, PASSED 
,4.12906e-06,50.311,90.981,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,351216, PASSED ,0.00295484,8.95436,16.2136,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,351216, PASSED ,2.03592e-05,1299.59,2353.16,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,351216, PASSED ,2.04458e-05,1294.09,2343.2,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,43902, PASSED ,0.000357982,9.23949,16.7287,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_CUDA,block_64,43902, PASSED ,5.69318e-06,580.97,1051.88,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,43902, PASSED ,5.61292e-06,589.277,1066.92,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,841, PASSED ,4.37064e-06,9.00417,10.3907,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,841, PASSED 
,2.78384e-06,14.1366,16.3134,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,841, PASSED ,2.79968e-06,14.0566,16.2211,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1060900, PASSED ,0.00639,7.43151,8.96536,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,1060900, PASSED ,2.16115e-05,2197.32,2650.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,1060900, PASSED ,2.16106e-05,2197.41,2650.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,131044, PASSED ,0.000658839,8.92438,10.7407,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,131044, PASSED ,4.05538e-06,1449.86,1744.94,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,131044, PASSED ,4.03137e-06,1458.49,1755.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1555009, PASSED 
,0.00972127,7.15839,8.63781,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,1555009, PASSED ,3.0096e-05,2312.22,2790.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,1555009, PASSED ,3.0066e-05,2314.53,2792.87,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,15876, PASSED ,8.18091e-05,8.7674,10.4793,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,15876, PASSED ,2.84052e-06,252.507,301.812,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,15876, PASSED ,2.81695e-06,254.62,304.338,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,264196, PASSED ,0.00140043,8.45538,10.1873,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,264196, PASSED ,5.183e-06,2284.61,2752.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,264196, PASSED 
,5.18249e-06,2284.84,2752.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3115225, PASSED ,0.0195063,7.14469,8.62398,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,3115225, PASSED ,5.68055e-05,2453.4,2961.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,3115225, PASSED ,5.67381e-05,2456.31,2964.89,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,32400, PASSED ,0.000166317,8.77331,10.5197,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,32400, PASSED ,2.99451e-06,487.276,584.269,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,32400, PASSED ,3.01031e-06,484.718,581.203,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3844, PASSED ,1.97927e-05,8.87021,10.4875,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,3844, PASSED 
,2.80222e-06,62.6523,74.0756,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,3844, PASSED ,2.80417e-06,62.6087,74.024,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,528529, PASSED ,0.00290632,8.14447,9.82016,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,528529, PASSED ,8.60536e-06,2750.66,3316.6,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,528529, PASSED ,8.56361e-06,2764.07,3332.77,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,65025, PASSED ,0.000345132,8.46653,10.1739,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,65025, PASSED ,3.35478e-06,871.018,1046.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,65025, PASSED ,3.31757e-06,880.787,1058.41,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,1860867, PASSED 
,0.000726923,14.1839,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,1860867, PASSED ,0.000140216,73.5342,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,1860867, PASSED ,0.000136501,75.5354,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,1860867, PASSED ,0.000141866,72.6788,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,1860867, PASSED ,0.000142139,72.5391,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,205379, PASSED ,9.36717e-05,25.7731,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,205379, PASSED ,4.68721e-05,51.5063,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,205379, PASSED ,5.99539e-05,40.2678,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,205379, PASSED 
,5.51753e-05,43.7553,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,205379, PASSED ,5.54841e-05,43.5118,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,2744000, PASSED ,0.000990967,13.453,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,2744000, PASSED ,0.000150907,88.3422,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,2744000, PASSED ,0.000153234,87.001,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,2744000, PASSED ,0.000161472,82.5619,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,2744000, PASSED ,0.000162264,82.1592,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,421875, PASSED ,0.000198529,19.5101,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,421875, PASSED 
,6.39387e-05,60.5788,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,421875, PASSED ,6.57775e-05,58.8854,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,421875, PASSED ,6.9453e-05,55.7691,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,421875, PASSED ,6.9771e-05,55.5149,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,5639752, PASSED ,0.00187025,11.488,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,5639752, PASSED ,0.000256314,83.8245,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,5639752, PASSED ,0.000255459,84.1051,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,5639752, PASSED ,0.000271886,79.0234,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,5639752, PASSED 
,0.000275371,78.0234,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,42875, PASSED ,2.31649e-05,37.5249,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,42875, PASSED ,3.11922e-05,27.8679,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,42875, PASSED ,3.5664e-05,24.3736,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,42875, PASSED ,3.86611e-05,22.4841,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,42875, PASSED ,3.84447e-05,22.6106,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,7645373, PASSED ,0.00230591,11.4005,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,7645373, PASSED ,0.000314768,83.5172,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,7645373, PASSED 
,0.000313905,83.7469,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,7645373, PASSED ,0.000331681,79.2586,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,7645373, PASSED ,0.000333512,78.8235,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,9528128, PASSED ,0.00281299,10.815,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,9528128, PASSED ,0.000326749,93.1066,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,9528128, PASSED ,0.000325766,93.3876,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,9528128, PASSED ,0.000349113,87.1422,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,9528128, PASSED ,0.000347064,87.6568,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,884736, PASSED 
,0.000414132,15.2354,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,884736, PASSED ,8.07685e-05,78.1177,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,884736, PASSED ,8.45459e-05,74.6275,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,884736, PASSED ,9.06005e-05,69.6403,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,884736, PASSED ,8.921e-05,70.7258,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,11543176, PASSED ,0.00396559,8.71324,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,11543176, PASSED ,0.000411765,83.9146,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,11543176, PASSED ,0.000413852,83.4915,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,11543176, PASSED 
,0.000437648,78.9519,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,11543176, PASSED ,0.000440363,78.465,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,91125, PASSED ,4.00244e-05,35.4562,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,91125, PASSED ,3.66473e-05,38.7235,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,91125, PASSED ,4.05186e-05,35.0238,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,91125, PASSED ,4.33263e-05,32.7541,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,91125, PASSED ,4.37038e-05,32.4712,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024 +Basic_INDEXLIST_3LOOP,Base_Seq,default,2560000, PASSED ,0.0142187,7.04253,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,2560000, PASSED 
,4.70973e-05,2126.15,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,2560000, PASSED ,4.73377e-05,2115.35,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,320000, PASSED ,0.00157409,7.95189,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,320000, PASSED ,1.96111e-05,638.26,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,320000, PASSED ,1.99029e-05,628.902,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,3750000, PASSED ,0.0221413,6.62487,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,3750000, PASSED ,6.70109e-05,2188.95,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,3750000, PASSED ,6.69042e-05,2192.44,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,640000, PASSED 
,0.00313502,7.98527,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,640000, PASSED ,2.24732e-05,1113.95,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,640000, PASSED ,2.25615e-05,1109.59,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,7500000, PASSED ,0.0450929,6.50583,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,7500000, PASSED ,0.000138663,2115.68,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,7500000, PASSED ,0.0001388,2113.59,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,80000, PASSED ,0.000503552,6.21439,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,80000, PASSED ,1.68926e-05,185.245,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,80000, PASSED 
,1.719e-05,182.04,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,10000000, PASSED ,0.0600533,6.51347,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,10000000, PASSED ,0.000178458,2191.86,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,10000000, PASSED ,0.000178382,2192.79,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,12500000, PASSED ,0.0741771,6.59158,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,12500000, PASSED ,0.000218329,2239.48,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,12500000, PASSED ,0.000218386,2238.9,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,1280000, PASSED ,0.00646864,7.7401,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,1280000, PASSED 
,2.78398e-05,1798.43,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,1280000, PASSED ,2.79157e-05,1793.54,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,15000000, PASSED ,0.0894248,6.56119,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,15000000, PASSED ,0.000258931,2265.99,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,15000000, PASSED ,0.000259391,2261.96,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,160000, PASSED ,0.000775334,8.07202,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,160000, PASSED ,1.81087e-05,345.609,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,160000, PASSED ,1.80533e-05,346.669,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_INTSC_HEXHEX,Base_Seq,default,27, PASSED 
,0.00113801,0.0989909,4.59175,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,27, PASSED ,3.0517e-05,3.69148,171.232,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,27, PASSED ,3.0991e-05,3.63502,168.613,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,13824, PASSED ,0.573433,0.100584,4.66566,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,13824, PASSED ,0.00229436,25.1391,1166.1,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,13824, PASSED ,0.00229631,25.1178,1165.1,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,1728, PASSED ,0.0716637,0.100606,4.66666,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,1728, PASSED ,0.000316845,22.7549,1055.5,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,1728, PASSED ,0.000317009,22.7431,1054.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 
+Apps_INTSC_HEXHEX,Base_Seq,default,19683, PASSED ,0.817182,0.100496,4.66159,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,19683, PASSED ,0.00325913,25.1981,1168.83,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,19683, PASSED ,0.00325845,25.2033,1169.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,216, PASSED ,0.00898769,0.100273,4.65123,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,216, PASSED ,6.743e-05,13.3653,619.958,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,216, PASSED ,6.6808e-05,13.4897,625.73,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,3375, PASSED ,0.139883,0.100667,4.66949,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,3375, PASSED ,0.000586234,24.0204,1114.2,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,3375, PASSED 
,0.000588246,23.9383,1110.39,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,39304, PASSED ,1.62818,0.100719,4.67192,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,39304, PASSED ,0.00648117,25.3024,1173.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,39304, PASSED ,0.00647179,25.3391,1175.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,512, PASSED ,0.021226,0.100642,4.66836,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,512, PASSED ,0.000116043,18.409,853.911,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,512, PASSED ,0.000117722,18.1464,841.732,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,64, PASSED ,0.00267651,0.0997673,4.62777,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,64, PASSED ,4.2192e-05,6.3289,293.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64 
+Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,64, PASSED ,3.7891e-05,7.04729,326.893,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,6859, PASSED ,0.284349,0.100644,4.66843,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,6859, PASSED ,0.0011558,24.7604,1148.53,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,6859, PASSED ,0.00115578,24.7607,1148.54,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,1000, PASSED ,0.0414815,0.100583,4.66559,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_CUDA,block_64,1000, PASSED ,0.000194956,21.4014,992.716,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,1000, PASSED ,0.000198316,21.0388,975.897,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64 +Apps_LTIMES,Base_Seq,default,1344, PASSED ,1.3159e-05,7.18731,5.10678,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,1344, PASSED ,3.35502e-06,28.1899,20.0297,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 
+Apps_LTIMES,RAJA_CUDA,kernel_256,1344, PASSED ,3.42376e-06,27.6239,19.6275,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,1344, PASSED ,3.43504e-06,27.5332,19.5631,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,1238784, PASSED ,0.0121454,7.0928,5.09983,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,1238784, PASSED ,9.03716e-05,953.226,685.383,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,1238784, PASSED ,9.27542e-05,928.741,667.778,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,1238784, PASSED ,9.18566e-05,937.816,674.303,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,154944, PASSED ,0.00153302,7.02907,5.05354,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,154944, PASSED ,1.39367e-05,773.189,555.883,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,154944, PASSED ,1.41069e-05,763.865,549.18,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 
+Apps_LTIMES,RAJA_CUDA,launch_256,154944, PASSED ,1.3749e-05,783.746,563.474,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,1814592, PASSED ,0.0199534,6.32401,4.54707,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,1814592, PASSED ,0.000130216,969.049,696.763,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,1814592, PASSED ,0.000133785,943.198,678.176,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,1814592, PASSED ,0.000132435,952.809,685.086,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,19392, PASSED ,0.000189961,7.10468,5.1042,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,19392, PASSED ,4.30516e-06,313.487,225.218,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,19392, PASSED ,4.53638e-06,297.509,213.739,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,19392, PASSED ,4.44682e-06,303.501,218.043,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 
+Apps_LTIMES,Base_Seq,default,309696, PASSED ,0.00308182,6.9884,5.02456,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,309696, PASSED ,2.40824e-05,894.303,642.991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,309696, PASSED ,2.43289e-05,885.243,636.478,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,309696, PASSED ,2.35515e-05,914.464,657.487,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,3629184, PASSED ,0.0404164,6.24426,4.48975,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,3629184, PASSED ,0.00025547,987.865,710.295,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,3629184, PASSED ,0.000262508,961.381,691.252,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,3629184, PASSED ,0.000259693,971.802,698.745,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,38784, PASSED ,0.000379928,7.10163,5.10412,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,38784, 
PASSED ,6.0753e-06,444.111,319.194,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,38784, PASSED ,6.32362e-06,426.672,306.66,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,38784, PASSED ,6.05992e-06,445.238,320.004,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,4992, PASSED ,4.904e-05,7.10145,5.08973,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,4992, PASSED ,3.39278e-06,102.646,73.568,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,4992, PASSED ,3.55478e-06,97.9681,70.2153,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,4992, PASSED ,3.42678e-06,101.627,72.8381,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,619392, PASSED ,0.00627232,6.86713,4.9375,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,619392, PASSED ,4.45587e-05,966.655,695.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,619392, PASSED 
,4.48525e-05,960.322,690.477,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,619392, PASSED ,4.32649e-05,995.561,715.813,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_LTIMES,Base_Seq,default,77568, PASSED ,0.000758563,7.11226,5.11283,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_CUDA,block_256,77568, PASSED ,8.50688e-06,634.204,455.913,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_LTIMES,RAJA_CUDA,kernel_256,77568, PASSED ,8.69284e-06,620.637,446.16,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256 +Apps_LTIMES,RAJA_CUDA,launch_256,77568, PASSED ,8.73622e-06,617.555,443.945,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256 +Apps_MASS3DPA,Base_Seq,default,1600, PASSED ,9.01786e-06,6.5807,14.0527,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,1600, PASSED ,3.8825e-06,15.285,32.6401,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,1600, PASSED ,3.87526e-06,15.3135,32.701,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,1619008, PASSED 
,0.0092196,6.4805,13.9085,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,1619008, PASSED ,4.01159e-05,1489.37,3196.5,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,1619008, PASSED ,4.03963e-05,1479.04,3174.31,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,202368, PASSED ,0.00108462,6.88576,14.7777,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,202368, PASSED ,7.22326e-06,1033.94,2218.97,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,202368, PASSED ,7.23264e-06,1032.6,2216.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,2371584, PASSED ,0.0150102,5.83072,12.5139,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,2371584, PASSED ,5.66451e-05,1545.07,3316.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,2371584, PASSED ,5.69624e-05,1536.46,3297.56,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,25344, PASSED 
,0.000133332,7.01696,15.0551,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,25344, PASSED ,3.95496e-06,236.56,507.546,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,25344, PASSED ,3.95342e-06,236.652,507.744,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,404736, PASSED ,0.00220323,6.77938,14.5497,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,404736, PASSED ,1.17549e-05,1270.66,2727.06,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,404736, PASSED ,1.18154e-05,1264.16,2713.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,4743104, PASSED ,0.0306498,5.71091,12.2568,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,4743104, PASSED ,0.000108962,1606.41,3447.69,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,4743104, PASSED ,0.000109434,1599.49,3432.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,50624, PASSED 
,0.000266148,7.02056,15.0652,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,50624, PASSED ,4.42372e-06,422.384,906.382,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,50624, PASSED ,4.4197e-06,422.768,907.206,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,6336, PASSED ,3.36787e-05,6.95157,14.9006,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,6336, PASSED ,3.80682e-06,61.5,131.824,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,6336, PASSED ,3.83872e-06,60.989,130.729,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,809536, PASSED ,0.00435007,6.86773,14.7395,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,809536, PASSED ,2.08553e-05,1432.49,3074.41,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,809536, PASSED ,2.0953e-05,1425.82,3060.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MASS3DPA,Base_Seq,default,101184, PASSED 
,0.000546671,6.83109,14.6598,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_CUDA,block_25,101184, PASSED ,5.59842e-06,667.038,1431.49,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_25 +Apps_MASS3DPA,RAJA_CUDA,block_25,101184, PASSED ,5.59088e-06,667.937,1433.42,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,64, PASSED ,6.7609e-07,17.6762,5.01708,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,64, PASSED ,3.27675e-06,3.64713,1.03517,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,64, PASSED ,2.72157e-06,4.39112,1.24634,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,328509, PASSED ,0.0034469,12.4101,5.05119,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,328509, PASSED ,2.0792e-05,2057.35,837.387,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,328509, PASSED 
,2.02879e-05,2108.48,858.197,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,35937, PASSED ,0.00039324,12.2524,4.84351,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,35937, PASSED ,4.41338e-06,1091.71,431.565,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,35937, PASSED ,4.38632e-06,1098.45,434.228,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,493039, PASSED ,0.00517185,12.3707,5.05256,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,493039, PASSED ,3.34798e-05,1910.98,780.501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,493039, PASSED ,2.89009e-05,2213.75,904.162,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,3375, PASSED ,3.39342e-05,14.2103,5.27123,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,3375, PASSED 
,3.62645e-06,132.972,49.3251,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,3375, PASSED ,3.40138e-06,141.771,52.5889,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,79507, PASSED ,0.000872998,12.054,4.82689,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,79507, PASSED ,5.444e-06,1932.98,774.039,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,79507, PASSED ,5.60469e-06,1877.56,751.847,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1000000, PASSED ,0.010583,12.2002,5.00806,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,1000000, PASSED ,6.10129e-05,2116.18,868.668,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,1000000, PASSED ,5.34032e-05,2417.72,992.449,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,8000, PASSED 
,8.12208e-05,13.6766,5.22034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,8000, PASSED ,3.63063e-06,305.958,116.784,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,8000, PASSED ,3.42591e-06,324.241,123.763,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,512, PASSED ,5.1277e-06,15.6634,5.29204,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,512, PASSED ,3.58285e-06,22.4171,7.57386,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,512, PASSED ,3.379e-06,23.7695,8.03078,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,157464, PASSED ,0.00164964,12.5233,5.05904,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,157464, PASSED ,7.88336e-06,2620.58,1058.63,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,157464, PASSED 
,8.88336e-06,2325.58,939.463,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,17576, PASSED ,0.000192261,12.4379,4.84513,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,17576, PASSED ,3.6985e-06,646.562,251.866,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,17576, PASSED ,3.47343e-06,688.457,268.187,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256 +Basic_MULTI_REDUCE,Base_Seq,default,3199995, PASSED ,0.00746905,6.38419,0.428434,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,3199995, PASSED ,0.00114407,41.679,2.79702,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,3199995, PASSED ,0.00118556,40.2205,2.69914,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,3199995, PASSED ,0.00116734,40.8481,2.74126,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,3199995, PASSED 
,0.001196,39.8695,2.67559,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,399995, PASSED ,0.000857859,6.94815,0.466271,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,399995, PASSED ,0.00118626,5.02467,0.337191,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,399995, PASSED ,0.00118322,5.03756,0.338056,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,399995, PASSED ,0.00122441,4.86807,0.326683,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,399995, PASSED ,0.00124422,4.79058,0.321482,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,4687495, PASSED ,0.0115267,6.05978,0.406664,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,4687495, PASSED ,0.00114658,60.9197,4.08824,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,4687495, PASSED 
,0.00118752,58.8195,3.9473,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,4687495, PASSED ,0.00116815,59.7946,4.01274,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,4687495, PASSED ,0.00119391,58.5048,3.92618,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,799995, PASSED ,0.00171672,6.94406,0.466002,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,799995, PASSED ,0.00118691,10.0437,0.674012,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,799995, PASSED ,0.0011843,10.0659,0.675501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,799995, PASSED ,0.00122105,9.76294,0.655172,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,799995, PASSED ,0.00124317,9.58923,0.643515,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,9374995, PASSED 
,0.0237314,5.88666,0.395046,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,9374995, PASSED ,0.00114296,122.225,8.20238,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,9374995, PASSED ,0.00118759,117.632,7.89413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,9374995, PASSED ,0.00116831,119.573,8.02441,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,9374995, PASSED ,0.00120206,116.216,7.7991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,99995, PASSED ,0.000213933,6.96569,0.467413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,99995, PASSED ,0.00118416,1.25844,0.0844437,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,99995, PASSED ,0.00117775,1.26529,0.0849038,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,99995, PASSED 
,0.00121486,1.22664,0.08231,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,99995, PASSED ,0.00124156,1.20025,0.0805395,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,12499995, PASSED ,0.0312542,5.95966,0.399946,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,12499995, PASSED ,0.00113992,163.402,10.9657,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,12499995, PASSED ,0.00118223,157.554,10.5733,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,12499995, PASSED ,0.00114342,162.901,10.9321,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,12499995, PASSED ,0.00120046,155.161,10.4127,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,15624995, PASSED ,0.0395453,5.8877,0.395117,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,15624995, PASSED 
,0.00111842,208.178,13.9706,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,15624995, PASSED ,0.00118367,196.703,13.2005,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,15624995, PASSED ,0.0011381,204.578,13.729,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,15624995, PASSED ,0.00120259,193.607,12.9928,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,1599995, PASSED ,0.00352059,6.77215,0.454468,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,1599995, PASSED ,0.00118293,20.155,1.35257,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,1599995, PASSED ,0.00118752,20.0771,1.34734,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,1599995, PASSED ,0.0012189,19.5602,1.31265,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,1599995, PASSED 
,0.00124597,19.1352,1.28413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,18749995, PASSED ,0.0467148,5.98091,0.401372,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,18749995, PASSED ,0.00111761,249.995,16.7769,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,18749995, PASSED ,0.00119355,234.088,15.7094,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,18749995, PASSED ,0.00112135,249.162,16.721,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,18749995, PASSED ,0.00119838,233.146,15.6462,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,199995, PASSED ,0.000430075,6.92973,0.465023,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,199995, PASSED ,0.00118779,2.50913,0.168376,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,199995, PASSED 
,0.00118653,2.51178,0.168555,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,199995, PASSED ,0.00121902,2.44485,0.164063,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,199995, PASSED ,0.00123932,2.40478,0.161374,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256 +Basic_REDUCE_STRUCT,Base_Seq,default,3200000, PASSED ,0.00443437,10.7532,1.44327,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,3200000, PASSED ,0.0078743,6.05561,0.81277,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,3200000, PASSED ,0.00814346,5.85546,0.785907,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,3200000, PASSED ,0.00114384,41.6873,5.59518,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,3200000, PASSED ,0.00118253,40.3235,5.41213,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,3200000, PASSED 
,0.00113966,41.8405,5.61573,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,3200000, PASSED ,0.000234629,203.23,27.2771,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,3200000, PASSED ,0.000193799,246.047,33.0238,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,3200000, PASSED ,0.00119582,39.8752,5.35196,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,3200000, PASSED ,4.51046e-05,1057.18,141.892,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,3200000, PASSED ,4.79646e-05,994.144,133.432,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,400000, PASSED ,0.000428418,13.9127,1.86734,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,400000, PASSED ,0.000850656,7.0069,0.940453,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,400000, PASSED 
,0.000890837,6.69086,0.898034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,400000, PASSED ,0.00117357,5.07893,0.681684,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,400000, PASSED ,0.00118248,5.04064,0.676545,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,400000, PASSED ,0.0011889,5.01342,0.672891,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,400000, PASSED ,4.09785e-05,145.453,19.5225,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,400000, PASSED ,4.64267e-05,128.384,17.2315,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,400000, PASSED ,0.00124422,4.79053,0.642976,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,400000, PASSED ,2.92832e-05,203.545,27.3195,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,400000, PASSED 
,3.22944e-05,184.567,24.7722,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,4687500, PASSED ,0.00724771,9.63741,1.29351,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,4687500, PASSED ,0.0121225,5.76193,0.773354,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,4687500, PASSED ,0.0118733,5.88288,0.789586,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,4687500, PASSED ,0.00112014,62.3578,8.36953,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,4687500, PASSED ,0.00118696,58.8472,7.89834,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,4687500, PASSED ,0.00111714,62.5251,8.39197,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,4687500, PASSED ,0.000349721,199.728,26.8071,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,4687500, PASSED 
,0.000276069,253.014,33.959,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,4687500, PASSED ,0.00118595,58.897,7.90503,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,4687500, PASSED ,5.23711e-05,1333.73,179.011,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,4687500, PASSED ,5.55167e-05,1258.16,168.868,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,800000, PASSED ,0.000864342,13.7919,1.85112,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,800000, PASSED ,0.00170798,6.97953,0.936778,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,800000, PASSED ,0.00177406,6.71957,0.901887,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,800000, PASSED ,0.00116567,10.2266,1.3726,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,800000, PASSED 
,0.00118385,10.0696,1.35152,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,800000, PASSED ,0.00117672,10.1306,1.35971,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,800000, PASSED ,6.57488e-05,181.31,24.3351,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,800000, PASSED ,6.5408e-05,182.255,24.4619,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,800000, PASSED ,0.00123885,9.6226,1.29153,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,800000, PASSED ,2.97245e-05,401.047,53.8276,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,800000, PASSED ,3.30817e-05,360.348,48.3652,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,9375000, PASSED ,0.0152428,9.16486,1.23009,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,9375000, PASSED 
,0.0241246,5.79071,0.777216,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,9375000, PASSED ,0.0246052,5.67759,0.762034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,9375000, PASSED ,0.00106026,131.759,17.6844,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,9375000, PASSED ,0.00118735,117.655,15.7914,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,9375000, PASSED ,0.00104376,133.842,17.964,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,9375000, PASSED ,0.000717588,194.678,26.1292,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,9375000, PASSED ,0.000520792,268.242,36.0028,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,9375000, PASSED ,0.00118794,117.597,15.7837,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,9375000, PASSED 
,7.64178e-05,1828.09,245.362,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,9375000, PASSED ,8.6814e-05,1609.17,215.979,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,100000, PASSED ,0.000106123,14.0414,1.88462,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,100000, PASSED ,0.000211637,7.0409,0.945023,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,100000, PASSED ,0.000221277,6.73416,0.903853,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,100000, PASSED ,0.00118509,1.25739,0.168766,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,100000, PASSED ,0.00118173,1.26096,0.169245,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,100000, PASSED ,0.0012023,1.23939,0.166349,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,100000, PASSED 
,2.51803e-05,59.1779,7.9428,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,100000, PASSED ,3.01591e-05,49.4085,6.63156,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,100000, PASSED ,0.00123155,1.20995,0.162398,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,100000, PASSED ,2.52775e-05,58.9502,7.91224,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,100000, PASSED ,3.01523e-05,49.4196,6.63305,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,12500000, PASSED ,0.0197627,9.42505,1.26501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,12500000, PASSED ,0.0319309,5.83336,0.782941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,12500000, PASSED ,0.0282075,6.60337,0.886289,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,12500000, PASSED 
,0.00101283,183.904,24.6832,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,12500000, PASSED ,0.00118728,156.884,21.0566,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,12500000, PASSED ,0.00103767,179.502,24.0924,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,12500000, PASSED ,0.000962459,193.53,25.9751,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,12500000, PASSED ,0.000681294,273.398,36.6949,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,12500000, PASSED ,0.00119493,155.879,20.9218,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,12500000, PASSED ,9.16856e-05,2031.56,272.671,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,12500000, PASSED ,9.47808e-05,1965.21,263.766,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 
+Basic_REDUCE_STRUCT,Base_Seq,default,15625000, PASSED ,0.0251125,9.2715,1.2444,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,15625000, PASSED ,0.0392682,5.92925,0.79581,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,15625000, PASSED ,0.0353909,6.57882,0.882995,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,15625000, PASSED ,0.000722227,322.379,43.2689,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,15625000, PASSED ,0.000751357,309.88,41.5914,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,15625000, PASSED ,0.00116405,200.018,26.846,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,15625000, PASSED ,0.00121036,192.364,25.8187,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,15625000, PASSED ,0.000848496,274.404,36.8299,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 
+Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,15625000, PASSED ,0.00119685,194.536,26.1101,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,15625000, PASSED ,0.000106635,2183.43,293.055,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,15625000, PASSED ,0.000110169,2113.4,283.656,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,1600000, PASSED ,0.0019332,12.3329,1.65529,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,1600000, PASSED ,0.00353484,6.74481,0.905274,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,1600000, PASSED ,0.00361417,6.59678,0.885405,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,1600000, PASSED ,0.00114916,20.7473,2.78466,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,1600000, PASSED ,0.00118481,20.1229,2.70085,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,1600000, PASSED 
,0.0011646,20.4721,2.74772,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,1600000, PASSED ,0.00011438,208.444,27.9768,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,1600000, PASSED ,0.000105049,226.96,30.4621,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,1600000, PASSED ,0.001179,20.222,2.71416,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,1600000, PASSED ,3.20528e-05,743.831,99.8353,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,1600000, PASSED ,3.52143e-05,677.05,90.8721,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,18750000, PASSED ,0.0298131,9.37161,1.25784,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,18750000, PASSED ,0.0410121,6.81255,0.914365,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,18750000, PASSED 
,0.0423796,6.59273,0.884861,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,18750000, PASSED ,0.000869862,321.197,43.1103,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,18750000, PASSED ,0.000794184,351.804,47.2183,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,18750000, PASSED ,0.00128429,217.55,29.1991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,18750000, PASSED ,0.00145398,192.16,25.7913,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,18750000, PASSED ,0.00100517,277.96,37.3071,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,18750000, PASSED ,0.00120377,232.102,31.1522,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,18750000, PASSED ,0.000125293,2229.94,299.298,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 
+Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,18750000, PASSED ,0.000128128,2180.61,292.677,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,200000, PASSED ,0.000214954,13.8645,1.86087,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,200000, PASSED ,0.000424834,7.01505,0.941549,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,200000, PASSED ,0.000444093,6.71082,0.900716,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,200000, PASSED ,0.00118618,2.51246,0.337219,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,200000, PASSED ,0.00117806,2.52978,0.339543,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,200000, PASSED ,0.00120939,2.46425,0.330747,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,200000, PASSED ,2.87783e-05,103.558,13.8994,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,200000, PASSED 
,3.9239e-05,75.9507,10.194,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,200000, PASSED ,0.00124661,2.39066,0.320871,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,200000, PASSED ,2.90087e-05,102.736,13.789,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,200000, PASSED ,3.15419e-05,94.4849,12.6816,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_CONVECTION3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_CONVECTION3DPA_bandwidth.png new file mode 100644 index 0000000..94eb136 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_CONVECTION3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_CONVECTION3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_CONVECTION3DPA_flops.png new file mode 100644 index 0000000..45b86da Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_CONVECTION3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png new file mode 100644 index 0000000..0172c27 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_DEL_DOT_VEC_2D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_DEL_DOT_VEC_2D_flops.png new file mode 100644 index 0000000..6a202f5 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_DEL_DOT_VEC_2D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_INTSC_HEXHEX_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_INTSC_HEXHEX_bandwidth.png new file mode 100644 index 0000000..fd54116 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_INTSC_HEXHEX_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_INTSC_HEXHEX_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_INTSC_HEXHEX_flops.png new file mode 100644 index 0000000..fa1fb46 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_INTSC_HEXHEX_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_LTIMES_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_LTIMES_bandwidth.png new file mode 100644 index 0000000..49049d4 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_LTIMES_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_LTIMES_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_LTIMES_flops.png new file mode 100644 index 0000000..29ffa06 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_LTIMES_flops.png differ diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MASS3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MASS3DPA_bandwidth.png new file mode 100644 index 0000000..f97d37b Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MASS3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MASS3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MASS3DPA_flops.png new file mode 100644 index 0000000..00e570c Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MASS3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png new file mode 100644 index 0000000..a441b9a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MATVEC_3D_STENCIL_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MATVEC_3D_STENCIL_flops.png new file mode 100644 index 0000000..f189265 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Apps_MATVEC_3D_STENCIL_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_INDEXLIST_3LOOP_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_INDEXLIST_3LOOP_bandwidth.png new file mode 100644 index 0000000..8740483 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_INDEXLIST_3LOOP_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_INDEXLIST_3LOOP_flops.png 
b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_INDEXLIST_3LOOP_flops.png new file mode 100644 index 0000000..45f3d8d Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_INDEXLIST_3LOOP_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_MULTI_REDUCE_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_MULTI_REDUCE_bandwidth.png new file mode 100644 index 0000000..555e591 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_MULTI_REDUCE_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_MULTI_REDUCE_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_MULTI_REDUCE_flops.png new file mode 100644 index 0000000..c14b0bc Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_MULTI_REDUCE_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_REDUCE_STRUCT_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_REDUCE_STRUCT_bandwidth.png new file mode 100644 index 0000000..285b4c6 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_REDUCE_STRUCT_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_REDUCE_STRUCT_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_REDUCE_STRUCT_flops.png new file mode 100644 index 0000000..3004494 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Basic_REDUCE_STRUCT_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Comm_HALO_PACKING_FUSED_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Comm_HALO_PACKING_FUSED_bandwidth.png new file 
mode 100644 index 0000000..c3ceb9f Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Comm_HALO_PACKING_FUSED_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Comm_HALO_PACKING_FUSED_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Comm_HALO_PACKING_FUSED_flops.png new file mode 100644 index 0000000..d45754c Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/figures/Comm_HALO_PACKING_FUSED_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/output_with_variant_tuning.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/output_with_variant_tuning.csv new file mode 100644 index 0000000..96e0a0a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/output_with_variant_tuning.csv @@ -0,0 +1,474 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning,Smoothed Mean flops (gigaFLOP per sec.),Smoothed Bandwidth (GiB per sec.) 
+Apps_CONVECTION3DPA,Base_Seq,default,702, PASSED ,5.90584e-06,8.99998,16.2141,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,17.3277,9.58193 +Apps_CONVECTION3DPA,Base_CUDA,block_64,702, PASSED ,4.0634e-06,13.0808,23.566,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64,92.2323,51.003 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,702, PASSED ,4.12986e-06,12.8703,23.1867,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,90.981,50.311 +Apps_CONVECTION3DPA,Base_Seq,default,702459, PASSED ,0.00632911,8.36122,15.1397,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,15.1397,8.36122 +Apps_CONVECTION3DPA,Base_CUDA,block_64,702459, PASSED ,3.85625e-05,1372.29,2484.81,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2484.81,1372.29 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,702459, PASSED ,3.97062e-05,1332.77,2413.24,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2413.24,1332.77 +Apps_CONVECTION3DPA,Base_Seq,default,87804, PASSED ,0.000769192,8.59976,15.571,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,16.7287,9.23949 +Apps_CONVECTION3DPA,Base_CUDA,block_64,87804, PASSED ,7.32564e-06,902.974,1634.96,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1634.96,902.974 
+Apps_CONVECTION3DPA,RAJA_CUDA,block_64,87804, PASSED ,7.81286e-06,846.664,1533.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1533.0,846.664 +Apps_CONVECTION3DPA,Base_Seq,default,1028970, PASSED ,0.0111434,6.95626,12.5957,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,13.8677,7.65874 +Apps_CONVECTION3DPA,Base_CUDA,block_64,1028970, PASSED ,5.42286e-05,1429.44,2588.29,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2536.55,1400.865 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,1028970, PASSED ,5.58236e-05,1388.59,2514.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2463.785,1360.6799999999998 +Apps_CONVECTION3DPA,Base_Seq,default,10989, PASSED ,8.42174e-05,9.833,17.799,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,17.3277,9.58193 +Apps_CONVECTION3DPA,Base_CUDA,block_64,10989, PASSED ,4.23404e-06,195.584,354.031,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64,354.031,195.584 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,10989, PASSED ,4.22994e-06,195.773,354.374,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,354.374,195.773 +Apps_CONVECTION3DPA,Base_Seq,default,175608, PASSED ,0.00140646,9.40624,17.0316,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,16.2136,8.95436 
+Apps_CONVECTION3DPA,Base_CUDA,block_64,175608, PASSED ,1.16063e-05,1139.85,2063.9,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2063.9,1139.85 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,175608, PASSED ,1.17986e-05,1121.27,2030.26,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2030.26,1121.27 +Apps_CONVECTION3DPA,Base_Seq,default,2057940, PASSED ,0.0230145,6.7363,12.1975,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,12.5957,6.95626 +Apps_CONVECTION3DPA,Base_CUDA,block_64,2057940, PASSED ,0.000102527,1512.12,2738.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2588.29,1429.44 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,2057940, PASSED ,0.000105465,1470.0,2661.73,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2514.33,1388.59 +Apps_CONVECTION3DPA,Base_Seq,default,21951, PASSED ,0.000170701,9.68897,17.5411,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,17.3277,9.58193 +Apps_CONVECTION3DPA,Base_CUDA,block_64,21951, PASSED ,4.68898e-06,352.724,638.578,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64,638.578,352.724 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,21951, PASSED ,4.68604e-06,352.946,638.979,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,638.979,352.946 
+Apps_CONVECTION3DPA,Base_Seq,default,2754, PASSED ,2.16801e-05,9.58193,17.3277,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,17.4344,9.635449999999999 +Apps_CONVECTION3DPA,Base_CUDA,block_64,2754, PASSED ,4.07304e-06,51.003,92.2323,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64,223.13165,123.2935 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,2754, PASSED ,4.12906e-06,50.311,90.981,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,222.6775,123.042 +Apps_CONVECTION3DPA,Base_Seq,default,351216, PASSED ,0.00295484,8.95436,16.2136,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,15.571,8.59976 +Apps_CONVECTION3DPA,Base_CUDA,block_64,351216, PASSED ,2.03592e-05,1299.59,2353.16,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64,2353.16,1299.59 +Apps_CONVECTION3DPA,RAJA_CUDA,block_64,351216, PASSED ,2.04458e-05,1294.09,2343.2,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,2343.2,1294.09 +Apps_CONVECTION3DPA,Base_Seq,default,43902, PASSED ,0.000357982,9.23949,16.7287,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,17.0316,9.40624 +Apps_CONVECTION3DPA,Base_CUDA,block_64,43902, PASSED ,5.69318e-06,580.97,1051.88,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1051.88,580.97 
+Apps_CONVECTION3DPA,RAJA_CUDA,block_64,43902, PASSED ,5.61292e-06,589.277,1066.92,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/CONVECTION3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1066.92,589.277 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,841, PASSED ,4.37064e-06,9.00417,10.3907,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,10.4793,8.87021 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,841, PASSED ,2.78384e-06,14.1366,16.3134,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,74.0756,62.6523 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,841, PASSED ,2.79968e-06,14.0566,16.2211,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,74.024,62.6087 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1060900, PASSED ,0.00639,7.43151,8.96536,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,8.96536,7.43151 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,1060900, PASSED ,2.16115e-05,2197.32,2650.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,2790.09,2312.22 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,1060900, PASSED ,2.16106e-05,2197.41,2650.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,2792.87,2314.53 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,131044, PASSED ,0.000658839,8.92438,10.7407,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.1873,8.46653 
+Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,131044, PASSED ,4.05538e-06,1449.86,1744.94,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1744.94,1449.86 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,131044, PASSED ,4.03137e-06,1458.49,1755.33,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1755.33,1458.49 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1555009, PASSED ,0.00972127,7.15839,8.63781,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,8.801585,7.29495 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,1555009, PASSED ,3.0096e-05,2312.22,2790.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,2875.73,2382.81 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,1555009, PASSED ,3.0066e-05,2314.53,2792.87,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,2878.88,2385.42 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,15876, PASSED ,8.18091e-05,8.7674,10.4793,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.4793,8.77331 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,15876, PASSED ,2.84052e-06,252.507,301.812,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,301.812,252.507 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,15876, PASSED ,2.81695e-06,254.62,304.338,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,304.338,254.62 
+Apps_DEL_DOT_VEC_2D,Base_Seq,default,264196, PASSED ,0.00140043,8.45538,10.1873,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.1739,8.45538 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,264196, PASSED ,5.183e-06,2284.61,2752.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,2650.84,2197.32 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,264196, PASSED ,5.18249e-06,2284.84,2752.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,2650.95,2197.41 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3115225, PASSED ,0.0195063,7.14469,8.62398,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,8.63781,7.15839 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,3115225, PASSED ,5.68055e-05,2453.4,2961.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,2790.09,2312.22 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,3115225, PASSED ,5.67381e-05,2456.31,2964.89,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,2792.87,2314.53 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,32400, PASSED ,0.000166317,8.77331,10.5197,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.4875,8.77331 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,32400, PASSED ,2.99451e-06,487.276,584.269,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,584.269,487.276 
+Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,32400, PASSED ,3.01031e-06,484.718,581.203,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,581.203,484.718 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3844, PASSED ,1.97927e-05,8.87021,10.4875,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.4834,8.821760000000001 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,3844, PASSED ,2.80222e-06,62.6523,74.0756,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,187.9438,157.57965000000002 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,3844, PASSED ,2.80417e-06,62.6087,74.024,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,189.181,158.61435 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,528529, PASSED ,0.00290632,8.14447,9.82016,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,9.82016,8.14447 +Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,528529, PASSED ,8.60536e-06,2750.66,3316.6,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,2752.57,2284.61 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,528529, PASSED ,8.56361e-06,2764.07,3332.77,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,2752.84,2284.84 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,65025, PASSED ,0.000345132,8.46653,10.1739,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.4793,8.7674 
+Apps_DEL_DOT_VEC_2D,Base_CUDA,block_256,65025, PASSED ,3.35478e-06,871.018,1046.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,1046.67,871.018 +Apps_DEL_DOT_VEC_2D,RAJA_CUDA,block_256,65025, PASSED ,3.31757e-06,880.787,1058.41,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,1058.41,880.787 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,1860867, PASSED ,0.000726923,14.1839,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,14.1839 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,1860867, PASSED ,0.000140216,73.5342,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,78.1177 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,1860867, PASSED ,0.000136501,75.5354,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,75.5354 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,1860867, PASSED ,0.000141866,72.6788,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,72.6788 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,1860867, PASSED ,0.000142139,72.5391,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,72.5391 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,205379, PASSED 
,9.36717e-05,25.7731,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,25.7731 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,205379, PASSED ,4.68721e-05,51.5063,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,51.5063 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,205379, PASSED ,5.99539e-05,40.2678,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,40.2678 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,205379, PASSED ,5.51753e-05,43.7553,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,43.7553 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,205379, PASSED ,5.54841e-05,43.5118,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,43.5118 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,2744000, PASSED ,0.000990967,13.453,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,13.453 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,2744000, PASSED ,0.000150907,88.3422,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,83.5172 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,2744000, PASSED ,0.000153234,87.001,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,83.7469 
+Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,2744000, PASSED ,0.000161472,82.5619,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,79.0234 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,2744000, PASSED ,0.000162264,82.1592,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,78.0234 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,421875, PASSED ,0.000198529,19.5101,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,19.5101 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,421875, PASSED ,6.39387e-05,60.5788,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,60.5788 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,421875, PASSED ,6.57775e-05,58.8854,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,58.8854 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,421875, PASSED ,6.9453e-05,55.7691,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,55.7691 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,421875, PASSED ,6.9771e-05,55.5149,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,55.5149 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,5639752, PASSED 
,0.00187025,11.488,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,11.488 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,5639752, PASSED ,0.000256314,83.8245,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,83.8245 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,5639752, PASSED ,0.000255459,84.1051,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,84.1051 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,5639752, PASSED ,0.000271886,79.0234,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,79.2586 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,5639752, PASSED ,0.000275371,78.0234,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,78.8235 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,42875, PASSED ,2.31649e-05,37.5249,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,35.4562 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,42875, PASSED ,3.11922e-05,27.8679,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,38.7235 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,42875, PASSED ,3.5664e-05,24.3736,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,35.0238 
+Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,42875, PASSED ,3.86611e-05,22.4841,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,32.7541 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,42875, PASSED ,3.84447e-05,22.6106,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,32.4712 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,7645373, PASSED ,0.00230591,11.4005,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,11.4005 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,7645373, PASSED ,0.000314768,83.5172,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,83.9146 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,7645373, PASSED ,0.000313905,83.7469,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,84.1051 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,7645373, PASSED ,0.000331681,79.2586,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,79.2586 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,7645373, PASSED ,0.000333512,78.8235,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,78.8235 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,9528128, PASSED 
,0.00281299,10.815,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,11.10775 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,9528128, PASSED ,0.000326749,93.1066,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,83.86955 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,9528128, PASSED ,0.000325766,93.3876,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,83.92599999999999 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,9528128, PASSED ,0.000349113,87.1422,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,79.14099999999999 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,9528128, PASSED ,0.000347064,87.6568,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,78.64425 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,884736, PASSED ,0.000414132,15.2354,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,15.2354 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,884736, PASSED ,8.07685e-05,78.1177,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,73.5342 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,884736, PASSED ,8.45459e-05,74.6275,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,74.6275 
+Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,884736, PASSED ,9.06005e-05,69.6403,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,69.6403 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,884736, PASSED ,8.921e-05,70.7258,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,70.7258 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,11543176, PASSED ,0.00396559,8.71324,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,10.815 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,11543176, PASSED ,0.000411765,83.9146,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,83.9146 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,11543176, PASSED ,0.000413852,83.4915,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,83.7469 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,11543176, PASSED ,0.000437648,78.9519,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,79.2586 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,11543176, PASSED ,0.000440363,78.465,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,78.8235 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,91125, PASSED 
,4.00244e-05,35.4562,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,30.61465 +Comm_HALO_PACKING_FUSED,Base_CUDA,direct_1024,91125, PASSED ,3.66473e-05,38.7235,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-direct_1024,0.0,45.114900000000006 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,direct_1024,91125, PASSED ,4.05186e-05,35.0238,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-direct_1024,0.0,37.6458 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,funcptr_1024,91125, PASSED ,4.33263e-05,32.7541,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-funcptr_1024,0.0,38.2547 +Comm_HALO_PACKING_FUSED,RAJA_CUDA,virtfunc_1024,91125, PASSED ,4.37038e-05,32.4712,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-virtfunc_1024,0.0,37.9915 +Basic_INDEXLIST_3LOOP,Base_Seq,default,2560000, PASSED ,0.0142187,7.04253,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.0,7.04253 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,2560000, PASSED ,4.70973e-05,2126.15,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,2115.68 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,2560000, PASSED ,4.73377e-05,2115.35,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,2113.59 +Basic_INDEXLIST_3LOOP,Base_Seq,default,320000, 
PASSED ,0.00157409,7.95189,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.0,7.95189 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,320000, PASSED ,1.96111e-05,638.26,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,638.26 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,320000, PASSED ,1.99029e-05,628.902,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,628.902 +Basic_INDEXLIST_3LOOP,Base_Seq,default,3750000, PASSED ,0.0221413,6.62487,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.0,6.62487 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,3750000, PASSED ,6.70109e-05,2188.95,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,2126.15 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,3750000, PASSED ,6.69042e-05,2192.44,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,2115.35 +Basic_INDEXLIST_3LOOP,Base_Seq,default,640000, PASSED ,0.00313502,7.98527,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.0,7.95189 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,640000, PASSED ,2.24732e-05,1113.95,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,1113.95 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,640000, PASSED 
,2.25615e-05,1109.59,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,1109.59 +Basic_INDEXLIST_3LOOP,Base_Seq,default,7500000, PASSED ,0.0450929,6.50583,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,6.59158 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,7500000, PASSED ,0.000138663,2115.68,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,2188.95 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,7500000, PASSED ,0.0001388,2113.59,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,2192.44 +Basic_INDEXLIST_3LOOP,Base_Seq,default,80000, PASSED ,0.000503552,6.21439,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.0,7.95189 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,80000, PASSED ,1.68926e-05,185.245,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,345.609 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,80000, PASSED ,1.719e-05,182.04,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,346.669 +Basic_INDEXLIST_3LOOP,Base_Seq,default,10000000, PASSED ,0.0600533,6.51347,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,6.56119 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,10000000, PASSED 
,0.000178458,2191.86,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,2191.86 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,10000000, PASSED ,0.000178382,2192.79,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,2192.79 +Basic_INDEXLIST_3LOOP,Base_Seq,default,12500000, PASSED ,0.0741771,6.59158,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,6.53733 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,12500000, PASSED ,0.000218329,2239.48,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,2215.67 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,12500000, PASSED ,0.000218386,2238.9,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,2215.8450000000003 +Basic_INDEXLIST_3LOOP,Base_Seq,default,1280000, PASSED ,0.00646864,7.7401,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.0,7.7401 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,1280000, PASSED ,2.78398e-05,1798.43,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,1798.43 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,1280000, PASSED ,2.79157e-05,1793.54,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,1793.54 +Basic_INDEXLIST_3LOOP,Base_Seq,default,15000000, PASSED 
,0.0894248,6.56119,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,6.56119 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,15000000, PASSED ,0.000258931,2265.99,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,2239.48 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,15000000, PASSED ,0.000259391,2261.96,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,2238.9 +Basic_INDEXLIST_3LOOP,Base_Seq,default,160000, PASSED ,0.000775334,8.07202,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.0,7.968579999999999 +Basic_INDEXLIST_3LOOP,Base_CUDA,block_256,160000, PASSED ,1.81087e-05,345.609,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,0.0,491.93449999999996 +Basic_INDEXLIST_3LOOP,RAJA_CUDA,block_256,160000, PASSED ,1.80533e-05,346.669,0.0,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,0.0,487.7855 +Apps_INTSC_HEXHEX,Base_Seq,default,27, PASSED ,0.00113801,0.0989909,4.59175,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.62777,0.0997673 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,27, PASSED ,3.0517e-05,3.69148,171.232,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_64,293.57,6.3289 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,27, PASSED 
,3.0991e-05,3.63502,168.613,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,326.893,7.04729 +Apps_INTSC_HEXHEX,Base_Seq,default,13824, PASSED ,0.573433,0.100584,4.66566,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.66843,0.100644 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,13824, PASSED ,0.00229436,25.1391,1166.1,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1166.1,25.1391 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,13824, PASSED ,0.00229631,25.1178,1165.1,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1165.1,25.1178 +Apps_INTSC_HEXHEX,Base_Seq,default,1728, PASSED ,0.0716637,0.100606,4.66666,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.66836,0.100642 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,1728, PASSED ,0.000316845,22.7549,1055.5,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1055.5,22.7549 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,1728, PASSED ,0.000317009,22.7431,1054.95,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1054.95,22.7431 +Apps_INTSC_HEXHEX,Base_Seq,default,19683, PASSED ,0.817182,0.100496,4.66159,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,4.667045,0.10061400000000001 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,19683, PASSED 
,0.00325913,25.1981,1168.83,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1167.465,25.168599999999998 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,19683, PASSED ,0.00325845,25.2033,1169.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1167.085,25.16055 +Apps_INTSC_HEXHEX,Base_Seq,default,216, PASSED ,0.00898769,0.100273,4.65123,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.65123,0.100273 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,216, PASSED ,6.743e-05,13.3653,619.958,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_64,619.958,13.3653 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,216, PASSED ,6.6808e-05,13.4897,625.73,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,625.73,13.4897 +Apps_INTSC_HEXHEX,Base_Seq,default,3375, PASSED ,0.139883,0.100667,4.66949,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.66666,0.100606 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,3375, PASSED ,0.000586234,24.0204,1114.2,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1114.2,24.0204 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,3375, PASSED ,0.000588246,23.9383,1110.39,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1110.39,23.9383 +Apps_INTSC_HEXHEX,Base_Seq,default,39304, PASSED 
,1.62818,0.100719,4.67192,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,4.66566,0.100584 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,39304, PASSED ,0.00648117,25.3024,1173.67,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1168.83,25.1981 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,39304, PASSED ,0.00647179,25.3391,1175.37,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1169.07,25.2033 +Apps_INTSC_HEXHEX,Base_Seq,default,512, PASSED ,0.021226,0.100642,4.66836,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.66559,0.100583 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,512, PASSED ,0.000116043,18.409,853.911,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_64,853.911,18.409 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,512, PASSED ,0.000117722,18.1464,841.732,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,841.732,18.1464 +Apps_INTSC_HEXHEX,Base_Seq,default,64, PASSED ,0.00267651,0.0997673,4.62777,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.6395,0.10002015 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,64, PASSED ,4.2192e-05,6.3289,293.57,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_64,456.764,9.8471 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,64, PASSED 
,3.7891e-05,7.04729,326.893,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,476.3115,10.268495 +Apps_INTSC_HEXHEX,Base_Seq,default,6859, PASSED ,0.284349,0.100644,4.66843,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.66666,0.100606 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,6859, PASSED ,0.0011558,24.7604,1148.53,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_64,1148.53,24.7604 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,6859, PASSED ,0.00115578,24.7607,1148.54,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,1148.54,24.7607 +Apps_INTSC_HEXHEX,Base_Seq,default,1000, PASSED ,0.0414815,0.100583,4.66559,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.66666,0.100606 +Apps_INTSC_HEXHEX,Base_CUDA,block_64,1000, PASSED ,0.000194956,21.4014,992.716,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_64,992.716,21.4014 +Apps_INTSC_HEXHEX,RAJA_CUDA,block_64,1000, PASSED ,0.000198316,21.0388,975.897,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/INTSC_HEXHEX_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_64,975.897,21.0388 +Apps_LTIMES,Base_Seq,default,1344, PASSED ,1.3159e-05,7.18731,5.10678,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,5.1042,7.10468 +Apps_LTIMES,Base_CUDA,block_256,1344, PASSED 
,3.35502e-06,28.1899,20.0297,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,73.568,102.646 +Apps_LTIMES,RAJA_CUDA,kernel_256,1344, PASSED ,3.42376e-06,27.6239,19.6275,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,70.2153,97.9681 +Apps_LTIMES,RAJA_CUDA,launch_256,1344, PASSED ,3.43504e-06,27.5332,19.5631,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,72.8381,101.627 +Apps_LTIMES,Base_Seq,default,1238784, PASSED ,0.0121454,7.0928,5.09983,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.9375,6.86713 +Apps_LTIMES,Base_CUDA,block_256,1238784, PASSED ,9.03716e-05,953.226,685.383,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,695.03,966.655 +Apps_LTIMES,RAJA_CUDA,kernel_256,1238784, PASSED ,9.27542e-05,928.741,667.778,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,678.176,943.198 +Apps_LTIMES,RAJA_CUDA,launch_256,1238784, PASSED ,9.18566e-05,937.816,674.303,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,685.086,952.809 +Apps_LTIMES,Base_Seq,default,154944, PASSED ,0.00153302,7.02907,5.05354,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,5.05354,7.02907 +Apps_LTIMES,Base_CUDA,block_256,154944, PASSED 
,1.39367e-05,773.189,555.883,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,555.883,773.189 +Apps_LTIMES,RAJA_CUDA,kernel_256,154944, PASSED ,1.41069e-05,763.865,549.18,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,549.18,763.865 +Apps_LTIMES,RAJA_CUDA,launch_256,154944, PASSED ,1.3749e-05,783.746,563.474,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,563.474,783.746 +Apps_LTIMES,Base_Seq,default,1814592, PASSED ,0.0199534,6.32401,4.54707,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,4.742285,6.59557 +Apps_LTIMES,Base_CUDA,block_256,1814592, PASSED ,0.000130216,969.049,696.763,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,695.8965000000001,967.852 +Apps_LTIMES,RAJA_CUDA,kernel_256,1814592, PASSED ,0.000133785,943.198,678.176,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,684.3265,951.76 +Apps_LTIMES,RAJA_CUDA,launch_256,1814592, PASSED ,0.000132435,952.809,685.086,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,691.9155000000001,962.3054999999999 +Apps_LTIMES,Base_Seq,default,19392, PASSED ,0.000189961,7.10468,5.1042,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,5.1042,7.10468 +Apps_LTIMES,Base_CUDA,block_256,19392, PASSED 
,4.30516e-06,313.487,225.218,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,225.218,313.487 +Apps_LTIMES,RAJA_CUDA,kernel_256,19392, PASSED ,4.53638e-06,297.509,213.739,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,213.739,297.509 +Apps_LTIMES,RAJA_CUDA,launch_256,19392, PASSED ,4.44682e-06,303.501,218.043,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,218.043,303.501 +Apps_LTIMES,Base_Seq,default,309696, PASSED ,0.00308182,6.9884,5.02456,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,5.05354,7.02907 +Apps_LTIMES,Base_CUDA,block_256,309696, PASSED ,2.40824e-05,894.303,642.991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,642.991,894.303 +Apps_LTIMES,RAJA_CUDA,kernel_256,309696, PASSED ,2.43289e-05,885.243,636.478,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,636.478,885.243 +Apps_LTIMES,RAJA_CUDA,launch_256,309696, PASSED ,2.35515e-05,914.464,657.487,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,657.487,914.464 +Apps_LTIMES,Base_Seq,default,3629184, PASSED ,0.0404164,6.24426,4.48975,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,4.54707,6.32401 +Apps_LTIMES,Base_CUDA,block_256,3629184, PASSED 
,0.00025547,987.865,710.295,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,696.763,969.049 +Apps_LTIMES,RAJA_CUDA,kernel_256,3629184, PASSED ,0.000262508,961.381,691.252,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,678.176,943.198 +Apps_LTIMES,RAJA_CUDA,launch_256,3629184, PASSED ,0.000259693,971.802,698.745,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,685.086,952.809 +Apps_LTIMES,Base_Seq,default,38784, PASSED ,0.000379928,7.10163,5.10412,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,5.10412,7.10163 +Apps_LTIMES,Base_CUDA,block_256,38784, PASSED ,6.0753e-06,444.111,319.194,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,319.194,444.111 +Apps_LTIMES,RAJA_CUDA,kernel_256,38784, PASSED ,6.32362e-06,426.672,306.66,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,306.66,426.672 +Apps_LTIMES,RAJA_CUDA,launch_256,38784, PASSED ,6.05992e-06,445.238,320.004,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,320.004,445.238 +Apps_LTIMES,Base_Seq,default,4992, PASSED ,4.904e-05,7.10145,5.08973,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,5.10416,7.103155 +Apps_LTIMES,Base_CUDA,block_256,4992, PASSED 
,3.39278e-06,102.646,73.568,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,149.393,208.06650000000002 +Apps_LTIMES,RAJA_CUDA,kernel_256,4992, PASSED ,3.55478e-06,97.9681,70.2153,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,141.97715,197.73855 +Apps_LTIMES,RAJA_CUDA,launch_256,4992, PASSED ,3.42678e-06,101.627,72.8381,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,145.44055,202.564 +Apps_LTIMES,Base_Seq,default,619392, PASSED ,0.00627232,6.86713,4.9375,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,5.02456,6.9884 +Apps_LTIMES,Base_CUDA,block_256,619392, PASSED ,4.45587e-05,966.655,695.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,685.383,953.226 +Apps_LTIMES,RAJA_CUDA,kernel_256,619392, PASSED ,4.48525e-05,960.322,690.477,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,667.778,928.741 +Apps_LTIMES,RAJA_CUDA,launch_256,619392, PASSED ,4.32649e-05,995.561,715.813,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,674.303,937.816 +Apps_LTIMES,Base_Seq,default,77568, PASSED ,0.000758563,7.11226,5.11283,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,5.10412,7.10163 +Apps_LTIMES,Base_CUDA,block_256,77568, PASSED 
,8.50688e-06,634.204,455.913,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,455.913,634.204 +Apps_LTIMES,RAJA_CUDA,kernel_256,77568, PASSED ,8.69284e-06,620.637,446.16,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-kernel_256,446.16,620.637 +Apps_LTIMES,RAJA_CUDA,launch_256,77568, PASSED ,8.73622e-06,617.555,443.945,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/LTIMES_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-launch_256,443.945,617.555 +Apps_MASS3DPA,Base_Seq,default,1600, PASSED ,9.01786e-06,6.5807,14.0527,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,14.9006,6.95157 +Apps_MASS3DPA,Base_CUDA,block_25,1600, PASSED ,3.8825e-06,15.285,32.6401,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_25,131.824,61.5 +Apps_MASS3DPA,RAJA_CUDA,block_25,1600, PASSED ,3.87526e-06,15.3135,32.701,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,130.729,60.989 +Apps_MASS3DPA,Base_Seq,default,1619008, PASSED ,0.0092196,6.4805,13.9085,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,13.9085,6.4805 +Apps_MASS3DPA,Base_CUDA,block_25,1619008, PASSED ,4.01159e-05,1489.37,3196.5,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_25,3196.5,1489.37 +Apps_MASS3DPA,RAJA_CUDA,block_25,1619008, PASSED 
,4.03963e-05,1479.04,3174.31,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,3174.31,1479.04 +Apps_MASS3DPA,Base_Seq,default,202368, PASSED ,0.00108462,6.88576,14.7777,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,14.7395,6.86773 +Apps_MASS3DPA,Base_CUDA,block_25,202368, PASSED ,7.22326e-06,1033.94,2218.97,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_25,2218.97,1033.94 +Apps_MASS3DPA,RAJA_CUDA,block_25,202368, PASSED ,7.23264e-06,1032.6,2216.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,2216.09,1032.6 +Apps_MASS3DPA,Base_Seq,default,2371584, PASSED ,0.0150102,5.83072,12.5139,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,13.2112,6.15561 +Apps_MASS3DPA,Base_CUDA,block_25,2371584, PASSED ,5.66451e-05,1545.07,3316.03,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_25,3256.2650000000003,1517.2199999999998 +Apps_MASS3DPA,RAJA_CUDA,block_25,2371584, PASSED ,5.69624e-05,1536.46,3297.56,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,3235.935,1507.75 +Apps_MASS3DPA,Base_Seq,default,25344, PASSED ,0.000133332,7.01696,15.0551,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,14.9006,6.95157 +Apps_MASS3DPA,Base_CUDA,block_25,25344, PASSED 
,3.95496e-06,236.56,507.546,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_25,507.546,236.56 +Apps_MASS3DPA,RAJA_CUDA,block_25,25344, PASSED ,3.95342e-06,236.652,507.744,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,507.744,236.652 +Apps_MASS3DPA,Base_Seq,default,404736, PASSED ,0.00220323,6.77938,14.5497,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,14.6598,6.83109 +Apps_MASS3DPA,Base_CUDA,block_25,404736, PASSED ,1.17549e-05,1270.66,2727.06,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_25,2727.06,1270.66 +Apps_MASS3DPA,RAJA_CUDA,block_25,404736, PASSED ,1.18154e-05,1264.16,2713.09,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,2713.09,1264.16 +Apps_MASS3DPA,Base_Seq,default,4743104, PASSED ,0.0306498,5.71091,12.2568,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,12.5139,5.83072 +Apps_MASS3DPA,Base_CUDA,block_25,4743104, PASSED ,0.000108962,1606.41,3447.69,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_25,3316.03,1545.07 +Apps_MASS3DPA,RAJA_CUDA,block_25,4743104, PASSED ,0.000109434,1599.49,3432.84,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,3297.56,1536.46 +Apps_MASS3DPA,Base_Seq,default,50624, PASSED 
,0.000266148,7.02056,15.0652,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,14.9006,6.95157 +Apps_MASS3DPA,Base_CUDA,block_25,50624, PASSED ,4.42372e-06,422.384,906.382,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_25,906.382,422.384 +Apps_MASS3DPA,RAJA_CUDA,block_25,50624, PASSED ,4.4197e-06,422.768,907.206,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,907.206,422.768 +Apps_MASS3DPA,Base_Seq,default,6336, PASSED ,3.36787e-05,6.95157,14.9006,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,14.97785,6.984265000000001 +Apps_MASS3DPA,Base_CUDA,block_25,6336, PASSED ,3.80682e-06,61.5,131.824,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_25,319.685,149.03 +Apps_MASS3DPA,RAJA_CUDA,block_25,6336, PASSED ,3.83872e-06,60.989,130.729,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,319.23650000000004,148.82049999999998 +Apps_MASS3DPA,Base_Seq,default,809536, PASSED ,0.00435007,6.86773,14.7395,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,14.5497,6.77938 +Apps_MASS3DPA,Base_CUDA,block_25,809536, PASSED ,2.08553e-05,1432.49,3074.41,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_25,3074.41,1432.49 +Apps_MASS3DPA,RAJA_CUDA,block_25,809536, PASSED 
,2.0953e-05,1425.82,3060.07,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,3060.07,1425.82 +Apps_MASS3DPA,Base_Seq,default,101184, PASSED ,0.000546671,6.83109,14.6598,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,14.7777,6.88576 +Apps_MASS3DPA,Base_CUDA,block_25,101184, PASSED ,5.59842e-06,667.038,1431.49,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_25,1431.49,667.038 +Apps_MASS3DPA,RAJA_CUDA,block_25,101184, PASSED ,5.59088e-06,667.937,1433.42,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MASS3DPA_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_25,1433.42,667.937 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,64, PASSED ,6.7609e-07,17.6762,5.01708,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,5.27123,15.6634 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,64, PASSED ,3.27675e-06,3.64713,1.03517,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,CUDA,Base_CUDA-block_256,7.57386,22.4171 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,64, PASSED ,2.72157e-06,4.39112,1.24634,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,8.03078,23.7695 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,328509, PASSED ,0.0034469,12.4101,5.05119,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,5.05119,12.3707 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,328509, PASSED 
,2.0792e-05,2057.35,837.387,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-block_256,837.387,2057.35 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,328509, PASSED ,2.02879e-05,2108.48,858.197,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,904.162,2213.75 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,35937, PASSED ,0.00039324,12.2524,4.84351,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.84513,12.4379 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,35937, PASSED ,4.41338e-06,1091.71,431.565,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-block_256,431.565,1091.71 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,35937, PASSED ,4.38632e-06,1098.45,434.228,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,434.228,1098.45 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,493039, PASSED ,0.00517185,12.3707,5.05256,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,5.051875,12.3904 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,493039, PASSED ,3.34798e-05,1910.98,780.501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-block_256,853.0274999999999,2086.765 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,493039, PASSED ,2.89009e-05,2213.75,904.162,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,921.8125,2269.665 
+Apps_MATVEC_3D_STENCIL,Base_Seq,default,3375, PASSED ,3.39342e-05,14.2103,5.27123,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,5.22034,14.2103 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,3375, PASSED ,3.62645e-06,132.972,49.3251,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,CUDA,Base_CUDA-block_256,49.3251,132.972 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,3375, PASSED ,3.40138e-06,141.771,52.5889,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,52.5889,141.771 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,79507, PASSED ,0.000872998,12.054,4.82689,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.84513,12.4101 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,79507, PASSED ,5.444e-06,1932.98,774.039,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-block_256,774.039,1932.98 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,79507, PASSED ,5.60469e-06,1877.56,751.847,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,751.847,1877.56 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1000000, PASSED ,0.010583,12.2002,5.00806,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,5.05119,12.3707 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,1000000, PASSED 
,6.10129e-05,2116.18,868.668,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-block_256,837.387,2057.35 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,1000000, PASSED ,5.34032e-05,2417.72,992.449,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,904.162,2213.75 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,8000, PASSED ,8.12208e-05,13.6766,5.22034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,5.22034,13.6766 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,8000, PASSED ,3.63063e-06,305.958,116.784,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-block_256,116.784,305.958 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,8000, PASSED ,3.42591e-06,324.241,123.763,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,123.763,324.241 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,512, PASSED ,5.1277e-06,15.6634,5.29204,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,5.245785,14.93685 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,512, PASSED ,3.58285e-06,22.4171,7.57386,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,CUDA,Base_CUDA-block_256,28.44948,77.69455 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,512, PASSED ,3.379e-06,23.7695,8.03078,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,30.30984,82.77024999999999 
+Apps_MATVEC_3D_STENCIL,Base_Seq,default,157464, PASSED ,0.00164964,12.5233,5.05904,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,5.05119,12.3707 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,157464, PASSED ,7.88336e-06,2620.58,1058.63,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-block_256,780.501,1932.98 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,157464, PASSED ,8.88336e-06,2325.58,939.463,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,858.197,2108.48 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,17576, PASSED ,0.000192261,12.4379,4.84513,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.84513,12.4379 +Apps_MATVEC_3D_STENCIL,Base_CUDA,block_256,17576, PASSED ,3.6985e-06,646.562,251.866,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-block_256,251.866,646.562 +Apps_MATVEC_3D_STENCIL,RAJA_CUDA,block_256,17576, PASSED ,3.47343e-06,688.457,268.187,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-block_256,268.187,688.457 +Basic_MULTI_REDUCE,Base_Seq,default,3199995, PASSED ,0.00746905,6.38419,0.428434,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.428434,6.38419 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,3199995, PASSED 
,0.00114407,41.679,2.79702,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,2.79702,41.679 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,3199995, PASSED ,0.00118556,40.2205,2.69914,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,2.69914,40.2205 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,3199995, PASSED ,0.00116734,40.8481,2.74126,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,2.74126,40.8481 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,3199995, PASSED ,0.001196,39.8695,2.67559,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,2.67559,39.8695 +Basic_MULTI_REDUCE,Base_Seq,default,399995, PASSED ,0.000857859,6.94815,0.466271,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.466002,6.94406 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,399995, PASSED ,0.00118626,5.02467,0.337191,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,0.337191,5.02467 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,399995, PASSED ,0.00118322,5.03756,0.338056,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,0.338056,5.03756 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,399995, PASSED 
,0.00122441,4.86807,0.326683,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,0.326683,4.86807 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,399995, PASSED ,0.00124422,4.79058,0.321482,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,0.321482,4.79058 +Basic_MULTI_REDUCE,Base_Seq,default,4687495, PASSED ,0.0115267,6.05978,0.406664,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.406664,6.05978 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,4687495, PASSED ,0.00114658,60.9197,4.08824,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,4.08824,60.9197 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,4687495, PASSED ,0.00118752,58.8195,3.9473,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,3.9473,58.8195 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,4687495, PASSED ,0.00116815,59.7946,4.01274,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,4.01274,59.7946 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,4687495, PASSED ,0.00119391,58.5048,3.92618,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,3.92618,58.5048 +Basic_MULTI_REDUCE,Base_Seq,default,799995, PASSED 
,0.00171672,6.94406,0.466002,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.465023,6.92973 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,799995, PASSED ,0.00118691,10.0437,0.674012,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,0.674012,10.0437 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,799995, PASSED ,0.0011843,10.0659,0.675501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,0.675501,10.0659 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,799995, PASSED ,0.00122105,9.76294,0.655172,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,0.655172,9.76294 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,799995, PASSED ,0.00124317,9.58923,0.643515,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,0.643515,9.58923 +Basic_MULTI_REDUCE,Base_Seq,default,9374995, PASSED ,0.0237314,5.88666,0.395046,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.399946,5.95966 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,9374995, PASSED ,0.00114296,122.225,8.20238,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,8.20238,122.225 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,9374995, PASSED 
,0.00118759,117.632,7.89413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,7.89413,117.632 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,9374995, PASSED ,0.00116831,119.573,8.02441,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,8.02441,119.573 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,9374995, PASSED ,0.00120206,116.216,7.7991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,7.7991,116.216 +Basic_MULTI_REDUCE,Base_Seq,default,99995, PASSED ,0.000213933,6.96569,0.467413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.466271,6.94815 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,99995, PASSED ,0.00118416,1.25844,0.0844437,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,0.168376,2.50913 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,99995, PASSED ,0.00117775,1.26529,0.0849038,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,0.168555,2.51178 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,99995, PASSED ,0.00121486,1.22664,0.08231,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,0.164063,2.44485 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,99995, PASSED 
,0.00124156,1.20025,0.0805395,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,0.161374,2.40478 +Basic_MULTI_REDUCE,Base_Seq,default,12499995, PASSED ,0.0312542,5.95966,0.399946,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.399946,5.95966 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,12499995, PASSED ,0.00113992,163.402,10.9657,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,10.9657,163.402 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,12499995, PASSED ,0.00118223,157.554,10.5733,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,10.5733,157.554 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,12499995, PASSED ,0.00114342,162.901,10.9321,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,10.9321,162.901 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,12499995, PASSED ,0.00120046,155.161,10.4127,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,10.4127,155.161 +Basic_MULTI_REDUCE,Base_Seq,default,15624995, PASSED ,0.0395453,5.8877,0.395117,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,0.39753150000000004,5.92368 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,15624995, PASSED 
,0.00111842,208.178,13.9706,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,12.46815,185.79 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,15624995, PASSED ,0.00118367,196.703,13.2005,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,11.8869,177.1285 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,15624995, PASSED ,0.0011381,204.578,13.729,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,12.330549999999999,183.73950000000002 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,15624995, PASSED ,0.00120259,193.607,12.9928,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,11.70275,174.38400000000001 +Basic_MULTI_REDUCE,Base_Seq,default,1599995, PASSED ,0.00352059,6.77215,0.454468,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.454468,6.77215 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,1599995, PASSED ,0.00118293,20.155,1.35257,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,1.35257,20.155 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,1599995, PASSED ,0.00118752,20.0771,1.34734,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,1.34734,20.0771 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,1599995, PASSED 
,0.0012189,19.5602,1.31265,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,1.31265,19.5602 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,1599995, PASSED ,0.00124597,19.1352,1.28413,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,1.28413,19.1352 +Basic_MULTI_REDUCE,Base_Seq,default,18749995, PASSED ,0.0467148,5.98091,0.401372,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,0.399946,5.95966 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,18749995, PASSED ,0.00111761,249.995,16.7769,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,13.9706,208.178 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,18749995, PASSED ,0.00119355,234.088,15.7094,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,13.2005,196.703 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,18749995, PASSED ,0.00112135,249.162,16.721,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,13.729,204.578 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,18749995, PASSED ,0.00119838,233.146,15.6462,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,12.9928,193.607 +Basic_MULTI_REDUCE,Base_Seq,default,199995, PASSED 
,0.000430075,6.92973,0.465023,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.4661365,6.946105 +Basic_MULTI_REDUCE,Base_CUDA,atomic_direct_256,199995, PASSED ,0.00118779,2.50913,0.168376,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-atomic_direct_256,0.2527835,3.7669 +Basic_MULTI_REDUCE,Base_CUDA,atomic_occgs_256,199995, PASSED ,0.00118653,2.51178,0.168555,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-atomic_occgs_256,0.2533055,3.77467 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_direct_256,199995, PASSED ,0.00121902,2.44485,0.164063,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_direct_256,0.245373,3.65646 +Basic_MULTI_REDUCE,RAJA_CUDA,atomic_occgs_256,199995, PASSED ,0.00123932,2.40478,0.161374,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/MULTI_REDUCE_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-atomic_occgs_256,0.24142799999999998,3.5976800000000004 +Basic_REDUCE_STRUCT,Base_Seq,default,3200000, PASSED ,0.00443437,10.7532,1.44327,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,1.44327,10.7532 +Basic_REDUCE_STRUCT,Base_Seq,kahan,3200000, PASSED ,0.0078743,6.05561,0.81277,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-kahan,0.81277,6.05561 +Basic_REDUCE_STRUCT,Base_Seq,cascade,3200000, PASSED ,0.00814346,5.85546,0.785907,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-cascade,0.789586,5.88288 
+Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,3200000, PASSED ,0.00114384,41.6873,5.59518,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,5.59518,41.6873 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,3200000, PASSED ,0.00118253,40.3235,5.41213,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,5.41213,40.3235 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,3200000, PASSED ,0.00113966,41.8405,5.61573,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,5.61573,41.8405 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,3200000, PASSED ,0.000234629,203.23,27.2771,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,26.8071,199.728 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,3200000, PASSED ,0.000193799,246.047,33.0238,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,33.0238,246.047 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,3200000, PASSED ,0.00119582,39.8752,5.35196,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,5.35196,39.8752 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,3200000, PASSED ,4.51046e-05,1057.18,141.892,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,141.892,1057.18 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,3200000, PASSED 
,4.79646e-05,994.144,133.432,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,133.432,994.144 +Basic_REDUCE_STRUCT,Base_Seq,default,400000, PASSED ,0.000428418,13.9127,1.86734,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,1.86087,13.8645 +Basic_REDUCE_STRUCT,Base_Seq,kahan,400000, PASSED ,0.000850656,7.0069,0.940453,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-kahan,0.940453,7.0069 +Basic_REDUCE_STRUCT,Base_Seq,cascade,400000, PASSED ,0.000890837,6.69086,0.898034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-cascade,0.900716,6.71082 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,400000, PASSED ,0.00117357,5.07893,0.681684,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,0.681684,5.07893 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,400000, PASSED ,0.00118248,5.04064,0.676545,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,0.676545,5.04064 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,400000, PASSED ,0.0011889,5.01342,0.672891,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,0.672891,5.01342 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,400000, PASSED ,4.09785e-05,145.453,19.5225,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,19.5225,145.453 
+Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,400000, PASSED ,4.64267e-05,128.384,17.2315,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,17.2315,128.384 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,400000, PASSED ,0.00124422,4.79053,0.642976,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,0.642976,4.79053 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,400000, PASSED ,2.92832e-05,203.545,27.3195,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,27.3195,203.545 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,400000, PASSED ,3.22944e-05,184.567,24.7722,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_128-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,24.7722,184.567 +Basic_REDUCE_STRUCT,Base_Seq,default,4687500, PASSED ,0.00724771,9.63741,1.29351,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,1.29351,9.63741 +Basic_REDUCE_STRUCT,Base_Seq,kahan,4687500, PASSED ,0.0121225,5.76193,0.773354,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-kahan,0.782941,5.83336 +Basic_REDUCE_STRUCT,Base_Seq,cascade,4687500, PASSED ,0.0118733,5.88288,0.789586,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-cascade,0.789586,5.88288 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,4687500, PASSED 
,0.00112014,62.3578,8.36953,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,8.36953,62.3578 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,4687500, PASSED ,0.00118696,58.8472,7.89834,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,7.89834,58.8472 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,4687500, PASSED ,0.00111714,62.5251,8.39197,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,8.39197,62.5251 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,4687500, PASSED ,0.000349721,199.728,26.8071,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,26.8071,199.728 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,4687500, PASSED ,0.000276069,253.014,33.959,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,33.959,253.014 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,4687500, PASSED ,0.00118595,58.897,7.90503,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,7.90503,58.897 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,4687500, PASSED ,5.23711e-05,1333.73,179.011,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,179.011,1333.73 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,4687500, PASSED 
,5.55167e-05,1258.16,168.868,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,168.868,1258.16 +Basic_REDUCE_STRUCT,Base_Seq,default,800000, PASSED ,0.000864342,13.7919,1.85112,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,1.85112,13.7919 +Basic_REDUCE_STRUCT,Base_Seq,kahan,800000, PASSED ,0.00170798,6.97953,0.936778,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-kahan,0.936778,6.97953 +Basic_REDUCE_STRUCT,Base_Seq,cascade,800000, PASSED ,0.00177406,6.71957,0.901887,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-cascade,0.898034,6.69086 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,800000, PASSED ,0.00116567,10.2266,1.3726,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,1.3726,10.2266 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,800000, PASSED ,0.00118385,10.0696,1.35152,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,1.35152,10.0696 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,800000, PASSED ,0.00117672,10.1306,1.35971,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,1.35971,10.1306 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,800000, PASSED ,6.57488e-05,181.31,24.3351,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,24.3351,181.31 
+Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,800000, PASSED ,6.5408e-05,182.255,24.4619,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,24.4619,182.255 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,800000, PASSED ,0.00123885,9.6226,1.29153,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,1.29153,9.6226 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,800000, PASSED ,2.97245e-05,401.047,53.8276,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,53.8276,401.047 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,800000, PASSED ,3.30817e-05,360.348,48.3652,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_256-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,48.3652,360.348 +Basic_REDUCE_STRUCT,Base_Seq,default,9375000, PASSED ,0.0152428,9.16486,1.23009,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,1.26501,9.42505 +Basic_REDUCE_STRUCT,Base_Seq,kahan,9375000, PASSED ,0.0241246,5.79071,0.777216,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-kahan,0.782941,5.83336 +Basic_REDUCE_STRUCT,Base_Seq,cascade,9375000, PASSED ,0.0246052,5.67759,0.762034,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-cascade,0.789586,5.88288 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,9375000, PASSED 
,0.00106026,131.759,17.6844,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,17.6844,131.759 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,9375000, PASSED ,0.00118735,117.655,15.7914,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,15.7914,117.655 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,9375000, PASSED ,0.00104376,133.842,17.964,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,17.964,133.842 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,9375000, PASSED ,0.000717588,194.678,26.1292,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,26.1292,194.678 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,9375000, PASSED ,0.000520792,268.242,36.0028,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,36.0028,268.242 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,9375000, PASSED ,0.00118794,117.597,15.7837,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,15.7837,117.597 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,9375000, PASSED ,7.64178e-05,1828.09,245.362,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,245.362,1828.09 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,9375000, PASSED 
,8.6814e-05,1609.17,215.979,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,215.979,1609.17 +Basic_REDUCE_STRUCT,Base_Seq,default,100000, PASSED ,0.000106123,14.0414,1.88462,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,1.86734,13.9127 +Basic_REDUCE_STRUCT,Base_Seq,kahan,100000, PASSED ,0.000211637,7.0409,0.945023,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-kahan,0.941549,7.01505 +Basic_REDUCE_STRUCT,Base_Seq,cascade,100000, PASSED ,0.000221277,6.73416,0.903853,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-cascade,0.900716,6.71082 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,100000, PASSED ,0.00118509,1.25739,0.168766,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,0.337219,2.51246 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,100000, PASSED ,0.00118173,1.26096,0.169245,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,0.339543,2.52978 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,100000, PASSED ,0.0012023,1.23939,0.166349,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,0.330747,2.46425 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,100000, PASSED ,2.51803e-05,59.1779,7.9428,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,13.8994,103.558 
+Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,100000, PASSED ,3.01591e-05,49.4085,6.63156,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,10.194,75.9507 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,100000, PASSED ,0.00123155,1.20995,0.162398,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,0.320871,2.39066 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,100000, PASSED ,2.52775e-05,58.9502,7.91224,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,13.789,102.736 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,100000, PASSED ,3.01523e-05,49.4196,6.63305,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_32-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,12.6816,94.4849 +Basic_REDUCE_STRUCT,Base_Seq,default,12500000, PASSED ,0.0197627,9.42505,1.26501,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,1.25784,9.37161 +Basic_REDUCE_STRUCT,Base_Seq,kahan,12500000, PASSED ,0.0319309,5.83336,0.782941,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-kahan,0.782941,5.83336 +Basic_REDUCE_STRUCT,Base_Seq,cascade,12500000, PASSED ,0.0282075,6.60337,0.886289,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-cascade,0.882995,6.57882 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,12500000, PASSED 
,0.00101283,183.904,24.6832,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,24.6832,183.904 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,12500000, PASSED ,0.00118728,156.884,21.0566,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,21.0566,156.884 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,12500000, PASSED ,0.00103767,179.502,24.0924,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,24.0924,179.502 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,12500000, PASSED ,0.000962459,193.53,25.9751,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,25.9751,193.53 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,12500000, PASSED ,0.000681294,273.398,36.6949,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,36.6949,273.398 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,12500000, PASSED ,0.00119493,155.879,20.9218,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,20.9218,155.879 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,12500000, PASSED ,9.16856e-05,2031.56,272.671,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,272.671,2031.56 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,12500000, PASSED 
,9.47808e-05,1965.21,263.766,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,263.766,1965.21 +Basic_REDUCE_STRUCT,Base_Seq,default,15625000, PASSED ,0.0251125,9.2715,1.2444,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,1.25112,9.321555 +Basic_REDUCE_STRUCT,Base_Seq,kahan,15625000, PASSED ,0.0392682,5.92925,0.79581,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,Seq,Base_Seq-kahan,0.7893755,5.881304999999999 +Basic_REDUCE_STRUCT,Base_Seq,cascade,15625000, PASSED ,0.0353909,6.57882,0.882995,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,Seq,Base_Seq-cascade,0.883928,6.585775 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,15625000, PASSED ,0.000722227,322.379,43.2689,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,33.89675,252.5505 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,15625000, PASSED ,0.000751357,309.88,41.5914,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,31.323999999999998,233.382 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,15625000, PASSED ,0.00116405,200.018,26.846,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,25.4692,189.76 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,15625000, PASSED 
,0.00121036,192.364,25.8187,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,25.896900000000002,192.947 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,15625000, PASSED ,0.000848496,274.404,36.8299,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,36.7624,273.901 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,15625000, PASSED ,0.00119685,194.536,26.1101,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,23.51595,175.20749999999998 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,15625000, PASSED ,0.000106635,2183.43,293.055,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,282.863,2107.495 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,15625000, PASSED ,0.000110169,2113.4,283.656,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_5000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,273.711,2039.305 +Basic_REDUCE_STRUCT,Base_Seq,default,1600000, PASSED ,0.0019332,12.3329,1.65529,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,1.65529,12.3329 +Basic_REDUCE_STRUCT,Base_Seq,kahan,1600000, PASSED ,0.00353484,6.74481,0.905274,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-kahan,0.905274,6.74481 +Basic_REDUCE_STRUCT,Base_Seq,cascade,1600000, PASSED 
,0.00361417,6.59678,0.885405,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-cascade,0.885405,6.59678 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,1600000, PASSED ,0.00114916,20.7473,2.78466,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,2.78466,20.7473 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,1600000, PASSED ,0.00118481,20.1229,2.70085,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,2.70085,20.1229 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,1600000, PASSED ,0.0011646,20.4721,2.74772,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,2.74772,20.4721 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,1600000, PASSED ,0.00011438,208.444,27.9768,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,26.8071,199.728 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,1600000, PASSED ,0.000105049,226.96,30.4621,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,30.4621,226.96 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,1600000, PASSED ,0.001179,20.222,2.71416,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,2.71416,20.222 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,1600000, PASSED 
,3.20528e-05,743.831,99.8353,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,99.8353,743.831 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,1600000, PASSED ,3.52143e-05,677.05,90.8721,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_512-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,90.8721,677.05 +Basic_REDUCE_STRUCT,Base_Seq,default,18750000, PASSED ,0.0298131,9.37161,1.25784,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,1.25784,9.37161 +Basic_REDUCE_STRUCT,Base_Seq,kahan,18750000, PASSED ,0.0410121,6.81255,0.914365,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,Seq,Base_Seq-kahan,0.79581,5.92925 +Basic_REDUCE_STRUCT,Base_Seq,cascade,18750000, PASSED ,0.0423796,6.59273,0.884861,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,Seq,Base_Seq-cascade,0.884861,6.59273 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,18750000, PASSED ,0.000869862,321.197,43.1103,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,43.1103,321.197 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,18750000, PASSED ,0.000794184,351.804,47.2183,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,41.5914,309.88 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,18750000, PASSED 
,0.00128429,217.55,29.1991,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,26.846,200.018 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,18750000, PASSED ,0.00145398,192.16,25.7913,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,25.8187,192.364 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,18750000, PASSED ,0.00100517,277.96,37.3071,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,36.8299,274.404 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,18750000, PASSED ,0.00120377,232.102,31.1522,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,26.1101,194.536 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,18750000, PASSED ,0.000125293,2229.94,299.298,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,293.055,2183.43 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,18750000, PASSED ,0.000128128,2180.61,292.677,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_6000-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,283.656,2113.4 +Basic_REDUCE_STRUCT,Base_Seq,default,200000, PASSED ,0.000214954,13.8645,1.86087,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,1.864105,13.8886 +Basic_REDUCE_STRUCT,Base_Seq,kahan,200000, PASSED 
,0.000424834,7.01505,0.941549,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-kahan,0.941001,7.010975 +Basic_REDUCE_STRUCT,Base_Seq,cascade,200000, PASSED ,0.000444093,6.71082,0.900716,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-cascade,0.9013015,6.715195 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_direct_256,200000, PASSED ,0.00118618,2.51246,0.337219,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_direct_256,0.5094515,3.795695 +Basic_REDUCE_STRUCT,Base_CUDA,blkatm_occgs_256,200000, PASSED ,0.00117806,2.52978,0.339543,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,Base_CUDA-blkatm_occgs_256,0.5080439999999999,3.78521 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_direct_256,200000, PASSED ,0.00120939,2.46425,0.330747,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_direct_256,0.501819,3.738835 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_256,200000, PASSED ,2.87783e-05,103.558,13.8994,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_256,16.71095,124.50550000000001 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_direct_new_256,200000, PASSED ,3.9239e-05,75.9507,10.194,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_direct_new_256,13.71275,102.16735 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkatm_occgs_256,200000, PASSED 
,0.00124661,2.39066,0.320871,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkatm_occgs_256,0.4819235,3.5905950000000004 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_256,200000, PASSED ,2.90087e-05,102.736,13.789,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_256,20.55425,153.1405 +Basic_REDUCE_STRUCT,RAJA_CUDA,blkdev_occgs_new_256,200000, PASSED ,3.15419e-05,94.4849,12.6816,build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1/RPBenchmark_H100_tier2/REDUCE_STRUCT_factor_64-kernel-run-data.csv,CUDA,RAJA_CUDA-blkdev_occgs_new_256,18.7269,139.52595 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_CONVECTION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_CONVECTION3DPA.csv new file mode 100644 index 0000000..e9d2a86 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_CONVECTION3DPA.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64 (raw),Base_CUDA-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_64 (raw),RAJA_CUDA-block_64 (smoothed),Base_CUDA-block_64 (raw B/W),Base_CUDA-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_64 (raw B/W),RAJA_CUDA-block_64 (smoothed B/W) +702,23.566,92.2323,16.2141,17.3277,23.1867,90.981,13.0808,51.003,8.99998,9.58193,12.8703,50.311 +2754,92.2323,223.13165,17.3277,17.4344,90.981,222.6775,51.003,123.2935,9.58193,9.635449999999999,50.311,123.042 +10989,354.031,354.031,17.799,17.3277,354.374,354.374,195.584,195.584,9.833,9.58193,195.773,195.773 +21951,638.578,638.578,17.5411,17.3277,638.979,638.979,352.724,352.724,9.68897,9.58193,352.946,352.946 
+43902,1051.88,1051.88,16.7287,17.0316,1066.92,1066.92,580.97,580.97,9.23949,9.40624,589.277,589.277 +87804,1634.96,1634.96,15.571,16.7287,1533.0,1533.0,902.974,902.974,8.59976,9.23949,846.664,846.664 +175608,2063.9,2063.9,17.0316,16.2136,2030.26,2030.26,1139.85,1139.85,9.40624,8.95436,1121.27,1121.27 +351216,2353.16,2353.16,16.2136,15.571,2343.2,2343.2,1299.59,1299.59,8.95436,8.59976,1294.09,1294.09 +702459,2484.81,2484.81,15.1397,15.1397,2413.24,2413.24,1372.29,1372.29,8.36122,8.36122,1332.77,1332.77 +1028970,2588.29,2536.55,12.5957,13.8677,2514.33,2463.785,1429.44,1400.865,6.95626,7.65874,1388.59,1360.6799999999998 +2057940,2738.0,2588.29,12.1975,12.5957,2661.73,2514.33,1512.12,1429.44,6.7363,6.95626,1470.0,1388.59 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv new file mode 100644 index 0000000..128c8ab --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +841,16.3134,74.0756,10.3907,10.4793,16.2211,74.024,14.1366,62.6523,9.00417,8.87021,14.0566,62.6087 +3844,74.0756,187.9438,10.4875,10.4834,74.024,189.181,62.6523,157.57965000000002,8.87021,8.821760000000001,62.6087,158.61435 +15876,301.812,301.812,10.4793,10.4793,304.338,304.338,252.507,252.507,8.7674,8.77331,254.62,254.62 +32400,584.269,584.269,10.5197,10.4875,581.203,581.203,487.276,487.276,8.77331,8.77331,484.718,484.718 
+65025,1046.67,1046.67,10.1739,10.4793,1058.41,1058.41,871.018,871.018,8.46653,8.7674,880.787,880.787 +131044,1744.94,1744.94,10.7407,10.1873,1755.33,1755.33,1449.86,1449.86,8.92438,8.46653,1458.49,1458.49 +264196,2752.57,2650.84,10.1873,10.1739,2752.84,2650.95,2284.61,2197.32,8.45538,8.45538,2284.84,2197.41 +528529,3316.6,2752.57,9.82016,9.82016,3332.77,2752.84,2750.66,2284.61,8.14447,8.14447,2764.07,2284.84 +1060900,2650.84,2790.09,8.96536,8.96536,2650.95,2792.87,2197.32,2312.22,7.43151,7.43151,2197.41,2314.53 +1555009,2790.09,2875.73,8.63781,8.801585,2792.87,2878.88,2312.22,2382.81,7.15839,7.29495,2314.53,2385.42 +3115225,2961.37,2790.09,8.62398,8.63781,2964.89,2792.87,2453.4,2312.22,7.14469,7.15839,2456.31,2314.53 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_INTSC_HEXHEX.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_INTSC_HEXHEX.csv new file mode 100644 index 0000000..fadb45b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_INTSC_HEXHEX.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_64 (raw),Base_CUDA-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_64 (raw),RAJA_CUDA-block_64 (smoothed),Base_CUDA-block_64 (raw B/W),Base_CUDA-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_64 (raw B/W),RAJA_CUDA-block_64 (smoothed B/W) +27,171.232,293.57,4.59175,4.62777,168.613,326.893,3.69148,6.3289,0.0989909,0.0997673,3.63502,7.04729 +64,293.57,456.764,4.62777,4.6395,326.893,476.3115,6.3289,9.8471,0.0997673,0.10002015,7.04729,10.268495 +216,619.958,619.958,4.65123,4.65123,625.73,625.73,13.3653,13.3653,0.100273,0.100273,13.4897,13.4897 +512,853.911,853.911,4.66836,4.66559,841.732,841.732,18.409,18.409,0.100642,0.100583,18.1464,18.1464 +1000,992.716,992.716,4.66559,4.66666,975.897,975.897,21.4014,21.4014,0.100583,0.100606,21.0388,21.0388 
+1728,1055.5,1055.5,4.66666,4.66836,1054.95,1054.95,22.7549,22.7549,0.100606,0.100642,22.7431,22.7431 +3375,1114.2,1114.2,4.66949,4.66666,1110.39,1110.39,24.0204,24.0204,0.100667,0.100606,23.9383,23.9383 +6859,1148.53,1148.53,4.66843,4.66666,1148.54,1148.54,24.7604,24.7604,0.100644,0.100606,24.7607,24.7607 +13824,1166.1,1166.1,4.66566,4.66843,1165.1,1165.1,25.1391,25.1391,0.100584,0.100644,25.1178,25.1178 +19683,1168.83,1167.465,4.66159,4.667045,1169.07,1167.085,25.1981,25.168599999999998,0.100496,0.10061400000000001,25.2033,25.16055 +39304,1173.67,1168.83,4.67192,4.66566,1175.37,1169.07,25.3024,25.1981,0.100719,0.100584,25.3391,25.2033 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_LTIMES.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_LTIMES.csv new file mode 100644 index 0000000..36ce8d5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_LTIMES.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-kernel_256 (raw),RAJA_CUDA-kernel_256 (smoothed),RAJA_CUDA-launch_256 (raw),RAJA_CUDA-launch_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-kernel_256 (raw B/W),RAJA_CUDA-kernel_256 (smoothed B/W),RAJA_CUDA-launch_256 (raw B/W),RAJA_CUDA-launch_256 (smoothed B/W) +1344,20.0297,73.568,5.10678,5.1042,19.6275,70.2153,19.5631,72.8381,28.1899,102.646,7.18731,7.10468,27.6239,97.9681,27.5332,101.627 +4992,73.568,149.393,5.08973,5.10416,70.2153,141.97715,72.8381,145.44055,102.646,208.06650000000002,7.10145,7.103155,97.9681,197.73855,101.627,202.564 +19392,225.218,225.218,5.1042,5.1042,213.739,213.739,218.043,218.043,313.487,313.487,7.10468,7.10468,297.509,297.509,303.501,303.501 
+38784,319.194,319.194,5.10412,5.10412,306.66,306.66,320.004,320.004,444.111,444.111,7.10163,7.10163,426.672,426.672,445.238,445.238 +77568,455.913,455.913,5.11283,5.10412,446.16,446.16,443.945,443.945,634.204,634.204,7.11226,7.10163,620.637,620.637,617.555,617.555 +154944,555.883,555.883,5.05354,5.05354,549.18,549.18,563.474,563.474,773.189,773.189,7.02907,7.02907,763.865,763.865,783.746,783.746 +309696,642.991,642.991,5.02456,5.05354,636.478,636.478,657.487,657.487,894.303,894.303,6.9884,7.02907,885.243,885.243,914.464,914.464 +619392,695.03,685.383,4.9375,5.02456,690.477,667.778,715.813,674.303,966.655,953.226,6.86713,6.9884,960.322,928.741,995.561,937.816 +1238784,685.383,695.03,5.09983,4.9375,667.778,678.176,674.303,685.086,953.226,966.655,7.0928,6.86713,928.741,943.198,937.816,952.809 +1814592,696.763,695.8965000000001,4.54707,4.742285,678.176,684.3265,685.086,691.9155000000001,969.049,967.852,6.32401,6.59557,943.198,951.76,952.809,962.3054999999999 +3629184,710.295,696.763,4.48975,4.54707,691.252,678.176,698.745,685.086,987.865,969.049,6.24426,6.32401,961.381,943.198,971.802,952.809 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_MASS3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_MASS3DPA.csv new file mode 100644 index 0000000..a5c5548 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_MASS3DPA.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_25 (raw),Base_CUDA-block_25 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_25 (raw),RAJA_CUDA-block_25 (smoothed),Base_CUDA-block_25 (raw B/W),Base_CUDA-block_25 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_25 (raw B/W),RAJA_CUDA-block_25 (smoothed B/W) +1600,32.6401,131.824,14.0527,14.9006,32.701,130.729,15.285,61.5,6.5807,6.95157,15.3135,60.989 
+6336,131.824,319.685,14.9006,14.97785,130.729,319.23650000000004,61.5,149.03,6.95157,6.984265000000001,60.989,148.82049999999998 +25344,507.546,507.546,15.0551,14.9006,507.744,507.744,236.56,236.56,7.01696,6.95157,236.652,236.652 +50624,906.382,906.382,15.0652,14.9006,907.206,907.206,422.384,422.384,7.02056,6.95157,422.768,422.768 +101184,1431.49,1431.49,14.6598,14.7777,1433.42,1433.42,667.038,667.038,6.83109,6.88576,667.937,667.937 +202368,2218.97,2218.97,14.7777,14.7395,2216.09,2216.09,1033.94,1033.94,6.88576,6.86773,1032.6,1032.6 +404736,2727.06,2727.06,14.5497,14.6598,2713.09,2713.09,1270.66,1270.66,6.77938,6.83109,1264.16,1264.16 +809536,3074.41,3074.41,14.7395,14.5497,3060.07,3060.07,1432.49,1432.49,6.86773,6.77938,1425.82,1425.82 +1619008,3196.5,3196.5,13.9085,13.9085,3174.31,3174.31,1489.37,1489.37,6.4805,6.4805,1479.04,1479.04 +2371584,3316.03,3256.2650000000003,12.5139,13.2112,3297.56,3235.935,1545.07,1517.2199999999998,5.83072,6.15561,1536.46,1507.75 +4743104,3447.69,3316.03,12.2568,12.5139,3432.84,3297.56,1606.41,1545.07,5.71091,5.83072,1599.49,1536.46 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv new file mode 100644 index 0000000..9a34598 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +64,1.03517,7.57386,5.01708,5.27123,1.24634,8.03078,3.64713,22.4171,17.6762,15.6634,4.39112,23.7695 
+512,7.57386,28.44948,5.29204,5.245785,8.03078,30.30984,22.4171,77.69455,15.6634,14.93685,23.7695,82.77024999999999 +3375,49.3251,49.3251,5.27123,5.22034,52.5889,52.5889,132.972,132.972,14.2103,14.2103,141.771,141.771 +8000,116.784,116.784,5.22034,5.22034,123.763,123.763,305.958,305.958,13.6766,13.6766,324.241,324.241 +17576,251.866,251.866,4.84513,4.84513,268.187,268.187,646.562,646.562,12.4379,12.4379,688.457,688.457 +35937,431.565,431.565,4.84351,4.84513,434.228,434.228,1091.71,1091.71,12.2524,12.4379,1098.45,1098.45 +79507,774.039,774.039,4.82689,4.84513,751.847,751.847,1932.98,1932.98,12.054,12.4101,1877.56,1877.56 +157464,1058.63,780.501,5.05904,5.05119,939.463,858.197,2620.58,1932.98,12.5233,12.3707,2325.58,2108.48 +328509,837.387,837.387,5.05119,5.05119,858.197,904.162,2057.35,2057.35,12.4101,12.3707,2108.48,2213.75 +493039,780.501,853.0274999999999,5.05256,5.051875,904.162,921.8125,1910.98,2086.765,12.3707,12.3904,2213.75,2269.665 +1000000,868.668,837.387,5.00806,5.05119,992.449,904.162,2116.18,2057.35,12.2002,12.3707,2417.72,2213.75 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv new file mode 100644 index 0000000..5c612d3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-block_256 (raw),Base_CUDA-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-block_256 (raw),RAJA_CUDA-block_256 (smoothed),Base_CUDA-block_256 (raw B/W),Base_CUDA-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-block_256 (raw B/W),RAJA_CUDA-block_256 (smoothed B/W) +80000,0.0,0.0,0.0,0.0,0.0,0.0,185.245,345.609,6.21439,7.95189,182.04,346.669 
+160000,0.0,0.0,0.0,0.0,0.0,0.0,345.609,491.93449999999996,8.07202,7.968579999999999,346.669,487.7855 +320000,0.0,0.0,0.0,0.0,0.0,0.0,638.26,638.26,7.95189,7.95189,628.902,628.902 +640000,0.0,0.0,0.0,0.0,0.0,0.0,1113.95,1113.95,7.98527,7.95189,1109.59,1109.59 +1280000,0.0,0.0,0.0,0.0,0.0,0.0,1798.43,1798.43,7.7401,7.7401,1793.54,1793.54 +2560000,0.0,0.0,0.0,0.0,0.0,0.0,2126.15,2115.68,7.04253,7.04253,2115.35,2113.59 +3750000,0.0,0.0,0.0,0.0,0.0,0.0,2188.95,2126.15,6.62487,6.62487,2192.44,2115.35 +7500000,0.0,0.0,0.0,0.0,0.0,0.0,2115.68,2188.95,6.50583,6.59158,2113.59,2192.44 +10000000,0.0,0.0,0.0,0.0,0.0,0.0,2191.86,2191.86,6.51347,6.56119,2192.79,2192.79 +12500000,0.0,0.0,0.0,0.0,0.0,0.0,2239.48,2215.67,6.59158,6.53733,2238.9,2215.8450000000003 +15000000,0.0,0.0,0.0,0.0,0.0,0.0,2265.99,2239.48,6.56119,6.56119,2261.96,2238.9 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_MULTI_REDUCE.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_MULTI_REDUCE.csv new file mode 100644 index 0000000..6dad657 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_MULTI_REDUCE.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-atomic_direct_256 (raw),Base_CUDA-atomic_direct_256 (smoothed),Base_CUDA-atomic_occgs_256 (raw),Base_CUDA-atomic_occgs_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_CUDA-atomic_direct_256 (raw),RAJA_CUDA-atomic_direct_256 (smoothed),RAJA_CUDA-atomic_occgs_256 (raw),RAJA_CUDA-atomic_occgs_256 (smoothed),Base_CUDA-atomic_direct_256 (raw B/W),Base_CUDA-atomic_direct_256 (smoothed B/W),Base_CUDA-atomic_occgs_256 (raw B/W),Base_CUDA-atomic_occgs_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_CUDA-atomic_direct_256 (raw B/W),RAJA_CUDA-atomic_direct_256 (smoothed B/W),RAJA_CUDA-atomic_occgs_256 (raw B/W),RAJA_CUDA-atomic_occgs_256 (smoothed B/W) 
+99995,0.0844437,0.168376,0.0849038,0.168555,0.467413,0.466271,0.08231,0.164063,0.0805395,0.161374,1.25844,2.50913,1.26529,2.51178,6.96569,6.94815,1.22664,2.44485,1.20025,2.40478 +199995,0.168376,0.2527835,0.168555,0.2533055,0.465023,0.4661365,0.164063,0.245373,0.161374,0.24142799999999998,2.50913,3.7669,2.51178,3.77467,6.92973,6.946105,2.44485,3.65646,2.40478,3.5976800000000004 +399995,0.337191,0.337191,0.338056,0.338056,0.466271,0.466002,0.326683,0.326683,0.321482,0.321482,5.02467,5.02467,5.03756,5.03756,6.94815,6.94406,4.86807,4.86807,4.79058,4.79058 +799995,0.674012,0.674012,0.675501,0.675501,0.466002,0.465023,0.655172,0.655172,0.643515,0.643515,10.0437,10.0437,10.0659,10.0659,6.94406,6.92973,9.76294,9.76294,9.58923,9.58923 +1599995,1.35257,1.35257,1.34734,1.34734,0.454468,0.454468,1.31265,1.31265,1.28413,1.28413,20.155,20.155,20.0771,20.0771,6.77215,6.77215,19.5602,19.5602,19.1352,19.1352 +3199995,2.79702,2.79702,2.69914,2.69914,0.428434,0.428434,2.74126,2.74126,2.67559,2.67559,41.679,41.679,40.2205,40.2205,6.38419,6.38419,40.8481,40.8481,39.8695,39.8695 +4687495,4.08824,4.08824,3.9473,3.9473,0.406664,0.406664,4.01274,4.01274,3.92618,3.92618,60.9197,60.9197,58.8195,58.8195,6.05978,6.05978,59.7946,59.7946,58.5048,58.5048 +9374995,8.20238,8.20238,7.89413,7.89413,0.395046,0.399946,8.02441,8.02441,7.7991,7.7991,122.225,122.225,117.632,117.632,5.88666,5.95966,119.573,119.573,116.216,116.216 +12499995,10.9657,10.9657,10.5733,10.5733,0.399946,0.399946,10.9321,10.9321,10.4127,10.4127,163.402,163.402,157.554,157.554,5.95966,5.95966,162.901,162.901,155.161,155.161 +15624995,13.9706,12.46815,13.2005,11.8869,0.395117,0.39753150000000004,13.729,12.330549999999999,12.9928,11.70275,208.178,185.79,196.703,177.1285,5.8877,5.92368,204.578,183.73950000000002,193.607,174.38400000000001 +18749995,16.7769,13.9706,15.7094,13.2005,0.401372,0.399946,16.721,13.729,15.6462,12.9928,249.995,208.178,234.088,196.703,5.98091,5.95966,249.162,204.578,233.146,193.607 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_REDUCE_STRUCT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_REDUCE_STRUCT.csv new file mode 100644 index 0000000..29c6a25 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Basic_REDUCE_STRUCT.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-blkatm_direct_256 (raw),Base_CUDA-blkatm_direct_256 (smoothed),Base_CUDA-blkatm_occgs_256 (raw),Base_CUDA-blkatm_occgs_256 (smoothed),Base_Seq-cascade (raw),Base_Seq-cascade (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),Base_Seq-kahan (raw),Base_Seq-kahan (smoothed),RAJA_CUDA-blkatm_direct_256 (raw),RAJA_CUDA-blkatm_direct_256 (smoothed),RAJA_CUDA-blkatm_occgs_256 (raw),RAJA_CUDA-blkatm_occgs_256 (smoothed),RAJA_CUDA-blkdev_direct_256 (raw),RAJA_CUDA-blkdev_direct_256 (smoothed),RAJA_CUDA-blkdev_direct_new_256 (raw),RAJA_CUDA-blkdev_direct_new_256 (smoothed),RAJA_CUDA-blkdev_occgs_256 (raw),RAJA_CUDA-blkdev_occgs_256 (smoothed),RAJA_CUDA-blkdev_occgs_new_256 (raw),RAJA_CUDA-blkdev_occgs_new_256 (smoothed),Base_CUDA-blkatm_direct_256 (raw B/W),Base_CUDA-blkatm_direct_256 (smoothed B/W),Base_CUDA-blkatm_occgs_256 (raw B/W),Base_CUDA-blkatm_occgs_256 (smoothed B/W),Base_Seq-cascade (raw B/W),Base_Seq-cascade (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),Base_Seq-kahan (raw B/W),Base_Seq-kahan (smoothed B/W),RAJA_CUDA-blkatm_direct_256 (raw B/W),RAJA_CUDA-blkatm_direct_256 (smoothed B/W),RAJA_CUDA-blkatm_occgs_256 (raw B/W),RAJA_CUDA-blkatm_occgs_256 (smoothed B/W),RAJA_CUDA-blkdev_direct_256 (raw B/W),RAJA_CUDA-blkdev_direct_256 (smoothed B/W),RAJA_CUDA-blkdev_direct_new_256 (raw B/W),RAJA_CUDA-blkdev_direct_new_256 (smoothed B/W),RAJA_CUDA-blkdev_occgs_256 (raw B/W),RAJA_CUDA-blkdev_occgs_256 (smoothed B/W),RAJA_CUDA-blkdev_occgs_new_256 (raw B/W),RAJA_CUDA-blkdev_occgs_new_256 (smoothed B/W) 
+100000,0.168766,0.337219,0.169245,0.339543,0.903853,0.900716,1.88462,1.86734,0.945023,0.941549,0.166349,0.330747,0.162398,0.320871,7.9428,13.8994,6.63156,10.194,7.91224,13.789,6.63305,12.6816,1.25739,2.51246,1.26096,2.52978,6.73416,6.71082,14.0414,13.9127,7.0409,7.01505,1.23939,2.46425,1.20995,2.39066,59.1779,103.558,49.4085,75.9507,58.9502,102.736,49.4196,94.4849 +200000,0.337219,0.5094515,0.339543,0.5080439999999999,0.900716,0.9013015,1.86087,1.864105,0.941549,0.941001,0.330747,0.501819,0.320871,0.4819235,13.8994,16.71095,10.194,13.71275,13.789,20.55425,12.6816,18.7269,2.51246,3.795695,2.52978,3.78521,6.71082,6.715195,13.8645,13.8886,7.01505,7.010975,2.46425,3.738835,2.39066,3.5905950000000004,103.558,124.50550000000001,75.9507,102.16735,102.736,153.1405,94.4849,139.52595 +400000,0.681684,0.681684,0.676545,0.676545,0.898034,0.900716,1.86734,1.86087,0.940453,0.940453,0.672891,0.672891,0.642976,0.642976,19.5225,19.5225,17.2315,17.2315,27.3195,27.3195,24.7722,24.7722,5.07893,5.07893,5.04064,5.04064,6.69086,6.71082,13.9127,13.8645,7.0069,7.0069,5.01342,5.01342,4.79053,4.79053,145.453,145.453,128.384,128.384,203.545,203.545,184.567,184.567 +800000,1.3726,1.3726,1.35152,1.35152,0.901887,0.898034,1.85112,1.85112,0.936778,0.936778,1.35971,1.35971,1.29153,1.29153,24.3351,24.3351,24.4619,24.4619,53.8276,53.8276,48.3652,48.3652,10.2266,10.2266,10.0696,10.0696,6.71957,6.69086,13.7919,13.7919,6.97953,6.97953,10.1306,10.1306,9.6226,9.6226,181.31,181.31,182.255,182.255,401.047,401.047,360.348,360.348 +1600000,2.78466,2.78466,2.70085,2.70085,0.885405,0.885405,1.65529,1.65529,0.905274,0.905274,2.74772,2.74772,2.71416,2.71416,27.9768,26.8071,30.4621,30.4621,99.8353,99.8353,90.8721,90.8721,20.7473,20.7473,20.1229,20.1229,6.59678,6.59678,12.3329,12.3329,6.74481,6.74481,20.4721,20.4721,20.222,20.222,208.444,199.728,226.96,226.96,743.831,743.831,677.05,677.05 
+3200000,5.59518,5.59518,5.41213,5.41213,0.785907,0.789586,1.44327,1.44327,0.81277,0.81277,5.61573,5.61573,5.35196,5.35196,27.2771,26.8071,33.0238,33.0238,141.892,141.892,133.432,133.432,41.6873,41.6873,40.3235,40.3235,5.85546,5.88288,10.7532,10.7532,6.05561,6.05561,41.8405,41.8405,39.8752,39.8752,203.23,199.728,246.047,246.047,1057.18,1057.18,994.144,994.144 +4687500,8.36953,8.36953,7.89834,7.89834,0.789586,0.789586,1.29351,1.29351,0.773354,0.782941,8.39197,8.39197,7.90503,7.90503,26.8071,26.8071,33.959,33.959,179.011,179.011,168.868,168.868,62.3578,62.3578,58.8472,58.8472,5.88288,5.88288,9.63741,9.63741,5.76193,5.83336,62.5251,62.5251,58.897,58.897,199.728,199.728,253.014,253.014,1333.73,1333.73,1258.16,1258.16 +9375000,17.6844,17.6844,15.7914,15.7914,0.762034,0.789586,1.23009,1.26501,0.777216,0.782941,17.964,17.964,15.7837,15.7837,26.1292,26.1292,36.0028,36.0028,245.362,245.362,215.979,215.979,131.759,131.759,117.655,117.655,5.67759,5.88288,9.16486,9.42505,5.79071,5.83336,133.842,133.842,117.597,117.597,194.678,194.678,268.242,268.242,1828.09,1828.09,1609.17,1609.17 +12500000,24.6832,24.6832,21.0566,21.0566,0.886289,0.882995,1.26501,1.25784,0.782941,0.782941,24.0924,24.0924,20.9218,20.9218,25.9751,25.9751,36.6949,36.6949,272.671,272.671,263.766,263.766,183.904,183.904,156.884,156.884,6.60337,6.57882,9.42505,9.37161,5.83336,5.83336,179.502,179.502,155.879,155.879,193.53,193.53,273.398,273.398,2031.56,2031.56,1965.21,1965.21 +15625000,43.2689,33.89675,41.5914,31.323999999999998,0.882995,0.883928,1.2444,1.25112,0.79581,0.7893755,26.846,25.4692,26.1101,23.51595,25.8187,25.896900000000002,36.8299,36.7624,293.055,282.863,283.656,273.711,322.379,252.5505,309.88,233.382,6.57882,6.585775,9.2715,9.321555,5.92925,5.881304999999999,200.018,189.76,194.536,175.20749999999998,192.364,192.947,274.404,273.901,2183.43,2107.495,2113.4,2039.305 
+18750000,43.1103,43.1103,47.2183,41.5914,0.884861,0.884861,1.25784,1.25784,0.914365,0.79581,29.1991,26.846,31.1522,26.1101,25.7913,25.8187,37.3071,36.8299,299.298,293.055,292.677,283.656,321.197,321.197,351.804,309.88,6.59273,6.59273,9.37161,9.37161,6.81255,5.92925,217.55,200.018,232.102,194.536,192.16,192.364,277.96,274.404,2229.94,2183.43,2180.61,2113.4 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv new file mode 100644 index 0000000..6156485 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_H100_tier2/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv @@ -0,0 +1,12 @@ +Problem size,Base_CUDA-direct_1024 (raw),Base_CUDA-direct_1024 (smoothed),Base_Seq-direct (raw),Base_Seq-direct (smoothed),RAJA_CUDA-direct_1024 (raw),RAJA_CUDA-direct_1024 (smoothed),RAJA_CUDA-funcptr_1024 (raw),RAJA_CUDA-funcptr_1024 (smoothed),RAJA_CUDA-virtfunc_1024 (raw),RAJA_CUDA-virtfunc_1024 (smoothed),Base_CUDA-direct_1024 (raw B/W),Base_CUDA-direct_1024 (smoothed B/W),Base_Seq-direct (raw B/W),Base_Seq-direct (smoothed B/W),RAJA_CUDA-direct_1024 (raw B/W),RAJA_CUDA-direct_1024 (smoothed B/W),RAJA_CUDA-funcptr_1024 (raw B/W),RAJA_CUDA-funcptr_1024 (smoothed B/W),RAJA_CUDA-virtfunc_1024 (raw B/W),RAJA_CUDA-virtfunc_1024 (smoothed B/W) +42875,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,27.8679,38.7235,37.5249,35.4562,24.3736,35.0238,22.4841,32.7541,22.6106,32.4712 +91125,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,38.7235,45.114900000000006,35.4562,30.61465,35.0238,37.6458,32.7541,38.2547,32.4712,37.9915 +205379,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,51.5063,51.5063,25.7731,25.7731,40.2678,40.2678,43.7553,43.7553,43.5118,43.5118 +421875,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,60.5788,60.5788,19.5101,19.5101,58.8854,58.8854,55.7691,55.7691,55.5149,55.5149 
+884736,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,78.1177,73.5342,15.2354,15.2354,74.6275,74.6275,69.6403,69.6403,70.7258,70.7258 +1860867,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,73.5342,78.1177,14.1839,14.1839,75.5354,75.5354,72.6788,72.6788,72.5391,72.5391 +2744000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,88.3422,83.5172,13.453,13.453,87.001,83.7469,82.5619,79.0234,82.1592,78.0234 +5639752,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,83.8245,83.8245,11.488,11.488,84.1051,84.1051,79.0234,79.2586,78.0234,78.8235 +7645373,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,83.5172,83.9146,11.4005,11.4005,83.7469,84.1051,79.2586,79.2586,78.8235,78.8235 +9528128,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,93.1066,83.86955,10.815,11.10775,93.3876,83.92599999999999,87.1422,79.14099999999999,87.6568,78.64425 +11543176,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,83.9146,83.9146,8.71324,10.815,83.4915,83.7469,78.9519,79.2586,78.465,78.8235 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..e3bb57d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +405,16.244,6.47622,16.9284 +1566,60.7029,6.58336,62.8621 +6183,178.287,5.97172,181.757 +12339,244.958,5.62009,242.58 +24678,343.264,4.6109,341.959 +49329,368.25,5.46811,390.553 +98631,409.361,3.87975,426.04 +197262,437.666,1.47934,453.017 +394524,344.694,1.2619,354.82 +577935,325.335,1.4086,333.594 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..4e84ecd --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +405,60.7029,6.47622,62.8621 +1566,119.49495,6.22397,122.30955 +6183,178.287,5.97172,181.757 +12339,244.958,5.62009,242.58 +24678,343.264,5.46811,341.959 +49329,368.25,4.6109,390.553 +98631,368.25,3.87975,390.553 +197262,368.25,1.47934,390.553 +394524,377.02750000000003,1.4439700000000002,390.43 +577935,344.694,1.4086,354.82 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_flops_raw.csv new file mode 100644 index 0000000..49488b8 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +405,24.2929,9.68515,25.3164 +1566,91.0123,9.87048,94.2495 +6183,267.484,8.95938,272.69 +12339,367.553,8.43279,363.984 +24678,515.086,6.91891,513.128 +49329,552.595,8.20543,586.063 +98631,614.295,5.82203,639.324 +197262,656.775,2.21994,679.812 +394524,517.261,1.89364,532.456 +577935,488.21,2.1138,500.604 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_flops_smoothed.csv new file mode 100644 index 0000000..f8e9181 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_DIFFUSION3DPA_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +405,91.0123,9.68515,94.2495 +1566,179.24814999999998,9.322265,183.46975 +6183,267.484,8.95938,272.69 +12339,367.553,8.43279,363.984 +24678,515.086,8.20543,513.128 +49329,552.595,6.91891,586.063 +98631,552.595,5.82203,586.063 +197262,552.595,2.21994,586.063 
+394524,565.778,2.16687,585.89 +577935,517.261,2.1138,532.456 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_bandwidth_raw.csv new file mode 100644 index 0000000..cb2ea38 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,1.36819,0.0204122,1.8982 +3375,5.77634,0.0197187,7.64611 +17576,9.05878,0.0193809,9.46373 +35937,9.52453,0.0192874,10.8367 +79507,9.97035,0.0191751,10.2362 +166375,10.0119,0.0191437,10.0301 +343000,10.3195,0.0190992,10.4729 +704969,10.6345,0.019035,10.7633 +1442897,10.7398,0.0190027,10.8304 +2146689,10.744,0.0189847,10.8443 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..d3fbd18 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,5.77634,0.0197187,7.64611 +3375,7.41756,0.0195498,8.55492 +17576,9.05878,0.0193809,9.46373 +35937,9.52453,0.0192874,10.0301 +79507,9.97035,0.0191751,10.2362 +166375,10.0119,0.0191437,10.4729 +343000,10.3195,0.0190992,10.4729 +704969,10.6345,0.019035,10.7633 +1442897,10.687149999999999,0.01901885,10.79685 +2146689,10.7398,0.0190027,10.8304 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_flops_raw.csv new file mode 100644 index 0000000..29eb933 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_flops_raw.csv @@ -0,0 +1,11 @@ +Problem 
size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,560.006,8.35478,776.939 +3375,2446.5,8.35162,3238.42 +17576,3908.01,8.36103,4082.7 +35937,4131.92,8.36724,4701.17 +79507,4346.65,8.35954,4462.53 +166375,4380.49,8.37593,4388.43 +343000,4527.7,8.37984,4595.03 +704969,4676.26,8.37013,4732.87 +1442897,4730.76,8.37049,4770.69 +2146689,4736.46,8.36932,4780.67 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_flops_smoothed.csv new file mode 100644 index 0000000..5502768 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_EDGE3D_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,2446.5,8.35478,3238.42 +3375,3177.255,8.357904999999999,3660.56 +17576,3908.01,8.35954,4082.7 +35937,4131.92,8.36103,4388.43 +79507,4346.65,8.36724,4462.53 +166375,4380.49,8.37013,4595.03 +343000,4527.7,8.37049,4595.03 +704969,4676.26,8.37049,4732.87 +1442897,4703.51,8.37031,4751.78 +2146689,4730.76,8.37013,4770.69 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_bandwidth_raw.csv new file mode 100644 index 0000000..c5c2dd3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +417,5.95104,39.4271,7.02906 +1667,23.5696,40.8146,37.0113 +6667,91.3822,40.4766,147.673 +13334,195.225,38.6982,302.715 +26667,388.829,38.2125,582.554 +53334,770.744,39.2795,861.156 +106667,579.227,38.8749,576.567 +213334,573.135,31.957,571.807 +426667,597.937,25.6852,589.757 +625000,599.038,24.9927,599.411 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_bandwidth_smoothed.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_bandwidth_smoothed.csv new file mode 100644 index 0000000..32fd1a2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +417,23.5696,40.4766,37.0113 +1667,57.475899999999996,39.95185,92.34215 +6667,91.3822,39.4271,147.673 +13334,195.225,39.2795,302.715 +26667,388.829,38.8749,576.567 +53334,573.135,38.6982,576.567 +106667,579.227,38.2125,582.554 +213334,597.937,31.957,589.757 +426667,588.582,28.8211,583.162 +625000,597.937,25.6852,589.757 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_flops_raw.csv new file mode 100644 index 0000000..f645514 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +417,1.62705,10.7796,1.92179 +1667,6.44407,11.159,10.1191 +6667,24.9845,11.0666,40.3748 +13334,53.3759,10.5804,82.7643 +26667,106.308,10.4475,159.274 +53334,210.727,10.7393,235.446 +106667,158.364,10.6286,157.637 +213334,156.699,8.73726,156.336 +426667,163.48,7.0225,161.243 +625000,163.781,6.83318,163.883 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_flops_smoothed.csv new file mode 100644 index 0000000..575036f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_ENERGY_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +417,6.44407,11.0666,10.1191 +1667,15.714285,10.9231,25.24695 +6667,24.9845,10.7796,40.3748 +13334,53.3759,10.7393,82.7643 +26667,106.308,10.6286,157.637 
+53334,156.699,10.5804,157.637 +106667,158.364,10.4475,159.274 +213334,163.48,8.73726,161.243 +426667,160.922,7.87988,159.44 +625000,163.48,7.0225,161.243 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_bandwidth_raw.csv new file mode 100644 index 0000000..a5fb34d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_bandwidth_raw.csv @@ -0,0 +1,10 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,11.4746,0.6036360000000001,12.40105 +73728,18.5512,0.57432,19.9817 +144000,27.4057,0.462276,29.0971 +248832,35.957,0.420849,37.5482 +395136,37.471,0.428621,40.524 +589824,44.4605,0.425644,42.9218 +839808,46.932,0.387519,49.2199 +1152000,44.2472,0.377586,46.6927 +1533312,43.8905,0.411853,46.3573 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_bandwidth_smoothed.csv new file mode 100644 index 0000000..bfcfbc1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_bandwidth_smoothed.csv @@ -0,0 +1,10 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,15.024750000000001,0.5885345,16.19475 +73728,18.5512,0.57432,19.9817 +144000,27.4057,0.462276,29.0971 +248832,35.957,0.428621,37.5482 +395136,37.471,0.425644,40.524 +589824,44.2472,0.420849,42.9218 +839808,44.2472,0.411853,46.3573 +1152000,44.35385,0.399686,46.525000000000006 +1533312,44.2472,0.387519,46.6927 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_flops_raw.csv new file mode 100644 index 0000000..49174e8 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_flops_raw.csv @@ -0,0 +1,10 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,63.895700000000005,3.3613150000000003,69.0547 +73728,100.518,3.11191,108.269 +144000,146.182,2.46577,155.203 +248832,189.847,2.22201,198.248 +395136,196.428,2.2469,212.433 +589824,231.835,2.21948,223.812 +839808,243.725,2.01244,255.606 +1152000,229.037,1.9545,241.696 +1533312,226.592,2.12626,239.328 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_flops_smoothed.csv new file mode 100644 index 0000000..376b48b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_FEMSWEEP_flops_smoothed.csv @@ -0,0 +1,10 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,82.2728,3.23414,88.68065 +73728,100.518,3.11191,108.269 +144000,146.182,2.46577,155.203 +248832,189.847,2.2469,198.248 +395136,196.428,2.22201,212.433 +589824,229.037,2.21948,223.812 +839808,229.037,2.12626,239.328 +1152000,230.436,2.06935,240.512 +1533312,229.037,2.01244,241.696 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_bandwidth_raw.csv new file mode 100644 index 0000000..2689c60 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1728,0.300447,0.0511849,0.298721 +5832,0.951003,0.0533866,0.948242 +17576,1.46924,0.0538508,1.49487 +39304,1.5415,0.0539456,1.5502 +74088,1.72573,0.0538376,1.7118 +140608,1.77869,0.0539579,1.79187 +287496,1.79347,0.053867,1.75128 +551368,1.81102,0.053863,1.86199 +1124864,1.88875,0.0537387,1.89168 +1643032,1.89481,0.0536954,1.89039 
diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv new file mode 100644 index 0000000..aa82629 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1728,0.951003,0.0533866,0.948242 +5832,1.2101215,0.0536187,1.221556 +17576,1.46924,0.0538376,1.49487 +39304,1.5415,0.0538508,1.5502 +74088,1.72573,0.053867,1.7118 +140608,1.77869,0.053867,1.75128 +287496,1.79347,0.053863,1.79187 +551368,1.81102,0.053863,1.86199 +1124864,1.849885,0.05380085,1.87619 +1643032,1.88875,0.0537387,1.89039 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_flops_raw.csv new file mode 100644 index 0000000..6ed79f5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1728,23.8161,4.05739,23.6793 +5832,76.4015,4.28896,76.1797 +17576,118.946,4.35962,121.021 +39304,125.284,4.38435,125.991 +74088,140.587,4.38589,139.452 +140608,145.176,4.40402,146.252 +287496,146.625,4.4039,143.176 +551368,148.237,4.40881,152.408 +1124864,154.757,4.40316,154.998 +1643032,155.324,4.4016,154.961 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_flops_smoothed.csv new file mode 100644 index 0000000..8ba9a7b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_INTSC_HEXRECT_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem 
size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1728,76.4015,4.28896,76.1797 +5832,97.67375,4.3242899999999995,98.60034999999999 +17576,118.946,4.35962,121.021 +39304,125.284,4.38435,125.991 +74088,140.587,4.38589,139.452 +140608,145.176,4.4039,143.176 +287496,146.625,4.4039,146.252 +551368,148.237,4.4039,152.408 +1124864,151.497,4.40353,153.6845 +1643032,154.757,4.40316,154.961 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_bandwidth_raw.csv new file mode 100644 index 0000000..5fae2ed --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +196608,6.82688,0.0879186,5.98395,3.20441 +389120,12.8137,0.0882862,11.4439,5.63946 +778240,23.3652,0.0879253,20.8792,5.25612 +1556480,26.2855,0.0877564,27.2853,6.76388 +3108864,36.5373,0.0873663,42.5442,7.33737 +6213632,33.0333,0.0874635,41.1283,7.48462 +9101312,35.9133,0.0875556,45.1167,7.3024 +12423168,40.8521,0.08774,49.0714,7.69642 +18198528,38.8189,0.0873937,48.8683,7.70027 +24260608,39.5485,0.087801,50.085,7.77038 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_bandwidth_smoothed.csv new file mode 100644 index 0000000..68b4dec --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +196608,12.8137,0.0879253,11.4439,5.25612 +389120,18.08945,0.08792195,16.16155,5.4477899999999995 
+778240,23.3652,0.0879186,20.8792,5.63946 +1556480,26.2855,0.0877564,27.2853,6.76388 +3108864,33.0333,0.0875556,41.1283,7.3024 +6213632,35.9133,0.0875556,42.5442,7.33737 +9101312,36.5373,0.0874635,45.1167,7.48462 +12423168,38.8189,0.0875556,48.8683,7.69642 +18198528,39.1837,0.0876478,48.969849999999994,7.698345 +24260608,39.5485,0.08774,49.0714,7.70027 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_flops_raw.csv new file mode 100644 index 0000000..8dceea6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +196608,6.22346,0.0801476,5.45503,2.92117 +389120,11.6817,0.0804867,10.4329,5.14124 +778240,21.3016,0.0801596,19.0351,4.79189 +1556480,23.9642,0.0800066,24.8758,6.16656 +3108864,33.3109,0.0796515,38.7873,6.68945 +6213632,30.1164,0.0797404,37.4966,6.82371 +9101312,32.7421,0.0798244,41.1328,6.65759 +12423168,37.2449,0.0799925,44.7383,7.01683 +18198528,35.3912,0.0796768,44.5533,7.02034 +24260608,36.0564,0.0800482,45.6625,7.08426 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_flops_smoothed.csv new file mode 100644 index 0000000..f4ab02a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DEA_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +196608,11.6817,0.0801596,10.4329,4.79189 +389120,16.49165,0.08015359999999999,14.734,4.966565 +778240,21.3016,0.0801476,19.0351,5.14124 
+1556480,23.9642,0.0800066,24.8758,6.16656 +3108864,30.1164,0.0798244,37.4966,6.65759 +6213632,32.7421,0.0798244,38.7873,6.68945 +9101312,33.3109,0.0797404,41.1328,6.82371 +12423168,35.3912,0.0798244,44.5533,7.01683 +18198528,35.7238,0.07990844999999999,44.6458,7.018585 +24260608,36.0564,0.0799925,44.7383,7.02034 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv new file mode 100644 index 0000000..d7f630d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +729,20.5641,5.04932,19.8433 +3375,74.8639,4.9566,73.4013 +9261,146.083,4.69623,144.821 +19683,183.315,4.7032,184.193 +35937,208.66,4.70308,199.478 +68921,199.773,4.67384,194.828 +132651,204.558,4.649,206.143 +250047,197.078,4.48718,198.375 +531441,178.764,3.97743,184.162 +753571,178.479,4.02294,179.078 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv new file mode 100644 index 0000000..ae5bfe4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +729,74.8639,4.9566,73.4013 +3375,110.47345,4.8299,109.11115000000001 +9261,146.083,4.7032,144.821 +19683,183.315,4.70308,184.193 +35937,199.773,4.69623,194.828 +68921,199.773,4.67384,198.375 +132651,199.773,4.649,198.375 +250047,197.078,4.48718,194.828 +531441,187.921,4.25506,191.26850000000002 +753571,178.764,4.02294,184.162 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_flops_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_flops_raw.csv new file mode 100644 index 0000000..7fc2433 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +729,41.1061,10.0932,39.6654 +3375,155.613,10.3028,152.573 +9261,308.146,9.90615,305.484 +19683,389.674,9.99765,391.541 +35937,445.663,10.045,426.052 +68921,428.424,10.0233,417.819 +132651,440.106,10.0023,443.516 +250047,425.069,9.6782,427.867 +531441,386.463,8.59865,398.134 +753571,386.187,8.70474,387.484 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv new file mode 100644 index 0000000..3a0cfa5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +729,155.613,10.0932,152.573 +3375,231.8795,10.045425,229.0285 +9261,308.146,10.045,305.484 +19683,389.674,10.0233,391.541 +35937,428.424,10.0023,417.819 +68921,428.424,10.0023,426.052 +132651,428.424,10.0023,426.052 +250047,425.069,9.6782,417.819 +531441,405.766,9.191469999999999,413.0005 +753571,386.463,8.70474,398.134 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..c61a8c7 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 
+5376,12.19,5.86309,3.28712,6.43497,12.1008,4.55125 +21312,44.5988,22.0971,3.36096,24.5696,44.2338,17.2593 +85056,86.7307,60.3189,3.29603,68.9384,86.2078,53.3042 +169920,132.107,96.2002,3.29467,118.49,131.876,93.5856 +339840,173.608,128.838,3.29211,140.567,173.132,106.312 +679680,178.961,129.091,3.29348,132.423,175.869,92.3834 +1359360,177.128,130.436,3.32126,135.0,177.477,93.6736 +2718720,172.411,132.677,3.27381,138.586,170.242,96.7789 +5437248,164.129,129.855,3.3161,135.267,162.211,84.0754 +7964736,164.12,131.333,3.32505,135.74,162.534,84.1268 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..5cfb0ab --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +5376,44.5988,22.0971,3.29603,24.5696,44.2338,17.2593 +21312,65.66475,41.208,3.29535,46.754000000000005,65.2208,35.28175 +85056,86.7307,60.3189,3.29467,68.9384,86.2078,53.3042 +169920,132.107,96.2002,3.29467,118.49,131.876,92.3834 +339840,173.608,128.838,3.29467,132.423,173.132,93.5856 +679680,173.608,129.091,3.29348,135.0,173.132,93.6736 +1359360,173.608,129.855,3.29348,135.267,173.132,93.6736 +2718720,172.411,130.436,3.3161,135.267,170.242,92.3834 +5437248,168.26999999999998,130.8845,3.31868,135.5035,166.38799999999998,88.9002 +7964736,164.129,131.333,3.3161,135.74,162.534,84.1268 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_flops_raw.csv new file mode 100644 index 0000000..fe04b91 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +5376,39.8862,19.1842,10.7556,21.0554,39.5942,14.8918 +21312,146.136,72.4048,11.0127,80.5064,144.939,56.553 +85056,284.29,197.716,10.8039,225.969,282.576,174.723 +169920,433.053,315.348,10.8001,388.416,432.295,306.778 +339840,569.111,422.349,10.792,460.798,567.55,348.506 +679680,586.668,423.185,10.7966,434.108,576.532,302.85 +1359360,580.662,427.596,10.8878,442.559,581.807,307.082 +2718720,565.203,434.945,10.7323,454.317,558.09,317.263 +5437248,538.055,425.694,10.8709,443.436,531.766,275.619 +7964736,538.024,430.541,10.9003,444.989,532.825,275.787 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_flops_smoothed.csv new file mode 100644 index 0000000..7549567 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_MASSVEC3DPA_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +5376,146.136,72.4048,10.8039,80.5064,144.939,56.553 +21312,215.21300000000002,135.06040000000002,10.802,153.2377,213.7575,115.638 +85056,284.29,197.716,10.8001,225.969,282.576,174.723 +169920,433.053,315.348,10.8001,388.416,432.295,302.85 +339840,569.111,422.349,10.8001,434.108,567.55,306.778 +679680,569.111,423.185,10.7966,442.559,567.55,307.082 +1359360,569.111,425.694,10.7966,443.436,567.55,307.082 +2718720,565.203,427.596,10.8709,443.436,558.09,302.85 +5437248,551.6289999999999,429.0685,10.87935,444.2125,545.4575,291.43449999999996 
+7964736,538.055,430.541,10.8709,444.989,532.825,275.787 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv new file mode 100644 index 0000000..8bed640 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1000,13.0067,5.37512,17.5648 +5832,60.8403,4.96773,61.284 +27000,105.753,4.72527,107.933 +54872,114.164,4.64042,114.301 +117649,120.424,4.59871,121.275 +238328,122.931,4.54776,123.632 +493039,121.164,4.53122,121.388 +1000000,122.989,4.45236,123.014 +2048383,123.892,4.44515,124.023 +2985984,123.804,4.42601,123.707 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..dbbc04f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1000,60.8403,4.96773,61.284 +5832,83.29665,4.846500000000001,84.6085 +27000,105.753,4.72527,107.933 +54872,114.164,4.64042,114.301 +117649,120.424,4.59871,121.275 +238328,121.164,4.54776,121.388 +493039,122.931,4.53122,123.014 +1000000,122.989,4.45236,123.632 +2048383,123.3965,4.448755,123.3605 +2985984,123.804,4.44515,123.707 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv new file mode 100644 index 0000000..746c7e8 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1000,3.37014,1.39273,4.55118 +5832,16.8863,1.3788,17.0095 +27000,30.367,1.35685,30.9928 +54872,33.1336,1.34679,33.1735 +117649,35.2651,1.34669,35.5144 +238328,36.2331,1.34042,36.4398 +493039,35.8999,1.34257,35.9665 +1000000,36.5871,1.3245,36.5946 +2048383,36.9741,1.3266,37.0132 +2985984,36.9993,1.32274,36.9704 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv new file mode 100644 index 0000000..a1d7e44 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1000,16.8863,1.3788,17.0095 +5832,23.626649999999998,1.3678249999999998,24.00115 +27000,30.367,1.35685,30.9928 +54872,33.1336,1.34679,33.1735 +117649,35.2651,1.34669,35.5144 +238328,35.8999,1.34257,35.9665 +493039,36.2331,1.34042,36.4398 +1000000,36.5871,1.3266,36.5946 +2048383,36.7806,1.32555,36.7825 +2985984,36.9741,1.3245,36.9704 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_bandwidth_raw.csv new file mode 100644 index 0000000..c5d19c7 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,13.7292,7.02031,19.5946 +3375,60.5007,6.71414,81.7623 +17576,192.769,6.92586,194.023 +35937,231.35,6.86628,260.304 +79507,250.995,6.81545,277.975 +166375,248.726,6.71395,253.724 +343000,254.87,6.69096,255.439 +704969,265.303,6.48104,267.485 
+1442897,238.451,6.38656,237.412 +2146689,234.813,5.84542,236.557 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..6aa693c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,60.5007,6.92586,81.7623 +3375,126.63485,6.89607,137.89265 +17576,192.769,6.86628,194.023 +35937,231.35,6.81545,253.724 +79507,248.726,6.81545,255.439 +166375,250.995,6.71395,260.304 +343000,250.995,6.69096,255.439 +704969,248.726,6.48104,253.724 +1442897,246.6605,6.4338,246.4255 +2146689,238.451,6.38656,237.412 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_flops_raw.csv new file mode 100644 index 0000000..a249ad8 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +512,30.6189,15.6567,43.6999 +3375,139.621,15.4946,188.688 +17576,453.129,16.2801,456.074 +35937,546.86,16.2304,615.301 +79507,596.22,16.1896,660.309 +166375,592.96,16.006,604.875 +343000,609.31,15.9959,610.668 +704969,635.654,15.5283,640.881 +1442897,572.313,15.3286,569.819 +2146689,564.035,14.0411,568.225 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_flops_smoothed.csv new file mode 100644 index 0000000..dbb773d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/Apps_VOL3D_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 
+512,139.621,15.6567,188.688 +3375,296.375,15.94355,322.381 +17576,453.129,16.1896,456.074 +35937,546.86,16.1896,604.875 +79507,592.96,16.1896,610.668 +166375,596.22,16.006,615.301 +343000,596.22,15.9959,610.668 +704969,592.96,15.5283,604.875 +1442897,590.8115,15.42845,590.2435 +2146689,572.313,15.3286,569.819 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_DIFFUSION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_DIFFUSION3DPA.csv new file mode 100644 index 0000000..fd8a4c5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_DIFFUSION3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DIFFUSION3DPA-Base_Seq-default,405.0,9.68515,6.47622 +Apps_DIFFUSION3DPA-Base_HIP-block_64,24678.0,515.086,343.264 +Apps_DIFFUSION3DPA-RAJA_HIP-block_64,24678.0,513.128,341.959 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_EDGE3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_EDGE3D.csv new file mode 100644 index 0000000..de4d346 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_EDGE3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_EDGE3D-Base_Seq-default,512.0,8.35478,0.0204122 +Apps_EDGE3D-Base_HIP-block_256,79507.0,4346.65,9.97035 +Apps_EDGE3D-RAJA_HIP-block_256,35937.0,4701.17,10.8367 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_ENERGY.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_ENERGY.csv new file mode 100644 index 0000000..9e6daee --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_ENERGY.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_ENERGY-Base_Seq-default,417.0,10.7796,39.4271 +Apps_ENERGY-Base_HIP-block_256,53334.0,210.727,770.744 +Apps_ENERGY-RAJA_HIP-block_256,26667.0,159.274,582.554 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_FEMSWEEP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_FEMSWEEP.csv new file mode 100644 index 0000000..d82ba80 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_FEMSWEEP.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_FEMSWEEP-Base_Seq-default,31104.0,3.35637,0.602749 +Apps_FEMSWEEP-Base_HIP-block_64,589824.0,231.835,44.4605 +Apps_FEMSWEEP-RAJA_HIP-block_64,589824.0,223.812,42.9218 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_INTSC_HEXRECT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_INTSC_HEXRECT.csv new file mode 100644 index 0000000..6683c07 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_INTSC_HEXRECT.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_INTSC_HEXRECT-Base_Seq-default,1728.0,4.05739,0.0511849 +Apps_INTSC_HEXRECT-Base_HIP-block_64,74088.0,140.587,1.72573 +Apps_INTSC_HEXRECT-RAJA_HIP-block_64,140608.0,146.252,1.79187 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASS3DEA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASS3DEA.csv new file mode 100644 index 0000000..88db681 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASS3DEA.csv @@ -0,0 +1,5 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MASS3DEA-Base_Seq-default,196608.0,0.0801476,0.0879186 +Apps_MASS3DEA-Base_HIP-compile_time_block_stride_loop_64,6213632.0,30.1164,33.0333 +Apps_MASS3DEA-RAJA_HIP-compile_time_block_stride_loop_64,3108864.0,6.68945,7.33737 +Apps_MASS3DEA-RAJA_HIP-cached_block_stride_loop_64,9101312.0,41.1328,45.1167 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASS3DPA_ATOMIC.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASS3DPA_ATOMIC.csv new file mode 100644 index 0000000..4001f3b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASS3DPA_ATOMIC.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MASS3DPA_ATOMIC-Base_Seq-default,729.0,10.0932,5.04932 +Apps_MASS3DPA_ATOMIC-Base_HIP-block_64,19683.0,389.674,183.315 +Apps_MASS3DPA_ATOMIC-RAJA_HIP-block_64,19683.0,391.541,184.193 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASSVEC3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASSVEC3DPA.csv new file mode 100644 index 0000000..f86ac43 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_MASSVEC3DPA.csv @@ -0,0 +1,7 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MASSVEC3DPA-Base_Seq-default,5376.0,10.7556,3.28712 +Apps_MASSVEC3DPA-Base_HIP-runtime_block_stride_loop_64,339840.0,422.349,128.838 +Apps_MASSVEC3DPA-Base_HIP-direct_64,339840.0,569.111,173.608 +Apps_MASSVEC3DPA-RAJA_HIP-runtime_block_stride_loop_64,169920.0,306.778,93.5856 +Apps_MASSVEC3DPA-RAJA_HIP-direct_64,339840.0,567.55,173.132 +Apps_MASSVEC3DPA-RAJA_HIP-cached_block_stride_loop_64,339840.0,460.798,140.567 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_NODAL_ACCUMULATION_3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_NODAL_ACCUMULATION_3D.csv new file mode 100644 index 0000000..cbc3c1b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_NODAL_ACCUMULATION_3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_NODAL_ACCUMULATION_3D-Base_Seq-default,1000.0,1.39273,5.37512 +Apps_NODAL_ACCUMULATION_3D-Base_HIP-block_256,117649.0,35.2651,120.424 +Apps_NODAL_ACCUMULATION_3D-RAJA_HIP-block_256,117649.0,35.5144,121.275 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_VOL3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_VOL3D.csv new file mode 100644 index 0000000..b4830dd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/Apps_VOL3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_VOL3D-Base_Seq-default,512.0,15.6567,7.02031 +Apps_VOL3D-Base_HIP-block_256,35937.0,546.86,231.35 +Apps_VOL3D-RAJA_HIP-block_256,35937.0,615.301,260.304 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/combined_fom.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/combined_fom.csv new file mode 100644 index 0000000..9de8861 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/FOM/combined_fom.csv @@ -0,0 +1,35 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DIFFUSION3DPA-Base_HIP-block_64,24678.0,515.086,343.264 +Apps_DIFFUSION3DPA-Base_Seq-default,405.0,9.68515,6.47622 +Apps_DIFFUSION3DPA-RAJA_HIP-block_64,24678.0,513.128,341.959 +Apps_EDGE3D-Base_HIP-block_256,79507.0,4346.65,9.97035 +Apps_EDGE3D-Base_Seq-default,512.0,8.35478,0.0204122 +Apps_EDGE3D-RAJA_HIP-block_256,35937.0,4701.17,10.8367 +Apps_ENERGY-Base_HIP-block_256,53334.0,210.727,770.744 +Apps_ENERGY-Base_Seq-default,417.0,10.7796,39.4271 +Apps_ENERGY-RAJA_HIP-block_256,26667.0,159.274,582.554 +Apps_FEMSWEEP-Base_HIP-block_64,589824.0,231.835,44.4605 +Apps_FEMSWEEP-Base_Seq-default,31104.0,3.35637,0.602749 +Apps_FEMSWEEP-RAJA_HIP-block_64,589824.0,223.812,42.9218 +Apps_INTSC_HEXRECT-Base_HIP-block_64,74088.0,140.587,1.72573 +Apps_INTSC_HEXRECT-Base_Seq-default,1728.0,4.05739,0.0511849 +Apps_INTSC_HEXRECT-RAJA_HIP-block_64,140608.0,146.252,1.79187 +Apps_MASS3DEA-Base_HIP-compile_time_block_stride_loop_64,6213632.0,30.1164,33.0333 +Apps_MASS3DEA-Base_Seq-default,196608.0,0.0801476,0.0879186 +Apps_MASS3DEA-RAJA_HIP-cached_block_stride_loop_64,9101312.0,41.1328,45.1167 +Apps_MASS3DEA-RAJA_HIP-compile_time_block_stride_loop_64,3108864.0,6.68945,7.33737 +Apps_MASS3DPA_ATOMIC-Base_HIP-block_64,19683.0,389.674,183.315 +Apps_MASS3DPA_ATOMIC-Base_Seq-default,729.0,10.0932,5.04932 +Apps_MASS3DPA_ATOMIC-RAJA_HIP-block_64,19683.0,391.541,184.193 +Apps_MASSVEC3DPA-Base_HIP-direct_64,339840.0,569.111,173.608 
+Apps_MASSVEC3DPA-Base_HIP-runtime_block_stride_loop_64,339840.0,422.349,128.838 +Apps_MASSVEC3DPA-Base_Seq-default,5376.0,10.7556,3.28712 +Apps_MASSVEC3DPA-RAJA_HIP-cached_block_stride_loop_64,339840.0,460.798,140.567 +Apps_MASSVEC3DPA-RAJA_HIP-direct_64,339840.0,567.55,173.132 +Apps_MASSVEC3DPA-RAJA_HIP-runtime_block_stride_loop_64,169920.0,306.778,93.5856 +Apps_NODAL_ACCUMULATION_3D-Base_HIP-block_256,117649.0,35.2651,120.424 +Apps_NODAL_ACCUMULATION_3D-Base_Seq-default,1000.0,1.39273,5.37512 +Apps_NODAL_ACCUMULATION_3D-RAJA_HIP-block_256,117649.0,35.5144,121.275 +Apps_VOL3D-Base_HIP-block_256,35937.0,546.86,231.35 +Apps_VOL3D-Base_Seq-default,512.0,15.6567,7.02031 +Apps_VOL3D-RAJA_HIP-block_256,35937.0,615.301,260.304 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/combined_table.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/combined_table.csv new file mode 100644 index 0000000..c303266 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/combined_table.csv @@ -0,0 +1,341 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning +Apps_DIFFUSION3DPA,Base_Seq,default,405, PASSED ,8.05202e-06,6.47622,9.68515,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,405, PASSED ,3.2102e-06,16.244,24.2929,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,405, PASSED ,3.08042e-06,16.9284,25.3164,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,394524, PASSED 
,0.0401172,1.2619,1.89364,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,394524, PASSED ,0.000146866,344.694,517.261,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,394524, PASSED ,0.000142674,354.82,532.456,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,49329, PASSED ,0.0011576,5.46811,8.20543,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,49329, PASSED ,1.7189e-05,368.25,552.595,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,49329, PASSED ,1.62074e-05,390.553,586.063,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,577935, PASSED ,0.0526467,1.4086,2.1138,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,577935, PASSED ,0.000227944,325.335,488.21,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,577935, PASSED 
,0.000222301,333.594,500.604,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,6183, PASSED ,0.000132885,5.97172,8.95938,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,6183, PASSED ,4.451e-06,178.287,267.484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,6183, PASSED ,4.36602e-06,181.757,272.69,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,98631, PASSED ,0.00326208,3.87975,5.82203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,98631, PASSED ,3.09167e-05,409.361,614.295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,98631, PASSED ,2.97063e-05,426.04,639.324,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,12339, PASSED ,0.000281751,5.62009,8.43279,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,12339, PASSED 
,6.46422e-06,244.958,367.553,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,12339, PASSED ,6.5276e-06,242.58,363.984,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,1566, PASSED ,3.05499e-05,6.58336,9.87048,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,1566, PASSED ,3.3132e-06,60.7029,91.0123,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,1566, PASSED ,3.1994e-06,62.8621,94.2495,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,197262, PASSED ,0.0171103,1.47934,2.21994,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,197262, PASSED ,5.7834e-05,437.666,656.775,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,197262, PASSED ,5.58741e-05,453.017,679.812,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,24678, PASSED 
,0.000686797,4.6109,6.91891,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,24678, PASSED ,9.22542e-06,343.264,515.086,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,24678, PASSED ,9.26062e-06,341.959,513.128,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_EDGE3D,Base_Seq,default,512, PASSED ,0.0022364,0.0204122,8.35478,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,512, PASSED ,3.3365e-05,1.36819,560.006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,512, PASSED ,2.4049e-05,1.8982,776.939,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,1442897, PASSED ,2.48478,0.0190027,8.37049,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,1442897, PASSED ,0.00439651,10.7398,4730.76,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,1442897, PASSED ,0.00435971,10.8304,4770.69,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,166375, PASSED 
,0.312837,0.0191437,8.37593,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,166375, PASSED ,0.000598175,10.0119,4380.49,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,166375, PASSED ,0.000597092,10.0301,4388.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,2146689, PASSED ,3.65821,0.0189847,8.36932,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,2146689, PASSED ,0.00646406,10.744,4736.46,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,2146689, PASSED ,0.00640428,10.8443,4780.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,17576, PASSED ,0.0397288,0.0193809,8.36103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,17576, PASSED ,8.49982e-05,9.05878,3908.01,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,17576, PASSED ,8.13612e-05,9.46373,4082.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,343000, PASSED 
,0.621483,0.0190992,8.37984,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,343000, PASSED ,0.00115024,10.3195,4527.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,343000, PASSED ,0.00113338,10.4729,4595.03,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,35937, PASSED ,0.0755499,0.0192874,8.36724,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,35937, PASSED ,0.00015299,9.52453,4131.92,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,35937, PASSED ,0.000134465,10.8367,4701.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,3375, PASSED ,0.00964672,0.0197187,8.35162,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,3375, PASSED ,3.2931e-05,5.77634,2446.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,3375, PASSED ,2.48781e-05,7.64611,3238.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,704969, PASSED 
,1.24224,0.019035,8.37013,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,704969, PASSED ,0.00222351,10.6345,4676.26,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,704969, PASSED ,0.00219691,10.7633,4732.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,79507, PASSED ,0.156979,0.0191751,8.35954,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,79507, PASSED ,0.000301904,9.97035,4346.65,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,79507, PASSED ,0.000294064,10.2362,4462.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,417, PASSED ,2.12762e-06,39.4271,10.7796,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,417, PASSED ,1.4096e-05,5.95104,1.62705,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,417, PASSED ,1.19342e-05,7.02906,1.92179,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,426667, PASSED 
,0.00334164,25.6852,7.0225,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,426667, PASSED ,0.000143545,597.937,163.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,426667, PASSED ,0.000145536,589.757,161.243,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,53334, PASSED ,0.000273144,39.2795,10.7393,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,53334, PASSED ,1.39203e-05,770.744,210.727,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,53334, PASSED ,1.24588e-05,861.156,235.446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,625000, PASSED ,0.0050306,24.9927,6.83318,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,625000, PASSED ,0.000209884,599.038,163.781,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,625000, PASSED ,0.000209753,599.411,163.883,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,6667, PASSED 
,3.31345e-05,40.4766,11.0666,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,6667, PASSED ,1.46765e-05,91.3822,24.9845,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,6667, PASSED ,9.08202e-06,147.673,40.3748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,106667, PASSED ,0.000551969,38.8749,10.6286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,106667, PASSED ,3.70455e-05,579.227,158.364,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,106667, PASSED ,3.72164e-05,576.567,157.637,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,13334, PASSED ,6.93143e-05,38.6982,10.5804,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,13334, PASSED ,1.37397e-05,195.225,53.3759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,13334, PASSED ,8.86095e-06,302.715,82.7643,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,1667, PASSED 
,8.21625e-06,40.8146,11.159,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,1667, PASSED ,1.42278e-05,23.5696,6.44407,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,1667, PASSED ,9.06056e-06,37.0113,10.1191,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,213334, PASSED ,0.00134291,31.957,8.73726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,213334, PASSED ,7.48785e-05,573.135,156.699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,213334, PASSED ,7.50524e-05,571.807,156.336,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,26667, PASSED ,0.000140386,38.2125,10.4475,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,26667, PASSED ,1.37965e-05,388.829,106.308,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,26667, PASSED ,9.20857e-06,582.554,159.274,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_FEMSWEEP,Base_Seq,default,395136, PASSED 
,0.152243,0.428621,2.2469,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,395136, PASSED ,0.00174147,37.471,196.428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,395136, PASSED ,0.00161027,40.524,212.433,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,73728, PASSED ,0.0201147,0.57432,3.11191,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,73728, PASSED ,0.000622722,18.5512,100.518,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,73728, PASSED ,0.000578142,19.9817,108.269,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,589824, PASSED ,0.230803,0.425644,2.21948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,589824, PASSED ,0.0022096,44.4605,231.835,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,589824, PASSED ,0.00228881,42.9218,223.812,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,839808, PASSED 
,0.363337,0.387519,2.01244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,839808, PASSED ,0.00300008,46.932,243.725,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,839808, PASSED ,0.00286063,49.2199,255.606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,144000, PASSED ,0.0500367,0.462276,2.46577,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,144000, PASSED ,0.000844012,27.4057,146.182,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,144000, PASSED ,0.000794952,29.0971,155.203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,1152000, PASSED ,0.5142,0.377586,1.9545,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,1152000, PASSED ,0.00438795,44.2472,229.037,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,1152000, PASSED ,0.00415813,46.6927,241.696,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED 
,0.00774733,0.602749,3.35637,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,31104, PASSED ,0.000407801,11.4509,63.7638,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,31104, PASSED ,0.000376761,12.3943,69.0171,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,1533312, PASSED ,0.630138,0.411853,2.12626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,1533312, PASSED ,0.00591299,43.8905,226.592,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,1533312, PASSED ,0.00559834,46.3573,239.328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,248832, PASSED ,0.096531,0.420849,2.22201,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,248832, PASSED ,0.00112982,35.957,189.847,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,248832, PASSED ,0.00108194,37.5482,198.248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED 
,0.00772459,0.604523,3.36626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,31104, PASSED ,0.000406121,11.4983,64.0276,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,31104, PASSED ,0.000376351,12.4078,69.0923,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,1728, PASSED ,0.0015332,0.0511849,4.05739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,1728, PASSED ,0.000261201,0.300447,23.8161,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1728, PASSED ,0.00026271,0.298721,23.6793,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,1124864, PASSED ,0.919682,0.0537387,4.40316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,1124864, PASSED ,0.0261668,1.88875,154.757,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1124864, PASSED ,0.0261263,1.89168,154.998,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 
+Apps_INTSC_HEXRECT,Base_Seq,default,140608, PASSED ,0.114938,0.0539579,4.40402,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,140608, PASSED ,0.00348672,1.77869,145.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,140608, PASSED ,0.00346108,1.79187,146.252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,1643032, PASSED ,1.34381,0.0536954,4.4016,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,1643032, PASSED ,0.0380811,1.89481,155.324,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1643032, PASSED ,0.0381702,1.89039,154.961,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,17576, PASSED ,0.0145135,0.0538508,4.35962,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,17576, PASSED ,0.000531951,1.46924,118.946,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,17576, PASSED 
,0.000522831,1.49487,121.021,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,287496, PASSED ,0.235016,0.053867,4.4039,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,287496, PASSED ,0.00705871,1.79347,146.625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,287496, PASSED ,0.00722877,1.75128,143.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,39304, PASSED ,0.0322726,0.0539456,4.38435,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,39304, PASSED ,0.00112939,1.5415,125.284,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,39304, PASSED ,0.00112305,1.5502,125.991,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,5832, PASSED ,0.00489517,0.0533866,4.28896,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,5832, PASSED 
,0.000274801,0.951003,76.4015,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,5832, PASSED ,0.000275601,0.948242,76.1797,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,551368, PASSED ,0.450218,0.053863,4.40881,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,551368, PASSED ,0.0133902,1.81102,148.237,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,551368, PASSED ,0.0130237,1.86199,152.408,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,74088, PASSED ,0.0608124,0.0538376,4.38589,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,74088, PASSED ,0.00189716,1.72573,140.587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,74088, PASSED ,0.0019126,1.7118,139.452,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DEA,Base_Seq,default,6213632, PASSED 
,0.545463,0.0874635,0.0797404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,6213632, PASSED ,0.00144424,33.0333,30.1164,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,6213632, PASSED ,0.00637416,7.48462,6.82371,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,6213632, PASSED ,0.00115998,41.1283,37.4966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,778240, PASSED ,0.0679604,0.0879253,0.0801596,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.000255741,23.3652,21.3016,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.00113685,5.25612,4.79189,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,778240, PASSED 
,0.000286191,20.8792,19.0351,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,9101312, PASSED ,0.798117,0.0875556,0.0798244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,9101312, PASSED ,0.00194579,35.9133,32.7421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,9101312, PASSED ,0.00956941,7.3024,6.65759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,9101312, PASSED ,0.00154886,45.1167,41.1328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,12423168, PASSED ,1.08713,0.08774,0.0799925,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.00233488,40.8521,37.2449,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.0123934,7.69642,7.01683,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 
+Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,12423168, PASSED ,0.00194379,49.0714,44.7383,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,1556480, PASSED ,0.136181,0.0877564,0.0800066,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.000454651,26.2855,23.9642,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.00176684,6.76388,6.16656,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,1556480, PASSED ,0.000437991,27.2853,24.8758,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,18198528, PASSED ,1.59883,0.0873937,0.0796768,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,18198528, PASSED ,0.00359947,38.8189,35.3912,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,18198528, PASSED 
,0.0181458,7.70027,7.02034,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,18198528, PASSED ,0.00285927,48.8683,44.5533,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,196608, PASSED ,0.0171715,0.0879186,0.0801476,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,196608, PASSED ,0.00022114,6.82688,6.22346,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,196608, PASSED ,0.000471131,3.20441,2.92117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,196608, PASSED ,0.000252291,5.98395,5.45503,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,24260608, PASSED ,2.12153,0.087801,0.0800482,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,24260608, PASSED ,0.00470996,39.5485,36.0564,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 
+Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,24260608, PASSED ,0.023972,7.77038,7.08426,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,24260608, PASSED ,0.00371912,50.085,45.6625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,3108864, PASSED ,0.273216,0.0873663,0.0796515,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.000653302,36.5373,33.3109,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.00325319,7.33737,6.68945,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,3108864, PASSED ,0.000561061,42.5442,38.7873,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,389120, PASSED ,0.0338421,0.0882862,0.0804867,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,389120, PASSED 
,0.000233171,12.8137,11.6817,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,389120, PASSED ,0.000529802,5.63946,5.14124,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,389120, PASSED ,0.000261081,11.4439,10.4329,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,729, PASSED ,1.18384e-05,5.04932,10.0932,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,729, PASSED ,2.90682e-06,20.5641,41.1061,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,729, PASSED ,3.0124e-06,19.8433,39.6654,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,531441, PASSED ,0.0138961,3.97743,8.59865,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,531441, PASSED ,0.000309184,178.764,386.463,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,531441, PASSED 
,0.00030012,184.162,398.134,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,68921, PASSED ,0.00149013,4.67384,10.0233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,68921, PASSED ,3.48627e-05,199.773,428.424,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,68921, PASSED ,3.57475e-05,194.828,417.819,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,753571, PASSED ,0.0195446,4.02294,8.70474,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,753571, PASSED ,0.000440539,178.479,386.187,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,753571, PASSED ,0.000439064,179.078,387.484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,9261, PASSED ,0.000188469,4.69623,9.90615,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,9261, PASSED 
,6.05882e-06,146.083,308.146,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,9261, PASSED ,6.11162e-06,144.821,305.484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,132651, PASSED ,0.00291651,4.649,10.0023,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,132651, PASSED ,6.62838e-05,204.558,440.106,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,132651, PASSED ,6.57742e-05,206.143,443.516,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,19683, PASSED ,0.000410276,4.7032,9.99765,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,19683, PASSED ,1.05262e-05,183.315,389.674,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,19683, PASSED ,1.0476e-05,184.193,391.541,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,3375, PASSED 
,6.21558e-05,4.9566,10.3028,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,3375, PASSED ,4.11522e-06,74.8639,155.613,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,3375, PASSED ,4.19722e-06,73.4013,152.573,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,250047, PASSED ,0.00574692,4.48718,9.6782,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,250047, PASSED ,0.000130849,197.078,425.069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,250047, PASSED ,0.000129993,198.375,427.867,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,35937, PASSED ,0.000761298,4.70308,10.045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,35937, PASSED ,1.71592e-05,208.66,445.663,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,35937, PASSED 
,1.7949e-05,199.478,426.052,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASSVEC3DPA,Base_Seq,default,5376, PASSED ,1.43702e-05,3.28712,10.7556,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,5376, PASSED ,8.05662e-06,5.86309,19.1842,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,5376, PASSED ,3.87502e-06,12.19,39.8862,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,5376, PASSED ,1.03788e-05,4.55125,14.8918,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,5376, PASSED ,3.9036e-06,12.1008,39.5942,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,5376, PASSED ,7.34062e-06,6.43497,21.0554,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,5437248, PASSED ,0.0143797,3.3161,10.8709,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,5437248, PASSED 
,0.000367214,129.855,425.694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,5437248, PASSED ,0.00029053,164.129,538.055,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,5437248, PASSED ,0.000567163,84.0754,275.619,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,5437248, PASSED ,0.000293966,162.211,531.766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,5437248, PASSED ,0.000352522,135.267,443.436,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,679680, PASSED ,0.0018099,3.29348,10.7966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,679680, PASSED ,4.61755e-05,129.091,423.185,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,679680, PASSED ,3.33081e-05,178.961,586.668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,679680, PASSED 
,6.4523e-05,92.3834,302.85,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,679680, PASSED ,3.38937e-05,175.869,576.532,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,679680, PASSED ,4.50137e-05,132.423,434.108,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,7964736, PASSED ,0.0210073,3.32505,10.9003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,7964736, PASSED ,0.000531857,131.333,430.541,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,7964736, PASSED ,0.000425606,164.12,538.024,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,7964736, PASSED ,0.000830299,84.1268,275.787,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,7964736, PASSED ,0.000429759,162.534,532.825,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,7964736, PASSED 
,0.000514589,135.74,444.989,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,85056, PASSED ,0.000226341,3.29603,10.8039,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,85056, PASSED ,1.2368e-05,60.3189,197.716,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,85056, PASSED ,8.60164e-06,86.7307,284.29,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,85056, PASSED ,1.39956e-05,53.3042,174.723,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,85056, PASSED ,8.65382e-06,86.2078,282.576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,85056, PASSED ,1.08216e-05,68.9384,225.969,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,1359360, PASSED ,0.00358948,3.32126,10.8878,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,1359360, PASSED 
,9.13985e-05,130.436,427.596,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,1359360, PASSED ,6.73052e-05,177.128,580.662,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,1359360, PASSED ,0.000127268,93.6736,307.082,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,1359360, PASSED ,6.71728e-05,177.477,581.807,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,1359360, PASSED ,8.83082e-05,135.0,442.559,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,169920, PASSED ,0.000452331,3.29467,10.8001,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,169920, PASSED ,1.54914e-05,96.2002,315.348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,169920, PASSED ,1.12808e-05,132.107,433.053,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,169920, PASSED 
,1.59242e-05,93.5856,306.778,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,169920, PASSED ,1.13006e-05,131.876,432.295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,169920, PASSED ,1.25772e-05,118.49,388.416,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,21312, PASSED ,5.56373e-05,3.36096,11.0127,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,21312, PASSED ,8.46242e-06,22.0971,72.4048,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,21312, PASSED ,4.19282e-06,44.5988,146.136,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,21312, PASSED ,1.08344e-05,17.2593,56.553,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,21312, PASSED ,4.22742e-06,44.2338,144.939,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,21312, PASSED 
,7.61082e-06,24.5696,80.5064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,2718720, PASSED ,0.00728298,3.27381,10.7323,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,2718720, PASSED ,0.000179708,132.677,434.945,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,2718720, PASSED ,0.000138292,172.411,565.203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,2718720, PASSED ,0.000246367,96.7789,317.263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,2718720, PASSED ,0.000140055,170.242,558.09,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,2718720, PASSED ,0.000172045,138.586,454.317,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,339840, PASSED ,0.000905337,3.29211,10.792,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,339840, PASSED 
,2.31335e-05,128.838,422.349,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,339840, PASSED ,1.71678e-05,173.608,569.111,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,339840, PASSED ,2.80351e-05,106.312,348.506,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,339840, PASSED ,1.72151e-05,173.132,567.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,339840, PASSED ,2.12032e-05,140.567,460.798,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000, PASSED ,6.46211e-06,5.37512,1.39273,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,1000, PASSED ,2.67051e-06,13.0067,3.37014,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,1000, PASSED ,1.97751e-06,17.5648,4.55118,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2048383, PASSED 
,0.0138968,4.44515,1.3266,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2048383, PASSED ,0.000498605,123.892,36.9741,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2048383, PASSED ,0.000498078,124.023,37.0132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,238328, PASSED ,0.00160021,4.54776,1.34042,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,238328, PASSED ,5.91987e-05,122.931,36.2331,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,238328, PASSED ,5.8863e-05,123.632,36.4398,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2985984, PASSED ,0.0203169,4.42601,1.32274,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2985984, PASSED ,0.000726334,123.804,36.9993,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2985984, PASSED 
,0.000726902,123.707,36.9704,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,27000, PASSED ,0.000179091,4.72527,1.35685,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,27000, PASSED ,8.00212e-06,105.753,30.367,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,27000, PASSED ,7.84052e-06,107.933,30.9928,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,493039, PASSED ,0.00330512,4.53122,1.34257,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,493039, PASSED ,0.000123603,121.164,35.8999,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,493039, PASSED ,0.000123375,121.388,35.9665,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,54872, PASSED ,0.000366686,4.64042,1.34679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,54872, PASSED 
,1.49047e-05,114.164,33.1336,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,54872, PASSED ,1.48868e-05,114.301,33.1735,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,5832, PASSED ,3.80678e-05,4.96773,1.3788,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,5832, PASSED ,3.10831e-06,60.8403,16.8863,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,5832, PASSED ,3.08581e-06,61.284,17.0095,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000000, PASSED ,0.00679502,4.45236,1.3245,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,1000000, PASSED ,0.000245989,122.989,36.5871,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,1000000, PASSED ,0.000245938,123.014,36.5946,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,117649, PASSED 
,0.000786253,4.59871,1.34669,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,117649, PASSED ,3.00252e-05,120.424,35.2651,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,117649, PASSED ,2.98144e-05,121.275,35.5144,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,512, PASSED ,6.50252e-06,7.02031,15.6567,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,512, PASSED ,3.32501e-06,13.7292,30.6189,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,512, PASSED ,2.32971e-06,19.5946,43.6999,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,1442897, PASSED ,0.00739325,6.38656,15.3286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,1442897, PASSED ,0.000198018,238.451,572.313,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,1442897, PASSED ,0.000198884,237.412,569.819,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 
+Apps_VOL3D,Base_Seq,default,166375, PASSED ,0.000892002,6.71395,16.006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,166375, PASSED ,2.40782e-05,248.726,592.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,166375, PASSED ,2.36039e-05,253.724,604.875,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,2146689, PASSED ,0.0118811,5.84542,14.0411,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,2146689, PASSED ,0.000295768,234.813,564.035,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,2146689, PASSED ,0.000293587,236.557,568.225,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,17576, PASSED ,0.000111175,6.92586,16.2801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,17576, PASSED ,3.99431e-06,192.769,453.129,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,17576, PASSED ,3.96851e-06,194.023,456.074,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,343000, PASSED 
,0.00177401,6.69096,15.9959,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,343000, PASSED ,4.6572e-05,254.87,609.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,343000, PASSED ,4.64684e-05,255.439,610.668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,35937, PASSED ,0.00021222,6.86628,16.2304,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,35937, PASSED ,6.29852e-06,231.35,546.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,35937, PASSED ,5.59792e-06,260.304,615.301,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,3375, PASSED ,2.83314e-05,6.71414,15.4946,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,3375, PASSED ,3.14411e-06,60.5007,139.621,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,3375, PASSED ,2.32651e-06,81.7623,188.688,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,704969, PASSED 
,0.00364849,6.48104,15.5283,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,704969, PASSED ,8.91282e-05,265.303,635.654,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,704969, PASSED ,8.84012e-05,267.485,640.881,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,79507, PASSED ,0.000441656,6.81545,16.1896,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,79507, PASSED ,1.19926e-05,250.995,596.22,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,79507, PASSED ,1.08286e-05,277.975,660.309,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_DIFFUSION3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_DIFFUSION3DPA_bandwidth.png new file mode 100644 index 0000000..c52667c Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_DIFFUSION3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_DIFFUSION3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_DIFFUSION3DPA_flops.png new file mode 100644 index 0000000..737e6b6 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_DIFFUSION3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_EDGE3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_EDGE3D_bandwidth.png new file mode 100644 index 0000000..0029081 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_EDGE3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_EDGE3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_EDGE3D_flops.png new file mode 100644 index 0000000..6556c29 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_EDGE3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_ENERGY_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_ENERGY_bandwidth.png new file mode 100644 index 0000000..a520991 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_ENERGY_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_ENERGY_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_ENERGY_flops.png new file mode 100644 index 0000000..914de9e Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_ENERGY_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_FEMSWEEP_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_FEMSWEEP_bandwidth.png new file mode 100644 index 0000000..7b0a750 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_FEMSWEEP_bandwidth.png differ diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_FEMSWEEP_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_FEMSWEEP_flops.png new file mode 100644 index 0000000..a3bc649 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_FEMSWEEP_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_INTSC_HEXRECT_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_INTSC_HEXRECT_bandwidth.png new file mode 100644 index 0000000..5d05355 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_INTSC_HEXRECT_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_INTSC_HEXRECT_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_INTSC_HEXRECT_flops.png new file mode 100644 index 0000000..dd3976a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_INTSC_HEXRECT_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DEA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DEA_bandwidth.png new file mode 100644 index 0000000..08ad776 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DEA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DEA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DEA_flops.png new file mode 100644 index 0000000..e7be150 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DEA_flops.png differ diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png new file mode 100644 index 0000000..f05b923 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DPA_ATOMIC_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DPA_ATOMIC_flops.png new file mode 100644 index 0000000..6fd449a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASS3DPA_ATOMIC_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASSVEC3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASSVEC3DPA_bandwidth.png new file mode 100644 index 0000000..7523d21 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASSVEC3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASSVEC3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASSVEC3DPA_flops.png new file mode 100644 index 0000000..5a92c55 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_MASSVEC3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png new file mode 100644 index 0000000..3138a5e Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png differ diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_NODAL_ACCUMULATION_3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_NODAL_ACCUMULATION_3D_flops.png new file mode 100644 index 0000000..44e51f5 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_NODAL_ACCUMULATION_3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_VOL3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_VOL3D_bandwidth.png new file mode 100644 index 0000000..057c7ac Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_VOL3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_VOL3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_VOL3D_flops.png new file mode 100644 index 0000000..04ec41d Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/figures/Apps_VOL3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/output_with_variant_tuning.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/output_with_variant_tuning.csv new file mode 100644 index 0000000..f4400f3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/output_with_variant_tuning.csv @@ -0,0 +1,341 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning,Smoothed Mean flops (gigaFLOP per sec.),Smoothed Bandwidth (GiB per sec.) 
+Apps_DIFFUSION3DPA,Base_Seq,default,405, PASSED ,8.05202e-06,6.47622,9.68515,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,9.68515,6.47622 +Apps_DIFFUSION3DPA,Base_HIP,block_64,405, PASSED ,3.2102e-06,16.244,24.2929,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,91.0123,60.7029 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,405, PASSED ,3.08042e-06,16.9284,25.3164,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,94.2495,62.8621 +Apps_DIFFUSION3DPA,Base_Seq,default,394524, PASSED ,0.0401172,1.2619,1.89364,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,2.16687,1.4439700000000002 +Apps_DIFFUSION3DPA,Base_HIP,block_64,394524, PASSED ,0.000146866,344.694,517.261,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,565.778,377.02750000000003 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,394524, PASSED ,0.000142674,354.82,532.456,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,585.89,390.43 +Apps_DIFFUSION3DPA,Base_Seq,default,49329, PASSED ,0.0011576,5.46811,8.20543,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,6.91891,4.6109 +Apps_DIFFUSION3DPA,Base_HIP,block_64,49329, PASSED ,1.7189e-05,368.25,552.595,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,552.595,368.25 
+Apps_DIFFUSION3DPA,RAJA_HIP,block_64,49329, PASSED ,1.62074e-05,390.553,586.063,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,586.063,390.553 +Apps_DIFFUSION3DPA,Base_Seq,default,577935, PASSED ,0.0526467,1.4086,2.1138,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,2.1138,1.4086 +Apps_DIFFUSION3DPA,Base_HIP,block_64,577935, PASSED ,0.000227944,325.335,488.21,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,517.261,344.694 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,577935, PASSED ,0.000222301,333.594,500.604,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,532.456,354.82 +Apps_DIFFUSION3DPA,Base_Seq,default,6183, PASSED ,0.000132885,5.97172,8.95938,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,8.95938,5.97172 +Apps_DIFFUSION3DPA,Base_HIP,block_64,6183, PASSED ,4.451e-06,178.287,267.484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,267.484,178.287 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,6183, PASSED ,4.36602e-06,181.757,272.69,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,272.69,181.757 +Apps_DIFFUSION3DPA,Base_Seq,default,98631, PASSED ,0.00326208,3.87975,5.82203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,5.82203,3.87975 
+Apps_DIFFUSION3DPA,Base_HIP,block_64,98631, PASSED ,3.09167e-05,409.361,614.295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,552.595,368.25 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,98631, PASSED ,2.97063e-05,426.04,639.324,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,586.063,390.553 +Apps_DIFFUSION3DPA,Base_Seq,default,12339, PASSED ,0.000281751,5.62009,8.43279,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,8.43279,5.62009 +Apps_DIFFUSION3DPA,Base_HIP,block_64,12339, PASSED ,6.46422e-06,244.958,367.553,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,367.553,244.958 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,12339, PASSED ,6.5276e-06,242.58,363.984,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,363.984,242.58 +Apps_DIFFUSION3DPA,Base_Seq,default,1566, PASSED ,3.05499e-05,6.58336,9.87048,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,9.322265,6.22397 +Apps_DIFFUSION3DPA,Base_HIP,block_64,1566, PASSED ,3.3132e-06,60.7029,91.0123,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,179.24814999999998,119.49495 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,1566, PASSED ,3.1994e-06,62.8621,94.2495,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,183.46975,122.30955 
+Apps_DIFFUSION3DPA,Base_Seq,default,197262, PASSED ,0.0171103,1.47934,2.21994,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,2.21994,1.47934 +Apps_DIFFUSION3DPA,Base_HIP,block_64,197262, PASSED ,5.7834e-05,437.666,656.775,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,552.595,368.25 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,197262, PASSED ,5.58741e-05,453.017,679.812,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,586.063,390.553 +Apps_DIFFUSION3DPA,Base_Seq,default,24678, PASSED ,0.000686797,4.6109,6.91891,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,8.20543,5.46811 +Apps_DIFFUSION3DPA,Base_HIP,block_64,24678, PASSED ,9.22542e-06,343.264,515.086,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,515.086,343.264 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,24678, PASSED ,9.26062e-06,341.959,513.128,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,513.128,341.959 +Apps_EDGE3D,Base_Seq,default,512, PASSED ,0.0022364,0.0204122,8.35478,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,8.35478,0.0197187 +Apps_EDGE3D,Base_HIP,block_256,512, PASSED ,3.3365e-05,1.36819,560.006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,2446.5,5.77634 +Apps_EDGE3D,RAJA_HIP,block_256,512, PASSED 
,2.4049e-05,1.8982,776.939,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,3238.42,7.64611 +Apps_EDGE3D,Base_Seq,default,1442897, PASSED ,2.48478,0.0190027,8.37049,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,8.37031,0.01901885 +Apps_EDGE3D,Base_HIP,block_256,1442897, PASSED ,0.00439651,10.7398,4730.76,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,4703.51,10.687149999999999 +Apps_EDGE3D,RAJA_HIP,block_256,1442897, PASSED ,0.00435971,10.8304,4770.69,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4751.78,10.79685 +Apps_EDGE3D,Base_Seq,default,166375, PASSED ,0.312837,0.0191437,8.37593,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,8.37013,0.0191437 +Apps_EDGE3D,Base_HIP,block_256,166375, PASSED ,0.000598175,10.0119,4380.49,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,4380.49,10.0119 +Apps_EDGE3D,RAJA_HIP,block_256,166375, PASSED ,0.000597092,10.0301,4388.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4595.03,10.4729 +Apps_EDGE3D,Base_Seq,default,2146689, PASSED ,3.65821,0.0189847,8.36932,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,8.37013,0.0190027 +Apps_EDGE3D,Base_HIP,block_256,2146689, PASSED 
,0.00646406,10.744,4736.46,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,4730.76,10.7398 +Apps_EDGE3D,RAJA_HIP,block_256,2146689, PASSED ,0.00640428,10.8443,4780.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4770.69,10.8304 +Apps_EDGE3D,Base_Seq,default,17576, PASSED ,0.0397288,0.0193809,8.36103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,8.35954,0.0193809 +Apps_EDGE3D,Base_HIP,block_256,17576, PASSED ,8.49982e-05,9.05878,3908.01,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,3908.01,9.05878 +Apps_EDGE3D,RAJA_HIP,block_256,17576, PASSED ,8.13612e-05,9.46373,4082.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4082.7,9.46373 +Apps_EDGE3D,Base_Seq,default,343000, PASSED ,0.621483,0.0190992,8.37984,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,8.37049,0.0190992 +Apps_EDGE3D,Base_HIP,block_256,343000, PASSED ,0.00115024,10.3195,4527.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,4527.7,10.3195 +Apps_EDGE3D,RAJA_HIP,block_256,343000, PASSED ,0.00113338,10.4729,4595.03,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4595.03,10.4729 +Apps_EDGE3D,Base_Seq,default,35937, PASSED 
,0.0755499,0.0192874,8.36724,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,8.36103,0.0192874 +Apps_EDGE3D,Base_HIP,block_256,35937, PASSED ,0.00015299,9.52453,4131.92,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,4131.92,9.52453 +Apps_EDGE3D,RAJA_HIP,block_256,35937, PASSED ,0.000134465,10.8367,4701.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4388.43,10.0301 +Apps_EDGE3D,Base_Seq,default,3375, PASSED ,0.00964672,0.0197187,8.35162,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,8.357904999999999,0.0195498 +Apps_EDGE3D,Base_HIP,block_256,3375, PASSED ,3.2931e-05,5.77634,2446.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,3177.255,7.41756 +Apps_EDGE3D,RAJA_HIP,block_256,3375, PASSED ,2.48781e-05,7.64611,3238.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,3660.56,8.55492 +Apps_EDGE3D,Base_Seq,default,704969, PASSED ,1.24224,0.019035,8.37013,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,8.37049,0.019035 +Apps_EDGE3D,Base_HIP,block_256,704969, PASSED ,0.00222351,10.6345,4676.26,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,4676.26,10.6345 +Apps_EDGE3D,RAJA_HIP,block_256,704969, PASSED 
,0.00219691,10.7633,4732.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4732.87,10.7633 +Apps_EDGE3D,Base_Seq,default,79507, PASSED ,0.156979,0.0191751,8.35954,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,8.36724,0.0191751 +Apps_EDGE3D,Base_HIP,block_256,79507, PASSED ,0.000301904,9.97035,4346.65,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,4346.65,9.97035 +Apps_EDGE3D,RAJA_HIP,block_256,79507, PASSED ,0.000294064,10.2362,4462.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,4462.53,10.2362 +Apps_ENERGY,Base_Seq,default,417, PASSED ,2.12762e-06,39.4271,10.7796,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,11.0666,40.4766 +Apps_ENERGY,Base_HIP,block_256,417, PASSED ,1.4096e-05,5.95104,1.62705,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,6.44407,23.5696 +Apps_ENERGY,RAJA_HIP,block_256,417, PASSED ,1.19342e-05,7.02906,1.92179,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,10.1191,37.0113 +Apps_ENERGY,Base_Seq,default,426667, PASSED ,0.00334164,25.6852,7.0225,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,7.87988,28.8211 +Apps_ENERGY,Base_HIP,block_256,426667, PASSED 
,0.000143545,597.937,163.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,160.922,588.582 +Apps_ENERGY,RAJA_HIP,block_256,426667, PASSED ,0.000145536,589.757,161.243,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,159.44,583.162 +Apps_ENERGY,Base_Seq,default,53334, PASSED ,0.000273144,39.2795,10.7393,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.5804,38.6982 +Apps_ENERGY,Base_HIP,block_256,53334, PASSED ,1.39203e-05,770.744,210.727,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,156.699,573.135 +Apps_ENERGY,RAJA_HIP,block_256,53334, PASSED ,1.24588e-05,861.156,235.446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,157.637,576.567 +Apps_ENERGY,Base_Seq,default,625000, PASSED ,0.0050306,24.9927,6.83318,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,7.0225,25.6852 +Apps_ENERGY,Base_HIP,block_256,625000, PASSED ,0.000209884,599.038,163.781,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,163.48,597.937 +Apps_ENERGY,RAJA_HIP,block_256,625000, PASSED ,0.000209753,599.411,163.883,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,161.243,589.757 +Apps_ENERGY,Base_Seq,default,6667, PASSED 
,3.31345e-05,40.4766,11.0666,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.7796,39.4271 +Apps_ENERGY,Base_HIP,block_256,6667, PASSED ,1.46765e-05,91.3822,24.9845,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,24.9845,91.3822 +Apps_ENERGY,RAJA_HIP,block_256,6667, PASSED ,9.08202e-06,147.673,40.3748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,40.3748,147.673 +Apps_ENERGY,Base_Seq,default,106667, PASSED ,0.000551969,38.8749,10.6286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.4475,38.2125 +Apps_ENERGY,Base_HIP,block_256,106667, PASSED ,3.70455e-05,579.227,158.364,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,158.364,579.227 +Apps_ENERGY,RAJA_HIP,block_256,106667, PASSED ,3.72164e-05,576.567,157.637,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,159.274,582.554 +Apps_ENERGY,Base_Seq,default,13334, PASSED ,6.93143e-05,38.6982,10.5804,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.7393,39.2795 +Apps_ENERGY,Base_HIP,block_256,13334, PASSED ,1.37397e-05,195.225,53.3759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,53.3759,195.225 +Apps_ENERGY,RAJA_HIP,block_256,13334, PASSED 
,8.86095e-06,302.715,82.7643,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,82.7643,302.715 +Apps_ENERGY,Base_Seq,default,1667, PASSED ,8.21625e-06,40.8146,11.159,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.9231,39.95185 +Apps_ENERGY,Base_HIP,block_256,1667, PASSED ,1.42278e-05,23.5696,6.44407,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,15.714285,57.475899999999996 +Apps_ENERGY,RAJA_HIP,block_256,1667, PASSED ,9.06056e-06,37.0113,10.1191,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,25.24695,92.34215 +Apps_ENERGY,Base_Seq,default,213334, PASSED ,0.00134291,31.957,8.73726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,8.73726,31.957 +Apps_ENERGY,Base_HIP,block_256,213334, PASSED ,7.48785e-05,573.135,156.699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,163.48,597.937 +Apps_ENERGY,RAJA_HIP,block_256,213334, PASSED ,7.50524e-05,571.807,156.336,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,161.243,589.757 +Apps_ENERGY,Base_Seq,default,26667, PASSED ,0.000140386,38.2125,10.4475,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.6286,38.8749 +Apps_ENERGY,Base_HIP,block_256,26667, PASSED 
,1.37965e-05,388.829,106.308,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,106.308,388.829 +Apps_ENERGY,RAJA_HIP,block_256,26667, PASSED ,9.20857e-06,582.554,159.274,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/ENERGY_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,157.637,576.567 +Apps_FEMSWEEP,Base_Seq,default,395136, PASSED ,0.152243,0.428621,2.2469,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,2.22201,0.425644 +Apps_FEMSWEEP,Base_HIP,block_64,395136, PASSED ,0.00174147,37.471,196.428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,196.428,37.471 +Apps_FEMSWEEP,RAJA_HIP,block_64,395136, PASSED ,0.00161027,40.524,212.433,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,212.433,40.524 +Apps_FEMSWEEP,Base_Seq,default,73728, PASSED ,0.0201147,0.57432,3.11191,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,3.11191,0.57432 +Apps_FEMSWEEP,Base_HIP,block_64,73728, PASSED ,0.000622722,18.5512,100.518,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,100.518,18.5512 +Apps_FEMSWEEP,RAJA_HIP,block_64,73728, PASSED ,0.000578142,19.9817,108.269,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,108.269,19.9817 +Apps_FEMSWEEP,Base_Seq,default,589824, PASSED 
,0.230803,0.425644,2.21948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,2.21948,0.420849 +Apps_FEMSWEEP,Base_HIP,block_64,589824, PASSED ,0.0022096,44.4605,231.835,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,229.037,44.2472 +Apps_FEMSWEEP,RAJA_HIP,block_64,589824, PASSED ,0.00228881,42.9218,223.812,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,223.812,42.9218 +Apps_FEMSWEEP,Base_Seq,default,839808, PASSED ,0.363337,0.387519,2.01244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,2.12626,0.411853 +Apps_FEMSWEEP,Base_HIP,block_64,839808, PASSED ,0.00300008,46.932,243.725,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,229.037,44.2472 +Apps_FEMSWEEP,RAJA_HIP,block_64,839808, PASSED ,0.00286063,49.2199,255.606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,239.328,46.3573 +Apps_FEMSWEEP,Base_Seq,default,144000, PASSED ,0.0500367,0.462276,2.46577,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,2.46577,0.462276 +Apps_FEMSWEEP,Base_HIP,block_64,144000, PASSED ,0.000844012,27.4057,146.182,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,146.182,27.4057 +Apps_FEMSWEEP,RAJA_HIP,block_64,144000, PASSED 
,0.000794952,29.0971,155.203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,155.203,29.0971 +Apps_FEMSWEEP,Base_Seq,default,1152000, PASSED ,0.5142,0.377586,1.9545,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,2.06935,0.399686 +Apps_FEMSWEEP,Base_HIP,block_64,1152000, PASSED ,0.00438795,44.2472,229.037,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,230.436,44.35385 +Apps_FEMSWEEP,RAJA_HIP,block_64,1152000, PASSED ,0.00415813,46.6927,241.696,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,240.512,46.525000000000006 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00774733,0.602749,3.35637,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,3.23414,0.5885345 +Apps_FEMSWEEP,Base_HIP,block_64,31104, PASSED ,0.000407801,11.4509,63.7638,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,82.2728,15.024750000000001 +Apps_FEMSWEEP,RAJA_HIP,block_64,31104, PASSED ,0.000376761,12.3943,69.0171,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,88.68065,16.19475 +Apps_FEMSWEEP,Base_Seq,default,1533312, PASSED ,0.630138,0.411853,2.12626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,2.01244,0.387519 +Apps_FEMSWEEP,Base_HIP,block_64,1533312, PASSED 
,0.00591299,43.8905,226.592,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,229.037,44.2472 +Apps_FEMSWEEP,RAJA_HIP,block_64,1533312, PASSED ,0.00559834,46.3573,239.328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,241.696,46.6927 +Apps_FEMSWEEP,Base_Seq,default,248832, PASSED ,0.096531,0.420849,2.22201,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,2.2469,0.428621 +Apps_FEMSWEEP,Base_HIP,block_64,248832, PASSED ,0.00112982,35.957,189.847,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,189.847,35.957 +Apps_FEMSWEEP,RAJA_HIP,block_64,248832, PASSED ,0.00108194,37.5482,198.248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,198.248,37.5482 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00772459,0.604523,3.36626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,3.23414,0.5885345 +Apps_FEMSWEEP,Base_HIP,block_64,31104, PASSED ,0.000406121,11.4983,64.0276,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,82.2728,15.024750000000001 +Apps_FEMSWEEP,RAJA_HIP,block_64,31104, PASSED ,0.000376351,12.4078,69.0923,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,88.68065,16.19475 +Apps_INTSC_HEXRECT,Base_Seq,default,1728, PASSED 
,0.0015332,0.0511849,4.05739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.28896,0.0533866 +Apps_INTSC_HEXRECT,Base_HIP,block_64,1728, PASSED ,0.000261201,0.300447,23.8161,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,76.4015,0.951003 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1728, PASSED ,0.00026271,0.298721,23.6793,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,76.1797,0.948242 +Apps_INTSC_HEXRECT,Base_Seq,default,1124864, PASSED ,0.919682,0.0537387,4.40316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.40353,0.05380085 +Apps_INTSC_HEXRECT,Base_HIP,block_64,1124864, PASSED ,0.0261668,1.88875,154.757,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,151.497,1.849885 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1124864, PASSED ,0.0261263,1.89168,154.998,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,153.6845,1.87619 +Apps_INTSC_HEXRECT,Base_Seq,default,140608, PASSED ,0.114938,0.0539579,4.40402,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.4039,0.053867 +Apps_INTSC_HEXRECT,Base_HIP,block_64,140608, PASSED ,0.00348672,1.77869,145.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,145.176,1.77869 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,140608, PASSED 
,0.00346108,1.79187,146.252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,143.176,1.75128 +Apps_INTSC_HEXRECT,Base_Seq,default,1643032, PASSED ,1.34381,0.0536954,4.4016,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,4.40316,0.0537387 +Apps_INTSC_HEXRECT,Base_HIP,block_64,1643032, PASSED ,0.0380811,1.89481,155.324,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,154.757,1.88875 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1643032, PASSED ,0.0381702,1.89039,154.961,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,154.961,1.89039 +Apps_INTSC_HEXRECT,Base_Seq,default,17576, PASSED ,0.0145135,0.0538508,4.35962,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.35962,0.0538376 +Apps_INTSC_HEXRECT,Base_HIP,block_64,17576, PASSED ,0.000531951,1.46924,118.946,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,118.946,1.46924 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,17576, PASSED ,0.000522831,1.49487,121.021,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,121.021,1.49487 +Apps_INTSC_HEXRECT,Base_Seq,default,287496, PASSED ,0.235016,0.053867,4.4039,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.4039,0.053863 +Apps_INTSC_HEXRECT,Base_HIP,block_64,287496, PASSED 
,0.00705871,1.79347,146.625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,146.625,1.79347 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,287496, PASSED ,0.00722877,1.75128,143.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,146.252,1.79187 +Apps_INTSC_HEXRECT,Base_Seq,default,39304, PASSED ,0.0322726,0.0539456,4.38435,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.38435,0.0538508 +Apps_INTSC_HEXRECT,Base_HIP,block_64,39304, PASSED ,0.00112939,1.5415,125.284,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,125.284,1.5415 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,39304, PASSED ,0.00112305,1.5502,125.991,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,125.991,1.5502 +Apps_INTSC_HEXRECT,Base_Seq,default,5832, PASSED ,0.00489517,0.0533866,4.28896,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.3242899999999995,0.0536187 +Apps_INTSC_HEXRECT,Base_HIP,block_64,5832, PASSED ,0.000274801,0.951003,76.4015,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,97.67375,1.2101215 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,5832, PASSED ,0.000275601,0.948242,76.1797,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,98.60034999999999,1.221556 +Apps_INTSC_HEXRECT,Base_Seq,default,551368, PASSED 
,0.450218,0.053863,4.40881,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.4039,0.053863 +Apps_INTSC_HEXRECT,Base_HIP,block_64,551368, PASSED ,0.0133902,1.81102,148.237,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,148.237,1.81102 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,551368, PASSED ,0.0130237,1.86199,152.408,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,152.408,1.86199 +Apps_INTSC_HEXRECT,Base_Seq,default,74088, PASSED ,0.0608124,0.0538376,4.38589,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.38589,0.053867 +Apps_INTSC_HEXRECT,Base_HIP,block_64,74088, PASSED ,0.00189716,1.72573,140.587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,140.587,1.72573 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,74088, PASSED ,0.0019126,1.7118,139.452,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,139.452,1.7118 +Apps_MASS3DEA,Base_Seq,default,6213632, PASSED ,0.545463,0.0874635,0.0797404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.0798244,0.0875556 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,6213632, PASSED ,0.00144424,33.0333,30.1164,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,32.7421,35.9133 
+Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,6213632, PASSED ,0.00637416,7.48462,6.82371,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,6.68945,7.33737 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,6213632, PASSED ,0.00115998,41.1283,37.4966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,38.7873,42.5442 +Apps_MASS3DEA,Base_Seq,default,778240, PASSED ,0.0679604,0.0879253,0.0801596,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.0801476,0.0879186 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.000255741,23.3652,21.3016,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,21.3016,23.3652 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.00113685,5.25612,4.79189,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,5.14124,5.63946 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,778240, PASSED ,0.000286191,20.8792,19.0351,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,19.0351,20.8792 +Apps_MASS3DEA,Base_Seq,default,9101312, PASSED ,0.798117,0.0875556,0.0798244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.0797404,0.0874635 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,9101312, PASSED 
,0.00194579,35.9133,32.7421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,33.3109,36.5373 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,9101312, PASSED ,0.00956941,7.3024,6.65759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,6.82371,7.48462 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,9101312, PASSED ,0.00154886,45.1167,41.1328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,41.1328,45.1167 +Apps_MASS3DEA,Base_Seq,default,12423168, PASSED ,1.08713,0.08774,0.0799925,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,0.0798244,0.0875556 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.00233488,40.8521,37.2449,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,35.3912,38.8189 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.0123934,7.69642,7.01683,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,7.01683,7.69642 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,12423168, PASSED ,0.00194379,49.0714,44.7383,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,44.5533,48.8683 +Apps_MASS3DEA,Base_Seq,default,1556480, PASSED 
,0.136181,0.0877564,0.0800066,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.0800066,0.0877564 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.000454651,26.2855,23.9642,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,23.9642,26.2855 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.00176684,6.76388,6.16656,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,6.16656,6.76388 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,1556480, PASSED ,0.000437991,27.2853,24.8758,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,24.8758,27.2853 +Apps_MASS3DEA,Base_Seq,default,18198528, PASSED ,1.59883,0.0873937,0.0796768,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.07990844999999999,0.0876478 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,18198528, PASSED ,0.00359947,38.8189,35.3912,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,35.7238,39.1837 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,18198528, PASSED ,0.0181458,7.70027,7.02034,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,7.018585,7.698345 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,18198528, PASSED 
,0.00285927,48.8683,44.5533,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,44.6458,48.969849999999994 +Apps_MASS3DEA,Base_Seq,default,196608, PASSED ,0.0171715,0.0879186,0.0801476,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.0801596,0.0879253 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,196608, PASSED ,0.00022114,6.82688,6.22346,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,11.6817,12.8137 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,196608, PASSED ,0.000471131,3.20441,2.92117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,4.79189,5.25612 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,196608, PASSED ,0.000252291,5.98395,5.45503,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,10.4329,11.4439 +Apps_MASS3DEA,Base_Seq,default,24260608, PASSED ,2.12153,0.087801,0.0800482,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.0799925,0.08774 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,24260608, PASSED ,0.00470996,39.5485,36.0564,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,36.0564,39.5485 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,24260608, PASSED 
,0.023972,7.77038,7.08426,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,7.02034,7.70027 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,24260608, PASSED ,0.00371912,50.085,45.6625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,44.7383,49.0714 +Apps_MASS3DEA,Base_Seq,default,3108864, PASSED ,0.273216,0.0873663,0.0796515,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.0798244,0.0875556 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.000653302,36.5373,33.3109,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,30.1164,33.0333 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.00325319,7.33737,6.68945,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,6.65759,7.3024 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,3108864, PASSED ,0.000561061,42.5442,38.7873,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,37.4966,41.1283 +Apps_MASS3DEA,Base_Seq,default,389120, PASSED ,0.0338421,0.0882862,0.0804867,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.08015359999999999,0.08792195 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,389120, PASSED 
,0.000233171,12.8137,11.6817,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,16.49165,18.08945 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,389120, PASSED ,0.000529802,5.63946,5.14124,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,4.966565,5.4477899999999995 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,389120, PASSED ,0.000261081,11.4439,10.4329,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,14.734,16.16155 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,729, PASSED ,1.18384e-05,5.04932,10.0932,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,10.0932,4.9566 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,729, PASSED ,2.90682e-06,20.5641,41.1061,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,155.613,74.8639 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,729, PASSED ,3.0124e-06,19.8433,39.6654,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,152.573,73.4013 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,531441, PASSED ,0.0138961,3.97743,8.59865,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,9.191469999999999,4.25506 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,531441, PASSED 
,0.000309184,178.764,386.463,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,405.766,187.921 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,531441, PASSED ,0.00030012,184.162,398.134,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,413.0005,191.26850000000002 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,68921, PASSED ,0.00149013,4.67384,10.0233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.0023,4.67384 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,68921, PASSED ,3.48627e-05,199.773,428.424,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,428.424,199.773 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,68921, PASSED ,3.57475e-05,194.828,417.819,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,426.052,198.375 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,753571, PASSED ,0.0195446,4.02294,8.70474,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,8.70474,4.02294 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,753571, PASSED ,0.000440539,178.479,386.187,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,386.463,178.764 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,753571, PASSED ,0.000439064,179.078,387.484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,398.134,184.162 
+Apps_MASS3DPA_ATOMIC,Base_Seq,default,9261, PASSED ,0.000188469,4.69623,9.90615,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.045,4.7032 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,9261, PASSED ,6.05882e-06,146.083,308.146,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,308.146,146.083 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,9261, PASSED ,6.11162e-06,144.821,305.484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,305.484,144.821 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,132651, PASSED ,0.00291651,4.649,10.0023,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.0023,4.649 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,132651, PASSED ,6.62838e-05,204.558,440.106,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,428.424,199.773 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,132651, PASSED ,6.57742e-05,206.143,443.516,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,426.052,198.375 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,19683, PASSED ,0.000410276,4.7032,9.99765,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.0233,4.70308 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,19683, PASSED ,1.05262e-05,183.315,389.674,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,389.674,183.315 
+Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,19683, PASSED ,1.0476e-05,184.193,391.541,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,391.541,184.193 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,3375, PASSED ,6.21558e-05,4.9566,10.3028,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.045425,4.8299 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,3375, PASSED ,4.11522e-06,74.8639,155.613,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,231.8795,110.47345 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,3375, PASSED ,4.19722e-06,73.4013,152.573,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,229.0285,109.11115000000001 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,250047, PASSED ,0.00574692,4.48718,9.6782,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,9.6782,4.48718 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,250047, PASSED ,0.000130849,197.078,425.069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,425.069,197.078 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,250047, PASSED ,0.000129993,198.375,427.867,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,417.819,194.828 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,35937, PASSED 
,0.000761298,4.70308,10.045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.0023,4.69623 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,35937, PASSED ,1.71592e-05,208.66,445.663,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,428.424,199.773 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,35937, PASSED ,1.7949e-05,199.478,426.052,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,417.819,194.828 +Apps_MASSVEC3DPA,Base_Seq,default,5376, PASSED ,1.43702e-05,3.28712,10.7556,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,10.8039,3.29603 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,5376, PASSED ,8.05662e-06,5.86309,19.1842,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,72.4048,22.0971 +Apps_MASSVEC3DPA,Base_HIP,direct_64,5376, PASSED ,3.87502e-06,12.19,39.8862,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-direct_64,146.136,44.5988 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,5376, PASSED ,1.03788e-05,4.55125,14.8918,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,56.553,17.2593 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,5376, PASSED ,3.9036e-06,12.1008,39.5942,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,144.939,44.2338 
+Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,5376, PASSED ,7.34062e-06,6.43497,21.0554,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,80.5064,24.5696 +Apps_MASSVEC3DPA,Base_Seq,default,5437248, PASSED ,0.0143797,3.3161,10.8709,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,10.87935,3.31868 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,5437248, PASSED ,0.000367214,129.855,425.694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,429.0685,130.8845 +Apps_MASSVEC3DPA,Base_HIP,direct_64,5437248, PASSED ,0.00029053,164.129,538.055,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_64,551.6289999999999,168.26999999999998 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,5437248, PASSED ,0.000567163,84.0754,275.619,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,291.43449999999996,88.9002 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,5437248, PASSED ,0.000293966,162.211,531.766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,545.4575,166.38799999999998 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,5437248, PASSED ,0.000352522,135.267,443.436,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,444.2125,135.5035 +Apps_MASSVEC3DPA,Base_Seq,default,679680, PASSED 
,0.0018099,3.29348,10.7966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.7966,3.29348 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,679680, PASSED ,4.61755e-05,129.091,423.185,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,423.185,129.091 +Apps_MASSVEC3DPA,Base_HIP,direct_64,679680, PASSED ,3.33081e-05,178.961,586.668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_64,569.111,173.608 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,679680, PASSED ,6.4523e-05,92.3834,302.85,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,307.082,93.6736 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,679680, PASSED ,3.38937e-05,175.869,576.532,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,567.55,173.132 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,679680, PASSED ,4.50137e-05,132.423,434.108,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,442.559,135.0 +Apps_MASSVEC3DPA,Base_Seq,default,7964736, PASSED ,0.0210073,3.32505,10.9003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,10.8709,3.3161 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,7964736, PASSED 
,0.000531857,131.333,430.541,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,430.541,131.333 +Apps_MASSVEC3DPA,Base_HIP,direct_64,7964736, PASSED ,0.000425606,164.12,538.024,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_64,538.055,164.129 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,7964736, PASSED ,0.000830299,84.1268,275.787,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,275.787,84.1268 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,7964736, PASSED ,0.000429759,162.534,532.825,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,532.825,162.534 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,7964736, PASSED ,0.000514589,135.74,444.989,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,444.989,135.74 +Apps_MASSVEC3DPA,Base_Seq,default,85056, PASSED ,0.000226341,3.29603,10.8039,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.8001,3.29467 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,85056, PASSED ,1.2368e-05,60.3189,197.716,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,197.716,60.3189 +Apps_MASSVEC3DPA,Base_HIP,direct_64,85056, PASSED 
,8.60164e-06,86.7307,284.29,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-direct_64,284.29,86.7307 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,85056, PASSED ,1.39956e-05,53.3042,174.723,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,174.723,53.3042 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,85056, PASSED ,8.65382e-06,86.2078,282.576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,282.576,86.2078 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,85056, PASSED ,1.08216e-05,68.9384,225.969,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,225.969,68.9384 +Apps_MASSVEC3DPA,Base_Seq,default,1359360, PASSED ,0.00358948,3.32126,10.8878,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.7966,3.29348 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,1359360, PASSED ,9.13985e-05,130.436,427.596,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,425.694,129.855 +Apps_MASSVEC3DPA,Base_HIP,direct_64,1359360, PASSED ,6.73052e-05,177.128,580.662,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_64,569.111,173.608 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,1359360, PASSED 
,0.000127268,93.6736,307.082,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,307.082,93.6736 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,1359360, PASSED ,6.71728e-05,177.477,581.807,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,567.55,173.132 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,1359360, PASSED ,8.83082e-05,135.0,442.559,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,443.436,135.267 +Apps_MASSVEC3DPA,Base_Seq,default,169920, PASSED ,0.000452331,3.29467,10.8001,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.8001,3.29467 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,169920, PASSED ,1.54914e-05,96.2002,315.348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,315.348,96.2002 +Apps_MASSVEC3DPA,Base_HIP,direct_64,169920, PASSED ,1.12808e-05,132.107,433.053,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_64,433.053,132.107 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,169920, PASSED ,1.59242e-05,93.5856,306.778,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,302.85,92.3834 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,169920, PASSED 
,1.13006e-05,131.876,432.295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,432.295,131.876 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,169920, PASSED ,1.25772e-05,118.49,388.416,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,388.416,118.49 +Apps_MASSVEC3DPA,Base_Seq,default,21312, PASSED ,5.56373e-05,3.36096,11.0127,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.802,3.29535 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,21312, PASSED ,8.46242e-06,22.0971,72.4048,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,135.06040000000002,41.208 +Apps_MASSVEC3DPA,Base_HIP,direct_64,21312, PASSED ,4.19282e-06,44.5988,146.136,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-direct_64,215.21300000000002,65.66475 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,21312, PASSED ,1.08344e-05,17.2593,56.553,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,115.638,35.28175 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,21312, PASSED ,4.22742e-06,44.2338,144.939,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,213.7575,65.2208 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,21312, PASSED 
,7.61082e-06,24.5696,80.5064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,153.2377,46.754000000000005 +Apps_MASSVEC3DPA,Base_Seq,default,2718720, PASSED ,0.00728298,3.27381,10.7323,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,10.8709,3.3161 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,2718720, PASSED ,0.000179708,132.677,434.945,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,427.596,130.436 +Apps_MASSVEC3DPA,Base_HIP,direct_64,2718720, PASSED ,0.000138292,172.411,565.203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_64,565.203,172.411 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,2718720, PASSED ,0.000246367,96.7789,317.263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,302.85,92.3834 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,2718720, PASSED ,0.000140055,170.242,558.09,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,558.09,170.242 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,2718720, PASSED ,0.000172045,138.586,454.317,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,443.436,135.267 +Apps_MASSVEC3DPA,Base_Seq,default,339840, PASSED 
,0.000905337,3.29211,10.792,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.8001,3.29467 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,339840, PASSED ,2.31335e-05,128.838,422.349,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,422.349,128.838 +Apps_MASSVEC3DPA,Base_HIP,direct_64,339840, PASSED ,1.71678e-05,173.608,569.111,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_64,569.111,173.608 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,339840, PASSED ,2.80351e-05,106.312,348.506,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,306.778,93.5856 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,339840, PASSED ,1.72151e-05,173.132,567.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,567.55,173.132 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,339840, PASSED ,2.12032e-05,140.567,460.798,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,434.108,132.423 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000, PASSED ,6.46211e-06,5.37512,1.39273,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,1.3788,4.96773 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,1000, PASSED 
,2.67051e-06,13.0067,3.37014,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,16.8863,60.8403 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,1000, PASSED ,1.97751e-06,17.5648,4.55118,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,17.0095,61.284 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2048383, PASSED ,0.0138968,4.44515,1.3266,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,1.32555,4.448755 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2048383, PASSED ,0.000498605,123.892,36.9741,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,36.7806,123.3965 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2048383, PASSED ,0.000498078,124.023,37.0132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,36.7825,123.3605 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,238328, PASSED ,0.00160021,4.54776,1.34042,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,1.34257,4.54776 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,238328, PASSED ,5.91987e-05,122.931,36.2331,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,35.8999,121.164 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,238328, PASSED 
,5.8863e-05,123.632,36.4398,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,35.9665,121.388 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2985984, PASSED ,0.0203169,4.42601,1.32274,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,1.3245,4.44515 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2985984, PASSED ,0.000726334,123.804,36.9993,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,36.9741,123.804 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2985984, PASSED ,0.000726902,123.707,36.9704,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,36.9704,123.707 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,27000, PASSED ,0.000179091,4.72527,1.35685,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,1.35685,4.72527 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,27000, PASSED ,8.00212e-06,105.753,30.367,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,30.367,105.753 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,27000, PASSED ,7.84052e-06,107.933,30.9928,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,30.9928,107.933 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,493039, PASSED 
,0.00330512,4.53122,1.34257,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,1.34042,4.53122 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,493039, PASSED ,0.000123603,121.164,35.8999,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,36.2331,122.931 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,493039, PASSED ,0.000123375,121.388,35.9665,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,36.4398,123.014 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,54872, PASSED ,0.000366686,4.64042,1.34679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,1.34679,4.64042 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,54872, PASSED ,1.49047e-05,114.164,33.1336,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,33.1336,114.164 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,54872, PASSED ,1.48868e-05,114.301,33.1735,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,33.1735,114.301 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,5832, PASSED ,3.80678e-05,4.96773,1.3788,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,1.3678249999999998,4.846500000000001 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,5832, PASSED 
,3.10831e-06,60.8403,16.8863,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,23.626649999999998,83.29665 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,5832, PASSED ,3.08581e-06,61.284,17.0095,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,24.00115,84.6085 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000000, PASSED ,0.00679502,4.45236,1.3245,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,1.3266,4.45236 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,1000000, PASSED ,0.000245989,122.989,36.5871,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,36.5871,122.989 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,1000000, PASSED ,0.000245938,123.014,36.5946,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,36.5946,123.632 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,117649, PASSED ,0.000786253,4.59871,1.34669,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,1.34669,4.59871 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,117649, PASSED ,3.00252e-05,120.424,35.2651,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,35.2651,120.424 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,117649, PASSED 
,2.98144e-05,121.275,35.5144,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,35.5144,121.275 +Apps_VOL3D,Base_Seq,default,512, PASSED ,6.50252e-06,7.02031,15.6567,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,15.6567,6.92586 +Apps_VOL3D,Base_HIP,block_256,512, PASSED ,3.32501e-06,13.7292,30.6189,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,139.621,60.5007 +Apps_VOL3D,RAJA_HIP,block_256,512, PASSED ,2.32971e-06,19.5946,43.6999,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,188.688,81.7623 +Apps_VOL3D,Base_Seq,default,1442897, PASSED ,0.00739325,6.38656,15.3286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,15.42845,6.4338 +Apps_VOL3D,Base_HIP,block_256,1442897, PASSED ,0.000198018,238.451,572.313,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,590.8115,246.6605 +Apps_VOL3D,RAJA_HIP,block_256,1442897, PASSED ,0.000198884,237.412,569.819,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,590.2435,246.4255 +Apps_VOL3D,Base_Seq,default,166375, PASSED ,0.000892002,6.71395,16.006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,16.006,6.71395 +Apps_VOL3D,Base_HIP,block_256,166375, PASSED 
,2.40782e-05,248.726,592.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,596.22,250.995 +Apps_VOL3D,RAJA_HIP,block_256,166375, PASSED ,2.36039e-05,253.724,604.875,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,615.301,260.304 +Apps_VOL3D,Base_Seq,default,2146689, PASSED ,0.0118811,5.84542,14.0411,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,15.3286,6.38656 +Apps_VOL3D,Base_HIP,block_256,2146689, PASSED ,0.000295768,234.813,564.035,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,572.313,238.451 +Apps_VOL3D,RAJA_HIP,block_256,2146689, PASSED ,0.000293587,236.557,568.225,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,569.819,237.412 +Apps_VOL3D,Base_Seq,default,17576, PASSED ,0.000111175,6.92586,16.2801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,16.1896,6.86628 +Apps_VOL3D,Base_HIP,block_256,17576, PASSED ,3.99431e-06,192.769,453.129,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,453.129,192.769 +Apps_VOL3D,RAJA_HIP,block_256,17576, PASSED ,3.96851e-06,194.023,456.074,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,456.074,194.023 +Apps_VOL3D,Base_Seq,default,343000, PASSED 
,0.00177401,6.69096,15.9959,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,15.9959,6.69096 +Apps_VOL3D,Base_HIP,block_256,343000, PASSED ,4.6572e-05,254.87,609.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,596.22,250.995 +Apps_VOL3D,RAJA_HIP,block_256,343000, PASSED ,4.64684e-05,255.439,610.668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,610.668,255.439 +Apps_VOL3D,Base_Seq,default,35937, PASSED ,0.00021222,6.86628,16.2304,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,16.1896,6.81545 +Apps_VOL3D,Base_HIP,block_256,35937, PASSED ,6.29852e-06,231.35,546.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,546.86,231.35 +Apps_VOL3D,RAJA_HIP,block_256,35937, PASSED ,5.59792e-06,260.304,615.301,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,604.875,253.724 +Apps_VOL3D,Base_Seq,default,3375, PASSED ,2.83314e-05,6.71414,15.4946,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,15.94355,6.89607 +Apps_VOL3D,Base_HIP,block_256,3375, PASSED ,3.14411e-06,60.5007,139.621,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,296.375,126.63485 +Apps_VOL3D,RAJA_HIP,block_256,3375, PASSED 
,2.32651e-06,81.7623,188.688,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,322.381,137.89265 +Apps_VOL3D,Base_Seq,default,704969, PASSED ,0.00364849,6.48104,15.5283,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,15.5283,6.48104 +Apps_VOL3D,Base_HIP,block_256,704969, PASSED ,8.91282e-05,265.303,635.654,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,592.96,248.726 +Apps_VOL3D,RAJA_HIP,block_256,704969, PASSED ,8.84012e-05,267.485,640.881,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,604.875,253.724 +Apps_VOL3D,Base_Seq,default,79507, PASSED ,0.000441656,6.81545,16.1896,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,16.1896,6.81545 +Apps_VOL3D,Base_HIP,block_256,79507, PASSED ,1.19926e-05,250.995,596.22,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,592.96,248.726 +Apps_VOL3D,RAJA_HIP,block_256,79507, PASSED ,1.08286e-05,277.975,660.309,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-CPX/VOL3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,610.668,255.439 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_DIFFUSION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_DIFFUSION3DPA.csv new file mode 100644 index 0000000..b57d58f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_DIFFUSION3DPA.csv @@ -0,0 +1,11 @@ +Problem 
size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +405,24.2929,91.0123,9.68515,9.68515,25.3164,94.2495,16.244,60.7029,6.47622,6.47622,16.9284,62.8621 +1566,91.0123,179.24814999999998,9.87048,9.322265,94.2495,183.46975,60.7029,119.49495,6.58336,6.22397,62.8621,122.30955 +6183,267.484,267.484,8.95938,8.95938,272.69,272.69,178.287,178.287,5.97172,5.97172,181.757,181.757 +12339,367.553,367.553,8.43279,8.43279,363.984,363.984,244.958,244.958,5.62009,5.62009,242.58,242.58 +24678,515.086,515.086,6.91891,8.20543,513.128,513.128,343.264,343.264,4.6109,5.46811,341.959,341.959 +49329,552.595,552.595,8.20543,6.91891,586.063,586.063,368.25,368.25,5.46811,4.6109,390.553,390.553 +98631,614.295,552.595,5.82203,5.82203,639.324,586.063,409.361,368.25,3.87975,3.87975,426.04,390.553 +197262,656.775,552.595,2.21994,2.21994,679.812,586.063,437.666,368.25,1.47934,1.47934,453.017,390.553 +394524,517.261,565.778,1.89364,2.16687,532.456,585.89,344.694,377.02750000000003,1.2619,1.4439700000000002,354.82,390.43 +577935,488.21,517.261,2.1138,2.1138,500.604,532.456,325.335,344.694,1.4086,1.4086,333.594,354.82 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_EDGE3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_EDGE3D.csv new file mode 100644 index 0000000..933f92c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_EDGE3D.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw 
B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +512,560.006,2446.5,8.35478,8.35478,776.939,3238.42,1.36819,5.77634,0.0204122,0.0197187,1.8982,7.64611 +3375,2446.5,3177.255,8.35162,8.357904999999999,3238.42,3660.56,5.77634,7.41756,0.0197187,0.0195498,7.64611,8.55492 +17576,3908.01,3908.01,8.36103,8.35954,4082.7,4082.7,9.05878,9.05878,0.0193809,0.0193809,9.46373,9.46373 +35937,4131.92,4131.92,8.36724,8.36103,4701.17,4388.43,9.52453,9.52453,0.0192874,0.0192874,10.8367,10.0301 +79507,4346.65,4346.65,8.35954,8.36724,4462.53,4462.53,9.97035,9.97035,0.0191751,0.0191751,10.2362,10.2362 +166375,4380.49,4380.49,8.37593,8.37013,4388.43,4595.03,10.0119,10.0119,0.0191437,0.0191437,10.0301,10.4729 +343000,4527.7,4527.7,8.37984,8.37049,4595.03,4595.03,10.3195,10.3195,0.0190992,0.0190992,10.4729,10.4729 +704969,4676.26,4676.26,8.37013,8.37049,4732.87,4732.87,10.6345,10.6345,0.019035,0.019035,10.7633,10.7633 +1442897,4730.76,4703.51,8.37049,8.37031,4770.69,4751.78,10.7398,10.687149999999999,0.0190027,0.01901885,10.8304,10.79685 +2146689,4736.46,4730.76,8.36932,8.37013,4780.67,4770.69,10.744,10.7398,0.0189847,0.0190027,10.8443,10.8304 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_ENERGY.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_ENERGY.csv new file mode 100644 index 0000000..db49009 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_ENERGY.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) 
+417,1.62705,6.44407,10.7796,11.0666,1.92179,10.1191,5.95104,23.5696,39.4271,40.4766,7.02906,37.0113 +1667,6.44407,15.714285,11.159,10.9231,10.1191,25.24695,23.5696,57.475899999999996,40.8146,39.95185,37.0113,92.34215 +6667,24.9845,24.9845,11.0666,10.7796,40.3748,40.3748,91.3822,91.3822,40.4766,39.4271,147.673,147.673 +13334,53.3759,53.3759,10.5804,10.7393,82.7643,82.7643,195.225,195.225,38.6982,39.2795,302.715,302.715 +26667,106.308,106.308,10.4475,10.6286,159.274,157.637,388.829,388.829,38.2125,38.8749,582.554,576.567 +53334,210.727,156.699,10.7393,10.5804,235.446,157.637,770.744,573.135,39.2795,38.6982,861.156,576.567 +106667,158.364,158.364,10.6286,10.4475,157.637,159.274,579.227,579.227,38.8749,38.2125,576.567,582.554 +213334,156.699,163.48,8.73726,8.73726,156.336,161.243,573.135,597.937,31.957,31.957,571.807,589.757 +426667,163.48,160.922,7.0225,7.87988,161.243,159.44,597.937,588.582,25.6852,28.8211,589.757,583.162 +625000,163.781,163.48,6.83318,7.0225,163.883,161.243,599.038,597.937,24.9927,25.6852,599.411,589.757 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_FEMSWEEP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_FEMSWEEP.csv new file mode 100644 index 0000000..ed12486 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_FEMSWEEP.csv @@ -0,0 +1,10 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +31104,63.895700000000005,82.2728,3.3613150000000003,3.23414,69.0547,88.68065,11.4746,15.024750000000001,0.6036360000000001,0.5885345,12.40105,16.19475 
+73728,100.518,100.518,3.11191,3.11191,108.269,108.269,18.5512,18.5512,0.57432,0.57432,19.9817,19.9817 +144000,146.182,146.182,2.46577,2.46577,155.203,155.203,27.4057,27.4057,0.462276,0.462276,29.0971,29.0971 +248832,189.847,189.847,2.22201,2.2469,198.248,198.248,35.957,35.957,0.420849,0.428621,37.5482,37.5482 +395136,196.428,196.428,2.2469,2.22201,212.433,212.433,37.471,37.471,0.428621,0.425644,40.524,40.524 +589824,231.835,229.037,2.21948,2.21948,223.812,223.812,44.4605,44.2472,0.425644,0.420849,42.9218,42.9218 +839808,243.725,229.037,2.01244,2.12626,255.606,239.328,46.932,44.2472,0.387519,0.411853,49.2199,46.3573 +1152000,229.037,230.436,1.9545,2.06935,241.696,240.512,44.2472,44.35385,0.377586,0.399686,46.6927,46.525000000000006 +1533312,226.592,229.037,2.12626,2.01244,239.328,241.696,43.8905,44.2472,0.411853,0.387519,46.3573,46.6927 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_INTSC_HEXRECT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_INTSC_HEXRECT.csv new file mode 100644 index 0000000..ba4563d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_INTSC_HEXRECT.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +1728,23.8161,76.4015,4.05739,4.28896,23.6793,76.1797,0.300447,0.951003,0.0511849,0.0533866,0.298721,0.948242 +5832,76.4015,97.67375,4.28896,4.3242899999999995,76.1797,98.60034999999999,0.951003,1.2101215,0.0533866,0.0536187,0.948242,1.221556 +17576,118.946,118.946,4.35962,4.35962,121.021,121.021,1.46924,1.46924,0.0538508,0.0538376,1.49487,1.49487 
+39304,125.284,125.284,4.38435,4.38435,125.991,125.991,1.5415,1.5415,0.0539456,0.0538508,1.5502,1.5502 +74088,140.587,140.587,4.38589,4.38589,139.452,139.452,1.72573,1.72573,0.0538376,0.053867,1.7118,1.7118 +140608,145.176,145.176,4.40402,4.4039,146.252,143.176,1.77869,1.77869,0.0539579,0.053867,1.79187,1.75128 +287496,146.625,146.625,4.4039,4.4039,143.176,146.252,1.79347,1.79347,0.053867,0.053863,1.75128,1.79187 +551368,148.237,148.237,4.40881,4.4039,152.408,152.408,1.81102,1.81102,0.053863,0.053863,1.86199,1.86199 +1124864,154.757,151.497,4.40316,4.40353,154.998,153.6845,1.88875,1.849885,0.0537387,0.05380085,1.89168,1.87619 +1643032,155.324,154.757,4.4016,4.40316,154.961,154.961,1.89481,1.88875,0.0536954,0.0537387,1.89039,1.89039 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASS3DEA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASS3DEA.csv new file mode 100644 index 0000000..d7c6105 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASS3DEA.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64 (raw),Base_HIP-compile_time_block_stride_loop_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-cached_block_stride_loop_64 (raw),RAJA_HIP-cached_block_stride_loop_64 (smoothed),RAJA_HIP-compile_time_block_stride_loop_64 (raw),RAJA_HIP-compile_time_block_stride_loop_64 (smoothed),Base_HIP-compile_time_block_stride_loop_64 (raw B/W),Base_HIP-compile_time_block_stride_loop_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-cached_block_stride_loop_64 (raw B/W),RAJA_HIP-cached_block_stride_loop_64 (smoothed B/W),RAJA_HIP-compile_time_block_stride_loop_64 (raw B/W),RAJA_HIP-compile_time_block_stride_loop_64 (smoothed B/W) 
+196608,6.22346,11.6817,0.0801476,0.0801596,5.45503,10.4329,2.92117,4.79189,6.82688,12.8137,0.0879186,0.0879253,5.98395,11.4439,3.20441,5.25612 +389120,11.6817,16.49165,0.0804867,0.08015359999999999,10.4329,14.734,5.14124,4.966565,12.8137,18.08945,0.0882862,0.08792195,11.4439,16.16155,5.63946,5.4477899999999995 +778240,21.3016,21.3016,0.0801596,0.0801476,19.0351,19.0351,4.79189,5.14124,23.3652,23.3652,0.0879253,0.0879186,20.8792,20.8792,5.25612,5.63946 +1556480,23.9642,23.9642,0.0800066,0.0800066,24.8758,24.8758,6.16656,6.16656,26.2855,26.2855,0.0877564,0.0877564,27.2853,27.2853,6.76388,6.76388 +3108864,33.3109,30.1164,0.0796515,0.0798244,38.7873,37.4966,6.68945,6.65759,36.5373,33.0333,0.0873663,0.0875556,42.5442,41.1283,7.33737,7.3024 +6213632,30.1164,32.7421,0.0797404,0.0798244,37.4966,38.7873,6.82371,6.68945,33.0333,35.9133,0.0874635,0.0875556,41.1283,42.5442,7.48462,7.33737 +9101312,32.7421,33.3109,0.0798244,0.0797404,41.1328,41.1328,6.65759,6.82371,35.9133,36.5373,0.0875556,0.0874635,45.1167,45.1167,7.3024,7.48462 +12423168,37.2449,35.3912,0.0799925,0.0798244,44.7383,44.5533,7.01683,7.01683,40.8521,38.8189,0.08774,0.0875556,49.0714,48.8683,7.69642,7.69642 +18198528,35.3912,35.7238,0.0796768,0.07990844999999999,44.5533,44.6458,7.02034,7.018585,38.8189,39.1837,0.0873937,0.0876478,48.8683,48.969849999999994,7.70027,7.698345 +24260608,36.0564,36.0564,0.0800482,0.0799925,45.6625,44.7383,7.08426,7.02034,39.5485,39.5485,0.087801,0.08774,50.085,49.0714,7.77038,7.70027 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv new file mode 100644 index 0000000..4cab95a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default 
(raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +729,41.1061,155.613,10.0932,10.0932,39.6654,152.573,20.5641,74.8639,5.04932,4.9566,19.8433,73.4013 +3375,155.613,231.8795,10.3028,10.045425,152.573,229.0285,74.8639,110.47345,4.9566,4.8299,73.4013,109.11115000000001 +9261,308.146,308.146,9.90615,10.045,305.484,305.484,146.083,146.083,4.69623,4.7032,144.821,144.821 +19683,389.674,389.674,9.99765,10.0233,391.541,391.541,183.315,183.315,4.7032,4.70308,184.193,184.193 +35937,445.663,428.424,10.045,10.0023,426.052,417.819,208.66,199.773,4.70308,4.69623,199.478,194.828 +68921,428.424,428.424,10.0233,10.0023,417.819,426.052,199.773,199.773,4.67384,4.67384,194.828,198.375 +132651,440.106,428.424,10.0023,10.0023,443.516,426.052,204.558,199.773,4.649,4.649,206.143,198.375 +250047,425.069,425.069,9.6782,9.6782,427.867,417.819,197.078,197.078,4.48718,4.48718,198.375,194.828 +531441,386.463,405.766,8.59865,9.191469999999999,398.134,413.0005,178.764,187.921,3.97743,4.25506,184.162,191.26850000000002 +753571,386.187,386.463,8.70474,8.70474,387.484,398.134,178.479,178.764,4.02294,4.02294,179.078,184.162 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASSVEC3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASSVEC3DPA.csv new file mode 100644 index 0000000..244e56d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_MASSVEC3DPA.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_64 (raw),Base_HIP-direct_64 (smoothed),Base_HIP-runtime_block_stride_loop_64 (raw),Base_HIP-runtime_block_stride_loop_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-cached_block_stride_loop_64 
(raw),RAJA_HIP-cached_block_stride_loop_64 (smoothed),RAJA_HIP-direct_64 (raw),RAJA_HIP-direct_64 (smoothed),RAJA_HIP-runtime_block_stride_loop_64 (raw),RAJA_HIP-runtime_block_stride_loop_64 (smoothed),Base_HIP-direct_64 (raw B/W),Base_HIP-direct_64 (smoothed B/W),Base_HIP-runtime_block_stride_loop_64 (raw B/W),Base_HIP-runtime_block_stride_loop_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-cached_block_stride_loop_64 (raw B/W),RAJA_HIP-cached_block_stride_loop_64 (smoothed B/W),RAJA_HIP-direct_64 (raw B/W),RAJA_HIP-direct_64 (smoothed B/W),RAJA_HIP-runtime_block_stride_loop_64 (raw B/W),RAJA_HIP-runtime_block_stride_loop_64 (smoothed B/W) +5376,39.8862,146.136,19.1842,72.4048,10.7556,10.8039,21.0554,80.5064,39.5942,144.939,14.8918,56.553,12.19,44.5988,5.86309,22.0971,3.28712,3.29603,6.43497,24.5696,12.1008,44.2338,4.55125,17.2593 +21312,146.136,215.21300000000002,72.4048,135.06040000000002,11.0127,10.802,80.5064,153.2377,144.939,213.7575,56.553,115.638,44.5988,65.66475,22.0971,41.208,3.36096,3.29535,24.5696,46.754000000000005,44.2338,65.2208,17.2593,35.28175 +85056,284.29,284.29,197.716,197.716,10.8039,10.8001,225.969,225.969,282.576,282.576,174.723,174.723,86.7307,86.7307,60.3189,60.3189,3.29603,3.29467,68.9384,68.9384,86.2078,86.2078,53.3042,53.3042 +169920,433.053,433.053,315.348,315.348,10.8001,10.8001,388.416,388.416,432.295,432.295,306.778,302.85,132.107,132.107,96.2002,96.2002,3.29467,3.29467,118.49,118.49,131.876,131.876,93.5856,92.3834 +339840,569.111,569.111,422.349,422.349,10.792,10.8001,460.798,434.108,567.55,567.55,348.506,306.778,173.608,173.608,128.838,128.838,3.29211,3.29467,140.567,132.423,173.132,173.132,106.312,93.5856 +679680,586.668,569.111,423.185,423.185,10.7966,10.7966,434.108,442.559,576.532,567.55,302.85,307.082,178.961,173.608,129.091,129.091,3.29348,3.29348,132.423,135.0,175.869,173.132,92.3834,93.6736 
+1359360,580.662,569.111,427.596,425.694,10.8878,10.7966,442.559,443.436,581.807,567.55,307.082,307.082,177.128,173.608,130.436,129.855,3.32126,3.29348,135.0,135.267,177.477,173.132,93.6736,93.6736 +2718720,565.203,565.203,434.945,427.596,10.7323,10.8709,454.317,443.436,558.09,558.09,317.263,302.85,172.411,172.411,132.677,130.436,3.27381,3.3161,138.586,135.267,170.242,170.242,96.7789,92.3834 +5437248,538.055,551.6289999999999,425.694,429.0685,10.8709,10.87935,443.436,444.2125,531.766,545.4575,275.619,291.43449999999996,164.129,168.26999999999998,129.855,130.8845,3.3161,3.31868,135.267,135.5035,162.211,166.38799999999998,84.0754,88.9002 +7964736,538.024,538.055,430.541,430.541,10.9003,10.8709,444.989,444.989,532.825,532.825,275.787,275.787,164.12,164.129,131.333,131.333,3.32505,3.3161,135.74,135.74,162.534,162.534,84.1268,84.1268 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv new file mode 100644 index 0000000..f854aab --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +1000,3.37014,16.8863,1.39273,1.3788,4.55118,17.0095,13.0067,60.8403,5.37512,4.96773,17.5648,61.284 +5832,16.8863,23.626649999999998,1.3788,1.3678249999999998,17.0095,24.00115,60.8403,83.29665,4.96773,4.846500000000001,61.284,84.6085 +27000,30.367,30.367,1.35685,1.35685,30.9928,30.9928,105.753,105.753,4.72527,4.72527,107.933,107.933 
+54872,33.1336,33.1336,1.34679,1.34679,33.1735,33.1735,114.164,114.164,4.64042,4.64042,114.301,114.301 +117649,35.2651,35.2651,1.34669,1.34669,35.5144,35.5144,120.424,120.424,4.59871,4.59871,121.275,121.275 +238328,36.2331,35.8999,1.34042,1.34257,36.4398,35.9665,122.931,121.164,4.54776,4.54776,123.632,121.388 +493039,35.8999,36.2331,1.34257,1.34042,35.9665,36.4398,121.164,122.931,4.53122,4.53122,121.388,123.014 +1000000,36.5871,36.5871,1.3245,1.3266,36.5946,36.5946,122.989,122.989,4.45236,4.45236,123.014,123.632 +2048383,36.9741,36.7806,1.3266,1.32555,37.0132,36.7825,123.892,123.3965,4.44515,4.448755,124.023,123.3605 +2985984,36.9993,36.9741,1.32274,1.3245,36.9704,36.9704,123.804,123.804,4.42601,4.44515,123.707,123.707 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_VOL3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_VOL3D.csv new file mode 100644 index 0000000..72d79f0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-CPX/saturation-curve-data/Apps_VOL3D.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +512,30.6189,139.621,15.6567,15.6567,43.6999,188.688,13.7292,60.5007,7.02031,6.92586,19.5946,81.7623 +3375,139.621,296.375,15.4946,15.94355,188.688,322.381,60.5007,126.63485,6.71414,6.89607,81.7623,137.89265 +17576,453.129,453.129,16.2801,16.1896,456.074,456.074,192.769,192.769,6.92586,6.86628,194.023,194.023 +35937,546.86,546.86,16.2304,16.1896,615.301,604.875,231.35,231.35,6.86628,6.81545,260.304,253.724 +79507,596.22,592.96,16.1896,16.1896,660.309,610.668,250.995,248.726,6.81545,6.81545,277.975,255.439 
+166375,592.96,596.22,16.006,16.006,604.875,615.301,248.726,250.995,6.71395,6.71395,253.724,260.304 +343000,609.31,596.22,15.9959,15.9959,610.668,610.668,254.87,250.995,6.69096,6.69096,255.439,255.439 +704969,635.654,592.96,15.5283,15.5283,640.881,604.875,265.303,248.726,6.48104,6.48104,267.485,253.724 +1442897,572.313,590.8115,15.3286,15.42845,569.819,590.2435,238.451,246.6605,6.38656,6.4338,237.412,246.4255 +2146689,564.035,572.313,14.0411,15.3286,568.225,569.819,234.813,238.451,5.84542,6.38656,236.557,237.412 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..7ac7c16 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +783,25.5093,6.59477,26.6423 +3105,99.0499,6.65339,103.387 +12339,389.88,6.17346,396.181 +24678,694.399,6.21249,719.451 +49329,1035.33,6.227,1038.22 +98631,1353.03,6.12336,1402.58 +197262,1841.5,4.42259,1909.78 +394524,2219.14,1.69703,2273.25 +789048,2395.58,2.91033,2467.53 +1155843,2508.59,2.92682,2548.4 +1578096,2237.43,3.01898,2324.9 +2311659,2024.31,3.11862,2123.62 +3082212,1929.3,3.10045,2016.42 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..1f9fbd1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +783,99.0499,6.59477,103.387 +3105,244.46495,6.40363,249.784 +12339,389.88,6.227,396.181 +24678,694.399,6.21249,719.451 +49329,1035.33,6.17346,1038.22 
+98631,1353.03,6.12336,1402.58 +197262,1841.5,4.42259,1909.78 +394524,2219.14,2.92682,2273.25 +789048,2237.43,2.92682,2324.9 +1155843,2237.43,2.92682,2324.9 +1578096,2237.43,3.01898,2324.9 +2311659,2130.87,3.0597149999999997,2224.26 +3082212,2024.31,3.10045,2123.62 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_flops_raw.csv new file mode 100644 index 0000000..4c6a103 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +783,38.2122,9.8788,39.9095 +3105,148.572,9.97987,155.076 +12339,585.003,9.2631,594.458 +24678,1041.98,9.32219,1079.58 +49329,1553.62,9.34422,1557.96 +98631,2030.39,9.18884,2104.73 +197262,2763.42,6.63667,2865.87 +394524,3330.12,2.54663,3411.32 +789048,3594.9,4.36735,3702.87 +1155843,3764.48,4.39209,3824.22 +1578096,3357.58,4.5304,3488.83 +2311659,3037.75,4.67993,3186.78 +3082212,2895.18,4.65266,3025.93 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_flops_smoothed.csv new file mode 100644 index 0000000..689e97f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_DIFFUSION3DPA_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +783,148.572,9.8788,155.076 +3105,366.7875,9.600495,374.767 +12339,585.003,9.34422,594.458 +24678,1041.98,9.32219,1079.58 +49329,1553.62,9.2631,1557.96 +98631,2030.39,9.18884,2104.73 +197262,2763.42,6.63667,2865.87 +394524,3330.12,4.39209,3411.32 +789048,3357.58,4.39209,3488.83 +1155843,3357.58,4.39209,3488.83 +1578096,3357.58,4.5304,3488.83 +2311659,3197.665,4.5915300000000006,3337.8050000000003 
+3082212,3037.75,4.65266,3186.78 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_bandwidth_raw.csv new file mode 100644 index 0000000..492c0c0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,2.75942,0.0200444,3.75459 +8000,11.6555,0.0195325,15.9162 +35937,41.7859,0.0192935,54.5811 +79507,50.0086,0.0192253,59.8984 +166375,56.8739,0.0191493,58.752 +343000,63.2963,0.0191105,65.9768 +704969,61.1716,0.0190425,63.3001 +1442897,63.3082,0.0190052,63.2589 +2985984,63.717,0.0189848,63.9446 +4410944,63.9287,0.0189935,64.9219 +6028568,64.6727,0.0189842,65.1231 +8869743,65.0368,0.0189662,65.5175 +12008989,64.7476,0.0189674,65.4785 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..735ad9b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,11.6555,0.0195325,15.9162 +8000,26.7207,0.019413,35.24865 +35937,41.7859,0.0192935,54.5811 +79507,50.0086,0.0192253,58.752 +166375,56.8739,0.0191493,59.8984 +343000,61.1716,0.0191105,63.2589 +704969,63.2963,0.0190425,63.3001 +1442897,63.3082,0.0190052,63.9446 +2985984,63.717,0.0189935,63.9446 +4410944,63.9287,0.0189848,64.9219 +6028568,64.6727,0.0189842,65.1231 +8869743,64.71015,0.0189758,65.3008 +12008989,64.7476,0.0189674,65.4785 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_flops_raw.csv new file 
mode 100644 index 0000000..594a69e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,1151.55,8.36483,1566.85 +8000,4989.71,8.36188,6813.73 +35937,18127.5,8.3699,23678.3 +79507,21801.6,8.38141,26113.1 +166375,24884.0,8.37836,25705.7 +343000,27771.5,8.3848,28947.6 +704969,26898.6,8.37346,27834.6 +1442897,27886.6,8.37162,27864.9 +2985984,28106.0,8.3743,28206.4 +4410944,28217.0,8.38338,28655.4 +6028568,28558.1,8.38302,28757.0 +8869743,28733.0,8.37918,28945.3 +12008989,28615.0,8.38257,28938.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_flops_smoothed.csv new file mode 100644 index 0000000..6ffc05e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_EDGE3D_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,4989.71,8.36483,6813.73 +8000,11558.605,8.367365,15246.015 +35937,18127.5,8.3699,23678.3 +79507,21801.6,8.37836,25705.7 +166375,24884.0,8.37836,26113.1 +343000,26898.6,8.37836,27834.6 +704969,27771.5,8.3743,27864.9 +1442897,27886.6,8.3743,28206.4 +2985984,28106.0,8.3743,28206.4 +4410944,28217.0,8.37918,28655.4 +6028568,28558.1,8.38257,28757.0 +8869743,28586.55,8.382795,28847.5 +12008989,28615.0,8.38257,28938.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_bandwidth_raw.csv new file mode 100644 index 0000000..f569042 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +834,14.5457,40.4861,14.0127 +3334,57.2725,41.4825,54.7015 
+13334,208.645,38.216,223.679 +26667,413.794,38.5922,439.815 +53334,858.804,39.3772,859.106 +106667,1525.85,40.2279,1528.19 +213334,2218.04,39.8824,2267.1 +426667,2718.87,34.4278,2743.81 +853334,2839.87,26.6877,2859.1 +1250000,3049.37,26.4199,3046.81 +1706667,3193.68,26.5235,3173.91 +2500000,3331.12,26.4735,3328.94 +3333334,3378.76,26.339,3385.04 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_bandwidth_smoothed.csv new file mode 100644 index 0000000..339c4c3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +834,57.2725,40.4861,54.7015 +3334,132.95875,39.53915,139.19025 +13334,208.645,39.3772,223.679 +26667,413.794,39.3772,439.815 +53334,858.804,39.3772,859.106 +106667,1525.85,39.3772,1528.19 +213334,2218.04,39.3772,2267.1 +426667,2718.87,34.4278,2743.81 +853334,2839.87,26.6877,2859.1 +1250000,3049.37,26.5235,3046.81 +1706667,3193.68,26.4735,3173.91 +2500000,3262.3999999999996,26.4467,3251.425 +3333334,3331.12,26.4735,3328.94 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_flops_raw.csv new file mode 100644 index 0000000..afbad7c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +834,3.97689,11.0692,3.83117 +3334,15.6587,11.3416,14.9557 +13334,57.045,10.4485,61.1554 +26667,113.134,10.5514,120.248 +53334,234.803,10.766,234.885 +106667,417.176,10.9986,417.816 +213334,606.428,10.9041,619.841 +426667,743.356,9.41277,750.174 +853334,776.438,7.29659,781.695 +1250000,833.718,7.22338,833.018 +1706667,873.173,7.2517,867.768 
+2500000,910.749,7.23801,910.152 +3333334,923.776,7.20124,925.493 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_flops_smoothed.csv new file mode 100644 index 0000000..23b6bde --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_ENERGY_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +834,15.6587,11.0692,14.9557 +3334,36.35185,10.8103,38.05555 +13334,57.045,10.766,61.1554 +26667,113.134,10.766,120.248 +53334,234.803,10.766,234.885 +106667,417.176,10.766,417.816 +213334,606.428,10.766,619.841 +426667,743.356,9.41277,750.174 +853334,776.438,7.29659,781.695 +1250000,833.718,7.2517,833.018 +1706667,873.173,7.23801,867.768 +2500000,891.961,7.230695,888.96 +3333334,910.749,7.23801,910.152 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_bandwidth_raw.csv new file mode 100644 index 0000000..e24a958 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_bandwidth_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,41.0451,0.541864,43.4957 +73728,68.6976,0.613022,75.465 +144000,101.304,0.592812,110.488 +248832,139.974,0.521471,147.78 +395136,172.13,0.453919,181.701 +839808,205.115,0.448329,221.79 +1152000,209.224,0.420301,220.524 +1533312,191.136,0.438205,194.421 +2530944,215.271,0.432411,227.684 +3161088,206.848,0.431259,207.751 +3888000,199.795,0.433031,209.161 +4718592,197.416,0.411559,203.844 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_bandwidth_smoothed.csv new file mode 100644 index 0000000..3fe7ef1 
--- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_bandwidth_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,68.6976,0.592812,75.465 +73728,85.0008,0.567338,92.9765 +144000,101.304,0.541864,110.488 +248832,139.974,0.521471,147.78 +395136,172.13,0.453919,181.701 +839808,191.136,0.448329,194.421 +1152000,205.115,0.438205,220.524 +1533312,206.848,0.432411,220.524 +2530944,206.848,0.432411,209.161 +3161088,199.795,0.432411,207.751 +3888000,203.32150000000001,0.43183499999999997,208.45600000000002 +4718592,199.795,0.431259,207.751 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_flops_raw.csv new file mode 100644 index 0000000..e086166 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_flops_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,228.557,3.01734,242.203 +73728,372.233,3.32161,408.902 +144000,540.352,3.16205,589.341 +248832,739.04,2.75328,780.256 +395136,902.329,2.37951,952.505 +839808,1065.19,2.32824,1151.79 +1152000,1083.01,2.17561,1141.5 +1533312,986.771,2.26231,1003.73 +2530944,1106.9,2.22341,1170.72 +3161088,1061.91,2.21399,1066.55 +3888000,1024.31,2.22007,1072.33 +4718592,1010.91,2.10748,1043.83 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_flops_smoothed.csv new file mode 100644 index 0000000..0fdf4f9 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_FEMSWEEP_flops_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +31104,372.233,3.16205,408.902 +73728,456.2925,3.089695,499.12149999999997 +144000,540.352,3.01734,589.341 
+248832,739.04,2.75328,780.256 +395136,902.329,2.37951,952.505 +839808,986.771,2.32824,1003.73 +1152000,1065.19,2.26231,1141.5 +1533312,1065.19,2.22341,1141.5 +2530944,1061.91,2.22007,1072.33 +3161088,1024.31,2.22007,1066.55 +3888000,1043.1100000000001,2.2170300000000003,1069.44 +4718592,1024.31,2.21399,1066.55 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_bandwidth_raw.csv new file mode 100644 index 0000000..d8e7dfe --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +2744,0.499688,0.0521051,0.484808 +10648,1.93552,0.0528136,1.87471 +39304,6.39726,0.0531318,6.46187 +74088,6.86053,0.0533937,6.85435 +140608,8.71209,0.0528441,8.65917 +287496,10.3438,0.0530326,10.2587 +551368,10.457,0.0528825,10.454 +1124864,11.0168,0.0530364,11.0216 +2197000,11.2594,0.0530816,11.0427 +3241792,11.3537,0.0529303,11.3253 +4410944,11.3355,0.0529206,11.3275 +6434856,11.233,0.0525273,11.2406 +8741816,11.3614,0.0527711,11.3424 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv new file mode 100644 index 0000000..4fb71fe --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +2744,1.93552,0.0528136,1.87471 +10648,4.16639,0.0529727,4.16829 +39304,6.39726,0.0528441,6.46187 +74088,6.86053,0.0530326,6.85435 +140608,8.71209,0.0530326,8.65917 +287496,10.3438,0.0530326,10.2587 +551368,10.457,0.0530326,10.454 +1124864,11.0168,0.0530326,11.0216 +2197000,11.2594,0.0529303,11.0427 
+3241792,11.2594,0.0529303,11.2406 +4410944,11.3355,0.0529206,11.3253 +6434856,11.3446,0.05284585,11.3264 +8741816,11.3355,0.0527711,11.3275 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_flops_raw.csv new file mode 100644 index 0000000..85884dd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +2744,39.8433,4.15467,38.6568 +10648,156.211,4.26245,151.303 +39304,519.929,4.31822,525.18 +74088,558.895,4.34974,558.391 +140608,711.076,4.31311,706.757 +287496,845.661,4.33569,838.699 +551368,855.931,4.32856,855.681 +1124864,902.675,4.34562,903.073 +2197000,923.259,4.35263,905.491 +3241792,931.332,4.34181,929.002 +4410944,930.082,4.34214,929.419 +6434856,921.93,4.31109,922.552 +8741816,932.657,4.33198,931.096 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_flops_smoothed.csv new file mode 100644 index 0000000..d11dbc8 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_INTSC_HEXRECT_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +2744,156.211,4.26245,151.303 +10648,338.07,4.290335000000001,338.2415 +39304,519.929,4.31311,525.18 +74088,558.895,4.31822,558.391 +140608,711.076,4.32856,706.757 +287496,845.661,4.33569,838.699 +551368,855.931,4.33569,855.681 +1124864,902.675,4.34181,903.073 +2197000,923.259,4.34214,905.491 +3241792,923.259,4.34214,922.552 +4410944,930.082,4.34181,929.002 +6434856,930.707,4.336895,929.2104999999999 +8741816,930.082,4.33198,929.419 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_bandwidth_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_bandwidth_raw.csv new file mode 100644 index 0000000..33ca996 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_bandwidth_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +389120,14.0107,0.0884992,12.2295,7.28549 +778240,27.0896,0.0885011,24.0681,13.707 +1556480,49.2081,0.0884974,44.4445,24.2132 +3108864,88.7745,0.0881212,80.9145,38.4203 +6213632,177.28,0.0879501,144.956,40.0775 +12423168,200.404,0.0879218,184.274,40.7463 +18198528,212.19,0.0881316,252.347,44.7736 +24842240,164.284,0.0884596,194.332,42.5068 +36392960,186.5,0.0882529,246.152,43.3908 +48521216,203.957,0.0881932,234.919,42.6827 +60649472,206.666,0.0883532,281.63,43.0718 +72781824,219.656,0.0880561,270.001,45.694 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_bandwidth_smoothed.csv new file mode 100644 index 0000000..2f79f98 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_bandwidth_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +389120,27.0896,0.0884992,24.0681,13.707 +778240,38.14885,0.0884983,34.256299999999996,18.9601 +1556480,49.2081,0.0884974,44.4445,24.2132 +3108864,88.7745,0.0881212,80.9145,38.4203 +6213632,177.28,0.0881212,144.956,40.0775 +12423168,177.28,0.0881212,184.274,40.7463 +18198528,186.5,0.0881316,194.332,42.5068 +24842240,200.404,0.0881932,234.919,42.6827 +36392960,203.957,0.0882529,246.152,43.0718 +48521216,203.957,0.0882529,246.152,43.0718 +60649472,205.3115,0.08822305,258.0765,43.231300000000005 
+72781824,206.666,0.0881932,270.001,43.0718 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_flops_raw.csv new file mode 100644 index 0000000..171b429 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_flops_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +389120,12.7729,0.0806808,11.1491,6.64186 +778240,24.697,0.0806846,21.9424,12.4963 +1556480,44.8625,0.0806822,40.5196,22.0749 +3108864,80.9353,0.0803397,73.7694,35.0276 +6213632,161.626,0.080184,132.156,36.5386 +12423168,182.708,0.0801583,168.003,37.1484 +18198528,193.453,0.0803496,230.064,40.8201 +24842240,149.777,0.0806487,177.172,38.7535 +36392960,170.032,0.0804602,224.417,39.5594 +48521216,185.948,0.0804058,214.176,38.9138 +60649472,188.417,0.0805517,256.763,39.2686 +72781824,200.261,0.0802808,246.16,41.6593 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_flops_smoothed.csv new file mode 100644 index 0000000..a36d4cd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DEA_flops_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-compile_time_block_stride_loop_64 +389120,24.697,0.0806822,21.9424,12.4963 +778240,34.77975,0.08068149999999999,31.230999999999998,17.2856 +1556480,44.8625,0.0806808,40.5196,22.0749 +3108864,80.9353,0.0803397,73.7694,35.0276 +6213632,161.626,0.0803397,132.156,36.5386 +12423168,161.626,0.0803397,168.003,37.1484 +18198528,170.032,0.0803496,177.172,38.7535 +24842240,182.708,0.0804058,214.176,38.9138 
+36392960,185.948,0.0804602,224.417,39.2686 +48521216,185.948,0.0804602,224.417,39.2686 +60649472,187.1825,0.080433,235.2885,39.414 +72781824,188.417,0.0804058,246.16,39.2686 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv new file mode 100644 index 0000000..018ece1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1331,34.9485,5.06074,34.1672 +4913,134.669,4.9594,131.499 +19683,401.081,4.71322,396.222 +35937,595.706,4.70075,586.281 +68921,829.253,4.734,826.284 +132651,1072.69,4.69783,1076.3 +250047,1140.66,4.63633,1154.49 +531441,1163.69,4.14383,1146.18 +1030301,1148.36,4.26351,1139.76 +1442897,1104.19,4.27094,1128.44 +2048383,1091.77,4.19839,1094.2 +2924207,1033.54,4.26945,1019.8 +3869893,999.747,4.28746,996.77 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv new file mode 100644 index 0000000..15e6bdf --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1331,134.669,4.9594,131.499 +4913,267.875,4.836309999999999,263.8605 +19683,401.081,4.734,396.222 +35937,595.706,4.71322,586.281 +68921,829.253,4.70075,826.284 +132651,1072.69,4.69783,1076.3 +250047,1140.66,4.63633,1139.76 +531441,1140.66,4.27094,1139.76 +1030301,1140.66,4.26351,1139.76 +1442897,1104.19,4.26351,1128.44 +2048383,1091.77,4.26945,1094.2 +2924207,1062.655,4.270195,1057.0 +3869893,1033.54,4.26945,1019.8 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_flops_raw.csv new file mode 100644 index 0000000..97bf0a0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1331,71.1765,10.3068,69.5852 +4913,281.662,10.3726,275.031 +19683,852.584,10.019,842.255 +35937,1272.33,10.04,1252.2 +68921,1778.38,10.1523,1772.01 +132651,2307.89,10.1074,2315.66 +250047,2460.23,9.9999,2490.06 +531441,2515.74,8.95839,2477.88 +1030301,2486.55,9.23179,2467.91 +1442897,2392.52,9.25416,2445.07 +2048383,2367.11,9.10268,2372.38 +2924207,2242.11,9.26198,2212.31 +3869893,2169.68,9.30478,2163.22 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv new file mode 100644 index 0000000..04bffc0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASS3DPA_ATOMIC_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1331,281.662,10.3068,275.031 +4913,567.1229999999999,10.1734,558.643 +19683,852.584,10.1523,842.255 +35937,1272.33,10.1074,1252.2 +68921,1778.38,10.04,1772.01 +132651,2307.89,10.04,2315.66 +250047,2460.23,9.9999,2467.91 +531441,2460.23,9.25416,2467.91 +1030301,2460.23,9.23179,2467.91 +1442897,2392.52,9.23179,2445.07 +2048383,2367.11,9.25416,2372.38 +2924207,2304.61,9.25807,2292.3450000000003 +3869893,2242.11,9.26198,2212.31 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..1699d86 --- 
/dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +10752,21.6029,10.9679,3.35254,12.0124,21.4703,8.72273 +42624,84.0179,43.2082,3.37636,47.2058,83.2365,34.3618 +169920,283.992,153.589,3.31818,175.128,283.224,128.171 +339840,410.34,273.05,3.2903,305.431,406.945,231.455 +679680,501.128,356.704,3.31409,449.08,499.533,354.237 +1359360,801.461,618.729,3.32293,640.111,795.597,461.21 +2718720,953.827,723.994,3.31033,757.849,948.432,525.343 +5437248,1039.22,778.511,3.31363,804.273,1040.01,544.659 +10874496,1015.03,768.417,3.31531,794.696,1023.59,562.617 +15929280,1020.65,792.915,3.32111,827.198,1002.54,564.531 +21748800,1009.37,804.051,3.31904,839.303,996.938,577.583 +31858560,982.439,779.81,3.31785,809.578,970.163,502.972 +42477888,990.035,777.689,3.3134,809.028,972.117,494.684 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..5198dd9 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +10752,84.0179,43.2082,3.35254,47.2058,83.2365,34.3618 +42624,184.00495,98.3986,3.3353599999999997,111.1669,183.23025,81.2664 +169920,283.992,153.589,3.31818,175.128,283.224,128.171 +339840,410.34,273.05,3.31818,305.431,406.945,231.455 +679680,501.128,356.704,3.31409,449.08,499.533,354.237 +1359360,801.461,618.729,3.31363,640.111,795.597,461.21 
+2718720,953.827,723.994,3.31409,757.849,948.432,525.343 +5437248,1015.03,768.417,3.31531,794.696,1002.54,544.659 +10874496,1015.03,778.511,3.31531,804.273,1002.54,562.617 +15929280,1015.03,779.81,3.31785,809.578,1002.54,562.617 +21748800,1009.37,779.81,3.31785,809.578,996.938,562.617 +31858560,999.7025,786.3625,3.318445,818.3879999999999,984.5274999999999,533.7515 +42477888,990.035,779.81,3.31785,809.578,972.117,502.972 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_flops_raw.csv new file mode 100644 index 0000000..d3579b1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +10752,70.7524,35.9215,10.98,39.3421,70.3182,28.5681 +42624,275.365,141.613,11.0659,154.715,272.804,112.619 +169920,930.936,503.47,10.8771,574.078,928.42,420.15 +339840,1345.15,895.096,10.7861,1001.24,1334.02,758.743 +679680,1642.79,1169.34,10.8642,1472.17,1637.56,1161.26 +1359360,2627.36,2028.33,10.8933,2098.42,2608.14,1511.95 +2718720,3126.86,2373.42,10.852,2484.4,3109.17,1722.19 +5437248,3406.81,2552.14,10.8628,2636.6,3409.39,1785.52 +10874496,3327.49,2519.05,10.8684,2605.2,3355.57,1844.39 +15929280,3345.94,2599.36,10.8874,2711.75,3286.56,1850.67 +21748800,3308.95,2635.87,10.8806,2751.43,3268.2,1893.45 +31858560,3220.67,2556.4,10.8767,2653.99,3180.43,1648.86 +42477888,3245.57,2549.45,10.8621,2652.19,3186.83,1621.69 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_flops_smoothed.csv new file mode 100644 index 0000000..1121004 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_MASSVEC3DPA_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-direct_64,Base_HIP-runtime_block_stride_loop_64,Base_Seq-default,RAJA_HIP-cached_block_stride_loop_64,RAJA_HIP-direct_64,RAJA_HIP-runtime_block_stride_loop_64 +10752,275.365,141.613,10.98,154.715,272.804,112.619 +42624,603.1505,322.54150000000004,10.928550000000001,364.3965,600.612,266.3845 +169920,930.936,503.47,10.8771,574.078,928.42,420.15 +339840,1345.15,895.096,10.8771,1001.24,1334.02,758.743 +679680,1642.79,1169.34,10.8642,1472.17,1637.56,1161.26 +1359360,2627.36,2028.33,10.8628,2098.42,2608.14,1511.95 +2718720,3126.86,2373.42,10.8642,2484.4,3109.17,1722.19 +5437248,3327.49,2519.05,10.8684,2605.2,3286.56,1785.52 +10874496,3327.49,2552.14,10.8684,2636.6,3286.56,1844.39 +15929280,3327.49,2556.4,10.8767,2653.99,3286.56,1844.39 +21748800,3308.95,2556.4,10.8767,2653.99,3268.2,1844.39 +31858560,3277.26,2577.88,10.87865,2682.87,3227.515,1749.7649999999999 +42477888,3245.57,2556.4,10.8767,2653.99,3186.83,1648.86 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv new file mode 100644 index 0000000..98d78d9 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +2744,39.5814,5.1525,37.6512 +12167,147.687,4.83581,149.419 +54872,340.028,4.68254,377.154 +117649,458.256,4.60138,472.04 +238328,583.165,4.58258,605.51 +493039,632.039,4.49236,639.545 +1000000,691.63,4.47608,691.105 +2048383,708.195,4.46134,713.825 +4096000,734.242,4.40936,736.062 +6028568,745.24,4.43761,745.905 +8242408,758.572,4.43953,759.823 +12167000,759.727,4.4425,757.981 +16194277,777.233,4.38922,775.878 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..ef5df67 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +2744,147.687,4.83581,149.419 +12167,243.85750000000002,4.759175000000001,263.2865 +54872,340.028,4.68254,377.154 +117649,458.256,4.60138,472.04 +238328,583.165,4.58258,605.51 +493039,632.039,4.49236,639.545 +1000000,691.63,4.47608,691.105 +2048383,708.195,4.46134,713.825 +4096000,734.242,4.43953,736.062 +6028568,745.24,4.43953,745.905 +8242408,758.572,4.43761,757.981 +12167000,759.1495,4.43857,758.902 +16194277,759.727,4.43953,759.823 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv new file mode 100644 index 0000000..811585a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +2744,10.7206,1.39555,10.1978 +12167,41.7565,1.36726,42.2464 +54872,98.6861,1.35901,109.461 +117649,134.196,1.34747,138.233 +238328,171.884,1.35069,178.47 +493039,187.268,1.33105,189.492 +1000000,205.748,1.33156,205.592 +2048383,211.352,1.33143,213.032 +4096000,219.661,1.31914,220.206 +6028568,223.205,1.3291,223.404 +8242408,227.384,1.33076,227.759 +12167000,227.937,1.33286,227.413 +16194277,233.328,1.31766,232.921 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv new file mode 100644 index 0000000..1696c86 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_NODAL_ACCUMULATION_3D_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +2744,41.7565,1.36726,42.2464 +12167,70.2213,1.363135,75.8537 +54872,98.6861,1.35901,109.461 +117649,134.196,1.35069,138.233 +238328,171.884,1.34747,178.47 +493039,187.268,1.33156,189.492 +1000000,205.748,1.33143,205.592 +2048383,211.352,1.33105,213.032 +4096000,219.661,1.33076,220.206 +6028568,223.205,1.33076,223.404 +8242408,227.384,1.3291,227.413 +12167000,227.6605,1.32993,227.586 +16194277,227.937,1.33076,227.759 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_bandwidth_raw.csv new file mode 100644 index 0000000..e4fb8df --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,32.0687,7.06277,32.1643 +8000,133.227,6.44564,129.982 +35937,382.434,6.82946,473.854 +79507,666.267,6.81901,762.389 +166375,1019.13,6.84974,1053.03 +343000,1238.39,6.79477,1235.03 +704969,1174.76,6.66757,1166.49 +1442897,1353.8,6.47818,1381.39 +2985984,1231.28,6.22355,1224.81 +4410944,1217.78,6.219,1209.27 +6028568,1240.84,6.33519,1225.97 +8869743,1359.41,6.21392,1365.48 +12008989,984.951,6.11479,1018.16 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_bandwidth_smoothed.csv new file mode 100644 index 0000000..9027ec1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_bandwidth_smoothed.csv @@ -0,0 
+1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,133.227,6.82946,129.982 +8000,257.83050000000003,6.824235,301.918 +35937,382.434,6.82946,473.854 +79507,666.267,6.81901,762.389 +166375,1019.13,6.81901,1053.03 +343000,1174.76,6.79477,1166.49 +704969,1231.28,6.66757,1224.81 +1442897,1231.28,6.47818,1224.81 +2985984,1231.28,6.33519,1224.81 +4410944,1240.84,6.22355,1225.97 +6028568,1231.28,6.219,1224.81 +8869743,1229.31,6.21646,1217.62 +12008989,1240.84,6.21392,1225.97 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_flops_raw.csv new file mode 100644 index 0000000..ed2225e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,72.9195,16.0597,73.1369 +8000,310.767,15.0352,303.199 +35937,903.99,16.1433,1120.09 +79507,1582.67,16.1981,1811.0 +166375,2429.59,16.3297,2510.42 +343000,2960.57,16.244,2952.54 +704969,2814.67,15.9752,2794.85 +1442897,3249.29,15.5485,3315.53 +2985984,2959.36,14.9582,2943.81 +4410944,2928.74,14.9566,2908.28 +6028568,2985.54,15.2428,2949.74 +8869743,3272.42,14.9584,3287.05 +12008989,2371.83,14.7248,2451.8 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_flops_smoothed.csv new file mode 100644 index 0000000..0bb69ad --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/Apps_VOL3D_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1331,310.767,16.0597,303.199 +8000,607.3785,16.1015,711.6445 +35937,903.99,16.1433,1120.09 +79507,1582.67,16.1981,1811.0 +166375,2429.59,16.1981,2510.42 +343000,2814.67,16.1981,2794.85 +704969,2959.36,15.9752,2943.81 
+1442897,2959.36,15.5485,2943.81 +2985984,2959.36,15.2428,2943.81 +4410944,2985.54,14.9584,2949.74 +6028568,2959.36,14.9582,2943.81 +8869743,2957.14,14.9575,2929.01 +12008989,2985.54,14.9584,2949.74 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_DIFFUSION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_DIFFUSION3DPA.csv new file mode 100644 index 0000000..7677af4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_DIFFUSION3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DIFFUSION3DPA-Base_Seq-default,783.0,9.8788,6.59477 +Apps_DIFFUSION3DPA-Base_HIP-block_64,197262.0,2763.42,1841.5 +Apps_DIFFUSION3DPA-RAJA_HIP-block_64,394524.0,3411.32,2273.25 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_EDGE3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_EDGE3D.csv new file mode 100644 index 0000000..350455a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_EDGE3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_EDGE3D-Base_Seq-default,1331.0,8.36483,0.0200444 +Apps_EDGE3D-Base_HIP-block_256,343000.0,27771.5,63.2963 +Apps_EDGE3D-RAJA_HIP-block_256,166375.0,25705.7,58.752 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_ENERGY.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_ENERGY.csv new file mode 100644 index 0000000..76d22c2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_ENERGY.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_ENERGY-Base_Seq-default,834.0,11.0692,40.4861 +Apps_ENERGY-Base_HIP-block_256,1250000.0,833.718,3049.37 +Apps_ENERGY-RAJA_HIP-block_256,1250000.0,833.018,3046.81 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_FEMSWEEP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_FEMSWEEP.csv new file mode 100644 index 0000000..4116693 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_FEMSWEEP.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_FEMSWEEP-Base_Seq-default,31104.0,3.01734,0.541864 +Apps_FEMSWEEP-Base_HIP-block_64,839808.0,1065.19,205.115 +Apps_FEMSWEEP-RAJA_HIP-block_64,839808.0,1151.79,221.79 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_INTSC_HEXRECT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_INTSC_HEXRECT.csv new file mode 100644 index 0000000..acc372f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_INTSC_HEXRECT.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_INTSC_HEXRECT-Base_Seq-default,2744.0,4.15467,0.0521051 +Apps_INTSC_HEXRECT-Base_HIP-block_64,287496.0,845.661,10.3438 +Apps_INTSC_HEXRECT-RAJA_HIP-block_64,287496.0,838.699,10.2587 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASS3DEA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASS3DEA.csv new file mode 100644 index 0000000..3aeb510 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASS3DEA.csv @@ -0,0 +1,5 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MASS3DEA-Base_Seq-default,389120.0,0.0806808,0.0884992 +Apps_MASS3DEA-Base_HIP-compile_time_block_stride_loop_64,18198528.0,193.453,212.19 +Apps_MASS3DEA-RAJA_HIP-compile_time_block_stride_loop_64,6213632.0,36.5386,40.0775 +Apps_MASS3DEA-RAJA_HIP-cached_block_stride_loop_64,36392960.0,224.417,246.152 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASS3DPA_ATOMIC.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASS3DPA_ATOMIC.csv new file mode 100644 index 0000000..2ec753b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASS3DPA_ATOMIC.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MASS3DPA_ATOMIC-Base_Seq-default,1331.0,10.3068,5.06074 +Apps_MASS3DPA_ATOMIC-Base_HIP-block_64,132651.0,2307.89,1072.69 +Apps_MASS3DPA_ATOMIC-RAJA_HIP-block_64,132651.0,2315.66,1076.3 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASSVEC3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASSVEC3DPA.csv new file mode 100644 index 0000000..57431da --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_MASSVEC3DPA.csv @@ -0,0 +1,7 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MASSVEC3DPA-Base_Seq-default,10752.0,10.98,3.35254 +Apps_MASSVEC3DPA-Base_HIP-runtime_block_stride_loop_64,2718720.0,2373.42,723.994 +Apps_MASSVEC3DPA-Base_HIP-direct_64,2718720.0,3126.86,953.827 +Apps_MASSVEC3DPA-RAJA_HIP-runtime_block_stride_loop_64,1359360.0,1511.95,461.21 +Apps_MASSVEC3DPA-RAJA_HIP-direct_64,2718720.0,3109.17,948.432 +Apps_MASSVEC3DPA-RAJA_HIP-cached_block_stride_loop_64,2718720.0,2484.4,757.849 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_NODAL_ACCUMULATION_3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_NODAL_ACCUMULATION_3D.csv new file mode 100644 index 0000000..cbe161d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_NODAL_ACCUMULATION_3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_NODAL_ACCUMULATION_3D-Base_Seq-default,2744.0,1.39555,5.1525 +Apps_NODAL_ACCUMULATION_3D-Base_HIP-block_256,1000000.0,205.748,691.63 +Apps_NODAL_ACCUMULATION_3D-RAJA_HIP-block_256,1000000.0,205.592,691.105 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_VOL3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_VOL3D.csv new file mode 100644 index 0000000..089a65f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/Apps_VOL3D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_VOL3D-Base_Seq-default,1331.0,16.0597,7.06277 +Apps_VOL3D-Base_HIP-block_256,343000.0,2960.57,1238.39 +Apps_VOL3D-RAJA_HIP-block_256,343000.0,2952.54,1235.03 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/combined_fom.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/combined_fom.csv new file mode 100644 index 0000000..6996e90 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/FOM/combined_fom.csv @@ -0,0 +1,35 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DIFFUSION3DPA-Base_HIP-block_64,197262.0,2763.42,1841.5 +Apps_DIFFUSION3DPA-Base_Seq-default,783.0,9.8788,6.59477 +Apps_DIFFUSION3DPA-RAJA_HIP-block_64,394524.0,3411.32,2273.25 +Apps_EDGE3D-Base_HIP-block_256,343000.0,27771.5,63.2963 +Apps_EDGE3D-Base_Seq-default,1331.0,8.36483,0.0200444 +Apps_EDGE3D-RAJA_HIP-block_256,166375.0,25705.7,58.752 +Apps_ENERGY-Base_HIP-block_256,1250000.0,833.718,3049.37 +Apps_ENERGY-Base_Seq-default,834.0,11.0692,40.4861 +Apps_ENERGY-RAJA_HIP-block_256,1250000.0,833.018,3046.81 +Apps_FEMSWEEP-Base_HIP-block_64,839808.0,1065.19,205.115 +Apps_FEMSWEEP-Base_Seq-default,31104.0,3.01734,0.541864 +Apps_FEMSWEEP-RAJA_HIP-block_64,839808.0,1151.79,221.79 +Apps_INTSC_HEXRECT-Base_HIP-block_64,287496.0,845.661,10.3438 +Apps_INTSC_HEXRECT-Base_Seq-default,2744.0,4.15467,0.0521051 +Apps_INTSC_HEXRECT-RAJA_HIP-block_64,287496.0,838.699,10.2587 +Apps_MASS3DEA-Base_HIP-compile_time_block_stride_loop_64,18198528.0,193.453,212.19 +Apps_MASS3DEA-Base_Seq-default,389120.0,0.0806808,0.0884992 +Apps_MASS3DEA-RAJA_HIP-cached_block_stride_loop_64,36392960.0,224.417,246.152 +Apps_MASS3DEA-RAJA_HIP-compile_time_block_stride_loop_64,6213632.0,36.5386,40.0775 +Apps_MASS3DPA_ATOMIC-Base_HIP-block_64,132651.0,2307.89,1072.69 +Apps_MASS3DPA_ATOMIC-Base_Seq-default,1331.0,10.3068,5.06074 +Apps_MASS3DPA_ATOMIC-RAJA_HIP-block_64,132651.0,2315.66,1076.3 
+Apps_MASSVEC3DPA-Base_HIP-direct_64,2718720.0,3126.86,953.827 +Apps_MASSVEC3DPA-Base_HIP-runtime_block_stride_loop_64,2718720.0,2373.42,723.994 +Apps_MASSVEC3DPA-Base_Seq-default,10752.0,10.98,3.35254 +Apps_MASSVEC3DPA-RAJA_HIP-cached_block_stride_loop_64,2718720.0,2484.4,757.849 +Apps_MASSVEC3DPA-RAJA_HIP-direct_64,2718720.0,3109.17,948.432 +Apps_MASSVEC3DPA-RAJA_HIP-runtime_block_stride_loop_64,1359360.0,1511.95,461.21 +Apps_NODAL_ACCUMULATION_3D-Base_HIP-block_256,1000000.0,205.748,691.63 +Apps_NODAL_ACCUMULATION_3D-Base_Seq-default,2744.0,1.39555,5.1525 +Apps_NODAL_ACCUMULATION_3D-RAJA_HIP-block_256,1000000.0,205.592,691.105 +Apps_VOL3D-Base_HIP-block_256,343000.0,2960.57,1238.39 +Apps_VOL3D-Base_Seq-default,1331.0,16.0597,7.06277 +Apps_VOL3D-RAJA_HIP-block_256,343000.0,2952.54,1235.03 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/combined_table.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/combined_table.csv new file mode 100644 index 0000000..089d5ba --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/combined_table.csv @@ -0,0 +1,436 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning +Apps_DIFFUSION3DPA,Base_Seq,default,783, PASSED ,1.52621e-05,6.59477,9.8788,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,783, PASSED ,3.94562e-06,25.5093,38.2122,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,783, PASSED ,3.77782e-06,26.6423,39.9095,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 
+Apps_DIFFUSION3DPA,Base_Seq,default,789048, PASSED ,0.034789,2.91033,4.36735,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,789048, PASSED ,4.22642e-05,2395.58,3594.9,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,789048, PASSED ,4.10318e-05,2467.53,3702.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,98631, PASSED ,0.00206685,6.12336,9.18884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,98631, PASSED ,9.35384e-06,1353.03,2030.39,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,98631, PASSED ,9.02344e-06,1402.58,2104.73,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,1155843, PASSED ,0.0506738,2.92682,4.39209,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,1155843, PASSED ,5.91221e-05,2508.59,3764.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,1155843, PASSED 
,5.81985e-05,2548.4,3824.22,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,12339, PASSED ,0.000256495,6.17346,9.2631,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,12339, PASSED ,4.06142e-06,389.88,585.003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,12339, PASSED ,3.99682e-06,396.181,594.458,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,1578096, PASSED ,0.0670738,3.01898,4.5304,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,1578096, PASSED ,9.0503e-05,2237.43,3357.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,1578096, PASSED ,8.70982e-05,2324.9,3488.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,197262, PASSED ,0.00572334,4.42259,6.63667,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,197262, PASSED 
,1.37453e-05,1841.5,2763.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,197262, PASSED ,1.32539e-05,1909.78,2865.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,2311659, PASSED ,0.0951131,3.11862,4.67993,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,2311659, PASSED ,0.00014653,2024.31,3037.75,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,2311659, PASSED ,0.000139678,2123.62,3186.78,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,24678, PASSED ,0.000509739,6.21249,9.32219,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,24678, PASSED ,4.56042e-06,694.399,1041.98,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,24678, PASSED ,4.40162e-06,719.451,1079.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,3105, PASSED 
,5.99091e-05,6.65339,9.97987,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,3105, PASSED ,4.02422e-06,99.0499,148.572,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,3105, PASSED ,3.85542e-06,103.387,155.076,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,3082212, PASSED ,0.127561,3.10045,4.65266,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,3082212, PASSED ,0.000204995,1929.3,2895.18,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,3082212, PASSED ,0.000196137,2016.42,3025.93,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,394524, PASSED ,0.0298307,1.69703,2.54663,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,394524, PASSED ,2.28123e-05,2219.14,3330.12,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,394524, PASSED 
,2.22693e-05,2273.25,3411.32,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DIFFUSION3DPA,Base_Seq,default,49329, PASSED ,0.00101652,6.227,9.34422,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DIFFUSION3DPA,Base_HIP,block_64,49329, PASSED ,6.11384e-06,1035.33,1553.62,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,49329, PASSED ,6.09682e-06,1038.22,1557.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_EDGE3D,Base_Seq,default,1331, PASSED ,0.0045701,0.0200444,8.36483,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,1331, PASSED ,3.31972e-05,2.75942,1151.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,1331, PASSED ,2.43981e-05,3.75459,1566.85,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,2985984, PASSED ,5.0457,0.0189848,8.3743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,2985984, PASSED ,0.00150339,63.717,28106.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,2985984, PASSED 
,0.00149804,63.9446,28206.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,343000, PASSED ,0.621116,0.0191105,8.3848,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,343000, PASSED ,0.000187528,63.2963,27771.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,343000, PASSED ,0.000179909,65.9768,28947.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,4410944, PASSED ,7.38432,0.0189935,8.38338,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,4410944, PASSED ,0.00219391,63.9287,28217.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,4410944, PASSED ,0.00216035,64.9219,28655.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,35937, PASSED ,0.0755259,0.0192935,8.3699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,35937, PASSED ,3.48721e-05,41.7859,18127.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,35937, PASSED 
,2.66972e-05,54.5811,23678.3,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,6028568, PASSED ,10.0335,0.0189842,8.38302,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,6028568, PASSED ,0.00294526,64.6727,28558.1,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,6028568, PASSED ,0.00292489,65.1231,28757.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,704969, PASSED ,1.24175,0.0190425,8.37346,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,704969, PASSED ,0.000386552,61.1716,26898.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,704969, PASSED ,0.000373554,63.3001,27834.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,8869743, PASSED ,14.6732,0.0189662,8.37918,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,8869743, PASSED ,0.00427903,65.0368,28733.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,8869743, PASSED 
,0.00424764,65.5175,28945.3,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,79507, PASSED ,0.156569,0.0192253,8.38141,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,79507, PASSED ,6.01914e-05,50.0086,21801.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,79507, PASSED ,5.02532e-05,59.8984,26113.1,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,8000, PASSED ,0.0199461,0.0195325,8.36188,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,8000, PASSED ,3.34262e-05,11.6555,4989.71,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,8000, PASSED ,2.44781e-05,15.9162,6813.73,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,12008989, PASSED ,19.7681,0.0189674,8.38257,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,12008989, PASSED ,0.00579093,64.7476,28615.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,12008989, PASSED 
,0.00572628,65.4785,28938.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,1442897, PASSED ,2.48444,0.0190052,8.37162,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,1442897, PASSED ,0.000745835,63.3082,27886.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,1442897, PASSED ,0.000746416,63.2589,27864.9,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_EDGE3D,Base_Seq,default,166375, PASSED ,0.312746,0.0191493,8.37836,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_EDGE3D,Base_HIP,block_256,166375, PASSED ,0.000105301,56.8739,24884.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_EDGE3D,RAJA_HIP,block_256,166375, PASSED ,0.000101935,58.752,25705.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,834, PASSED ,4.14395e-06,40.4861,11.0692,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,834, PASSED ,1.15341e-05,14.5457,3.97689,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,834, PASSED 
,1.19728e-05,14.0127,3.83117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,853334, PASSED ,0.00643223,26.6877,7.29659,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,853334, PASSED ,6.0447e-05,2839.87,776.438,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,853334, PASSED ,6.00405e-05,2859.1,781.695,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,106667, PASSED ,0.000533405,40.2279,10.9986,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,106667, PASSED ,1.40628e-05,1525.85,417.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,106667, PASSED ,1.40413e-05,1528.19,417.816,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,1250000, PASSED ,0.00951771,26.4199,7.22338,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,1250000, PASSED ,8.24619e-05,3049.37,833.718,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,1250000, PASSED 
,8.25312e-05,3046.81,833.018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,13334, PASSED ,7.0189e-05,38.216,10.4485,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,13334, PASSED ,1.2856e-05,208.645,57.045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,13334, PASSED ,1.19919e-05,223.679,61.1554,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,1706667, PASSED ,0.0129441,26.5235,7.2517,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,1706667, PASSED ,0.000107501,3193.68,873.173,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,1706667, PASSED ,0.00010817,3173.91,867.768,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,213334, PASSED ,0.00107605,39.8824,10.9041,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,213334, PASSED ,1.93483e-05,2218.04,606.428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,213334, PASSED 
,1.89296e-05,2267.1,619.841,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,2500000, PASSED ,0.0189969,26.4735,7.23801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,2500000, PASSED ,0.000150975,3331.12,910.749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,2500000, PASSED ,0.000151074,3328.94,910.152,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,26667, PASSED ,0.000139004,38.5922,10.5514,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,26667, PASSED ,1.29641e-05,413.794,113.134,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,26667, PASSED ,1.21971e-05,439.815,120.248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,3334, PASSED ,1.61679e-05,41.4825,11.3416,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,3334, PASSED ,1.17104e-05,57.2725,15.6587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,3334, PASSED 
,1.22608e-05,54.7015,14.9557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,3333334, PASSED ,0.0254586,26.339,7.20124,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,3333334, PASSED ,0.000198461,3378.76,923.776,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,3333334, PASSED ,0.000198093,3385.04,925.493,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,426667, PASSED ,0.00249307,34.4278,9.41277,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,426667, PASSED ,3.15686e-05,2718.87,743.356,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,426667, PASSED ,3.12816e-05,2743.81,750.174,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_ENERGY,Base_Seq,default,53334, PASSED ,0.000272467,39.3772,10.766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_ENERGY,Base_HIP,block_256,53334, PASSED ,1.24929e-05,858.804,234.803,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_ENERGY,RAJA_HIP,block_256,53334, PASSED 
,1.24885e-05,859.106,234.885,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_FEMSWEEP,Base_Seq,default,839808, PASSED ,0.314054,0.448329,2.32824,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,839808, PASSED ,0.000686444,205.115,1065.19,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,839808, PASSED ,0.000634834,221.79,1151.79,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,144000, PASSED ,0.0390188,0.592812,3.16205,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,144000, PASSED ,0.000228331,101.304,540.352,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,144000, PASSED ,0.000209351,110.488,589.341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,1152000, PASSED ,0.461941,0.420301,2.17561,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,1152000, PASSED ,0.000927976,209.224,1083.01,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,1152000, PASSED 
,0.000880425,220.524,1141.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,1533312, PASSED ,0.592243,0.438205,2.26231,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,1533312, PASSED ,0.0013578,191.136,986.771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,1533312, PASSED ,0.00133486,194.421,1003.73,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,248832, PASSED ,0.0779046,0.521471,2.75328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,248832, PASSED ,0.000290232,139.974,739.04,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,248832, PASSED ,0.000274901,147.78,780.256,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,2530944, PASSED ,0.997166,0.432411,2.22341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,2530944, PASSED ,0.00200299,215.271,1106.9,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,2530944, PASSED 
,0.00189379,227.684,1170.72,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00861784,0.541864,3.01734,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,31104, PASSED ,0.00011377,41.0451,228.557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,31104, PASSED ,0.00010736,43.4957,242.203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,3161088, PASSED ,1.25196,0.431259,2.21399,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,3161088, PASSED ,0.00261022,206.848,1061.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,3161088, PASSED ,0.00259887,207.751,1066.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,3888000, PASSED ,1.53694,0.433031,2.22007,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,3888000, PASSED ,0.00333112,199.795,1024.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_5000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,3888000, PASSED 
,0.00318197,209.161,1072.33,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,395136, PASSED ,0.143758,0.453919,2.37951,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,395136, PASSED ,0.000379102,172.13,902.329,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,395136, PASSED ,0.000359132,181.701,952.505,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,4718592, PASSED ,1.96638,0.411559,2.10748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,4718592, PASSED ,0.00409937,197.416,1010.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_6000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,4718592, PASSED ,0.00397009,203.844,1043.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_FEMSWEEP,Base_Seq,default,73728, PASSED ,0.0188448,0.613022,3.32161,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_FEMSWEEP,Base_HIP,block_64,73728, PASSED ,0.000168161,68.6976,372.233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_FEMSWEEP,RAJA_HIP,block_64,73728, PASSED 
,0.000153081,75.465,408.902,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,2744, PASSED ,0.00237766,0.0521051,4.15467,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,2744, PASSED ,0.000247931,0.499688,39.8433,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,2744, PASSED ,0.000255541,0.484808,38.6568,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,2197000, PASSED ,1.81711,0.0530816,4.35263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,2197000, PASSED ,0.00856661,11.2594,923.259,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,2197000, PASSED ,0.00873471,11.0427,905.491,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,287496, PASSED ,0.238713,0.0530326,4.33569,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,287496, PASSED 
,0.00122388,10.3438,845.661,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,287496, PASSED ,0.00123404,10.2587,838.699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,3241792, PASSED ,2.68792,0.0529303,4.34181,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,3241792, PASSED ,0.0125309,11.3537,931.332,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,3241792, PASSED ,0.0125623,11.3253,929.002,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,39304, PASSED ,0.0327669,0.0531318,4.31822,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,39304, PASSED ,0.000272142,6.39726,519.929,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,39304, PASSED ,0.000269421,6.46187,525.18,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,4410944, PASSED 
,3.65704,0.0529206,4.34214,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,4410944, PASSED ,0.0170731,11.3355,930.082,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,4410944, PASSED ,0.0170853,11.3275,929.419,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,551368, PASSED ,0.458565,0.0528825,4.32856,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,551368, PASSED ,0.00231902,10.457,855.931,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,551368, PASSED ,0.0023197,10.454,855.681,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,6434856, PASSED ,5.37347,0.0525273,4.31109,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,6434856, PASSED ,0.0251272,11.233,921.93,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,6434856, PASSED 
,0.0251102,11.2406,922.552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,74088, PASSED ,0.0613179,0.0533937,4.34974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,74088, PASSED ,0.000477222,6.86053,558.895,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,74088, PASSED ,0.000477652,6.85435,558.391,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,10648, PASSED ,0.00899313,0.0528136,4.26245,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,10648, PASSED ,0.000245391,1.93552,156.211,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,10648, PASSED ,0.000253351,1.87471,151.303,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,8741816, PASSED ,7.26471,0.0527711,4.33198,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,8741816, PASSED 
,0.0337429,11.3614,932.657,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,8741816, PASSED ,0.0337994,11.3424,931.096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,1124864, PASSED ,0.93186,0.0530364,4.34562,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,1124864, PASSED ,0.00448612,11.0168,902.675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1124864, PASSED ,0.00448414,11.0216,903.073,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXRECT,Base_Seq,default,140608, PASSED ,0.117361,0.0528441,4.31311,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXRECT,Base_HIP,block_64,140608, PASSED ,0.000711863,8.71209,711.076,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,140608, PASSED ,0.000716213,8.65917,706.757,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DEA,Base_Seq,default,12423168, PASSED 
,1.08488,0.0879218,0.0801583,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.000475963,200.404,182.708,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.00234094,40.7463,37.1484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,12423168, PASSED ,0.000517623,184.274,168.003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,1556480, PASSED ,0.13504,0.0884974,0.0806822,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.000242861,49.2081,44.8625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.000493563,24.2132,22.0749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,1556480, PASSED 
,0.000268891,44.4445,40.5196,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,18198528, PASSED ,1.58544,0.0881316,0.0803496,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,18198528, PASSED ,0.000658503,212.19,193.453,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,18198528, PASSED ,0.00312076,44.7736,40.8201,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,18198528, PASSED ,0.000553713,252.347,230.064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,24842240, PASSED ,2.15621,0.0884596,0.0806487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,24842240, PASSED ,0.00116103,164.284,149.777,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,24842240, PASSED ,0.00448723,42.5068,38.7535,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 
+Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,24842240, PASSED ,0.000981506,194.332,177.172,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,3108864, PASSED ,0.270875,0.0881212,0.0803397,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.000268882,88.7745,80.9353,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.000621283,38.4203,35.0276,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,3108864, PASSED ,0.000295001,80.9145,73.7694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,36392960, PASSED ,3.16617,0.0882529,0.0804602,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,36392960, PASSED ,0.00149825,186.5,170.032,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,36392960, PASSED 
,0.0064397,43.3908,39.5594,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,36392960, PASSED ,0.00113517,246.152,224.417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,389120, PASSED ,0.0337607,0.0884992,0.0806808,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,389120, PASSED ,0.000213251,14.0107,12.7729,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,389120, PASSED ,0.000410102,7.28549,6.64186,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,389120, PASSED ,0.000244311,12.2295,11.1491,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,48521216, PASSED ,4.22418,0.0881932,0.0804058,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,48521216, PASSED ,0.00182658,203.957,185.948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 
+Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,48521216, PASSED ,0.00872822,42.6827,38.9138,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,48521216, PASSED ,0.00158584,234.919,214.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,60649472, PASSED ,5.27048,0.0883532,0.0805517,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,60649472, PASSED ,0.00225322,206.666,188.417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,60649472, PASSED ,0.0108113,43.0718,39.2686,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,60649472, PASSED ,0.00165346,281.63,256.763,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,6213632, PASSED ,0.542445,0.0879501,0.080184,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,6213632, PASSED 
,0.000269112,177.28,161.626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,6213632, PASSED ,0.0011904,40.0775,36.5386,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,6213632, PASSED ,0.000329122,144.956,132.156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,72781824, PASSED ,6.34614,0.0880561,0.0802808,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,72781824, PASSED ,0.00254404,219.656,200.261,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,72781824, PASSED ,0.0122295,45.694,41.6593,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,72781824, PASSED ,0.00206968,270.001,246.16,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DEA,Base_Seq,default,778240, PASSED ,0.0675182,0.0885011,0.0806846,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.000220581,27.0896,24.697,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.000435942,13.707,12.4963,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,778240, PASSED ,0.000248272,24.0681,21.9424,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1331, PASSED ,2.26429e-05,5.06074,10.3068,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,1331, PASSED ,3.27882e-06,34.9485,71.1765,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,1331, PASSED ,3.3538e-06,34.1672,69.5852,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1030301, PASSED ,0.0252795,4.26351,9.23179,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,1030301, PASSED ,9.38549e-05,1148.36,2486.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 
+Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,1030301, PASSED ,9.45637e-05,1139.76,2467.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,132651, PASSED ,0.0028862,4.69783,10.1074,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,132651, PASSED ,1.26401e-05,1072.69,2307.89,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,132651, PASSED ,1.25977e-05,1076.3,2315.66,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1442897, PASSED ,0.03543,4.27094,9.25416,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,1442897, PASSED ,0.000137042,1104.19,2392.52,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,1442897, PASSED ,0.000134097,1128.44,2445.07,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,19683, PASSED ,0.000409404,4.71322,10.019,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,19683, PASSED 
,4.81102e-06,401.081,852.584,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,19683, PASSED ,4.87002e-06,396.222,842.255,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,2048383, PASSED ,0.0512858,4.19839,9.10268,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,2048383, PASSED ,0.000197218,1091.77,2367.11,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,2048383, PASSED ,0.000196781,1094.2,2372.38,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,250047, PASSED ,0.00556204,4.63633,9.9999,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,250047, PASSED ,2.26075e-05,1140.66,2460.23,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,250047, PASSED ,2.23367e-05,1154.49,2490.06,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,2924207, PASSED 
,0.0721465,4.26945,9.26198,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,2924207, PASSED ,0.000298031,1033.54,2242.11,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,2924207, PASSED ,0.000302046,1019.8,2212.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,35937, PASSED ,0.000761674,4.70075,10.04,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,35937, PASSED ,6.01042e-06,595.706,1272.33,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,35937, PASSED ,6.10704e-06,586.281,1252.2,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,4913, PASSED ,9.21565e-05,4.9594,10.3726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,4913, PASSED ,3.3938e-06,134.669,281.662,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,4913, PASSED 
,3.47562e-06,131.499,275.031,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,3869893, PASSED ,0.0952186,4.28746,9.30478,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,3869893, PASSED ,0.00040835,999.747,2169.68,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,3869893, PASSED ,0.000409569,996.77,2163.22,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,531441, PASSED ,0.0133381,4.14383,8.95839,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,531441, PASSED ,4.74962e-05,1163.69,2515.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,531441, PASSED ,4.82218e-05,1146.18,2477.88,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,68921, PASSED ,0.00147119,4.734,10.1523,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,68921, PASSED 
,8.39866e-06,829.253,1778.38,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,68921, PASSED ,8.42884e-06,826.284,1772.01,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_MASSVEC3DPA,Base_Seq,default,10752, PASSED ,2.8153e-05,3.35254,10.98,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,10752, PASSED ,8.60544e-06,10.9679,35.9215,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,10752, PASSED ,4.36904e-06,21.6029,70.7524,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,10752, PASSED ,1.08205e-05,8.72273,28.5681,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,10752, PASSED ,4.39602e-06,21.4703,70.3182,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,10752, PASSED ,7.85724e-06,12.0124,39.3421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,10874496, PASSED 
,0.0287662,3.31531,10.8684,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,10874496, PASSED ,0.000124111,768.417,2519.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,10874496, PASSED ,9.39571e-05,1015.03,3327.49,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,10874496, PASSED ,0.000169509,562.617,1844.39,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,10874496, PASSED ,9.31709e-05,1023.59,3355.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,10874496, PASSED ,0.000120007,794.696,2605.2,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,1359360, PASSED ,0.00358768,3.32293,10.8933,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,1359360, PASSED ,1.92679e-05,618.729,2028.33,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,1359360, PASSED 
,1.48749e-05,801.461,2627.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,1359360, PASSED ,2.58485e-05,461.21,1511.95,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,1359360, PASSED ,1.49845e-05,795.597,2608.14,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,1359360, PASSED ,1.86243e-05,640.111,2098.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,15929280, PASSED ,0.0420641,3.32111,10.8874,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,15929280, PASSED ,0.000176184,792.915,2599.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,15929280, PASSED ,0.000136873,1020.65,3345.94,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,15929280, PASSED ,0.000247461,564.531,1850.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,15929280, PASSED 
,0.000139345,1002.54,3286.56,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,15929280, PASSED ,0.000168882,827.198,2711.75,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,169920, PASSED ,0.000449126,3.31818,10.8771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,169920, PASSED ,9.70306e-06,153.589,503.47,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,169920, PASSED ,5.24762e-06,283.992,930.936,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,169920, PASSED ,1.16273e-05,128.171,420.15,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,169920, PASSED ,5.26184e-06,283.224,928.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,169920, PASSED ,8.50964e-06,175.128,574.078,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,21748800, PASSED 
,0.0574672,3.31904,10.8806,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,21748800, PASSED ,0.000237219,804.051,2635.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,21748800, PASSED ,0.000188966,1009.37,3308.95,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,21748800, PASSED ,0.000330231,577.583,1893.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,21748800, PASSED ,0.000191322,996.938,3268.2,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,21748800, PASSED ,0.000227255,839.303,2751.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,2718720, PASSED ,0.00720265,3.31033,10.852,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,2718720, PASSED ,3.29328e-05,723.994,2373.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,2718720, PASSED 
,2.49973e-05,953.827,3126.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,2718720, PASSED ,4.53858e-05,525.343,1722.19,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,2718720, PASSED ,2.51395e-05,948.432,3109.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,2718720, PASSED ,3.14616e-05,757.849,2484.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,31858560, PASSED ,0.0842107,3.31785,10.8767,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,31858560, PASSED ,0.00035829,779.81,2556.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,31858560, PASSED ,0.000284392,982.439,3220.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,31858560, PASSED ,0.000555495,502.972,1648.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,31858560, PASSED 
,0.000287991,970.163,3180.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,31858560, PASSED ,0.000345116,809.578,2653.99,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,339840, PASSED ,0.000905836,3.2903,10.7861,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,339840, PASSED ,1.09155e-05,273.05,895.096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,339840, PASSED ,7.26342e-06,410.34,1345.15,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,339840, PASSED ,1.28771e-05,231.455,758.743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,339840, PASSED ,7.32402e-06,406.945,1334.02,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,339840, PASSED ,9.75826e-06,305.431,1001.24,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,42624, PASSED 
,0.00011074,3.37636,11.0659,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,42624, PASSED ,8.65344e-06,43.2082,141.613,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,42624, PASSED ,4.45024e-06,84.0179,275.365,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,42624, PASSED ,1.08813e-05,34.3618,112.619,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,42624, PASSED ,4.49202e-06,83.2365,272.804,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,42624, PASSED ,7.92064e-06,47.2058,154.715,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,42477888, PASSED ,0.112431,3.3134,10.8621,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,42477888, PASSED ,0.000479021,777.689,2549.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,42477888, PASSED 
,0.000376279,990.035,3245.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,42477888, PASSED ,0.000753065,494.684,1621.69,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,42477888, PASSED ,0.000383214,972.117,3186.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,42477888, PASSED ,0.000460465,809.028,2652.19,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,5437248, PASSED ,0.0143904,3.31363,10.8628,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,5437248, PASSED ,6.12509e-05,778.511,2552.14,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,5437248, PASSED ,4.58848e-05,1039.22,3406.81,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,5437248, PASSED ,8.75493e-05,544.659,1785.52,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,5437248, PASSED 
,4.585e-05,1040.01,3409.39,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,5437248, PASSED ,5.92889e-05,804.273,2636.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_Seq,default,679680, PASSED ,0.00179864,3.31409,10.8642,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,679680, PASSED ,1.67109e-05,356.704,1169.34,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,Base_HIP,direct_64,679680, PASSED ,1.18949e-05,501.128,1642.79,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,679680, PASSED ,1.68273e-05,354.237,1161.26,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,679680, PASSED ,1.19329e-05,499.533,1637.56,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_64 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,679680, PASSED ,1.32735e-05,449.08,1472.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2744, PASSED 
,1.76963e-05,5.1525,1.39555,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2744, PASSED ,2.30361e-06,39.5814,10.7206,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2744, PASSED ,2.42171e-06,37.6512,10.1978,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,4096000, PASSED ,0.0279455,4.40936,1.31914,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,4096000, PASSED ,0.000167822,734.242,219.661,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,4096000, PASSED ,0.000167407,736.062,220.206,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,493039, PASSED ,0.00333371,4.49236,1.33105,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,493039, PASSED ,2.36951e-05,632.039,187.268,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,493039, PASSED 
,2.3417e-05,639.545,189.492,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,6028568, PASSED ,0.0408225,4.43761,1.3291,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,6028568, PASSED ,0.000243082,745.24,223.205,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,6028568, PASSED ,0.000242865,745.905,223.404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,54872, PASSED ,0.000363388,4.68254,1.35901,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,54872, PASSED ,5.00423e-06,340.028,98.6861,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,54872, PASSED ,4.51163e-06,377.154,109.461,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,8242408, PASSED ,0.0557438,4.43953,1.33076,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,8242408, PASSED 
,0.000326239,758.572,227.384,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,8242408, PASSED ,0.000325702,759.823,227.759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000000, PASSED ,0.006759,4.47608,1.33156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,1000000, PASSED ,4.37428e-05,691.63,205.748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,1000000, PASSED ,4.3776e-05,691.105,205.592,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,12167000, PASSED ,0.0821564,4.4425,1.33286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,12167000, PASSED ,0.000480409,759.727,227.937,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,12167000, PASSED ,0.000481516,757.981,227.413,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,117649, PASSED 
,0.000785798,4.60138,1.34747,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,117649, PASSED ,7.89024e-06,458.256,134.196,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,117649, PASSED ,7.65984e-06,472.04,138.233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,12167, PASSED ,8.00891e-05,4.83581,1.36726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,12167, PASSED ,2.62242e-06,147.687,41.7565,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,12167, PASSED ,2.59201e-06,149.419,42.2464,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,16194277, PASSED ,0.110612,4.38922,1.31766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,16194277, PASSED ,0.000624651,777.233,233.328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,16194277, PASSED 
,0.000625743,775.878,232.921,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2048383, PASSED ,0.0138464,4.46134,1.33143,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2048383, PASSED ,8.72264e-05,708.195,211.352,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2048383, PASSED ,8.65385e-05,713.825,213.032,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,238328, PASSED ,0.00158805,4.58258,1.35069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,238328, PASSED ,1.24791e-05,583.165,171.884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,238328, PASSED ,1.20186e-05,605.51,178.47,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,1331, PASSED ,1.29701e-05,7.06277,16.0597,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,1331, PASSED 
,2.85652e-06,32.0687,72.9195,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,1331, PASSED ,2.84803e-06,32.1643,73.1369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,2985984, PASSED ,0.0153918,6.22355,14.9582,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,2985984, PASSED ,7.77983e-05,1231.28,2959.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,2985984, PASSED ,7.82093e-05,1224.81,2943.81,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,343000, PASSED ,0.00174691,6.79477,16.244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,343000, PASSED ,9.58489e-06,1238.39,2960.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,343000, PASSED ,9.61098e-06,1235.03,2952.54,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,4410944, PASSED ,0.0225525,6.219,14.9566,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,4410944, PASSED 
,0.000115172,1217.78,2928.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,4410944, PASSED ,0.000115982,1209.27,2908.28,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,35937, PASSED ,0.000213364,6.82946,16.1433,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,35937, PASSED ,3.81023e-06,382.434,903.99,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,35937, PASSED ,3.07513e-06,473.854,1120.09,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,6028568, PASSED ,0.0300666,6.33519,15.2428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,6028568, PASSED ,0.000153507,1240.84,2985.54,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,6028568, PASSED ,0.00015537,1225.97,2949.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,704969, PASSED ,0.00354642,6.66757,15.9752,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,704969, PASSED 
,2.01284e-05,1174.76,2814.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,704969, PASSED ,2.02711e-05,1166.49,2794.85,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,8869743, PASSED ,0.0447857,6.21392,14.9584,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,8869743, PASSED ,0.000204717,1359.41,3272.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,8869743, PASSED ,0.000203806,1365.48,3287.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,79507, PASSED ,0.000441426,6.81901,16.1981,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,79507, PASSED ,4.51784e-06,666.267,1582.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,79507, PASSED ,3.94823e-06,762.389,1811.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,8000, PASSED ,6.04437e-05,6.44564,15.0352,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,8000, PASSED 
,2.92433e-06,133.227,310.767,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,8000, PASSED ,2.99732e-06,129.982,303.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,12008989, PASSED ,0.0613183,6.11479,14.7248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,12008989, PASSED ,0.000380677,984.951,2371.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,12008989, PASSED ,0.000368261,1018.16,2451.8,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,1442897, PASSED ,0.00728869,6.47818,15.5485,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,1442897, PASSED ,3.48778e-05,1353.8,3249.29,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,1442897, PASSED ,3.4181e-05,1381.39,3315.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_VOL3D,Base_Seq,default,166375, PASSED ,0.000874319,6.84974,16.3297,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_VOL3D,Base_HIP,block_256,166375, PASSED 
,5.87645e-06,1019.13,2429.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_VOL3D,RAJA_HIP,block_256,166375, PASSED ,5.68725e-06,1053.03,2510.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_DIFFUSION3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_DIFFUSION3DPA_bandwidth.png new file mode 100644 index 0000000..012d279 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_DIFFUSION3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_DIFFUSION3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_DIFFUSION3DPA_flops.png new file mode 100644 index 0000000..09e29c4 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_DIFFUSION3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_EDGE3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_EDGE3D_bandwidth.png new file mode 100644 index 0000000..a190136 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_EDGE3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_EDGE3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_EDGE3D_flops.png new file mode 100644 index 0000000..833c23e Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_EDGE3D_flops.png differ diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_ENERGY_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_ENERGY_bandwidth.png new file mode 100644 index 0000000..01f94e2 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_ENERGY_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_ENERGY_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_ENERGY_flops.png new file mode 100644 index 0000000..edac6e6 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_ENERGY_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_FEMSWEEP_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_FEMSWEEP_bandwidth.png new file mode 100644 index 0000000..dd9484a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_FEMSWEEP_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_FEMSWEEP_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_FEMSWEEP_flops.png new file mode 100644 index 0000000..f613b2e Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_FEMSWEEP_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_INTSC_HEXRECT_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_INTSC_HEXRECT_bandwidth.png new file mode 100644 index 0000000..e88cdf0 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_INTSC_HEXRECT_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_INTSC_HEXRECT_flops.png 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_INTSC_HEXRECT_flops.png new file mode 100644 index 0000000..58f8f59 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_INTSC_HEXRECT_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DEA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DEA_bandwidth.png new file mode 100644 index 0000000..e455fb7 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DEA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DEA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DEA_flops.png new file mode 100644 index 0000000..22588f0 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DEA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png new file mode 100644 index 0000000..0e1443b Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DPA_ATOMIC_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DPA_ATOMIC_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DPA_ATOMIC_flops.png new file mode 100644 index 0000000..3f52c8a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASS3DPA_ATOMIC_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASSVEC3DPA_bandwidth.png 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASSVEC3DPA_bandwidth.png new file mode 100644 index 0000000..575266f Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASSVEC3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASSVEC3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASSVEC3DPA_flops.png new file mode 100644 index 0000000..f38411e Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_MASSVEC3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png new file mode 100644 index 0000000..a4db1ad Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_NODAL_ACCUMULATION_3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_NODAL_ACCUMULATION_3D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_NODAL_ACCUMULATION_3D_flops.png new file mode 100644 index 0000000..2d58e44 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_NODAL_ACCUMULATION_3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_VOL3D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_VOL3D_bandwidth.png new file mode 100644 index 0000000..b8123da Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_VOL3D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_VOL3D_flops.png 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_VOL3D_flops.png new file mode 100644 index 0000000..21794ed Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/figures/Apps_VOL3D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/output_with_variant_tuning.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/output_with_variant_tuning.csv new file mode 100644 index 0000000..9ca7d10 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/output_with_variant_tuning.csv @@ -0,0 +1,436 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning,Smoothed Mean flops (gigaFLOP per sec.),Smoothed Bandwidth (GiB per sec.) +Apps_DIFFUSION3DPA,Base_Seq,default,783, PASSED ,1.52621e-05,6.59477,9.8788,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,9.8788,6.59477 +Apps_DIFFUSION3DPA,Base_HIP,block_64,783, PASSED ,3.94562e-06,25.5093,38.2122,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,148.572,99.0499 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,783, PASSED ,3.77782e-06,26.6423,39.9095,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,155.076,103.387 +Apps_DIFFUSION3DPA,Base_Seq,default,789048, PASSED ,0.034789,2.91033,4.36735,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.39209,2.92682 +Apps_DIFFUSION3DPA,Base_HIP,block_64,789048, PASSED 
,4.22642e-05,2395.58,3594.9,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,3357.58,2237.43 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,789048, PASSED ,4.10318e-05,2467.53,3702.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,3488.83,2324.9 +Apps_DIFFUSION3DPA,Base_Seq,default,98631, PASSED ,0.00206685,6.12336,9.18884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,9.18884,6.12336 +Apps_DIFFUSION3DPA,Base_HIP,block_64,98631, PASSED ,9.35384e-06,1353.03,2030.39,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,2030.39,1353.03 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,98631, PASSED ,9.02344e-06,1402.58,2104.73,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2104.73,1402.58 +Apps_DIFFUSION3DPA,Base_Seq,default,1155843, PASSED ,0.0506738,2.92682,4.39209,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,4.39209,2.92682 +Apps_DIFFUSION3DPA,Base_HIP,block_64,1155843, PASSED ,5.91221e-05,2508.59,3764.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,3357.58,2237.43 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,1155843, PASSED ,5.81985e-05,2548.4,3824.22,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,3488.83,2324.9 +Apps_DIFFUSION3DPA,Base_Seq,default,12339, PASSED 
,0.000256495,6.17346,9.2631,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,9.34422,6.227 +Apps_DIFFUSION3DPA,Base_HIP,block_64,12339, PASSED ,4.06142e-06,389.88,585.003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,585.003,389.88 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,12339, PASSED ,3.99682e-06,396.181,594.458,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,594.458,396.181 +Apps_DIFFUSION3DPA,Base_Seq,default,1578096, PASSED ,0.0670738,3.01898,4.5304,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,4.5304,3.01898 +Apps_DIFFUSION3DPA,Base_HIP,block_64,1578096, PASSED ,9.0503e-05,2237.43,3357.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,3357.58,2237.43 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,1578096, PASSED ,8.70982e-05,2324.9,3488.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,3488.83,2324.9 +Apps_DIFFUSION3DPA,Base_Seq,default,197262, PASSED ,0.00572334,4.42259,6.63667,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,6.63667,4.42259 +Apps_DIFFUSION3DPA,Base_HIP,block_64,197262, PASSED ,1.37453e-05,1841.5,2763.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,2763.42,1841.5 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,197262, PASSED 
,1.32539e-05,1909.78,2865.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2865.87,1909.78 +Apps_DIFFUSION3DPA,Base_Seq,default,2311659, PASSED ,0.0951131,3.11862,4.67993,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,4.5915300000000006,3.0597149999999997 +Apps_DIFFUSION3DPA,Base_HIP,block_64,2311659, PASSED ,0.00014653,2024.31,3037.75,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,3197.665,2130.87 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,2311659, PASSED ,0.000139678,2123.62,3186.78,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,3337.8050000000003,2224.26 +Apps_DIFFUSION3DPA,Base_Seq,default,24678, PASSED ,0.000509739,6.21249,9.32219,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,9.32219,6.21249 +Apps_DIFFUSION3DPA,Base_HIP,block_64,24678, PASSED ,4.56042e-06,694.399,1041.98,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,1041.98,694.399 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,24678, PASSED ,4.40162e-06,719.451,1079.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1079.58,719.451 +Apps_DIFFUSION3DPA,Base_Seq,default,3105, PASSED ,5.99091e-05,6.65339,9.97987,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,9.600495,6.40363 +Apps_DIFFUSION3DPA,Base_HIP,block_64,3105, 
PASSED ,4.02422e-06,99.0499,148.572,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,366.7875,244.46495 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,3105, PASSED ,3.85542e-06,103.387,155.076,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,374.767,249.784 +Apps_DIFFUSION3DPA,Base_Seq,default,3082212, PASSED ,0.127561,3.10045,4.65266,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,4.65266,3.10045 +Apps_DIFFUSION3DPA,Base_HIP,block_64,3082212, PASSED ,0.000204995,1929.3,2895.18,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,3037.75,2024.31 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,3082212, PASSED ,0.000196137,2016.42,3025.93,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,3186.78,2123.62 +Apps_DIFFUSION3DPA,Base_Seq,default,394524, PASSED ,0.0298307,1.69703,2.54663,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.39209,2.92682 +Apps_DIFFUSION3DPA,Base_HIP,block_64,394524, PASSED ,2.28123e-05,2219.14,3330.12,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,3330.12,2219.14 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,394524, PASSED ,2.22693e-05,2273.25,3411.32,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,3411.32,2273.25 +Apps_DIFFUSION3DPA,Base_Seq,default,49329, PASSED 
,0.00101652,6.227,9.34422,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,9.2631,6.17346 +Apps_DIFFUSION3DPA,Base_HIP,block_64,49329, PASSED ,6.11384e-06,1035.33,1553.62,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,1553.62,1035.33 +Apps_DIFFUSION3DPA,RAJA_HIP,block_64,49329, PASSED ,6.09682e-06,1038.22,1557.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/DIFFUSION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1557.96,1038.22 +Apps_EDGE3D,Base_Seq,default,1331, PASSED ,0.0045701,0.0200444,8.36483,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,8.36483,0.0195325 +Apps_EDGE3D,Base_HIP,block_256,1331, PASSED ,3.31972e-05,2.75942,1151.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,4989.71,11.6555 +Apps_EDGE3D,RAJA_HIP,block_256,1331, PASSED ,2.43981e-05,3.75459,1566.85,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,6813.73,15.9162 +Apps_EDGE3D,Base_Seq,default,2985984, PASSED ,5.0457,0.0189848,8.3743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,8.3743,0.0189935 +Apps_EDGE3D,Base_HIP,block_256,2985984, PASSED ,0.00150339,63.717,28106.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,28106.0,63.717 +Apps_EDGE3D,RAJA_HIP,block_256,2985984, PASSED 
,0.00149804,63.9446,28206.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,28206.4,63.9446 +Apps_EDGE3D,Base_Seq,default,343000, PASSED ,0.621116,0.0191105,8.3848,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,8.37836,0.0191105 +Apps_EDGE3D,Base_HIP,block_256,343000, PASSED ,0.000187528,63.2963,27771.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,26898.6,61.1716 +Apps_EDGE3D,RAJA_HIP,block_256,343000, PASSED ,0.000179909,65.9768,28947.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,27834.6,63.2589 +Apps_EDGE3D,Base_Seq,default,4410944, PASSED ,7.38432,0.0189935,8.38338,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,8.37918,0.0189848 +Apps_EDGE3D,Base_HIP,block_256,4410944, PASSED ,0.00219391,63.9287,28217.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,28217.0,63.9287 +Apps_EDGE3D,RAJA_HIP,block_256,4410944, PASSED ,0.00216035,64.9219,28655.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,28655.4,64.9219 +Apps_EDGE3D,Base_Seq,default,35937, PASSED ,0.0755259,0.0192935,8.3699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,8.3699,0.0192935 +Apps_EDGE3D,Base_HIP,block_256,35937, PASSED 
,3.48721e-05,41.7859,18127.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,18127.5,41.7859 +Apps_EDGE3D,RAJA_HIP,block_256,35937, PASSED ,2.66972e-05,54.5811,23678.3,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,23678.3,54.5811 +Apps_EDGE3D,Base_Seq,default,6028568, PASSED ,10.0335,0.0189842,8.38302,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,8.38257,0.0189842 +Apps_EDGE3D,Base_HIP,block_256,6028568, PASSED ,0.00294526,64.6727,28558.1,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,28558.1,64.6727 +Apps_EDGE3D,RAJA_HIP,block_256,6028568, PASSED ,0.00292489,65.1231,28757.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,28757.0,65.1231 +Apps_EDGE3D,Base_Seq,default,704969, PASSED ,1.24175,0.0190425,8.37346,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,8.3743,0.0190425 +Apps_EDGE3D,Base_HIP,block_256,704969, PASSED ,0.000386552,61.1716,26898.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,27771.5,63.2963 +Apps_EDGE3D,RAJA_HIP,block_256,704969, PASSED ,0.000373554,63.3001,27834.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,27864.9,63.3001 +Apps_EDGE3D,Base_Seq,default,8869743, PASSED 
,14.6732,0.0189662,8.37918,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,8.382795,0.0189758 +Apps_EDGE3D,Base_HIP,block_256,8869743, PASSED ,0.00427903,65.0368,28733.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,28586.55,64.71015 +Apps_EDGE3D,RAJA_HIP,block_256,8869743, PASSED ,0.00424764,65.5175,28945.3,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,28847.5,65.3008 +Apps_EDGE3D,Base_Seq,default,79507, PASSED ,0.156569,0.0192253,8.38141,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,8.37836,0.0192253 +Apps_EDGE3D,Base_HIP,block_256,79507, PASSED ,6.01914e-05,50.0086,21801.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,21801.6,50.0086 +Apps_EDGE3D,RAJA_HIP,block_256,79507, PASSED ,5.02532e-05,59.8984,26113.1,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,25705.7,58.752 +Apps_EDGE3D,Base_Seq,default,8000, PASSED ,0.0199461,0.0195325,8.36188,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,8.367365,0.019413 +Apps_EDGE3D,Base_HIP,block_256,8000, PASSED ,3.34262e-05,11.6555,4989.71,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,11558.605,26.7207 +Apps_EDGE3D,RAJA_HIP,block_256,8000, PASSED 
,2.44781e-05,15.9162,6813.73,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,15246.015,35.24865 +Apps_EDGE3D,Base_Seq,default,12008989, PASSED ,19.7681,0.0189674,8.38257,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,8.38257,0.0189674 +Apps_EDGE3D,Base_HIP,block_256,12008989, PASSED ,0.00579093,64.7476,28615.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,28615.0,64.7476 +Apps_EDGE3D,RAJA_HIP,block_256,12008989, PASSED ,0.00572628,65.4785,28938.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,28938.0,65.4785 +Apps_EDGE3D,Base_Seq,default,1442897, PASSED ,2.48444,0.0190052,8.37162,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,8.3743,0.0190052 +Apps_EDGE3D,Base_HIP,block_256,1442897, PASSED ,0.000745835,63.3082,27886.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,27886.6,63.3082 +Apps_EDGE3D,RAJA_HIP,block_256,1442897, PASSED ,0.000746416,63.2589,27864.9,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,28206.4,63.9446 +Apps_EDGE3D,Base_Seq,default,166375, PASSED ,0.312746,0.0191493,8.37836,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,8.37836,0.0191493 +Apps_EDGE3D,Base_HIP,block_256,166375, PASSED 
,0.000105301,56.8739,24884.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,24884.0,56.8739 +Apps_EDGE3D,RAJA_HIP,block_256,166375, PASSED ,0.000101935,58.752,25705.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/EDGE3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,26113.1,59.8984 +Apps_ENERGY,Base_Seq,default,834, PASSED ,4.14395e-06,40.4861,11.0692,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,11.0692,40.4861 +Apps_ENERGY,Base_HIP,block_256,834, PASSED ,1.15341e-05,14.5457,3.97689,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,15.6587,57.2725 +Apps_ENERGY,RAJA_HIP,block_256,834, PASSED ,1.19728e-05,14.0127,3.83117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,14.9557,54.7015 +Apps_ENERGY,Base_Seq,default,853334, PASSED ,0.00643223,26.6877,7.29659,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,7.29659,26.6877 +Apps_ENERGY,Base_HIP,block_256,853334, PASSED ,6.0447e-05,2839.87,776.438,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,776.438,2839.87 +Apps_ENERGY,RAJA_HIP,block_256,853334, PASSED ,6.00405e-05,2859.1,781.695,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,781.695,2859.1 +Apps_ENERGY,Base_Seq,default,106667, PASSED 
,0.000533405,40.2279,10.9986,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.766,39.3772 +Apps_ENERGY,Base_HIP,block_256,106667, PASSED ,1.40628e-05,1525.85,417.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,417.176,1525.85 +Apps_ENERGY,RAJA_HIP,block_256,106667, PASSED ,1.40413e-05,1528.19,417.816,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,417.816,1528.19 +Apps_ENERGY,Base_Seq,default,1250000, PASSED ,0.00951771,26.4199,7.22338,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,7.2517,26.5235 +Apps_ENERGY,Base_HIP,block_256,1250000, PASSED ,8.24619e-05,3049.37,833.718,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,833.718,3049.37 +Apps_ENERGY,RAJA_HIP,block_256,1250000, PASSED ,8.25312e-05,3046.81,833.018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,833.018,3046.81 +Apps_ENERGY,Base_Seq,default,13334, PASSED ,7.0189e-05,38.216,10.4485,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.766,39.3772 +Apps_ENERGY,Base_HIP,block_256,13334, PASSED ,1.2856e-05,208.645,57.045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,57.045,208.645 +Apps_ENERGY,RAJA_HIP,block_256,13334, PASSED 
,1.19919e-05,223.679,61.1554,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,61.1554,223.679 +Apps_ENERGY,Base_Seq,default,1706667, PASSED ,0.0129441,26.5235,7.2517,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,7.23801,26.4735 +Apps_ENERGY,Base_HIP,block_256,1706667, PASSED ,0.000107501,3193.68,873.173,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,873.173,3193.68 +Apps_ENERGY,RAJA_HIP,block_256,1706667, PASSED ,0.00010817,3173.91,867.768,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,867.768,3173.91 +Apps_ENERGY,Base_Seq,default,213334, PASSED ,0.00107605,39.8824,10.9041,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.766,39.3772 +Apps_ENERGY,Base_HIP,block_256,213334, PASSED ,1.93483e-05,2218.04,606.428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,606.428,2218.04 +Apps_ENERGY,RAJA_HIP,block_256,213334, PASSED ,1.89296e-05,2267.1,619.841,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,619.841,2267.1 +Apps_ENERGY,Base_Seq,default,2500000, PASSED ,0.0189969,26.4735,7.23801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,7.230695,26.4467 +Apps_ENERGY,Base_HIP,block_256,2500000, PASSED 
,0.000150975,3331.12,910.749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,891.961,3262.3999999999996 +Apps_ENERGY,RAJA_HIP,block_256,2500000, PASSED ,0.000151074,3328.94,910.152,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,888.96,3251.425 +Apps_ENERGY,Base_Seq,default,26667, PASSED ,0.000139004,38.5922,10.5514,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.766,39.3772 +Apps_ENERGY,Base_HIP,block_256,26667, PASSED ,1.29641e-05,413.794,113.134,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,113.134,413.794 +Apps_ENERGY,RAJA_HIP,block_256,26667, PASSED ,1.21971e-05,439.815,120.248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,120.248,439.815 +Apps_ENERGY,Base_Seq,default,3334, PASSED ,1.61679e-05,41.4825,11.3416,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.8103,39.53915 +Apps_ENERGY,Base_HIP,block_256,3334, PASSED ,1.17104e-05,57.2725,15.6587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,36.35185,132.95875 +Apps_ENERGY,RAJA_HIP,block_256,3334, PASSED ,1.22608e-05,54.7015,14.9557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,38.05555,139.19025 +Apps_ENERGY,Base_Seq,default,3333334, PASSED 
,0.0254586,26.339,7.20124,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,7.23801,26.4735 +Apps_ENERGY,Base_HIP,block_256,3333334, PASSED ,0.000198461,3378.76,923.776,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,910.749,3331.12 +Apps_ENERGY,RAJA_HIP,block_256,3333334, PASSED ,0.000198093,3385.04,925.493,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,910.152,3328.94 +Apps_ENERGY,Base_Seq,default,426667, PASSED ,0.00249307,34.4278,9.41277,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,9.41277,34.4278 +Apps_ENERGY,Base_HIP,block_256,426667, PASSED ,3.15686e-05,2718.87,743.356,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,743.356,2718.87 +Apps_ENERGY,RAJA_HIP,block_256,426667, PASSED ,3.12816e-05,2743.81,750.174,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,750.174,2743.81 +Apps_ENERGY,Base_Seq,default,53334, PASSED ,0.000272467,39.3772,10.766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.766,39.3772 +Apps_ENERGY,Base_HIP,block_256,53334, PASSED ,1.24929e-05,858.804,234.803,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,234.803,858.804 +Apps_ENERGY,RAJA_HIP,block_256,53334, PASSED 
,1.24885e-05,859.106,234.885,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/ENERGY_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,234.885,859.106 +Apps_FEMSWEEP,Base_Seq,default,839808, PASSED ,0.314054,0.448329,2.32824,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,2.32824,0.448329 +Apps_FEMSWEEP,Base_HIP,block_64,839808, PASSED ,0.000686444,205.115,1065.19,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,986.771,191.136 +Apps_FEMSWEEP,RAJA_HIP,block_64,839808, PASSED ,0.000634834,221.79,1151.79,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1003.73,194.421 +Apps_FEMSWEEP,Base_Seq,default,144000, PASSED ,0.0390188,0.592812,3.16205,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,3.01734,0.541864 +Apps_FEMSWEEP,Base_HIP,block_64,144000, PASSED ,0.000228331,101.304,540.352,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,540.352,101.304 +Apps_FEMSWEEP,RAJA_HIP,block_64,144000, PASSED ,0.000209351,110.488,589.341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,589.341,110.488 +Apps_FEMSWEEP,Base_Seq,default,1152000, PASSED ,0.461941,0.420301,2.17561,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,2.26231,0.438205 +Apps_FEMSWEEP,Base_HIP,block_64,1152000, PASSED 
,0.000927976,209.224,1083.01,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,1065.19,205.115 +Apps_FEMSWEEP,RAJA_HIP,block_64,1152000, PASSED ,0.000880425,220.524,1141.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1141.5,220.524 +Apps_FEMSWEEP,Base_Seq,default,1533312, PASSED ,0.592243,0.438205,2.26231,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,2.22341,0.432411 +Apps_FEMSWEEP,Base_HIP,block_64,1533312, PASSED ,0.0013578,191.136,986.771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,1065.19,206.848 +Apps_FEMSWEEP,RAJA_HIP,block_64,1533312, PASSED ,0.00133486,194.421,1003.73,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1141.5,220.524 +Apps_FEMSWEEP,Base_Seq,default,248832, PASSED ,0.0779046,0.521471,2.75328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,2.75328,0.521471 +Apps_FEMSWEEP,Base_HIP,block_64,248832, PASSED ,0.000290232,139.974,739.04,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,739.04,139.974 +Apps_FEMSWEEP,RAJA_HIP,block_64,248832, PASSED ,0.000274901,147.78,780.256,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,780.256,147.78 +Apps_FEMSWEEP,Base_Seq,default,2530944, PASSED 
,0.997166,0.432411,2.22341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,2.22007,0.432411 +Apps_FEMSWEEP,Base_HIP,block_64,2530944, PASSED ,0.00200299,215.271,1106.9,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,1061.91,206.848 +Apps_FEMSWEEP,RAJA_HIP,block_64,2530944, PASSED ,0.00189379,227.684,1170.72,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1072.33,209.161 +Apps_FEMSWEEP,Base_Seq,default,31104, PASSED ,0.00861784,0.541864,3.01734,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,3.16205,0.592812 +Apps_FEMSWEEP,Base_HIP,block_64,31104, PASSED ,0.00011377,41.0451,228.557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,372.233,68.6976 +Apps_FEMSWEEP,RAJA_HIP,block_64,31104, PASSED ,0.00010736,43.4957,242.203,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,408.902,75.465 +Apps_FEMSWEEP,Base_Seq,default,3161088, PASSED ,1.25196,0.431259,2.21399,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,2.22007,0.432411 +Apps_FEMSWEEP,Base_HIP,block_64,3161088, PASSED ,0.00261022,206.848,1061.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,1024.31,199.795 +Apps_FEMSWEEP,RAJA_HIP,block_64,3161088, PASSED 
,0.00259887,207.751,1066.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1066.55,207.751 +Apps_FEMSWEEP,Base_Seq,default,3888000, PASSED ,1.53694,0.433031,2.22007,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,2.2170300000000003,0.43183499999999997 +Apps_FEMSWEEP,Base_HIP,block_64,3888000, PASSED ,0.00333112,199.795,1024.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_5000-kernel-run-data.csv,HIP,Base_HIP-block_64,1043.1100000000001,203.32150000000001 +Apps_FEMSWEEP,RAJA_HIP,block_64,3888000, PASSED ,0.00318197,209.161,1072.33,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1069.44,208.45600000000002 +Apps_FEMSWEEP,Base_Seq,default,395136, PASSED ,0.143758,0.453919,2.37951,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,2.37951,0.453919 +Apps_FEMSWEEP,Base_HIP,block_64,395136, PASSED ,0.000379102,172.13,902.329,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,902.329,172.13 +Apps_FEMSWEEP,RAJA_HIP,block_64,395136, PASSED ,0.000359132,181.701,952.505,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,952.505,181.701 +Apps_FEMSWEEP,Base_Seq,default,4718592, PASSED ,1.96638,0.411559,2.10748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,2.21399,0.431259 +Apps_FEMSWEEP,Base_HIP,block_64,4718592, PASSED 
,0.00409937,197.416,1010.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_6000-kernel-run-data.csv,HIP,Base_HIP-block_64,1024.31,199.795 +Apps_FEMSWEEP,RAJA_HIP,block_64,4718592, PASSED ,0.00397009,203.844,1043.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1066.55,207.751 +Apps_FEMSWEEP,Base_Seq,default,73728, PASSED ,0.0188448,0.613022,3.32161,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,3.089695,0.567338 +Apps_FEMSWEEP,Base_HIP,block_64,73728, PASSED ,0.000168161,68.6976,372.233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,456.2925,85.0008 +Apps_FEMSWEEP,RAJA_HIP,block_64,73728, PASSED ,0.000153081,75.465,408.902,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/FEMSWEEP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,499.12149999999997,92.9765 +Apps_INTSC_HEXRECT,Base_Seq,default,2744, PASSED ,0.00237766,0.0521051,4.15467,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.26245,0.0528136 +Apps_INTSC_HEXRECT,Base_HIP,block_64,2744, PASSED ,0.000247931,0.499688,39.8433,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,156.211,1.93552 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,2744, PASSED ,0.000255541,0.484808,38.6568,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,151.303,1.87471 +Apps_INTSC_HEXRECT,Base_Seq,default,2197000, PASSED 
,1.81711,0.0530816,4.35263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.34214,0.0529303 +Apps_INTSC_HEXRECT,Base_HIP,block_64,2197000, PASSED ,0.00856661,11.2594,923.259,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,923.259,11.2594 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,2197000, PASSED ,0.00873471,11.0427,905.491,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,905.491,11.0427 +Apps_INTSC_HEXRECT,Base_Seq,default,287496, PASSED ,0.238713,0.0530326,4.33569,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.33569,0.0530326 +Apps_INTSC_HEXRECT,Base_HIP,block_64,287496, PASSED ,0.00122388,10.3438,845.661,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,845.661,10.3438 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,287496, PASSED ,0.00123404,10.2587,838.699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,838.699,10.2587 +Apps_INTSC_HEXRECT,Base_Seq,default,3241792, PASSED ,2.68792,0.0529303,4.34181,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,4.34214,0.0529303 +Apps_INTSC_HEXRECT,Base_HIP,block_64,3241792, PASSED ,0.0125309,11.3537,931.332,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,923.259,11.2594 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,3241792, PASSED 
,0.0125623,11.3253,929.002,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,922.552,11.2406 +Apps_INTSC_HEXRECT,Base_Seq,default,39304, PASSED ,0.0327669,0.0531318,4.31822,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.31311,0.0528441 +Apps_INTSC_HEXRECT,Base_HIP,block_64,39304, PASSED ,0.000272142,6.39726,519.929,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,519.929,6.39726 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,39304, PASSED ,0.000269421,6.46187,525.18,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,525.18,6.46187 +Apps_INTSC_HEXRECT,Base_Seq,default,4410944, PASSED ,3.65704,0.0529206,4.34214,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,4.34181,0.0529206 +Apps_INTSC_HEXRECT,Base_HIP,block_64,4410944, PASSED ,0.0170731,11.3355,930.082,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,930.082,11.3355 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,4410944, PASSED ,0.0170853,11.3275,929.419,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,929.002,11.3253 +Apps_INTSC_HEXRECT,Base_Seq,default,551368, PASSED ,0.458565,0.0528825,4.32856,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.33569,0.0530326 +Apps_INTSC_HEXRECT,Base_HIP,block_64,551368, PASSED 
,0.00231902,10.457,855.931,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,855.931,10.457 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,551368, PASSED ,0.0023197,10.454,855.681,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,855.681,10.454 +Apps_INTSC_HEXRECT,Base_Seq,default,6434856, PASSED ,5.37347,0.0525273,4.31109,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,4.336895,0.05284585 +Apps_INTSC_HEXRECT,Base_HIP,block_64,6434856, PASSED ,0.0251272,11.233,921.93,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,930.707,11.3446 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,6434856, PASSED ,0.0251102,11.2406,922.552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,929.2104999999999,11.3264 +Apps_INTSC_HEXRECT,Base_Seq,default,74088, PASSED ,0.0613179,0.0533937,4.34974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.31822,0.0530326 +Apps_INTSC_HEXRECT,Base_HIP,block_64,74088, PASSED ,0.000477222,6.86053,558.895,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,558.895,6.86053 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,74088, PASSED ,0.000477652,6.85435,558.391,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,558.391,6.85435 +Apps_INTSC_HEXRECT,Base_Seq,default,10648, PASSED 
,0.00899313,0.0528136,4.26245,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.290335000000001,0.0529727 +Apps_INTSC_HEXRECT,Base_HIP,block_64,10648, PASSED ,0.000245391,1.93552,156.211,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,338.07,4.16639 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,10648, PASSED ,0.000253351,1.87471,151.303,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,338.2415,4.16829 +Apps_INTSC_HEXRECT,Base_Seq,default,8741816, PASSED ,7.26471,0.0527711,4.33198,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,4.33198,0.0527711 +Apps_INTSC_HEXRECT,Base_HIP,block_64,8741816, PASSED ,0.0337429,11.3614,932.657,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,930.082,11.3355 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,8741816, PASSED ,0.0337994,11.3424,931.096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,929.419,11.3275 +Apps_INTSC_HEXRECT,Base_Seq,default,1124864, PASSED ,0.93186,0.0530364,4.34562,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.34181,0.0530326 +Apps_INTSC_HEXRECT,Base_HIP,block_64,1124864, PASSED ,0.00448612,11.0168,902.675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,902.675,11.0168 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,1124864, PASSED 
,0.00448414,11.0216,903.073,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,903.073,11.0216 +Apps_INTSC_HEXRECT,Base_Seq,default,140608, PASSED ,0.117361,0.0528441,4.31311,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.32856,0.0530326 +Apps_INTSC_HEXRECT,Base_HIP,block_64,140608, PASSED ,0.000711863,8.71209,711.076,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,711.076,8.71209 +Apps_INTSC_HEXRECT,RAJA_HIP,block_64,140608, PASSED ,0.000716213,8.65917,706.757,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/INTSC_HEXRECT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,706.757,8.65917 +Apps_MASS3DEA,Base_Seq,default,12423168, PASSED ,1.08488,0.0879218,0.0801583,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.0803397,0.0881212 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.000475963,200.404,182.708,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,161.626,177.28 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,12423168, PASSED ,0.00234094,40.7463,37.1484,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,37.1484,40.7463 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,12423168, PASSED 
,0.000517623,184.274,168.003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,168.003,184.274 +Apps_MASS3DEA,Base_Seq,default,1556480, PASSED ,0.13504,0.0884974,0.0806822,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.0806808,0.0884974 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.000242861,49.2081,44.8625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,44.8625,49.2081 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,1556480, PASSED ,0.000493563,24.2132,22.0749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,22.0749,24.2132 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,1556480, PASSED ,0.000268891,44.4445,40.5196,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,40.5196,44.4445 +Apps_MASS3DEA,Base_Seq,default,18198528, PASSED ,1.58544,0.0881316,0.0803496,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.0803496,0.0881316 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,18198528, PASSED ,0.000658503,212.19,193.453,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,170.032,186.5 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,18198528, PASSED 
,0.00312076,44.7736,40.8201,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,38.7535,42.5068 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,18198528, PASSED ,0.000553713,252.347,230.064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,177.172,194.332 +Apps_MASS3DEA,Base_Seq,default,24842240, PASSED ,2.15621,0.0884596,0.0806487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,0.0804058,0.0881932 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,24842240, PASSED ,0.00116103,164.284,149.777,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,182.708,200.404 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,24842240, PASSED ,0.00448723,42.5068,38.7535,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,38.9138,42.6827 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,24842240, PASSED ,0.000981506,194.332,177.172,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,214.176,234.919 +Apps_MASS3DEA,Base_Seq,default,3108864, PASSED ,0.270875,0.0881212,0.0803397,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.0803397,0.0881212 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,3108864, PASSED 
,0.000268882,88.7745,80.9353,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,80.9353,88.7745 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,3108864, PASSED ,0.000621283,38.4203,35.0276,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,35.0276,38.4203 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,3108864, PASSED ,0.000295001,80.9145,73.7694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,73.7694,80.9145 +Apps_MASS3DEA,Base_Seq,default,36392960, PASSED ,3.16617,0.0882529,0.0804602,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.0804602,0.0882529 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,36392960, PASSED ,0.00149825,186.5,170.032,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,185.948,203.957 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,36392960, PASSED ,0.0064397,43.3908,39.5594,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,39.2686,43.0718 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,36392960, PASSED ,0.00113517,246.152,224.417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,224.417,246.152 +Apps_MASS3DEA,Base_Seq,default,389120, PASSED 
,0.0337607,0.0884992,0.0806808,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.0806822,0.0884992 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,389120, PASSED ,0.000213251,14.0107,12.7729,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,24.697,27.0896 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,389120, PASSED ,0.000410102,7.28549,6.64186,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,12.4963,13.707 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,389120, PASSED ,0.000244311,12.2295,11.1491,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,21.9424,24.0681 +Apps_MASS3DEA,Base_Seq,default,48521216, PASSED ,4.22418,0.0881932,0.0804058,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.0804602,0.0882529 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,48521216, PASSED ,0.00182658,203.957,185.948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,185.948,203.957 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,48521216, PASSED ,0.00872822,42.6827,38.9138,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,39.2686,43.0718 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,48521216, PASSED 
,0.00158584,234.919,214.176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,224.417,246.152 +Apps_MASS3DEA,Base_Seq,default,60649472, PASSED ,5.27048,0.0883532,0.0805517,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,0.080433,0.08822305 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,60649472, PASSED ,0.00225322,206.666,188.417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,187.1825,205.3115 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,60649472, PASSED ,0.0108113,43.0718,39.2686,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,39.414,43.231300000000005 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,60649472, PASSED ,0.00165346,281.63,256.763,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,235.2885,258.0765 +Apps_MASS3DEA,Base_Seq,default,6213632, PASSED ,0.542445,0.0879501,0.080184,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.0803397,0.0881212 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,6213632, PASSED ,0.000269112,177.28,161.626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,161.626,177.28 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,6213632, PASSED 
,0.0011904,40.0775,36.5386,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,36.5386,40.0775 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,6213632, PASSED ,0.000329122,144.956,132.156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,132.156,144.956 +Apps_MASS3DEA,Base_Seq,default,72781824, PASSED ,6.34614,0.0880561,0.0802808,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,0.0804058,0.0881932 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,72781824, PASSED ,0.00254404,219.656,200.261,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,188.417,206.666 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,72781824, PASSED ,0.0122295,45.694,41.6593,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,39.2686,43.0718 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,72781824, PASSED ,0.00206968,270.001,246.16,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,246.16,270.001 +Apps_MASS3DEA,Base_Seq,default,778240, PASSED ,0.0675182,0.0885011,0.0806846,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.08068149999999999,0.0884983 +Apps_MASS3DEA,Base_HIP,compile_time_block_stride_loop_64,778240, PASSED 
,0.000220581,27.0896,24.697,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,Base_HIP-compile_time_block_stride_loop_64,34.77975,38.14885 +Apps_MASS3DEA,RAJA_HIP,compile_time_block_stride_loop_64,778240, PASSED ,0.000435942,13.707,12.4963,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-compile_time_block_stride_loop_64,17.2856,18.9601 +Apps_MASS3DEA,RAJA_HIP,cached_block_stride_loop_64,778240, PASSED ,0.000248272,24.0681,21.9424,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DEA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,31.230999999999998,34.256299999999996 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1331, PASSED ,2.26429e-05,5.06074,10.3068,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,10.3068,4.9594 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,1331, PASSED ,3.27882e-06,34.9485,71.1765,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,281.662,134.669 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,1331, PASSED ,3.3538e-06,34.1672,69.5852,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,275.031,131.499 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1030301, PASSED ,0.0252795,4.26351,9.23179,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,9.23179,4.26351 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,1030301, PASSED 
,9.38549e-05,1148.36,2486.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,2460.23,1140.66 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,1030301, PASSED ,9.45637e-05,1139.76,2467.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2467.91,1139.76 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,132651, PASSED ,0.0028862,4.69783,10.1074,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.04,4.69783 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,132651, PASSED ,1.26401e-05,1072.69,2307.89,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,2307.89,1072.69 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,132651, PASSED ,1.25977e-05,1076.3,2315.66,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2315.66,1076.3 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,1442897, PASSED ,0.03543,4.27094,9.25416,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,9.23179,4.26351 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,1442897, PASSED ,0.000137042,1104.19,2392.52,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,2392.52,1104.19 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,1442897, PASSED ,0.000134097,1128.44,2445.07,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2445.07,1128.44 
+Apps_MASS3DPA_ATOMIC,Base_Seq,default,19683, PASSED ,0.000409404,4.71322,10.019,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.1523,4.734 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,19683, PASSED ,4.81102e-06,401.081,852.584,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,852.584,401.081 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,19683, PASSED ,4.87002e-06,396.222,842.255,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,842.255,396.222 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,2048383, PASSED ,0.0512858,4.19839,9.10268,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,9.25416,4.26945 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,2048383, PASSED ,0.000197218,1091.77,2367.11,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,2367.11,1091.77 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,2048383, PASSED ,0.000196781,1094.2,2372.38,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2372.38,1094.2 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,250047, PASSED ,0.00556204,4.63633,9.9999,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,9.9999,4.63633 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,250047, PASSED ,2.26075e-05,1140.66,2460.23,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,2460.23,1140.66 
+Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,250047, PASSED ,2.23367e-05,1154.49,2490.06,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2467.91,1139.76 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,2924207, PASSED ,0.0721465,4.26945,9.26198,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,9.25807,4.270195 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,2924207, PASSED ,0.000298031,1033.54,2242.11,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,2304.61,1062.655 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,2924207, PASSED ,0.000302046,1019.8,2212.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2292.3450000000003,1057.0 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,35937, PASSED ,0.000761674,4.70075,10.04,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.1074,4.71322 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,35937, PASSED ,6.01042e-06,595.706,1272.33,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,1272.33,595.706 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,35937, PASSED ,6.10704e-06,586.281,1252.2,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1252.2,586.281 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,4913, PASSED 
,9.21565e-05,4.9594,10.3726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.1734,4.836309999999999 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,4913, PASSED ,3.3938e-06,134.669,281.662,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,567.1229999999999,267.875 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,4913, PASSED ,3.47562e-06,131.499,275.031,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,558.643,263.8605 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,3869893, PASSED ,0.0952186,4.28746,9.30478,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,9.26198,4.26945 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,3869893, PASSED ,0.00040835,999.747,2169.68,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,2242.11,1033.54 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,3869893, PASSED ,0.000409569,996.77,2163.22,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2212.31,1019.8 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,531441, PASSED ,0.0133381,4.14383,8.95839,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,9.25416,4.27094 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,531441, PASSED ,4.74962e-05,1163.69,2515.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,2460.23,1140.66 
+Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,531441, PASSED ,4.82218e-05,1146.18,2477.88,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2467.91,1139.76 +Apps_MASS3DPA_ATOMIC,Base_Seq,default,68921, PASSED ,0.00147119,4.734,10.1523,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.04,4.70075 +Apps_MASS3DPA_ATOMIC,Base_HIP,block_64,68921, PASSED ,8.39866e-06,829.253,1778.38,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,1778.38,829.253 +Apps_MASS3DPA_ATOMIC,RAJA_HIP,block_64,68921, PASSED ,8.42884e-06,826.284,1772.01,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASS3DPA_ATOMIC_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1772.01,826.284 +Apps_MASSVEC3DPA,Base_Seq,default,10752, PASSED ,2.8153e-05,3.35254,10.98,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,10.98,3.35254 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,10752, PASSED ,8.60544e-06,10.9679,35.9215,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,141.613,43.2082 +Apps_MASSVEC3DPA,Base_HIP,direct_64,10752, PASSED ,4.36904e-06,21.6029,70.7524,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-direct_64,275.365,84.0179 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,10752, PASSED 
,1.08205e-05,8.72273,28.5681,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,112.619,34.3618 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,10752, PASSED ,4.39602e-06,21.4703,70.3182,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,272.804,83.2365 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,10752, PASSED ,7.85724e-06,12.0124,39.3421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,154.715,47.2058 +Apps_MASSVEC3DPA,Base_Seq,default,10874496, PASSED ,0.0287662,3.31531,10.8684,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,10.8684,3.31531 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,10874496, PASSED ,0.000124111,768.417,2519.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2552.14,778.511 +Apps_MASSVEC3DPA,Base_HIP,direct_64,10874496, PASSED ,9.39571e-05,1015.03,3327.49,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_64,3327.49,1015.03 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,10874496, PASSED ,0.000169509,562.617,1844.39,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1844.39,562.617 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,10874496, PASSED 
,9.31709e-05,1023.59,3355.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3286.56,1002.54 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,10874496, PASSED ,0.000120007,794.696,2605.2,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2636.6,804.273 +Apps_MASSVEC3DPA,Base_Seq,default,1359360, PASSED ,0.00358768,3.32293,10.8933,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,10.8628,3.31363 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,1359360, PASSED ,1.92679e-05,618.729,2028.33,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2028.33,618.729 +Apps_MASSVEC3DPA,Base_HIP,direct_64,1359360, PASSED ,1.48749e-05,801.461,2627.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_64,2627.36,801.461 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,1359360, PASSED ,2.58485e-05,461.21,1511.95,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1511.95,461.21 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,1359360, PASSED ,1.49845e-05,795.597,2608.14,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,2608.14,795.597 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,1359360, PASSED 
,1.86243e-05,640.111,2098.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2098.42,640.111 +Apps_MASSVEC3DPA,Base_Seq,default,15929280, PASSED ,0.0420641,3.32111,10.8874,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,10.8767,3.31785 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,15929280, PASSED ,0.000176184,792.915,2599.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2556.4,779.81 +Apps_MASSVEC3DPA,Base_HIP,direct_64,15929280, PASSED ,0.000136873,1020.65,3345.94,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_64,3327.49,1015.03 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,15929280, PASSED ,0.000247461,564.531,1850.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1844.39,562.617 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,15929280, PASSED ,0.000139345,1002.54,3286.56,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3286.56,1002.54 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,15929280, PASSED ,0.000168882,827.198,2711.75,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2653.99,809.578 +Apps_MASSVEC3DPA,Base_Seq,default,169920, PASSED 
,0.000449126,3.31818,10.8771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,10.8771,3.31818 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,169920, PASSED ,9.70306e-06,153.589,503.47,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,503.47,153.589 +Apps_MASSVEC3DPA,Base_HIP,direct_64,169920, PASSED ,5.24762e-06,283.992,930.936,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-direct_64,930.936,283.992 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,169920, PASSED ,1.16273e-05,128.171,420.15,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,420.15,128.171 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,169920, PASSED ,5.26184e-06,283.224,928.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,928.42,283.224 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,169920, PASSED ,8.50964e-06,175.128,574.078,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,574.078,175.128 +Apps_MASSVEC3DPA,Base_Seq,default,21748800, PASSED ,0.0574672,3.31904,10.8806,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,10.8767,3.31785 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,21748800, PASSED 
,0.000237219,804.051,2635.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2556.4,779.81 +Apps_MASSVEC3DPA,Base_HIP,direct_64,21748800, PASSED ,0.000188966,1009.37,3308.95,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-direct_64,3308.95,1009.37 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,21748800, PASSED ,0.000330231,577.583,1893.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1844.39,562.617 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,21748800, PASSED ,0.000191322,996.938,3268.2,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3268.2,996.938 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,21748800, PASSED ,0.000227255,839.303,2751.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2653.99,809.578 +Apps_MASSVEC3DPA,Base_Seq,default,2718720, PASSED ,0.00720265,3.31033,10.852,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,10.8642,3.31409 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,2718720, PASSED ,3.29328e-05,723.994,2373.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2373.42,723.994 +Apps_MASSVEC3DPA,Base_HIP,direct_64,2718720, PASSED 
,2.49973e-05,953.827,3126.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_64,3126.86,953.827 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,2718720, PASSED ,4.53858e-05,525.343,1722.19,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1722.19,525.343 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,2718720, PASSED ,2.51395e-05,948.432,3109.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3109.17,948.432 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,2718720, PASSED ,3.14616e-05,757.849,2484.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2484.4,757.849 +Apps_MASSVEC3DPA,Base_Seq,default,31858560, PASSED ,0.0842107,3.31785,10.8767,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,10.87865,3.318445 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,31858560, PASSED ,0.00035829,779.81,2556.4,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2577.88,786.3625 +Apps_MASSVEC3DPA,Base_HIP,direct_64,31858560, PASSED ,0.000284392,982.439,3220.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-direct_64,3277.26,999.7025 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,31858560, PASSED 
,0.000555495,502.972,1648.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1749.7649999999999,533.7515 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,31858560, PASSED ,0.000287991,970.163,3180.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3227.515,984.5274999999999 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,31858560, PASSED ,0.000345116,809.578,2653.99,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2682.87,818.3879999999999 +Apps_MASSVEC3DPA,Base_Seq,default,339840, PASSED ,0.000905836,3.2903,10.7861,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,10.8771,3.31818 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,339840, PASSED ,1.09155e-05,273.05,895.096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,895.096,273.05 +Apps_MASSVEC3DPA,Base_HIP,direct_64,339840, PASSED ,7.26342e-06,410.34,1345.15,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_64,1345.15,410.34 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,339840, PASSED ,1.28771e-05,231.455,758.743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,758.743,231.455 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,339840, PASSED 
,7.32402e-06,406.945,1334.02,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,1334.02,406.945 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,339840, PASSED ,9.75826e-06,305.431,1001.24,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,1001.24,305.431 +Apps_MASSVEC3DPA,Base_Seq,default,42624, PASSED ,0.00011074,3.37636,11.0659,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,10.928550000000001,3.3353599999999997 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,42624, PASSED ,8.65344e-06,43.2082,141.613,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,322.54150000000004,98.3986 +Apps_MASSVEC3DPA,Base_HIP,direct_64,42624, PASSED ,4.45024e-06,84.0179,275.365,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-direct_64,603.1505,184.00495 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,42624, PASSED ,1.08813e-05,34.3618,112.619,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,266.3845,81.2664 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,42624, PASSED ,4.49202e-06,83.2365,272.804,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,600.612,183.23025 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,42624, PASSED 
,7.92064e-06,47.2058,154.715,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,364.3965,111.1669 +Apps_MASSVEC3DPA,Base_Seq,default,42477888, PASSED ,0.112431,3.3134,10.8621,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,10.8767,3.31785 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,42477888, PASSED ,0.000479021,777.689,2549.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2556.4,779.81 +Apps_MASSVEC3DPA,Base_HIP,direct_64,42477888, PASSED ,0.000376279,990.035,3245.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-direct_64,3245.57,990.035 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,42477888, PASSED ,0.000753065,494.684,1621.69,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1648.86,502.972 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,42477888, PASSED ,0.000383214,972.117,3186.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3186.83,972.117 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,42477888, PASSED ,0.000460465,809.028,2652.19,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2653.99,809.578 +Apps_MASSVEC3DPA,Base_Seq,default,5437248, PASSED 
,0.0143904,3.31363,10.8628,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,10.8684,3.31531 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,5437248, PASSED ,6.12509e-05,778.511,2552.14,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,2519.05,768.417 +Apps_MASSVEC3DPA,Base_HIP,direct_64,5437248, PASSED ,4.58848e-05,1039.22,3406.81,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_64,3327.49,1015.03 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,5437248, PASSED ,8.75493e-05,544.659,1785.52,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1785.52,544.659 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,5437248, PASSED ,4.585e-05,1040.01,3409.39,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,3286.56,1002.54 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,5437248, PASSED ,5.92889e-05,804.273,2636.6,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,2605.2,794.696 +Apps_MASSVEC3DPA,Base_Seq,default,679680, PASSED ,0.00179864,3.31409,10.8642,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,10.8642,3.31409 +Apps_MASSVEC3DPA,Base_HIP,runtime_block_stride_loop_64,679680, PASSED 
,1.67109e-05,356.704,1169.34,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-runtime_block_stride_loop_64,1169.34,356.704 +Apps_MASSVEC3DPA,Base_HIP,direct_64,679680, PASSED ,1.18949e-05,501.128,1642.79,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_64,1642.79,501.128 +Apps_MASSVEC3DPA,RAJA_HIP,runtime_block_stride_loop_64,679680, PASSED ,1.68273e-05,354.237,1161.26,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-runtime_block_stride_loop_64,1161.26,354.237 +Apps_MASSVEC3DPA,RAJA_HIP,direct_64,679680, PASSED ,1.19329e-05,499.533,1637.56,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_64,1637.56,499.533 +Apps_MASSVEC3DPA,RAJA_HIP,cached_block_stride_loop_64,679680, PASSED ,1.32735e-05,449.08,1472.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/MASSVEC3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-cached_block_stride_loop_64,1472.17,449.08 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2744, PASSED ,1.76963e-05,5.1525,1.39555,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,1.36726,4.83581 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2744, PASSED ,2.30361e-06,39.5814,10.7206,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,41.7565,147.687 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2744, PASSED 
,2.42171e-06,37.6512,10.1978,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,42.2464,149.419 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,4096000, PASSED ,0.0279455,4.40936,1.31914,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,1.33076,4.43953 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,4096000, PASSED ,0.000167822,734.242,219.661,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,219.661,734.242 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,4096000, PASSED ,0.000167407,736.062,220.206,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,220.206,736.062 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,493039, PASSED ,0.00333371,4.49236,1.33105,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,1.33156,4.49236 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,493039, PASSED ,2.36951e-05,632.039,187.268,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,187.268,632.039 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,493039, PASSED ,2.3417e-05,639.545,189.492,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,189.492,639.545 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,6028568, PASSED 
,0.0408225,4.43761,1.3291,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,1.33076,4.43953 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,6028568, PASSED ,0.000243082,745.24,223.205,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,223.205,745.24 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,6028568, PASSED ,0.000242865,745.905,223.404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,223.404,745.905 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,54872, PASSED ,0.000363388,4.68254,1.35901,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,1.35901,4.68254 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,54872, PASSED ,5.00423e-06,340.028,98.6861,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,98.6861,340.028 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,54872, PASSED ,4.51163e-06,377.154,109.461,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,109.461,377.154 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,8242408, PASSED ,0.0557438,4.43953,1.33076,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,1.3291,4.43761 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,8242408, PASSED 
,0.000326239,758.572,227.384,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,227.384,758.572 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,8242408, PASSED ,0.000325702,759.823,227.759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,227.413,757.981 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,1000000, PASSED ,0.006759,4.47608,1.33156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,1.33143,4.47608 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,1000000, PASSED ,4.37428e-05,691.63,205.748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,205.748,691.63 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,1000000, PASSED ,4.3776e-05,691.105,205.592,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,205.592,691.105 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,12167000, PASSED ,0.0821564,4.4425,1.33286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,1.32993,4.43857 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,12167000, PASSED ,0.000480409,759.727,227.937,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,227.6605,759.1495 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,12167000, PASSED 
,0.000481516,757.981,227.413,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,227.586,758.902 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,117649, PASSED ,0.000785798,4.60138,1.34747,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,1.35069,4.60138 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,117649, PASSED ,7.89024e-06,458.256,134.196,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,134.196,458.256 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,117649, PASSED ,7.65984e-06,472.04,138.233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,138.233,472.04 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,12167, PASSED ,8.00891e-05,4.83581,1.36726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,1.363135,4.759175000000001 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,12167, PASSED ,2.62242e-06,147.687,41.7565,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,70.2213,243.85750000000002 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,12167, PASSED ,2.59201e-06,149.419,42.2464,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,75.8537,263.2865 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,16194277, PASSED 
,0.110612,4.38922,1.31766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,1.33076,4.43953 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,16194277, PASSED ,0.000624651,777.233,233.328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,227.937,759.727 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,16194277, PASSED ,0.000625743,775.878,232.921,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,227.759,759.823 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,2048383, PASSED ,0.0138464,4.46134,1.33143,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,1.33105,4.46134 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,2048383, PASSED ,8.72264e-05,708.195,211.352,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,211.352,708.195 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,2048383, PASSED ,8.65385e-05,713.825,213.032,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,213.032,713.825 +Apps_NODAL_ACCUMULATION_3D,Base_Seq,default,238328, PASSED ,0.00158805,4.58258,1.35069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,1.34747,4.58258 +Apps_NODAL_ACCUMULATION_3D,Base_HIP,block_256,238328, PASSED 
,1.24791e-05,583.165,171.884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,171.884,583.165 +Apps_NODAL_ACCUMULATION_3D,RAJA_HIP,block_256,238328, PASSED ,1.20186e-05,605.51,178.47,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/NODAL_ACCUMULATION_3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,178.47,605.51 +Apps_VOL3D,Base_Seq,default,1331, PASSED ,1.29701e-05,7.06277,16.0597,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,16.0597,6.82946 +Apps_VOL3D,Base_HIP,block_256,1331, PASSED ,2.85652e-06,32.0687,72.9195,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,310.767,133.227 +Apps_VOL3D,RAJA_HIP,block_256,1331, PASSED ,2.84803e-06,32.1643,73.1369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,303.199,129.982 +Apps_VOL3D,Base_Seq,default,2985984, PASSED ,0.0153918,6.22355,14.9582,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,15.2428,6.33519 +Apps_VOL3D,Base_HIP,block_256,2985984, PASSED ,7.77983e-05,1231.28,2959.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,2959.36,1231.28 +Apps_VOL3D,RAJA_HIP,block_256,2985984, PASSED ,7.82093e-05,1224.81,2943.81,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2943.81,1224.81 +Apps_VOL3D,Base_Seq,default,343000, PASSED 
,0.00174691,6.79477,16.244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,16.1981,6.79477 +Apps_VOL3D,Base_HIP,block_256,343000, PASSED ,9.58489e-06,1238.39,2960.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,2814.67,1174.76 +Apps_VOL3D,RAJA_HIP,block_256,343000, PASSED ,9.61098e-06,1235.03,2952.54,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2794.85,1166.49 +Apps_VOL3D,Base_Seq,default,4410944, PASSED ,0.0225525,6.219,14.9566,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,14.9584,6.22355 +Apps_VOL3D,Base_HIP,block_256,4410944, PASSED ,0.000115172,1217.78,2928.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,2985.54,1240.84 +Apps_VOL3D,RAJA_HIP,block_256,4410944, PASSED ,0.000115982,1209.27,2908.28,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2949.74,1225.97 +Apps_VOL3D,Base_Seq,default,35937, PASSED ,0.000213364,6.82946,16.1433,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,16.1433,6.82946 +Apps_VOL3D,Base_HIP,block_256,35937, PASSED ,3.81023e-06,382.434,903.99,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,903.99,382.434 +Apps_VOL3D,RAJA_HIP,block_256,35937, PASSED 
,3.07513e-06,473.854,1120.09,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,1120.09,473.854 +Apps_VOL3D,Base_Seq,default,6028568, PASSED ,0.0300666,6.33519,15.2428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,14.9582,6.219 +Apps_VOL3D,Base_HIP,block_256,6028568, PASSED ,0.000153507,1240.84,2985.54,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,2959.36,1231.28 +Apps_VOL3D,RAJA_HIP,block_256,6028568, PASSED ,0.00015537,1225.97,2949.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2943.81,1224.81 +Apps_VOL3D,Base_Seq,default,704969, PASSED ,0.00354642,6.66757,15.9752,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,15.9752,6.66757 +Apps_VOL3D,Base_HIP,block_256,704969, PASSED ,2.01284e-05,1174.76,2814.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,2959.36,1231.28 +Apps_VOL3D,RAJA_HIP,block_256,704969, PASSED ,2.02711e-05,1166.49,2794.85,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2943.81,1224.81 +Apps_VOL3D,Base_Seq,default,8869743, PASSED ,0.0447857,6.21392,14.9584,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,14.9575,6.21646 +Apps_VOL3D,Base_HIP,block_256,8869743, PASSED 
,0.000204717,1359.41,3272.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,2957.14,1229.31 +Apps_VOL3D,RAJA_HIP,block_256,8869743, PASSED ,0.000203806,1365.48,3287.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2929.01,1217.62 +Apps_VOL3D,Base_Seq,default,79507, PASSED ,0.000441426,6.81901,16.1981,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,16.1981,6.81901 +Apps_VOL3D,Base_HIP,block_256,79507, PASSED ,4.51784e-06,666.267,1582.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,1582.67,666.267 +Apps_VOL3D,RAJA_HIP,block_256,79507, PASSED ,3.94823e-06,762.389,1811.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,1811.0,762.389 +Apps_VOL3D,Base_Seq,default,8000, PASSED ,6.04437e-05,6.44564,15.0352,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,16.1015,6.824235 +Apps_VOL3D,Base_HIP,block_256,8000, PASSED ,2.92433e-06,133.227,310.767,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,607.3785,257.83050000000003 +Apps_VOL3D,RAJA_HIP,block_256,8000, PASSED ,2.99732e-06,129.982,303.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,711.6445,301.918 +Apps_VOL3D,Base_Seq,default,12008989, PASSED 
,0.0613183,6.11479,14.7248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,14.9584,6.21392 +Apps_VOL3D,Base_HIP,block_256,12008989, PASSED ,0.000380677,984.951,2371.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,2985.54,1240.84 +Apps_VOL3D,RAJA_HIP,block_256,12008989, PASSED ,0.000368261,1018.16,2451.8,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2949.74,1225.97 +Apps_VOL3D,Base_Seq,default,1442897, PASSED ,0.00728869,6.47818,15.5485,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,15.5485,6.47818 +Apps_VOL3D,Base_HIP,block_256,1442897, PASSED ,3.48778e-05,1353.8,3249.29,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,2959.36,1231.28 +Apps_VOL3D,RAJA_HIP,block_256,1442897, PASSED ,3.4181e-05,1381.39,3315.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2943.81,1224.81 +Apps_VOL3D,Base_Seq,default,166375, PASSED ,0.000874319,6.84974,16.3297,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,16.1981,6.81901 +Apps_VOL3D,Base_HIP,block_256,166375, PASSED ,5.87645e-06,1019.13,2429.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,2429.59,1019.13 +Apps_VOL3D,RAJA_HIP,block_256,166375, PASSED 
,5.68725e-06,1053.03,2510.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/VOL3D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2510.42,1053.03 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_DIFFUSION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_DIFFUSION3DPA.csv new file mode 100644 index 0000000..7057816 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_DIFFUSION3DPA.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +783,38.2122,148.572,9.8788,9.8788,39.9095,155.076,25.5093,99.0499,6.59477,6.59477,26.6423,103.387 +3105,148.572,366.7875,9.97987,9.600495,155.076,374.767,99.0499,244.46495,6.65339,6.40363,103.387,249.784 +12339,585.003,585.003,9.2631,9.34422,594.458,594.458,389.88,389.88,6.17346,6.227,396.181,396.181 +24678,1041.98,1041.98,9.32219,9.32219,1079.58,1079.58,694.399,694.399,6.21249,6.21249,719.451,719.451 +49329,1553.62,1553.62,9.34422,9.2631,1557.96,1557.96,1035.33,1035.33,6.227,6.17346,1038.22,1038.22 +98631,2030.39,2030.39,9.18884,9.18884,2104.73,2104.73,1353.03,1353.03,6.12336,6.12336,1402.58,1402.58 +197262,2763.42,2763.42,6.63667,6.63667,2865.87,2865.87,1841.5,1841.5,4.42259,4.42259,1909.78,1909.78 +394524,3330.12,3330.12,2.54663,4.39209,3411.32,3411.32,2219.14,2219.14,1.69703,2.92682,2273.25,2273.25 +789048,3594.9,3357.58,4.36735,4.39209,3702.87,3488.83,2395.58,2237.43,2.91033,2.92682,2467.53,2324.9 +1155843,3764.48,3357.58,4.39209,4.39209,3824.22,3488.83,2508.59,2237.43,2.92682,2.92682,2548.4,2324.9 
+1578096,3357.58,3357.58,4.5304,4.5304,3488.83,3488.83,2237.43,2237.43,3.01898,3.01898,2324.9,2324.9 +2311659,3037.75,3197.665,4.67993,4.5915300000000006,3186.78,3337.8050000000003,2024.31,2130.87,3.11862,3.0597149999999997,2123.62,2224.26 +3082212,2895.18,3037.75,4.65266,4.65266,3025.93,3186.78,1929.3,2024.31,3.10045,3.10045,2016.42,2123.62 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_EDGE3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_EDGE3D.csv new file mode 100644 index 0000000..aa49c32 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_EDGE3D.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +1331,1151.55,4989.71,8.36483,8.36483,1566.85,6813.73,2.75942,11.6555,0.0200444,0.0195325,3.75459,15.9162 +8000,4989.71,11558.605,8.36188,8.367365,6813.73,15246.015,11.6555,26.7207,0.0195325,0.019413,15.9162,35.24865 +35937,18127.5,18127.5,8.3699,8.3699,23678.3,23678.3,41.7859,41.7859,0.0192935,0.0192935,54.5811,54.5811 +79507,21801.6,21801.6,8.38141,8.37836,26113.1,25705.7,50.0086,50.0086,0.0192253,0.0192253,59.8984,58.752 +166375,24884.0,24884.0,8.37836,8.37836,25705.7,26113.1,56.8739,56.8739,0.0191493,0.0191493,58.752,59.8984 +343000,27771.5,26898.6,8.3848,8.37836,28947.6,27834.6,63.2963,61.1716,0.0191105,0.0191105,65.9768,63.2589 +704969,26898.6,27771.5,8.37346,8.3743,27834.6,27864.9,61.1716,63.2963,0.0190425,0.0190425,63.3001,63.3001 +1442897,27886.6,27886.6,8.37162,8.3743,27864.9,28206.4,63.3082,63.3082,0.0190052,0.0190052,63.2589,63.9446 
+2985984,28106.0,28106.0,8.3743,8.3743,28206.4,28206.4,63.717,63.717,0.0189848,0.0189935,63.9446,63.9446 +4410944,28217.0,28217.0,8.38338,8.37918,28655.4,28655.4,63.9287,63.9287,0.0189935,0.0189848,64.9219,64.9219 +6028568,28558.1,28558.1,8.38302,8.38257,28757.0,28757.0,64.6727,64.6727,0.0189842,0.0189842,65.1231,65.1231 +8869743,28733.0,28586.55,8.37918,8.382795,28945.3,28847.5,65.0368,64.71015,0.0189662,0.0189758,65.5175,65.3008 +12008989,28615.0,28615.0,8.38257,8.38257,28938.0,28938.0,64.7476,64.7476,0.0189674,0.0189674,65.4785,65.4785 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_ENERGY.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_ENERGY.csv new file mode 100644 index 0000000..f4071c7 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_ENERGY.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +834,3.97689,15.6587,11.0692,11.0692,3.83117,14.9557,14.5457,57.2725,40.4861,40.4861,14.0127,54.7015 +3334,15.6587,36.35185,11.3416,10.8103,14.9557,38.05555,57.2725,132.95875,41.4825,39.53915,54.7015,139.19025 +13334,57.045,57.045,10.4485,10.766,61.1554,61.1554,208.645,208.645,38.216,39.3772,223.679,223.679 +26667,113.134,113.134,10.5514,10.766,120.248,120.248,413.794,413.794,38.5922,39.3772,439.815,439.815 +53334,234.803,234.803,10.766,10.766,234.885,234.885,858.804,858.804,39.3772,39.3772,859.106,859.106 +106667,417.176,417.176,10.9986,10.766,417.816,417.816,1525.85,1525.85,40.2279,39.3772,1528.19,1528.19 
+213334,606.428,606.428,10.9041,10.766,619.841,619.841,2218.04,2218.04,39.8824,39.3772,2267.1,2267.1 +426667,743.356,743.356,9.41277,9.41277,750.174,750.174,2718.87,2718.87,34.4278,34.4278,2743.81,2743.81 +853334,776.438,776.438,7.29659,7.29659,781.695,781.695,2839.87,2839.87,26.6877,26.6877,2859.1,2859.1 +1250000,833.718,833.718,7.22338,7.2517,833.018,833.018,3049.37,3049.37,26.4199,26.5235,3046.81,3046.81 +1706667,873.173,873.173,7.2517,7.23801,867.768,867.768,3193.68,3193.68,26.5235,26.4735,3173.91,3173.91 +2500000,910.749,891.961,7.23801,7.230695,910.152,888.96,3331.12,3262.3999999999996,26.4735,26.4467,3328.94,3251.425 +3333334,923.776,910.749,7.20124,7.23801,925.493,910.152,3378.76,3331.12,26.339,26.4735,3385.04,3328.94 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_FEMSWEEP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_FEMSWEEP.csv new file mode 100644 index 0000000..6995d41 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_FEMSWEEP.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +31104,228.557,372.233,3.01734,3.16205,242.203,408.902,41.0451,68.6976,0.541864,0.592812,43.4957,75.465 +73728,372.233,456.2925,3.32161,3.089695,408.902,499.12149999999997,68.6976,85.0008,0.613022,0.567338,75.465,92.9765 +144000,540.352,540.352,3.16205,3.01734,589.341,589.341,101.304,101.304,0.592812,0.541864,110.488,110.488 +248832,739.04,739.04,2.75328,2.75328,780.256,780.256,139.974,139.974,0.521471,0.521471,147.78,147.78 
+395136,902.329,902.329,2.37951,2.37951,952.505,952.505,172.13,172.13,0.453919,0.453919,181.701,181.701 +839808,1065.19,986.771,2.32824,2.32824,1151.79,1003.73,205.115,191.136,0.448329,0.448329,221.79,194.421 +1152000,1083.01,1065.19,2.17561,2.26231,1141.5,1141.5,209.224,205.115,0.420301,0.438205,220.524,220.524 +1533312,986.771,1065.19,2.26231,2.22341,1003.73,1141.5,191.136,206.848,0.438205,0.432411,194.421,220.524 +2530944,1106.9,1061.91,2.22341,2.22007,1170.72,1072.33,215.271,206.848,0.432411,0.432411,227.684,209.161 +3161088,1061.91,1024.31,2.21399,2.22007,1066.55,1066.55,206.848,199.795,0.431259,0.432411,207.751,207.751 +3888000,1024.31,1043.1100000000001,2.22007,2.2170300000000003,1072.33,1069.44,199.795,203.32150000000001,0.433031,0.43183499999999997,209.161,208.45600000000002 +4718592,1010.91,1024.31,2.10748,2.21399,1043.83,1066.55,197.416,199.795,0.411559,0.431259,203.844,207.751 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_INTSC_HEXRECT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_INTSC_HEXRECT.csv new file mode 100644 index 0000000..c1c6621 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_INTSC_HEXRECT.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +2744,39.8433,156.211,4.15467,4.26245,38.6568,151.303,0.499688,1.93552,0.0521051,0.0528136,0.484808,1.87471 +10648,156.211,338.07,4.26245,4.290335000000001,151.303,338.2415,1.93552,4.16639,0.0528136,0.0529727,1.87471,4.16829 +39304,519.929,519.929,4.31822,4.31311,525.18,525.18,6.39726,6.39726,0.0531318,0.0528441,6.46187,6.46187 
+74088,558.895,558.895,4.34974,4.31822,558.391,558.391,6.86053,6.86053,0.0533937,0.0530326,6.85435,6.85435 +140608,711.076,711.076,4.31311,4.32856,706.757,706.757,8.71209,8.71209,0.0528441,0.0530326,8.65917,8.65917 +287496,845.661,845.661,4.33569,4.33569,838.699,838.699,10.3438,10.3438,0.0530326,0.0530326,10.2587,10.2587 +551368,855.931,855.931,4.32856,4.33569,855.681,855.681,10.457,10.457,0.0528825,0.0530326,10.454,10.454 +1124864,902.675,902.675,4.34562,4.34181,903.073,903.073,11.0168,11.0168,0.0530364,0.0530326,11.0216,11.0216 +2197000,923.259,923.259,4.35263,4.34214,905.491,905.491,11.2594,11.2594,0.0530816,0.0529303,11.0427,11.0427 +3241792,931.332,923.259,4.34181,4.34214,929.002,922.552,11.3537,11.2594,0.0529303,0.0529303,11.3253,11.2406 +4410944,930.082,930.082,4.34214,4.34181,929.419,929.002,11.3355,11.3355,0.0529206,0.0529206,11.3275,11.3253 +6434856,921.93,930.707,4.31109,4.336895,922.552,929.2104999999999,11.233,11.3446,0.0525273,0.05284585,11.2406,11.3264 +8741816,932.657,930.082,4.33198,4.33198,931.096,929.419,11.3614,11.3355,0.0527711,0.0527711,11.3424,11.3275 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASS3DEA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASS3DEA.csv new file mode 100644 index 0000000..d0b8417 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASS3DEA.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-compile_time_block_stride_loop_64 (raw),Base_HIP-compile_time_block_stride_loop_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-cached_block_stride_loop_64 (raw),RAJA_HIP-cached_block_stride_loop_64 (smoothed),RAJA_HIP-compile_time_block_stride_loop_64 (raw),RAJA_HIP-compile_time_block_stride_loop_64 (smoothed),Base_HIP-compile_time_block_stride_loop_64 (raw B/W),Base_HIP-compile_time_block_stride_loop_64 (smoothed B/W),Base_Seq-default (raw 
B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-cached_block_stride_loop_64 (raw B/W),RAJA_HIP-cached_block_stride_loop_64 (smoothed B/W),RAJA_HIP-compile_time_block_stride_loop_64 (raw B/W),RAJA_HIP-compile_time_block_stride_loop_64 (smoothed B/W) +389120,12.7729,24.697,0.0806808,0.0806822,11.1491,21.9424,6.64186,12.4963,14.0107,27.0896,0.0884992,0.0884992,12.2295,24.0681,7.28549,13.707 +778240,24.697,34.77975,0.0806846,0.08068149999999999,21.9424,31.230999999999998,12.4963,17.2856,27.0896,38.14885,0.0885011,0.0884983,24.0681,34.256299999999996,13.707,18.9601 +1556480,44.8625,44.8625,0.0806822,0.0806808,40.5196,40.5196,22.0749,22.0749,49.2081,49.2081,0.0884974,0.0884974,44.4445,44.4445,24.2132,24.2132 +3108864,80.9353,80.9353,0.0803397,0.0803397,73.7694,73.7694,35.0276,35.0276,88.7745,88.7745,0.0881212,0.0881212,80.9145,80.9145,38.4203,38.4203 +6213632,161.626,161.626,0.080184,0.0803397,132.156,132.156,36.5386,36.5386,177.28,177.28,0.0879501,0.0881212,144.956,144.956,40.0775,40.0775 +12423168,182.708,161.626,0.0801583,0.0803397,168.003,168.003,37.1484,37.1484,200.404,177.28,0.0879218,0.0881212,184.274,184.274,40.7463,40.7463 +18198528,193.453,170.032,0.0803496,0.0803496,230.064,177.172,40.8201,38.7535,212.19,186.5,0.0881316,0.0881316,252.347,194.332,44.7736,42.5068 +24842240,149.777,182.708,0.0806487,0.0804058,177.172,214.176,38.7535,38.9138,164.284,200.404,0.0884596,0.0881932,194.332,234.919,42.5068,42.6827 +36392960,170.032,185.948,0.0804602,0.0804602,224.417,224.417,39.5594,39.2686,186.5,203.957,0.0882529,0.0882529,246.152,246.152,43.3908,43.0718 +48521216,185.948,185.948,0.0804058,0.0804602,214.176,224.417,38.9138,39.2686,203.957,203.957,0.0881932,0.0882529,234.919,246.152,42.6827,43.0718 +60649472,188.417,187.1825,0.0805517,0.080433,256.763,235.2885,39.2686,39.414,206.666,205.3115,0.0883532,0.08822305,281.63,258.0765,43.0718,43.231300000000005 
+72781824,200.261,188.417,0.0802808,0.0804058,246.16,246.16,41.6593,39.2686,219.656,206.666,0.0880561,0.0881932,270.001,270.001,45.694,43.0718 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv new file mode 100644 index 0000000..e13b5fd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASS3DPA_ATOMIC.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +1331,71.1765,281.662,10.3068,10.3068,69.5852,275.031,34.9485,134.669,5.06074,4.9594,34.1672,131.499 +4913,281.662,567.1229999999999,10.3726,10.1734,275.031,558.643,134.669,267.875,4.9594,4.836309999999999,131.499,263.8605 +19683,852.584,852.584,10.019,10.1523,842.255,842.255,401.081,401.081,4.71322,4.734,396.222,396.222 +35937,1272.33,1272.33,10.04,10.1074,1252.2,1252.2,595.706,595.706,4.70075,4.71322,586.281,586.281 +68921,1778.38,1778.38,10.1523,10.04,1772.01,1772.01,829.253,829.253,4.734,4.70075,826.284,826.284 +132651,2307.89,2307.89,10.1074,10.04,2315.66,2315.66,1072.69,1072.69,4.69783,4.69783,1076.3,1076.3 +250047,2460.23,2460.23,9.9999,9.9999,2490.06,2467.91,1140.66,1140.66,4.63633,4.63633,1154.49,1139.76 +531441,2515.74,2460.23,8.95839,9.25416,2477.88,2467.91,1163.69,1140.66,4.14383,4.27094,1146.18,1139.76 +1030301,2486.55,2460.23,9.23179,9.23179,2467.91,2467.91,1148.36,1140.66,4.26351,4.26351,1139.76,1139.76 +1442897,2392.52,2392.52,9.25416,9.23179,2445.07,2445.07,1104.19,1104.19,4.27094,4.26351,1128.44,1128.44 
+2048383,2367.11,2367.11,9.10268,9.25416,2372.38,2372.38,1091.77,1091.77,4.19839,4.26945,1094.2,1094.2 +2924207,2242.11,2304.61,9.26198,9.25807,2212.31,2292.3450000000003,1033.54,1062.655,4.26945,4.270195,1019.8,1057.0 +3869893,2169.68,2242.11,9.30478,9.26198,2163.22,2212.31,999.747,1033.54,4.28746,4.26945,996.77,1019.8 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASSVEC3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASSVEC3DPA.csv new file mode 100644 index 0000000..d0f6ae3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_MASSVEC3DPA.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-direct_64 (raw),Base_HIP-direct_64 (smoothed),Base_HIP-runtime_block_stride_loop_64 (raw),Base_HIP-runtime_block_stride_loop_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-cached_block_stride_loop_64 (raw),RAJA_HIP-cached_block_stride_loop_64 (smoothed),RAJA_HIP-direct_64 (raw),RAJA_HIP-direct_64 (smoothed),RAJA_HIP-runtime_block_stride_loop_64 (raw),RAJA_HIP-runtime_block_stride_loop_64 (smoothed),Base_HIP-direct_64 (raw B/W),Base_HIP-direct_64 (smoothed B/W),Base_HIP-runtime_block_stride_loop_64 (raw B/W),Base_HIP-runtime_block_stride_loop_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-cached_block_stride_loop_64 (raw B/W),RAJA_HIP-cached_block_stride_loop_64 (smoothed B/W),RAJA_HIP-direct_64 (raw B/W),RAJA_HIP-direct_64 (smoothed B/W),RAJA_HIP-runtime_block_stride_loop_64 (raw B/W),RAJA_HIP-runtime_block_stride_loop_64 (smoothed B/W) +10752,70.7524,275.365,35.9215,141.613,10.98,10.98,39.3421,154.715,70.3182,272.804,28.5681,112.619,21.6029,84.0179,10.9679,43.2082,3.35254,3.35254,12.0124,47.2058,21.4703,83.2365,8.72273,34.3618 
+42624,275.365,603.1505,141.613,322.54150000000004,11.0659,10.928550000000001,154.715,364.3965,272.804,600.612,112.619,266.3845,84.0179,184.00495,43.2082,98.3986,3.37636,3.3353599999999997,47.2058,111.1669,83.2365,183.23025,34.3618,81.2664 +169920,930.936,930.936,503.47,503.47,10.8771,10.8771,574.078,574.078,928.42,928.42,420.15,420.15,283.992,283.992,153.589,153.589,3.31818,3.31818,175.128,175.128,283.224,283.224,128.171,128.171 +339840,1345.15,1345.15,895.096,895.096,10.7861,10.8771,1001.24,1001.24,1334.02,1334.02,758.743,758.743,410.34,410.34,273.05,273.05,3.2903,3.31818,305.431,305.431,406.945,406.945,231.455,231.455 +679680,1642.79,1642.79,1169.34,1169.34,10.8642,10.8642,1472.17,1472.17,1637.56,1637.56,1161.26,1161.26,501.128,501.128,356.704,356.704,3.31409,3.31409,449.08,449.08,499.533,499.533,354.237,354.237 +1359360,2627.36,2627.36,2028.33,2028.33,10.8933,10.8628,2098.42,2098.42,2608.14,2608.14,1511.95,1511.95,801.461,801.461,618.729,618.729,3.32293,3.31363,640.111,640.111,795.597,795.597,461.21,461.21 +2718720,3126.86,3126.86,2373.42,2373.42,10.852,10.8642,2484.4,2484.4,3109.17,3109.17,1722.19,1722.19,953.827,953.827,723.994,723.994,3.31033,3.31409,757.849,757.849,948.432,948.432,525.343,525.343 +5437248,3406.81,3327.49,2552.14,2519.05,10.8628,10.8684,2636.6,2605.2,3409.39,3286.56,1785.52,1785.52,1039.22,1015.03,778.511,768.417,3.31363,3.31531,804.273,794.696,1040.01,1002.54,544.659,544.659 +10874496,3327.49,3327.49,2519.05,2552.14,10.8684,10.8684,2605.2,2636.6,3355.57,3286.56,1844.39,1844.39,1015.03,1015.03,768.417,778.511,3.31531,3.31531,794.696,804.273,1023.59,1002.54,562.617,562.617 +15929280,3345.94,3327.49,2599.36,2556.4,10.8874,10.8767,2711.75,2653.99,3286.56,3286.56,1850.67,1844.39,1020.65,1015.03,792.915,779.81,3.32111,3.31785,827.198,809.578,1002.54,1002.54,564.531,562.617 
+21748800,3308.95,3308.95,2635.87,2556.4,10.8806,10.8767,2751.43,2653.99,3268.2,3268.2,1893.45,1844.39,1009.37,1009.37,804.051,779.81,3.31904,3.31785,839.303,809.578,996.938,996.938,577.583,562.617 +31858560,3220.67,3277.26,2556.4,2577.88,10.8767,10.87865,2653.99,2682.87,3180.43,3227.515,1648.86,1749.7649999999999,982.439,999.7025,779.81,786.3625,3.31785,3.318445,809.578,818.3879999999999,970.163,984.5274999999999,502.972,533.7515 +42477888,3245.57,3245.57,2549.45,2556.4,10.8621,10.8767,2652.19,2653.99,3186.83,3186.83,1621.69,1648.86,990.035,990.035,777.689,779.81,3.3134,3.31785,809.028,809.578,972.117,972.117,494.684,502.972 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv new file mode 100644 index 0000000..a8e0354 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_NODAL_ACCUMULATION_3D.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +2744,10.7206,41.7565,1.39555,1.36726,10.1978,42.2464,39.5814,147.687,5.1525,4.83581,37.6512,149.419 +12167,41.7565,70.2213,1.36726,1.363135,42.2464,75.8537,147.687,243.85750000000002,4.83581,4.759175000000001,149.419,263.2865 +54872,98.6861,98.6861,1.35901,1.35901,109.461,109.461,340.028,340.028,4.68254,4.68254,377.154,377.154 +117649,134.196,134.196,1.34747,1.35069,138.233,138.233,458.256,458.256,4.60138,4.60138,472.04,472.04 +238328,171.884,171.884,1.35069,1.34747,178.47,178.47,583.165,583.165,4.58258,4.58258,605.51,605.51 
+493039,187.268,187.268,1.33105,1.33156,189.492,189.492,632.039,632.039,4.49236,4.49236,639.545,639.545 +1000000,205.748,205.748,1.33156,1.33143,205.592,205.592,691.63,691.63,4.47608,4.47608,691.105,691.105 +2048383,211.352,211.352,1.33143,1.33105,213.032,213.032,708.195,708.195,4.46134,4.46134,713.825,713.825 +4096000,219.661,219.661,1.31914,1.33076,220.206,220.206,734.242,734.242,4.40936,4.43953,736.062,736.062 +6028568,223.205,223.205,1.3291,1.33076,223.404,223.404,745.24,745.24,4.43761,4.43953,745.905,745.905 +8242408,227.384,227.384,1.33076,1.3291,227.759,227.413,758.572,758.572,4.43953,4.43761,759.823,757.981 +12167000,227.937,227.6605,1.33286,1.32993,227.413,227.586,759.727,759.1495,4.4425,4.43857,757.981,758.902 +16194277,233.328,227.937,1.31766,1.33076,232.921,227.759,777.233,759.727,4.38922,4.43953,775.878,759.823 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_VOL3D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_VOL3D.csv new file mode 100644 index 0000000..d91659f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier1-SPX/saturation-curve-data/Apps_VOL3D.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +1331,72.9195,310.767,16.0597,16.0597,73.1369,303.199,32.0687,133.227,7.06277,6.82946,32.1643,129.982 +8000,310.767,607.3785,15.0352,16.1015,303.199,711.6445,133.227,257.83050000000003,6.44564,6.824235,129.982,301.918 +35937,903.99,903.99,16.1433,16.1433,1120.09,1120.09,382.434,382.434,6.82946,6.82946,473.854,473.854 
+79507,1582.67,1582.67,16.1981,16.1981,1811.0,1811.0,666.267,666.267,6.81901,6.81901,762.389,762.389 +166375,2429.59,2429.59,16.3297,16.1981,2510.42,2510.42,1019.13,1019.13,6.84974,6.81901,1053.03,1053.03 +343000,2960.57,2814.67,16.244,16.1981,2952.54,2794.85,1238.39,1174.76,6.79477,6.79477,1235.03,1166.49 +704969,2814.67,2959.36,15.9752,15.9752,2794.85,2943.81,1174.76,1231.28,6.66757,6.66757,1166.49,1224.81 +1442897,3249.29,2959.36,15.5485,15.5485,3315.53,2943.81,1353.8,1231.28,6.47818,6.47818,1381.39,1224.81 +2985984,2959.36,2959.36,14.9582,15.2428,2943.81,2943.81,1231.28,1231.28,6.22355,6.33519,1224.81,1224.81 +4410944,2928.74,2985.54,14.9566,14.9584,2908.28,2949.74,1217.78,1240.84,6.219,6.22355,1209.27,1225.97 +6028568,2985.54,2959.36,15.2428,14.9582,2949.74,2943.81,1240.84,1231.28,6.33519,6.219,1225.97,1224.81 +8869743,3272.42,2957.14,14.9584,14.9575,3287.05,2929.01,1359.41,1229.31,6.21392,6.21646,1365.48,1217.62 +12008989,2371.83,2985.54,14.7248,14.9584,2451.8,2949.74,984.951,1240.84,6.11479,6.21392,1018.16,1225.97 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..9c7c9ea --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +702,18.8242,7.24657,18.3296 +2754,71.4457,7.73436,66.6931 +10989,157.171,7.51252,152.725 +21951,198.044,7.04361,193.521 +43902,223.049,6.57224,220.403 +87804,231.66,6.98584,233.236 +175608,236.02,5.30205,236.775 +351216,231.122,2.47933,228.273 +702459,208.59,2.15669,207.829 +1028970,204.078,2.05897,204.833 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_bandwidth_smoothed.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..29e01b3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +702,71.4457,7.51252,66.6931 +2754,114.30834999999999,7.379545,109.70904999999999 +10989,157.171,7.24657,152.725 +21951,198.044,7.04361,193.521 +43902,223.049,6.98584,220.403 +87804,231.122,6.57224,228.273 +175608,231.122,5.30205,228.273 +351216,231.122,2.47933,228.273 +702459,219.856,2.31801,218.051 +1028970,208.59,2.15669,207.829 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_flops_raw.csv new file mode 100644 index 0000000..703efd6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +702,33.9132,13.0552,33.022 +2754,129.201,13.9866,120.606 +10989,284.499,13.5986,276.451 +21951,358.542,12.7519,350.353 +43902,403.844,11.8994,399.054 +87804,419.452,12.6488,422.306 +175608,427.354,9.60028,428.722 +351216,418.491,4.4893,413.332 +702459,377.694,3.90513,376.316 +1028970,369.525,3.72818,370.892 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_flops_smoothed.csv new file mode 100644 index 0000000..f697ecc --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_CONVECTION3DPA_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +702,129.201,13.5986,120.606 +2754,206.85000000000002,13.326899999999998,198.5285 
+10989,284.499,13.0552,276.451 +21951,358.542,12.7519,350.353 +43902,403.844,12.6488,399.054 +87804,418.491,11.8994,413.332 +175608,418.491,9.60028,413.332 +351216,418.491,4.4893,413.332 +702459,398.0925,4.197215,394.82399999999996 +1028970,377.694,3.90513,376.316 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv new file mode 100644 index 0000000..2322c83 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +841,13.1301,7.12761,19.1223 +3844,61.3475,7.05094,83.5024 +15876,254.019,6.94974,265.009 +32400,384.755,6.89359,387.348 +65025,471.999,6.88855,466.722 +131044,368.256,6.90546,379.205 +264196,408.618,6.81632,398.196 +528529,431.904,6.76234,426.344 +1060900,364.821,6.76766,371.24 +1555009,348.33,6.70243,344.602 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv new file mode 100644 index 0000000..bf3f114 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +841,61.3475,7.05094,83.5024 +3844,157.68325,7.00034,174.2557 +15876,254.019,6.94974,265.009 +32400,368.256,6.90546,379.205 +65025,384.755,6.89359,387.348 +131044,408.618,6.88855,398.196 +264196,408.618,6.81632,398.196 +528529,368.256,6.76766,379.205 +1060900,386.71950000000004,6.765000000000001,384.718 +1555009,364.821,6.76234,371.24 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_flops_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_flops_raw.csv new file mode 100644 index 0000000..48b2a23 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +841,15.152,8.22518,22.0669 +3844,72.5329,8.33653,98.7272 +15876,303.619,8.30676,316.755 +32400,461.341,8.26578,464.451 +65025,567.185,8.27772,560.843 +131044,443.204,8.31087,456.381 +264196,492.316,8.21252,479.759 +528529,520.767,8.15367,514.063 +1060900,440.119,8.16448,447.863 +1555009,420.319,8.08762,415.82 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv new file mode 100644 index 0000000..6797883 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +841,72.5329,8.30676,98.7272 +3844,188.07595,8.28627,207.7411 +15876,303.619,8.27772,316.755 +32400,443.204,8.30676,456.381 +65025,461.341,8.27772,464.451 +131044,492.316,8.26578,479.759 +264196,492.316,8.21252,479.759 +528529,443.204,8.16448,456.381 +1060900,466.2175,8.159075,463.81100000000004 +1555009,440.119,8.15367,447.863 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_bandwidth_raw.csv new file mode 100644 index 0000000..71c397b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,0.0608571,0.0758293,0.10716 +64,0.0604735,0.0762729,0.10547 +216,0.0674069,0.0766671,0.116977 
+512,0.0704105,0.0769074,0.122127 +1000,0.0716662,0.0770157,0.126111 +1728,0.071919,0.0769536,0.130787 +3375,0.0720209,0.0766019,0.133359 +6859,0.0720402,0.0766165,0.135752 +13824,0.0729852,0.0766193,0.136625 +19683,0.0734538,0.0767298,0.136874 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv new file mode 100644 index 0000000..6f13aae --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,0.0608571,0.0762729,0.10716 +64,0.064132,0.07647000000000001,0.1120685 +216,0.0674069,0.0766671,0.116977 +512,0.0704105,0.0769074,0.122127 +1000,0.0716662,0.0769074,0.126111 +1728,0.071919,0.0769074,0.130787 +3375,0.0720209,0.0766193,0.133359 +6859,0.0720402,0.0766193,0.135752 +13824,0.0725127,0.0766179,0.1361885 +19683,0.0729852,0.0766193,0.136625 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_flops_raw.csv new file mode 100644 index 0000000..4dae950 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,2.8229,3.51739,4.97069 +64,2.8051,3.53797,4.89231 +216,3.12671,3.55625,5.42606 +512,3.26604,3.5674,5.66495 +1000,3.32428,3.57242,5.84976 +1728,3.33601,3.56954,6.06665 +3375,3.34073,3.55323,6.18593 +6859,3.34163,3.5539,6.29694 +13824,3.38547,3.55404,6.33743 +19683,3.4072,3.55916,6.34898 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_flops_smoothed.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_flops_smoothed.csv new file mode 100644 index 0000000..fbe5ccf --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_INTSC_HEXHEX_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,2.8229,3.53797,4.97069 +64,2.974805,3.54711,5.198375 +216,3.12671,3.55625,5.42606 +512,3.26604,3.5674,5.66495 +1000,3.32428,3.5674,5.84976 +1728,3.33601,3.5674,6.06665 +3375,3.34073,3.55404,6.18593 +6859,3.34163,3.55404,6.29694 +13824,3.36355,3.55397,6.317185 +19683,3.38547,3.55404,6.33743 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_bandwidth_raw.csv new file mode 100644 index 0000000..7886450 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +1344,30.7808,8.69785,30.6035,22.7173 +4992,92.6304,8.70005,81.5998,78.9043 +19392,152.356,8.36339,129.02,152.498 +38784,173.714,8.38156,142.62,171.991 +77568,164.556,8.37786,136.489,159.203 +154944,164.02,8.27718,132.568,158.28 +309696,159.885,8.28278,130.12,156.138 +619392,162.557,8.21518,132.34,157.932 +1238784,165.423,8.13308,130.001,160.391 +1814592,165.165,8.13223,133.138,161.421 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_bandwidth_smoothed.csv new file mode 100644 index 0000000..b3beab3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +1344,92.6304,8.69785,81.5998,78.9043 
+4992,122.4932,8.539705000000001,105.3099,115.70115 +19392,152.356,8.38156,129.02,152.498 +38784,164.02,8.37786,132.568,158.28 +77568,164.02,8.36339,132.568,158.28 +154944,164.02,8.28278,132.568,158.28 +309696,164.02,8.27718,132.34,158.28 +619392,164.02,8.21518,132.34,158.28 +1238784,163.861,8.17413,131.23000000000002,159.1615 +1814592,165.165,8.13308,132.34,160.391 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_flops_raw.csv new file mode 100644 index 0000000..f75cb7a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +1344,21.8706,6.18006,21.7446,16.1413 +4992,66.3897,6.23547,58.4839,56.552 +19392,109.457,6.0085,92.6917,109.559 +38784,124.853,6.02404,102.505,123.614 +77568,118.295,6.02263,98.1186,114.447 +154944,117.922,5.95087,95.3096,113.795 +309696,114.955,5.9552,93.5542,112.261 +619392,116.879,5.90676,95.1529,113.554 +1238784,118.942,5.8478,93.4727,115.323 +1814592,118.756,5.84722,95.7286,116.064 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_flops_smoothed.csv new file mode 100644 index 0000000..30f2bb3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_LTIMES_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +1344,66.3897,6.18006,58.4839,56.552 +4992,87.92335,6.10205,75.5878,83.0555 +19392,109.457,6.02404,92.6917,109.559 +38784,117.922,6.02263,95.3096,113.795 +77568,117.922,6.0085,95.3096,113.795 +154944,117.922,5.9552,95.3096,113.795 +309696,117.922,5.95087,95.1529,113.795 +619392,117.922,5.90676,95.1529,113.795 
+1238784,117.8175,5.877280000000001,94.35355,114.4385 +1814592,118.756,5.8478,95.1529,115.323 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..73d26fb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +1600,17.8445,5.201,17.9589 +6336,56.3896,5.26676,55.8969 +25344,96.4673,5.19259,96.1439 +50624,138.615,5.17515,139.015 +101184,188.507,5.19191,187.797 +202368,205.471,5.2001,206.508 +404736,209.016,5.17149,210.34 +809536,206.019,5.13865,206.864 +1619008,194.333,5.11364,195.732 +2371584,193.572,5.10618,193.082 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..4469620 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +1600,56.3896,5.201,55.8969 +6336,76.42845,5.196795,76.0204 +25344,96.4673,5.19259,96.1439 +50624,138.615,5.19259,139.015 +101184,188.507,5.19191,187.797 +202368,205.471,5.17515,206.508 +404736,205.471,5.17149,206.508 +809536,205.471,5.13865,206.508 +1619008,200.176,5.126145,201.298 +2371584,194.333,5.11364,195.732 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_flops_raw.csv new file mode 100644 index 0000000..05804e3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_flops_raw.csv @@ -0,0 +1,11 @@ +Problem 
size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +1600,38.1057,11.1064,38.3501 +6336,120.87,11.2892,119.814 +25344,206.973,11.1409,206.28 +50624,297.449,11.1052,298.307 +101184,404.545,11.1421,403.019 +202368,440.966,11.1601,443.193 +404736,448.585,11.0989,451.425 +809536,442.156,11.0285,443.969 +1619008,417.077,10.9749,420.08 +2371584,415.446,10.9589,414.395 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_flops_smoothed.csv new file mode 100644 index 0000000..20d7742 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MASS3DPA_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +1600,120.87,11.1409,119.814 +6336,163.9215,11.123650000000001,163.047 +25344,206.973,11.1409,206.28 +50624,297.449,11.1421,298.307 +101184,404.545,11.1409,403.019 +202368,440.966,11.1052,443.193 +404736,440.966,11.0989,443.193 +809536,440.966,11.0285,443.193 +1619008,429.6165,11.0017,432.0245 +2371584,417.077,10.9749,420.08 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv new file mode 100644 index 0000000..6bafdb2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +64,2.3184,15.3687,5.12375 +512,15.9952,14.2524,23.3519 +3375,93.8871,12.9009,148.259 +8000,213.061,12.1691,337.173 +17576,443.39,12.2763,471.59 +35937,410.17,12.1287,415.415 +79507,431.336,10.2309,430.777 +157464,462.878,8.38297,459.122 +328509,385.364,4.66426,384.811 +493039,346.718,4.60877,347.717 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv new file mode 100644 index 0000000..677d0b2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +64,15.9952,14.2524,23.3519 +512,54.94115,13.57665,85.80545 +3375,93.8871,12.9009,148.259 +8000,213.061,12.2763,337.173 +17576,410.17,12.1691,415.415 +35937,431.336,12.1287,430.777 +79507,431.336,10.2309,430.777 +157464,410.17,8.38297,415.415 +328509,408.35,6.5236149999999995,407.794 +493039,385.364,4.66426,384.811 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_flops_raw.csv new file mode 100644 index 0000000..b1a1a0c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +64,0.658035,4.36214,1.45428 +512,5.40414,4.81533,7.88968 +3375,34.8268,4.78551,54.9958 +8000,81.3251,4.64495,128.699 +17576,172.721,4.78219,183.707 +35937,162.145,4.79459,164.218 +79507,172.724,4.09687,172.5 +157464,186.988,3.38646,185.471 +328509,156.851,1.89846,156.627 +493039,141.61,1.88236,142.018 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv new file mode 100644 index 0000000..dcc1eaf --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem 
size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +64,5.40414,4.78551,7.88968 +512,20.11547,4.71523,31.44274 +3375,34.8268,4.78219,54.9958 +8000,81.3251,4.78551,128.699 +17576,162.145,4.78219,164.218 +35937,172.721,4.64495,172.5 +79507,172.721,4.09687,172.5 +157464,162.145,3.38646,164.218 +328509,164.7875,2.64246,164.5635 +493039,156.851,1.89846,156.627 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv new file mode 100644 index 0000000..fe0fdd0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +80000,146.085,14.1788,143.168 +160000,217.801,10.9567,220.631 +320000,312.425,10.4999,316.614 +640000,374.327,10.3092,379.045 +1280000,443.779,9.50777,440.75 +2560000,466.897,9.23769,466.256 +3750000,481.583,9.13207,484.242 +5120000,473.886,9.06123,474.695 +7500000,452.468,9.01723,451.012 +10000000,449.537,8.99193,447.195 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv new file mode 100644 index 0000000..f60450d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +80000,217.801,10.9567,220.631 +160000,265.113,10.7283,268.6225 +320000,312.425,10.4999,316.614 +640000,374.327,10.3092,379.045 +1280000,443.779,9.50777,440.75 +2560000,466.897,9.23769,466.256 +3750000,466.897,9.13207,466.256 +5120000,466.897,9.06123,466.256 +7500000,463.177,9.03923,462.8535 +10000000,452.468,9.01723,451.012 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_flops_raw.csv new file mode 100644 index 0000000..7b75092 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +80000,0.0,0.0,0.0 +160000,0.0,0.0,0.0 +320000,0.0,0.0,0.0 +640000,0.0,0.0,0.0 +1280000,0.0,0.0,0.0 +2560000,0.0,0.0,0.0 +3750000,0.0,0.0,0.0 +5120000,0.0,0.0,0.0 +7500000,0.0,0.0,0.0 +10000000,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_flops_smoothed.csv new file mode 100644 index 0000000..7b75092 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_INDEXLIST_3LOOP_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +80000,0.0,0.0,0.0 +160000,0.0,0.0,0.0 +320000,0.0,0.0,0.0 +640000,0.0,0.0,0.0 +1280000,0.0,0.0,0.0 +2560000,0.0,0.0,0.0 +3750000,0.0,0.0,0.0 +5120000,0.0,0.0,0.0 +7500000,0.0,0.0,0.0 +10000000,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_bandwidth_raw.csv new file mode 100644 index 0000000..b66775e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +3120,4.67047,4.62363,4.78196,4.34494,4.28538 +12495,17.7215,17.6489,4.64252,17.0075,16.6415 +49995,69.0062,69.0431,4.59966,64.7093,63.0929 
+99995,124.126,130.713,4.59197,117.075,123.133 +199995,221.566,238.614,4.58966,204.062,217.27 +399995,297.757,298.961,4.5878,282.78,288.432 +799995,407.522,408.478,4.58573,387.028,398.214 +1599995,495.21,497.876,4.57977,463.98,491.753 +3199995,457.638,497.456,4.57854,412.137,494.989 +4687495,412.268,463.435,4.57812,368.591,463.739 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_bandwidth_smoothed.csv new file mode 100644 index 0000000..0ec2fa3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +3120,17.7215,17.6489,4.64252,17.0075,16.6415 +12495,43.36385,43.346,4.621090000000001,40.8584,39.8672 +49995,69.0062,69.0431,4.59966,64.7093,63.0929 +99995,124.126,130.713,4.59197,117.075,123.133 +199995,221.566,238.614,4.58966,204.062,217.27 +399995,297.757,298.961,4.5878,282.78,288.432 +799995,407.522,408.478,4.58573,387.028,398.214 +1599995,412.268,463.435,4.57977,387.028,463.739 +3199995,434.953,480.44550000000004,4.579155,399.5825,477.746 +4687495,457.638,497.456,4.57854,412.137,491.753 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_flops_raw.csv new file mode 100644 index 0000000..a651599 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +3120,0.312429,0.309295,0.319886,0.290652,0.286668 +12495,1.18832,1.18345,0.311305,1.14044,1.1159 
+49995,4.63,4.63248,0.308616,4.3417,4.23325 +99995,8.3291,8.77114,0.308131,7.856,8.26249 +199995,14.8683,16.0123,0.307991,13.6937,14.58 +399995,19.9816,20.0624,0.307875,18.9766,19.3558 +799995,27.348,27.4121,0.307739,25.9727,26.7233 +1599995,33.2328,33.4117,0.307341,31.1369,33.0008 +3199995,30.7115,33.3836,0.30726,27.6579,33.218 +4687495,27.6668,31.1006,0.307232,24.7356,31.121 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_flops_smoothed.csv new file mode 100644 index 0000000..505d4af --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_MULTI_REDUCE_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +3120,1.18832,1.18345,0.311305,1.14044,1.1159 +12495,2.90916,2.907965,0.30996049999999997,2.74107,2.674575 +49995,4.63,4.63248,0.308616,4.3417,4.23325 +99995,8.3291,8.77114,0.308131,7.856,8.26249 +199995,14.8683,16.0123,0.307991,13.6937,14.58 +399995,19.9816,20.0624,0.307875,18.9766,19.3558 +799995,27.348,27.4121,0.307739,25.9727,26.7233 +1599995,27.6668,31.1006,0.307341,25.9727,31.121 +3199995,29.189149999999998,32.2421,0.3073005,26.8153,32.0609 +4687495,30.7115,33.3836,0.30726,27.6579,33.0008 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_bandwidth_raw.csv new file mode 100644 index 0000000..650152e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem 
size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +3125,2.43833,2.45828,9.20709,17.0284,4.52183,2.02997,2.02829,2.43362,1.76144,2.42725,1.73304 +12500,5.44607,5.49647,9.48223,18.0593,4.57919,7.82994,7.89981,6.5301,6.75435,6.43316,6.69453 +50000,7.07765,7.15708,9.41668,17.671,4.58415,27.5206,27.6263,23.0961,20.3425,22.8227,20.2458 +100000,7.31487,14.5278,9.4112,17.8173,4.58426,40.4865,53.8797,34.9564,27.6976,44.3131,35.7095 +200000,7.8085,28.7275,9.41252,17.833,4.58483,55.0749,100.061,48.5718,33.3397,85.28,68.5554 +400000,8.17193,52.5516,9.43391,17.9217,4.58753,61.9048,158.329,54.5527,38.9782,137.984,120.369 +800000,7.9639,93.6942,9.41254,17.7726,4.58485,68.097,256.172,59.208,42.077,224.522,201.431 +1600000,7.71168,173.54,9.3563,17.2186,4.57427,72.4032,364.879,63.0717,44.5954,326.557,312.237 +3200000,7.73076,258.132,9.34906,17.092,4.57258,72.468,387.62,62.2175,44.7497,354.03,353.177 +4687500,8.63973,282.678,9.34431,17.0924,4.57297,72.9963,391.914,62.4369,45.2207,365.851,368.856 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv new file mode 100644 index 0000000..337bccb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +3125,5.44607,5.49647,9.41668,17.671,4.57919,7.82994,7.89981,6.5301,6.75435,6.43316,6.69453 
+12500,6.26186,6.326775,9.41394,17.744149999999998,4.58167,17.67527,17.763055,14.8131,13.548425,14.627930000000001,13.470165 +50000,7.07765,7.15708,9.41252,17.8173,4.58415,27.5206,27.6263,23.0961,20.3425,22.8227,20.2458 +100000,7.31487,14.5278,9.41668,17.833,4.58426,40.4865,53.8797,34.9564,27.6976,44.3131,35.7095 +200000,7.8085,28.7275,9.41254,17.8173,4.58483,55.0749,100.061,48.5718,33.3397,85.28,68.5554 +400000,7.8085,52.5516,9.41252,17.8173,4.58483,61.9048,158.329,54.5527,38.9782,137.984,120.369 +800000,7.8085,93.6942,9.41252,17.7726,4.58483,68.097,256.172,59.208,42.077,224.522,201.431 +1600000,7.9639,173.54,9.3563,17.2186,4.57427,72.4032,364.879,62.2175,44.5954,326.557,312.237 +3200000,7.8473299999999995,215.836,9.35268,17.1555,4.57362,72.4356,376.2495,62.327200000000005,44.67255,340.2935,332.707 +4687500,7.73076,258.132,9.34906,17.0924,4.57297,72.468,387.62,62.4369,44.7497,354.03,353.177 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_flops_raw.csv new file mode 100644 index 0000000..3a24ce9 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +3125,0.327372,0.330051,1.23615,2.28624,0.607103,0.272545,0.272319,0.326739,0.236492,0.325884,0.232679 +12500,0.731018,0.737782,1.27278,2.42407,0.614658,1.051,1.06038,0.876525,0.906626,0.863514,0.898597 +50000,0.949965,0.960626,1.26391,2.37181,0.615287,3.69382,3.70801,3.09997,2.73038,3.06328,2.7174 +100000,0.981795,1.94991,1.26316,2.39142,0.615295,5.43406,7.23168,4.69181,3.71754,5.94766,4.79289 
+200000,1.04804,3.85576,1.26333,2.39351,0.615369,7.39206,13.43,6.51923,4.47481,11.4461,9.2014 +400000,1.09682,7.05338,1.2662,2.40541,0.615729,8.30874,21.2506,7.32195,5.23158,18.52,16.1557 +800000,1.0689,12.5754,1.26333,2.3854,0.615369,9.13983,34.3828,7.94678,5.64748,30.1348,27.0357 +1600000,1.03504,23.2921,1.25578,2.31104,0.613948,9.7178,48.9732,8.46535,5.98549,43.8298,41.9078 +3200000,1.03761,34.6459,1.25481,2.29405,0.613722,9.7265,52.0255,8.35069,6.0062,47.5171,47.4026 +4687500,1.15961,37.9404,1.25417,2.2941,0.613774,9.7974,52.6018,8.38014,6.06943,49.1038,49.507 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_flops_smoothed.csv new file mode 100644 index 0000000..653fe38 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Basic_REDUCE_STRUCT_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +3125,0.731018,0.737782,1.26391,2.37181,0.614658,1.051,1.06038,0.876525,0.906626,0.863514,0.898597 +12500,0.8404915,0.8492040000000001,1.263535,2.381615,0.6149725,2.37241,2.384195,1.9882475,1.818503,1.9633969999999998,1.8079985 +50000,0.949965,0.960626,1.26333,2.39142,0.615287,3.69382,3.70801,3.09997,2.73038,3.06328,2.7174 +100000,0.981795,1.94991,1.26391,2.39351,0.615295,5.43406,7.23168,4.69181,3.71754,5.94766,4.79289 +200000,1.04804,3.85576,1.26333,2.39142,0.615369,7.39206,13.43,6.51923,4.47481,11.4461,9.2014 +400000,1.04804,7.05338,1.26333,2.39142,0.615369,8.30874,21.2506,7.32195,5.23158,18.52,16.1557 +800000,1.04804,12.5754,1.26333,2.3854,0.615369,9.13983,34.3828,7.94678,5.64748,30.1348,27.0357 
+1600000,1.0689,23.2921,1.25578,2.31104,0.613948,9.7178,48.9732,8.35069,5.98549,43.8298,41.9078 +3200000,1.053255,28.969,1.2552949999999998,2.3025700000000002,0.613861,9.72215,50.49935,8.365415,5.995845,45.67345,44.6552 +4687500,1.03761,34.6459,1.25481,2.2941,0.613774,9.7265,52.0255,8.38014,6.0062,47.5171,47.4026 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv new file mode 100644 index 0000000..50c4096 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +42875,35.5465,34.2866,28.3649,30.9433,29.0926 +91125,52.7123,30.6163,43.3236,46.2492,44.3283 +205379,76.4868,31.4224,65.7495,68.2299,65.6235 +421875,116.949,29.4222,99.173,103.677,98.5 +884736,127.604,26.5345,139.893,142.861,133.87 +1860867,196.573,16.5543,180.069,177.742,165.402 +2744000,207.767,12.0213,194.723,189.791,177.557 +3796416,223.313,9.34983,209.559,204.866,191.745 +5639752,199.269,7.45299,192.515,187.563,180.556 +7645373,205.182,7.23912,199.822,182.713,173.613 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv new file mode 100644 index 0000000..5dd1d51 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +42875,52.7123,31.4224,43.3236,46.2492,44.3283 +91125,64.59955,31.01935,54.53655,57.23955,54.9759 +205379,76.4868,30.6163,65.7495,68.2299,65.6235 
+421875,116.949,29.4222,99.173,103.677,98.5 +884736,127.604,26.5345,139.893,142.861,133.87 +1860867,196.573,16.5543,180.069,177.742,165.402 +2744000,199.269,12.0213,192.515,187.563,177.557 +3796416,205.182,9.34983,194.723,187.563,177.557 +5639752,206.47449999999998,8.40141,197.2725,188.677,179.0565 +7645373,205.182,7.45299,199.822,187.563,180.556 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_flops_raw.csv new file mode 100644 index 0000000..b69bd9d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_flops_raw.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +42875,0.0,0.0,0.0,0.0,0.0 +91125,0.0,0.0,0.0,0.0,0.0 +205379,0.0,0.0,0.0,0.0,0.0 +421875,0.0,0.0,0.0,0.0,0.0 +884736,0.0,0.0,0.0,0.0,0.0 +1860867,0.0,0.0,0.0,0.0,0.0 +2744000,0.0,0.0,0.0,0.0,0.0 +3796416,0.0,0.0,0.0,0.0,0.0 +5639752,0.0,0.0,0.0,0.0,0.0 +7645373,0.0,0.0,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_flops_smoothed.csv new file mode 100644 index 0000000..b69bd9d --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/Comm_HALO_PACKING_FUSED_flops_smoothed.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +42875,0.0,0.0,0.0,0.0,0.0 +91125,0.0,0.0,0.0,0.0,0.0 +205379,0.0,0.0,0.0,0.0,0.0 +421875,0.0,0.0,0.0,0.0,0.0 +884736,0.0,0.0,0.0,0.0,0.0 +1860867,0.0,0.0,0.0,0.0,0.0 +2744000,0.0,0.0,0.0,0.0,0.0 +3796416,0.0,0.0,0.0,0.0,0.0 +5639752,0.0,0.0,0.0,0.0,0.0 +7645373,0.0,0.0,0.0,0.0,0.0 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_CONVECTION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_CONVECTION3DPA.csv new file mode 100644 index 0000000..4bb3fc6 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_CONVECTION3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_CONVECTION3DPA-Base_Seq-default,702.0,13.0552,7.24657 +Apps_CONVECTION3DPA-Base_HIP-block_64,21951.0,358.542,198.044 +Apps_CONVECTION3DPA-RAJA_HIP-block_64,21951.0,350.353,193.521 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_DEL_DOT_VEC_2D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_DEL_DOT_VEC_2D.csv new file mode 100644 index 0000000..9e12d5b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_DEL_DOT_VEC_2D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DEL_DOT_VEC_2D-Base_Seq-default,841.0,8.22518,7.12761 +Apps_DEL_DOT_VEC_2D-Base_HIP-block_256,32400.0,461.341,384.755 +Apps_DEL_DOT_VEC_2D-RAJA_HIP-block_256,32400.0,464.451,387.348 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_INTSC_HEXHEX.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_INTSC_HEXHEX.csv new file mode 100644 index 0000000..205e8ac --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_INTSC_HEXHEX.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_INTSC_HEXHEX-Base_Seq-default,27.0,3.51739,0.0758293 +Apps_INTSC_HEXHEX-Base_HIP-block_64,216.0,3.12671,0.0674069 +Apps_INTSC_HEXHEX-RAJA_HIP-block_64,1000.0,5.84976,0.126111 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_LTIMES.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_LTIMES.csv new file mode 100644 index 0000000..66eea6e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_LTIMES.csv @@ -0,0 +1,5 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_LTIMES-Base_Seq-default,1344.0,6.18006,8.69785 +Apps_LTIMES-Base_HIP-block_256,19392.0,109.457,152.356 +Apps_LTIMES-RAJA_HIP-kernel_256,19392.0,92.6917,129.02 +Apps_LTIMES-RAJA_HIP-launch_256,19392.0,109.559,152.498 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_MASS3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_MASS3DPA.csv new file mode 100644 index 0000000..6c9adb7 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_MASS3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MASS3DPA-Base_Seq-default,1600.0,11.1064,5.201 +Apps_MASS3DPA-Base_HIP-block_25,101184.0,404.545,188.507 +Apps_MASS3DPA-RAJA_HIP-block_25,101184.0,403.019,187.797 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_MATVEC_3D_STENCIL.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_MATVEC_3D_STENCIL.csv new file mode 100644 index 0000000..8706718 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Apps_MATVEC_3D_STENCIL.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MATVEC_3D_STENCIL-Base_Seq-default,64.0,4.36214,15.3687 +Apps_MATVEC_3D_STENCIL-Base_HIP-block_256,17576.0,172.721,443.39 +Apps_MATVEC_3D_STENCIL-RAJA_HIP-block_256,17576.0,183.707,471.59 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_INDEXLIST_3LOOP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_INDEXLIST_3LOOP.csv new file mode 100644 index 0000000..22ba238 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_INDEXLIST_3LOOP.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Basic_INDEXLIST_3LOOP-Base_Seq-default,80000.0,0.0,14.1788 +Basic_INDEXLIST_3LOOP-Base_HIP-block_256,80000.0,0.0,146.085 +Basic_INDEXLIST_3LOOP-RAJA_HIP-block_256,80000.0,0.0,143.168 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_MULTI_REDUCE.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_MULTI_REDUCE.csv new file mode 100644 index 0000000..35504b2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_MULTI_REDUCE.csv @@ -0,0 +1,6 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Basic_MULTI_REDUCE-Base_Seq-default,3120.0,0.319886,4.78196 +Basic_MULTI_REDUCE-Base_HIP-atomic_direct_256,1599995.0,33.2328,495.21 +Basic_MULTI_REDUCE-Base_HIP-atomic_occgs_256,1599995.0,33.4117,497.876 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_direct_256,799995.0,25.9727,387.028 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_occgs_256,1599995.0,33.0008,491.753 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_REDUCE_STRUCT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_REDUCE_STRUCT.csv new file mode 100644 index 0000000..df06499 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Basic_REDUCE_STRUCT.csv @@ -0,0 +1,12 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Basic_REDUCE_STRUCT-Base_Seq-default,3125.0,2.28624,17.0284 +Basic_REDUCE_STRUCT-Base_Seq-kahan,3125.0,0.607103,4.52183 +Basic_REDUCE_STRUCT-Base_Seq-cascade,3125.0,1.23615,9.20709 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_direct_256,50000.0,0.949965,7.07765 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_occgs_256,4687500.0,37.9404,282.678 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_direct_256,800000.0,9.13983,68.097 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_256,800000.0,7.94678,59.208 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_new_256,800000.0,5.64748,42.077 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_occgs_256,1600000.0,48.9732,364.879 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_256,1600000.0,43.8298,326.557 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_new_256,3200000.0,47.4026,353.177 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Comm_HALO_PACKING_FUSED.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Comm_HALO_PACKING_FUSED.csv new file mode 100644 index 0000000..6938acb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/Comm_HALO_PACKING_FUSED.csv @@ -0,0 +1,6 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Comm_HALO_PACKING_FUSED-Base_Seq-direct,42875.0,0.0,34.2866 +Comm_HALO_PACKING_FUSED-Base_HIP-direct_1024,42875.0,0.0,35.5465 +Comm_HALO_PACKING_FUSED-RAJA_HIP-direct_1024,42875.0,0.0,28.3649 +Comm_HALO_PACKING_FUSED-RAJA_HIP-funcptr_1024,42875.0,0.0,30.9433 +Comm_HALO_PACKING_FUSED-RAJA_HIP-virtfunc_1024,42875.0,0.0,29.0926 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/combined_fom.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/combined_fom.csv new file mode 100644 index 0000000..23749bf --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/FOM/combined_fom.csv @@ -0,0 +1,44 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_CONVECTION3DPA-Base_HIP-block_64,21951.0,358.542,198.044 +Apps_CONVECTION3DPA-Base_Seq-default,702.0,13.0552,7.24657 +Apps_CONVECTION3DPA-RAJA_HIP-block_64,21951.0,350.353,193.521 +Apps_DEL_DOT_VEC_2D-Base_HIP-block_256,32400.0,461.341,384.755 +Apps_DEL_DOT_VEC_2D-Base_Seq-default,841.0,8.22518,7.12761 +Apps_DEL_DOT_VEC_2D-RAJA_HIP-block_256,32400.0,464.451,387.348 +Apps_INTSC_HEXHEX-Base_HIP-block_64,216.0,3.12671,0.0674069 +Apps_INTSC_HEXHEX-Base_Seq-default,27.0,3.51739,0.0758293 +Apps_INTSC_HEXHEX-RAJA_HIP-block_64,1000.0,5.84976,0.126111 +Apps_LTIMES-Base_HIP-block_256,19392.0,109.457,152.356 +Apps_LTIMES-Base_Seq-default,1344.0,6.18006,8.69785 +Apps_LTIMES-RAJA_HIP-kernel_256,19392.0,92.6917,129.02 +Apps_LTIMES-RAJA_HIP-launch_256,19392.0,109.559,152.498 +Apps_MASS3DPA-Base_HIP-block_25,101184.0,404.545,188.507 +Apps_MASS3DPA-Base_Seq-default,1600.0,11.1064,5.201 +Apps_MASS3DPA-RAJA_HIP-block_25,101184.0,403.019,187.797 +Apps_MATVEC_3D_STENCIL-Base_HIP-block_256,17576.0,172.721,443.39 +Apps_MATVEC_3D_STENCIL-Base_Seq-default,64.0,4.36214,15.3687 +Apps_MATVEC_3D_STENCIL-RAJA_HIP-block_256,17576.0,183.707,471.59 +Basic_INDEXLIST_3LOOP-Base_HIP-block_256,80000.0,0.0,146.085 +Basic_INDEXLIST_3LOOP-Base_Seq-default,80000.0,0.0,14.1788 +Basic_INDEXLIST_3LOOP-RAJA_HIP-block_256,80000.0,0.0,143.168 +Basic_MULTI_REDUCE-Base_HIP-atomic_direct_256,1599995.0,33.2328,495.21 +Basic_MULTI_REDUCE-Base_HIP-atomic_occgs_256,1599995.0,33.4117,497.876 +Basic_MULTI_REDUCE-Base_Seq-default,3120.0,0.319886,4.78196 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_direct_256,799995.0,25.9727,387.028 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_occgs_256,1599995.0,33.0008,491.753 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_direct_256,50000.0,0.949965,7.07765 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_occgs_256,4687500.0,37.9404,282.678 +Basic_REDUCE_STRUCT-Base_Seq-cascade,3125.0,1.23615,9.20709 +Basic_REDUCE_STRUCT-Base_Seq-default,3125.0,2.28624,17.0284 
+Basic_REDUCE_STRUCT-Base_Seq-kahan,3125.0,0.607103,4.52183 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_direct_256,800000.0,9.13983,68.097 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_occgs_256,1600000.0,48.9732,364.879 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_256,800000.0,7.94678,59.208 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_new_256,800000.0,5.64748,42.077 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_256,1600000.0,43.8298,326.557 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_new_256,3200000.0,47.4026,353.177 +Comm_HALO_PACKING_FUSED-Base_HIP-direct_1024,42875.0,0.0,35.5465 +Comm_HALO_PACKING_FUSED-Base_Seq-direct,42875.0,0.0,34.2866 +Comm_HALO_PACKING_FUSED-RAJA_HIP-direct_1024,42875.0,0.0,28.3649 +Comm_HALO_PACKING_FUSED-RAJA_HIP-funcptr_1024,42875.0,0.0,30.9433 +Comm_HALO_PACKING_FUSED-RAJA_HIP-virtfunc_1024,42875.0,0.0,29.0926 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/combined_table.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/combined_table.csv new file mode 100644 index 0000000..086852e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/combined_table.csv @@ -0,0 +1,431 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning +Apps_CONVECTION3DPA,Base_Seq,default,702, PASSED ,7.33484e-06,7.24657,13.0552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,702, PASSED ,2.82362e-06,18.8242,33.9132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,702, PASSED 
,2.89982e-06,18.3296,33.022,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,702459, PASSED ,0.0245371,2.15669,3.90513,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,702459, PASSED ,0.000253699,208.59,377.694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,702459, PASSED ,0.000254628,207.829,376.316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,87804, PASSED ,0.000946896,6.98584,12.6488,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,87804, PASSED ,2.85542e-05,231.66,419.452,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,87804, PASSED ,2.83612e-05,233.236,422.306,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,1028970, PASSED ,0.0376482,2.05897,3.72818,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,1028970, PASSED 
,0.000379837,204.078,369.525,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,1028970, PASSED ,0.000378437,204.833,370.892,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,10989, PASSED ,0.000110231,7.51252,13.5986,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,10989, PASSED ,5.26884e-06,157.171,284.499,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,10989, PASSED ,5.42224e-06,152.725,276.451,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,175608, PASSED ,0.00249516,5.30205,9.60028,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,175608, PASSED ,5.60524e-05,236.02,427.354,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,175608, PASSED ,5.58736e-05,236.775,428.722,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,21951, PASSED 
,0.000234811,7.04361,12.7519,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,21951, PASSED ,8.35126e-06,198.044,358.542,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,21951, PASSED ,8.54646e-06,193.521,350.353,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,2754, PASSED ,2.6859e-05,7.73436,13.9866,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,2754, PASSED ,2.90762e-06,71.4457,129.201,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,2754, PASSED ,3.11482e-06,66.6931,120.606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,351216, PASSED ,0.0106717,2.47933,4.4893,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,351216, PASSED ,0.000114479,231.122,418.491,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,351216, PASSED 
,0.000115908,228.273,413.332,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,43902, PASSED ,0.000503263,6.57224,11.8994,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,43902, PASSED ,1.48289e-05,223.049,403.844,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,43902, PASSED ,1.50069e-05,220.403,399.054,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,841, PASSED ,5.52134e-06,7.12761,8.22518,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,841, PASSED ,2.99723e-06,13.1301,15.152,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,841, PASSED ,2.05801e-06,19.1223,22.0669,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1060900, PASSED ,0.00701681,6.76766,8.16448,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1060900, PASSED 
,0.000130166,364.821,440.119,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1060900, PASSED ,0.000127915,371.24,447.863,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,131044, PASSED ,0.000851461,6.90546,8.31087,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,131044, PASSED ,1.59664e-05,368.256,443.204,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,131044, PASSED ,1.55054e-05,379.205,456.381,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1555009, PASSED ,0.0103826,6.70243,8.08762,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1555009, PASSED ,0.000199778,348.33,420.319,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1555009, PASSED ,0.000201939,344.602,415.82,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,15876, PASSED 
,0.000103206,6.94974,8.30676,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,15876, PASSED ,2.82362e-06,254.019,303.619,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,15876, PASSED ,2.70652e-06,265.009,316.755,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,264196, PASSED ,0.00173718,6.81632,8.21252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,264196, PASSED ,2.89785e-05,408.618,492.316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,264196, PASSED ,2.9737e-05,398.196,479.759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,32400, PASSED ,0.000211668,6.89359,8.26578,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,32400, PASSED ,3.79242e-06,384.755,461.341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,32400, PASSED 
,3.76703e-06,387.348,464.451,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3844, PASSED ,2.48996e-05,7.05094,8.33653,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,3844, PASSED ,2.86182e-06,61.3475,72.5329,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,3844, PASSED ,2.10252e-06,83.5024,98.7272,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,528529, PASSED ,0.00350033,6.76234,8.15367,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,528529, PASSED ,5.48049e-05,431.904,520.767,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,528529, PASSED ,5.55196e-05,426.344,514.063,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,65025, PASSED ,0.000424193,6.88855,8.27772,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,65025, PASSED 
,6.19084e-06,471.999,567.185,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,65025, PASSED ,6.26084e-06,466.722,560.843,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,1860867, PASSED ,0.000622838,16.5543,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,1860867, PASSED ,5.24521e-05,196.573,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,1860867, PASSED ,5.72595e-05,180.069,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,1860867, PASSED ,5.80091e-05,177.742,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,1860867, PASSED ,6.23368e-05,165.402,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,205379, PASSED ,7.6831e-05,31.4224,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,205379, PASSED 
,3.15638e-05,76.4868,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,205379, PASSED ,3.67183e-05,65.7495,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,205379, PASSED ,3.53835e-05,68.2299,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,205379, PASSED ,3.67888e-05,65.6235,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,2744000, PASSED ,0.00110899,12.0213,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,2744000, PASSED ,6.41654e-05,207.767,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,2744000, PASSED ,6.84637e-05,194.723,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,2744000, PASSED ,7.02429e-05,189.791,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,2744000, PASSED 
,7.50827e-05,177.557,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,3796416, PASSED ,0.0017678,9.34983,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,3796416, PASSED ,7.40156e-05,223.313,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,3796416, PASSED ,7.88734e-05,209.559,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,3796416, PASSED ,8.06804e-05,204.866,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,3796416, PASSED ,8.62012e-05,191.745,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,421875, PASSED ,0.000131646,29.4222,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,421875, PASSED ,3.31198e-05,116.949,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,421875, PASSED 
,3.90563e-05,99.173,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,421875, PASSED ,3.73596e-05,103.677,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,421875, PASSED ,3.93232e-05,98.5,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,5639752, PASSED ,0.00288279,7.45299,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,5639752, PASSED ,0.000107821,199.269,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,5639752, PASSED ,0.000111604,192.515,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,5639752, PASSED ,0.00011455,187.563,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,5639752, PASSED ,0.000118996,180.556,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,42875, PASSED 
,2.53527e-05,34.2866,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,42875, PASSED ,2.44541e-05,35.5465,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,42875, PASSED ,3.06456e-05,28.3649,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,42875, PASSED ,2.8092e-05,30.9433,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,42875, PASSED ,2.98791e-05,29.0926,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,7645373, PASSED ,0.00363146,7.23912,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,7645373, PASSED ,0.000128123,205.182,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,7645373, PASSED ,0.00013156,199.822,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,7645373, PASSED 
,0.000143879,182.713,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,7645373, PASSED ,0.00015142,173.613,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,884736, PASSED ,0.000237783,26.5345,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,884736, PASSED ,4.94457e-05,127.604,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,884736, PASSED ,4.51021e-05,139.893,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,884736, PASSED ,4.41649e-05,142.861,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,884736, PASSED ,4.71311e-05,133.87,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,91125, PASSED ,4.63515e-05,30.6163,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,91125, PASSED 
,2.69218e-05,52.7123,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,91125, PASSED ,3.27561e-05,43.3236,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,91125, PASSED ,3.0684e-05,46.2492,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,91125, PASSED ,3.20137e-05,44.3283,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Basic_INDEXLIST_3LOOP,Base_Seq,default,2560000, PASSED ,0.0108399,9.23769,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,2560000, PASSED ,0.000214471,466.897,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,2560000, PASSED ,0.000214766,466.256,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,320000, PASSED ,0.00119211,10.4999,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,320000, PASSED 
,4.0064e-05,312.425,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,320000, PASSED ,3.9534e-05,316.614,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,3750000, PASSED ,0.0160624,9.13207,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,3750000, PASSED ,0.000304586,481.583,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,3750000, PASSED ,0.000302913,484.242,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,5120000, PASSED ,0.022102,9.06123,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,5120000, PASSED ,0.000422616,473.886,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,5120000, PASSED ,0.000421896,474.695,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,640000, PASSED 
,0.00242832,10.3092,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,640000, PASSED ,6.68772e-05,374.327,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,640000, PASSED ,6.60449e-05,379.045,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,7500000, PASSED ,0.032534,9.01723,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,7500000, PASSED ,0.000648369,452.468,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,7500000, PASSED ,0.000650462,451.012,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,80000, PASSED ,0.000220701,14.1788,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,80000, PASSED ,2.14209e-05,146.085,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,80000, PASSED 
,2.18572e-05,143.168,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,10000000, PASSED ,0.0435007,8.99193,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,10000000, PASSED ,0.00087013,449.537,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,10000000, PASSED ,0.000874687,447.195,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,1280000, PASSED ,0.005266,9.50777,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,1280000, PASSED ,0.000112822,443.779,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,1280000, PASSED ,0.000113597,440.75,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,160000, PASSED ,0.000571205,10.9567,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,160000, PASSED 
,2.8735e-05,217.801,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,160000, PASSED ,2.83664e-05,220.631,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_INTSC_HEXHEX,Base_Seq,default,27, PASSED ,0.00148561,0.0758293,3.51739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,27, PASSED ,0.0018511,0.0608571,2.8229,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,27, PASSED ,0.00105126,0.10716,4.97069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,13824, PASSED ,0.75279,0.0766193,3.55404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,13824, PASSED ,0.790273,0.0729852,3.38547,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,13824, PASSED ,0.422165,0.136625,6.33743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,1728, PASSED ,0.09369,0.0769536,3.56954,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_INTSC_HEXHEX,Base_HIP,block_64,1728, PASSED ,0.100249,0.071919,3.33601,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1728, PASSED ,0.055126,0.130787,6.06665,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,19683, PASSED ,1.0703,0.0767298,3.55916,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,19683, PASSED ,1.11803,0.0734538,3.4072,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,19683, PASSED ,0.599997,0.136874,6.34898,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,216, PASSED ,0.011755,0.0766671,3.55625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,216, PASSED ,0.0133699,0.0674069,3.12671,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,216, PASSED ,0.00770426,0.116977,5.42606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,3375, PASSED 
,0.183828,0.0766019,3.55323,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,3375, PASSED ,0.195521,0.0720209,3.34073,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,3375, PASSED ,0.105592,0.133359,6.18593,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,512, PASSED ,0.0277766,0.0769074,3.5674,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,512, PASSED ,0.0303397,0.0704105,3.26604,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,512, PASSED ,0.0174918,0.122127,5.66495,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,64, PASSED ,0.00350096,0.0762729,3.53797,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,64, PASSED ,0.00441563,0.0604735,2.8051,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,64, PASSED ,0.00253179,0.10547,4.89231,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 
+Apps_INTSC_HEXHEX,Base_Seq,default,6859, PASSED ,0.373523,0.0766165,3.5539,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,6859, PASSED ,0.39725,0.0720402,3.34163,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,6859, PASSED ,0.210811,0.135752,6.29694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,1000, PASSED ,0.054175,0.0770157,3.57242,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,1000, PASSED ,0.0582188,0.0716662,3.32428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1000, PASSED ,0.0330844,0.126111,5.84976,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_LTIMES,Base_Seq,default,1344, PASSED ,1.08737e-05,8.69785,6.18006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,1344, FAILED ,3.07262e-06,30.7808,21.8706,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,1344, FAILED ,3.09042e-06,30.6035,21.7446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 
+Apps_LTIMES,RAJA_HIP,launch_256,1344, FAILED ,4.16324e-06,22.7173,16.1413,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,1238784, PASSED ,0.0105919,8.13308,5.8478,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,1238784, PASSED ,0.000520752,165.423,118.942,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,1238784, PASSED ,0.000662645,130.001,93.4727,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,1238784, PASSED ,0.000537092,160.391,115.323,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,154944, PASSED ,0.00130186,8.27718,5.95087,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,154944, PASSED ,6.56977e-05,164.02,117.922,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,154944, PASSED ,8.12846e-05,132.568,95.3096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,154944, PASSED ,6.80803e-05,158.28,113.795,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 
+Apps_LTIMES,Base_Seq,default,1814592, PASSED ,0.0155167,8.13223,5.84722,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,1814592, PASSED ,0.000763999,165.165,118.756,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,1814592, PASSED ,0.000947779,133.138,95.7286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,1814592, PASSED ,0.000781718,161.421,116.064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,19392, PASSED ,0.000161372,8.36339,6.0085,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,19392, PASSED ,8.85826e-06,152.356,109.457,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,19392, PASSED ,1.04605e-05,129.02,92.6917,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,19392, PASSED ,8.85006e-06,152.498,109.559,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,309696, PASSED ,0.00260021,8.28278,5.9552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_LTIMES,Base_HIP,block_256,309696, PASSED ,0.000134703,159.885,114.955,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,309696, PASSED ,0.000165517,130.12,93.5542,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,309696, PASSED ,0.000137936,156.138,112.261,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,38784, PASSED ,0.00032191,8.38156,6.02404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,38784, PASSED ,1.55319e-05,173.714,124.853,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,38784, PASSED ,1.89181e-05,142.62,102.505,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,38784, PASSED ,1.56875e-05,171.991,123.614,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,4992, PASSED ,4.00291e-05,8.70005,6.23547,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,4992, PASSED ,3.75962e-06,92.6304,66.3897,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,4992, 
PASSED ,4.26784e-06,81.5998,58.4839,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,4992, PASSED ,4.41364e-06,78.9043,56.552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,619392, PASSED ,0.00524308,8.21518,5.90676,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,619392, PASSED ,0.000264971,162.557,116.879,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,619392, PASSED ,0.000325472,132.34,95.1529,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,619392, PASSED ,0.000272731,157.932,113.554,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,77568, PASSED ,0.000643971,8.37786,6.02263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,77568, PASSED ,3.27858e-05,164.556,118.295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,77568, PASSED ,3.95277e-05,136.489,98.1186,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,77568, PASSED 
,3.38882e-05,159.203,114.447,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_MASS3DPA,Base_Seq,default,1600, PASSED ,1.14101e-05,5.201,11.1064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,1600, PASSED ,3.32562e-06,17.8445,38.1057,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,1600, PASSED ,3.30442e-06,17.9589,38.3501,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,1619008, PASSED ,0.011684,5.11364,10.9749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,1619008, PASSED ,0.00030745,194.333,417.077,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,1619008, PASSED ,0.000305253,195.732,420.08,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,202368, PASSED ,0.00143621,5.2001,11.1601,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,202368, PASSED ,3.63478e-05,205.471,440.966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,202368, PASSED 
,3.61652e-05,206.508,443.193,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,2371584, PASSED ,0.0171401,5.10618,10.9589,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,2371584, PASSED ,0.000452133,193.572,415.446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,2371584, PASSED ,0.00045328,193.082,414.395,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,25344, PASSED ,0.000180177,5.19259,11.1409,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,25344, PASSED ,9.69846e-06,96.4673,206.973,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,25344, PASSED ,9.73108e-06,96.1439,206.28,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,404736, PASSED ,0.00288824,5.17149,11.0989,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,404736, PASSED ,7.14611e-05,209.016,448.585,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,404736, PASSED 
,7.10115e-05,210.34,451.425,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,50624, PASSED ,0.000361054,5.17515,11.1052,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,50624, PASSED ,1.34799e-05,138.615,297.449,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,50624, PASSED ,1.34411e-05,139.015,298.307,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,6336, PASSED ,4.44523e-05,5.26676,11.2892,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,6336, PASSED ,4.15182e-06,56.3896,120.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,6336, PASSED ,4.18842e-06,55.8969,119.814,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,809536, PASSED ,0.00581382,5.13865,11.0285,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,809536, PASSED ,0.000145012,206.019,442.156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,809536, PASSED 
,0.00014442,206.864,443.969,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,101184, PASSED ,0.000719264,5.19191,11.1421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,101184, PASSED ,1.98101e-05,188.507,404.545,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,101184, PASSED ,1.98851e-05,187.797,403.019,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,64, PASSED ,7.776e-07,15.3687,4.36214,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,64, PASSED ,5.15474e-06,2.3184,0.658035,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,64, PASSED ,2.33242e-06,5.12375,1.45428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,328509, PASSED ,0.00917113,4.66426,1.89846,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,328509, PASSED 
,0.000111003,385.364,156.851,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,328509, PASSED ,0.000111162,384.811,156.627,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,35937, PASSED ,0.000397252,12.1287,4.79459,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,35937, PASSED ,1.17467e-05,410.17,162.145,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,35937, PASSED ,1.15984e-05,415.415,164.218,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,493039, PASSED ,0.0138821,4.60877,1.88236,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,493039, PASSED ,0.000184528,346.718,141.61,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,493039, PASSED ,0.000183998,347.717,142.018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,3375, PASSED 
,3.73785e-05,12.9009,4.78551,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,3375, PASSED ,5.13613e-06,93.8871,34.8268,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,3375, PASSED ,3.25252e-06,148.259,54.9958,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,79507, PASSED ,0.00102856,10.2309,4.09687,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,79507, PASSED ,2.43966e-05,431.336,172.724,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,79507, PASSED ,2.44283e-05,430.777,172.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,8000, PASSED ,9.12819e-05,12.1691,4.64495,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,8000, PASSED ,5.21364e-06,213.061,81.3251,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,8000, PASSED 
,3.29452e-06,337.173,128.699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,512, PASSED ,5.63534e-06,14.2524,4.81533,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,512, PASSED ,5.02134e-06,15.9952,5.40414,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,512, PASSED ,3.43943e-06,23.3519,7.88968,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,157464, PASSED ,0.0024644,8.38297,3.38646,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,157464, PASSED ,4.46316e-05,462.878,186.988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,157464, PASSED ,4.49968e-05,459.122,185.471,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,17576, PASSED ,0.000194791,12.2763,4.78219,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,17576, PASSED 
,5.39324e-06,443.39,172.721,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,17576, PASSED ,5.07074e-06,471.59,183.707,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_MULTI_REDUCE,Base_Seq,default,3120, PASSED ,9.75346e-06,4.78196,0.319886,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,3120, PASSED ,9.98628e-06,4.67047,0.312429,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,3120, PASSED ,1.00875e-05,4.62363,0.309295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,3120, PASSED ,1.07345e-05,4.34494,0.290652,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,3120, PASSED ,1.08837e-05,4.28538,0.286668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,3199995, PASSED ,0.0104146,4.57854,0.30726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,3199995, PASSED 
,0.000104195,457.638,30.7115,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,3199995, PASSED ,9.58552e-05,497.456,33.3836,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,3199995, PASSED ,0.000115699,412.137,27.6579,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,3199995, PASSED ,9.6333e-05,494.989,33.218,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,399995, PASSED ,0.00129921,4.5878,0.307875,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,399995, PASSED ,2.00181e-05,297.757,19.9816,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,399995, PASSED ,1.99375e-05,298.961,20.0624,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,399995, PASSED ,2.10783e-05,282.78,18.9766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,399995, PASSED 
,2.06653e-05,288.432,19.3558,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,4687495, PASSED ,0.0152572,4.57812,0.307232,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,4687495, PASSED ,0.000169427,412.268,27.6668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,4687495, PASSED ,0.000150721,463.435,31.1006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,4687495, PASSED ,0.000189504,368.591,24.7356,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,4687495, PASSED ,0.000150622,463.739,31.121,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,49995, PASSED ,0.000161997,4.59966,0.308616,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,49995, PASSED ,1.07981e-05,69.0062,4.63,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,49995, PASSED 
,1.07923e-05,69.0431,4.63248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,49995, PASSED ,1.15151e-05,64.7093,4.3417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,49995, PASSED ,1.18101e-05,63.0929,4.23325,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,799995, PASSED ,0.00259959,4.58573,0.307739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,799995, PASSED ,2.92524e-05,407.522,27.348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,799995, PASSED ,2.9184e-05,408.478,27.4121,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,799995, PASSED ,3.08014e-05,387.028,25.9727,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,799995, PASSED ,2.99362e-05,398.214,26.7233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,99995, PASSED 
,0.000324521,4.59197,0.308131,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,99995, PASSED ,1.20055e-05,124.126,8.3291,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,99995, PASSED ,1.14005e-05,130.713,8.77114,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,99995, PASSED ,1.27285e-05,117.075,7.856,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,99995, PASSED ,1.21023e-05,123.133,8.26249,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,12495, PASSED ,4.01375e-05,4.64252,0.311305,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,12495, PASSED ,1.05149e-05,17.7215,1.18832,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,12495, PASSED ,1.05581e-05,17.6489,1.18345,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,12495, PASSED 
,1.09563e-05,17.0075,1.14044,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,12495, PASSED ,1.11973e-05,16.6415,1.1159,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,1599995, PASSED ,0.00520593,4.57977,0.307341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,1599995, PASSED ,4.81451e-05,495.21,33.2328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,1599995, PASSED ,4.78873e-05,497.876,33.4117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,1599995, PASSED ,5.13857e-05,463.98,31.1369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,1599995, PASSED ,4.84835e-05,491.753,33.0008,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,199995, PASSED ,0.000649353,4.58966,0.307991,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,199995, PASSED 
,1.34511e-05,221.566,14.8683,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,199995, PASSED ,1.24901e-05,238.614,16.0123,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,199995, PASSED ,1.46049e-05,204.062,13.6937,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,199995, PASSED ,1.37171e-05,217.27,14.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_REDUCE_STRUCT,Base_Seq,default,3125, PASSED ,2.73462e-06,17.0284,2.28624,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,3125, PASSED ,1.02981e-05,4.52183,0.607103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,3125, PASSED ,5.05764e-06,9.20709,1.23615,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,3125, PASSED ,1.90975e-05,2.43833,0.327372,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,3125, PASSED 
,1.89425e-05,2.45828,0.330051,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,3125, PASSED ,2.29393e-05,2.02997,0.272545,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,3125, PASSED ,1.91345e-05,2.43362,0.326739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,3125, PASSED ,2.64364e-05,1.76144,0.236492,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,3125, PASSED ,2.29583e-05,2.02829,0.272319,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,3125, PASSED ,1.91847e-05,2.42725,0.325884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,3125, PASSED ,2.68696e-05,1.73304,0.232679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,3200000, PASSED ,0.00278983,17.092,2.29405,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,3200000, PASSED 
,0.0104282,4.57258,0.613722,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,3200000, PASSED ,0.00510038,9.34906,1.25481,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,3200000, PASSED ,0.00616805,7.73076,1.03761,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,3200000, PASSED ,0.000184726,258.132,34.6459,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,3200000, PASSED ,0.000657996,72.468,9.7265,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,3200000, PASSED ,0.000766404,62.2175,8.35069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,3200000, PASSED ,0.00106557,44.7497,6.0062,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,3200000, PASSED ,0.000123017,387.62,52.0255,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,3200000, PASSED 
,0.000134688,354.03,47.5171,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,3200000, PASSED ,0.000135014,353.177,47.4026,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,400000, PASSED ,0.000332584,17.9217,2.40541,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,400000, PASSED ,0.00129928,4.58753,0.615729,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,400000, PASSED ,0.000631813,9.43391,1.2662,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,400000, PASSED ,0.000729383,8.17193,1.09682,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,400000, PASSED ,0.000113421,52.5516,7.05338,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,400000, PASSED ,9.62844e-05,61.9048,8.30874,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,400000, PASSED 
,0.000109261,54.5527,7.32195,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,400000, PASSED ,0.000152918,38.9782,5.23158,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,400000, PASSED ,3.76461e-05,158.329,21.2506,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,400000, PASSED ,4.31967e-05,137.984,18.52,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,400000, PASSED ,4.95181e-05,120.369,16.1557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,4687500, PASSED ,0.00408657,17.0924,2.2941,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,4687500, PASSED ,0.0152744,4.57297,0.613774,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,4687500, PASSED ,0.00747505,9.34431,1.25417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,4687500, PASSED 
,0.00808465,8.63973,1.15961,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,4687500, PASSED ,0.000247098,282.678,37.9404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,4687500, PASSED ,0.000956887,72.9963,9.7974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,4687500, PASSED ,0.00111872,62.4369,8.38014,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,4687500, PASSED ,0.00154463,45.2207,6.06943,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,4687500, PASSED ,0.000178226,391.914,52.6018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,4687500, PASSED ,0.000190922,365.851,49.1038,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,4687500, PASSED ,0.000189367,368.856,49.507,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 
+Basic_REDUCE_STRUCT,Base_Seq,default,50000, PASSED ,4.21627e-05,17.671,2.37181,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,50000, PASSED ,0.000162529,4.58415,0.615287,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,50000, PASSED ,7.91211e-05,9.41668,1.26391,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,50000, PASSED ,0.000105269,7.07765,0.949965,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,50000, PASSED ,0.000104101,7.15708,0.960626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,50000, PASSED ,2.70728e-05,27.5206,3.69382,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,50000, PASSED ,3.2259e-05,23.0961,3.09997,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,50000, PASSED ,3.66256e-05,20.3425,2.73038,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,50000, PASSED 
,2.69692e-05,27.6263,3.70801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,50000, PASSED ,3.26454e-05,22.8227,3.06328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,50000, PASSED ,3.68006e-05,20.2458,2.7174,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,800000, PASSED ,0.000670746,17.7726,2.3854,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,800000, PASSED ,0.00260007,4.58485,0.615369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,800000, PASSED ,0.00126649,9.41254,1.26333,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,800000, PASSED ,0.00149687,7.9639,1.0689,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,800000, PASSED ,0.000127232,93.6942,12.5754,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,800000, PASSED 
,0.000175058,68.097,9.13983,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,800000, PASSED ,0.00020134,59.208,7.94678,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,800000, PASSED ,0.000283312,42.077,5.64748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,800000, PASSED ,4.65349e-05,256.172,34.3828,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,800000, PASSED ,5.30948e-05,224.522,30.1348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,800000, PASSED ,5.91812e-05,201.431,27.0357,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,100000, PASSED ,8.36332e-05,17.8173,2.39142,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,100000, PASSED ,0.000325051,4.58426,0.615295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,100000, PASSED 
,0.000158334,9.4112,1.26316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,100000, PASSED ,0.000203711,7.31487,0.981795,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,100000, PASSED ,0.00010257,14.5278,1.94991,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,100000, PASSED ,3.68052e-05,40.4865,5.43406,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,100000, PASSED ,4.26279e-05,34.9564,4.69181,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,100000, PASSED ,5.37996e-05,27.6976,3.71754,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,100000, PASSED ,2.76564e-05,53.8797,7.23168,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,100000, PASSED ,3.3627e-05,44.3131,5.94766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,100000, PASSED 
,4.17289e-05,35.7095,4.79289,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,12500, PASSED ,1.03141e-05,18.0593,2.42407,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,12500, PASSED ,4.06763e-05,4.57919,0.614658,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,12500, PASSED ,1.96435e-05,9.48223,1.27278,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,12500, PASSED ,3.42016e-05,5.44607,0.731018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,12500, PASSED ,3.3888e-05,5.49647,0.737782,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,12500, PASSED ,2.37887e-05,7.82994,1.051,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,12500, PASSED ,2.8524e-05,6.5301,0.876525,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,12500, PASSED 
,2.7577e-05,6.75435,0.906626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,12500, PASSED ,2.35784e-05,7.89981,1.06038,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,12500, PASSED ,2.89538e-05,6.43316,0.863514,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,12500, PASSED ,2.78234e-05,6.69453,0.898597,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,1600000, PASSED ,0.00138466,17.2186,2.31104,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,1600000, PASSED ,0.00521217,4.57427,0.613948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,1600000, PASSED ,0.00254821,9.3563,1.25578,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,1600000, PASSED ,0.00309166,7.71168,1.03504,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,1600000, PASSED 
,0.000137386,173.54,23.2921,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,1600000, PASSED ,0.000329293,72.4032,9.7178,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,1600000, PASSED ,0.000378012,63.0717,8.46535,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,1600000, PASSED ,0.000534626,44.5954,5.98549,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,1600000, PASSED ,6.53418e-05,364.879,48.9732,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,1600000, PASSED ,7.30097e-05,326.557,43.8298,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,1600000, PASSED ,7.63581e-05,312.237,41.9078,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,200000, PASSED ,0.000167119,17.833,2.39351,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,200000, PASSED 
,0.00065002,4.58483,0.615369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,200000, PASSED ,0.000316624,9.41252,1.26333,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,200000, PASSED ,0.000381665,7.8085,1.04804,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,200000, PASSED ,0.000103741,28.7275,3.85576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,200000, PASSED ,5.41124e-05,55.0749,7.39206,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,200000, PASSED ,6.13572e-05,48.5718,6.51923,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,200000, PASSED ,8.93898e-05,33.3397,4.47481,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,200000, PASSED ,2.97842e-05,100.061,13.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,200000, PASSED 
,3.49464e-05,85.28,11.4461,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,200000, PASSED ,4.34719e-05,68.5554,9.2014,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_CONVECTION3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_CONVECTION3DPA_bandwidth.png new file mode 100644 index 0000000..b217155 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_CONVECTION3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_CONVECTION3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_CONVECTION3DPA_flops.png new file mode 100644 index 0000000..9ef9c8b Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_CONVECTION3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png new file mode 100644 index 0000000..073fa28 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_DEL_DOT_VEC_2D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_DEL_DOT_VEC_2D_flops.png new file mode 100644 index 0000000..5ac0422 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_DEL_DOT_VEC_2D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_INTSC_HEXHEX_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_INTSC_HEXHEX_bandwidth.png new file mode 100644 index 0000000..530c3c8 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_INTSC_HEXHEX_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_INTSC_HEXHEX_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_INTSC_HEXHEX_flops.png new file mode 100644 index 0000000..745a273 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_INTSC_HEXHEX_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_LTIMES_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_LTIMES_bandwidth.png new file mode 100644 index 0000000..01a89cf Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_LTIMES_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_LTIMES_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_LTIMES_flops.png new file mode 100644 index 0000000..e47d724 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_LTIMES_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MASS3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MASS3DPA_bandwidth.png new file mode 100644 index 0000000..de87042 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MASS3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MASS3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MASS3DPA_flops.png new file mode 100644 index 0000000..b3e8d64 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MASS3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png new file mode 100644 index 0000000..979bfb0 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MATVEC_3D_STENCIL_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MATVEC_3D_STENCIL_flops.png new file mode 100644 index 0000000..a6fcc84 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Apps_MATVEC_3D_STENCIL_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_INDEXLIST_3LOOP_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_INDEXLIST_3LOOP_bandwidth.png new file mode 100644 index 0000000..1a7512f Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_INDEXLIST_3LOOP_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_INDEXLIST_3LOOP_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_INDEXLIST_3LOOP_flops.png new file mode 100644 index 0000000..91e2642 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_INDEXLIST_3LOOP_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_MULTI_REDUCE_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_MULTI_REDUCE_bandwidth.png new file mode 100644 index 0000000..637a241 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_MULTI_REDUCE_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_MULTI_REDUCE_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_MULTI_REDUCE_flops.png new file mode 100644 index 0000000..f213bd4 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_MULTI_REDUCE_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_REDUCE_STRUCT_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_REDUCE_STRUCT_bandwidth.png new file mode 100644 index 0000000..e4c1b05 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_REDUCE_STRUCT_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_REDUCE_STRUCT_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_REDUCE_STRUCT_flops.png new file mode 100644 index 0000000..cdbc6ab Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Basic_REDUCE_STRUCT_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Comm_HALO_PACKING_FUSED_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Comm_HALO_PACKING_FUSED_bandwidth.png new file mode 100644 index 0000000..60b3c6f Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Comm_HALO_PACKING_FUSED_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Comm_HALO_PACKING_FUSED_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Comm_HALO_PACKING_FUSED_flops.png new file mode 100644 index 0000000..753b298 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/figures/Comm_HALO_PACKING_FUSED_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/output_with_variant_tuning.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/output_with_variant_tuning.csv new file mode 100644 index 0000000..f02bead --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/output_with_variant_tuning.csv @@ -0,0 +1,431 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning,Smoothed Mean flops (gigaFLOP per sec.),Smoothed Bandwidth (GiB per sec.) 
+Apps_CONVECTION3DPA,Base_Seq,default,702, PASSED ,7.33484e-06,7.24657,13.0552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,13.5986,7.51252 +Apps_CONVECTION3DPA,Base_HIP,block_64,702, PASSED ,2.82362e-06,18.8242,33.9132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,129.201,71.4457 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,702, PASSED ,2.89982e-06,18.3296,33.022,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,120.606,66.6931 +Apps_CONVECTION3DPA,Base_Seq,default,702459, PASSED ,0.0245371,2.15669,3.90513,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,4.197215,2.31801 +Apps_CONVECTION3DPA,Base_HIP,block_64,702459, PASSED ,0.000253699,208.59,377.694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,398.0925,219.856 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,702459, PASSED ,0.000254628,207.829,376.316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,394.82399999999996,218.051 +Apps_CONVECTION3DPA,Base_Seq,default,87804, PASSED ,0.000946896,6.98584,12.6488,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,11.8994,6.57224 +Apps_CONVECTION3DPA,Base_HIP,block_64,87804, PASSED ,2.85542e-05,231.66,419.452,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,418.491,231.122 
+Apps_CONVECTION3DPA,RAJA_HIP,block_64,87804, PASSED ,2.83612e-05,233.236,422.306,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,413.332,228.273 +Apps_CONVECTION3DPA,Base_Seq,default,1028970, PASSED ,0.0376482,2.05897,3.72818,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,3.90513,2.15669 +Apps_CONVECTION3DPA,Base_HIP,block_64,1028970, PASSED ,0.000379837,204.078,369.525,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,377.694,208.59 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,1028970, PASSED ,0.000378437,204.833,370.892,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,376.316,207.829 +Apps_CONVECTION3DPA,Base_Seq,default,10989, PASSED ,0.000110231,7.51252,13.5986,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,13.0552,7.24657 +Apps_CONVECTION3DPA,Base_HIP,block_64,10989, PASSED ,5.26884e-06,157.171,284.499,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,284.499,157.171 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,10989, PASSED ,5.42224e-06,152.725,276.451,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,276.451,152.725 +Apps_CONVECTION3DPA,Base_Seq,default,175608, PASSED ,0.00249516,5.30205,9.60028,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,9.60028,5.30205 
+Apps_CONVECTION3DPA,Base_HIP,block_64,175608, PASSED ,5.60524e-05,236.02,427.354,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,418.491,231.122 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,175608, PASSED ,5.58736e-05,236.775,428.722,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,413.332,228.273 +Apps_CONVECTION3DPA,Base_Seq,default,21951, PASSED ,0.000234811,7.04361,12.7519,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,12.7519,7.04361 +Apps_CONVECTION3DPA,Base_HIP,block_64,21951, PASSED ,8.35126e-06,198.044,358.542,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,358.542,198.044 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,21951, PASSED ,8.54646e-06,193.521,350.353,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,350.353,193.521 +Apps_CONVECTION3DPA,Base_Seq,default,2754, PASSED ,2.6859e-05,7.73436,13.9866,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,13.326899999999998,7.379545 +Apps_CONVECTION3DPA,Base_HIP,block_64,2754, PASSED ,2.90762e-06,71.4457,129.201,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,206.85000000000002,114.30834999999999 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,2754, PASSED 
,3.11482e-06,66.6931,120.606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,198.5285,109.70904999999999 +Apps_CONVECTION3DPA,Base_Seq,default,351216, PASSED ,0.0106717,2.47933,4.4893,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.4893,2.47933 +Apps_CONVECTION3DPA,Base_HIP,block_64,351216, PASSED ,0.000114479,231.122,418.491,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,418.491,231.122 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,351216, PASSED ,0.000115908,228.273,413.332,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,413.332,228.273 +Apps_CONVECTION3DPA,Base_Seq,default,43902, PASSED ,0.000503263,6.57224,11.8994,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,12.6488,6.98584 +Apps_CONVECTION3DPA,Base_HIP,block_64,43902, PASSED ,1.48289e-05,223.049,403.844,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,403.844,223.049 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,43902, PASSED ,1.50069e-05,220.403,399.054,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,399.054,220.403 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,841, PASSED ,5.52134e-06,7.12761,8.22518,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,8.30676,7.05094 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,841, PASSED 
,2.99723e-06,13.1301,15.152,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,72.5329,61.3475 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,841, PASSED ,2.05801e-06,19.1223,22.0669,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,98.7272,83.5024 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1060900, PASSED ,0.00701681,6.76766,8.16448,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,8.159075,6.765000000000001 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1060900, PASSED ,0.000130166,364.821,440.119,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,466.2175,386.71950000000004 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1060900, PASSED ,0.000127915,371.24,447.863,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,463.81100000000004,384.718 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,131044, PASSED ,0.000851461,6.90546,8.31087,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,8.26578,6.88855 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,131044, PASSED ,1.59664e-05,368.256,443.204,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,492.316,408.618 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,131044, PASSED ,1.55054e-05,379.205,456.381,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,479.759,398.196 
+Apps_DEL_DOT_VEC_2D,Base_Seq,default,1555009, PASSED ,0.0103826,6.70243,8.08762,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,8.15367,6.76234 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1555009, PASSED ,0.000199778,348.33,420.319,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,440.119,364.821 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1555009, PASSED ,0.000201939,344.602,415.82,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,447.863,371.24 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,15876, PASSED ,0.000103206,6.94974,8.30676,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,8.27772,6.94974 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,15876, PASSED ,2.82362e-06,254.019,303.619,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,303.619,254.019 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,15876, PASSED ,2.70652e-06,265.009,316.755,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,316.755,265.009 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,264196, PASSED ,0.00173718,6.81632,8.21252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,8.21252,6.81632 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,264196, PASSED ,2.89785e-05,408.618,492.316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,492.316,408.618 
+Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,264196, PASSED ,2.9737e-05,398.196,479.759,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,479.759,398.196 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,32400, PASSED ,0.000211668,6.89359,8.26578,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,8.30676,6.90546 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,32400, PASSED ,3.79242e-06,384.755,461.341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,443.204,368.256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,32400, PASSED ,3.76703e-06,387.348,464.451,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,456.381,379.205 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3844, PASSED ,2.48996e-05,7.05094,8.33653,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,8.28627,7.00034 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,3844, PASSED ,2.86182e-06,61.3475,72.5329,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,188.07595,157.68325 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,3844, PASSED ,2.10252e-06,83.5024,98.7272,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,207.7411,174.2557 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,528529, PASSED ,0.00350033,6.76234,8.15367,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,8.16448,6.76766 
+Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,528529, PASSED ,5.48049e-05,431.904,520.767,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,443.204,368.256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,528529, PASSED ,5.55196e-05,426.344,514.063,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,456.381,379.205 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,65025, PASSED ,0.000424193,6.88855,8.27772,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,8.27772,6.89359 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,65025, PASSED ,6.19084e-06,471.999,567.185,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,461.341,384.755 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,65025, PASSED ,6.26084e-06,466.722,560.843,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,464.451,387.348 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,1860867, PASSED ,0.000622838,16.5543,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,16.5543 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,1860867, PASSED ,5.24521e-05,196.573,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,196.573 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,1860867, PASSED 
,5.72595e-05,180.069,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,180.069 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,1860867, PASSED ,5.80091e-05,177.742,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,177.742 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,1860867, PASSED ,6.23368e-05,165.402,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,165.402 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,205379, PASSED ,7.6831e-05,31.4224,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,30.6163 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,205379, PASSED ,3.15638e-05,76.4868,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,76.4868 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,205379, PASSED ,3.67183e-05,65.7495,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,65.7495 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,205379, PASSED ,3.53835e-05,68.2299,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,68.2299 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,205379, PASSED ,3.67888e-05,65.6235,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,65.6235 
+Comm_HALO_PACKING_FUSED,Base_Seq,direct,2744000, PASSED ,0.00110899,12.0213,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,12.0213 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,2744000, PASSED ,6.41654e-05,207.767,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,199.269 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,2744000, PASSED ,6.84637e-05,194.723,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,192.515 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,2744000, PASSED ,7.02429e-05,189.791,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,187.563 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,2744000, PASSED ,7.50827e-05,177.557,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,177.557 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,3796416, PASSED ,0.0017678,9.34983,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,9.34983 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,3796416, PASSED ,7.40156e-05,223.313,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,205.182 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,3796416, PASSED 
,7.88734e-05,209.559,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,194.723 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,3796416, PASSED ,8.06804e-05,204.866,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,187.563 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,3796416, PASSED ,8.62012e-05,191.745,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,177.557 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,421875, PASSED ,0.000131646,29.4222,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,29.4222 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,421875, PASSED ,3.31198e-05,116.949,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,116.949 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,421875, PASSED ,3.90563e-05,99.173,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,99.173 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,421875, PASSED ,3.73596e-05,103.677,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,103.677 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,421875, PASSED ,3.93232e-05,98.5,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,98.5 
+Comm_HALO_PACKING_FUSED,Base_Seq,direct,5639752, PASSED ,0.00288279,7.45299,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,8.40141 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,5639752, PASSED ,0.000107821,199.269,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,206.47449999999998 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,5639752, PASSED ,0.000111604,192.515,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,197.2725 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,5639752, PASSED ,0.00011455,187.563,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,188.677 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,5639752, PASSED ,0.000118996,180.556,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,179.0565 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,42875, PASSED ,2.53527e-05,34.2866,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,31.4224 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,42875, PASSED ,2.44541e-05,35.5465,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,52.7123 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,42875, PASSED 
,3.06456e-05,28.3649,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,43.3236 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,42875, PASSED ,2.8092e-05,30.9433,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,46.2492 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,42875, PASSED ,2.98791e-05,29.0926,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,44.3283 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,7645373, PASSED ,0.00363146,7.23912,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,7.45299 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,7645373, PASSED ,0.000128123,205.182,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,205.182 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,7645373, PASSED ,0.00013156,199.822,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,199.822 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,7645373, PASSED ,0.000143879,182.713,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,187.563 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,7645373, PASSED ,0.00015142,173.613,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,180.556 
+Comm_HALO_PACKING_FUSED,Base_Seq,direct,884736, PASSED ,0.000237783,26.5345,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,26.5345 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,884736, PASSED ,4.94457e-05,127.604,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,127.604 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,884736, PASSED ,4.51021e-05,139.893,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,139.893 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,884736, PASSED ,4.41649e-05,142.861,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,142.861 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,884736, PASSED ,4.71311e-05,133.87,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,133.87 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,91125, PASSED ,4.63515e-05,30.6163,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,31.01935 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,91125, PASSED ,2.69218e-05,52.7123,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,64.59955 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,91125, PASSED 
,3.27561e-05,43.3236,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,54.53655 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,91125, PASSED ,3.0684e-05,46.2492,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,57.23955 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,91125, PASSED ,3.20137e-05,44.3283,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,54.9759 +Basic_INDEXLIST_3LOOP,Base_Seq,default,2560000, PASSED ,0.0108399,9.23769,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.23769 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,2560000, PASSED ,0.000214471,466.897,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,466.897 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,2560000, PASSED ,0.000214766,466.256,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,466.256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,320000, PASSED ,0.00119211,10.4999,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.4999 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,320000, PASSED ,4.0064e-05,312.425,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,312.425 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,320000, PASSED 
,3.9534e-05,316.614,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,316.614 +Basic_INDEXLIST_3LOOP,Base_Seq,default,3750000, PASSED ,0.0160624,9.13207,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.13207 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,3750000, PASSED ,0.000304586,481.583,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,466.897 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,3750000, PASSED ,0.000302913,484.242,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,466.256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,5120000, PASSED ,0.022102,9.06123,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.06123 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,5120000, PASSED ,0.000422616,473.886,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,466.897 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,5120000, PASSED ,0.000421896,474.695,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,466.256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,640000, PASSED ,0.00242832,10.3092,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.3092 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,640000, PASSED 
,6.68772e-05,374.327,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,374.327 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,640000, PASSED ,6.60449e-05,379.045,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,379.045 +Basic_INDEXLIST_3LOOP,Base_Seq,default,7500000, PASSED ,0.032534,9.01723,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.03923 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,7500000, PASSED ,0.000648369,452.468,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,463.177 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,7500000, PASSED ,0.000650462,451.012,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,462.8535 +Basic_INDEXLIST_3LOOP,Base_Seq,default,80000, PASSED ,0.000220701,14.1788,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.9567 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,80000, PASSED ,2.14209e-05,146.085,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,217.801 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,80000, PASSED ,2.18572e-05,143.168,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,220.631 +Basic_INDEXLIST_3LOOP,Base_Seq,default,10000000, PASSED 
,0.0435007,8.99193,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.01723 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,10000000, PASSED ,0.00087013,449.537,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,452.468 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,10000000, PASSED ,0.000874687,447.195,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,451.012 +Basic_INDEXLIST_3LOOP,Base_Seq,default,1280000, PASSED ,0.005266,9.50777,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.50777 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,1280000, PASSED ,0.000112822,443.779,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,443.779 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,1280000, PASSED ,0.000113597,440.75,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,440.75 +Basic_INDEXLIST_3LOOP,Base_Seq,default,160000, PASSED ,0.000571205,10.9567,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.7283 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,160000, PASSED ,2.8735e-05,217.801,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,265.113 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,160000, PASSED 
,2.83664e-05,220.631,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,268.6225 +Apps_INTSC_HEXHEX,Base_Seq,default,27, PASSED ,0.00148561,0.0758293,3.51739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,3.53797,0.0762729 +Apps_INTSC_HEXHEX,Base_HIP,block_64,27, PASSED ,0.0018511,0.0608571,2.8229,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,2.8229,0.0608571 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,27, PASSED ,0.00105126,0.10716,4.97069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,4.97069,0.10716 +Apps_INTSC_HEXHEX,Base_Seq,default,13824, PASSED ,0.75279,0.0766193,3.55404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,3.55397,0.0766179 +Apps_INTSC_HEXHEX,Base_HIP,block_64,13824, PASSED ,0.790273,0.0729852,3.38547,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,3.36355,0.0725127 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,13824, PASSED ,0.422165,0.136625,6.33743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,6.317185,0.1361885 +Apps_INTSC_HEXHEX,Base_Seq,default,1728, PASSED ,0.09369,0.0769536,3.56954,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,3.5674,0.0769074 +Apps_INTSC_HEXHEX,Base_HIP,block_64,1728, PASSED 
,0.100249,0.071919,3.33601,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,3.33601,0.071919 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1728, PASSED ,0.055126,0.130787,6.06665,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,6.06665,0.130787 +Apps_INTSC_HEXHEX,Base_Seq,default,19683, PASSED ,1.0703,0.0767298,3.55916,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,3.55404,0.0766193 +Apps_INTSC_HEXHEX,Base_HIP,block_64,19683, PASSED ,1.11803,0.0734538,3.4072,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,3.38547,0.0729852 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,19683, PASSED ,0.599997,0.136874,6.34898,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,6.33743,0.136625 +Apps_INTSC_HEXHEX,Base_Seq,default,216, PASSED ,0.011755,0.0766671,3.55625,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,3.55625,0.0766671 +Apps_INTSC_HEXHEX,Base_HIP,block_64,216, PASSED ,0.0133699,0.0674069,3.12671,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,3.12671,0.0674069 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,216, PASSED ,0.00770426,0.116977,5.42606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,5.42606,0.116977 +Apps_INTSC_HEXHEX,Base_Seq,default,3375, PASSED 
,0.183828,0.0766019,3.55323,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,3.55404,0.0766193 +Apps_INTSC_HEXHEX,Base_HIP,block_64,3375, PASSED ,0.195521,0.0720209,3.34073,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,3.34073,0.0720209 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,3375, PASSED ,0.105592,0.133359,6.18593,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,6.18593,0.133359 +Apps_INTSC_HEXHEX,Base_Seq,default,512, PASSED ,0.0277766,0.0769074,3.5674,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,3.5674,0.0769074 +Apps_INTSC_HEXHEX,Base_HIP,block_64,512, PASSED ,0.0303397,0.0704105,3.26604,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,3.26604,0.0704105 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,512, PASSED ,0.0174918,0.122127,5.66495,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,5.66495,0.122127 +Apps_INTSC_HEXHEX,Base_Seq,default,64, PASSED ,0.00350096,0.0762729,3.53797,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,3.54711,0.07647000000000001 +Apps_INTSC_HEXHEX,Base_HIP,block_64,64, PASSED ,0.00441563,0.0604735,2.8051,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,2.974805,0.064132 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,64, PASSED 
,0.00253179,0.10547,4.89231,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,5.198375,0.1120685 +Apps_INTSC_HEXHEX,Base_Seq,default,6859, PASSED ,0.373523,0.0766165,3.5539,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,3.55404,0.0766193 +Apps_INTSC_HEXHEX,Base_HIP,block_64,6859, PASSED ,0.39725,0.0720402,3.34163,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,3.34163,0.0720402 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,6859, PASSED ,0.210811,0.135752,6.29694,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,6.29694,0.135752 +Apps_INTSC_HEXHEX,Base_Seq,default,1000, PASSED ,0.054175,0.0770157,3.57242,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,3.5674,0.0769074 +Apps_INTSC_HEXHEX,Base_HIP,block_64,1000, PASSED ,0.0582188,0.0716662,3.32428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,3.32428,0.0716662 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1000, PASSED ,0.0330844,0.126111,5.84976,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,5.84976,0.126111 +Apps_LTIMES,Base_Seq,default,1344, PASSED ,1.08737e-05,8.69785,6.18006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,6.18006,8.69785 +Apps_LTIMES,Base_HIP,block_256,1344, FAILED 
,3.07262e-06,30.7808,21.8706,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,66.3897,92.6304 +Apps_LTIMES,RAJA_HIP,kernel_256,1344, FAILED ,3.09042e-06,30.6035,21.7446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,58.4839,81.5998 +Apps_LTIMES,RAJA_HIP,launch_256,1344, FAILED ,4.16324e-06,22.7173,16.1413,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,56.552,78.9043 +Apps_LTIMES,Base_Seq,default,1238784, PASSED ,0.0105919,8.13308,5.8478,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,5.877280000000001,8.17413 +Apps_LTIMES,Base_HIP,block_256,1238784, PASSED ,0.000520752,165.423,118.942,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,117.8175,163.861 +Apps_LTIMES,RAJA_HIP,kernel_256,1238784, PASSED ,0.000662645,130.001,93.4727,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,94.35355,131.23000000000002 +Apps_LTIMES,RAJA_HIP,launch_256,1238784, PASSED ,0.000537092,160.391,115.323,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,114.4385,159.1615 +Apps_LTIMES,Base_Seq,default,154944, PASSED ,0.00130186,8.27718,5.95087,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,5.9552,8.28278 +Apps_LTIMES,Base_HIP,block_256,154944, PASSED 
,6.56977e-05,164.02,117.922,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,117.922,164.02 +Apps_LTIMES,RAJA_HIP,kernel_256,154944, PASSED ,8.12846e-05,132.568,95.3096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,95.3096,132.568 +Apps_LTIMES,RAJA_HIP,launch_256,154944, PASSED ,6.80803e-05,158.28,113.795,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,113.795,158.28 +Apps_LTIMES,Base_Seq,default,1814592, PASSED ,0.0155167,8.13223,5.84722,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,5.8478,8.13308 +Apps_LTIMES,Base_HIP,block_256,1814592, PASSED ,0.000763999,165.165,118.756,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,118.756,165.165 +Apps_LTIMES,RAJA_HIP,kernel_256,1814592, PASSED ,0.000947779,133.138,95.7286,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,95.1529,132.34 +Apps_LTIMES,RAJA_HIP,launch_256,1814592, PASSED ,0.000781718,161.421,116.064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,115.323,160.391 +Apps_LTIMES,Base_Seq,default,19392, PASSED ,0.000161372,8.36339,6.0085,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,6.02404,8.38156 +Apps_LTIMES,Base_HIP,block_256,19392, PASSED 
,8.85826e-06,152.356,109.457,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,109.457,152.356 +Apps_LTIMES,RAJA_HIP,kernel_256,19392, PASSED ,1.04605e-05,129.02,92.6917,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,92.6917,129.02 +Apps_LTIMES,RAJA_HIP,launch_256,19392, PASSED ,8.85006e-06,152.498,109.559,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,109.559,152.498 +Apps_LTIMES,Base_Seq,default,309696, PASSED ,0.00260021,8.28278,5.9552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,5.95087,8.27718 +Apps_LTIMES,Base_HIP,block_256,309696, PASSED ,0.000134703,159.885,114.955,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,117.922,164.02 +Apps_LTIMES,RAJA_HIP,kernel_256,309696, PASSED ,0.000165517,130.12,93.5542,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,95.1529,132.34 +Apps_LTIMES,RAJA_HIP,launch_256,309696, PASSED ,0.000137936,156.138,112.261,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,113.795,158.28 +Apps_LTIMES,Base_Seq,default,38784, PASSED ,0.00032191,8.38156,6.02404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,6.02263,8.37786 +Apps_LTIMES,Base_HIP,block_256,38784, PASSED 
,1.55319e-05,173.714,124.853,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,117.922,164.02 +Apps_LTIMES,RAJA_HIP,kernel_256,38784, PASSED ,1.89181e-05,142.62,102.505,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,95.3096,132.568 +Apps_LTIMES,RAJA_HIP,launch_256,38784, PASSED ,1.56875e-05,171.991,123.614,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,113.795,158.28 +Apps_LTIMES,Base_Seq,default,4992, PASSED ,4.00291e-05,8.70005,6.23547,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,6.10205,8.539705000000001 +Apps_LTIMES,Base_HIP,block_256,4992, PASSED ,3.75962e-06,92.6304,66.3897,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,87.92335,122.4932 +Apps_LTIMES,RAJA_HIP,kernel_256,4992, PASSED ,4.26784e-06,81.5998,58.4839,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,75.5878,105.3099 +Apps_LTIMES,RAJA_HIP,launch_256,4992, PASSED ,4.41364e-06,78.9043,56.552,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,83.0555,115.70115 +Apps_LTIMES,Base_Seq,default,619392, PASSED ,0.00524308,8.21518,5.90676,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,5.90676,8.21518 +Apps_LTIMES,Base_HIP,block_256,619392, PASSED 
,0.000264971,162.557,116.879,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,117.922,164.02 +Apps_LTIMES,RAJA_HIP,kernel_256,619392, PASSED ,0.000325472,132.34,95.1529,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,95.1529,132.34 +Apps_LTIMES,RAJA_HIP,launch_256,619392, PASSED ,0.000272731,157.932,113.554,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,113.795,158.28 +Apps_LTIMES,Base_Seq,default,77568, PASSED ,0.000643971,8.37786,6.02263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,6.0085,8.36339 +Apps_LTIMES,Base_HIP,block_256,77568, PASSED ,3.27858e-05,164.556,118.295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,117.922,164.02 +Apps_LTIMES,RAJA_HIP,kernel_256,77568, PASSED ,3.95277e-05,136.489,98.1186,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,95.3096,132.568 +Apps_LTIMES,RAJA_HIP,launch_256,77568, PASSED ,3.38882e-05,159.203,114.447,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,113.795,158.28 +Apps_MASS3DPA,Base_Seq,default,1600, PASSED ,1.14101e-05,5.201,11.1064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,11.1409,5.201 +Apps_MASS3DPA,Base_HIP,block_25,1600, PASSED 
,3.32562e-06,17.8445,38.1057,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_25,120.87,56.3896 +Apps_MASS3DPA,RAJA_HIP,block_25,1600, PASSED ,3.30442e-06,17.9589,38.3501,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_25,119.814,55.8969 +Apps_MASS3DPA,Base_Seq,default,1619008, PASSED ,0.011684,5.11364,10.9749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,11.0017,5.126145 +Apps_MASS3DPA,Base_HIP,block_25,1619008, PASSED ,0.00030745,194.333,417.077,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_25,429.6165,200.176 +Apps_MASS3DPA,RAJA_HIP,block_25,1619008, PASSED ,0.000305253,195.732,420.08,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_25,432.0245,201.298 +Apps_MASS3DPA,Base_Seq,default,202368, PASSED ,0.00143621,5.2001,11.1601,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,11.1052,5.17515 +Apps_MASS3DPA,Base_HIP,block_25,202368, PASSED ,3.63478e-05,205.471,440.966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_25,440.966,205.471 +Apps_MASS3DPA,RAJA_HIP,block_25,202368, PASSED ,3.61652e-05,206.508,443.193,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_25,443.193,206.508 +Apps_MASS3DPA,Base_Seq,default,2371584, PASSED 
,0.0171401,5.10618,10.9589,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,10.9749,5.11364 +Apps_MASS3DPA,Base_HIP,block_25,2371584, PASSED ,0.000452133,193.572,415.446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_25,417.077,194.333 +Apps_MASS3DPA,RAJA_HIP,block_25,2371584, PASSED ,0.00045328,193.082,414.395,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_25,420.08,195.732 +Apps_MASS3DPA,Base_Seq,default,25344, PASSED ,0.000180177,5.19259,11.1409,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,11.1409,5.19259 +Apps_MASS3DPA,Base_HIP,block_25,25344, PASSED ,9.69846e-06,96.4673,206.973,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_25,206.973,96.4673 +Apps_MASS3DPA,RAJA_HIP,block_25,25344, PASSED ,9.73108e-06,96.1439,206.28,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_25,206.28,96.1439 +Apps_MASS3DPA,Base_Seq,default,404736, PASSED ,0.00288824,5.17149,11.0989,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,11.0989,5.17149 +Apps_MASS3DPA,Base_HIP,block_25,404736, PASSED ,7.14611e-05,209.016,448.585,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_25,440.966,205.471 +Apps_MASS3DPA,RAJA_HIP,block_25,404736, PASSED 
,7.10115e-05,210.34,451.425,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_25,443.193,206.508 +Apps_MASS3DPA,Base_Seq,default,50624, PASSED ,0.000361054,5.17515,11.1052,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,11.1421,5.19259 +Apps_MASS3DPA,Base_HIP,block_25,50624, PASSED ,1.34799e-05,138.615,297.449,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_25,297.449,138.615 +Apps_MASS3DPA,RAJA_HIP,block_25,50624, PASSED ,1.34411e-05,139.015,298.307,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_25,298.307,139.015 +Apps_MASS3DPA,Base_Seq,default,6336, PASSED ,4.44523e-05,5.26676,11.2892,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,11.123650000000001,5.196795 +Apps_MASS3DPA,Base_HIP,block_25,6336, PASSED ,4.15182e-06,56.3896,120.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_25,163.9215,76.42845 +Apps_MASS3DPA,RAJA_HIP,block_25,6336, PASSED ,4.18842e-06,55.8969,119.814,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_25,163.047,76.0204 +Apps_MASS3DPA,Base_Seq,default,809536, PASSED ,0.00581382,5.13865,11.0285,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,11.0285,5.13865 +Apps_MASS3DPA,Base_HIP,block_25,809536, PASSED 
,0.000145012,206.019,442.156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_25,440.966,205.471 +Apps_MASS3DPA,RAJA_HIP,block_25,809536, PASSED ,0.00014442,206.864,443.969,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_25,443.193,206.508 +Apps_MASS3DPA,Base_Seq,default,101184, PASSED ,0.000719264,5.19191,11.1421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,11.1409,5.19191 +Apps_MASS3DPA,Base_HIP,block_25,101184, PASSED ,1.98101e-05,188.507,404.545,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_25,404.545,188.507 +Apps_MASS3DPA,RAJA_HIP,block_25,101184, PASSED ,1.98851e-05,187.797,403.019,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_25,403.019,187.797 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,64, PASSED ,7.776e-07,15.3687,4.36214,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.78551,14.2524 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,64, PASSED ,5.15474e-06,2.3184,0.658035,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,5.40414,15.9952 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,64, PASSED ,2.33242e-06,5.12375,1.45428,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,7.88968,23.3519 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,328509, PASSED 
,0.00917113,4.66426,1.89846,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,2.64246,6.5236149999999995 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,328509, PASSED ,0.000111003,385.364,156.851,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,164.7875,408.35 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,328509, PASSED ,0.000111162,384.811,156.627,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,164.5635,407.794 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,35937, PASSED ,0.000397252,12.1287,4.79459,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.64495,12.1287 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,35937, PASSED ,1.17467e-05,410.17,162.145,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,172.721,431.336 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,35937, PASSED ,1.15984e-05,415.415,164.218,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,172.5,430.777 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,493039, PASSED ,0.0138821,4.60877,1.88236,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,1.89846,4.66426 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,493039, PASSED 
,0.000184528,346.718,141.61,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,156.851,385.364 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,493039, PASSED ,0.000183998,347.717,142.018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,156.627,384.811 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,3375, PASSED ,3.73785e-05,12.9009,4.78551,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.78219,12.9009 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,3375, PASSED ,5.13613e-06,93.8871,34.8268,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,34.8268,93.8871 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,3375, PASSED ,3.25252e-06,148.259,54.9958,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,54.9958,148.259 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,79507, PASSED ,0.00102856,10.2309,4.09687,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.09687,10.2309 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,79507, PASSED ,2.43966e-05,431.336,172.724,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,172.721,431.336 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,79507, PASSED ,2.44283e-05,430.777,172.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,172.5,430.777 
+Apps_MATVEC_3D_STENCIL,Base_Seq,default,8000, PASSED ,9.12819e-05,12.1691,4.64495,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.78551,12.2763 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,8000, PASSED ,5.21364e-06,213.061,81.3251,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,81.3251,213.061 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,8000, PASSED ,3.29452e-06,337.173,128.699,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,128.699,337.173 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,512, PASSED ,5.63534e-06,14.2524,4.81533,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.71523,13.57665 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,512, PASSED ,5.02134e-06,15.9952,5.40414,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,20.11547,54.94115 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,512, PASSED ,3.43943e-06,23.3519,7.88968,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,31.44274,85.80545 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,157464, PASSED ,0.0024644,8.38297,3.38646,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,3.38646,8.38297 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,157464, PASSED 
,4.46316e-05,462.878,186.988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,162.145,410.17 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,157464, PASSED ,4.49968e-05,459.122,185.471,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,164.218,415.415 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,17576, PASSED ,0.000194791,12.2763,4.78219,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.78219,12.1691 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,17576, PASSED ,5.39324e-06,443.39,172.721,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,162.145,410.17 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,17576, PASSED ,5.07074e-06,471.59,183.707,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,164.218,415.415 +Basic_MULTI_REDUCE,Base_Seq,default,3120, PASSED ,9.75346e-06,4.78196,0.319886,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,0.311305,4.64252 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,3120, PASSED ,9.98628e-06,4.67047,0.312429,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,1.18832,17.7215 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,3120, PASSED ,1.00875e-05,4.62363,0.309295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,1.18345,17.6489 
+Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,3120, PASSED ,1.07345e-05,4.34494,0.290652,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,1.14044,17.0075 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,3120, PASSED ,1.08837e-05,4.28538,0.286668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,1.1159,16.6415 +Basic_MULTI_REDUCE,Base_Seq,default,3199995, PASSED ,0.0104146,4.57854,0.30726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.3073005,4.579155 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,3199995, PASSED ,0.000104195,457.638,30.7115,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,29.189149999999998,434.953 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,3199995, PASSED ,9.58552e-05,497.456,33.3836,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,32.2421,480.44550000000004 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,3199995, PASSED ,0.000115699,412.137,27.6579,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,26.8153,399.5825 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,3199995, PASSED ,9.6333e-05,494.989,33.218,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,32.0609,477.746 +Basic_MULTI_REDUCE,Base_Seq,default,399995, PASSED 
,0.00129921,4.5878,0.307875,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.307875,4.5878 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,399995, PASSED ,2.00181e-05,297.757,19.9816,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,19.9816,297.757 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,399995, PASSED ,1.99375e-05,298.961,20.0624,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,20.0624,298.961 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,399995, PASSED ,2.10783e-05,282.78,18.9766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,18.9766,282.78 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,399995, PASSED ,2.06653e-05,288.432,19.3558,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,19.3558,288.432 +Basic_MULTI_REDUCE,Base_Seq,default,4687495, PASSED ,0.0152572,4.57812,0.307232,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.30726,4.57854 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,4687495, PASSED ,0.000169427,412.268,27.6668,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,30.7115,457.638 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,4687495, PASSED 
,0.000150721,463.435,31.1006,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,33.3836,497.456 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,4687495, PASSED ,0.000189504,368.591,24.7356,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,27.6579,412.137 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,4687495, PASSED ,0.000150622,463.739,31.121,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,33.0008,491.753 +Basic_MULTI_REDUCE,Base_Seq,default,49995, PASSED ,0.000161997,4.59966,0.308616,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,0.308616,4.59966 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,49995, PASSED ,1.07981e-05,69.0062,4.63,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,4.63,69.0062 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,49995, PASSED ,1.07923e-05,69.0431,4.63248,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,4.63248,69.0431 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,49995, PASSED ,1.15151e-05,64.7093,4.3417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,4.3417,64.7093 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,49995, PASSED 
,1.18101e-05,63.0929,4.23325,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,4.23325,63.0929 +Basic_MULTI_REDUCE,Base_Seq,default,799995, PASSED ,0.00259959,4.58573,0.307739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.307739,4.58573 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,799995, PASSED ,2.92524e-05,407.522,27.348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,27.348,407.522 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,799995, PASSED ,2.9184e-05,408.478,27.4121,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,27.4121,408.478 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,799995, PASSED ,3.08014e-05,387.028,25.9727,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,25.9727,387.028 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,799995, PASSED ,2.99362e-05,398.214,26.7233,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,26.7233,398.214 +Basic_MULTI_REDUCE,Base_Seq,default,99995, PASSED ,0.000324521,4.59197,0.308131,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.308131,4.59197 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,99995, PASSED 
,1.20055e-05,124.126,8.3291,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,8.3291,124.126 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,99995, PASSED ,1.14005e-05,130.713,8.77114,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,8.77114,130.713 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,99995, PASSED ,1.27285e-05,117.075,7.856,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,7.856,117.075 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,99995, PASSED ,1.21023e-05,123.133,8.26249,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,8.26249,123.133 +Basic_MULTI_REDUCE,Base_Seq,default,12495, PASSED ,4.01375e-05,4.64252,0.311305,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,0.30996049999999997,4.621090000000001 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,12495, PASSED ,1.05149e-05,17.7215,1.18832,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,2.90916,43.36385 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,12495, PASSED ,1.05581e-05,17.6489,1.18345,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,2.907965,43.346 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,12495, PASSED 
,1.09563e-05,17.0075,1.14044,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,2.74107,40.8584 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,12495, PASSED ,1.11973e-05,16.6415,1.1159,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,2.674575,39.8672 +Basic_MULTI_REDUCE,Base_Seq,default,1599995, PASSED ,0.00520593,4.57977,0.307341,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.307341,4.57977 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,1599995, PASSED ,4.81451e-05,495.21,33.2328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,27.6668,412.268 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,1599995, PASSED ,4.78873e-05,497.876,33.4117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,31.1006,463.435 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,1599995, PASSED ,5.13857e-05,463.98,31.1369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,25.9727,387.028 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,1599995, PASSED ,4.84835e-05,491.753,33.0008,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,31.121,463.739 +Basic_MULTI_REDUCE,Base_Seq,default,199995, PASSED 
,0.000649353,4.58966,0.307991,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.307991,4.58966 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,199995, PASSED ,1.34511e-05,221.566,14.8683,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,14.8683,221.566 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,199995, PASSED ,1.24901e-05,238.614,16.0123,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,16.0123,238.614 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,199995, PASSED ,1.46049e-05,204.062,13.6937,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,13.6937,204.062 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,199995, PASSED ,1.37171e-05,217.27,14.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,14.58,217.27 +Basic_REDUCE_STRUCT,Base_Seq,default,3125, PASSED ,2.73462e-06,17.0284,2.28624,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,2.37181,17.671 +Basic_REDUCE_STRUCT,Base_Seq,kahan,3125, PASSED ,1.02981e-05,4.52183,0.607103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-kahan,0.614658,4.57919 +Basic_REDUCE_STRUCT,Base_Seq,cascade,3125, PASSED ,5.05764e-06,9.20709,1.23615,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26391,9.41668 
+Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,3125, PASSED ,1.90975e-05,2.43833,0.327372,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,0.731018,5.44607 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,3125, PASSED ,1.89425e-05,2.45828,0.330051,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,0.737782,5.49647 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,3125, PASSED ,2.29393e-05,2.02997,0.272545,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,1.051,7.82994 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,3125, PASSED ,1.91345e-05,2.43362,0.326739,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,0.876525,6.5301 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,3125, PASSED ,2.64364e-05,1.76144,0.236492,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,0.906626,6.75435 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,3125, PASSED ,2.29583e-05,2.02829,0.272319,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,1.06038,7.89981 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,3125, PASSED ,1.91847e-05,2.42725,0.325884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,0.863514,6.43316 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,3125, PASSED 
,2.68696e-05,1.73304,0.232679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,0.898597,6.69453 +Basic_REDUCE_STRUCT,Base_Seq,default,3200000, PASSED ,0.00278983,17.092,2.29405,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,2.3025700000000002,17.1555 +Basic_REDUCE_STRUCT,Base_Seq,kahan,3200000, PASSED ,0.0104282,4.57258,0.613722,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613861,4.57362 +Basic_REDUCE_STRUCT,Base_Seq,cascade,3200000, PASSED ,0.00510038,9.34906,1.25481,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-cascade,1.2552949999999998,9.35268 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,3200000, PASSED ,0.00616805,7.73076,1.03761,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.053255,7.8473299999999995 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,3200000, PASSED ,0.000184726,258.132,34.6459,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,28.969,215.836 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,3200000, PASSED ,0.000657996,72.468,9.7265,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,9.72215,72.4356 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,3200000, PASSED 
,0.000766404,62.2175,8.35069,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,8.365415,62.327200000000005 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,3200000, PASSED ,0.00106557,44.7497,6.0062,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,5.995845,44.67255 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,3200000, PASSED ,0.000123017,387.62,52.0255,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,50.49935,376.2495 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,3200000, PASSED ,0.000134688,354.03,47.5171,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,45.67345,340.2935 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,3200000, PASSED ,0.000135014,353.177,47.4026,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,44.6552,332.707 +Basic_REDUCE_STRUCT,Base_Seq,default,400000, PASSED ,0.000332584,17.9217,2.40541,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,2.39142,17.8173 +Basic_REDUCE_STRUCT,Base_Seq,kahan,400000, PASSED ,0.00129928,4.58753,0.615729,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615369,4.58483 +Basic_REDUCE_STRUCT,Base_Seq,cascade,400000, PASSED 
,0.000631813,9.43391,1.2662,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26333,9.41252 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,400000, PASSED ,0.000729383,8.17193,1.09682,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.04804,7.8085 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,400000, PASSED ,0.000113421,52.5516,7.05338,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,7.05338,52.5516 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,400000, PASSED ,9.62844e-05,61.9048,8.30874,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,8.30874,61.9048 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,400000, PASSED ,0.000109261,54.5527,7.32195,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,7.32195,54.5527 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,400000, PASSED ,0.000152918,38.9782,5.23158,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,5.23158,38.9782 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,400000, PASSED ,3.76461e-05,158.329,21.2506,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,21.2506,158.329 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,400000, PASSED 
,4.31967e-05,137.984,18.52,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,18.52,137.984 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,400000, PASSED ,4.95181e-05,120.369,16.1557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,16.1557,120.369 +Basic_REDUCE_STRUCT,Base_Seq,default,4687500, PASSED ,0.00408657,17.0924,2.2941,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,2.2941,17.0924 +Basic_REDUCE_STRUCT,Base_Seq,kahan,4687500, PASSED ,0.0152744,4.57297,0.613774,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613774,4.57297 +Basic_REDUCE_STRUCT,Base_Seq,cascade,4687500, PASSED ,0.00747505,9.34431,1.25417,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25481,9.34906 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,4687500, PASSED ,0.00808465,8.63973,1.15961,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.03761,7.73076 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,4687500, PASSED ,0.000247098,282.678,37.9404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,34.6459,258.132 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,4687500, PASSED 
,0.000956887,72.9963,9.7974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,9.7265,72.468 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,4687500, PASSED ,0.00111872,62.4369,8.38014,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,8.38014,62.4369 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,4687500, PASSED ,0.00154463,45.2207,6.06943,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,6.0062,44.7497 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,4687500, PASSED ,0.000178226,391.914,52.6018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,52.0255,387.62 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,4687500, PASSED ,0.000190922,365.851,49.1038,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,47.5171,354.03 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,4687500, PASSED ,0.000189367,368.856,49.507,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,47.4026,353.177 +Basic_REDUCE_STRUCT,Base_Seq,default,50000, PASSED ,4.21627e-05,17.671,2.37181,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,2.39142,17.8173 +Basic_REDUCE_STRUCT,Base_Seq,kahan,50000, PASSED 
,0.000162529,4.58415,0.615287,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615287,4.58415 +Basic_REDUCE_STRUCT,Base_Seq,cascade,50000, PASSED ,7.91211e-05,9.41668,1.26391,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26333,9.41252 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,50000, PASSED ,0.000105269,7.07765,0.949965,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,0.949965,7.07765 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,50000, PASSED ,0.000104101,7.15708,0.960626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,0.960626,7.15708 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,50000, PASSED ,2.70728e-05,27.5206,3.69382,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,3.69382,27.5206 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,50000, PASSED ,3.2259e-05,23.0961,3.09997,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,3.09997,23.0961 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,50000, PASSED ,3.66256e-05,20.3425,2.73038,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,2.73038,20.3425 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,50000, PASSED 
,2.69692e-05,27.6263,3.70801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,3.70801,27.6263 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,50000, PASSED ,3.26454e-05,22.8227,3.06328,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,3.06328,22.8227 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,50000, PASSED ,3.68006e-05,20.2458,2.7174,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,2.7174,20.2458 +Basic_REDUCE_STRUCT,Base_Seq,default,800000, PASSED ,0.000670746,17.7726,2.3854,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,2.3854,17.7726 +Basic_REDUCE_STRUCT,Base_Seq,kahan,800000, PASSED ,0.00260007,4.58485,0.615369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615369,4.58483 +Basic_REDUCE_STRUCT,Base_Seq,cascade,800000, PASSED ,0.00126649,9.41254,1.26333,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26333,9.41252 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,800000, PASSED ,0.00149687,7.9639,1.0689,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.04804,7.8085 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,800000, PASSED ,0.000127232,93.6942,12.5754,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,12.5754,93.6942 
+Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,800000, PASSED ,0.000175058,68.097,9.13983,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,9.13983,68.097 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,800000, PASSED ,0.00020134,59.208,7.94678,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,7.94678,59.208 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,800000, PASSED ,0.000283312,42.077,5.64748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,5.64748,42.077 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,800000, PASSED ,4.65349e-05,256.172,34.3828,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,34.3828,256.172 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,800000, PASSED ,5.30948e-05,224.522,30.1348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,30.1348,224.522 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,800000, PASSED ,5.91812e-05,201.431,27.0357,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,27.0357,201.431 +Basic_REDUCE_STRUCT,Base_Seq,default,100000, PASSED ,8.36332e-05,17.8173,2.39142,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,2.39351,17.833 +Basic_REDUCE_STRUCT,Base_Seq,kahan,100000, PASSED 
,0.000325051,4.58426,0.615295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615295,4.58426 +Basic_REDUCE_STRUCT,Base_Seq,cascade,100000, PASSED ,0.000158334,9.4112,1.26316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26391,9.41668 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,100000, PASSED ,0.000203711,7.31487,0.981795,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,0.981795,7.31487 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,100000, PASSED ,0.00010257,14.5278,1.94991,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,1.94991,14.5278 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,100000, PASSED ,3.68052e-05,40.4865,5.43406,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,5.43406,40.4865 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,100000, PASSED ,4.26279e-05,34.9564,4.69181,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,4.69181,34.9564 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,100000, PASSED ,5.37996e-05,27.6976,3.71754,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.71754,27.6976 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,100000, PASSED 
,2.76564e-05,53.8797,7.23168,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,7.23168,53.8797 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,100000, PASSED ,3.3627e-05,44.3131,5.94766,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,5.94766,44.3131 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,100000, PASSED ,4.17289e-05,35.7095,4.79289,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,4.79289,35.7095 +Basic_REDUCE_STRUCT,Base_Seq,default,12500, PASSED ,1.03141e-05,18.0593,2.42407,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,2.381615,17.744149999999998 +Basic_REDUCE_STRUCT,Base_Seq,kahan,12500, PASSED ,4.06763e-05,4.57919,0.614658,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-kahan,0.6149725,4.58167 +Basic_REDUCE_STRUCT,Base_Seq,cascade,12500, PASSED ,1.96435e-05,9.48223,1.27278,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-cascade,1.263535,9.41394 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,12500, PASSED ,3.42016e-05,5.44607,0.731018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,0.8404915,6.26186 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,12500, PASSED 
,3.3888e-05,5.49647,0.737782,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,0.8492040000000001,6.326775 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,12500, PASSED ,2.37887e-05,7.82994,1.051,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,2.37241,17.67527 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,12500, PASSED ,2.8524e-05,6.5301,0.876525,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,1.9882475,14.8131 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,12500, PASSED ,2.7577e-05,6.75435,0.906626,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,1.818503,13.548425 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,12500, PASSED ,2.35784e-05,7.89981,1.06038,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,2.384195,17.763055 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,12500, PASSED ,2.89538e-05,6.43316,0.863514,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,1.9633969999999998,14.627930000000001 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,12500, PASSED ,2.78234e-05,6.69453,0.898597,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,1.8079985,13.470165 +Basic_REDUCE_STRUCT,Base_Seq,default,1600000, PASSED 
,0.00138466,17.2186,2.31104,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,2.31104,17.2186 +Basic_REDUCE_STRUCT,Base_Seq,kahan,1600000, PASSED ,0.00521217,4.57427,0.613948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613948,4.57427 +Basic_REDUCE_STRUCT,Base_Seq,cascade,1600000, PASSED ,0.00254821,9.3563,1.25578,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25578,9.3563 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,1600000, PASSED ,0.00309166,7.71168,1.03504,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.0689,7.9639 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,1600000, PASSED ,0.000137386,173.54,23.2921,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,23.2921,173.54 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,1600000, PASSED ,0.000329293,72.4032,9.7178,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,9.7178,72.4032 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,1600000, PASSED ,0.000378012,63.0717,8.46535,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,8.35069,62.2175 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,1600000, PASSED 
,0.000534626,44.5954,5.98549,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,5.98549,44.5954 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,1600000, PASSED ,6.53418e-05,364.879,48.9732,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,48.9732,364.879 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,1600000, PASSED ,7.30097e-05,326.557,43.8298,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,43.8298,326.557 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,1600000, PASSED ,7.63581e-05,312.237,41.9078,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,41.9078,312.237 +Basic_REDUCE_STRUCT,Base_Seq,default,200000, PASSED ,0.000167119,17.833,2.39351,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,2.39142,17.8173 +Basic_REDUCE_STRUCT,Base_Seq,kahan,200000, PASSED ,0.00065002,4.58483,0.615369,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615369,4.58483 +Basic_REDUCE_STRUCT,Base_Seq,cascade,200000, PASSED ,0.000316624,9.41252,1.26333,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26333,9.41254 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,200000, PASSED 
,0.000381665,7.8085,1.04804,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.04804,7.8085 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,200000, PASSED ,0.000103741,28.7275,3.85576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,3.85576,28.7275 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,200000, PASSED ,5.41124e-05,55.0749,7.39206,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,7.39206,55.0749 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,200000, PASSED ,6.13572e-05,48.5718,6.51923,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,6.51923,48.5718 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,200000, PASSED ,8.93898e-05,33.3397,4.47481,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,4.47481,33.3397 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,200000, PASSED ,2.97842e-05,100.061,13.43,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,13.43,100.061 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,200000, PASSED ,3.49464e-05,85.28,11.4461,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,11.4461,85.28 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,200000, PASSED 
,4.34719e-05,68.5554,9.2014,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-CPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,9.2014,68.5554 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_CONVECTION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_CONVECTION3DPA.csv new file mode 100644 index 0000000..2b506c0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_CONVECTION3DPA.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +702,33.9132,129.201,13.0552,13.5986,33.022,120.606,18.8242,71.4457,7.24657,7.51252,18.3296,66.6931 +2754,129.201,206.85000000000002,13.9866,13.326899999999998,120.606,198.5285,71.4457,114.30834999999999,7.73436,7.379545,66.6931,109.70904999999999 +10989,284.499,284.499,13.5986,13.0552,276.451,276.451,157.171,157.171,7.51252,7.24657,152.725,152.725 +21951,358.542,358.542,12.7519,12.7519,350.353,350.353,198.044,198.044,7.04361,7.04361,193.521,193.521 +43902,403.844,403.844,11.8994,12.6488,399.054,399.054,223.049,223.049,6.57224,6.98584,220.403,220.403 +87804,419.452,418.491,12.6488,11.8994,422.306,413.332,231.66,231.122,6.98584,6.57224,233.236,228.273 +175608,427.354,418.491,9.60028,9.60028,428.722,413.332,236.02,231.122,5.30205,5.30205,236.775,228.273 +351216,418.491,418.491,4.4893,4.4893,413.332,413.332,231.122,231.122,2.47933,2.47933,228.273,228.273 +702459,377.694,398.0925,3.90513,4.197215,376.316,394.82399999999996,208.59,219.856,2.15669,2.31801,207.829,218.051 
+1028970,369.525,377.694,3.72818,3.90513,370.892,376.316,204.078,208.59,2.05897,2.15669,204.833,207.829 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv new file mode 100644 index 0000000..b8b3267 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +841,15.152,72.5329,8.22518,8.30676,22.0669,98.7272,13.1301,61.3475,7.12761,7.05094,19.1223,83.5024 +3844,72.5329,188.07595,8.33653,8.28627,98.7272,207.7411,61.3475,157.68325,7.05094,7.00034,83.5024,174.2557 +15876,303.619,303.619,8.30676,8.27772,316.755,316.755,254.019,254.019,6.94974,6.94974,265.009,265.009 +32400,461.341,443.204,8.26578,8.30676,464.451,456.381,384.755,368.256,6.89359,6.90546,387.348,379.205 +65025,567.185,461.341,8.27772,8.27772,560.843,464.451,471.999,384.755,6.88855,6.89359,466.722,387.348 +131044,443.204,492.316,8.31087,8.26578,456.381,479.759,368.256,408.618,6.90546,6.88855,379.205,398.196 +264196,492.316,492.316,8.21252,8.21252,479.759,479.759,408.618,408.618,6.81632,6.81632,398.196,398.196 +528529,520.767,443.204,8.15367,8.16448,514.063,456.381,431.904,368.256,6.76234,6.76766,426.344,379.205 +1060900,440.119,466.2175,8.16448,8.159075,447.863,463.81100000000004,364.821,386.71950000000004,6.76766,6.765000000000001,371.24,384.718 +1555009,420.319,440.119,8.08762,8.15367,415.82,447.863,348.33,364.821,6.70243,6.76234,344.602,371.24 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_INTSC_HEXHEX.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_INTSC_HEXHEX.csv new file mode 100644 index 0000000..b5b8e2c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_INTSC_HEXHEX.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +27,2.8229,2.8229,3.51739,3.53797,4.97069,4.97069,0.0608571,0.0608571,0.0758293,0.0762729,0.10716,0.10716 +64,2.8051,2.974805,3.53797,3.54711,4.89231,5.198375,0.0604735,0.064132,0.0762729,0.07647000000000001,0.10547,0.1120685 +216,3.12671,3.12671,3.55625,3.55625,5.42606,5.42606,0.0674069,0.0674069,0.0766671,0.0766671,0.116977,0.116977 +512,3.26604,3.26604,3.5674,3.5674,5.66495,5.66495,0.0704105,0.0704105,0.0769074,0.0769074,0.122127,0.122127 +1000,3.32428,3.32428,3.57242,3.5674,5.84976,5.84976,0.0716662,0.0716662,0.0770157,0.0769074,0.126111,0.126111 +1728,3.33601,3.33601,3.56954,3.5674,6.06665,6.06665,0.071919,0.071919,0.0769536,0.0769074,0.130787,0.130787 +3375,3.34073,3.34073,3.55323,3.55404,6.18593,6.18593,0.0720209,0.0720209,0.0766019,0.0766193,0.133359,0.133359 +6859,3.34163,3.34163,3.5539,3.55404,6.29694,6.29694,0.0720402,0.0720402,0.0766165,0.0766193,0.135752,0.135752 +13824,3.38547,3.36355,3.55404,3.55397,6.33743,6.317185,0.0729852,0.0725127,0.0766193,0.0766179,0.136625,0.1361885 +19683,3.4072,3.38547,3.55916,3.55404,6.34898,6.33743,0.0734538,0.0729852,0.0767298,0.0766193,0.136874,0.136625 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_LTIMES.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_LTIMES.csv new file mode 100644 index 0000000..ad279a2 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_LTIMES.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-kernel_256 (raw),RAJA_HIP-kernel_256 (smoothed),RAJA_HIP-launch_256 (raw),RAJA_HIP-launch_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-kernel_256 (raw B/W),RAJA_HIP-kernel_256 (smoothed B/W),RAJA_HIP-launch_256 (raw B/W),RAJA_HIP-launch_256 (smoothed B/W) +1344,21.8706,66.3897,6.18006,6.18006,21.7446,58.4839,16.1413,56.552,30.7808,92.6304,8.69785,8.69785,30.6035,81.5998,22.7173,78.9043 +4992,66.3897,87.92335,6.23547,6.10205,58.4839,75.5878,56.552,83.0555,92.6304,122.4932,8.70005,8.539705000000001,81.5998,105.3099,78.9043,115.70115 +19392,109.457,109.457,6.0085,6.02404,92.6917,92.6917,109.559,109.559,152.356,152.356,8.36339,8.38156,129.02,129.02,152.498,152.498 +38784,124.853,117.922,6.02404,6.02263,102.505,95.3096,123.614,113.795,173.714,164.02,8.38156,8.37786,142.62,132.568,171.991,158.28 +77568,118.295,117.922,6.02263,6.0085,98.1186,95.3096,114.447,113.795,164.556,164.02,8.37786,8.36339,136.489,132.568,159.203,158.28 +154944,117.922,117.922,5.95087,5.9552,95.3096,95.3096,113.795,113.795,164.02,164.02,8.27718,8.28278,132.568,132.568,158.28,158.28 +309696,114.955,117.922,5.9552,5.95087,93.5542,95.1529,112.261,113.795,159.885,164.02,8.28278,8.27718,130.12,132.34,156.138,158.28 +619392,116.879,117.922,5.90676,5.90676,95.1529,95.1529,113.554,113.795,162.557,164.02,8.21518,8.21518,132.34,132.34,157.932,158.28 +1238784,118.942,117.8175,5.8478,5.877280000000001,93.4727,94.35355,115.323,114.4385,165.423,163.861,8.13308,8.17413,130.001,131.23000000000002,160.391,159.1615 
+1814592,118.756,118.756,5.84722,5.8478,95.7286,95.1529,116.064,115.323,165.165,165.165,8.13223,8.13308,133.138,132.34,161.421,160.391 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_MASS3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_MASS3DPA.csv new file mode 100644 index 0000000..3f58163 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_MASS3DPA.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_25 (raw),Base_HIP-block_25 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_25 (raw),RAJA_HIP-block_25 (smoothed),Base_HIP-block_25 (raw B/W),Base_HIP-block_25 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_25 (raw B/W),RAJA_HIP-block_25 (smoothed B/W) +1600,38.1057,120.87,11.1064,11.1409,38.3501,119.814,17.8445,56.3896,5.201,5.201,17.9589,55.8969 +6336,120.87,163.9215,11.2892,11.123650000000001,119.814,163.047,56.3896,76.42845,5.26676,5.196795,55.8969,76.0204 +25344,206.973,206.973,11.1409,11.1409,206.28,206.28,96.4673,96.4673,5.19259,5.19259,96.1439,96.1439 +50624,297.449,297.449,11.1052,11.1421,298.307,298.307,138.615,138.615,5.17515,5.19259,139.015,139.015 +101184,404.545,404.545,11.1421,11.1409,403.019,403.019,188.507,188.507,5.19191,5.19191,187.797,187.797 +202368,440.966,440.966,11.1601,11.1052,443.193,443.193,205.471,205.471,5.2001,5.17515,206.508,206.508 +404736,448.585,440.966,11.0989,11.0989,451.425,443.193,209.016,205.471,5.17149,5.17149,210.34,206.508 +809536,442.156,440.966,11.0285,11.0285,443.969,443.193,206.019,205.471,5.13865,5.13865,206.864,206.508 +1619008,417.077,429.6165,10.9749,11.0017,420.08,432.0245,194.333,200.176,5.11364,5.126145,195.732,201.298 +2371584,415.446,417.077,10.9589,10.9749,414.395,420.08,193.572,194.333,5.10618,5.11364,193.082,195.732 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv new file mode 100644 index 0000000..8146da0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +64,0.658035,5.40414,4.36214,4.78551,1.45428,7.88968,2.3184,15.9952,15.3687,14.2524,5.12375,23.3519 +512,5.40414,20.11547,4.81533,4.71523,7.88968,31.44274,15.9952,54.94115,14.2524,13.57665,23.3519,85.80545 +3375,34.8268,34.8268,4.78551,4.78219,54.9958,54.9958,93.8871,93.8871,12.9009,12.9009,148.259,148.259 +8000,81.3251,81.3251,4.64495,4.78551,128.699,128.699,213.061,213.061,12.1691,12.2763,337.173,337.173 +17576,172.721,162.145,4.78219,4.78219,183.707,164.218,443.39,410.17,12.2763,12.1691,471.59,415.415 +35937,162.145,172.721,4.79459,4.64495,164.218,172.5,410.17,431.336,12.1287,12.1287,415.415,430.777 +79507,172.724,172.721,4.09687,4.09687,172.5,172.5,431.336,431.336,10.2309,10.2309,430.777,430.777 +157464,186.988,162.145,3.38646,3.38646,185.471,164.218,462.878,410.17,8.38297,8.38297,459.122,415.415 +328509,156.851,164.7875,1.89846,2.64246,156.627,164.5635,385.364,408.35,4.66426,6.5236149999999995,384.811,407.794 +493039,141.61,156.851,1.88236,1.89846,142.018,156.627,346.718,385.364,4.60877,4.66426,347.717,384.811 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv new file mode 100644 index 0000000..84b204c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +80000,0.0,0.0,0.0,0.0,0.0,0.0,146.085,217.801,14.1788,10.9567,143.168,220.631 +160000,0.0,0.0,0.0,0.0,0.0,0.0,217.801,265.113,10.9567,10.7283,220.631,268.6225 +320000,0.0,0.0,0.0,0.0,0.0,0.0,312.425,312.425,10.4999,10.4999,316.614,316.614 +640000,0.0,0.0,0.0,0.0,0.0,0.0,374.327,374.327,10.3092,10.3092,379.045,379.045 +1280000,0.0,0.0,0.0,0.0,0.0,0.0,443.779,443.779,9.50777,9.50777,440.75,440.75 +2560000,0.0,0.0,0.0,0.0,0.0,0.0,466.897,466.897,9.23769,9.23769,466.256,466.256 +3750000,0.0,0.0,0.0,0.0,0.0,0.0,481.583,466.897,9.13207,9.13207,484.242,466.256 +5120000,0.0,0.0,0.0,0.0,0.0,0.0,473.886,466.897,9.06123,9.06123,474.695,466.256 +7500000,0.0,0.0,0.0,0.0,0.0,0.0,452.468,463.177,9.01723,9.03923,451.012,462.8535 +10000000,0.0,0.0,0.0,0.0,0.0,0.0,449.537,452.468,8.99193,9.01723,447.195,451.012 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_MULTI_REDUCE.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_MULTI_REDUCE.csv new file mode 100644 index 0000000..f3b9f03 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_MULTI_REDUCE.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-atomic_direct_256 (raw),Base_HIP-atomic_direct_256 (smoothed),Base_HIP-atomic_occgs_256 
(raw),Base_HIP-atomic_occgs_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-atomic_direct_256 (raw),RAJA_HIP-atomic_direct_256 (smoothed),RAJA_HIP-atomic_occgs_256 (raw),RAJA_HIP-atomic_occgs_256 (smoothed),Base_HIP-atomic_direct_256 (raw B/W),Base_HIP-atomic_direct_256 (smoothed B/W),Base_HIP-atomic_occgs_256 (raw B/W),Base_HIP-atomic_occgs_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-atomic_direct_256 (raw B/W),RAJA_HIP-atomic_direct_256 (smoothed B/W),RAJA_HIP-atomic_occgs_256 (raw B/W),RAJA_HIP-atomic_occgs_256 (smoothed B/W) +3120,0.312429,1.18832,0.309295,1.18345,0.319886,0.311305,0.290652,1.14044,0.286668,1.1159,4.67047,17.7215,4.62363,17.6489,4.78196,4.64252,4.34494,17.0075,4.28538,16.6415 +12495,1.18832,2.90916,1.18345,2.907965,0.311305,0.30996049999999997,1.14044,2.74107,1.1159,2.674575,17.7215,43.36385,17.6489,43.346,4.64252,4.621090000000001,17.0075,40.8584,16.6415,39.8672 +49995,4.63,4.63,4.63248,4.63248,0.308616,0.308616,4.3417,4.3417,4.23325,4.23325,69.0062,69.0062,69.0431,69.0431,4.59966,4.59966,64.7093,64.7093,63.0929,63.0929 +99995,8.3291,8.3291,8.77114,8.77114,0.308131,0.308131,7.856,7.856,8.26249,8.26249,124.126,124.126,130.713,130.713,4.59197,4.59197,117.075,117.075,123.133,123.133 +199995,14.8683,14.8683,16.0123,16.0123,0.307991,0.307991,13.6937,13.6937,14.58,14.58,221.566,221.566,238.614,238.614,4.58966,4.58966,204.062,204.062,217.27,217.27 +399995,19.9816,19.9816,20.0624,20.0624,0.307875,0.307875,18.9766,18.9766,19.3558,19.3558,297.757,297.757,298.961,298.961,4.5878,4.5878,282.78,282.78,288.432,288.432 +799995,27.348,27.348,27.4121,27.4121,0.307739,0.307739,25.9727,25.9727,26.7233,26.7233,407.522,407.522,408.478,408.478,4.58573,4.58573,387.028,387.028,398.214,398.214 +1599995,33.2328,27.6668,33.4117,31.1006,0.307341,0.307341,31.1369,25.9727,33.0008,31.121,495.21,412.268,497.876,463.435,4.57977,4.57977,463.98,387.028,491.753,463.739 
+3199995,30.7115,29.189149999999998,33.3836,32.2421,0.30726,0.3073005,27.6579,26.8153,33.218,32.0609,457.638,434.953,497.456,480.44550000000004,4.57854,4.579155,412.137,399.5825,494.989,477.746 +4687495,27.6668,30.7115,31.1006,33.3836,0.307232,0.30726,24.7356,27.6579,31.121,33.0008,412.268,457.638,463.435,497.456,4.57812,4.57854,368.591,412.137,463.739,491.753 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_REDUCE_STRUCT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_REDUCE_STRUCT.csv new file mode 100644 index 0000000..b0b3648 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Basic_REDUCE_STRUCT.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-blkatm_direct_256 (raw),Base_HIP-blkatm_direct_256 (smoothed),Base_HIP-blkatm_occgs_256 (raw),Base_HIP-blkatm_occgs_256 (smoothed),Base_Seq-cascade (raw),Base_Seq-cascade (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),Base_Seq-kahan (raw),Base_Seq-kahan (smoothed),RAJA_HIP-blkatm_direct_256 (raw),RAJA_HIP-blkatm_direct_256 (smoothed),RAJA_HIP-blkatm_occgs_256 (raw),RAJA_HIP-blkatm_occgs_256 (smoothed),RAJA_HIP-blkdev_direct_256 (raw),RAJA_HIP-blkdev_direct_256 (smoothed),RAJA_HIP-blkdev_direct_new_256 (raw),RAJA_HIP-blkdev_direct_new_256 (smoothed),RAJA_HIP-blkdev_occgs_256 (raw),RAJA_HIP-blkdev_occgs_256 (smoothed),RAJA_HIP-blkdev_occgs_new_256 (raw),RAJA_HIP-blkdev_occgs_new_256 (smoothed),Base_HIP-blkatm_direct_256 (raw B/W),Base_HIP-blkatm_direct_256 (smoothed B/W),Base_HIP-blkatm_occgs_256 (raw B/W),Base_HIP-blkatm_occgs_256 (smoothed B/W),Base_Seq-cascade (raw B/W),Base_Seq-cascade (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),Base_Seq-kahan (raw B/W),Base_Seq-kahan (smoothed B/W),RAJA_HIP-blkatm_direct_256 (raw B/W),RAJA_HIP-blkatm_direct_256 (smoothed B/W),RAJA_HIP-blkatm_occgs_256 (raw B/W),RAJA_HIP-blkatm_occgs_256 (smoothed 
B/W),RAJA_HIP-blkdev_direct_256 (raw B/W),RAJA_HIP-blkdev_direct_256 (smoothed B/W),RAJA_HIP-blkdev_direct_new_256 (raw B/W),RAJA_HIP-blkdev_direct_new_256 (smoothed B/W),RAJA_HIP-blkdev_occgs_256 (raw B/W),RAJA_HIP-blkdev_occgs_256 (smoothed B/W),RAJA_HIP-blkdev_occgs_new_256 (raw B/W),RAJA_HIP-blkdev_occgs_new_256 (smoothed B/W) +3125,0.327372,0.731018,0.330051,0.737782,1.23615,1.26391,2.28624,2.37181,0.607103,0.614658,0.272545,1.051,0.272319,1.06038,0.326739,0.876525,0.236492,0.906626,0.325884,0.863514,0.232679,0.898597,2.43833,5.44607,2.45828,5.49647,9.20709,9.41668,17.0284,17.671,4.52183,4.57919,2.02997,7.82994,2.02829,7.89981,2.43362,6.5301,1.76144,6.75435,2.42725,6.43316,1.73304,6.69453 +12500,0.731018,0.8404915,0.737782,0.8492040000000001,1.27278,1.263535,2.42407,2.381615,0.614658,0.6149725,1.051,2.37241,1.06038,2.384195,0.876525,1.9882475,0.906626,1.818503,0.863514,1.9633969999999998,0.898597,1.8079985,5.44607,6.26186,5.49647,6.326775,9.48223,9.41394,18.0593,17.744149999999998,4.57919,4.58167,7.82994,17.67527,7.89981,17.763055,6.5301,14.8131,6.75435,13.548425,6.43316,14.627930000000001,6.69453,13.470165 +50000,0.949965,0.949965,0.960626,0.960626,1.26391,1.26333,2.37181,2.39142,0.615287,0.615287,3.69382,3.69382,3.70801,3.70801,3.09997,3.09997,2.73038,2.73038,3.06328,3.06328,2.7174,2.7174,7.07765,7.07765,7.15708,7.15708,9.41668,9.41252,17.671,17.8173,4.58415,4.58415,27.5206,27.5206,27.6263,27.6263,23.0961,23.0961,20.3425,20.3425,22.8227,22.8227,20.2458,20.2458 +100000,0.981795,0.981795,1.94991,1.94991,1.26316,1.26391,2.39142,2.39351,0.615295,0.615295,5.43406,5.43406,7.23168,7.23168,4.69181,4.69181,3.71754,3.71754,5.94766,5.94766,4.79289,4.79289,7.31487,7.31487,14.5278,14.5278,9.4112,9.41668,17.8173,17.833,4.58426,4.58426,40.4865,40.4865,53.8797,53.8797,34.9564,34.9564,27.6976,27.6976,44.3131,44.3131,35.7095,35.7095 
+200000,1.04804,1.04804,3.85576,3.85576,1.26333,1.26333,2.39351,2.39142,0.615369,0.615369,7.39206,7.39206,13.43,13.43,6.51923,6.51923,4.47481,4.47481,11.4461,11.4461,9.2014,9.2014,7.8085,7.8085,28.7275,28.7275,9.41252,9.41254,17.833,17.8173,4.58483,4.58483,55.0749,55.0749,100.061,100.061,48.5718,48.5718,33.3397,33.3397,85.28,85.28,68.5554,68.5554 +400000,1.09682,1.04804,7.05338,7.05338,1.2662,1.26333,2.40541,2.39142,0.615729,0.615369,8.30874,8.30874,21.2506,21.2506,7.32195,7.32195,5.23158,5.23158,18.52,18.52,16.1557,16.1557,8.17193,7.8085,52.5516,52.5516,9.43391,9.41252,17.9217,17.8173,4.58753,4.58483,61.9048,61.9048,158.329,158.329,54.5527,54.5527,38.9782,38.9782,137.984,137.984,120.369,120.369 +800000,1.0689,1.04804,12.5754,12.5754,1.26333,1.26333,2.3854,2.3854,0.615369,0.615369,9.13983,9.13983,34.3828,34.3828,7.94678,7.94678,5.64748,5.64748,30.1348,30.1348,27.0357,27.0357,7.9639,7.8085,93.6942,93.6942,9.41254,9.41252,17.7726,17.7726,4.58485,4.58483,68.097,68.097,256.172,256.172,59.208,59.208,42.077,42.077,224.522,224.522,201.431,201.431 +1600000,1.03504,1.0689,23.2921,23.2921,1.25578,1.25578,2.31104,2.31104,0.613948,0.613948,9.7178,9.7178,48.9732,48.9732,8.46535,8.35069,5.98549,5.98549,43.8298,43.8298,41.9078,41.9078,7.71168,7.9639,173.54,173.54,9.3563,9.3563,17.2186,17.2186,4.57427,4.57427,72.4032,72.4032,364.879,364.879,63.0717,62.2175,44.5954,44.5954,326.557,326.557,312.237,312.237 +3200000,1.03761,1.053255,34.6459,28.969,1.25481,1.2552949999999998,2.29405,2.3025700000000002,0.613722,0.613861,9.7265,9.72215,52.0255,50.49935,8.35069,8.365415,6.0062,5.995845,47.5171,45.67345,47.4026,44.6552,7.73076,7.8473299999999995,258.132,215.836,9.34906,9.35268,17.092,17.1555,4.57258,4.57362,72.468,72.4356,387.62,376.2495,62.2175,62.327200000000005,44.7497,44.67255,354.03,340.2935,353.177,332.707 
+4687500,1.15961,1.03761,37.9404,34.6459,1.25417,1.25481,2.2941,2.2941,0.613774,0.613774,9.7974,9.7265,52.6018,52.0255,8.38014,8.38014,6.06943,6.0062,49.1038,47.5171,49.507,47.4026,8.63973,7.73076,282.678,258.132,9.34431,9.34906,17.0924,17.0924,4.57297,4.57297,72.9963,72.468,391.914,387.62,62.4369,62.4369,45.2207,44.7497,365.851,354.03,368.856,353.177 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv new file mode 100644 index 0000000..4892df0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-CPX/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv @@ -0,0 +1,11 @@ +Problem size,Base_HIP-direct_1024 (raw),Base_HIP-direct_1024 (smoothed),Base_Seq-direct (raw),Base_Seq-direct (smoothed),RAJA_HIP-direct_1024 (raw),RAJA_HIP-direct_1024 (smoothed),RAJA_HIP-funcptr_1024 (raw),RAJA_HIP-funcptr_1024 (smoothed),RAJA_HIP-virtfunc_1024 (raw),RAJA_HIP-virtfunc_1024 (smoothed),Base_HIP-direct_1024 (raw B/W),Base_HIP-direct_1024 (smoothed B/W),Base_Seq-direct (raw B/W),Base_Seq-direct (smoothed B/W),RAJA_HIP-direct_1024 (raw B/W),RAJA_HIP-direct_1024 (smoothed B/W),RAJA_HIP-funcptr_1024 (raw B/W),RAJA_HIP-funcptr_1024 (smoothed B/W),RAJA_HIP-virtfunc_1024 (raw B/W),RAJA_HIP-virtfunc_1024 (smoothed B/W) +42875,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,35.5465,52.7123,34.2866,31.4224,28.3649,43.3236,30.9433,46.2492,29.0926,44.3283 +91125,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,52.7123,64.59955,30.6163,31.01935,43.3236,54.53655,46.2492,57.23955,44.3283,54.9759 +205379,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,76.4868,76.4868,31.4224,30.6163,65.7495,65.7495,68.2299,68.2299,65.6235,65.6235 +421875,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,116.949,116.949,29.4222,29.4222,99.173,99.173,103.677,103.677,98.5,98.5 
+884736,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,127.604,127.604,26.5345,26.5345,139.893,139.893,142.861,142.861,133.87,133.87 +1860867,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,196.573,196.573,16.5543,16.5543,180.069,180.069,177.742,177.742,165.402,165.402 +2744000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,207.767,199.269,12.0213,12.0213,194.723,192.515,189.791,187.563,177.557,177.557 +3796416,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,223.313,205.182,9.34983,9.34983,209.559,194.723,204.866,187.563,191.745,177.557 +5639752,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,199.269,206.47449999999998,7.45299,8.40141,192.515,197.2725,187.563,188.677,180.556,179.0565 +7645373,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,205.182,205.182,7.23912,7.45299,199.822,199.822,182.713,187.563,173.613,180.556 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..0472874 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1377,28.7189,7.70152,28.068 +5508,112.498,7.72835,108.853 +21951,432.487,6.7051,414.952 +43902,638.329,7.06895,642.371 +87804,862.391,7.07049,840.882 +175608,1030.27,7.0633,1013.18 +351216,1191.32,5.41833,1192.82 +702459,1354.4,2.6375,1350.19 +1404891,1313.69,2.17096,1305.6 +2057940,1307.01,2.1129,1306.44 +2809755,1265.12,2.08775,1250.38 +4115853,1253.27,2.04849,1256.74 +5487804,1224.11,2.06502,1218.09 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..e78e00c --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1377,112.498,7.70152,108.853 +5508,272.4925,7.385235,261.9025 +21951,432.487,7.07049,414.952 +43902,638.329,7.06895,642.371 +87804,862.391,7.0633,840.882 +175608,1030.27,7.0633,1013.18 +351216,1191.32,5.41833,1192.82 +702459,1307.01,2.6375,1305.6 +1404891,1307.01,2.17096,1305.6 +2057940,1307.01,2.1129,1305.6 +2809755,1265.12,2.08775,1256.74 +4115853,1259.195,2.076385,1253.56 +5487804,1253.27,2.06502,1250.38 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_flops_raw.csv new file mode 100644 index 0000000..36a4dac --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1377,51.8675,13.9092,50.692 +5508,203.569,13.9848,196.974 +21951,782.982,12.139,751.237 +43902,1155.74,12.7988,1163.05 +87804,1561.48,12.8021,1522.53 +175608,1865.48,12.7893,1834.54 +351216,2157.11,9.81092,2159.83 +702459,2452.42,4.77572,2444.8 +1404891,2378.7,3.93096,2364.06 +2057940,2366.62,3.82584,2365.59 +2809755,2290.76,3.7803,2264.07 +4115853,2269.31,3.70921,2275.59 +5487804,2216.51,3.73914,2205.61 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_flops_smoothed.csv new file mode 100644 index 0000000..b842452 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_CONVECTION3DPA_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +1377,203.569,13.9092,196.974 +5508,493.27549999999997,13.354,474.1055 
+21951,782.982,12.8021,751.237 +43902,1155.74,12.7988,1163.05 +87804,1561.48,12.7893,1522.53 +175608,1865.48,12.7893,1834.54 +351216,2157.11,9.81092,2159.83 +702459,2366.62,4.77572,2364.06 +1404891,2366.62,3.93096,2364.06 +2057940,2366.62,3.82584,2364.06 +2809755,2290.76,3.7803,2275.59 +4115853,2280.035,3.7597199999999997,2269.83 +5487804,2269.31,3.73914,2264.07 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv new file mode 100644 index 0000000..be5e04e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1849,26.3791,7.01899,31.5271 +7744,130.131,6.94882,128.414 +32400,465.096,6.91914,522.879 +65025,870.75,6.89789,883.357 +131044,1436.18,6.90635,1451.21 +264196,1727.01,6.8548,1643.27 +528529,1661.51,6.86785,1675.75 +1060900,1804.69,6.79735,1795.26 +2125764,2347.72,6.73309,2374.29 +3115225,2153.59,6.72062,2132.2 +4255969,2064.0,6.23478,2050.3 +6235009,1792.54,6.18992,1816.71 +8317456,1820.63,6.50454,1837.98 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv new file mode 100644 index 0000000..14322eb --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1849,130.131,6.94882,128.414 +7744,297.6135,6.93398,325.6465 +32400,465.096,6.91914,522.879 +65025,870.75,6.90635,883.357 +131044,1436.18,6.89789,1451.21 +264196,1661.51,6.86785,1643.27 +528529,1727.01,6.8548,1675.75 +1060900,1804.69,6.79735,1795.26 +2125764,2064.0,6.73309,2050.3 
+3115225,2064.0,6.72062,2050.3 +4255969,2064.0,6.50454,2050.3 +6235009,1942.315,6.36966,1944.14 +8317456,1820.63,6.23478,1837.98 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_flops_raw.csv new file mode 100644 index 0000000..492e75c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1849,30.8957,8.22078,36.9252 +7744,154.834,8.26791,152.791 +32400,557.675,8.29641,626.96 +65025,1046.35,8.28894,1061.5 +131044,1728.47,8.31193,1746.56 +264196,2080.76,8.25887,1979.87 +528529,2003.36,8.28088,2020.53 +1060900,2177.17,8.20031,2165.8 +2125764,2833.35,8.12587,2865.42 +3115225,2599.48,8.1121,2573.67 +4255969,2491.61,7.5265,2475.08 +6235009,2164.16,7.47318,2193.34 +8317456,2198.23,7.85359,2219.18 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv new file mode 100644 index 0000000..224b599 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_DEL_DOT_VEC_2D_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +1849,154.834,8.26791,152.791 +7744,356.2545,8.278425,389.8755 +32400,557.675,8.28894,626.96 +65025,1046.35,8.28894,1061.5 +131044,1728.47,8.28894,1746.56 +264196,2003.36,8.28088,1979.87 +528529,2080.76,8.25887,2020.53 +1060900,2177.17,8.20031,2165.8 +2125764,2491.61,8.12587,2475.08 +3115225,2491.61,8.1121,2475.08 +4255969,2491.61,7.85359,2475.08 +6235009,2344.92,7.690045,2347.13 +8317456,2198.23,7.5265,2219.18 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_bandwidth_raw.csv 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_bandwidth_raw.csv new file mode 100644 index 0000000..baa5132 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,0.361332,0.0762581,0.500055 +125,0.367612,0.0770286,0.546417 +512,0.366381,0.0770515,0.649993 +1000,0.394913,0.0769662,0.700591 +1728,0.41308,0.0769608,0.72505 +3375,0.430266,0.0771036,0.750994 +6859,0.442773,0.0768661,0.773771 +13824,0.446885,0.0766108,0.790999 +27000,0.449095,0.0769857,0.796342 +39304,0.447921,0.0771837,0.802517 +50653,0.447736,0.0769533,0.80397 +74088,0.449811,0.0767716,0.806147 +97336,0.449862,0.0770738,0.807049 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv new file mode 100644 index 0000000..545d39e --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,0.366381,0.0770286,0.546417 +125,0.3669965,0.0769974,0.5982050000000001 +512,0.367612,0.0769662,0.649993 +1000,0.394913,0.0770286,0.700591 +1728,0.41308,0.0769662,0.72505 +3375,0.430266,0.0769608,0.750994 +6859,0.442773,0.0769608,0.773771 +13824,0.446885,0.0769857,0.790999 +27000,0.447736,0.0769533,0.796342 +39304,0.447921,0.0769533,0.802517 +50653,0.449095,0.0769857,0.80397 +74088,0.448866,0.07701355,0.8050584999999999 +97336,0.449811,0.0769533,0.806147 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_flops_raw.csv new file mode 100644 index 0000000..bc47216 --- /dev/null +++ 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,16.7606,3.53728,23.1954 +125,17.0519,3.57302,25.3459 +512,16.9948,3.57408,30.1503 +1000,18.3183,3.57013,32.4974 +1728,19.161,3.56988,33.6319 +3375,19.9581,3.5765,34.8353 +6859,20.5383,3.56548,35.8919 +13824,20.7291,3.55364,36.691 +27000,20.8315,3.57103,36.9388 +39304,20.7771,3.58022,37.2253 +50653,20.7685,3.56953,37.2927 +74088,20.8648,3.5611,37.3937 +97336,20.8671,3.57512,37.4355 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_flops_smoothed.csv new file mode 100644 index 0000000..b08d890 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_INTSC_HEXHEX_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64,Base_Seq-default,RAJA_HIP-block_64 +27,16.9948,3.57302,25.3459 +125,17.02335,3.571575,27.7481 +512,17.0519,3.57013,30.1503 +1000,18.3183,3.57302,32.4974 +1728,19.161,3.57013,33.6319 +3375,19.9581,3.56988,34.8353 +6859,20.5383,3.56988,35.8919 +13824,20.7291,3.57103,36.691 +27000,20.7685,3.56953,36.9388 +39304,20.7771,3.56953,37.2253 +50653,20.8315,3.57103,37.2927 +74088,20.82095,3.572325,37.3432 +97336,20.8648,3.56953,37.3937 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_bandwidth_raw.csv new file mode 100644 index 0000000..4f5409a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +2496,47.1104,8.93438,45.5952,46.5183 +9792,177.9,8.70866,171.408,173.971 +38784,445.435,8.47555,409.657,450.883 
+77568,427.568,8.41261,464.379,517.889 +154944,667.919,8.38568,580.054,664.319 +309696,785.409,8.37555,682.903,785.988 +619392,888.12,8.24656,743.546,878.867 +1238784,913.079,8.31775,749.416,894.681 +2477568,934.653,8.30493,767.18,914.626 +3629184,955.521,8.31962,782.16,924.21 +4954944,949.809,8.22013,789.287,938.802 +7258176,957.814,8.20832,776.856,947.696 +9677568,957.959,8.20761,775.257,951.949 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_bandwidth_smoothed.csv new file mode 100644 index 0000000..71e3518 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +2496,177.9,8.70866,171.408,173.971 +9792,302.734,8.592105,290.53249999999997,312.427 +38784,427.568,8.47555,409.657,450.883 +77568,445.435,8.41261,464.379,517.889 +154944,667.919,8.38568,580.054,664.319 +309696,785.409,8.37555,682.903,785.988 +619392,888.12,8.31775,743.546,878.867 +1238784,913.079,8.31775,749.416,894.681 +2477568,934.653,8.30493,767.18,914.626 +3629184,949.809,8.30493,776.856,924.21 +4954944,955.521,8.22013,776.856,938.802 +7258176,956.6675,8.214224999999999,779.508,943.249 +9677568,957.814,8.20832,776.856,947.696 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_flops_raw.csv new file mode 100644 index 0000000..7a9ed51 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +2496,33.6568,6.38293,32.5743,33.2337 +9792,127.705,6.25147,123.045,124.885 +38784,320.146,6.0916,294.431,324.061 
+77568,307.368,6.04761,333.83,372.297 +154944,480.199,6.02887,417.029,477.611 +309696,564.698,6.0219,490.998,565.114 +619392,638.563,5.92931,534.613,631.91 +1238784,656.516,5.98058,538.841,643.288 +2477568,672.033,5.9714,551.617,657.633 +3629184,687.039,5.98197,562.389,664.526 +4954944,682.933,5.91045,567.514,675.018 +7258176,688.689,5.90196,558.576,681.414 +9677568,688.794,5.90146,557.427,684.472 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_flops_smoothed.csv new file mode 100644 index 0000000..a18b71b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_LTIMES_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-kernel_256,RAJA_HIP-launch_256 +2496,127.705,6.25147,123.045,124.885 +9792,217.5365,6.171535,208.738,224.47299999999998 +38784,307.368,6.0916,294.431,324.061 +77568,320.146,6.04761,333.83,372.297 +154944,480.199,6.02887,417.029,477.611 +309696,564.698,6.0219,490.998,565.114 +619392,638.563,5.98058,534.613,631.91 +1238784,656.516,5.98058,538.841,643.288 +2477568,672.033,5.9714,551.617,657.633 +3629184,682.933,5.9714,558.576,664.526 +4954944,687.039,5.91045,558.576,675.018 +7258176,687.864,5.906205,560.4825000000001,678.216 +9677568,688.689,5.90196,558.576,681.414 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_bandwidth_raw.csv new file mode 100644 index 0000000..3e1dd00 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +3200,29.3042,5.25832,28.8078 +12672,112.881,5.26504,112.269 +50624,339.37,5.17562,337.689 +101184,466.361,5.2024,463.558 +202368,573.802,5.20566,568.456 
+404736,825.456,5.21928,826.853 +809536,1023.07,5.22359,1033.34 +1619008,1178.58,5.16814,1186.46 +3237952,1229.66,5.16021,1220.68 +4743104,1250.28,5.15267,1211.21 +6475904,1202.57,5.15408,1190.51 +9486208,1163.42,5.13914,1160.44 +12648256,1170.24,5.1546,1170.83 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_bandwidth_smoothed.csv new file mode 100644 index 0000000..bdac384 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +3200,112.881,5.25832,112.269 +12672,226.1255,5.23036,224.979 +50624,339.37,5.20566,337.689 +101184,466.361,5.20566,463.558 +202368,573.802,5.20566,568.456 +404736,825.456,5.20566,826.853 +809536,1023.07,5.20566,1033.34 +1619008,1178.58,5.16814,1186.46 +3237952,1202.57,5.16021,1190.51 +4743104,1202.57,5.15408,1190.51 +6475904,1202.57,5.15408,1190.51 +9486208,1186.405,5.1533750000000005,1180.67 +12648256,1170.24,5.15408,1170.83 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_flops_raw.csv new file mode 100644 index 0000000..93cb090 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +3200,62.7348,11.2571,61.6721 +12672,242.112,11.2927,240.801 +50624,728.244,11.1062,724.638 +101184,1000.83,11.1646,994.815 +202368,1231.45,11.172,1219.98 +404736,1771.57,11.2015,1774.57 +809536,2195.71,11.2108,2217.75 +1619008,2529.48,11.0919,2546.38 +3237952,2639.1,11.0749,2619.83 +4743104,2683.36,11.0587,2599.51 +6475904,2580.96,11.0617,2555.09 +9486208,2496.96,11.0297,2490.55 +12648256,2511.58,11.0629,2512.86 diff 
--git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_flops_smoothed.csv new file mode 100644 index 0000000..9f635ba --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MASS3DPA_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_25,Base_Seq-default,RAJA_HIP-block_25 +3200,242.112,11.2571,240.801 +12672,485.178,11.21085,482.71950000000004 +50624,728.244,11.172,724.638 +101184,1000.83,11.172,994.815 +202368,1231.45,11.172,1219.98 +404736,1771.57,11.172,1774.57 +809536,2195.71,11.172,2217.75 +1619008,2529.48,11.0919,2546.38 +3237952,2580.96,11.0749,2555.09 +4743104,2580.96,11.0617,2555.09 +6475904,2580.96,11.0617,2555.09 +9486208,2546.27,11.0602,2533.9750000000004 +12648256,2511.58,11.0617,2512.86 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv new file mode 100644 index 0000000..4ea6085 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +216,7.57793,15.2267,9.43932 +1331,43.2409,13.8755,50.6178 +8000,238.342,11.9161,287.277 +17576,528.826,12.2455,627.67 +35937,1063.56,11.9863,1232.16 +79507,1658.04,12.0474,1747.18 +157464,2025.36,11.3978,2053.46 +328509,1977.85,6.83387,2033.64 +681472,2290.43,4.83293,2321.56 +1000000,1910.0,4.29488,1901.27 +1404928,1967.15,4.59264,1954.98 +2048383,1863.51,4.57083,1854.89 +2744000,1716.99,4.28615,1722.95 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv new file mode 100644 
index 0000000..5ddbb8b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +216,43.2409,13.8755,50.6178 +1331,140.79145,13.060500000000001,168.9474 +8000,238.342,12.2455,287.277 +17576,528.826,12.0474,627.67 +35937,1063.56,11.9863,1232.16 +79507,1658.04,11.9863,1747.18 +157464,1977.85,11.3978,2033.64 +328509,1977.85,6.83387,2033.64 +681472,1977.85,4.83293,2033.64 +1000000,1967.15,4.59264,1954.98 +1404928,1910.0,4.57083,1901.27 +2048383,1886.755,4.432855,1878.08 +2744000,1863.51,4.57083,1854.89 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_flops_raw.csv new file mode 100644 index 0000000..ca8c375 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +216,2.40771,4.83791,2.99912 +1331,15.411,4.94522,18.0402 +8000,90.9748,4.54837,109.653 +17576,206.003,4.77019,244.507 +35937,420.435,4.73832,487.086 +79507,663.943,4.82424,699.638 +157464,818.182,4.60436,829.536 +328509,805.027,2.78153,827.737 +681472,937.771,1.97875,950.518 +1000000,784.035,1.763,780.45 +1404928,809.14,1.88907,804.134 +2048383,768.05,1.88388,764.498 +2744000,708.65,1.76902,711.109 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv new file mode 100644 index 0000000..6cffaa0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Apps_MATVEC_3D_STENCIL_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 
+216,15.411,4.83791,18.0402 +1331,53.1929,4.80405,63.8466 +8000,90.9748,4.77019,109.653 +17576,206.003,4.77019,244.507 +35937,420.435,4.73832,487.086 +79507,663.943,4.73832,699.638 +157464,805.027,4.60436,827.737 +328509,805.027,2.78153,827.737 +681472,809.14,1.97875,827.737 +1000000,805.027,1.88907,804.134 +1404928,784.035,1.88388,780.45 +2048383,776.0425,1.82645,772.474 +2744000,768.05,1.88388,764.498 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv new file mode 100644 index 0000000..ab60300 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_bandwidth_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +160000,282.038,10.9259,281.64 +320000,484.515,10.5095,491.281 +640000,769.998,10.4641,771.498 +1280000,1098.8,10.3463,1121.51 +2560000,1537.47,9.57698,1537.84 +5120000,2025.0,9.33421,2002.31 +7500000,2268.75,9.21605,2270.15 +10240000,2411.97,9.14268,2427.37 +15000000,2557.58,9.06695,2543.69 +20000000,2588.86,9.03661,2615.38 +25000000,2593.46,9.01477,2577.97 +30000000,2577.57,9.00109,2578.84 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv new file mode 100644 index 0000000..40aa612 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_bandwidth_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +160000,484.515,10.5095,491.281 +320000,627.2565,10.486799999999999,631.3895 +640000,769.998,10.4641,771.498 +1280000,1098.8,10.3463,1121.51 +2560000,1537.47,9.57698,1537.84 +5120000,2025.0,9.33421,2002.31 +7500000,2268.75,9.21605,2270.15 
+10240000,2411.97,9.14268,2427.37 +15000000,2557.58,9.06695,2543.69 +20000000,2577.57,9.03661,2577.97 +25000000,2583.215,9.02569,2578.4049999999997 +30000000,2588.86,9.01477,2578.84 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_flops_raw.csv new file mode 100644 index 0000000..386dbbe --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_flops_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +160000,0.0,0.0,0.0 +320000,0.0,0.0,0.0 +640000,0.0,0.0,0.0 +1280000,0.0,0.0,0.0 +2560000,0.0,0.0,0.0 +5120000,0.0,0.0,0.0 +7500000,0.0,0.0,0.0 +10240000,0.0,0.0,0.0 +15000000,0.0,0.0,0.0 +20000000,0.0,0.0,0.0 +25000000,0.0,0.0,0.0 +30000000,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_flops_smoothed.csv new file mode 100644 index 0000000..386dbbe --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_INDEXLIST_3LOOP_flops_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_256,Base_Seq-default,RAJA_HIP-block_256 +160000,0.0,0.0,0.0 +320000,0.0,0.0,0.0 +640000,0.0,0.0,0.0 +1280000,0.0,0.0,0.0 +2560000,0.0,0.0,0.0 +5120000,0.0,0.0,0.0 +7500000,0.0,0.0,0.0 +10240000,0.0,0.0,0.0 +15000000,0.0,0.0,0.0 +20000000,0.0,0.0,0.0 +25000000,0.0,0.0,0.0 +30000000,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_bandwidth_raw.csv new file mode 100644 index 0000000..54ab5ff --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_bandwidth_raw.csv @@ -0,0 +1,14 @@ 
+Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +6245,7.75335,7.70146,4.69577,7.49752,7.4178 +24995,31.7778,31.8354,4.60804,29.7767,29.887 +99995,128.418,127.179,4.59568,123.125,122.264 +199995,249.63,250.134,4.59044,242.075,232.439 +399995,486.492,497.721,4.58914,461.132,440.501 +799995,868.036,875.715,4.58831,814.472,845.504 +1599995,1499.82,1541.56,4.58558,1367.89,1460.7 +3199995,1950.45,1990.61,4.57907,1866.84,1884.81 +6399995,2556.08,2517.79,4.57733,2340.7,2483.72 +9374995,2869.3,2875.96,4.57632,2673.36,2837.25 +12799995,2825.08,2966.29,4.57698,2568.11,2929.42 +18749995,2599.61,2819.54,4.57631,2358.17,2799.69 +24999995,2504.85,2714.98,4.5776,2261.77,2699.7 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_bandwidth_smoothed.csv new file mode 100644 index 0000000..c5af0a1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +6245,31.7778,31.8354,4.60804,29.7767,29.887 +24995,80.09790000000001,79.5072,4.60186,76.45085,76.0755 +99995,128.418,127.179,4.59568,123.125,122.264 +199995,249.63,250.134,4.59044,242.075,232.439 +399995,486.492,497.721,4.58914,461.132,440.501 +799995,868.036,875.715,4.58831,814.472,845.504 +1599995,1499.82,1541.56,4.58558,1367.89,1460.7 +3199995,1950.45,1990.61,4.57907,1866.84,1884.81 +6399995,2556.08,2517.79,4.57733,2340.7,2483.72 +9374995,2599.61,2819.54,4.57698,2358.17,2799.69 +12799995,2599.61,2819.54,4.57698,2358.17,2799.69 +18749995,2712.3450000000003,2847.75,4.57665,2463.1400000000003,2818.4700000000003 +24999995,2599.61,2819.54,4.57698,2358.17,2799.69 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_flops_raw.csv new file mode 100644 index 0000000..514b063 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +6245,0.519487,0.51601,0.314624,0.502346,0.497004 +24995,2.13172,2.13558,0.309117,1.99748,2.00488 +99995,8.61709,8.53398,0.30838,8.26195,8.20421 +199995,16.7516,16.7853,0.308044,16.2446,15.5979 +399995,32.6471,33.4007,0.307964,30.9453,29.5608 +799995,58.2522,58.7675,0.307912,54.6576,56.7401 +1599995,100.651,103.452,0.307731,91.7972,98.0251 +3199995,130.892,133.587,0.307295,125.281,126.487 +6399995,171.536,168.966,0.307179,157.081,166.679 +9374995,192.555,193.002,0.307111,179.406,190.404 +12799995,189.588,199.064,0.307156,172.343,196.59 +18749995,174.457,189.216,0.307111,158.254,187.884 +24999995,168.098,182.199,0.307197,151.785,181.174 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_flops_smoothed.csv new file mode 100644 index 0000000..2a1a48a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_MULTI_REDUCE_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-atomic_direct_256,Base_HIP-atomic_occgs_256,Base_Seq-default,RAJA_HIP-atomic_direct_256,RAJA_HIP-atomic_occgs_256 +6245,2.13172,2.13558,0.309117,1.99748,2.00488 +24995,5.374404999999999,5.33478,0.3087485,5.129715,5.104545 +99995,8.61709,8.53398,0.30838,8.26195,8.20421 +199995,16.7516,16.7853,0.308044,16.2446,15.5979 +399995,32.6471,33.4007,0.307964,30.9453,29.5608 +799995,58.2522,58.7675,0.307912,54.6576,56.7401 
+1599995,100.651,103.452,0.307731,91.7972,98.0251 +3199995,130.892,133.587,0.307295,125.281,126.487 +6399995,171.536,168.966,0.307179,157.081,166.679 +9374995,174.457,189.216,0.307156,158.254,187.884 +12799995,174.457,189.216,0.307156,158.254,187.884 +18749995,182.02249999999998,191.109,0.3071335,165.2985,189.144 +24999995,174.457,189.216,0.307156,158.254,187.884 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_bandwidth_raw.csv new file mode 100644 index 0000000..c38f085 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_bandwidth_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +6250,4.46136,4.5203,9.25599,17.9107,4.57718,3.81591,3.83063,4.65775,2.62709,4.64007,2.59265 +25000,11.4713,11.4928,9.4984,18.2721,4.58912,15.3696,15.3823,12.4069,7.97406,12.4162,7.92119 +100000,21.3663,22.7513,9.44387,17.946,4.58631,56.5996,57.471,47.8142,17.1615,47.7055,17.1638 +200000,31.4902,32.4121,9.42705,17.9276,4.58714,104.426,105.866,91.4688,21.1074,90.696,21.0717 +400000,27.613,37.0496,9.45746,17.9685,4.58829,177.934,178.178,168.394,23.3677,169.295,23.2215 +800000,24.6339,70.54,9.46773,18.0088,4.58898,237.566,347.681,240.857,24.1335,329.308,45.8789 +1600000,21.8346,145.402,9.43083,17.782,4.58467,311.57,661.095,295.141,24.5137,598.921,90.5478 +3200000,21.541,306.391,9.35962,17.2797,4.57414,368.882,1091.42,331.915,24.4658,991.432,172.877 +6400000,21.6182,573.49,9.36547,17.1248,4.57251,411.026,1722.86,363.719,24.2975,1564.8,322.008 +9375000,21.406,817.096,9.35046,17.0078,4.57014,424.781,2017.87,372.367,23.0999,1915.68,454.172 
+12800000,19.4087,922.82,9.34837,17.0091,4.56956,415.911,2190.38,370.326,23.7009,2033.58,545.025 +18750000,19.2922,1078.12,9.36435,17.2053,4.57311,422.829,2153.0,370.5,23.2064,2007.29,674.473 +25000000,19.2351,1172.91,9.36658,17.25,4.5735,419.544,2218.97,371.649,21.5732,2108.4,766.882 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv new file mode 100644 index 0000000..44ac10c --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_bandwidth_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +6250,11.4713,11.4928,9.44387,17.946,4.58631,15.3696,15.3823,12.4069,7.97406,12.4162,7.92119 +25000,16.418799999999997,17.12205,9.435459999999999,17.9368,4.5867249999999995,35.9846,36.426649999999995,30.11055,12.567779999999999,30.060850000000002,12.542494999999999 +100000,21.3663,22.7513,9.44387,17.946,4.58714,56.5996,57.471,47.8142,17.1615,47.7055,17.1638 +200000,24.6339,32.4121,9.45746,17.9685,4.58829,104.426,105.866,91.4688,21.1074,90.696,21.0717 +400000,24.6339,37.0496,9.44387,17.946,4.58714,177.934,178.178,168.394,23.3677,169.295,23.2215 +800000,24.6339,70.54,9.43083,17.9276,4.58714,237.566,347.681,240.857,24.1335,329.308,45.8789 +1600000,21.8346,145.402,9.43083,17.782,4.58467,311.57,661.095,295.141,24.2975,598.921,90.5478 +3200000,21.6182,306.391,9.36547,17.2797,4.57414,368.882,1091.42,331.915,24.2975,991.432,172.877 +6400000,21.541,573.49,9.35962,17.1248,4.57251,411.026,1722.86,363.719,24.2975,1564.8,322.008 +9375000,21.406,817.096,9.35962,17.1248,4.57251,415.911,2017.87,370.326,23.7009,1915.68,454.172 
+12800000,19.4087,922.82,9.36435,17.1248,4.57251,419.544,2153.0,370.5,23.2064,2007.29,545.025 +18750000,19.350450000000002,1000.47,9.357405,17.1072,4.571625,421.1865,2171.69,371.0745,23.15315,2020.435,609.749 +25000000,19.2922,1078.12,9.36435,17.2053,4.57311,419.544,2190.38,370.5,23.2064,2033.58,674.473 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_flops_raw.csv new file mode 100644 index 0000000..21c7e84 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_flops_raw.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +6250,0.59889,0.606802,1.24252,2.40431,0.614436,0.512244,0.514221,0.625253,0.352658,0.622879,0.348036 +25000,1.53972,1.5426,1.2749,2.45253,0.615966,2.06295,2.06465,1.66529,1.0703,1.66655,1.06321 +100000,2.86776,3.05366,1.26755,2.40869,0.61557,7.59675,7.7137,6.41757,2.3034,6.40299,2.30371 +200000,4.22656,4.3503,1.26528,2.40622,0.615679,14.0159,14.2092,12.2768,2.83301,12.1731,2.82821 +400000,3.70616,4.97273,1.26936,2.41169,0.615832,23.882,23.9147,22.6015,3.13637,22.7224,3.11675 +800000,3.30631,9.46774,1.27074,2.4171,0.615924,31.8856,46.665,32.3273,3.23914,44.199,6.15777 +1600000,2.93059,19.5156,1.26578,2.38666,0.615345,41.8183,88.7308,39.6132,3.29018,80.3859,12.1531 +3200000,2.89119,41.1232,1.25623,2.31924,0.61393,49.5105,146.487,44.5489,3.28374,133.068,23.2031 +6400000,2.90154,76.9726,1.25701,2.29845,0.613712,55.167,231.239,48.8176,3.26116,210.024,43.2192 +9375000,2.87306,109.669,1.255,2.28275,0.613394,57.0132,270.833,49.9782,3.10041,257.118,60.958 
+12800000,2.60499,123.859,1.25472,2.28292,0.613316,55.8227,293.988,49.7044,3.18108,272.943,73.1521 +18750000,2.58935,144.703,1.25686,2.30926,0.613792,56.7512,288.97,49.7276,3.11471,269.415,90.5263 +25000000,2.58168,157.426,1.25716,2.31526,0.613845,56.3103,297.825,49.8818,2.89551,282.985,102.929 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_flops_smoothed.csv new file mode 100644 index 0000000..c948bc5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Basic_REDUCE_STRUCT_flops_smoothed.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-blkatm_direct_256,Base_HIP-blkatm_occgs_256,Base_Seq-cascade,Base_Seq-default,Base_Seq-kahan,RAJA_HIP-blkatm_direct_256,RAJA_HIP-blkatm_occgs_256,RAJA_HIP-blkdev_direct_256,RAJA_HIP-blkdev_direct_new_256,RAJA_HIP-blkdev_occgs_256,RAJA_HIP-blkdev_occgs_new_256 +6250,1.53972,1.5426,1.26755,2.40869,0.61557,2.06295,2.06465,1.66529,1.0703,1.66655,1.06321 +25000,2.20374,2.29813,1.2664149999999998,2.4074549999999997,0.6156245,4.82985,4.889175,4.04143,1.68685,4.03477,1.6834600000000002 +100000,2.86776,3.05366,1.26755,2.40869,0.615679,7.59675,7.7137,6.41757,2.3034,6.40299,2.30371 +200000,3.30631,4.3503,1.26936,2.41169,0.615832,14.0159,14.2092,12.2768,2.83301,12.1731,2.82821 +400000,3.30631,4.97273,1.26755,2.40869,0.615679,23.882,23.9147,22.6015,3.13637,22.7224,3.11675 +800000,3.30631,9.46774,1.26578,2.40622,0.615679,31.8856,46.665,32.3273,3.23914,44.199,6.15777 +1600000,2.93059,19.5156,1.26578,2.38666,0.615345,41.8183,88.7308,39.6132,3.26116,80.3859,12.1531 +3200000,2.90154,41.1232,1.25701,2.31924,0.61393,49.5105,146.487,44.5489,3.26116,133.068,23.2031 +6400000,2.89119,76.9726,1.25623,2.29845,0.613712,55.167,231.239,48.8176,3.26116,210.024,43.2192 +9375000,2.87306,109.669,1.25623,2.29845,0.613712,55.8227,270.833,49.7044,3.18108,257.118,60.958 
+12800000,2.60499,123.859,1.25686,2.29845,0.613712,56.3103,288.97,49.7276,3.11471,269.415,73.1521 +18750000,2.59717,134.281,1.25593,2.29609,0.613593,56.53075,291.47900000000004,49.8047,3.1075600000000003,271.179,81.8392 +25000000,2.58935,144.703,1.25686,2.30926,0.613792,56.3103,293.988,49.7276,3.11471,272.943,90.5263 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv new file mode 100644 index 0000000..0b94b68 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_bandwidth_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +91125,53.049,30.503,43.7518,46.6773,45.935 +205379,81.0342,28.2635,70.0771,73.2531,71.0136 +421875,131.186,28.801,111.083,119.378,115.585 +884736,195.121,27.1852,160.986,174.266,165.913 +1860867,305.984,26.9538,251.596,270.63,263.685 +3796416,451.394,22.6057,364.717,407.436,388.323 +5639752,546.885,14.3594,473.418,499.463,476.998 +7762392,557.471,8.92213,495.627,528.494,513.647 +11543176,719.735,8.25019,670.95,670.952,646.866 +15438249,798.716,7.70923,748.537,736.716,712.972 +19465109,861.82,7.3292,787.955,797.128,779.828 +23393656,863.478,3.9391,807.196,801.537,783.349 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv new file mode 100644 index 0000000..83f6aa5 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_bandwidth_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +91125,81.0342,28.801,70.0771,73.2531,71.0136 
+205379,106.1101,28.532249999999998,90.58005,96.31555,93.29929999999999 +421875,131.186,28.2635,111.083,119.378,115.585 +884736,195.121,27.1852,160.986,174.266,165.913 +1860867,305.984,26.9538,251.596,270.63,263.685 +3796416,451.394,22.6057,364.717,407.436,388.323 +5639752,546.885,14.3594,473.418,499.463,476.998 +7762392,557.471,8.92213,495.627,528.494,513.647 +11543176,719.735,8.25019,670.95,670.952,646.866 +15438249,798.716,7.70923,748.537,736.716,712.972 +19465109,830.268,7.519215,768.2460000000001,766.922,746.4 +23393656,861.82,7.3292,787.955,797.128,779.828 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_flops_raw.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_flops_raw.csv new file mode 100644 index 0000000..4c36d64 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_flops_raw.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +91125,0.0,0.0,0.0,0.0,0.0 +205379,0.0,0.0,0.0,0.0,0.0 +421875,0.0,0.0,0.0,0.0,0.0 +884736,0.0,0.0,0.0,0.0,0.0 +1860867,0.0,0.0,0.0,0.0,0.0 +3796416,0.0,0.0,0.0,0.0,0.0 +5639752,0.0,0.0,0.0,0.0,0.0 +7762392,0.0,0.0,0.0,0.0,0.0 +11543176,0.0,0.0,0.0,0.0,0.0 +15438249,0.0,0.0,0.0,0.0,0.0 +19465109,0.0,0.0,0.0,0.0,0.0 +23393656,0.0,0.0,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_flops_smoothed.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_flops_smoothed.csv new file mode 100644 index 0000000..4c36d64 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/Comm_HALO_PACKING_FUSED_flops_smoothed.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-direct_1024,Base_Seq-direct,RAJA_HIP-direct_1024,RAJA_HIP-funcptr_1024,RAJA_HIP-virtfunc_1024 +91125,0.0,0.0,0.0,0.0,0.0 +205379,0.0,0.0,0.0,0.0,0.0 
+421875,0.0,0.0,0.0,0.0,0.0 +884736,0.0,0.0,0.0,0.0,0.0 +1860867,0.0,0.0,0.0,0.0,0.0 +3796416,0.0,0.0,0.0,0.0,0.0 +5639752,0.0,0.0,0.0,0.0,0.0 +7762392,0.0,0.0,0.0,0.0,0.0 +11543176,0.0,0.0,0.0,0.0,0.0 +15438249,0.0,0.0,0.0,0.0,0.0 +19465109,0.0,0.0,0.0,0.0,0.0 +23393656,0.0,0.0,0.0,0.0,0.0 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_CONVECTION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_CONVECTION3DPA.csv new file mode 100644 index 0000000..b22d9fd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_CONVECTION3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_CONVECTION3DPA-Base_Seq-default,1377.0,13.9092,7.70152 +Apps_CONVECTION3DPA-Base_HIP-block_64,351216.0,2157.11,1191.32 +Apps_CONVECTION3DPA-RAJA_HIP-block_64,351216.0,2159.83,1192.82 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_DEL_DOT_VEC_2D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_DEL_DOT_VEC_2D.csv new file mode 100644 index 0000000..70f6572 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_DEL_DOT_VEC_2D.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_DEL_DOT_VEC_2D-Base_Seq-default,1849.0,8.22078,7.01899 +Apps_DEL_DOT_VEC_2D-Base_HIP-block_256,264196.0,2080.76,1727.01 +Apps_DEL_DOT_VEC_2D-RAJA_HIP-block_256,528529.0,2020.53,1675.75 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_INTSC_HEXHEX.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_INTSC_HEXHEX.csv new file mode 100644 index 0000000..b268610 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_INTSC_HEXHEX.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_INTSC_HEXHEX-Base_Seq-default,27.0,3.53728,0.0762581 +Apps_INTSC_HEXHEX-Base_HIP-block_64,1728.0,19.161,0.41308 +Apps_INTSC_HEXHEX-RAJA_HIP-block_64,3375.0,34.8353,0.750994 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_LTIMES.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_LTIMES.csv new file mode 100644 index 0000000..021607f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_LTIMES.csv @@ -0,0 +1,5 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_LTIMES-Base_Seq-default,2496.0,6.38293,8.93438 +Apps_LTIMES-Base_HIP-block_256,619392.0,638.563,888.12 +Apps_LTIMES-RAJA_HIP-kernel_256,619392.0,534.613,743.546 +Apps_LTIMES-RAJA_HIP-launch_256,619392.0,631.91,878.867 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_MASS3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_MASS3DPA.csv new file mode 100644 index 0000000..445b55b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_MASS3DPA.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Apps_MASS3DPA-Base_Seq-default,3200.0,11.2571,5.25832 +Apps_MASS3DPA-Base_HIP-block_25,1619008.0,2529.48,1178.58 +Apps_MASS3DPA-RAJA_HIP-block_25,1619008.0,2546.38,1186.46 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_MATVEC_3D_STENCIL.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_MATVEC_3D_STENCIL.csv new file mode 100644 index 0000000..d3152db --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Apps_MATVEC_3D_STENCIL.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_MATVEC_3D_STENCIL-Base_Seq-default,216.0,4.83791,15.2267 +Apps_MATVEC_3D_STENCIL-Base_HIP-block_256,157464.0,818.182,2025.36 +Apps_MATVEC_3D_STENCIL-RAJA_HIP-block_256,79507.0,699.638,1747.18 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_INDEXLIST_3LOOP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_INDEXLIST_3LOOP.csv new file mode 100644 index 0000000..d41e2c4 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_INDEXLIST_3LOOP.csv @@ -0,0 +1,4 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Basic_INDEXLIST_3LOOP-Base_Seq-default,160000.0,0.0,10.9259 +Basic_INDEXLIST_3LOOP-Base_HIP-block_256,160000.0,0.0,282.038 +Basic_INDEXLIST_3LOOP-RAJA_HIP-block_256,160000.0,0.0,281.64 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_MULTI_REDUCE.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_MULTI_REDUCE.csv new file mode 100644 index 0000000..d492aa1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_MULTI_REDUCE.csv @@ -0,0 +1,6 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Basic_MULTI_REDUCE-Base_Seq-default,6245.0,0.314624,4.69577 +Basic_MULTI_REDUCE-Base_HIP-atomic_direct_256,6399995.0,171.536,2556.08 +Basic_MULTI_REDUCE-Base_HIP-atomic_occgs_256,9374995.0,193.002,2875.96 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_direct_256,6399995.0,157.081,2340.7 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_occgs_256,9374995.0,190.404,2837.25 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_REDUCE_STRUCT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_REDUCE_STRUCT.csv new file mode 100644 index 0000000..ccd670b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Basic_REDUCE_STRUCT.csv @@ -0,0 +1,12 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Basic_REDUCE_STRUCT-Base_Seq-default,6250.0,2.40431,17.9107 +Basic_REDUCE_STRUCT-Base_Seq-kahan,6250.0,0.614436,4.57718 +Basic_REDUCE_STRUCT-Base_Seq-cascade,6250.0,1.24252,9.25599 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_direct_256,200000.0,4.22656,31.4902 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_occgs_256,18750000.0,144.703,1078.12 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_direct_256,6400000.0,55.167,411.026 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_256,6400000.0,48.8176,363.719 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_new_256,200000.0,2.83301,21.1074 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_occgs_256,9375000.0,270.833,2017.87 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_256,9375000.0,257.118,1915.68 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_new_256,18750000.0,90.5263,674.473 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Comm_HALO_PACKING_FUSED.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Comm_HALO_PACKING_FUSED.csv new file mode 100644 index 0000000..a0a742f --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/Comm_HALO_PACKING_FUSED.csv @@ -0,0 +1,6 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) +Comm_HALO_PACKING_FUSED-Base_Seq-direct,91125.0,0.0,30.503 +Comm_HALO_PACKING_FUSED-Base_HIP-direct_1024,91125.0,0.0,53.049 +Comm_HALO_PACKING_FUSED-RAJA_HIP-direct_1024,91125.0,0.0,43.7518 +Comm_HALO_PACKING_FUSED-RAJA_HIP-funcptr_1024,91125.0,0.0,46.6773 +Comm_HALO_PACKING_FUSED-RAJA_HIP-virtfunc_1024,91125.0,0.0,45.935 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/combined_fom.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/combined_fom.csv new file mode 100644 index 0000000..461c7e1 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/FOM/combined_fom.csv @@ -0,0 +1,44 @@ +Kernel,Sat Problem Size,Sat GFLOP/s,Sat B/W (GiB per sec.) 
+Apps_CONVECTION3DPA-Base_HIP-block_64,351216.0,2157.11,1191.32 +Apps_CONVECTION3DPA-Base_Seq-default,1377.0,13.9092,7.70152 +Apps_CONVECTION3DPA-RAJA_HIP-block_64,351216.0,2159.83,1192.82 +Apps_DEL_DOT_VEC_2D-Base_HIP-block_256,264196.0,2080.76,1727.01 +Apps_DEL_DOT_VEC_2D-Base_Seq-default,1849.0,8.22078,7.01899 +Apps_DEL_DOT_VEC_2D-RAJA_HIP-block_256,528529.0,2020.53,1675.75 +Apps_INTSC_HEXHEX-Base_HIP-block_64,1728.0,19.161,0.41308 +Apps_INTSC_HEXHEX-Base_Seq-default,27.0,3.53728,0.0762581 +Apps_INTSC_HEXHEX-RAJA_HIP-block_64,3375.0,34.8353,0.750994 +Apps_LTIMES-Base_HIP-block_256,619392.0,638.563,888.12 +Apps_LTIMES-Base_Seq-default,2496.0,6.38293,8.93438 +Apps_LTIMES-RAJA_HIP-kernel_256,619392.0,534.613,743.546 +Apps_LTIMES-RAJA_HIP-launch_256,619392.0,631.91,878.867 +Apps_MASS3DPA-Base_HIP-block_25,1619008.0,2529.48,1178.58 +Apps_MASS3DPA-Base_Seq-default,3200.0,11.2571,5.25832 +Apps_MASS3DPA-RAJA_HIP-block_25,1619008.0,2546.38,1186.46 +Apps_MATVEC_3D_STENCIL-Base_HIP-block_256,157464.0,818.182,2025.36 +Apps_MATVEC_3D_STENCIL-Base_Seq-default,216.0,4.83791,15.2267 +Apps_MATVEC_3D_STENCIL-RAJA_HIP-block_256,79507.0,699.638,1747.18 +Basic_INDEXLIST_3LOOP-Base_HIP-block_256,160000.0,0.0,282.038 +Basic_INDEXLIST_3LOOP-Base_Seq-default,160000.0,0.0,10.9259 +Basic_INDEXLIST_3LOOP-RAJA_HIP-block_256,160000.0,0.0,281.64 +Basic_MULTI_REDUCE-Base_HIP-atomic_direct_256,6399995.0,171.536,2556.08 +Basic_MULTI_REDUCE-Base_HIP-atomic_occgs_256,9374995.0,193.002,2875.96 +Basic_MULTI_REDUCE-Base_Seq-default,6245.0,0.314624,4.69577 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_direct_256,6399995.0,157.081,2340.7 +Basic_MULTI_REDUCE-RAJA_HIP-atomic_occgs_256,9374995.0,190.404,2837.25 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_direct_256,200000.0,4.22656,31.4902 +Basic_REDUCE_STRUCT-Base_HIP-blkatm_occgs_256,18750000.0,144.703,1078.12 +Basic_REDUCE_STRUCT-Base_Seq-cascade,6250.0,1.24252,9.25599 +Basic_REDUCE_STRUCT-Base_Seq-default,6250.0,2.40431,17.9107 
+Basic_REDUCE_STRUCT-Base_Seq-kahan,6250.0,0.614436,4.57718 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_direct_256,6400000.0,55.167,411.026 +Basic_REDUCE_STRUCT-RAJA_HIP-blkatm_occgs_256,9375000.0,270.833,2017.87 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_256,6400000.0,48.8176,363.719 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_direct_new_256,200000.0,2.83301,21.1074 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_256,9375000.0,257.118,1915.68 +Basic_REDUCE_STRUCT-RAJA_HIP-blkdev_occgs_new_256,18750000.0,90.5263,674.473 +Comm_HALO_PACKING_FUSED-Base_HIP-direct_1024,91125.0,0.0,53.049 +Comm_HALO_PACKING_FUSED-Base_Seq-direct,91125.0,0.0,30.503 +Comm_HALO_PACKING_FUSED-RAJA_HIP-direct_1024,91125.0,0.0,43.7518 +Comm_HALO_PACKING_FUSED-RAJA_HIP-funcptr_1024,91125.0,0.0,46.6773 +Comm_HALO_PACKING_FUSED-RAJA_HIP-virtfunc_1024,91125.0,0.0,45.935 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/combined_table.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/combined_table.csv new file mode 100644 index 0000000..f45975b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/combined_table.csv @@ -0,0 +1,552 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning +Apps_CONVECTION3DPA,Base_Seq,default,1377, PASSED ,1.35042e-05,7.70152,13.9092,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,1377, PASSED ,3.6214e-06,28.7189,51.8675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,1377, PASSED 
,3.70538e-06,28.068,50.692,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,1404891, PASSED ,0.0487508,2.17096,3.93096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,1404891, PASSED ,8.0564e-05,1313.69,2378.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,1404891, PASSED ,8.1063e-05,1305.6,2364.06,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,175608, PASSED ,0.00187299,7.0633,12.7893,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,175608, PASSED ,1.28408e-05,1030.27,1865.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,175608, PASSED ,1.30574e-05,1013.18,1834.54,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,2057940, PASSED ,0.0733744,2.1129,3.82584,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,2057940, PASSED 
,0.000118616,1307.01,2366.62,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,2057940, PASSED ,0.000118668,1306.44,2365.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,21951, PASSED ,0.000246666,6.7051,12.139,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,21951, PASSED ,3.8242e-06,432.487,782.982,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,21951, PASSED ,3.9858e-06,414.952,751.237,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,2809755, PASSED ,0.101386,2.08775,3.7803,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,2809755, PASSED ,0.000167312,1265.12,2290.76,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,2809755, PASSED ,0.000169284,1250.38,2264.07,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,351216, PASSED 
,0.00488318,5.41833,9.81092,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,351216, PASSED ,2.22096e-05,1191.32,2157.11,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,351216, PASSED ,2.21815e-05,1192.82,2159.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,4115853, PASSED ,0.151362,2.04849,3.70921,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,4115853, PASSED ,0.000247403,1253.27,2269.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,4115853, PASSED ,0.00024672,1256.74,2275.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,43902, PASSED ,0.0004679,7.06895,12.7988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,43902, PASSED ,5.1816e-06,638.329,1155.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,43902, PASSED 
,5.149e-06,642.371,1163.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,5508, PASSED ,5.37251e-05,7.72835,13.9848,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,5508, PASSED ,3.6908e-06,112.498,203.569,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,5508, PASSED ,3.81438e-06,108.853,196.974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,5487804, PASSED ,0.2002,2.06502,3.73914,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,5487804, PASSED ,0.000337728,1224.11,2216.51,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,5487804, PASSED ,0.000339396,1218.09,2205.61,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,702459, PASSED ,0.0200641,2.6375,4.77572,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,702459, PASSED 
,3.90719e-05,1354.4,2452.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,702459, PASSED ,3.91937e-05,1350.19,2444.8,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_CONVECTION3DPA,Base_Seq,default,87804, PASSED ,0.00093556,7.07049,12.8021,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_CONVECTION3DPA,Base_HIP,block_64,87804, PASSED ,7.67038e-06,862.391,1561.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,87804, PASSED ,7.86658e-06,840.882,1522.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1849, PASSED ,1.21456e-05,7.01899,8.22078,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1849, PASSED ,3.23171e-06,26.3791,30.8957,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1849, PASSED ,2.70401e-06,31.5271,36.9252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,2125764, PASSED 
,0.0141266,6.73309,8.12587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,2125764, PASSED ,4.05143e-05,2347.72,2833.35,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,2125764, PASSED ,4.00609e-05,2374.29,2865.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,264196, PASSED ,0.00172742,6.8548,8.25887,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,264196, PASSED ,6.85643e-06,1727.01,2080.76,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,264196, PASSED ,7.20583e-06,1643.27,1979.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3115225, PASSED ,0.0207372,6.72062,8.1121,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,3115225, PASSED ,6.47138e-05,2153.59,2599.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,3115225, PASSED 
,6.53628e-05,2132.2,2573.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,32400, PASSED ,0.000210886,6.91914,8.29641,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,32400, PASSED ,3.13731e-06,465.096,557.675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,32400, PASSED ,2.79061e-06,522.879,626.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,4255969, PASSED ,0.0305351,6.23478,7.5265,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,4255969, PASSED ,9.22383e-05,2064.0,2491.61,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,4255969, PASSED ,9.28546e-05,2050.3,2475.08,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,528529, PASSED ,0.00344656,6.86785,8.28088,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,528529, PASSED 
,1.42464e-05,1661.51,2003.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,528529, PASSED ,1.41253e-05,1675.75,2020.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,6235009, PASSED ,0.0450532,6.18992,7.47318,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,6235009, PASSED ,0.000155575,1792.54,2164.16,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,6235009, PASSED ,0.000153506,1816.71,2193.34,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,65025, PASSED ,0.000423619,6.89789,8.28894,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,65025, PASSED ,3.35581e-06,870.75,1046.35,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,65025, PASSED ,3.30792e-06,883.357,1061.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,7744, PASSED 
,5.05782e-05,6.94882,8.26791,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,7744, PASSED ,2.70081e-06,130.131,154.834,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,7744, PASSED ,2.73691e-06,128.414,152.791,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,8317456, PASSED ,0.0571895,6.50454,7.85359,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,8317456, PASSED ,0.00020432,1820.63,2198.23,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,8317456, PASSED ,0.000202391,1837.98,2219.18,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1060900, PASSED ,0.00698615,6.79735,8.20031,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1060900, PASSED ,2.63133e-05,1804.69,2177.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1060900, PASSED 
,2.64515e-05,1795.26,2165.8,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,131044, PASSED ,0.000851352,6.90635,8.31193,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,131044, PASSED ,4.09401e-06,1436.18,1728.47,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,131044, PASSED ,4.05161e-06,1451.21,1746.56,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,3796416, PASSED ,0.000731173,22.6057,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,3796416, PASSED ,3.6617e-05,451.394,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,3796416, PASSED ,4.53192e-05,364.717,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,3796416, PASSED ,4.05675e-05,407.436,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,3796416, PASSED 
,4.25642e-05,388.323,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,421875, PASSED ,0.000134486,28.801,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,421875, PASSED ,2.95255e-05,131.186,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,421875, PASSED ,3.48688e-05,111.083,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,421875, PASSED ,3.24459e-05,119.378,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,421875, PASSED ,3.35106e-05,115.585,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,5639752, PASSED ,0.00149626,14.3594,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,5639752, PASSED ,3.92868e-05,546.885,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,5639752, PASSED 
,4.53836e-05,473.418,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,5639752, PASSED ,4.3017e-05,499.463,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,5639752, PASSED ,4.5043e-05,476.998,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,7762392, PASSED ,0.00297628,8.92213,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,7762392, PASSED ,4.76344e-05,557.471,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,7762392, PASSED ,5.35781e-05,495.627,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,7762392, PASSED ,5.02461e-05,528.494,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,7762392, PASSED ,5.16985e-05,513.647,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,884736, PASSED 
,0.000232092,27.1852,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,884736, PASSED ,3.23362e-05,195.121,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,884736, PASSED ,3.91926e-05,160.986,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,884736, PASSED ,3.62058e-05,174.266,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,884736, PASSED ,3.80287e-05,165.913,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,11543176, PASSED ,0.00418816,8.25019,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,11543176, PASSED ,4.80081e-05,719.735,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,11543176, PASSED ,5.14988e-05,670.95,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,11543176, PASSED 
,5.14986e-05,670.952,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,11543176, PASSED ,5.34162e-05,646.866,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,91125, PASSED ,4.65237e-05,30.503,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,91125, PASSED ,2.6751e-05,53.049,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,91125, PASSED ,3.24355e-05,43.7518,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,91125, PASSED ,3.04026e-05,46.6773,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,91125, PASSED ,3.08939e-05,45.935,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,15438249, PASSED ,0.00543631,7.70923,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,15438249, PASSED 
,5.24714e-05,798.716,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,15438249, PASSED ,5.59889e-05,748.537,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,15438249, PASSED ,5.68872e-05,736.716,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,15438249, PASSED ,5.87817e-05,712.972,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,19465109, PASSED ,0.00666969,7.3292,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,19465109, PASSED ,5.67212e-05,861.82,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,19465109, PASSED ,6.20384e-05,787.955,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,19465109, PASSED ,6.13245e-05,797.128,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,19465109, PASSED 
,6.26849e-05,779.828,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,1860867, PASSED ,0.000382529,26.9538,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,1860867, PASSED ,3.36967e-05,305.984,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,1860867, PASSED ,4.0981e-05,251.596,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,1860867, PASSED ,3.80987e-05,270.63,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,1860867, PASSED ,3.91021e-05,263.685,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,23393656, PASSED ,0.0140217,3.9391,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,23393656, PASSED ,6.39656e-05,863.478,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,23393656, PASSED 
,6.84257e-05,807.196,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,23393656, PASSED ,6.89088e-05,801.537,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,23393656, PASSED ,7.05087e-05,783.349,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,205379, PASSED ,8.54179e-05,28.2635,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,Seq,Base_Seq-direct +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,205379, PASSED ,2.97925e-05,81.0342,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,205379, PASSED ,3.44508e-05,70.0771,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,205379, PASSED ,3.29571e-05,73.2531,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,205379, PASSED ,3.39965e-05,71.0136,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024 +Basic_INDEXLIST_3LOOP,Base_Seq,default,5120000, PASSED 
,0.0214557,9.33421,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,5120000, PASSED ,9.88996e-05,2025.0,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,5120000, PASSED ,0.00010002,2002.31,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,640000, PASSED ,0.00239236,10.4641,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,640000, PASSED ,3.25117e-05,769.998,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,640000, PASSED ,3.24485e-05,771.498,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,7500000, PASSED ,0.0318322,9.21605,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,7500000, PASSED ,0.000129308,2268.75,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,7500000, PASSED 
,0.000129228,2270.15,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,10240000, PASSED ,0.0438102,9.14268,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,10240000, PASSED ,0.000166064,2411.97,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,10240000, PASSED ,0.000165011,2427.37,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,1280000, PASSED ,0.00483921,10.3463,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,1280000, PASSED ,4.55659e-05,1098.8,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,1280000, PASSED ,4.46435e-05,1121.51,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,15000000, PASSED ,0.0647112,9.06695,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,15000000, PASSED 
,0.00022941,2557.58,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,15000000, PASSED ,0.000230662,2543.69,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,160000, PASSED ,0.000572814,10.9259,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,160000, PASSED ,2.21903e-05,282.038,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,160000, PASSED ,2.22217e-05,281.64,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,20000000, PASSED ,0.0865713,9.03661,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,20000000, PASSED ,0.000302183,2588.86,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,20000000, PASSED ,0.000299119,2615.38,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,25000000, PASSED 
,0.108476,9.01477,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,25000000, PASSED ,0.00037706,2593.46,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,25000000, PASSED ,0.000379325,2577.97,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,2560000, PASSED ,0.0104559,9.57698,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,2560000, PASSED ,6.51301e-05,1537.47,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,2560000, PASSED ,6.51145e-05,1537.84,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,30000000, PASSED ,0.130369,9.00109,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,30000000, PASSED ,0.000455261,2577.57,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,30000000, PASSED 
,0.000455036,2578.84,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_INDEXLIST_3LOOP,Base_Seq,default,320000, PASSED ,0.00119101,10.5095,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,320000, PASSED ,2.58341e-05,484.515,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,320000, PASSED ,2.54783e-05,491.281,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_INTSC_HEXHEX,Base_Seq,default,27, PASSED ,0.00147726,0.0762581,3.53728,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,27, PASSED ,0.000311771,0.361332,16.7606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,27, PASSED ,0.000225281,0.500055,23.1954,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,27000, PASSED ,1.46329,0.0769857,3.57103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,27000, PASSED 
,0.250844,0.449095,20.8315,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,27000, PASSED ,0.141463,0.796342,36.9388,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,3375, PASSED ,0.182632,0.0771036,3.5765,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,3375, PASSED ,0.0327277,0.430266,19.9581,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,3375, PASSED ,0.0187506,0.750994,34.8353,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,39304, PASSED ,2.12466,0.0771837,3.58022,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,39304, PASSED ,0.366111,0.447921,20.7771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,39304, PASSED ,0.204343,0.802517,37.2253,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,512, PASSED ,0.0277247,0.0770515,3.57408,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,Seq,Base_Seq-default 
+Apps_INTSC_HEXHEX,Base_HIP,block_64,512, PASSED ,0.00583062,0.366381,16.9948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,512, PASSED ,0.00328654,0.649993,30.1503,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,50653, PASSED ,2.74635,0.0769533,3.56953,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,50653, PASSED ,0.472021,0.447736,20.7685,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,50653, PASSED ,0.262872,0.80397,37.2927,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,6859, PASSED ,0.37231,0.0768661,3.56548,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,6859, PASSED ,0.0646335,0.442773,20.5383,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,6859, PASSED ,0.0369851,0.773771,35.8919,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,74088, PASSED 
,4.02648,0.0767716,3.5611,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,74088, PASSED ,0.68722,0.449811,20.8648,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,74088, PASSED ,0.383453,0.806147,37.3937,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,1000, PASSED ,0.0542098,0.0769662,3.57013,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,1000, PASSED ,0.0105652,0.394913,18.3183,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1000, PASSED ,0.00595544,0.700591,32.4974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,125, PASSED ,0.00677074,0.0770286,3.57302,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,125, PASSED ,0.00141873,0.367612,17.0519,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,125, PASSED ,0.000954474,0.546417,25.3459,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64 
+Apps_INTSC_HEXHEX,Base_Seq,default,97336, PASSED ,5.2692,0.0770738,3.57512,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,97336, PASSED ,0.902761,0.449862,20.8671,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,97336, PASSED ,0.503213,0.807049,37.4355,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,13824, PASSED ,0.752873,0.0766108,3.55364,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,13824, PASSED ,0.129067,0.446885,20.7291,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,13824, PASSED ,0.0729182,0.790999,36.691,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_INTSC_HEXHEX,Base_Seq,default,1728, PASSED ,0.0936811,0.0769608,3.56988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_INTSC_HEXHEX,Base_HIP,block_64,1728, PASSED ,0.0174537,0.41308,19.161,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1728, PASSED 
,0.00994384,0.72505,33.6319,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64 +Apps_LTIMES,Base_Seq,default,2496, PASSED ,1.95521e-05,8.93438,6.38293,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,2496, PASSED ,3.70802e-06,47.1104,33.6568,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,2496, PASSED ,3.83124e-06,45.5952,32.5743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,2496, PASSED ,3.75522e-06,46.5183,33.2337,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,2477568, PASSED ,0.0207453,8.30493,5.9714,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,2477568, PASSED ,0.000184334,934.653,672.033,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,2477568, PASSED ,0.000224573,767.18,551.617,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,2477568, PASSED ,0.00018837,914.626,657.633,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,309696, PASSED 
,0.00257141,8.37555,6.0219,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,309696, PASSED ,2.74214e-05,785.409,564.698,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,309696, PASSED ,3.15374e-05,682.903,490.998,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,309696, PASSED ,2.74012e-05,785.988,565.114,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,3629184, PASSED ,0.0303343,8.31962,5.98197,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,3629184, PASSED ,0.000264118,955.521,687.039,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,3629184, PASSED ,0.000322658,782.16,562.389,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,3629184, PASSED ,0.000273066,924.21,664.526,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,38784, PASSED ,0.00031834,8.47555,6.0916,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,38784, PASSED 
,6.05724e-06,445.435,320.146,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,38784, PASSED ,6.58626e-06,409.657,294.431,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,38784, PASSED ,5.98406e-06,450.883,324.061,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,4954944, PASSED ,0.0419168,8.22013,5.91045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,4954944, PASSED ,0.000362769,949.809,682.933,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,4954944, PASSED ,0.000436548,789.287,567.514,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,4954944, PASSED ,0.000367023,938.802,675.018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,619392, PASSED ,0.00522313,8.24656,5.92931,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,619392, PASSED ,4.84989e-05,888.12,638.563,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,619392, PASSED 
,5.7929e-05,743.546,534.613,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,619392, PASSED ,4.90095e-05,878.867,631.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,7258176, PASSED ,0.0614895,8.20832,5.90196,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,7258176, PASSED ,0.000526956,957.814,688.689,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,7258176, PASSED ,0.000649703,776.856,558.576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,7258176, PASSED ,0.000532582,947.696,681.414,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,77568, PASSED ,0.000641311,8.41261,6.04761,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,77568, PASSED ,1.26181e-05,427.568,307.368,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,77568, PASSED ,1.16179e-05,464.379,333.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,77568, PASSED 
,1.04175e-05,517.889,372.297,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,9792, PASSED ,7.83175e-05,8.70866,6.25147,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,9792, PASSED ,3.83384e-06,177.9,127.705,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,9792, PASSED ,3.97904e-06,171.408,123.045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,9792, PASSED ,3.92042e-06,173.971,124.885,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,9677568, PASSED ,0.0819931,8.20761,5.90146,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,9677568, PASSED ,0.000702501,957.959,688.794,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,9677568, PASSED ,0.000868057,775.257,557.427,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,9677568, PASSED ,0.000706936,951.949,684.472,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,1238784, PASSED 
,0.0103567,8.31775,5.98058,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,1238784, PASSED ,9.43452e-05,913.079,656.516,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,1238784, PASSED ,0.000114949,749.416,538.841,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,1238784, PASSED ,9.62853e-05,894.681,643.288,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_LTIMES,Base_Seq,default,154944, PASSED ,0.00128502,8.38568,6.02887,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_LTIMES,Base_HIP,block_256,154944, PASSED ,1.61333e-05,667.919,480.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_LTIMES,RAJA_HIP,kernel_256,154944, PASSED ,1.85771e-05,580.054,417.029,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256 +Apps_LTIMES,RAJA_HIP,launch_256,154944, PASSED ,1.62207e-05,664.319,477.611,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-launch_256 +Apps_MASS3DPA,Base_Seq,default,3200, PASSED ,2.25147e-05,5.25832,11.2571,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,3200, PASSED 
,4.04002e-06,29.3042,62.7348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,3200, PASSED ,4.10964e-06,28.8078,61.6721,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,3237952, PASSED ,0.0231565,5.16021,11.0749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,3237952, PASSED ,9.71754e-05,1229.66,2639.1,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,3237952, PASSED ,9.78902e-05,1220.68,2619.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,404736, PASSED ,0.0028618,5.21928,11.2015,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,404736, PASSED ,1.80949e-05,825.456,1771.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,404736, PASSED ,1.80643e-05,826.853,1774.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,4743104, PASSED ,0.0339704,5.15267,11.0587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,4743104, PASSED 
,0.000139999,1250.28,2683.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,4743104, PASSED ,0.000144515,1211.21,2599.51,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,50624, PASSED ,0.000361022,5.17562,11.1062,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,50624, PASSED ,5.50582e-06,339.37,728.244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,50624, PASSED ,5.53322e-06,337.689,724.638,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,6475904, PASSED ,0.0463681,5.15408,11.0617,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,6475904, PASSED ,0.000198729,1202.57,2580.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,6475904, PASSED ,0.000200741,1190.51,2555.09,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,809536, PASSED ,0.00571927,5.22359,11.2108,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,809536, PASSED 
,2.92014e-05,1023.07,2195.71,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,809536, PASSED ,2.89112e-05,1033.34,2217.75,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,9486208, PASSED ,0.0681196,5.13914,11.0297,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,9486208, PASSED ,0.000300901,1163.42,2496.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,9486208, PASSED ,0.000301675,1160.44,2490.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,101184, PASSED ,0.000717815,5.2024,11.1646,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,101184, PASSED ,8.00744e-06,466.361,1000.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,101184, PASSED ,8.05586e-06,463.558,994.815,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,12672, PASSED ,8.8877e-05,5.26504,11.2927,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,12672, PASSED 
,4.14544e-06,112.881,242.112,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,12672, PASSED ,4.16802e-06,112.269,240.801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,12648256, PASSED ,0.0905535,5.1546,11.0629,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,12648256, PASSED ,0.000398865,1170.24,2511.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,12648256, PASSED ,0.000398662,1170.83,2512.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,1619008, PASSED ,0.0115608,5.16814,11.0919,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,1619008, PASSED ,5.06945e-05,1178.58,2529.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,1619008, PASSED ,5.03579e-05,1186.46,2546.38,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MASS3DPA,Base_Seq,default,202368, PASSED ,0.00143467,5.20566,11.172,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MASS3DPA,Base_HIP,block_25,202368, PASSED 
,1.30157e-05,573.802,1231.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_25 +Apps_MASS3DPA,RAJA_HIP,block_25,202368, PASSED ,1.31381e-05,568.456,1219.98,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_25 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,216, PASSED ,2.36631e-06,15.2267,4.83791,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,216, PASSED ,4.75473e-06,7.57793,2.40771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,216, PASSED ,3.81712e-06,9.43932,2.99912,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,681472, PASSED ,0.018253,4.83293,1.97875,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,681472, PASSED ,3.85147e-05,2290.43,937.771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,681472, PASSED ,3.79982e-05,2321.56,950.518,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,79507, PASSED 
,0.000873478,12.0474,4.82424,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,79507, PASSED ,6.34674e-06,1658.04,663.943,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,79507, PASSED ,6.02293e-06,1747.18,699.638,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1000000, PASSED ,0.0300624,4.29488,1.763,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,1000000, PASSED ,6.7599e-05,1910.0,784.035,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,1000000, PASSED ,6.79095e-05,1901.27,780.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,8000, PASSED ,9.32202e-05,11.9161,4.54837,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,8000, PASSED ,4.66063e-06,238.342,90.9748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,8000, PASSED 
,3.86673e-06,287.277,109.653,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1404928, PASSED ,0.0394168,4.59264,1.88907,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,1404928, PASSED ,9.20251e-05,1967.15,809.14,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,1404928, PASSED ,9.25979e-05,1954.98,804.134,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,157464, PASSED ,0.00181254,11.3978,4.60436,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,157464, PASSED ,1.02002e-05,2025.36,818.182,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,157464, PASSED ,1.00606e-05,2053.46,829.536,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,2048383, PASSED ,0.0576281,4.57083,1.88388,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,2048383, PASSED 
,0.000141351,1863.51,768.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,2048383, PASSED ,0.000142007,1854.89,764.498,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,17576, PASSED ,0.000195281,12.2455,4.77019,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,17576, PASSED ,4.52192e-06,528.826,206.003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,17576, PASSED ,3.80982e-06,627.67,244.507,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1331, PASSED ,1.42649e-05,13.8755,4.94522,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,1331, PASSED ,4.57743e-06,43.2409,15.411,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,1331, PASSED ,3.91033e-06,50.6178,18.0402,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,2744000, PASSED 
,0.0822107,4.28615,1.76902,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,2744000, PASSED ,0.000205224,1716.99,708.65,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,2744000, PASSED ,0.000204514,1722.95,711.109,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,328509, PASSED ,0.00625949,6.83387,2.78153,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,328509, PASSED ,2.16278e-05,1977.85,805.027,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,328509, PASSED ,2.10344e-05,2033.64,827.737,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,35937, PASSED ,0.000401969,11.9863,4.73832,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,35937, PASSED ,4.53022e-06,1063.56,420.435,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,35937, PASSED 
,3.91032e-06,1232.16,487.086,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256 +Basic_MULTI_REDUCE,Base_Seq,default,6245, PASSED ,1.98491e-05,4.69577,0.314624,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,6245, PASSED ,1.20215e-05,7.75335,0.519487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,6245, PASSED ,1.21025e-05,7.70146,0.51601,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,6245, PASSED ,1.24317e-05,7.49752,0.502346,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,6245, PASSED ,1.25653e-05,7.4178,0.497004,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,6399995, PASSED ,0.0208347,4.57733,0.307179,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,6399995, PASSED ,3.731e-05,2556.08,171.536,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,6399995, PASSED 
,3.78774e-05,2517.79,168.966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,6399995, PASSED ,4.07432e-05,2340.7,157.081,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,6399995, PASSED ,3.8397e-05,2483.72,166.679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,799995, PASSED ,0.00259813,4.58831,0.307912,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,799995, PASSED ,1.37333e-05,868.036,58.2522,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,799995, PASSED ,1.36129e-05,875.715,58.7675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,799995, PASSED ,1.46365e-05,814.472,54.6576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,799995, PASSED ,1.40993e-05,845.504,56.7401,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,9374995, PASSED 
,0.0305264,4.57632,0.307111,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,9374995, PASSED ,4.86873e-05,2869.3,192.555,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,9374995, PASSED ,4.85745e-05,2875.96,193.002,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,9374995, PASSED ,5.22557e-05,2673.36,179.406,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,9374995, PASSED ,4.92373e-05,2837.25,190.404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,99995, PASSED ,0.000324259,4.59568,0.30838,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,99995, PASSED ,1.16043e-05,128.418,8.61709,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,99995, PASSED ,1.17173e-05,127.179,8.53398,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,99995, PASSED 
,1.21031e-05,123.125,8.26195,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,99995, PASSED ,1.21883e-05,122.264,8.20421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,12799995, PASSED ,0.0416726,4.57698,0.307156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,12799995, PASSED ,6.75148e-05,2825.08,189.588,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,12799995, PASSED ,6.43008e-05,2966.29,199.064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,12799995, PASSED ,7.42704e-05,2568.11,172.343,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,12799995, PASSED ,6.51102e-05,2929.42,196.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,1599995, PASSED ,0.00519933,4.58558,0.307731,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,1599995, PASSED 
,1.58965e-05,1499.82,100.651,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,1599995, PASSED ,1.54661e-05,1541.56,103.452,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,1599995, PASSED ,1.74297e-05,1367.89,91.7972,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,1599995, PASSED ,1.63223e-05,1460.7,98.0251,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,18749995, PASSED ,0.0610529,4.57631,0.307111,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,18749995, PASSED ,0.000107477,2599.61,174.457,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,18749995, PASSED ,9.90932e-05,2819.54,189.216,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,18749995, PASSED ,0.000118481,2358.17,158.254,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,18749995, PASSED 
,9.97958e-05,2799.69,187.884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,199995, PASSED ,0.000649242,4.59044,0.308044,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,199995, PASSED ,1.19389e-05,249.63,16.7516,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,199995, PASSED ,1.19149e-05,250.134,16.7853,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,199995, PASSED ,1.23115e-05,242.075,16.2446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,199995, PASSED ,1.28219e-05,232.439,15.5979,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,24995, PASSED ,8.08595e-05,4.60804,0.309117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,24995, PASSED ,1.17253e-05,31.7778,2.13172,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,24995, PASSED 
,1.17041e-05,31.8354,2.13558,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,24995, PASSED ,1.25133e-05,29.7767,1.99748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,24995, PASSED ,1.24671e-05,29.887,2.00488,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,24999995, PASSED ,0.0813809,4.5776,0.307197,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,24999995, PASSED ,0.000148723,2504.85,168.098,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,24999995, PASSED ,0.000137212,2714.98,182.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,24999995, PASSED ,0.000164707,2261.77,151.785,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,24999995, PASSED ,0.000137989,2699.7,181.174,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,3199995, PASSED 
,0.0104134,4.57907,0.307295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,3199995, PASSED ,2.44475e-05,1950.45,130.892,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,3199995, PASSED ,2.39544e-05,1990.61,133.587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,3199995, PASSED ,2.55426e-05,1866.84,125.281,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,3199995, PASSED ,2.52989e-05,1884.81,126.487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,Base_Seq,default,399995, PASSED ,0.00129884,4.58914,0.307964,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,399995, PASSED ,1.22521e-05,486.492,32.6471,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,399995, PASSED ,1.19757e-05,497.721,33.4007,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,399995, PASSED 
,1.29259e-05,461.132,30.9453,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,399995, PASSED ,1.35313e-05,440.501,29.5608,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256 +Basic_REDUCE_STRUCT,Base_Seq,default,6250, PASSED ,5.19982e-06,17.9107,2.40431,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,6250, PASSED ,2.03471e-05,4.57718,0.614436,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,6250, PASSED ,1.00618e-05,9.25599,1.24252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,6250, PASSED ,2.08753e-05,4.46136,0.59889,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,6250, PASSED ,2.06031e-05,4.5203,0.606802,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,6250, PASSED ,2.44063e-05,3.81591,0.512244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,6250, PASSED 
,1.99951e-05,4.65775,0.625253,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,6250, PASSED ,3.54508e-05,2.62709,0.352658,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,6250, PASSED ,2.43125e-05,3.83063,0.514221,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,6250, PASSED ,2.00713e-05,4.64007,0.622879,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,6250, PASSED ,3.59216e-05,2.59265,0.348036,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,6400000, PASSED ,0.00556897,17.1248,2.29845,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,6400000, PASSED ,0.0208567,4.57251,0.613712,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,6400000, PASSED ,0.0101829,9.36547,1.25701,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,6400000, PASSED 
,0.00441144,21.6182,2.90154,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,6400000, PASSED ,0.000166293,573.49,76.9726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,6400000, PASSED ,0.000232023,411.026,55.167,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,6400000, PASSED ,0.000262201,363.719,48.8176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,6400000, PASSED ,0.00392498,24.2975,3.26116,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,6400000, PASSED ,5.53541e-05,1722.86,231.239,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,6400000, PASSED ,6.09455e-05,1564.8,210.024,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,6400000, PASSED ,0.000296165,322.008,43.2192,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 
+Basic_REDUCE_STRUCT,Base_Seq,default,800000, PASSED ,0.00066195,18.0088,2.4171,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,800000, PASSED ,0.00259773,4.58898,0.615924,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,800000, PASSED ,0.00125911,9.46773,1.27074,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,800000, PASSED ,0.000483924,24.6339,3.30631,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,800000, PASSED ,0.000168995,70.54,9.46774,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,800000, PASSED ,5.01795e-05,237.566,31.8856,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,800000, PASSED ,4.94938e-05,240.857,32.3273,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,800000, PASSED ,0.000493959,24.1335,3.23914,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,800000, 
PASSED ,3.4287e-05,347.681,46.665,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,800000, PASSED ,3.62e-05,329.308,44.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,800000, PASSED ,0.000259835,45.8789,6.15777,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,9375000, PASSED ,0.00821376,17.0078,2.28275,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,9375000, PASSED ,0.0305676,4.57014,0.613394,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,9375000, PASSED ,0.0149403,9.35046,1.255,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,9375000, PASSED ,0.00652613,21.406,2.87306,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,9375000, PASSED ,0.000170969,817.096,109.669,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,9375000, PASSED 
,0.000328871,424.781,57.0132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,9375000, PASSED ,0.000375164,372.367,49.9782,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,9375000, PASSED ,0.00604758,23.0999,3.10041,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,9375000, PASSED ,6.92307e-05,2017.87,270.833,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,9375000, PASSED ,7.29238e-05,1915.68,257.118,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,9375000, PASSED ,0.000307589,454.172,60.958,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,100000, PASSED ,8.30334e-05,17.946,2.40869,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,100000, PASSED ,0.000324906,4.58631,0.61557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,100000, PASSED 
,0.000157787,9.44387,1.26755,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,100000, PASSED ,6.97415e-05,21.3663,2.86776,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,100000, PASSED ,6.54959e-05,22.7513,3.05366,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,100000, PASSED ,2.63273e-05,56.5996,7.59675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,100000, PASSED ,3.11647e-05,47.8142,6.41757,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,100000, PASSED ,8.6829e-05,17.1615,2.3034,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,100000, PASSED ,2.59281e-05,57.471,7.7137,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,100000, PASSED ,3.12357e-05,47.7055,6.40299,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,100000, PASSED 
,8.68172e-05,17.1638,2.30371,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,12800000, PASSED ,0.0112137,17.0091,2.28292,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,12800000, PASSED ,0.0417403,4.56956,0.613316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,12800000, PASSED ,0.020403,9.34837,1.25472,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,12800000, PASSED ,0.00982728,19.4087,2.60499,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,12800000, PASSED ,0.000206687,922.82,123.859,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,12800000, PASSED ,0.000458595,415.911,55.8227,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,12800000, PASSED ,0.000515045,370.326,49.7044,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,12800000, PASSED 
,0.00804758,23.7009,3.18108,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,12800000, PASSED ,8.70784e-05,2190.38,293.988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,12800000, PASSED ,9.37924e-05,2033.58,272.943,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,12800000, PASSED ,0.000349956,545.025,73.1521,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,1600000, PASSED ,0.00134078,17.782,2.38666,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,1600000, PASSED ,0.00520034,4.58467,0.615345,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,1600000, PASSED ,0.00252808,9.43083,1.26578,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,1600000, PASSED ,0.00109193,21.8346,2.93059,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,1600000, PASSED 
,0.000163972,145.402,19.5156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,1600000, PASSED ,7.65216e-05,311.57,41.8183,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,1600000, PASSED ,8.07812e-05,295.141,39.6132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,1600000, PASSED ,0.000972593,24.5137,3.29018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,1600000, PASSED ,3.60642e-05,661.095,88.7308,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,1600000, PASSED ,3.9808e-05,598.921,80.3859,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,1600000, PASSED ,0.000263307,90.5478,12.1531,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,18750000, PASSED ,0.0162389,17.2053,2.30926,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,18750000, PASSED 
,0.0610956,4.57311,0.613792,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,18750000, PASSED ,0.0298362,9.36435,1.25686,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,18750000, PASSED ,0.0144824,19.2922,2.58935,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,18750000, PASSED ,0.000259151,1078.12,144.703,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,18750000, PASSED ,0.000660779,422.829,56.7512,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,18750000, PASSED ,0.000754108,370.5,49.7276,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,18750000, PASSED ,0.0120397,23.2064,3.11471,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,18750000, PASSED ,0.000129771,2153.0,288.97,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,18750000, PASSED 
,0.000139191,2007.29,269.415,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,18750000, PASSED ,0.000414244,674.473,90.5263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,200000, PASSED ,0.000166237,17.9276,2.40622,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,200000, PASSED ,0.000649693,4.58714,0.615679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,200000, PASSED ,0.000316136,9.42705,1.26528,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,200000, PASSED ,9.46401e-05,31.4902,4.22656,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,200000, PASSED ,9.1948e-05,32.4121,4.3503,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,200000, PASSED ,2.85391e-05,104.426,14.0159,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,200000, PASSED 
,3.2582e-05,91.4688,12.2768,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,200000, PASSED ,0.000141193,21.1074,2.83301,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,200000, PASSED ,2.81509e-05,105.866,14.2092,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,200000, PASSED ,3.28596e-05,90.696,12.1731,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,200000, PASSED ,0.000141433,21.0717,2.82821,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,25000, PASSED ,2.03879e-05,18.2721,2.45253,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,25000, PASSED ,8.11766e-05,4.58912,0.615966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,25000, PASSED ,3.92202e-05,9.4984,1.2749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,25000, PASSED 
,3.24748e-05,11.4713,1.53972,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,25000, PASSED ,3.24142e-05,11.4928,1.5426,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,25000, PASSED ,2.42381e-05,15.3696,2.06295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,25000, PASSED ,3.00259e-05,12.4069,1.66529,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,25000, PASSED ,4.67176e-05,7.97406,1.0703,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,25000, PASSED ,2.42181e-05,15.3823,2.06465,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,25000, PASSED ,3.00034e-05,12.4162,1.66655,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,25000, PASSED ,4.70294e-05,7.92119,1.06321,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,25000000, PASSED 
,0.0215959,17.25,2.31526,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,25000000, PASSED ,0.0814538,4.5735,0.613845,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,25000000, PASSED ,0.0397722,9.36658,1.25716,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,25000000, PASSED ,0.0193672,19.2351,2.58168,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,25000000, PASSED ,0.00031761,1172.91,157.426,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,25000000, PASSED ,0.000887937,419.544,56.3103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,25000000, PASSED ,0.00100237,371.649,49.8818,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,25000000, PASSED ,0.0172681,21.5732,2.89551,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,25000000, PASSED 
,0.000167884,2218.97,297.825,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,25000000, PASSED ,0.000176688,2108.4,282.985,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,25000000, PASSED ,0.000485771,766.882,102.929,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,3200000, PASSED ,0.00275952,17.2797,2.31924,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,3200000, PASSED ,0.0104246,4.57414,0.61393,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,3200000, PASSED ,0.00509462,9.35962,1.25623,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,3200000, PASSED ,0.00221362,21.541,2.89119,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,3200000, PASSED ,0.00015563,306.391,41.1232,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,3200000, PASSED 
,0.000129265,368.882,49.5105,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,3200000, PASSED ,0.000143662,331.915,44.5489,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,3200000, PASSED ,0.001949,24.4658,3.28374,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,3200000, PASSED ,4.36898e-05,1091.42,146.487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,3200000, PASSED ,4.80958e-05,991.432,133.068,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,3200000, PASSED ,0.000275825,172.877,23.2031,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 +Basic_REDUCE_STRUCT,Base_Seq,default,400000, PASSED ,0.000331718,17.9685,2.41169,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default +Basic_REDUCE_STRUCT,Base_Seq,kahan,400000, PASSED ,0.00129906,4.58829,0.615832,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-kahan +Basic_REDUCE_STRUCT,Base_Seq,cascade,400000, PASSED 
,0.000630239,9.45746,1.26936,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-cascade +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,400000, PASSED ,0.000215857,27.613,3.70616,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,400000, PASSED ,0.000160878,37.0496,4.97273,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,400000, PASSED ,3.34982e-05,177.934,23.882,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,400000, PASSED ,3.5396e-05,168.394,22.6015,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,400000, PASSED ,0.000255073,23.3677,3.13637,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,400000, PASSED ,3.34524e-05,178.178,23.9147,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,400000, PASSED ,3.52076e-05,169.295,22.7224,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,400000, PASSED 
,0.000256678,23.2215,3.11675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_CONVECTION3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_CONVECTION3DPA_bandwidth.png new file mode 100644 index 0000000..7f45893 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_CONVECTION3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_CONVECTION3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_CONVECTION3DPA_flops.png new file mode 100644 index 0000000..3408b08 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_CONVECTION3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png new file mode 100644 index 0000000..3b1deec Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_DEL_DOT_VEC_2D_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_DEL_DOT_VEC_2D_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_DEL_DOT_VEC_2D_flops.png new file mode 100644 index 0000000..8263970 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_DEL_DOT_VEC_2D_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_INTSC_HEXHEX_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_INTSC_HEXHEX_bandwidth.png new file mode 
100644 index 0000000..024828c Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_INTSC_HEXHEX_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_INTSC_HEXHEX_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_INTSC_HEXHEX_flops.png new file mode 100644 index 0000000..f1e0390 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_INTSC_HEXHEX_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_LTIMES_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_LTIMES_bandwidth.png new file mode 100644 index 0000000..414dc9b Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_LTIMES_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_LTIMES_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_LTIMES_flops.png new file mode 100644 index 0000000..9465556 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_LTIMES_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MASS3DPA_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MASS3DPA_bandwidth.png new file mode 100644 index 0000000..0ff90f3 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MASS3DPA_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MASS3DPA_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MASS3DPA_flops.png new file mode 100644 index 0000000..d452708 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MASS3DPA_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png new file mode 100644 index 0000000..aeb8d0a Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MATVEC_3D_STENCIL_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MATVEC_3D_STENCIL_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MATVEC_3D_STENCIL_flops.png new file mode 100644 index 0000000..3a01d36 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Apps_MATVEC_3D_STENCIL_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_INDEXLIST_3LOOP_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_INDEXLIST_3LOOP_bandwidth.png new file mode 100644 index 0000000..bfa2027 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_INDEXLIST_3LOOP_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_INDEXLIST_3LOOP_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_INDEXLIST_3LOOP_flops.png new file mode 100644 index 0000000..30cb1ce Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_INDEXLIST_3LOOP_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_MULTI_REDUCE_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_MULTI_REDUCE_bandwidth.png new file mode 100644 index 0000000..68f062c Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_MULTI_REDUCE_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_MULTI_REDUCE_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_MULTI_REDUCE_flops.png new file mode 100644 index 0000000..f904a6d Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_MULTI_REDUCE_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_REDUCE_STRUCT_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_REDUCE_STRUCT_bandwidth.png new file mode 100644 index 0000000..d3a5148 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_REDUCE_STRUCT_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_REDUCE_STRUCT_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_REDUCE_STRUCT_flops.png new file mode 100644 index 0000000..993df29 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Basic_REDUCE_STRUCT_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Comm_HALO_PACKING_FUSED_bandwidth.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Comm_HALO_PACKING_FUSED_bandwidth.png new file mode 100644 index 0000000..bc6a471 Binary files /dev/null and b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Comm_HALO_PACKING_FUSED_bandwidth.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Comm_HALO_PACKING_FUSED_flops.png b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Comm_HALO_PACKING_FUSED_flops.png new file mode 100644 index 0000000..cc98dd6 Binary files /dev/null and 
b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/figures/Comm_HALO_PACKING_FUSED_flops.png differ diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/output_with_variant_tuning.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/output_with_variant_tuning.csv new file mode 100644 index 0000000..b1ed284 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/output_with_variant_tuning.csv @@ -0,0 +1,552 @@ +Kernel,Variant,Tuning,Problem size,Checksum,Mean time per rep (sec.),Bandwidth (GiB per sec.),Mean gFlops (gigaFLOP per sec.),__source_file__,Backend,Variant_Tuning,Smoothed Mean flops (gigaFLOP per sec.),Smoothed Bandwidth (GiB per sec.) +Apps_CONVECTION3DPA,Base_Seq,default,1377, PASSED ,1.35042e-05,7.70152,13.9092,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,13.9092,7.70152 +Apps_CONVECTION3DPA,Base_HIP,block_64,1377, PASSED ,3.6214e-06,28.7189,51.8675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,203.569,112.498 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,1377, PASSED ,3.70538e-06,28.068,50.692,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,196.974,108.853 +Apps_CONVECTION3DPA,Base_Seq,default,1404891, PASSED ,0.0487508,2.17096,3.93096,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,3.93096,2.17096 +Apps_CONVECTION3DPA,Base_HIP,block_64,1404891, PASSED ,8.0564e-05,1313.69,2378.7,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,2366.62,1307.01 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,1404891, 
PASSED ,8.1063e-05,1305.6,2364.06,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2364.06,1305.6 +Apps_CONVECTION3DPA,Base_Seq,default,175608, PASSED ,0.00187299,7.0633,12.7893,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,12.7893,7.0633 +Apps_CONVECTION3DPA,Base_HIP,block_64,175608, PASSED ,1.28408e-05,1030.27,1865.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,1865.48,1030.27 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,175608, PASSED ,1.30574e-05,1013.18,1834.54,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1834.54,1013.18 +Apps_CONVECTION3DPA,Base_Seq,default,2057940, PASSED ,0.0733744,2.1129,3.82584,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,3.82584,2.1129 +Apps_CONVECTION3DPA,Base_HIP,block_64,2057940, PASSED ,0.000118616,1307.01,2366.62,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,2366.62,1307.01 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,2057940, PASSED ,0.000118668,1306.44,2365.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2364.06,1305.6 +Apps_CONVECTION3DPA,Base_Seq,default,21951, PASSED ,0.000246666,6.7051,12.139,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,12.8021,7.07049 +Apps_CONVECTION3DPA,Base_HIP,block_64,21951, PASSED 
,3.8242e-06,432.487,782.982,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,782.982,432.487 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,21951, PASSED ,3.9858e-06,414.952,751.237,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,751.237,414.952 +Apps_CONVECTION3DPA,Base_Seq,default,2809755, PASSED ,0.101386,2.08775,3.7803,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,3.7803,2.08775 +Apps_CONVECTION3DPA,Base_HIP,block_64,2809755, PASSED ,0.000167312,1265.12,2290.76,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,2290.76,1265.12 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,2809755, PASSED ,0.000169284,1250.38,2264.07,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2275.59,1256.74 +Apps_CONVECTION3DPA,Base_Seq,default,351216, PASSED ,0.00488318,5.41833,9.81092,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,9.81092,5.41833 +Apps_CONVECTION3DPA,Base_HIP,block_64,351216, PASSED ,2.22096e-05,1191.32,2157.11,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,2157.11,1191.32 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,351216, PASSED ,2.21815e-05,1192.82,2159.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2159.83,1192.82 +Apps_CONVECTION3DPA,Base_Seq,default,4115853, PASSED 
,0.151362,2.04849,3.70921,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,3.7597199999999997,2.076385 +Apps_CONVECTION3DPA,Base_HIP,block_64,4115853, PASSED ,0.000247403,1253.27,2269.31,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,2280.035,1259.195 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,4115853, PASSED ,0.00024672,1256.74,2275.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2269.83,1253.56 +Apps_CONVECTION3DPA,Base_Seq,default,43902, PASSED ,0.0004679,7.06895,12.7988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,12.7988,7.06895 +Apps_CONVECTION3DPA,Base_HIP,block_64,43902, PASSED ,5.1816e-06,638.329,1155.74,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,1155.74,638.329 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,43902, PASSED ,5.149e-06,642.371,1163.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1163.05,642.371 +Apps_CONVECTION3DPA,Base_Seq,default,5508, PASSED ,5.37251e-05,7.72835,13.9848,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,13.354,7.385235 +Apps_CONVECTION3DPA,Base_HIP,block_64,5508, PASSED ,3.6908e-06,112.498,203.569,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,493.27549999999997,272.4925 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,5508, PASSED 
,3.81438e-06,108.853,196.974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,474.1055,261.9025 +Apps_CONVECTION3DPA,Base_Seq,default,5487804, PASSED ,0.2002,2.06502,3.73914,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,3.73914,2.06502 +Apps_CONVECTION3DPA,Base_HIP,block_64,5487804, PASSED ,0.000337728,1224.11,2216.51,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,2269.31,1253.27 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,5487804, PASSED ,0.000339396,1218.09,2205.61,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2264.07,1250.38 +Apps_CONVECTION3DPA,Base_Seq,default,702459, PASSED ,0.0200641,2.6375,4.77572,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,4.77572,2.6375 +Apps_CONVECTION3DPA,Base_HIP,block_64,702459, PASSED ,3.90719e-05,1354.4,2452.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,2366.62,1307.01 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,702459, PASSED ,3.91937e-05,1350.19,2444.8,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,2364.06,1305.6 +Apps_CONVECTION3DPA,Base_Seq,default,87804, PASSED ,0.00093556,7.07049,12.8021,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,12.7893,7.0633 +Apps_CONVECTION3DPA,Base_HIP,block_64,87804, PASSED 
,7.67038e-06,862.391,1561.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,1561.48,862.391 +Apps_CONVECTION3DPA,RAJA_HIP,block_64,87804, PASSED ,7.86658e-06,840.882,1522.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/CONVECTION3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,1522.53,840.882 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1849, PASSED ,1.21456e-05,7.01899,8.22078,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,8.26791,6.94882 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1849, PASSED ,3.23171e-06,26.3791,30.8957,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,154.834,130.131 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1849, PASSED ,2.70401e-06,31.5271,36.9252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,152.791,128.414 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,2125764, PASSED ,0.0141266,6.73309,8.12587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,8.12587,6.73309 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,2125764, PASSED ,4.05143e-05,2347.72,2833.35,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,2491.61,2064.0 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,2125764, PASSED ,4.00609e-05,2374.29,2865.42,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2475.08,2050.3 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,264196, PASSED 
,0.00172742,6.8548,8.25887,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,8.28088,6.86785 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,264196, PASSED ,6.85643e-06,1727.01,2080.76,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,2003.36,1661.51 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,264196, PASSED ,7.20583e-06,1643.27,1979.87,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,1979.87,1643.27 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,3115225, PASSED ,0.0207372,6.72062,8.1121,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,8.1121,6.72062 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,3115225, PASSED ,6.47138e-05,2153.59,2599.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,2491.61,2064.0 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,3115225, PASSED ,6.53628e-05,2132.2,2573.67,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2475.08,2050.3 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,32400, PASSED ,0.000210886,6.91914,8.29641,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,8.28894,6.91914 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,32400, PASSED ,3.13731e-06,465.096,557.675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,557.675,465.096 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,32400, PASSED 
,2.79061e-06,522.879,626.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,626.96,522.879 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,4255969, PASSED ,0.0305351,6.23478,7.5265,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,7.85359,6.50454 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,4255969, PASSED ,9.22383e-05,2064.0,2491.61,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,2491.61,2064.0 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,4255969, PASSED ,9.28546e-05,2050.3,2475.08,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2475.08,2050.3 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,528529, PASSED ,0.00344656,6.86785,8.28088,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,8.25887,6.8548 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,528529, PASSED ,1.42464e-05,1661.51,2003.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,2080.76,1727.01 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,528529, PASSED ,1.41253e-05,1675.75,2020.53,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2020.53,1675.75 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,6235009, PASSED ,0.0450532,6.18992,7.47318,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,7.690045,6.36966 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,6235009, PASSED 
,0.000155575,1792.54,2164.16,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,2344.92,1942.315 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,6235009, PASSED ,0.000153506,1816.71,2193.34,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2347.13,1944.14 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,65025, PASSED ,0.000423619,6.89789,8.28894,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,8.28894,6.90635 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,65025, PASSED ,3.35581e-06,870.75,1046.35,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,1046.35,870.75 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,65025, PASSED ,3.30792e-06,883.357,1061.5,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,1061.5,883.357 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,7744, PASSED ,5.05782e-05,6.94882,8.26791,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,8.278425,6.93398 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,7744, PASSED ,2.70081e-06,130.131,154.834,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,356.2545,297.6135 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,7744, PASSED ,2.73691e-06,128.414,152.791,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,389.8755,325.6465 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,8317456, PASSED 
,0.0571895,6.50454,7.85359,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,7.5265,6.23478 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,8317456, PASSED ,0.00020432,1820.63,2198.23,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,2198.23,1820.63 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,8317456, PASSED ,0.000202391,1837.98,2219.18,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2219.18,1837.98 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,1060900, PASSED ,0.00698615,6.79735,8.20031,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,8.20031,6.79735 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,1060900, PASSED ,2.63133e-05,1804.69,2177.17,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,2177.17,1804.69 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,1060900, PASSED ,2.64515e-05,1795.26,2165.8,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,2165.8,1795.26 +Apps_DEL_DOT_VEC_2D,Base_Seq,default,131044, PASSED ,0.000851352,6.90635,8.31193,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,8.28894,6.89789 +Apps_DEL_DOT_VEC_2D,Base_HIP,block_256,131044, PASSED ,4.09401e-06,1436.18,1728.47,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,1728.47,1436.18 +Apps_DEL_DOT_VEC_2D,RAJA_HIP,block_256,131044, 
PASSED ,4.05161e-06,1451.21,1746.56,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/DEL_DOT_VEC_2D_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,1746.56,1451.21 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,3796416, PASSED ,0.000731173,22.6057,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,22.6057 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,3796416, PASSED ,3.6617e-05,451.394,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,451.394 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,3796416, PASSED ,4.53192e-05,364.717,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,364.717 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,3796416, PASSED ,4.05675e-05,407.436,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,407.436 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,3796416, PASSED ,4.25642e-05,388.323,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,388.323 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,421875, PASSED ,0.000134486,28.801,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,28.2635 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,421875, PASSED ,2.95255e-05,131.186,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,131.186 
+Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,421875, PASSED ,3.48688e-05,111.083,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,111.083 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,421875, PASSED ,3.24459e-05,119.378,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,119.378 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,421875, PASSED ,3.35106e-05,115.585,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,115.585 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,5639752, PASSED ,0.00149626,14.3594,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,14.3594 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,5639752, PASSED ,3.92868e-05,546.885,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,546.885 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,5639752, PASSED ,4.53836e-05,473.418,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,473.418 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,5639752, PASSED ,4.3017e-05,499.463,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,499.463 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,5639752, PASSED 
,4.5043e-05,476.998,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,476.998 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,7762392, PASSED ,0.00297628,8.92213,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,8.92213 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,7762392, PASSED ,4.76344e-05,557.471,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,557.471 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,7762392, PASSED ,5.35781e-05,495.627,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,495.627 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,7762392, PASSED ,5.02461e-05,528.494,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,528.494 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,7762392, PASSED ,5.16985e-05,513.647,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,513.647 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,884736, PASSED ,0.000232092,27.1852,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,27.1852 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,884736, PASSED ,3.23362e-05,195.121,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,195.121 
+Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,884736, PASSED ,3.91926e-05,160.986,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,160.986 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,884736, PASSED ,3.62058e-05,174.266,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,174.266 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,884736, PASSED ,3.80287e-05,165.913,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,165.913 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,11543176, PASSED ,0.00418816,8.25019,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,8.25019 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,11543176, PASSED ,4.80081e-05,719.735,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,719.735 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,11543176, PASSED ,5.14988e-05,670.95,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,670.95 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,11543176, PASSED ,5.14986e-05,670.952,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,670.952 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,11543176, PASSED 
,5.34162e-05,646.866,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,646.866 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,91125, PASSED ,4.65237e-05,30.503,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,28.801 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,91125, PASSED ,2.6751e-05,53.049,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,81.0342 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,91125, PASSED ,3.24355e-05,43.7518,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,70.0771 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,91125, PASSED ,3.04026e-05,46.6773,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,73.2531 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,91125, PASSED ,3.08939e-05,45.935,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,71.0136 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,15438249, PASSED ,0.00543631,7.70923,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,7.70923 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,15438249, PASSED ,5.24714e-05,798.716,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,798.716 
+Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,15438249, PASSED ,5.59889e-05,748.537,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,748.537 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,15438249, PASSED ,5.68872e-05,736.716,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,736.716 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,15438249, PASSED ,5.87817e-05,712.972,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,712.972 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,19465109, PASSED ,0.00666969,7.3292,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,7.519215 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,19465109, PASSED ,5.67212e-05,861.82,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,830.268 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,19465109, PASSED ,6.20384e-05,787.955,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,768.2460000000001 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,19465109, PASSED ,6.13245e-05,797.128,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,766.922 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,19465109, PASSED 
,6.26849e-05,779.828,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,746.4 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,1860867, PASSED ,0.000382529,26.9538,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,26.9538 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,1860867, PASSED ,3.36967e-05,305.984,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,305.984 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,1860867, PASSED ,4.0981e-05,251.596,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,251.596 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,1860867, PASSED ,3.80987e-05,270.63,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,270.63 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,1860867, PASSED ,3.91021e-05,263.685,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,263.685 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,23393656, PASSED ,0.0140217,3.9391,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,7.3292 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,23393656, PASSED ,6.39656e-05,863.478,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,861.82 
+Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,23393656, PASSED ,6.84257e-05,807.196,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,787.955 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,23393656, PASSED ,6.89088e-05,801.537,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,797.128 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,23393656, PASSED ,7.05087e-05,783.349,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,779.828 +Comm_HALO_PACKING_FUSED,Base_Seq,direct,205379, PASSED ,8.54179e-05,28.2635,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,Seq,Base_Seq-direct,0.0,28.532249999999998 +Comm_HALO_PACKING_FUSED,Base_HIP,direct_1024,205379, PASSED ,2.97925e-05,81.0342,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,Base_HIP-direct_1024,0.0,106.1101 +Comm_HALO_PACKING_FUSED,RAJA_HIP,direct_1024,205379, PASSED ,3.44508e-05,70.0771,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-direct_1024,0.0,90.58005 +Comm_HALO_PACKING_FUSED,RAJA_HIP,funcptr_1024,205379, PASSED ,3.29571e-05,73.2531,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-funcptr_1024,0.0,96.31555 +Comm_HALO_PACKING_FUSED,RAJA_HIP,virtfunc_1024,205379, PASSED 
,3.39965e-05,71.0136,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/HALO_PACKING_FUSED_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-virtfunc_1024,0.0,93.29929999999999 +Basic_INDEXLIST_3LOOP,Base_Seq,default,5120000, PASSED ,0.0214557,9.33421,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.33421 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,5120000, PASSED ,9.88996e-05,2025.0,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2025.0 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,5120000, PASSED ,0.00010002,2002.31,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2002.31 +Basic_INDEXLIST_3LOOP,Base_Seq,default,640000, PASSED ,0.00239236,10.4641,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.4641 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,640000, PASSED ,3.25117e-05,769.998,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,769.998 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,640000, PASSED ,3.24485e-05,771.498,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,771.498 +Basic_INDEXLIST_3LOOP,Base_Seq,default,7500000, PASSED ,0.0318322,9.21605,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.21605 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,7500000, PASSED 
,0.000129308,2268.75,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2268.75 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,7500000, PASSED ,0.000129228,2270.15,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2270.15 +Basic_INDEXLIST_3LOOP,Base_Seq,default,10240000, PASSED ,0.0438102,9.14268,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.14268 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,10240000, PASSED ,0.000166064,2411.97,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2411.97 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,10240000, PASSED ,0.000165011,2427.37,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2427.37 +Basic_INDEXLIST_3LOOP,Base_Seq,default,1280000, PASSED ,0.00483921,10.3463,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.3463 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,1280000, PASSED ,4.55659e-05,1098.8,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,1098.8 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,1280000, PASSED ,4.46435e-05,1121.51,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,1121.51 +Basic_INDEXLIST_3LOOP,Base_Seq,default,15000000, PASSED 
,0.0647112,9.06695,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.06695 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,15000000, PASSED ,0.00022941,2557.58,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2557.58 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,15000000, PASSED ,0.000230662,2543.69,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2543.69 +Basic_INDEXLIST_3LOOP,Base_Seq,default,160000, PASSED ,0.000572814,10.9259,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.5095 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,160000, PASSED ,2.21903e-05,282.038,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,484.515 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,160000, PASSED ,2.22217e-05,281.64,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,491.281 +Basic_INDEXLIST_3LOOP,Base_Seq,default,20000000, PASSED ,0.0865713,9.03661,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.03661 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,20000000, PASSED ,0.000302183,2588.86,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2577.57 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,20000000, PASSED 
,0.000299119,2615.38,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2577.97 +Basic_INDEXLIST_3LOOP,Base_Seq,default,25000000, PASSED ,0.108476,9.01477,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.02569 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,25000000, PASSED ,0.00037706,2593.46,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2583.215 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,25000000, PASSED ,0.000379325,2577.97,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_5000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2578.4049999999997 +Basic_INDEXLIST_3LOOP,Base_Seq,default,2560000, PASSED ,0.0104559,9.57698,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.57698 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,2560000, PASSED ,6.51301e-05,1537.47,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,1537.47 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,2560000, PASSED ,6.51145e-05,1537.84,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,1537.84 +Basic_INDEXLIST_3LOOP,Base_Seq,default,30000000, PASSED ,0.130369,9.00109,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,Seq,Base_Seq-default,0.0,9.01477 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,30000000, PASSED 
,0.000455261,2577.57,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,2588.86 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,30000000, PASSED ,0.000455036,2578.84,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_6000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,2578.84 +Basic_INDEXLIST_3LOOP,Base_Seq,default,320000, PASSED ,0.00119101,10.5095,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.0,10.486799999999999 +Basic_INDEXLIST_3LOOP,Base_HIP,block_256,320000, PASSED ,2.58341e-05,484.515,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,0.0,627.2565 +Basic_INDEXLIST_3LOOP,RAJA_HIP,block_256,320000, PASSED ,2.54783e-05,491.281,0.0,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INDEXLIST_3LOOP_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,0.0,631.3895 +Apps_INTSC_HEXHEX,Base_Seq,default,27, PASSED ,0.00147726,0.0762581,3.53728,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,3.57302,0.0770286 +Apps_INTSC_HEXHEX,Base_HIP,block_64,27, PASSED ,0.000311771,0.361332,16.7606,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_64,16.9948,0.366381 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,27, PASSED ,0.000225281,0.500055,23.1954,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_64,25.3459,0.546417 +Apps_INTSC_HEXHEX,Base_Seq,default,27000, PASSED 
,1.46329,0.0769857,3.57103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,3.56953,0.0769533 +Apps_INTSC_HEXHEX,Base_HIP,block_64,27000, PASSED ,0.250844,0.449095,20.8315,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_64,20.7685,0.447736 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,27000, PASSED ,0.141463,0.796342,36.9388,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_64,36.9388,0.796342 +Apps_INTSC_HEXHEX,Base_Seq,default,3375, PASSED ,0.182632,0.0771036,3.5765,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,3.56988,0.0769608 +Apps_INTSC_HEXHEX,Base_HIP,block_64,3375, PASSED ,0.0327277,0.430266,19.9581,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_64,19.9581,0.430266 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,3375, PASSED ,0.0187506,0.750994,34.8353,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_64,34.8353,0.750994 +Apps_INTSC_HEXHEX,Base_Seq,default,39304, PASSED ,2.12466,0.0771837,3.58022,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,3.56953,0.0769533 +Apps_INTSC_HEXHEX,Base_HIP,block_64,39304, PASSED ,0.366111,0.447921,20.7771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_64,20.7771,0.447921 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,39304, PASSED 
,0.204343,0.802517,37.2253,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_64,37.2253,0.802517 +Apps_INTSC_HEXHEX,Base_Seq,default,512, PASSED ,0.0277247,0.0770515,3.57408,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,3.57013,0.0769662 +Apps_INTSC_HEXHEX,Base_HIP,block_64,512, PASSED ,0.00583062,0.366381,16.9948,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_64,17.0519,0.367612 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,512, PASSED ,0.00328654,0.649993,30.1503,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_64,30.1503,0.649993 +Apps_INTSC_HEXHEX,Base_Seq,default,50653, PASSED ,2.74635,0.0769533,3.56953,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,3.57103,0.0769857 +Apps_INTSC_HEXHEX,Base_HIP,block_64,50653, PASSED ,0.472021,0.447736,20.7685,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_64,20.8315,0.449095 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,50653, PASSED ,0.262872,0.80397,37.2927,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_64,37.2927,0.80397 +Apps_INTSC_HEXHEX,Base_Seq,default,6859, PASSED ,0.37231,0.0768661,3.56548,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,3.56988,0.0769608 +Apps_INTSC_HEXHEX,Base_HIP,block_64,6859, PASSED 
,0.0646335,0.442773,20.5383,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_64,20.5383,0.442773 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,6859, PASSED ,0.0369851,0.773771,35.8919,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_64,35.8919,0.773771 +Apps_INTSC_HEXHEX,Base_Seq,default,74088, PASSED ,4.02648,0.0767716,3.5611,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,3.572325,0.07701355 +Apps_INTSC_HEXHEX,Base_HIP,block_64,74088, PASSED ,0.68722,0.449811,20.8648,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_64,20.82095,0.448866 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,74088, PASSED ,0.383453,0.806147,37.3937,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,37.3432,0.8050584999999999 +Apps_INTSC_HEXHEX,Base_Seq,default,1000, PASSED ,0.0542098,0.0769662,3.57013,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,3.57302,0.0770286 +Apps_INTSC_HEXHEX,Base_HIP,block_64,1000, PASSED ,0.0105652,0.394913,18.3183,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_64,18.3183,0.394913 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1000, PASSED ,0.00595544,0.700591,32.4974,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_64,32.4974,0.700591 +Apps_INTSC_HEXHEX,Base_Seq,default,125, PASSED 
,0.00677074,0.0770286,3.57302,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,3.571575,0.0769974 +Apps_INTSC_HEXHEX,Base_HIP,block_64,125, PASSED ,0.00141873,0.367612,17.0519,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_64,17.02335,0.3669965 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,125, PASSED ,0.000954474,0.546417,25.3459,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_64,27.7481,0.5982050000000001 +Apps_INTSC_HEXHEX,Base_Seq,default,97336, PASSED ,5.2692,0.0770738,3.57512,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,3.56953,0.0769533 +Apps_INTSC_HEXHEX,Base_HIP,block_64,97336, PASSED ,0.902761,0.449862,20.8671,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_64,20.8648,0.449811 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,97336, PASSED ,0.503213,0.807049,37.4355,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_64,37.3937,0.806147 +Apps_INTSC_HEXHEX,Base_Seq,default,13824, PASSED ,0.752873,0.0766108,3.55364,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,3.57103,0.0769857 +Apps_INTSC_HEXHEX,Base_HIP,block_64,13824, PASSED ,0.129067,0.446885,20.7291,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_64,20.7291,0.446885 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,13824, PASSED 
,0.0729182,0.790999,36.691,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_64,36.691,0.790999 +Apps_INTSC_HEXHEX,Base_Seq,default,1728, PASSED ,0.0936811,0.0769608,3.56988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,3.57013,0.0769662 +Apps_INTSC_HEXHEX,Base_HIP,block_64,1728, PASSED ,0.0174537,0.41308,19.161,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_64,19.161,0.41308 +Apps_INTSC_HEXHEX,RAJA_HIP,block_64,1728, PASSED ,0.00994384,0.72505,33.6319,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/INTSC_HEXHEX_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_64,33.6319,0.72505 +Apps_LTIMES,Base_Seq,default,2496, PASSED ,1.95521e-05,8.93438,6.38293,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,6.25147,8.70866 +Apps_LTIMES,Base_HIP,block_256,2496, PASSED ,3.70802e-06,47.1104,33.6568,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,127.705,177.9 +Apps_LTIMES,RAJA_HIP,kernel_256,2496, PASSED ,3.83124e-06,45.5952,32.5743,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,123.045,171.408 +Apps_LTIMES,RAJA_HIP,launch_256,2496, PASSED ,3.75522e-06,46.5183,33.2337,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,124.885,173.971 +Apps_LTIMES,Base_Seq,default,2477568, PASSED 
,0.0207453,8.30493,5.9714,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,5.9714,8.30493 +Apps_LTIMES,Base_HIP,block_256,2477568, PASSED ,0.000184334,934.653,672.033,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,672.033,934.653 +Apps_LTIMES,RAJA_HIP,kernel_256,2477568, PASSED ,0.000224573,767.18,551.617,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,551.617,767.18 +Apps_LTIMES,RAJA_HIP,launch_256,2477568, PASSED ,0.00018837,914.626,657.633,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,657.633,914.626 +Apps_LTIMES,Base_Seq,default,309696, PASSED ,0.00257141,8.37555,6.0219,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,6.0219,8.37555 +Apps_LTIMES,Base_HIP,block_256,309696, PASSED ,2.74214e-05,785.409,564.698,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,564.698,785.409 +Apps_LTIMES,RAJA_HIP,kernel_256,309696, PASSED ,3.15374e-05,682.903,490.998,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,490.998,682.903 +Apps_LTIMES,RAJA_HIP,launch_256,309696, PASSED ,2.74012e-05,785.988,565.114,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,565.114,785.988 +Apps_LTIMES,Base_Seq,default,3629184, PASSED 
,0.0303343,8.31962,5.98197,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,5.9714,8.30493 +Apps_LTIMES,Base_HIP,block_256,3629184, PASSED ,0.000264118,955.521,687.039,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,682.933,949.809 +Apps_LTIMES,RAJA_HIP,kernel_256,3629184, PASSED ,0.000322658,782.16,562.389,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,558.576,776.856 +Apps_LTIMES,RAJA_HIP,launch_256,3629184, PASSED ,0.000273066,924.21,664.526,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,664.526,924.21 +Apps_LTIMES,Base_Seq,default,38784, PASSED ,0.00031834,8.47555,6.0916,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,6.0916,8.47555 +Apps_LTIMES,Base_HIP,block_256,38784, PASSED ,6.05724e-06,445.435,320.146,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,307.368,427.568 +Apps_LTIMES,RAJA_HIP,kernel_256,38784, PASSED ,6.58626e-06,409.657,294.431,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,294.431,409.657 +Apps_LTIMES,RAJA_HIP,launch_256,38784, PASSED ,5.98406e-06,450.883,324.061,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,324.061,450.883 +Apps_LTIMES,Base_Seq,default,4954944, PASSED 
,0.0419168,8.22013,5.91045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,5.91045,8.22013 +Apps_LTIMES,Base_HIP,block_256,4954944, PASSED ,0.000362769,949.809,682.933,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,687.039,955.521 +Apps_LTIMES,RAJA_HIP,kernel_256,4954944, PASSED ,0.000436548,789.287,567.514,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,558.576,776.856 +Apps_LTIMES,RAJA_HIP,launch_256,4954944, PASSED ,0.000367023,938.802,675.018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,675.018,938.802 +Apps_LTIMES,Base_Seq,default,619392, PASSED ,0.00522313,8.24656,5.92931,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,5.98058,8.31775 +Apps_LTIMES,Base_HIP,block_256,619392, PASSED ,4.84989e-05,888.12,638.563,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,638.563,888.12 +Apps_LTIMES,RAJA_HIP,kernel_256,619392, PASSED ,5.7929e-05,743.546,534.613,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,534.613,743.546 +Apps_LTIMES,RAJA_HIP,launch_256,619392, PASSED ,4.90095e-05,878.867,631.91,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,631.91,878.867 +Apps_LTIMES,Base_Seq,default,7258176, PASSED 
,0.0614895,8.20832,5.90196,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,5.906205,8.214224999999999 +Apps_LTIMES,Base_HIP,block_256,7258176, PASSED ,0.000526956,957.814,688.689,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,687.864,956.6675 +Apps_LTIMES,RAJA_HIP,kernel_256,7258176, PASSED ,0.000649703,776.856,558.576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,560.4825000000001,779.508 +Apps_LTIMES,RAJA_HIP,launch_256,7258176, PASSED ,0.000532582,947.696,681.414,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,678.216,943.249 +Apps_LTIMES,Base_Seq,default,77568, PASSED ,0.000641311,8.41261,6.04761,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,6.04761,8.41261 +Apps_LTIMES,Base_HIP,block_256,77568, PASSED ,1.26181e-05,427.568,307.368,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,320.146,445.435 +Apps_LTIMES,RAJA_HIP,kernel_256,77568, PASSED ,1.16179e-05,464.379,333.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,333.83,464.379 +Apps_LTIMES,RAJA_HIP,launch_256,77568, PASSED ,1.04175e-05,517.889,372.297,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,372.297,517.889 +Apps_LTIMES,Base_Seq,default,9792, PASSED 
,7.83175e-05,8.70866,6.25147,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,6.171535,8.592105 +Apps_LTIMES,Base_HIP,block_256,9792, PASSED ,3.83384e-06,177.9,127.705,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,217.5365,302.734 +Apps_LTIMES,RAJA_HIP,kernel_256,9792, PASSED ,3.97904e-06,171.408,123.045,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,208.738,290.53249999999997 +Apps_LTIMES,RAJA_HIP,launch_256,9792, PASSED ,3.92042e-06,173.971,124.885,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,224.47299999999998,312.427 +Apps_LTIMES,Base_Seq,default,9677568, PASSED ,0.0819931,8.20761,5.90146,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,5.90196,8.20832 +Apps_LTIMES,Base_HIP,block_256,9677568, PASSED ,0.000702501,957.959,688.794,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,688.689,957.814 +Apps_LTIMES,RAJA_HIP,kernel_256,9677568, PASSED ,0.000868057,775.257,557.427,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,558.576,776.856 +Apps_LTIMES,RAJA_HIP,launch_256,9677568, PASSED ,0.000706936,951.949,684.472,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,681.414,947.696 +Apps_LTIMES,Base_Seq,default,1238784, PASSED 
,0.0103567,8.31775,5.98058,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,5.98058,8.31775 +Apps_LTIMES,Base_HIP,block_256,1238784, PASSED ,9.43452e-05,913.079,656.516,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,656.516,913.079 +Apps_LTIMES,RAJA_HIP,kernel_256,1238784, PASSED ,0.000114949,749.416,538.841,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,538.841,749.416 +Apps_LTIMES,RAJA_HIP,launch_256,1238784, PASSED ,9.62853e-05,894.681,643.288,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,643.288,894.681 +Apps_LTIMES,Base_Seq,default,154944, PASSED ,0.00128502,8.38568,6.02887,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,6.02887,8.38568 +Apps_LTIMES,Base_HIP,block_256,154944, PASSED ,1.61333e-05,667.919,480.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,480.199,667.919 +Apps_LTIMES,RAJA_HIP,kernel_256,154944, PASSED ,1.85771e-05,580.054,417.029,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-kernel_256,417.029,580.054 +Apps_LTIMES,RAJA_HIP,launch_256,154944, PASSED ,1.62207e-05,664.319,477.611,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/LTIMES_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-launch_256,477.611,664.319 +Apps_MASS3DPA,Base_Seq,default,3200, PASSED 
,2.25147e-05,5.25832,11.2571,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,11.2571,5.25832 +Apps_MASS3DPA,Base_HIP,block_25,3200, PASSED ,4.04002e-06,29.3042,62.7348,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_25,242.112,112.881 +Apps_MASS3DPA,RAJA_HIP,block_25,3200, PASSED ,4.10964e-06,28.8078,61.6721,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_25,240.801,112.269 +Apps_MASS3DPA,Base_Seq,default,3237952, PASSED ,0.0231565,5.16021,11.0749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,11.0749,5.16021 +Apps_MASS3DPA,Base_HIP,block_25,3237952, PASSED ,9.71754e-05,1229.66,2639.1,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_25,2580.96,1202.57 +Apps_MASS3DPA,RAJA_HIP,block_25,3237952, PASSED ,9.78902e-05,1220.68,2619.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2555.09,1190.51 +Apps_MASS3DPA,Base_Seq,default,404736, PASSED ,0.0028618,5.21928,11.2015,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,11.172,5.20566 +Apps_MASS3DPA,Base_HIP,block_25,404736, PASSED ,1.80949e-05,825.456,1771.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_25,1771.57,825.456 +Apps_MASS3DPA,RAJA_HIP,block_25,404736, PASSED 
,1.80643e-05,826.853,1774.57,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_25,1774.57,826.853 +Apps_MASS3DPA,Base_Seq,default,4743104, PASSED ,0.0339704,5.15267,11.0587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,11.0617,5.15408 +Apps_MASS3DPA,Base_HIP,block_25,4743104, PASSED ,0.000139999,1250.28,2683.36,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_25,2580.96,1202.57 +Apps_MASS3DPA,RAJA_HIP,block_25,4743104, PASSED ,0.000144515,1211.21,2599.51,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2555.09,1190.51 +Apps_MASS3DPA,Base_Seq,default,50624, PASSED ,0.000361022,5.17562,11.1062,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,11.172,5.20566 +Apps_MASS3DPA,Base_HIP,block_25,50624, PASSED ,5.50582e-06,339.37,728.244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_25,728.244,339.37 +Apps_MASS3DPA,RAJA_HIP,block_25,50624, PASSED ,5.53322e-06,337.689,724.638,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_25,724.638,337.689 +Apps_MASS3DPA,Base_Seq,default,6475904, PASSED ,0.0463681,5.15408,11.0617,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,11.0617,5.15408 +Apps_MASS3DPA,Base_HIP,block_25,6475904, PASSED 
,0.000198729,1202.57,2580.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_25,2580.96,1202.57 +Apps_MASS3DPA,RAJA_HIP,block_25,6475904, PASSED ,0.000200741,1190.51,2555.09,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2555.09,1190.51 +Apps_MASS3DPA,Base_Seq,default,809536, PASSED ,0.00571927,5.22359,11.2108,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,11.172,5.20566 +Apps_MASS3DPA,Base_HIP,block_25,809536, PASSED ,2.92014e-05,1023.07,2195.71,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_25,2195.71,1023.07 +Apps_MASS3DPA,RAJA_HIP,block_25,809536, PASSED ,2.89112e-05,1033.34,2217.75,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2217.75,1033.34 +Apps_MASS3DPA,Base_Seq,default,9486208, PASSED ,0.0681196,5.13914,11.0297,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,11.0602,5.1533750000000005 +Apps_MASS3DPA,Base_HIP,block_25,9486208, PASSED ,0.000300901,1163.42,2496.96,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_25,2546.27,1186.405 +Apps_MASS3DPA,RAJA_HIP,block_25,9486208, PASSED ,0.000301675,1160.44,2490.55,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2533.9750000000004,1180.67 +Apps_MASS3DPA,Base_Seq,default,101184, PASSED 
,0.000717815,5.2024,11.1646,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,11.172,5.20566 +Apps_MASS3DPA,Base_HIP,block_25,101184, PASSED ,8.00744e-06,466.361,1000.83,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_25,1000.83,466.361 +Apps_MASS3DPA,RAJA_HIP,block_25,101184, PASSED ,8.05586e-06,463.558,994.815,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_25,994.815,463.558 +Apps_MASS3DPA,Base_Seq,default,12672, PASSED ,8.8877e-05,5.26504,11.2927,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,11.21085,5.23036 +Apps_MASS3DPA,Base_HIP,block_25,12672, PASSED ,4.14544e-06,112.881,242.112,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_25,485.178,226.1255 +Apps_MASS3DPA,RAJA_HIP,block_25,12672, PASSED ,4.16802e-06,112.269,240.801,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_25,482.71950000000004,224.979 +Apps_MASS3DPA,Base_Seq,default,12648256, PASSED ,0.0905535,5.1546,11.0629,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,11.0617,5.15408 +Apps_MASS3DPA,Base_HIP,block_25,12648256, PASSED ,0.000398865,1170.24,2511.58,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_25,2511.58,1170.24 +Apps_MASS3DPA,RAJA_HIP,block_25,12648256, PASSED 
,0.000398662,1170.83,2512.86,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2512.86,1170.83 +Apps_MASS3DPA,Base_Seq,default,1619008, PASSED ,0.0115608,5.16814,11.0919,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,11.0919,5.16814 +Apps_MASS3DPA,Base_HIP,block_25,1619008, PASSED ,5.06945e-05,1178.58,2529.48,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_25,2529.48,1178.58 +Apps_MASS3DPA,RAJA_HIP,block_25,1619008, PASSED ,5.03579e-05,1186.46,2546.38,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_25,2546.38,1186.46 +Apps_MASS3DPA,Base_Seq,default,202368, PASSED ,0.00143467,5.20566,11.172,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,11.172,5.20566 +Apps_MASS3DPA,Base_HIP,block_25,202368, PASSED ,1.30157e-05,573.802,1231.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_25,1231.45,573.802 +Apps_MASS3DPA,RAJA_HIP,block_25,202368, PASSED ,1.31381e-05,568.456,1219.98,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MASS3DPA_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_25,1219.98,568.456 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,216, PASSED ,2.36631e-06,15.2267,4.83791,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,4.83791,13.8755 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,216, PASSED 
,4.75473e-06,7.57793,2.40771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,Base_HIP-block_256,15.411,43.2409 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,216, PASSED ,3.81712e-06,9.43932,2.99912,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-block_256,18.0402,50.6178 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,681472, PASSED ,0.018253,4.83293,1.97875,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,1.97875,4.83293 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,681472, PASSED ,3.85147e-05,2290.43,937.771,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,Base_HIP-block_256,809.14,1977.85 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,681472, PASSED ,3.79982e-05,2321.56,950.518,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-block_256,827.737,2033.64 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,79507, PASSED ,0.000873478,12.0474,4.82424,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,4.73832,11.9863 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,79507, PASSED ,6.34674e-06,1658.04,663.943,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,Base_HIP-block_256,663.943,1658.04 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,79507, PASSED ,6.02293e-06,1747.18,699.638,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-block_256,699.638,1747.18 
+Apps_MATVEC_3D_STENCIL,Base_Seq,default,1000000, PASSED ,0.0300624,4.29488,1.763,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,1.88907,4.59264 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,1000000, PASSED ,6.7599e-05,1910.0,784.035,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,Base_HIP-block_256,805.027,1967.15 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,1000000, PASSED ,6.79095e-05,1901.27,780.45,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-block_256,804.134,1954.98 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,8000, PASSED ,9.32202e-05,11.9161,4.54837,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,4.77019,12.2455 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,8000, PASSED ,4.66063e-06,238.342,90.9748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,Base_HIP-block_256,90.9748,238.342 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,8000, PASSED ,3.86673e-06,287.277,109.653,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-block_256,109.653,287.277 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1404928, PASSED ,0.0394168,4.59264,1.88907,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,1.88388,4.57083 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,1404928, PASSED 
,9.20251e-05,1967.15,809.14,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_2048-kernel-run-data.csv,HIP,Base_HIP-block_256,784.035,1910.0 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,1404928, PASSED ,9.25979e-05,1954.98,804.134,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-block_256,780.45,1901.27 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,157464, PASSED ,0.00181254,11.3978,4.60436,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,4.60436,11.3978 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,157464, PASSED ,1.02002e-05,2025.36,818.182,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,Base_HIP-block_256,805.027,1977.85 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,157464, PASSED ,1.00606e-05,2053.46,829.536,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-block_256,827.737,2033.64 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,2048383, PASSED ,0.0576281,4.57083,1.88388,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,1.82645,4.432855 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,2048383, PASSED ,0.000141351,1863.51,768.05,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,HIP,Base_HIP-block_256,776.0425,1886.755 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,2048383, PASSED 
,0.000142007,1854.89,764.498,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,772.474,1878.08 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,17576, PASSED ,0.000195281,12.2455,4.77019,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,4.77019,12.0474 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,17576, PASSED ,4.52192e-06,528.826,206.003,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,Base_HIP-block_256,206.003,528.826 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,17576, PASSED ,3.80982e-06,627.67,244.507,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-block_256,244.507,627.67 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,1331, PASSED ,1.42649e-05,13.8755,4.94522,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,4.80405,13.060500000000001 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,1331, PASSED ,4.57743e-06,43.2409,15.411,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,Base_HIP-block_256,53.1929,140.79145 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,1331, PASSED ,3.91033e-06,50.6178,18.0402,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-block_256,63.8466,168.9474 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,2744000, PASSED ,0.0822107,4.28615,1.76902,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,1.88388,4.57083 
+Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,2744000, PASSED ,0.000205224,1716.99,708.65,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4000-kernel-run-data.csv,HIP,Base_HIP-block_256,768.05,1863.51 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,2744000, PASSED ,0.000204514,1722.95,711.109,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-block_256,764.498,1854.89 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,328509, PASSED ,0.00625949,6.83387,2.78153,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,2.78153,6.83387 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,328509, PASSED ,2.16278e-05,1977.85,805.027,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,Base_HIP-block_256,805.027,1977.85 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,328509, PASSED ,2.10344e-05,2033.64,827.737,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-block_256,827.737,2033.64 +Apps_MATVEC_3D_STENCIL,Base_Seq,default,35937, PASSED ,0.000401969,11.9863,4.73832,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,4.73832,11.9863 +Apps_MATVEC_3D_STENCIL,Base_HIP,block_256,35937, PASSED ,4.53022e-06,1063.56,420.435,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,Base_HIP-block_256,420.435,1063.56 +Apps_MATVEC_3D_STENCIL,RAJA_HIP,block_256,35937, PASSED 
,3.91032e-06,1232.16,487.086,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MATVEC_3D_STENCIL_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-block_256,487.086,1232.16 +Basic_MULTI_REDUCE,Base_Seq,default,6245, PASSED ,1.98491e-05,4.69577,0.314624,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,0.309117,4.60804 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,6245, PASSED ,1.20215e-05,7.75335,0.519487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,2.13172,31.7778 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,6245, PASSED ,1.21025e-05,7.70146,0.51601,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,2.13558,31.8354 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,6245, PASSED ,1.24317e-05,7.49752,0.502346,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,1.99748,29.7767 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,6245, PASSED ,1.25653e-05,7.4178,0.497004,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,2.00488,29.887 +Basic_MULTI_REDUCE,Base_Seq,default,6399995, PASSED ,0.0208347,4.57733,0.307179,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,0.307179,4.57733 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,6399995, PASSED ,3.731e-05,2556.08,171.536,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,171.536,2556.08 
+Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,6399995, PASSED ,3.78774e-05,2517.79,168.966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,168.966,2517.79 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,6399995, PASSED ,4.07432e-05,2340.7,157.081,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,157.081,2340.7 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,6399995, PASSED ,3.8397e-05,2483.72,166.679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,166.679,2483.72 +Basic_MULTI_REDUCE,Base_Seq,default,799995, PASSED ,0.00259813,4.58831,0.307912,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,0.307912,4.58831 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,799995, PASSED ,1.37333e-05,868.036,58.2522,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,58.2522,868.036 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,799995, PASSED ,1.36129e-05,875.715,58.7675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,58.7675,875.715 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,799995, PASSED ,1.46365e-05,814.472,54.6576,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,54.6576,814.472 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,799995, PASSED 
,1.40993e-05,845.504,56.7401,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,56.7401,845.504 +Basic_MULTI_REDUCE,Base_Seq,default,9374995, PASSED ,0.0305264,4.57632,0.307111,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,0.307156,4.57698 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,9374995, PASSED ,4.86873e-05,2869.3,192.555,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,174.457,2599.61 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,9374995, PASSED ,4.85745e-05,2875.96,193.002,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,189.216,2819.54 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,9374995, PASSED ,5.22557e-05,2673.36,179.406,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,158.254,2358.17 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,9374995, PASSED ,4.92373e-05,2837.25,190.404,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,187.884,2799.69 +Basic_MULTI_REDUCE,Base_Seq,default,99995, PASSED ,0.000324259,4.59568,0.30838,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,0.30838,4.59568 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,99995, PASSED 
,1.16043e-05,128.418,8.61709,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,8.61709,128.418 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,99995, PASSED ,1.17173e-05,127.179,8.53398,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,8.53398,127.179 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,99995, PASSED ,1.21031e-05,123.125,8.26195,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,8.26195,123.125 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,99995, PASSED ,1.21883e-05,122.264,8.20421,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,8.20421,122.264 +Basic_MULTI_REDUCE,Base_Seq,default,12799995, PASSED ,0.0416726,4.57698,0.307156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,0.307156,4.57698 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,12799995, PASSED ,6.75148e-05,2825.08,189.588,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,174.457,2599.61 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,12799995, PASSED ,6.43008e-05,2966.29,199.064,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,189.216,2819.54 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,12799995, PASSED 
,7.42704e-05,2568.11,172.343,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,158.254,2358.17 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,12799995, PASSED ,6.51102e-05,2929.42,196.59,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,187.884,2799.69 +Basic_MULTI_REDUCE,Base_Seq,default,1599995, PASSED ,0.00519933,4.58558,0.307731,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,0.307731,4.58558 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,1599995, PASSED ,1.58965e-05,1499.82,100.651,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,100.651,1499.82 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,1599995, PASSED ,1.54661e-05,1541.56,103.452,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,103.452,1541.56 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,1599995, PASSED ,1.74297e-05,1367.89,91.7972,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,91.7972,1367.89 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,1599995, PASSED ,1.63223e-05,1460.7,98.0251,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,98.0251,1460.7 +Basic_MULTI_REDUCE,Base_Seq,default,18749995, PASSED 
,0.0610529,4.57631,0.307111,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,0.3071335,4.57665 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,18749995, PASSED ,0.000107477,2599.61,174.457,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,182.02249999999998,2712.3450000000003 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,18749995, PASSED ,9.90932e-05,2819.54,189.216,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,191.109,2847.75 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,18749995, PASSED ,0.000118481,2358.17,158.254,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,165.2985,2463.1400000000003 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,18749995, PASSED ,9.97958e-05,2799.69,187.884,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,189.144,2818.4700000000003 +Basic_MULTI_REDUCE,Base_Seq,default,199995, PASSED ,0.000649242,4.59044,0.308044,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,0.308044,4.59044 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,199995, PASSED ,1.19389e-05,249.63,16.7516,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,16.7516,249.63 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,199995, PASSED 
,1.19149e-05,250.134,16.7853,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,16.7853,250.134 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,199995, PASSED ,1.23115e-05,242.075,16.2446,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,16.2446,242.075 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,199995, PASSED ,1.28219e-05,232.439,15.5979,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,15.5979,232.439 +Basic_MULTI_REDUCE,Base_Seq,default,24995, PASSED ,8.08595e-05,4.60804,0.309117,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,0.3087485,4.60186 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,24995, PASSED ,1.17253e-05,31.7778,2.13172,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,5.374404999999999,80.09790000000001 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,24995, PASSED ,1.17041e-05,31.8354,2.13558,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,5.33478,79.5072 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,24995, PASSED ,1.25133e-05,29.7767,1.99748,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,5.129715,76.45085 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,24995, PASSED 
,1.24671e-05,29.887,2.00488,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,5.104545,76.0755 +Basic_MULTI_REDUCE,Base_Seq,default,24999995, PASSED ,0.0813809,4.5776,0.307197,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,0.307156,4.57698 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,24999995, PASSED ,0.000148723,2504.85,168.098,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,174.457,2599.61 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,24999995, PASSED ,0.000137212,2714.98,182.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,189.216,2819.54 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,24999995, PASSED ,0.000164707,2261.77,151.785,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,158.254,2358.17 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,24999995, PASSED ,0.000137989,2699.7,181.174,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,187.884,2799.69 +Basic_MULTI_REDUCE,Base_Seq,default,3199995, PASSED ,0.0104134,4.57907,0.307295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,0.307295,4.57907 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,3199995, PASSED 
,2.44475e-05,1950.45,130.892,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,130.892,1950.45 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,3199995, PASSED ,2.39544e-05,1990.61,133.587,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,133.587,1990.61 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,3199995, PASSED ,2.55426e-05,1866.84,125.281,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,125.281,1866.84 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,3199995, PASSED ,2.52989e-05,1884.81,126.487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,126.487,1884.81 +Basic_MULTI_REDUCE,Base_Seq,default,399995, PASSED ,0.00129884,4.58914,0.307964,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,0.307964,4.58914 +Basic_MULTI_REDUCE,Base_HIP,atomic_direct_256,399995, PASSED ,1.22521e-05,486.492,32.6471,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_direct_256,32.6471,486.492 +Basic_MULTI_REDUCE,Base_HIP,atomic_occgs_256,399995, PASSED ,1.19757e-05,497.721,33.4007,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,Base_HIP-atomic_occgs_256,33.4007,497.721 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_direct_256,399995, PASSED 
,1.29259e-05,461.132,30.9453,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_direct_256,30.9453,461.132 +Basic_MULTI_REDUCE,RAJA_HIP,atomic_occgs_256,399995, PASSED ,1.35313e-05,440.501,29.5608,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/MULTI_REDUCE_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-atomic_occgs_256,29.5608,440.501 +Basic_REDUCE_STRUCT,Base_Seq,default,6250, PASSED ,5.19982e-06,17.9107,2.40431,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-default,2.40869,17.946 +Basic_REDUCE_STRUCT,Base_Seq,kahan,6250, PASSED ,2.03471e-05,4.57718,0.614436,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-kahan,0.61557,4.58631 +Basic_REDUCE_STRUCT,Base_Seq,cascade,6250, PASSED ,1.00618e-05,9.25599,1.24252,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26755,9.44387 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,6250, PASSED ,2.08753e-05,4.46136,0.59889,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,1.53972,11.4713 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,6250, PASSED ,2.06031e-05,4.5203,0.606802,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,1.5426,11.4928 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,6250, PASSED ,2.44063e-05,3.81591,0.512244,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,2.06295,15.3696 
+Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,6250, PASSED ,1.99951e-05,4.65775,0.625253,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,1.66529,12.4069 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,6250, PASSED ,3.54508e-05,2.62709,0.352658,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,1.0703,7.97406 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,6250, PASSED ,2.43125e-05,3.83063,0.514221,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,2.06465,15.3823 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,6250, PASSED ,2.00713e-05,4.64007,0.622879,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,1.66655,12.4162 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,6250, PASSED ,3.59216e-05,2.59265,0.348036,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,1.06321,7.92119 +Basic_REDUCE_STRUCT,Base_Seq,default,6400000, PASSED ,0.00556897,17.1248,2.29845,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-default,2.29845,17.1248 +Basic_REDUCE_STRUCT,Base_Seq,kahan,6400000, PASSED ,0.0208567,4.57251,0.613712,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613712,4.57251 +Basic_REDUCE_STRUCT,Base_Seq,cascade,6400000, PASSED 
,0.0101829,9.36547,1.25701,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25623,9.35962 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,6400000, PASSED ,0.00441144,21.6182,2.90154,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.89119,21.541 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,6400000, PASSED ,0.000166293,573.49,76.9726,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,76.9726,573.49 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,6400000, PASSED ,0.000232023,411.026,55.167,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,55.167,411.026 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,6400000, PASSED ,0.000262201,363.719,48.8176,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,48.8176,363.719 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,6400000, PASSED ,0.00392498,24.2975,3.26116,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.26116,24.2975 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,6400000, PASSED ,5.53541e-05,1722.86,231.239,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,231.239,1722.86 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,6400000, PASSED 
,6.09455e-05,1564.8,210.024,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,210.024,1564.8 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,6400000, PASSED ,0.000296165,322.008,43.2192,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1024-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,43.2192,322.008 +Basic_REDUCE_STRUCT,Base_Seq,default,800000, PASSED ,0.00066195,18.0088,2.4171,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-default,2.40622,17.9276 +Basic_REDUCE_STRUCT,Base_Seq,kahan,800000, PASSED ,0.00259773,4.58898,0.615924,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615679,4.58714 +Basic_REDUCE_STRUCT,Base_Seq,cascade,800000, PASSED ,0.00125911,9.46773,1.27074,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26578,9.43083 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,800000, PASSED ,0.000483924,24.6339,3.30631,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,3.30631,24.6339 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,800000, PASSED ,0.000168995,70.54,9.46774,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,9.46774,70.54 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,800000, PASSED 
,5.01795e-05,237.566,31.8856,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,31.8856,237.566 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,800000, PASSED ,4.94938e-05,240.857,32.3273,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,32.3273,240.857 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,800000, PASSED ,0.000493959,24.1335,3.23914,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.23914,24.1335 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,800000, PASSED ,3.4287e-05,347.681,46.665,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,46.665,347.681 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,800000, PASSED ,3.62e-05,329.308,44.199,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,44.199,329.308 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,800000, PASSED ,0.000259835,45.8789,6.15777,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_128-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,6.15777,45.8789 +Basic_REDUCE_STRUCT,Base_Seq,default,9375000, PASSED ,0.00821376,17.0078,2.28275,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-default,2.29845,17.1248 +Basic_REDUCE_STRUCT,Base_Seq,kahan,9375000, PASSED 
,0.0305676,4.57014,0.613394,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613712,4.57251 +Basic_REDUCE_STRUCT,Base_Seq,cascade,9375000, PASSED ,0.0149403,9.35046,1.255,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25623,9.35962 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,9375000, PASSED ,0.00652613,21.406,2.87306,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.87306,21.406 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,9375000, PASSED ,0.000170969,817.096,109.669,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,109.669,817.096 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,9375000, PASSED ,0.000328871,424.781,57.0132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,55.8227,415.911 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,9375000, PASSED ,0.000375164,372.367,49.9782,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,49.7044,370.326 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,9375000, PASSED ,0.00604758,23.0999,3.10041,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.18108,23.7009 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,9375000, PASSED 
,6.92307e-05,2017.87,270.833,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,270.833,2017.87 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,9375000, PASSED ,7.29238e-05,1915.68,257.118,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,257.118,1915.68 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,9375000, PASSED ,0.000307589,454.172,60.958,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_1500-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,60.958,454.172 +Basic_REDUCE_STRUCT,Base_Seq,default,100000, PASSED ,8.30334e-05,17.946,2.40869,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-default,2.40869,17.946 +Basic_REDUCE_STRUCT,Base_Seq,kahan,100000, PASSED ,0.000324906,4.58631,0.61557,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615679,4.58714 +Basic_REDUCE_STRUCT,Base_Seq,cascade,100000, PASSED ,0.000157787,9.44387,1.26755,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26755,9.44387 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,100000, PASSED ,6.97415e-05,21.3663,2.86776,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.86776,21.3663 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,100000, PASSED 
,6.54959e-05,22.7513,3.05366,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,3.05366,22.7513 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,100000, PASSED ,2.63273e-05,56.5996,7.59675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,7.59675,56.5996 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,100000, PASSED ,3.11647e-05,47.8142,6.41757,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,6.41757,47.8142 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,100000, PASSED ,8.6829e-05,17.1615,2.3034,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,2.3034,17.1615 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,100000, PASSED ,2.59281e-05,57.471,7.7137,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,7.7137,57.471 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,100000, PASSED ,3.12357e-05,47.7055,6.40299,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,6.40299,47.7055 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,100000, PASSED ,8.68172e-05,17.1638,2.30371,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_16-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,2.30371,17.1638 +Basic_REDUCE_STRUCT,Base_Seq,default,12800000, PASSED 
,0.0112137,17.0091,2.28292,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-default,2.29845,17.1248 +Basic_REDUCE_STRUCT,Base_Seq,kahan,12800000, PASSED ,0.0417403,4.56956,0.613316,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613712,4.57251 +Basic_REDUCE_STRUCT,Base_Seq,cascade,12800000, PASSED ,0.020403,9.34837,1.25472,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25686,9.36435 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,12800000, PASSED ,0.00982728,19.4087,2.60499,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.60499,19.4087 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,12800000, PASSED ,0.000206687,922.82,123.859,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,123.859,922.82 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,12800000, PASSED ,0.000458595,415.911,55.8227,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,56.3103,419.544 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,12800000, PASSED ,0.000515045,370.326,49.7044,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,49.7276,370.5 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,12800000, PASSED 
,0.00804758,23.7009,3.18108,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.11471,23.2064 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,12800000, PASSED ,8.70784e-05,2190.38,293.988,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,288.97,2153.0 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,12800000, PASSED ,9.37924e-05,2033.58,272.943,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,269.415,2007.29 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,12800000, PASSED ,0.000349956,545.025,73.1521,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_2048-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,73.1521,545.025 +Basic_REDUCE_STRUCT,Base_Seq,default,1600000, PASSED ,0.00134078,17.782,2.38666,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-default,2.38666,17.782 +Basic_REDUCE_STRUCT,Base_Seq,kahan,1600000, PASSED ,0.00520034,4.58467,0.615345,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615345,4.58467 +Basic_REDUCE_STRUCT,Base_Seq,cascade,1600000, PASSED ,0.00252808,9.43083,1.26578,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26578,9.43083 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,1600000, PASSED 
,0.00109193,21.8346,2.93059,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.93059,21.8346 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,1600000, PASSED ,0.000163972,145.402,19.5156,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,19.5156,145.402 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,1600000, PASSED ,7.65216e-05,311.57,41.8183,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,41.8183,311.57 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,1600000, PASSED ,8.07812e-05,295.141,39.6132,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,39.6132,295.141 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,1600000, PASSED ,0.000972593,24.5137,3.29018,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.26116,24.2975 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,1600000, PASSED ,3.60642e-05,661.095,88.7308,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,88.7308,661.095 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,1600000, PASSED ,3.9808e-05,598.921,80.3859,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,80.3859,598.921 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,1600000, PASSED 
,0.000263307,90.5478,12.1531,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_256-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,12.1531,90.5478 +Basic_REDUCE_STRUCT,Base_Seq,default,18750000, PASSED ,0.0162389,17.2053,2.30926,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-default,2.29609,17.1072 +Basic_REDUCE_STRUCT,Base_Seq,kahan,18750000, PASSED ,0.0610956,4.57311,0.613792,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613593,4.571625 +Basic_REDUCE_STRUCT,Base_Seq,cascade,18750000, PASSED ,0.0298362,9.36435,1.25686,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25593,9.357405 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,18750000, PASSED ,0.0144824,19.2922,2.58935,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.59717,19.350450000000002 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,18750000, PASSED ,0.000259151,1078.12,144.703,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,134.281,1000.47 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,18750000, PASSED ,0.000660779,422.829,56.7512,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,56.53075,421.1865 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,18750000, PASSED 
,0.000754108,370.5,49.7276,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,49.8047,371.0745 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,18750000, PASSED ,0.0120397,23.2064,3.11471,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.1075600000000003,23.15315 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,18750000, PASSED ,0.000129771,2153.0,288.97,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,291.47900000000004,2171.69 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,18750000, PASSED ,0.000139191,2007.29,269.415,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,271.179,2020.435 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,18750000, PASSED ,0.000414244,674.473,90.5263,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_3000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,81.8392,609.749 +Basic_REDUCE_STRUCT,Base_Seq,default,200000, PASSED ,0.000166237,17.9276,2.40622,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-default,2.41169,17.9685 +Basic_REDUCE_STRUCT,Base_Seq,kahan,200000, PASSED ,0.000649693,4.58714,0.615679,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615832,4.58829 +Basic_REDUCE_STRUCT,Base_Seq,cascade,200000, PASSED 
,0.000316136,9.42705,1.26528,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26936,9.45746 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,200000, PASSED ,9.46401e-05,31.4902,4.22656,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,3.30631,24.6339 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,200000, PASSED ,9.1948e-05,32.4121,4.3503,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,4.3503,32.4121 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,200000, PASSED ,2.85391e-05,104.426,14.0159,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,14.0159,104.426 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,200000, PASSED ,3.2582e-05,91.4688,12.2768,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,12.2768,91.4688 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,200000, PASSED ,0.000141193,21.1074,2.83301,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,2.83301,21.1074 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,200000, PASSED ,2.81509e-05,105.866,14.2092,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,14.2092,105.866 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,200000, PASSED 
,3.28596e-05,90.696,12.1731,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,12.1731,90.696 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,200000, PASSED ,0.000141433,21.0717,2.82821,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_32-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,2.82821,21.0717 +Basic_REDUCE_STRUCT,Base_Seq,default,25000, PASSED ,2.03879e-05,18.2721,2.45253,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-default,2.4074549999999997,17.9368 +Basic_REDUCE_STRUCT,Base_Seq,kahan,25000, PASSED ,8.11766e-05,4.58912,0.615966,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-kahan,0.6156245,4.5867249999999995 +Basic_REDUCE_STRUCT,Base_Seq,cascade,25000, PASSED ,3.92202e-05,9.4984,1.2749,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,Seq,Base_Seq-cascade,1.2664149999999998,9.435459999999999 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,25000, PASSED ,3.24748e-05,11.4713,1.53972,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.20374,16.418799999999997 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,25000, PASSED ,3.24142e-05,11.4928,1.5426,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,2.29813,17.12205 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,25000, PASSED 
,2.42381e-05,15.3696,2.06295,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,4.82985,35.9846 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,25000, PASSED ,3.00259e-05,12.4069,1.66529,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,4.04143,30.11055 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,25000, PASSED ,4.67176e-05,7.97406,1.0703,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,1.68685,12.567779999999999 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,25000, PASSED ,2.42181e-05,15.3823,2.06465,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,4.889175,36.426649999999995 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,25000, PASSED ,3.00034e-05,12.4162,1.66655,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,4.03477,30.060850000000002 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,25000, PASSED ,4.70294e-05,7.92119,1.06321,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,1.6834600000000002,12.542494999999999 +Basic_REDUCE_STRUCT,Base_Seq,default,25000000, PASSED ,0.0215959,17.25,2.31526,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-default,2.30926,17.2053 +Basic_REDUCE_STRUCT,Base_Seq,kahan,25000000, PASSED 
,0.0814538,4.5735,0.613845,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-kahan,0.613792,4.57311 +Basic_REDUCE_STRUCT,Base_Seq,cascade,25000000, PASSED ,0.0397722,9.36658,1.25716,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25686,9.36435 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,25000000, PASSED ,0.0193672,19.2351,2.58168,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.58935,19.2922 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,25000000, PASSED ,0.00031761,1172.91,157.426,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,144.703,1078.12 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,25000000, PASSED ,0.000887937,419.544,56.3103,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,56.3103,419.544 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,25000000, PASSED ,0.00100237,371.649,49.8818,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,49.7276,370.5 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,25000000, PASSED ,0.0172681,21.5732,2.89551,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.11471,23.2064 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,25000000, PASSED 
,0.000167884,2218.97,297.825,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,293.988,2190.38 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,25000000, PASSED ,0.000176688,2108.4,282.985,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,272.943,2033.58 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,25000000, PASSED ,0.000485771,766.882,102.929,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_4000-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,90.5263,674.473 +Basic_REDUCE_STRUCT,Base_Seq,default,3200000, PASSED ,0.00275952,17.2797,2.31924,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-default,2.31924,17.2797 +Basic_REDUCE_STRUCT,Base_Seq,kahan,3200000, PASSED ,0.0104246,4.57414,0.61393,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-kahan,0.61393,4.57414 +Basic_REDUCE_STRUCT,Base_Seq,cascade,3200000, PASSED ,0.00509462,9.35962,1.25623,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,Seq,Base_Seq-cascade,1.25701,9.36547 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,3200000, PASSED ,0.00221362,21.541,2.89119,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,2.90154,21.6182 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,3200000, PASSED 
,0.00015563,306.391,41.1232,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,41.1232,306.391 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,3200000, PASSED ,0.000129265,368.882,49.5105,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,49.5105,368.882 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,3200000, PASSED ,0.000143662,331.915,44.5489,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,44.5489,331.915 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,3200000, PASSED ,0.001949,24.4658,3.28374,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.26116,24.2975 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,3200000, PASSED ,4.36898e-05,1091.42,146.487,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,146.487,1091.42 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,3200000, PASSED ,4.80958e-05,991.432,133.068,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,133.068,991.432 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,3200000, PASSED ,0.000275825,172.877,23.2031,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_512-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,23.2031,172.877 +Basic_REDUCE_STRUCT,Base_Seq,default,400000, PASSED 
,0.000331718,17.9685,2.41169,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-default,2.40869,17.946 +Basic_REDUCE_STRUCT,Base_Seq,kahan,400000, PASSED ,0.00129906,4.58829,0.615832,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-kahan,0.615679,4.58714 +Basic_REDUCE_STRUCT,Base_Seq,cascade,400000, PASSED ,0.000630239,9.45746,1.26936,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,Seq,Base_Seq-cascade,1.26755,9.44387 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_direct_256,400000, PASSED ,0.000215857,27.613,3.70616,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_direct_256,3.30631,24.6339 +Basic_REDUCE_STRUCT,Base_HIP,blkatm_occgs_256,400000, PASSED ,0.000160878,37.0496,4.97273,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,Base_HIP-blkatm_occgs_256,4.97273,37.0496 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_direct_256,400000, PASSED ,3.34982e-05,177.934,23.882,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_direct_256,23.882,177.934 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_256,400000, PASSED ,3.5396e-05,168.394,22.6015,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_256,22.6015,168.394 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_direct_new_256,400000, PASSED 
,0.000255073,23.3677,3.13637,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_direct_new_256,3.13637,23.3677 +Basic_REDUCE_STRUCT,RAJA_HIP,blkatm_occgs_256,400000, PASSED ,3.34524e-05,178.178,23.9147,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkatm_occgs_256,23.9147,178.178 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_256,400000, PASSED ,3.52076e-05,169.295,22.7224,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_256,22.7224,169.295 +Basic_REDUCE_STRUCT,RAJA_HIP,blkdev_occgs_new_256,400000, PASSED ,0.000256678,23.2215,3.11675,build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier2-SPX/REDUCE_STRUCT_factor_64-kernel-run-data.csv,HIP,RAJA_HIP-blkdev_occgs_new_256,3.11675,23.2215 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_CONVECTION3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_CONVECTION3DPA.csv new file mode 100644 index 0000000..2f25852 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_CONVECTION3DPA.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +1377,51.8675,203.569,13.9092,13.9092,50.692,196.974,28.7189,112.498,7.70152,7.70152,28.068,108.853 +5508,203.569,493.27549999999997,13.9848,13.354,196.974,474.1055,112.498,272.4925,7.72835,7.385235,108.853,261.9025 
+21951,782.982,782.982,12.139,12.8021,751.237,751.237,432.487,432.487,6.7051,7.07049,414.952,414.952 +43902,1155.74,1155.74,12.7988,12.7988,1163.05,1163.05,638.329,638.329,7.06895,7.06895,642.371,642.371 +87804,1561.48,1561.48,12.8021,12.7893,1522.53,1522.53,862.391,862.391,7.07049,7.0633,840.882,840.882 +175608,1865.48,1865.48,12.7893,12.7893,1834.54,1834.54,1030.27,1030.27,7.0633,7.0633,1013.18,1013.18 +351216,2157.11,2157.11,9.81092,9.81092,2159.83,2159.83,1191.32,1191.32,5.41833,5.41833,1192.82,1192.82 +702459,2452.42,2366.62,4.77572,4.77572,2444.8,2364.06,1354.4,1307.01,2.6375,2.6375,1350.19,1305.6 +1404891,2378.7,2366.62,3.93096,3.93096,2364.06,2364.06,1313.69,1307.01,2.17096,2.17096,1305.6,1305.6 +2057940,2366.62,2366.62,3.82584,3.82584,2365.59,2364.06,1307.01,1307.01,2.1129,2.1129,1306.44,1305.6 +2809755,2290.76,2290.76,3.7803,3.7803,2264.07,2275.59,1265.12,1265.12,2.08775,2.08775,1250.38,1256.74 +4115853,2269.31,2280.035,3.70921,3.7597199999999997,2275.59,2269.83,1253.27,1259.195,2.04849,2.076385,1256.74,1253.56 +5487804,2216.51,2269.31,3.73914,3.73914,2205.61,2264.07,1224.11,1253.27,2.06502,2.06502,1218.09,1250.38 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv new file mode 100644 index 0000000..721d797 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_DEL_DOT_VEC_2D.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) 
+1849,30.8957,154.834,8.22078,8.26791,36.9252,152.791,26.3791,130.131,7.01899,6.94882,31.5271,128.414 +7744,154.834,356.2545,8.26791,8.278425,152.791,389.8755,130.131,297.6135,6.94882,6.93398,128.414,325.6465 +32400,557.675,557.675,8.29641,8.28894,626.96,626.96,465.096,465.096,6.91914,6.91914,522.879,522.879 +65025,1046.35,1046.35,8.28894,8.28894,1061.5,1061.5,870.75,870.75,6.89789,6.90635,883.357,883.357 +131044,1728.47,1728.47,8.31193,8.28894,1746.56,1746.56,1436.18,1436.18,6.90635,6.89789,1451.21,1451.21 +264196,2080.76,2003.36,8.25887,8.28088,1979.87,1979.87,1727.01,1661.51,6.8548,6.86785,1643.27,1643.27 +528529,2003.36,2080.76,8.28088,8.25887,2020.53,2020.53,1661.51,1727.01,6.86785,6.8548,1675.75,1675.75 +1060900,2177.17,2177.17,8.20031,8.20031,2165.8,2165.8,1804.69,1804.69,6.79735,6.79735,1795.26,1795.26 +2125764,2833.35,2491.61,8.12587,8.12587,2865.42,2475.08,2347.72,2064.0,6.73309,6.73309,2374.29,2050.3 +3115225,2599.48,2491.61,8.1121,8.1121,2573.67,2475.08,2153.59,2064.0,6.72062,6.72062,2132.2,2050.3 +4255969,2491.61,2491.61,7.5265,7.85359,2475.08,2475.08,2064.0,2064.0,6.23478,6.50454,2050.3,2050.3 +6235009,2164.16,2344.92,7.47318,7.690045,2193.34,2347.13,1792.54,1942.315,6.18992,6.36966,1816.71,1944.14 +8317456,2198.23,2198.23,7.85359,7.5265,2219.18,2219.18,1820.63,1820.63,6.50454,6.23478,1837.98,1837.98 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_INTSC_HEXHEX.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_INTSC_HEXHEX.csv new file mode 100644 index 0000000..51fae0b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_INTSC_HEXHEX.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_64 (raw),Base_HIP-block_64 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_64 (raw),RAJA_HIP-block_64 (smoothed),Base_HIP-block_64 (raw B/W),Base_HIP-block_64 (smoothed B/W),Base_Seq-default (raw 
B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_64 (raw B/W),RAJA_HIP-block_64 (smoothed B/W) +27,16.7606,16.9948,3.53728,3.57302,23.1954,25.3459,0.361332,0.366381,0.0762581,0.0770286,0.500055,0.546417 +125,17.0519,17.02335,3.57302,3.571575,25.3459,27.7481,0.367612,0.3669965,0.0770286,0.0769974,0.546417,0.5982050000000001 +512,16.9948,17.0519,3.57408,3.57013,30.1503,30.1503,0.366381,0.367612,0.0770515,0.0769662,0.649993,0.649993 +1000,18.3183,18.3183,3.57013,3.57302,32.4974,32.4974,0.394913,0.394913,0.0769662,0.0770286,0.700591,0.700591 +1728,19.161,19.161,3.56988,3.57013,33.6319,33.6319,0.41308,0.41308,0.0769608,0.0769662,0.72505,0.72505 +3375,19.9581,19.9581,3.5765,3.56988,34.8353,34.8353,0.430266,0.430266,0.0771036,0.0769608,0.750994,0.750994 +6859,20.5383,20.5383,3.56548,3.56988,35.8919,35.8919,0.442773,0.442773,0.0768661,0.0769608,0.773771,0.773771 +13824,20.7291,20.7291,3.55364,3.57103,36.691,36.691,0.446885,0.446885,0.0766108,0.0769857,0.790999,0.790999 +27000,20.8315,20.7685,3.57103,3.56953,36.9388,36.9388,0.449095,0.447736,0.0769857,0.0769533,0.796342,0.796342 +39304,20.7771,20.7771,3.58022,3.56953,37.2253,37.2253,0.447921,0.447921,0.0771837,0.0769533,0.802517,0.802517 +50653,20.7685,20.8315,3.56953,3.57103,37.2927,37.2927,0.447736,0.449095,0.0769533,0.0769857,0.80397,0.80397 +74088,20.8648,20.82095,3.5611,3.572325,37.3937,37.3432,0.449811,0.448866,0.0767716,0.07701355,0.806147,0.8050584999999999 +97336,20.8671,20.8648,3.57512,3.56953,37.4355,37.3937,0.449862,0.449811,0.0770738,0.0769533,0.807049,0.806147 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_LTIMES.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_LTIMES.csv new file mode 100644 index 0000000..74d682a --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_LTIMES.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 
(smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-kernel_256 (raw),RAJA_HIP-kernel_256 (smoothed),RAJA_HIP-launch_256 (raw),RAJA_HIP-launch_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-kernel_256 (raw B/W),RAJA_HIP-kernel_256 (smoothed B/W),RAJA_HIP-launch_256 (raw B/W),RAJA_HIP-launch_256 (smoothed B/W) +2496,33.6568,127.705,6.38293,6.25147,32.5743,123.045,33.2337,124.885,47.1104,177.9,8.93438,8.70866,45.5952,171.408,46.5183,173.971 +9792,127.705,217.5365,6.25147,6.171535,123.045,208.738,124.885,224.47299999999998,177.9,302.734,8.70866,8.592105,171.408,290.53249999999997,173.971,312.427 +38784,320.146,307.368,6.0916,6.0916,294.431,294.431,324.061,324.061,445.435,427.568,8.47555,8.47555,409.657,409.657,450.883,450.883 +77568,307.368,320.146,6.04761,6.04761,333.83,333.83,372.297,372.297,427.568,445.435,8.41261,8.41261,464.379,464.379,517.889,517.889 +154944,480.199,480.199,6.02887,6.02887,417.029,417.029,477.611,477.611,667.919,667.919,8.38568,8.38568,580.054,580.054,664.319,664.319 +309696,564.698,564.698,6.0219,6.0219,490.998,490.998,565.114,565.114,785.409,785.409,8.37555,8.37555,682.903,682.903,785.988,785.988 +619392,638.563,638.563,5.92931,5.98058,534.613,534.613,631.91,631.91,888.12,888.12,8.24656,8.31775,743.546,743.546,878.867,878.867 +1238784,656.516,656.516,5.98058,5.98058,538.841,538.841,643.288,643.288,913.079,913.079,8.31775,8.31775,749.416,749.416,894.681,894.681 +2477568,672.033,672.033,5.9714,5.9714,551.617,551.617,657.633,657.633,934.653,934.653,8.30493,8.30493,767.18,767.18,914.626,914.626 +3629184,687.039,682.933,5.98197,5.9714,562.389,558.576,664.526,664.526,955.521,949.809,8.31962,8.30493,782.16,776.856,924.21,924.21 +4954944,682.933,687.039,5.91045,5.91045,567.514,558.576,675.018,675.018,949.809,955.521,8.22013,8.22013,789.287,776.856,938.802,938.802 
+7258176,688.689,687.864,5.90196,5.906205,558.576,560.4825000000001,681.414,678.216,957.814,956.6675,8.20832,8.214224999999999,776.856,779.508,947.696,943.249 +9677568,688.794,688.689,5.90146,5.90196,557.427,558.576,684.472,681.414,957.959,957.814,8.20761,8.20832,775.257,776.856,951.949,947.696 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_MASS3DPA.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_MASS3DPA.csv new file mode 100644 index 0000000..ecf76fd --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_MASS3DPA.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_25 (raw),Base_HIP-block_25 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_25 (raw),RAJA_HIP-block_25 (smoothed),Base_HIP-block_25 (raw B/W),Base_HIP-block_25 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_25 (raw B/W),RAJA_HIP-block_25 (smoothed B/W) +3200,62.7348,242.112,11.2571,11.2571,61.6721,240.801,29.3042,112.881,5.25832,5.25832,28.8078,112.269 +12672,242.112,485.178,11.2927,11.21085,240.801,482.71950000000004,112.881,226.1255,5.26504,5.23036,112.269,224.979 +50624,728.244,728.244,11.1062,11.172,724.638,724.638,339.37,339.37,5.17562,5.20566,337.689,337.689 +101184,1000.83,1000.83,11.1646,11.172,994.815,994.815,466.361,466.361,5.2024,5.20566,463.558,463.558 +202368,1231.45,1231.45,11.172,11.172,1219.98,1219.98,573.802,573.802,5.20566,5.20566,568.456,568.456 +404736,1771.57,1771.57,11.2015,11.172,1774.57,1774.57,825.456,825.456,5.21928,5.20566,826.853,826.853 +809536,2195.71,2195.71,11.2108,11.172,2217.75,2217.75,1023.07,1023.07,5.22359,5.20566,1033.34,1033.34 +1619008,2529.48,2529.48,11.0919,11.0919,2546.38,2546.38,1178.58,1178.58,5.16814,5.16814,1186.46,1186.46 +3237952,2639.1,2580.96,11.0749,11.0749,2619.83,2555.09,1229.66,1202.57,5.16021,5.16021,1220.68,1190.51 
+4743104,2683.36,2580.96,11.0587,11.0617,2599.51,2555.09,1250.28,1202.57,5.15267,5.15408,1211.21,1190.51 +6475904,2580.96,2580.96,11.0617,11.0617,2555.09,2555.09,1202.57,1202.57,5.15408,5.15408,1190.51,1190.51 +9486208,2496.96,2546.27,11.0297,11.0602,2490.55,2533.9750000000004,1163.42,1186.405,5.13914,5.1533750000000005,1160.44,1180.67 +12648256,2511.58,2511.58,11.0629,11.0617,2512.86,2512.86,1170.24,1170.24,5.1546,5.15408,1170.83,1170.83 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv new file mode 100644 index 0000000..d21ecc0 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Apps_MATVEC_3D_STENCIL.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +216,2.40771,15.411,4.83791,4.83791,2.99912,18.0402,7.57793,43.2409,15.2267,13.8755,9.43932,50.6178 +1331,15.411,53.1929,4.94522,4.80405,18.0402,63.8466,43.2409,140.79145,13.8755,13.060500000000001,50.6178,168.9474 +8000,90.9748,90.9748,4.54837,4.77019,109.653,109.653,238.342,238.342,11.9161,12.2455,287.277,287.277 +17576,206.003,206.003,4.77019,4.77019,244.507,244.507,528.826,528.826,12.2455,12.0474,627.67,627.67 +35937,420.435,420.435,4.73832,4.73832,487.086,487.086,1063.56,1063.56,11.9863,11.9863,1232.16,1232.16 +79507,663.943,663.943,4.82424,4.73832,699.638,699.638,1658.04,1658.04,12.0474,11.9863,1747.18,1747.18 +157464,818.182,805.027,4.60436,4.60436,829.536,827.737,2025.36,1977.85,11.3978,11.3978,2053.46,2033.64 
+328509,805.027,805.027,2.78153,2.78153,827.737,827.737,1977.85,1977.85,6.83387,6.83387,2033.64,2033.64 +681472,937.771,809.14,1.97875,1.97875,950.518,827.737,2290.43,1977.85,4.83293,4.83293,2321.56,2033.64 +1000000,784.035,805.027,1.763,1.88907,780.45,804.134,1910.0,1967.15,4.29488,4.59264,1901.27,1954.98 +1404928,809.14,784.035,1.88907,1.88388,804.134,780.45,1967.15,1910.0,4.59264,4.57083,1954.98,1901.27 +2048383,768.05,776.0425,1.88388,1.82645,764.498,772.474,1863.51,1886.755,4.57083,4.432855,1854.89,1878.08 +2744000,708.65,768.05,1.76902,1.88388,711.109,764.498,1716.99,1863.51,4.28615,4.57083,1722.95,1854.89 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv new file mode 100644 index 0000000..f148a53 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_INDEXLIST_3LOOP.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-block_256 (raw),Base_HIP-block_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-block_256 (raw),RAJA_HIP-block_256 (smoothed),Base_HIP-block_256 (raw B/W),Base_HIP-block_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-block_256 (raw B/W),RAJA_HIP-block_256 (smoothed B/W) +160000,0.0,0.0,0.0,0.0,0.0,0.0,282.038,484.515,10.9259,10.5095,281.64,491.281 +320000,0.0,0.0,0.0,0.0,0.0,0.0,484.515,627.2565,10.5095,10.486799999999999,491.281,631.3895 +640000,0.0,0.0,0.0,0.0,0.0,0.0,769.998,769.998,10.4641,10.4641,771.498,771.498 +1280000,0.0,0.0,0.0,0.0,0.0,0.0,1098.8,1098.8,10.3463,10.3463,1121.51,1121.51 +2560000,0.0,0.0,0.0,0.0,0.0,0.0,1537.47,1537.47,9.57698,9.57698,1537.84,1537.84 +5120000,0.0,0.0,0.0,0.0,0.0,0.0,2025.0,2025.0,9.33421,9.33421,2002.31,2002.31 +7500000,0.0,0.0,0.0,0.0,0.0,0.0,2268.75,2268.75,9.21605,9.21605,2270.15,2270.15 
+10240000,0.0,0.0,0.0,0.0,0.0,0.0,2411.97,2411.97,9.14268,9.14268,2427.37,2427.37 +15000000,0.0,0.0,0.0,0.0,0.0,0.0,2557.58,2557.58,9.06695,9.06695,2543.69,2543.69 +20000000,0.0,0.0,0.0,0.0,0.0,0.0,2588.86,2577.57,9.03661,9.03661,2615.38,2577.97 +25000000,0.0,0.0,0.0,0.0,0.0,0.0,2593.46,2583.215,9.01477,9.02569,2577.97,2578.4049999999997 +30000000,0.0,0.0,0.0,0.0,0.0,0.0,2577.57,2588.86,9.00109,9.01477,2578.84,2578.84 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_MULTI_REDUCE.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_MULTI_REDUCE.csv new file mode 100644 index 0000000..cff3300 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_MULTI_REDUCE.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-atomic_direct_256 (raw),Base_HIP-atomic_direct_256 (smoothed),Base_HIP-atomic_occgs_256 (raw),Base_HIP-atomic_occgs_256 (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),RAJA_HIP-atomic_direct_256 (raw),RAJA_HIP-atomic_direct_256 (smoothed),RAJA_HIP-atomic_occgs_256 (raw),RAJA_HIP-atomic_occgs_256 (smoothed),Base_HIP-atomic_direct_256 (raw B/W),Base_HIP-atomic_direct_256 (smoothed B/W),Base_HIP-atomic_occgs_256 (raw B/W),Base_HIP-atomic_occgs_256 (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),RAJA_HIP-atomic_direct_256 (raw B/W),RAJA_HIP-atomic_direct_256 (smoothed B/W),RAJA_HIP-atomic_occgs_256 (raw B/W),RAJA_HIP-atomic_occgs_256 (smoothed B/W) +6245,0.519487,2.13172,0.51601,2.13558,0.314624,0.309117,0.502346,1.99748,0.497004,2.00488,7.75335,31.7778,7.70146,31.8354,4.69577,4.60804,7.49752,29.7767,7.4178,29.887 +24995,2.13172,5.374404999999999,2.13558,5.33478,0.309117,0.3087485,1.99748,5.129715,2.00488,5.104545,31.7778,80.09790000000001,31.8354,79.5072,4.60804,4.60186,29.7767,76.45085,29.887,76.0755 
+99995,8.61709,8.61709,8.53398,8.53398,0.30838,0.30838,8.26195,8.26195,8.20421,8.20421,128.418,128.418,127.179,127.179,4.59568,4.59568,123.125,123.125,122.264,122.264 +199995,16.7516,16.7516,16.7853,16.7853,0.308044,0.308044,16.2446,16.2446,15.5979,15.5979,249.63,249.63,250.134,250.134,4.59044,4.59044,242.075,242.075,232.439,232.439 +399995,32.6471,32.6471,33.4007,33.4007,0.307964,0.307964,30.9453,30.9453,29.5608,29.5608,486.492,486.492,497.721,497.721,4.58914,4.58914,461.132,461.132,440.501,440.501 +799995,58.2522,58.2522,58.7675,58.7675,0.307912,0.307912,54.6576,54.6576,56.7401,56.7401,868.036,868.036,875.715,875.715,4.58831,4.58831,814.472,814.472,845.504,845.504 +1599995,100.651,100.651,103.452,103.452,0.307731,0.307731,91.7972,91.7972,98.0251,98.0251,1499.82,1499.82,1541.56,1541.56,4.58558,4.58558,1367.89,1367.89,1460.7,1460.7 +3199995,130.892,130.892,133.587,133.587,0.307295,0.307295,125.281,125.281,126.487,126.487,1950.45,1950.45,1990.61,1990.61,4.57907,4.57907,1866.84,1866.84,1884.81,1884.81 +6399995,171.536,171.536,168.966,168.966,0.307179,0.307179,157.081,157.081,166.679,166.679,2556.08,2556.08,2517.79,2517.79,4.57733,4.57733,2340.7,2340.7,2483.72,2483.72 +9374995,192.555,174.457,193.002,189.216,0.307111,0.307156,179.406,158.254,190.404,187.884,2869.3,2599.61,2875.96,2819.54,4.57632,4.57698,2673.36,2358.17,2837.25,2799.69 +12799995,189.588,174.457,199.064,189.216,0.307156,0.307156,172.343,158.254,196.59,187.884,2825.08,2599.61,2966.29,2819.54,4.57698,4.57698,2568.11,2358.17,2929.42,2799.69 +18749995,174.457,182.02249999999998,189.216,191.109,0.307111,0.3071335,158.254,165.2985,187.884,189.144,2599.61,2712.3450000000003,2819.54,2847.75,4.57631,4.57665,2358.17,2463.1400000000003,2799.69,2818.4700000000003 +24999995,168.098,174.457,182.199,189.216,0.307197,0.307156,151.785,158.254,181.174,187.884,2504.85,2599.61,2714.98,2819.54,4.5776,4.57698,2261.77,2358.17,2699.7,2799.69 diff --git 
a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_REDUCE_STRUCT.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_REDUCE_STRUCT.csv new file mode 100644 index 0000000..5e5158b --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Basic_REDUCE_STRUCT.csv @@ -0,0 +1,14 @@ +Problem size,Base_HIP-blkatm_direct_256 (raw),Base_HIP-blkatm_direct_256 (smoothed),Base_HIP-blkatm_occgs_256 (raw),Base_HIP-blkatm_occgs_256 (smoothed),Base_Seq-cascade (raw),Base_Seq-cascade (smoothed),Base_Seq-default (raw),Base_Seq-default (smoothed),Base_Seq-kahan (raw),Base_Seq-kahan (smoothed),RAJA_HIP-blkatm_direct_256 (raw),RAJA_HIP-blkatm_direct_256 (smoothed),RAJA_HIP-blkatm_occgs_256 (raw),RAJA_HIP-blkatm_occgs_256 (smoothed),RAJA_HIP-blkdev_direct_256 (raw),RAJA_HIP-blkdev_direct_256 (smoothed),RAJA_HIP-blkdev_direct_new_256 (raw),RAJA_HIP-blkdev_direct_new_256 (smoothed),RAJA_HIP-blkdev_occgs_256 (raw),RAJA_HIP-blkdev_occgs_256 (smoothed),RAJA_HIP-blkdev_occgs_new_256 (raw),RAJA_HIP-blkdev_occgs_new_256 (smoothed),Base_HIP-blkatm_direct_256 (raw B/W),Base_HIP-blkatm_direct_256 (smoothed B/W),Base_HIP-blkatm_occgs_256 (raw B/W),Base_HIP-blkatm_occgs_256 (smoothed B/W),Base_Seq-cascade (raw B/W),Base_Seq-cascade (smoothed B/W),Base_Seq-default (raw B/W),Base_Seq-default (smoothed B/W),Base_Seq-kahan (raw B/W),Base_Seq-kahan (smoothed B/W),RAJA_HIP-blkatm_direct_256 (raw B/W),RAJA_HIP-blkatm_direct_256 (smoothed B/W),RAJA_HIP-blkatm_occgs_256 (raw B/W),RAJA_HIP-blkatm_occgs_256 (smoothed B/W),RAJA_HIP-blkdev_direct_256 (raw B/W),RAJA_HIP-blkdev_direct_256 (smoothed B/W),RAJA_HIP-blkdev_direct_new_256 (raw B/W),RAJA_HIP-blkdev_direct_new_256 (smoothed B/W),RAJA_HIP-blkdev_occgs_256 (raw B/W),RAJA_HIP-blkdev_occgs_256 (smoothed B/W),RAJA_HIP-blkdev_occgs_new_256 (raw B/W),RAJA_HIP-blkdev_occgs_new_256 (smoothed B/W) 
+6250,0.59889,1.53972,0.606802,1.5426,1.24252,1.26755,2.40431,2.40869,0.614436,0.61557,0.512244,2.06295,0.514221,2.06465,0.625253,1.66529,0.352658,1.0703,0.622879,1.66655,0.348036,1.06321,4.46136,11.4713,4.5203,11.4928,9.25599,9.44387,17.9107,17.946,4.57718,4.58631,3.81591,15.3696,3.83063,15.3823,4.65775,12.4069,2.62709,7.97406,4.64007,12.4162,2.59265,7.92119 +25000,1.53972,2.20374,1.5426,2.29813,1.2749,1.2664149999999998,2.45253,2.4074549999999997,0.615966,0.6156245,2.06295,4.82985,2.06465,4.889175,1.66529,4.04143,1.0703,1.68685,1.66655,4.03477,1.06321,1.6834600000000002,11.4713,16.418799999999997,11.4928,17.12205,9.4984,9.435459999999999,18.2721,17.9368,4.58912,4.5867249999999995,15.3696,35.9846,15.3823,36.426649999999995,12.4069,30.11055,7.97406,12.567779999999999,12.4162,30.060850000000002,7.92119,12.542494999999999 +100000,2.86776,2.86776,3.05366,3.05366,1.26755,1.26755,2.40869,2.40869,0.61557,0.615679,7.59675,7.59675,7.7137,7.7137,6.41757,6.41757,2.3034,2.3034,6.40299,6.40299,2.30371,2.30371,21.3663,21.3663,22.7513,22.7513,9.44387,9.44387,17.946,17.946,4.58631,4.58714,56.5996,56.5996,57.471,57.471,47.8142,47.8142,17.1615,17.1615,47.7055,47.7055,17.1638,17.1638 +200000,4.22656,3.30631,4.3503,4.3503,1.26528,1.26936,2.40622,2.41169,0.615679,0.615832,14.0159,14.0159,14.2092,14.2092,12.2768,12.2768,2.83301,2.83301,12.1731,12.1731,2.82821,2.82821,31.4902,24.6339,32.4121,32.4121,9.42705,9.45746,17.9276,17.9685,4.58714,4.58829,104.426,104.426,105.866,105.866,91.4688,91.4688,21.1074,21.1074,90.696,90.696,21.0717,21.0717 +400000,3.70616,3.30631,4.97273,4.97273,1.26936,1.26755,2.41169,2.40869,0.615832,0.615679,23.882,23.882,23.9147,23.9147,22.6015,22.6015,3.13637,3.13637,22.7224,22.7224,3.11675,3.11675,27.613,24.6339,37.0496,37.0496,9.45746,9.44387,17.9685,17.946,4.58829,4.58714,177.934,177.934,178.178,178.178,168.394,168.394,23.3677,23.3677,169.295,169.295,23.2215,23.2215 
+800000,3.30631,3.30631,9.46774,9.46774,1.27074,1.26578,2.4171,2.40622,0.615924,0.615679,31.8856,31.8856,46.665,46.665,32.3273,32.3273,3.23914,3.23914,44.199,44.199,6.15777,6.15777,24.6339,24.6339,70.54,70.54,9.46773,9.43083,18.0088,17.9276,4.58898,4.58714,237.566,237.566,347.681,347.681,240.857,240.857,24.1335,24.1335,329.308,329.308,45.8789,45.8789 +1600000,2.93059,2.93059,19.5156,19.5156,1.26578,1.26578,2.38666,2.38666,0.615345,0.615345,41.8183,41.8183,88.7308,88.7308,39.6132,39.6132,3.29018,3.26116,80.3859,80.3859,12.1531,12.1531,21.8346,21.8346,145.402,145.402,9.43083,9.43083,17.782,17.782,4.58467,4.58467,311.57,311.57,661.095,661.095,295.141,295.141,24.5137,24.2975,598.921,598.921,90.5478,90.5478 +3200000,2.89119,2.90154,41.1232,41.1232,1.25623,1.25701,2.31924,2.31924,0.61393,0.61393,49.5105,49.5105,146.487,146.487,44.5489,44.5489,3.28374,3.26116,133.068,133.068,23.2031,23.2031,21.541,21.6182,306.391,306.391,9.35962,9.36547,17.2797,17.2797,4.57414,4.57414,368.882,368.882,1091.42,1091.42,331.915,331.915,24.4658,24.2975,991.432,991.432,172.877,172.877 +6400000,2.90154,2.89119,76.9726,76.9726,1.25701,1.25623,2.29845,2.29845,0.613712,0.613712,55.167,55.167,231.239,231.239,48.8176,48.8176,3.26116,3.26116,210.024,210.024,43.2192,43.2192,21.6182,21.541,573.49,573.49,9.36547,9.35962,17.1248,17.1248,4.57251,4.57251,411.026,411.026,1722.86,1722.86,363.719,363.719,24.2975,24.2975,1564.8,1564.8,322.008,322.008 +9375000,2.87306,2.87306,109.669,109.669,1.255,1.25623,2.28275,2.29845,0.613394,0.613712,57.0132,55.8227,270.833,270.833,49.9782,49.7044,3.10041,3.18108,257.118,257.118,60.958,60.958,21.406,21.406,817.096,817.096,9.35046,9.35962,17.0078,17.1248,4.57014,4.57251,424.781,415.911,2017.87,2017.87,372.367,370.326,23.0999,23.7009,1915.68,1915.68,454.172,454.172 
+12800000,2.60499,2.60499,123.859,123.859,1.25472,1.25686,2.28292,2.29845,0.613316,0.613712,55.8227,56.3103,293.988,288.97,49.7044,49.7276,3.18108,3.11471,272.943,269.415,73.1521,73.1521,19.4087,19.4087,922.82,922.82,9.34837,9.36435,17.0091,17.1248,4.56956,4.57251,415.911,419.544,2190.38,2153.0,370.326,370.5,23.7009,23.2064,2033.58,2007.29,545.025,545.025 +18750000,2.58935,2.59717,144.703,134.281,1.25686,1.25593,2.30926,2.29609,0.613792,0.613593,56.7512,56.53075,288.97,291.47900000000004,49.7276,49.8047,3.11471,3.1075600000000003,269.415,271.179,90.5263,81.8392,19.2922,19.350450000000002,1078.12,1000.47,9.36435,9.357405,17.2053,17.1072,4.57311,4.571625,422.829,421.1865,2153.0,2171.69,370.5,371.0745,23.2064,23.15315,2007.29,2020.435,674.473,609.749 +25000000,2.58168,2.58935,157.426,144.703,1.25716,1.25686,2.31526,2.30926,0.613845,0.613792,56.3103,56.3103,297.825,293.988,49.8818,49.7276,2.89551,3.11471,282.985,272.943,102.929,90.5263,19.2351,19.2922,1172.91,1078.12,9.36658,9.36435,17.25,17.2053,4.5735,4.57311,419.544,419.544,2218.97,2190.38,371.649,370.5,21.5732,23.2064,2108.4,2033.58,766.882,674.473 diff --git a/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv new file mode 100644 index 0000000..5e48aa3 --- /dev/null +++ b/docs/13_rajaperf/baseline_data/RPBenchmark_MI300A_tier2-SPX/saturation-curve-data/Comm_HALO_PACKING_FUSED.csv @@ -0,0 +1,13 @@ +Problem size,Base_HIP-direct_1024 (raw),Base_HIP-direct_1024 (smoothed),Base_Seq-direct (raw),Base_Seq-direct (smoothed),RAJA_HIP-direct_1024 (raw),RAJA_HIP-direct_1024 (smoothed),RAJA_HIP-funcptr_1024 (raw),RAJA_HIP-funcptr_1024 (smoothed),RAJA_HIP-virtfunc_1024 (raw),RAJA_HIP-virtfunc_1024 (smoothed),Base_HIP-direct_1024 (raw B/W),Base_HIP-direct_1024 (smoothed B/W),Base_Seq-direct (raw B/W),Base_Seq-direct (smoothed B/W),RAJA_HIP-direct_1024 (raw 
B/W),RAJA_HIP-direct_1024 (smoothed B/W),RAJA_HIP-funcptr_1024 (raw B/W),RAJA_HIP-funcptr_1024 (smoothed B/W),RAJA_HIP-virtfunc_1024 (raw B/W),RAJA_HIP-virtfunc_1024 (smoothed B/W) +91125,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,53.049,81.0342,30.503,28.801,43.7518,70.0771,46.6773,73.2531,45.935,71.0136 +205379,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,81.0342,106.1101,28.2635,28.532249999999998,70.0771,90.58005,73.2531,96.31555,71.0136,93.29929999999999 +421875,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,131.186,131.186,28.801,28.2635,111.083,111.083,119.378,119.378,115.585,115.585 +884736,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,195.121,195.121,27.1852,27.1852,160.986,160.986,174.266,174.266,165.913,165.913 +1860867,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,305.984,305.984,26.9538,26.9538,251.596,251.596,270.63,270.63,263.685,263.685 +3796416,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,451.394,451.394,22.6057,22.6057,364.717,364.717,407.436,407.436,388.323,388.323 +5639752,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,546.885,546.885,14.3594,14.3594,473.418,473.418,499.463,499.463,476.998,476.998 +7762392,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,557.471,557.471,8.92213,8.92213,495.627,495.627,528.494,528.494,513.647,513.647 +11543176,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,719.735,719.735,8.25019,8.25019,670.95,670.95,670.952,670.952,646.866,646.866 +15438249,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,798.716,798.716,7.70923,7.70923,748.537,748.537,736.716,736.716,712.972,712.972 +19465109,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,861.82,830.268,7.3292,7.519215,787.955,768.2460000000001,797.128,766.922,779.828,746.4 +23393656,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,863.478,861.82,3.9391,7.3292,807.196,787.955,801.537,797.128,783.349,779.828 diff --git a/docs/13_rajaperf/rajaperf.rst b/docs/13_rajaperf/rajaperf.rst index b26a66c..026c652 100644 --- a/docs/13_rajaperf/rajaperf.rst +++ b/docs/13_rajaperf/rajaperf.rst @@ -2,27 +2,34 @@ RAJA Performance Suite ********************** -RAJA 
Performance Suite source code is near-final at this point. It will be -released soon along with benchmark baseline data and instructions for running -the benchmark and generating evaluation metrics. - The RAJA Performance Suite contains a variety of numerical kernels that represent important computational patterns found in HPC applications. It is a companion project to RAJA, which is a library of software abstractions used by -developers of C++ applications to write portable, single-source code. The RAJA -Performance Suite enables performance experiments and comparisons for kernel -variants that use RAJA and those that do not. +developers of C++ applications to write portable, *single-source* code. Each +kernel in the Suite has multiple implementations using common parallel +programming models, such as OpenMP and CUDA, including RAJA and non-RAJA +(often referred to as Base) variants. +The RAJA Performance Suite enables a wide range of performance experiments and +comparisons for kernel variants, compilers, etc. + +.. important:: The RAJA Performance Suite Benchmark is limited to a subset of + kernels in the RAJA Performance Suite described in + :ref:`rajaperf_problems-label`. -Source code and documentation for RAJA and the RAJA Performance Suite is -available at: +The `RAJAPerf-Benchmark GitHub repo `_ +contains the source code, performance baseline data files, run scripts, +and data processing scripts for the RAJA Performance Suite Benchmark. It includes +the RAJA Performance Suite repo as a submodule which, in turn, contains RAJA as a +submodule. When the benchmark project repo is cloned recursively, everything +necessary to build and run the benchmark is included. Detailed instructions are +included in :ref:`rajaperf_build-label` and :ref:`rajaperf_run-label`. 
- * `RAJA Performance Suite GitHub project <https://github.com/LLNL/RAJAPerf>`_ +Additional information about the RAJA Performance Suite and RAJA is available +at these links: - * `RAJA GitHub project <https://github.com/LLNL/RAJA>`_ + * `RAJA Performance Suite GitHub repo <https://github.com/LLNL/RAJAPerf>`_ -.. important:: The RAJA Performance Suite benchmark is limited to a subset of - kernels in the RAJA Performance Suite as described in - :ref:`rajaperf_problems-label`. + * `RAJA GitHub repo <https://github.com/LLNL/RAJA>`_ Purpose @@ -30,59 +37,39 @@ Purpose The main purpose of the RAJA Performance Suite is to analyze performance of loop-based computational kernels representative of those found in HPC -applications and which are implemented using `RAJA <https://github.com/LLNL/RAJA>`_. -The kernels in the Suite originate from different sources ranging from -open-source HPC benchmarks to restricted-access production applications. -Kernels exercise various loop structures as well as parallel operations such -as reductions, atomics, scans, and sorts. +applications and to compare implementation variants. The kernels in +the Suite originate from various sources ranging from open-source HPC +benchmarks to restricted-access production applications. Kernels exercise +a variety of loop structures and important parallel operations such as +reductions, atomics, scans, and sorts. Each kernel in the Suite appears in RAJA and non-RAJA variants that exercise -common programming models, such as OpenMP, CUDA, HIP, and SYCL. Performance +common programming models, such as OpenMP, CUDA, and HIP. Performance comparisons between RAJA and non-RAJA variants are helpful to improve RAJA -implementation and to identify impacts C++ abstractions have on compilers' -ability to optimize. Often, kernels in the Suite serve as collaboration tools -enabling the RAJA team to work with vendors to resolve performance issues -observed in production applications that use RAJA.
- -To more closely align execution of kernels in the Suite with how they would -run in the context of a full application, benchmark runs must be done using -multiple MPI ranks to ensure that all resources on a compute node are being -exercised and avoid misrepresentation of kernel and node performance. RAJA is -a potential *X* in the often referred to *MPI + X* parallel application -paradigm, where MPI is used for coarse-grained, distributed memory parallelism -and X (e.g., RAJA) supports fine-grained parallelism within an MPI rank. The -RAJA Performance Suite can be configured with MPI so that execution of kernels -in the Suite represents how those kernels would be exercised in an MPI + X HPC -application. When the RAJA Performance Suite is run using multiple MPI ranks, -the same kernel code is executed on each rank. Synchronization and -communication across ranks involves only sending execution timing information -to rank zero for reporting purposes. - -.. important:: For RAJA Performance Suite benchmark execution, MPI must be used - to run to ensure that all resources on a compute node are being - exercised and avoid misrepresentation of kernel and node - performance. This is described in the instructions provided in - :ref:`rajaperf_run-label`. +implementations and to identify impacts that C++ abstractions have on compilers' +abilities to optimize. The Suite serves as an important collaboration tool +between the RAJA team and vendors to resolve performance issues observed in +production applications that use RAJA. Characteristics =============== -The `RAJA Performance Suite GitHub project `_ -contains the code for all the Suite kernels and all essential external software -dependencies in Git submodules. Thus, dependency versions are pinned to each -version of the Suite. Building the Suite requires an installation of CMake for -configuring a build, a C++17 compliant compiler to build the code, and an MPI -library installation when MPI is to be used. 
- -The Suite can be run in a myriad of ways by specifying parameters and options -as command-line arguments. The intent is that one can build the code and -use scripts to execute multiple Suite runs to generate data for a desired -performance experiment. +`RAJAPerf-Benchmark GitHub repo `_ +contains everything needed to build and run the benchmark. This includes +the RAJA Performance Suite and RAJA software dependencies in Git submodules and +scripts to build, run, and analyze output data. Thus, all +dependency versions are pinned to each version of the benchmark. Building +the RAJA Performance Suite code requires CMake to configure a build, a C++17 +(soon to require C++20) compliant compiler to build the code, and an MPI library +installation to link against. -In particular, variants, problem sizes, etc. for the kernels can be set by a -user from the command line. Specific instructions for running the RAJA -Performance Suite benchmark are described in :ref:`rajaperf_run-label`. +The Suite can be run in a myriad of ways via command-line options and their +arguments. The intent is that after compiling the code, simple scripts can be +written to execute necessary Suite runs to generate data for desired performance +experiments. Instructions for getting the code for the RAJA Performance Suite +Benchmark, building it, and running it are described in +:ref:`rajaperf_build-label` and :ref:`rajaperf_run-label`. .. _rajaperf_problems-label: @@ -90,24 +77,32 @@ Performance Suite benchmark are described in :ref:`rajaperf_run-label`. Problems -------- -The RAJA Performance Suite benchmark is limited to a subset of kernels in the -full Suite to focus on some of the more important computational patterns found -in LLNL applications. The subset of kernels is described. +The RAJA Performance Suite Benchmark consists of a subset of kernels in the +full Suite that focus on some key computational patterns found in LLNL +applications. 
The benchmark kernels are partitioned into two priority levels as +described below, along with notable features and RAJA constructs used in each +kernel (in parentheses). + +.. note:: In the RAJA Performance Suite repository, each kernel contains a + detailed reference description near the top of the header file for + the kernel class; i.e., C++ header file named ``.hpp``. + The reference description is a C-style sequential implementation of + the kernel in a comment section near the top of the file. + +The RAJA Performance Suite Benchmark kernels are partitioned into two +priority levels described below. -.. note:: Each kernel contains a complete reference description located in the - header file for the kernel object ``.hpp``. The - reference is a C-style sequential implementation of the kernel in - a comment section near the top of the header file. Priority 1 kernels ^^^^^^^^^^^^^^^^^^^ -*Apps* group (directory src/apps) +*Priority 1* kernels are most important to us. They are located in the +``RAJAPerf/src/apps`` sub-directory: #. **DIFFUSION3DPA** element-wise action of a 3D finite element volume diffusion operator via partial assembly and sum factorization *(nested loops, GPU shared memory, RAJA::launch API)* #. **EDGE3D** stiffness matrix assembly for a 3D MHD calculation *(single loop with included function call, RAJA::forall API)* #. **ENERGY** internal energy calculation from an explicit hydrodynamics algorithm; *(multiple single-loop operations in sequence, conditional logic for correctness checks and cutoffs, RAJA::forall API)* - #. **FEMSWEEP** finite element implementation of linear sweep algorithm used in radiation transport *(nested loops, RAJA::launch API)* + #. **FEMSWEEP** finite element implementation of linear sweep algorithm used in radiation transport, with a register-heavy LU solver *(nested loops, RAJA::launch API)* #. 
**INTSC_HEXRECT** intersection between a 24-sided hexahedron and a rectangular solid, including volume and moment calculations *(single loop, RAJA::forall API)* #. **MASS3DEA** element assembly of a 3D finite element mass matrix *(nested loops, GPU shared memory, RAJA::launch API)* #. **MASS3DPA_ATOMIC** action of a 3D finite element mass matrix on elements with shared DOFs via partial assembly and sum factorization *(nested loops, GPU shared memory, RAJA::launch API)* @@ -119,16 +114,20 @@ Priority 1 kernels Priority 2 kernels ^^^^^^^^^^^^^^^^^^^ - #. **Apps/CONVECTION3DPA** element-wise action of a 3D finite element volume convection operator via partial assembly and sum factorization *(nested loops, GPU shared memory, RAJA::launch API)* - #. **Apps/DEL_DOT_VEC_2D** divergence of a vector field at a set of points on a mesh *(single loop, data access via indirection array, RAJA::forall API)* - #. **Apps/INTSC_HEXHEX** intersection between two 24-sided hexahedra, including volume and moment calculations *(multiple single-loop operations in sequence, RAJA::forall API)* - #. **Apps/LTIMES** one step of the source-iteration technique for solving the steady-state linear Boltzmann equation, multi-dimensional matrix product *(nested loops, RAJA::kernel API)* - #. **Apps/MASS3DPA** element-wise action of a 3D finite element mass matrix via partial assembly and sum factorization *(nested loops, GPU shared memory, RAJA::launch API)* - #. **Apps/MATVEC_3D_STENCIL** matrix-vector product based on a 3D mesh stencil *(single loop, data access via indirection array, RAJA::forall API)* - #. **Basic/MULTI_REDUCE** multiple reductions in a kernel, where number of reductions is set at run time *(single loop, irregular atomic contention, RAJA::forall API)* - #. **Basic/REDUCE_STRUCT** multiple reductions in a kernel, where number of reductions (6) is known at compile time *(single loop, multiple reductions, RAJA::forall API)* - #. 
**Basic/INDEXLIST_3LOOP** construction of set of indices used in other kernel executions *(single loops, vendor scan implementations, RAJA::forall API)* - #. **Comm/HALO_PACKING_FUSED** packing and unpacking MPI message buffers for point-to-point distributed memory halo data exchange for mesh-based codes *(overhead of launching many small kernels, GPU variants use RAJA::Workgroup concepts to execute multiple kernels with one launch)* +*Priority 2* kernels are also important, but less so than the *Priority 1* +kernels listed above. *Priority 2* kernels are listed below and are located in +the ``RAJAPerf/src`` sub-directories noted: + + #. **apps/CONVECTION3DPA** element-wise action of a 3D finite element volume convection operator via partial assembly and sum factorization *(nested loops, GPU shared memory, RAJA::launch API)* + #. **apps/DEL_DOT_VEC_2D** divergence of a vector field at a set of points on a mesh *(single loop, data access via indirection array, RAJA::forall API)* + #. **apps/INTSC_HEXHEX** intersection between two 24-sided hexahedra, including volume and moment calculations *(multiple single-loop operations in sequence, RAJA::forall API)* + #. **apps/LTIMES** one step of the source-iteration technique for solving the steady-state linear Boltzmann equation, multi-dimensional matrix product *(nested loops, RAJA::kernel API)* + #. **apps/MASS3DPA** element-wise action of a 3D finite element mass matrix via partial assembly and sum factorization *(nested loops, GPU shared memory, RAJA::launch API)* + #. **apps/MATVEC_3D_STENCIL** matrix-vector product based on a 3D mesh stencil *(single loop, data access via indirection array, RAJA::forall API)* + #. **basic/MULTI_REDUCE** multiple reductions in a kernel, where number of reductions is set at run time *(single loop, irregular atomic contention, RAJA::forall API)* + #. 
**basic/REDUCE_STRUCT** multiple reductions in a kernel, where number of reductions (6) is known at compile time *(single loop, multiple reductions, RAJA::forall API)* + #. **basic/INDEXLIST_3LOOP** construction of set of indices used in other kernel executions *(single loops, vendor scan implementations, RAJA::forall API)* + #. **comm/HALO_PACKING_FUSED** packing and unpacking MPI message buffers for point-to-point distributed memory halo data exchange for mesh-based codes *(overhead of launching many small kernels, GPU variants use RAJA::Workgroup concepts to execute multiple kernels with one launch)* .. _rajaperf_fom-label: @@ -136,11 +135,65 @@ Priority 2 kernels Figure of Merit --------------- -There are two figures of merit (FOM) for each benchmark kernel: execution time -and memory bandwidth..... **fill this in*** - -**Describe how to set problem size based on architecture and how key output quantities are computed.....*** - +The figure of merit (FOM) for each kernel is determined by the problem size at +which the kernel *saturates* resources on a *single* compute node. That is, +the problem size at which a computational throughput curve becomes flat, with +zero derivative, and beyond which running larger problem sizes does not yield +an increase in compute rate. The FOM for each kernel includes 3 numerical +values: + + * the saturation problem size (GB) + * the compute rate (GFLOP/sec) at the saturation problem size + * the memory bandwidth (GB/sec) at the saturation problem size + +.. important:: In the results presented in :ref:`rajaperf_results-label`, + problem size is computed individually for each kernel based on + a requested memory allocation size. The concept of size is + subjective and depends on what one is looking for. We discuss + how we determine problem sizes for the kernels in the RAJA + Performance Suite in ``_ + +When the Suite is run, problem size, compute rate, and memory bandwidth, among +other data are reported in output files. 
We provide a Python script that can +traverse the contents of an output directory and generate condensed summary +files, throughput plots, and FOM information. Usage of the script is +detailed below. + +Computational throughput may be visualized using a plot where compute rate, +such as GFLOP/sec (vertical axis), is plotted as a function of problem size on +the horizontal axis. Ideally, such a curve will be monotonically +increasing and transition to a flat, horizontal line. Then, the saturation point +is the problem size at which the derivative of the throughput curve becomes zero. +In reality, throughput curves are often non-monotonic or do not have a +strictly zero derivative for all points beyond some problem size. Therefore, we +apply a simple median-based smoothing algorithm to the throughput curve data +and heuristically estimate the saturation point based on the smoothed +throughput curve. The details of our approach are documented in the +``process_data.py`` script in the +`RAJAPerf-Benchmark GitHub repo `_, +which we use in :ref:`rajaperf_results-label`. + +Lastly, we emphasize that we want the kernels to be run in an execution +environment that aligns with how they would run if part of a real application. +Thus, the Suite should be run **using multiple MPI ranks** so that all +resources on a compute node are being exercised in a way that is +representative of how an application would run. + +All applications that use RAJA use it in the *MPI + X* parallel application +paradigm, where MPI is used for coarse-grained, distributed memory parallelism +and X (RAJA in this case) supports fine-grained parallelism within each MPI +rank. The RAJA Performance Suite can be configured with MPI so that execution +of kernels in the Suite follows the *MPI + X* application paradigm.
When a +kernel is run using multiple MPI ranks, the same code executes simultaneously +on each, and synchronization and communication among ranks involve only +sending execution timing information from each rank to rank zero for reporting +purposes. + +.. important:: For RAJA Performance Suite benchmark execution, + **MPI must be used** to ensure that all resources on a + compute node are being exercised so as to avoid misrepresentation + of kernel and node performance. This is described in + :ref:`rajaperf_run-label`. .. _rajaperf_codemod-label: @@ -153,12 +206,13 @@ For the RAJA Performance Suite, we define the following restrictions on source code modifications: * While source code changes to the RAJA Performance Suite kernels and to RAJA - can be proposed, RAJA may not be removed from *RAJA kernel variants* in the - Suite or replaced with any other library. The *Base kernel variants* in the - Suite are provided to show how each kernel could be implemented directly - in the corresponding programming model back-end without the RAJA abstraction - layer. Apart from some special cases, the RAJA and Base variants for each - kernel should perform the same computation. + can be proposed (for example, to improve performance), RAJA may not be + removed from *RAJA kernel variants* in the Suite or replaced with any other + library. The *non-RAJA kernel variants* in the Suite are provided to show how + each kernel can be implemented directly in the corresponding programming + model back-end without the RAJA abstraction layer. Apart from some special + cases, the RAJA and non-RAJA variants for each kernel should execute the + same operations. .. _rajaperf_build-label: @@ -166,23 +220,41 @@ code modifications: Building ======== -The RAJA Performance Suite uses a CMake-based system to configure the code for -compilation. As noted earlier, all non-system related software dependencies are -included in the RAJA Performance Suite repository as Git submodules.
+Getting the code +---------------- + +All non-system related software dependencies needed to compile and run the +benchmark are contained in the +`RAJAPerf-Benchmark GitHub repo `_ +as Git submodules. The ``v2026.04.1`` version of the repo is the +current version and was used to generate the baseline data described in +:ref:`rajaperf_results-label`. + +The following command can be used to clone the GitHub repo:: + + $ git clone --recursive git@github.com:llnl/RAJAPerf-Benchmark.git -The current RAJA Performance Suite benchmark uses the ``v2025.12.0`` version of -the code. When the git repository is cloned, you will be on the ``develop`` -branch, which is the default RAJA Performance Suite branch. To get a local copy -of this version of the code and the correct versions of submodules:: +This will clone the repo into your local directory and put you on the ``main`` +branch of the benchmark repo, which is the default branch. To get a local copy +of the version used to generate the baselines, execute the following commands:: - $ git clone --recursive https://github.com/LLNL/RAJAPerf.git - $ git checkout v2025.12.0 - $ git submodule update --init --recursive + $ git checkout v2026.04.1 + $ git submodule update --init --recursive -When building the RAJA Performance Suite, RAJA and the RAJA Performance Suite -are built together using the same CMake configuration. The basic process for -specifying a configuration and generating a build space is to create a build -directory and run CMake in it with the proper options. For example:: +This will ensure that you have the proper versions of the RAJAPerf and RAJA +submodules in your repo clone. + + +Configuration and compilation +------------------------------ + +The RAJA Performance Suite uses a CMake-based system to configure the code for +compilation.
When building the RAJA Performance Suite, RAJA and the RAJA +Performance Suite are built together with the same CMake configuration which +is specified at the RAJA Performance Suite level. +The generic process for specifying a configuration and generating a build space +is to create a build directory and run CMake in it with the proper options. +For example:: $ pwd path/to/RAJAPerf @@ -191,31 +263,56 @@ directory and run CMake in it with the proper options. For example:: $ cmake .. $ make -j (or make -j to build with a specified number of cores) -For convenience and informational purposes, configuration scripts are maintained -in the ``RAJAPerf/scripts`` subdirectories for various build configurations. -For example, the ``RAJAPerf/scripts/lc-builds`` directory contains scripts that -can be used to generate build configurations for machines in the Livermore -Computing (LC) Center at Lawrence Livermore National Laboratory. These scripts -are to be run in the top-level RAJAPerf directory. Each script creates a -descriptively-named build space directory and runs CMake with a configuration -appropriate for the platform and specified compiler(s) indicated by the build -script name. For example, to build the code to generate baseline data on the -El Capitan system:: +For convenience and informational purposes, we maintain configuration scripts +in ``RAJAPerf/scripts`` subdirectories for various builds. For example, the +``RAJAPerf/scripts/lc-builds`` directory contains scripts that we use to +generate build configurations for machines in the Livermore Computing (LC) +Center at Lawrence Livermore National Laboratory for basic development. +These scripts are run in the top-level RAJAPerf directory. Each script creates +a descriptively-named build space directory and runs CMake to generate a build +space appropriate for the +platform and compiler(s) indicated by the script name and arguments passed to +it. 
Executing a script with no arguments will print a message indicating +which arguments are required. + +.. _rajaperf_build_mi300a-label: + +MI300A architecture +-------------------- + +To configure and build the code to generate baseline data on a system with +AMD MI300A processors (i.e., ATS-4 (El Capitan) architecture) discussed in +:ref:`rajaperf_results-label`, we ran the following commands:: $ pwd path/to/RAJAPerf $ ./scripts/lc-builds/toss4_cray-mpich_amdclang.sh 9.0.1 6.4.3 gfx942 - $ build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942 + $ cd build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942 + $ make -j + +Specifically, we configured and compiled the code for execution using version +9.0.1 of the Cray MPICH MPI library and the AMD clang compiler with ROCm +version 6.4.3 targeting GPU compute architecture gfx942. + +.. _rajaperf_build_h100-label: + +H100 architecture +-------------------- + +To configure and build the code to generate baseline data on a system with +NVIDIA H100 processors discussed in :ref:`rajaperf_results-label`, we ran the +following commands:: + + $ pwd + path/to/RAJAPerf + $ ./scripts/lc-builds/toss4_mvapich2_nvcc_gcc.sh 2.3.7 12.9.1 90 10.3.1 + $ cd build_lc_toss4-mvapich2-2.3.7-nvcc-12.9.1-90-gcc-10.3.1 $ make -j -This will build the code for CPU-GPU execution using the system-installed -version 9.0.1 of the Cray MPICH MPI library with the version 6.4.3 of the AMD -clang compiler (ROCm version 6.4.3) targeting GPU compute architecture gfx942, -which is appropriate for the AMD MI300A APU hardware on El Capitan. Please -consult the build script files in the ``RAJAPerf/scripts/lc-builds`` directory -for hints at building the code for other architectures and compilers. -Additional information on build configurations is described in the -`RAJA Performance Suite User Guide `_ for the version of the code in which you are interested. 
+Specifically, we configured and compiled the code for execution using version +2.3.7 of the MVAPICH2 MPI library, version 12.9.1 of the nvcc compiler for CUDA +targeting GPU compute architecture sm_90, and version 10.3.1 of the GNU compiler +for compiling host code. .. _rajaperf_run-label: @@ -223,62 +320,436 @@ Additional information on build configurations is described in the Running ======= -After the code is built, the executable will located in the ``bin`` directory -of the build space. Continuing the El Capitan example above:: +After the RAJA Performance Suite code is built, the executable will be located +in the ``bin`` subdirectory of the build space. + +To get information about how to run the code, use the *help option*:: $ pwd - path/to/build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942 + path/to/RAJAPerf + $ cd my-build $ ls bin rajaperf.exe + $ ./bin/rajaperf.exe --help (or -h) -To get usage information:: - - $ path/to/rajaperf.exe --help (or -h) - -This command will print all available command-line options along with potential -arguments and defaults. Options are avail to print information about the Suite, -to select output directory and file details, to select kernels and variants to -run, and how they are run (problem sizes, # times each kernel is run, data +This will print all available command-line options along with potential +arguments and defaults. Available options allow one to print information about +the kernels in the Suite, to select output directory and file details, to +select kernels and variants to run, to define how kernels are run (problem +sizes, # times each kernel is run to collect min/max/avg timing data, data spaces to use for array allocation, etc.). All arguments are optional. If no arguments are specified, the suite will run all kernels in their default -configurations for the variants that are available for the way the code -is configured to build. 
- -The script to run the benchmark for generating baselines for EL Capitan is -described in :ref:`rajaperf_results-label`. A similar recipe should be followed -for benchmarking other systems. +configurations for the variants that are available based on the way the code +was compiled. +In :ref:`rajaperf_results-label`, we provide the exact commands we used to +run the code and generate the baseline results for the benchmark. .. _rajaperf_validation-label: Validation ========== -Each kernel and variant run generates a checksum value based on kernel execution -output, such as an output data array computed by the kernel. The checksum +Each kernel variant run generates a checksum value based on the result of its +execution, such as an output data array computed by the kernel. The checksum depends on the problem size run for the kernel; thus, each checksum is -computed at run time. Validation criteria is defined in terms of the checksum +computed at run time. Validation criteria are defined in terms of the checksum difference between each kernel variant and problem size run and a corresponding -reference variant. The ``Base_Seq`` variant is used to define the -reference checksum and so that variant should be run for each kernel as part of -a performance study. Each kernel is annotated in the source code as to whether -the checksum for each variant is expected to match the reference checksum -exactly, or to be within some tolerance due to order of operation differences -when run in parallel. +reference variant. The reference variant is the baseline sequential (CPU) +variant for each kernel. The run scripts, described below, execute the baseline +sequential variant in addition to the benchmark variants to validate the answers +of the benchmark variants. -Whether the checksum for each kernel is considered to be within its expected -tolerance is reported as checksum ``PASSED`` or ``FAILED`` in the output files. 
+Each kernel is annotated in the source code as to whether the checksum for +each variant is expected to match the reference checksum exactly, or to be +within some tolerance due to order of operation or other differences when run in +parallel. Whether the checksum for a kernel is within its expected tolerance +is reported as checksum ``PASSED`` or ``FAILED`` in the checksum output files. -**Show an example of this for the EL Capitan baseline runs!!** - -**Reminder: add more accurate Base_Seq summation tunings (left fold is inaccurate for large problem sizes).** .. _rajaperf_results-label: Example Benchmark Results =========================== -**Include tables of results of El Capitan baseline results** +As stated earlier, we are mainly interested in single-node performance +with this benchmark. To generate throughput curves and estimate +saturation points, we use a bash shell script to run the code on each +platform and a Python script to process the data to construct throughput +plots, estimate saturation points, and make CSV files for tables of results. +These scripts are also available in the +`RAJAPerf-Benchmark GitHub repo `_. +The scripts and results discussed here are located in the ``scripts/2026-FCR`` +directory there. + +.. important:: In the following sections, we present detailed results, + including FOM tables and throughput plots for the Priority 1 + kernels described above. For completeness, we also include a + brief summary of results for Priority 2 kernels in less detail. + Data files containing results for all kernels run are included + in this repository. + +AMD MI300A throughput results (Priority 1 kernels) +---------------------------------------------------- + +For the MI300A architecture, we present two sets of throughput results. One is +run in ``SPX mode`` where we use 4 MPI ranks on a node, one for each MI300A APU, +and treat each APU as a single GPU. 
The other is run in +``CPX mode`` where we run with 24 MPI ranks on a node, six for each MI300A +APU, and treat each APU as 6 GPUs (one GPU = 1 XCD). In each case, we run +each kernel over a sequence of problem sizes such that the saturation point is +evident on its associated throughput curve. + +SPX mode (Priority 1) +^^^^^^^^^^^^^^^^^^^^^^ + +For SPX mode (run with 1 MPI rank per APU on a node), we choose the smallest +problem to use ~100,000 bytes of allocated memory and the largest problem +to use ~400MB of allocated memory, which is about 1.5 times the MALL +(Memory Attached Last-Level cache) size on the MI300A. The MALL is 256 MB +(256 * 1024 * 1024 = 268435456 bytes). + +Note that for two of the kernels ``FEMSWEEP`` and ``MASS3DEA``, we ran a +different problem size range because these kernels don't clearly saturate. +For them, we chose the smallest problem to use ~3.2MB of allocated +memory and the largest problem to use ~600MB memory, which is over twice as +large as the MALL. + +After building the code as described in :ref:`rajaperf_build_mi300a-label`, we +run the ``Priority 1`` kernels in **SPX mode** as follows:: + + $ pwd + path/to/RAJAPerf + $ cd build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942 + $ ./run_tier_mi300a.sh spx tier1 + +This generates a directory named ``RPBenchmark_MI300A_tier1-SPX``, which +contains the results files for each kernel run over its range of problem sizes. + +Then, we process the data for reporting the results in a concise form +by running a Python script we provide:: + + $ pwd + path/to/RAJAPerf + $ python3 path/to/process_data.py --root-dir path/to/build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX --output-dir path/to/build_lc_toss4-cray-mpich-9.0.1-amdclang-6.4.3-gfx942/RPBenchmark_MI300A_tier1-SPX/Output + +This generates throughput curve files for ``Base_HIP`` and ``RAJA_HIP`` +variants of each kernel and summarizes the FOM (described in +:ref:`rajaperf_fom-label`) in a CSV file. 
These files will be located in the +directory specified via the ``--output-dir`` option above. We include +the files generated by the ``process_data.py`` script ` here `_ + + * `RAJA GitHub project `_ + +Other helpful references include: + + * Olga Pearce, Jason Burmark, Rich Hornung, Befikir Bogale, Ian Lumsden, Michael McKinsey, Dewi Yokelson, David Boehme, Stephanie Brink, Michela Taufer, Tom Scogland, "RAJA Performance Suite: Performance Portability Analysis with Caliper and Thicket", in 2024 IEEE/ACM International Workshop on Performance, Portability and Productivity in HPC (P3HPC) at the International Conference on High Performance Computing, Network, Storage, and Analysis (SC-W 2024). [Download here](https://dl.acm.org/doi/pdf/10.1109/SCW63240.2024.00162) + + * D. A. Beckingsale, J. Burmark, R. Hornung, H. Jones, W. Killian, A. J. Kunen, O. Pearce, P. Robinson, B. S. Ryujin, T. R. W. Scogland, "RAJA: Portable Performance for Large-Scale Scientific Applications", 2019 IEEE/ACM International Workshop on Performance, Portability and Productivity in HPC (P3HPC). [Download here](https://conferences.computer.org/sc19w/2019/#!/toc/14) + + * Arturo Vargas, Thomas M. Stitt, Kenneth Weiss, Vladimir Z. Tomov, Jean-Sylvain Camier, Tzanio Kolev, Robert N. Rieben, "Matrix-free Approaches for GPU Acceleration of a High-order Finite Element Hydrodynamic Application using MFEM, Umpire, and RAJA", International Journal of High Performance Computing Applications. 36(4):492-509 (2022). [Download here](https://journals.sagepub.com/doi/10.1177/10943420221100262) diff --git a/docs/50_miniem/build--hops.sh b/docs/50_miniem/build--hops.sh new file mode 100755 index 0000000..2bd761a --- /dev/null +++ b/docs/50_miniem/build--hops.sh @@ -0,0 +1,27 @@ +#!/bin/sh +# spack env create miniem-hops-env +. 
"${SPACK_ROOT}/share/spack/setup-env.sh" +spack cd -e miniem-hops-env +spacktivate -p miniem-hops-env + +# spack compiler find + +# spack external find curl +# spack external find openssl +# spack external find openmpi +# spack external find gettext +# spack external find ncurses +# spack external find perl +# spack external find m4 + +spack add ninja +spack add cmake +spack add yaml-cpp +spack add blas +spack add lapack +spack add hdf5@1.10.9 api=v110 +spack add parallel-netcdf@1.12.3 +spack add netcdf-c@4.9+mpi+parallel-netcdf~szip~blosc~zstd + +spack concretize +spack install diff --git a/docs/50_miniem/env--ats4.sh b/docs/50_miniem/env--ats4.sh new file mode 100644 index 0000000..035deda --- /dev/null +++ b/docs/50_miniem/env--ats4.sh @@ -0,0 +1,38 @@ +#!/bin/bash + +module load craype-accel-amd-gfx942 +module load PrgEnv-cray +module load rocm/6.2.1 +module load python + +export LD_LIBRARY_PATH=${CRAY_LD_LIBRARY_PATH}:${LD_LIBRARY_PATH} + +export MPICH_GPU_SUPPORT_ENABLED=1 +export MPICH_OFI_NIC_POLICY=GPU + +### FIXME ### Need a system wide install of libfabric from SHS 11 (or newer) +export LD_LIBRARY_PATH=/usr/workspace/wsb/accept/packages-2024/SHS11_lib:${LD_LIBRARY_PATH} + +export HIP_PATH=`hipconfig -p` +export LD_LIBRARY_PATH=${HIP_PATH}/lib:${LD_LIBRARY_PATH} + +### Tell libfabric to only look for the ROCm runtime, not cuda, etc. 
+export FI_HMEM="rocr" + +# Have malloc() calls use huge pages +export HUGETLB_MORECORE=yes + +# restrict libhugetlbfs to be enabled for these executables only: +export HUGETLB_RESTRICT_EXE="defrag:lmp" + +export HSA_XNACK=1 + +export BUILD_BASE_DIR="` pwd -P `" +export TMPDIR="${BUILD_BASE_DIR}/tmp" +export SPACK_ROOT="${BUILD_BASE_DIR}/spack" +export SPACK_DISABLE_LOCAL_CONFIG=true +export SPACK_USER_CACHE_PATH="${SPACK_ROOT}/${USER}_local_cache" +export SPACK_EDITOR='emacs -nw' +tmppath="${SPACK_ROOT}/bin" +[[ ":$PATH:" != *":${tmppath}:"* ]] && export PATH="${tmppath}:${PATH}" +mkdir -p "${TMPDIR}" diff --git a/docs/50_miniem/env--hops.sh b/docs/50_miniem/env--hops.sh new file mode 100644 index 0000000..89fddd3 --- /dev/null +++ b/docs/50_miniem/env--hops.sh @@ -0,0 +1,15 @@ +#!/bin/sh +module purge +module load cudatoolkit/12.4 +module load gnu/12.2.1 +module load openmpi-gnu/4.1 +export BUILD_BASE_DIR="` pwd -P `" +export OMPI_CXX="${BUILD_BASE_DIR}/Trilinos/packages/kokkos/bin/nvcc_wrapper" +export TMPDIR="${BUILD_BASE_DIR}/tmp" +export SPACK_ROOT="${BUILD_BASE_DIR}/spack" +export SPACK_DISABLE_LOCAL_CONFIG=true +export SPACK_USER_CACHE_PATH="${SPACK_ROOT}/${USER}_local_cache" +export SPACK_EDITOR='emacs -nw' +tmppath="${SPACK_ROOT}/bin" +[[ ":$PATH:" != *":${tmppath}:"* ]] && export PATH="${tmppath}:${PATH}" +mkdir -p "${TMPDIR}" diff --git a/docs/50_miniem/miniem.rst b/docs/50_miniem/miniem.rst index f556aa9..bd45937 100644 --- a/docs/50_miniem/miniem.rst +++ b/docs/50_miniem/miniem.rst @@ -2,29 +2,386 @@ MiniEM ****** +.. note:: + The documentation herein needs to be updated for current + performance. + +This is the documentation for the Future Computing Resource (FCR) FY30 +Benchmark MiniEM. The content herein was created by the following +authors (in alphabetical order). + +- `Anthony M. Agelastos `_ +- `James J. Elliott `_ +- `Christian A. Glusa `_ +- `Roger P. 
Pawlowski `_ + +This material is based upon work supported by the Sandia National Laboratories +(SNL), a multimission laboratory managed and operated by National Technology and +Engineering Solutions of Sandia under the U.S. Department of Energy's National +Nuclear Security Administration under contract DE-NA0003525. Content herein +considered unclassified with unlimited distribution under SAND2023-01069O. + Purpose ======= +MiniEM solves a first order formulation of Maxwell's equations of +electromagnetics. MiniEM is the [Trilinos]_ proxy driver for the +electromagnetics sub-problem solved by EMPIRE and exercises the relevant +Trilinos components (i.e., Tpetra, Belos, MueLu, Ifpack2, Intrepid2, Panzer). + Characteristics =============== -Problems --------- +The goal is to utilize the specified version of MiniEM (see +:ref:`MiniEMApplicationVersion`) that runs the benchmark problem (see +:ref:`MiniEMProblem`) correctly (see :ref:`MiniEMCorrectness` if +changes are made to MiniEM). + + +.. _MiniEMApplicationVersion: + +Application Version +------------------- + +The command to clone is provided below. + +.. literalinclude:: miniem_clone.sh + :language: sh + :lines: 2- + +.. note:: + The Git SHA will be updated with a tag soon. + +The script to clone can be downloaded from :download:`miniem_clone.sh +`. It can also be executed in place to clone into +``docs/50_miniem/miniem``. + +.. code-block:: bash + + cd docs/50_miniem + ./miniem_clone.sh + + +Problem +------- + +The [Maxwell-Large]_ problem given by the input deck "maxwell-large.xml" +describes a uniform mesh of a 3D box which makes it ideal for scaling studies. +The stock input file for this can be found within the Trilinos repository in the +aforementioned link. + +Useful parameters from within this input deck are shown below. + +.. code-block:: + + + 23 + + 28 + + 35 + 36 + 37 + +These parameters are described below. 
+ +``X Elements, Y Elements, Z Elements`` + This sets the size of the problem, which is the product of these 3 + quantities. These parameters are set to other values with the cases shown + herein. These values should be identical for the calculations herein. + Figure of Merit --------------- +Each MiniEM simulation writes out a Figure of Merit (FOM) block to +STDOUT. The relevant portion of this block is shown in the example below. + +.. code-block:: + + ================================= + FOM Calculation + ================================= + Number of cells = 4116000 + Time for Belos Linear Solve = 705.737 seconds + Number of Time Steps (one linear solve per step) = 1541 + FOM ( num_cells * num_steps / solver_time / 1000) = 8987.42 k-cell-steps per second + ================================= + +The number of steps (specified with the ``--numTimeSteps`` command +line option, described below in :ref:`MiniEMRunATS4`) must be large +enough so the time for the Belos Linear Solve is greater than 600 +seconds, i.e., so the solver runs for at least 10 minutes. The figure +of merit (FOM) is the bottom entry in this block, i.e., ``FOM ( +num_cells * num_steps / solver_time / 1000)``. + +It is desired to capture the FOM for varying problem sizes that +encompass utilizing 35% to 75% of available memory (when all PEs are +utilized). The ultimate goal is to maximize this throughput FOM while +utilizing at least 50% of available memory. + + +Correctness Check +----------------- + +MiniEM also provides the [Maxwell-AnalyticSolution]_ problem given by +the input deck "maxwell-analyticSolution.xml". This will output +analytic error values (see below for an example) and will cause the +simulation to fail (and return a non-zero exit code) if it exceeds +appropriate thresholds. This should be used to verify the build of +MiniEM upon the system to assess both the used programming environment +and any changes made to the benchmark. + +..
code-block:: + :emphasize-lines: 2 + + The Belos solver "GMRES block system" of type ""Belos::BlockGmresSolMgr": {Flexible: true, Num Blocks: 10, Maximum Iterations: 10, Maximum Restarts: 20, Convergence Tolerance: 1e-08}" returned a solve status of "SOLVE_STATUS_CONVERGED" in 1 iterations with total CPU time of 0.0189103 sec + L2 Error E maxwell - analyticSolution = 0.0566793 + + * finished time step 6, t = 5e-09 + ************************************************** + +This case can be run simply by following the overall instructions in +:ref:`MiniEMRunning` and replacing the benchmark input file with +"maxwell-analyticSolution.xml". Example output of a failed case is +provided below (also note that this case exited with an exit code of +134). + +.. code-block:: + + what(): /path/to/trilinos/packages/panzer/mini-em/example/BlockPrec/main.cpp:690: + + Throw number = 1 + + Throw test that evaluated to true: !( (std::sqrt(Thyra::get_ele(*g,0))) < (0.065) ) + + Error, (std::sqrt(Thyra::get_ele(*g,0)) = 0.0819696) < (0.065 = 0.065)! FAILED! + terminate called after throwing an instance of 'std::out_of_range' + what(): /path/to/trilinos/packages/panzer/mini-em/example/BlockPrec/main.cpp:690: + + +Permissible Modifications +------------------------- + +The authors of this benchmark invite vendors to propose any +algorithmic improvements that: (1.) do not alter the current Multigrid +solver approach; and (2.) follow the advice given in previous +subsections. Please email the authors with any questions about what is +or is not in scope. Some additional guidance is provided below. + +A minimum of one level of V-cycle is required for both sub-hierarchies +to ensure the Trilinos MueLu Algebraic Multigrid (AMG) code path is +exercised. This behavior is reflected in the benchmark problem and +needs to be preserved with vendor changes. In essence, the solver sets +up two sub-problems, and each is solved using AMG. Example Multigrid +output that demonstrates this is below.
It is appropriate for the +following characteristics of this output to be preserved. + +* ``Scalar`` should be ``double`` (e.g., line 838) +* ``Number of levels`` should be at least ``2`` (e.g., line 839) +* ``Cycle type`` should be ``V`` (e.g., line 842) + +.. code-block:: + + 835 -------------------------------------------------------------------------------- + 836 --- Multigrid Summary RefMaxwell coarse (1,1) --- + 837 -------------------------------------------------------------------------------- + 838 Scalar = double + 839 Number of levels = 2 + 840 Operator complexity = 1.02 + 841 Smoother complexity = 1.07 + 842 Cycle type = V + 843 + 844 level rows nnz nnz/row c ratio procs + 845 0 21510 1840968 85.59 5 + 846 1 687 29525 42.98 31.31 1 + +Additionally, there are a couple of parameters within +"solverMueLu.xml" that should not be altered since changes will impact +the Multigrid work. The specified target size for the coarse grid +problems should not be modified. These parameters are highlighted +below for reference. + +.. code-block:: + :emphasize-lines: 10,12 + + + + + + + + + + + + + + Source code modifications ========================= Please see :ref:`GlobalRunRules` for general guidance on allowed modifications. + Building ======== +MiniEM and Trilinos prefer static over dynamic linking for their +third-party libraries. Instructions for two systems will be provided +below. + +The platforms utilized for benchmarking activities are listed and described below. + +* A GPU build and test system within Sandia National Laboratories + named "hops" (see :ref:`MiniEMCTS2PlusHopsBuild`). This system has + compute nodes with two Intel Xeon Sapphire Rapids processors each + and a total of four Nvidia H100 GPUs. +* El Capitan (see :ref:`MiniEMATS4Build`) + + +.. _MiniEMCTS2PlusHopsBuild: + +Hops +---- + +Environment +^^^^^^^^^^^ + +Change to a relevant environment. + +.. code-block:: sh + + # source script to alter environment + .
env--hops.sh + +This script is replicated below for posterity. + +.. literalinclude:: env--hops.sh + :language: sh + :lines: 2- + + +Spack +^^^^^ + +The following script will clone Spack and add it to the environment. + +.. code-block:: sh + + # clone Spack and add it to the environment + ./spack--hops.sh + +This script is replicated below for posterity. + +.. literalinclude:: spack--hops.sh + :language: sh + :lines: 2- + + +TPLs +^^^^ + +The following script will build the third-party libraries for Trilinos +and, by extension, MiniEM. + +.. code-block:: sh + + # build TPLs + ./build--hops.sh + +This script is replicated below for posterity. + +.. literalinclude:: build--hops.sh + :language: sh + :lines: 2- + + +MiniEM +^^^^^^ + +The following script will build Trilinos and MiniEM once their +dependencies are taken care of. This directly leverages Trilinos' +CMake build system. + +.. code-block:: sh + + # build Trilinos/MiniEM + ./trilinos--hops.sh + +This script can be quite long. It is replicated below +(:ref:`MiniEMBuildScriptsCTS2PlusHops`) for posterity and can be +easily downloaded (:download:`trilinos--hops.sh <trilinos--hops.sh>`). + + +.. _MiniEMATS4Build: + +El Capitan +---------- + +The El Capitan instructions are slightly more complicated due to +difficulties with building Trilinos' TPLs in an appropriate manner +for static linking. Accordingly, the TPL stack was built and leveraged +by the bulk of SNL code teams that use Trilinos. This stack will be +regenerated in a reproducible fashion soon. Until then, its existence +is required. + +Environment +^^^^^^^^^^^ + +Change to a relevant environment. + +.. code-block:: sh + + # source script to alter environment + . env--ats4.sh + +This script is replicated below for posterity. + +.. literalinclude:: env--ats4.sh + :language: sh + :lines: 2- + +Spack +^^^^^ + +The TPL stack can be built via Spack. Specific patching for El Capitan +is being created in a reproducible fashion. + +..
note:: + This will be updated once the Spack recipe is reproducible. + +TPLs +^^^^ + +The TPL stack can be built via Spack. Specific patching for El Capitan +is being created in a reproducible fashion. + +.. note:: + This will be updated once the Spack recipe is reproducible. + +MiniEM +^^^^^^ + +The following script will build Trilinos and MiniEM once their +dependencies are taken care of. This directly leverages Trilinos' +CMake build system. + +.. code-block:: sh + + # build Trilinos/MiniEM + ./trilinos--ats4.sh + +.. note:: + This will be updated for referencing one's own TPLs soon. + +This script can be quite long. It is replicated below +(:ref:`MiniEMBuildScriptsATS4`) for posterity and can be +easily downloaded (:download:`trilinos--ats4.sh <trilinos--ats4.sh>`). + Running ======= @@ -50,5 +407,43 @@ Weak Scaling on El Capitan ========================== +Trilinos Build Scripts +====================== + + +.. _MiniEMBuildScriptsCTS2PlusHops: + +Hops +---- + +.. literalinclude:: trilinos--hops.sh + :language: sh + :lines: 2- + + +.. _MiniEMBuildScriptsATS4: + +El Capitan +---------- + +.. literalinclude:: trilinos--ats4.sh + :language: sh + :lines: 2- + + References ========== + +.. [Trilinos] M. A. Heroux and R. A. Bartlett and V. E. Howle and R. J. Hoekstra + and J. J. Hu and T. G. Kolda and R. B. Lehoucq and K. R. Long + and R. P. Pawlowski and E. T. Phipps and A. G. Salinger and H. K. + Thornquist and R. S. Tuminaro and J. M. Willenbring and A. + Williams and K. S. Stanley, 'An Overview of the Trilinos Project', + 2005, ACM Trans. Math. Softw., Volume 31, No. 3, ISSN 0098-3500. +.. [TrilinosBuild] R. A. Bartlett, 'Trilinos Configure, Build, Test, and Install + Reference Guide', 2023. [Online]. Available: + https://docs.trilinos.org/files/TrilinosBuildReference.html. + [Accessed: 26- Mar- 2023] +.. [Maxwell-Large] Trilinos developers, 'maxwell-large.xml', 2024. [Online].
Available: https://github.com/trilinos/Trilinos/blob/master/packages/panzer/mini-em/example/BlockPrec/maxwell-large.xml. [Accessed: 22- Feb- 2024] +.. [Maxwell-AnalyticSolution] Trilinos developers, 'maxwell-analyticSolution.xml', 2024. [Online]. Available: https://github.com/trilinos/Trilinos/blob/master/packages/panzer/mini-em/example/BlockPrec/maxwell-analyticSolution.xml. [Accessed: 22- Feb- 2024] +.. [Intel-8260] Intel. 'Intel Xeon Platinum 8260 Processor 35.75M Cache 2.40 GHz Product Specifications', 2024. [Online]. Available: https://ark.intel.com/content/www/us/en/ark/products/192474/intel-xeon-platinum-8260-processor-35-75m-cache-2-40-ghz.html. [Accessed: 18- Mar- 2024] diff --git a/docs/50_miniem/miniem_clone.sh b/docs/50_miniem/miniem_clone.sh new file mode 100755 index 0000000..ef745e8 --- /dev/null +++ b/docs/50_miniem/miniem_clone.sh @@ -0,0 +1,5 @@ +#!/bin/sh +git clone --branch develop git@github.com:trilinos/Trilinos miniem +cd miniem +git checkout e3f3708c16b9cf2a357c34b5e385c87bcb7883bf + diff --git a/docs/50_miniem/spack--hops.sh b/docs/50_miniem/spack--hops.sh new file mode 100755 index 0000000..cc3d541 --- /dev/null +++ b/docs/50_miniem/spack--hops.sh @@ -0,0 +1,4 @@ +#!/bin/sh +if test ! -d "${SPACK_ROOT}" ; then + git clone --branch v1.1.1 git@github.com:spack/spack "${SPACK_ROOT}" +fi diff --git a/docs/50_miniem/trilinos--ats4.sh b/docs/50_miniem/trilinos--ats4.sh new file mode 100755 index 0000000..9ce7d73 --- /dev/null +++ b/docs/50_miniem/trilinos--ats4.sh @@ -0,0 +1,158 @@ +#!/bin/sh + +# go into Spack environment +. 
"${SPACK_ROOT}/share/spack/setup-env.sh" +spack cd -e miniem-ats4-env +spacktivate -p miniem-ats4-env + +export TRILINOS_SRC_DIR="${BUILD_BASE_DIR}/Trilinos" +export TRILINOS_BUILD_DIR="${BUILD_BASE_DIR}/Trilinos-build" + +mkdir -p "${TRILINOS_BUILD_DIR}" +pushd "${TRILINOS_BUILD_DIR}" + +rm -rf CMake* +cmake \ + "-GNinja" \ + "-DPYTHON_EXECUTABLE=/usr/tce/bin/python3" \ + "-DCMAKE_BUILD_TYPE:STRING=Release" \ + "-DTrilinos_ENABLE_TrilinosBuildStats=OFF" \ + "-DTrilinos_ENABLE_BUILD_STATS=OFF" \ + "-DTrilinosBuildStats_ENABLE_TESTS=OFF" \ + "-DBUILD_SHARED_LIBS:BOOL=OFF" \ + "-DTrilinos_ENABLE_Teuchos=ON" \ + "-DPercept_ENABLE_TESTS=OFF" \ + "-DTrilinos_ENABLE_Panzer=ON" \ + "-DTrilinos_ENABLE_Percept=ON" \ + "-DIntrepid2_ENABLE_TESTS=OFF" \ + "-DTrilinos_ENABLE_PanzerMiniEM=ON" \ + "-DPanzerMiniEM_ENABLE_EXAMPLES=ON" \ + "-DPanzerMiniEM_ENABLE_TESTS=ON" \ + "-DIfpack2_ENABLE_EXAMPLES=ON" \ + "-DTpetra_INST_SERIAL:BOOL=OFF" \ + "-DKokkos_ENABLE_OPENMP:BOOL=OFF" \ + "-DTpetra_INST_OPENMP:BOOL=OFF" \ + "-DTrilinos_ENABLE_OpenMP:BOOL=OFF" \ + "-DKokkos_ENABLE_HIP:BOOL=ON" \ + "-DTpetra_INST_HIP:BOOL=ON" \ + "-DKOKKOSKERNELS_ENABLE_TPL_BLAS:BOOL=ON" \ + "-DKOKKOSKERNELS_ENABLE_TPL_LAPACK:BOOL=ON" \ + "-DSacado_ENABLE_HIERARCHICAL_DFAD=ON" \ + "-DKokkos_ARCH_AMD_GFX942_APU:BOOL=ON" \ + "-DKokkos_ARCH_NATIVE:BOOL=ON" \ + "-DCMAKE_EXE_LINKER_FLAGS=--offload-new-driver -x none --hip-link -Wl,--image-base=0x20000000 -Wl,-z,common-page-size=0x200000 -Wl,-z,max-page-size=0x200000 -Wl,--whole-archive,-lhugetlbfs,--no-whole-archive " \ + "-DCMAKE_SHARED_LINKER_FLAGS=--offload-new-driver -x none --hip-link -Wl,--image-base=0x20000000 -Wl,-z,common-page-size=0x200000 -Wl,-z,max-page-size=0x200000 -Wl,--whole-archive,-lhugetlbfs,--no-whole-archive " \ + "-DFC_FN_UNDERSCORE=UNDER" \ + "-DCMAKE_CXX_COMPILER=/opt/cray/pe/mpich/9.0.1/ofi/amd/6.0/bin/mpicxx" \ + "-DCMAKE_C_COMPILER=/opt/cray/pe/mpich/9.0.1/ofi/amd/6.0/bin/mpicc" \ + 
"-DCMAKE_Fortran_COMPILER=/opt/cray/pe/mpich/9.0.1/ofi/amd/6.0/bin/mpif90" \ + "-DCMAKE_CXX_FLAGS=--offload-new-driver -x hip -mllvm -amdgpu-early-inline-all=false -mllvm -amdgpu-function-calls=false -g " \ + "-DCMAKE_Fortran_FLAGS=" \ + "-DCMAKE_C_FLAGS=" \ + "-DCMAKE_LINKER=/opt/cray/pe/mpich/9.0.1/ofi/amd/6.0/bin/mpicxx" \ + "-DTrilinos_EXTRA_LINK_FLAGS=-L/opt/cray/pe/mpich/9.0.1/ofi/amd/6.0/lib -Wl,-rpath,/opt/cray/pe/mpich/9.0.1/ofi/amd/6.0/lib -lmpi_amd -lxpmem -L/opt/cray/pe/mpich/9.0.1/gtl/lib -Wl,-rpath,/opt/cray/pe/mpich/9.0.1/gtl/lib -lmpi_gtl_hsa -L/opt/rocm-6.4.3/lib -Wl,-rpath,/opt/rocm-6.4.3/lib -Wl,-rpath,/opt/rocm-6.4.3/llvm/lib -Wl,--disable-new-dtags,--as-needed,-lpthread,-lm,--no-as-needed" \ + "-DCMAKE_CXX_STANDARD=20" \ + "-DTrilinos_ENABLE_Fortran:BOOL=OFF" \ + "-DAztecOO_C_FLAGS=-Wno-implicit-function-declaration" \ + "-DTrilinos_ENABLE_TrilinosATDMConfigTests:BOOL=OFF" \ + "-DTrilinos_ENABLE_TrilinosFrameworkTests=OFF" \ + "-DTrilinos_ENABLE_Isorropia=OFF" \ + "-DTrilinos_ENABLE_KokkosExample=OFF" \ + "-DTrilinos_ENABLE_Domi=OFF" \ + "-DTrilinos_ENABLE_Pliris=OFF" \ + "-DTrilinos_ENABLE_Komplex=OFF" \ + "-DTrilinos_ENABLE_FEI=OFF" \ + "-DTrilinos_ENABLE_TriKota=OFF" \ + "-DTrilinos_ENABLE_Compadre=OFF" \ + "-DTrilinos_ENABLE_Moertel=OFF" \ + "-DTrilinos_ENABLE_Stokhos=OFF" \ + "-DTrilinos_ENABLE_MOOCHO=OFF" \ + "-DTrilinos_ENABLE_PyTrilinos=OFF" \ + "-DTrilinos_ENABLE_TrilinosCouplings=OFF" \ + "-DTrilinos_ENABLE_Pike=OFF" \ + "-DTrilinos_ENABLE_Krino=OFF" \ + "-DShyLU_DD_ENABLE_BDDC=OFF" \ + "-DTrilinos_ENABLE_PyTrilinos=OFF" \ + "-DTrilinos_ENABLE_ThyraEpetraExtAdapters=OFF" \ + "-DTrilinos_ENABLE_ThyraEpetraAdapters=OFF" \ + "-DTrilinos_ENABLE_ML=OFF" \ + "-DTrilinos_ENABLE_Ifpack=OFF" \ + "-DTrilinos_ENABLE_EpetraExt=OFF" \ + "-DTrilinos_ENABLE_Epetra=OFF" \ + "-DTrilinos_ENABLE_AztecOO=OFF" \ + "-DTrilinos_ENABLE_Amesos=OFF" \ + "-DROL_ENABLE_TESTS=OFF" \ + "-DROL_ENABLE_EXAMPLES=OFF" \ + "-DTPL_ENABLE_Gtest=OFF" \ + 
"-DTrilinos_ENABLE_Gtest=OFF" \ + "-DTPL_ENABLE_gtest=OFF" \ + "-DTrilinos_ENABLE_gtest=OFF" \ + "-DKOKKOSKERNELS_TPL_BLAS_RETURN_COMPLEX=OFF" \ + "-DTacho_ENABLE_INT_INT:BOOL=ON" \ + "-DMATH_LIBRARY_IS_SUPPLIED:BOOL=TRUE" \ + "-DTPL_ENABLE_BinUtils:BOOL=OFF" \ + "-DBinUtils_INCLUDE_DIRS=/include" \ + "-DBinUtils_LIBRARY_DIRS=/lib" \ + "-DTPL_ENABLE_BLAS:BOOL=ON" \ + "-DTPL_ENABLE_LAPACK:BOOL=ON" \ + "-DBLAS_LIBRARY_NAMES=openblas;omp;pthread" \ + "-DBLAS_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/openblas-0.3.26-7ous25omfpnyeakkmkkcuj5yo2flwbz2/include" \ + "-DBLAS_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/openblas-0.3.26-7ous25omfpnyeakkmkkcuj5yo2flwbz2/lib" \ + "-DLAPACK_LIBRARY_NAMES=openblas;omp;pthread" \ + "-DLAPACK_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/openblas-0.3.26-7ous25omfpnyeakkmkkcuj5yo2flwbz2/include" \ + "-DLAPACK_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/openblas-0.3.26-7ous25omfpnyeakkmkkcuj5yo2flwbz2/lib" \ + "-DTPL_ENABLE_Boost:BOOL=ON" \ + "-DTPL_ENABLE_BoostLib:BOOL=ON" \ + "-DBoost_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/boost-1.84.0-s6nrdx55cgkb7nrn7egjj6vghowza7go/include" \ + "-DBoost_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/boost-1.84.0-s6nrdx55cgkb7nrn7egjj6vghowza7go/lib" \ + "-DBoostLib_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/boost-1.84.0-s6nrdx55cgkb7nrn7egjj6vghowza7go/include" \ + "-DBoostLib_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/boost-1.84.0-s6nrdx55cgkb7nrn7egjj6vghowza7go/lib" \ + "-DTPL_ENABLE_METIS:BOOL=ON" \ + "-DTPL_ENABLE_ParMETIS:BOOL=ON" \ + 
"-DMETIS_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/metis-5.1.0-sonspt6l325bwlxz6vs5e5kp3wy2t27v/include" \ + "-DMETIS_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/metis-5.1.0-sonspt6l325bwlxz6vs5e5kp3wy2t27v/lib" \ + "-DParMETIS_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/parmetis-4.0.3-7me2x3yqtsqjusxnob2tj5ydgevs7d2v/include;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/metis-5.1.0-sonspt6l325bwlxz6vs5e5kp3wy2t27v/include" \ + "-DParMETIS_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/parmetis-4.0.3-7me2x3yqtsqjusxnob2tj5ydgevs7d2v/lib;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/metis-5.1.0-sonspt6l325bwlxz6vs5e5kp3wy2t27v/lib" \ + "-DTPL_ENABLE_CGNS:BOOL=ON" \ + "-DCGNS_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/cgns-4.4.0-wdqq2fnyhjgws4qr52civhekb5bxmjow/include" \ + "-DCGNS_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/cgns-4.4.0-wdqq2fnyhjgws4qr52civhekb5bxmjow/lib" \ + "-DTPL_ENABLE_HDF5:BOOL=ON" \ + "-DHDF5_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/hdf5-1.10.7-dact4arqw6rnvz363lp27fvl3zaorg4p/lib;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/zlib-ng-2.1.6-txnpxomrj6vzuhydnyjnuoalr2uag762/lib" \ + "-DHDF5_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/hdf5-1.10.7-dact4arqw6rnvz363lp27fvl3zaorg4p/include" \ + "-DHDF5_LIBRARY_NAMES=hdf5_hl;hdf5;z;dl" \ + "-DTPL_ENABLE_Netcdf:BOOL=ON" \ + 
"-DNetcdf_LIBRARY_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/zlib-ng-2.1.6-txnpxomrj6vzuhydnyjnuoalr2uag762/lib;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/boost-1.84.0-s6nrdx55cgkb7nrn7egjj6vghowza7go/lib;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/netcdf-c-4.9.2-hocnq5daqf5ei4uutejwr4wih4rmy72f/lib;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/parallel-netcdf-1.12.3-ukjcb2hshjspzan677qx2267rf6vrny2/lib;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/hdf5-1.10.7-dact4arqw6rnvz363lp27fvl3zaorg4p/lib;/lib" \ + "-DNetcdf_LIBRARY_NAMES=netcdf;pnetcdf;z;hdf5_hl;hdf5" \ + "-DNetcdf_INCLUDE_DIRS=/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/netcdf-c-4.9.2-hocnq5daqf5ei4uutejwr4wih4rmy72f/include;/tscratch/jjellio/trilinos-dev/spack/nov-25-2025/install/linux-rhel8-zen3/rocmcc-6.4.3/parallel-netcdf-1.12.3-ukjcb2hshjspzan677qx2267rf6vrny2/include" \ + "-DTPL_ENABLE_SuperLUDist:BOOL=OFF" \ + "-DSuperLUDist_INCLUDE_DIRS=/include" \ + "-DSuperLUDist_LIBRARY_DIRS=/lib" \ + "-DTPL_ENABLE_Matio=OFF" \ + "-DTPL_ENABLE_X11=OFF" \ + "-DMPI_EXEC_NUMPROCS_FLAG=run;-x;-N;1;-n" \ + "-DMPI_EXEC=flux" \ + "-DTPL_ENABLE_MPI:BOOL=ON" \ + "-DMPI_USE_COMPILER_WRAPPERS=OFF" \ + "-DTPL_ENABLE_DLlib:BOOL=ON" \ + "-DDLlib_INCLUDE_DIRS=/opt/rocm-6.4.3/include" \ + "-DDLlib_LIBRARY_DIRS=/opt/rocm-6.4.3/lib" \ + "-DDLlib_LIBRARY_NAMES=dl;m" \ + "-DKOKKOSKERNELS_ENABLE_TPL_ROCBLAS:BOOL=ON" \ + "-DTPL_ENABLE_ROCBLAS:BOOL=ON" \ + "-DROCBLAS_INCLUDE_DIRS=/opt/rocm-6.4.3/include" \ + "-DROCBLAS_LIBRARY_DIRS=/opt/rocm-6.4.3/lib" \ + "-DTrilinos_ENABLE_ShyLU_NodeTacho=OFF" \ + "-DKOKKOSKERNELS_ENABLE_TPL_ROCSPARSE:BOOL=ON" \ + "-DTPL_ENABLE_ROCSPARSE:BOOL=ON" \ + "-DROCSPARSE_INCLUDE_DIRS=/opt/rocm-6.4.3/include" \ + 
"-DROCSPARSE_LIBRARY_DIRS=/opt/rocm-6.4.3/lib" \ + "-DCMAKE_INSTALL_PREFIX=/tscratch/amagela/fcr/miniem/install/amd-6.4.3_prgenv-amd_rocm-6.4.3_mpich-9.0.1_pure-amd_hip_amd-NOinlall-NOfunc-gfx942_devtpls_opt-g_cxx20_libonly_static/trilinos" \ +"${TRILINOS_SRC_DIR}" 2>&1 | tee configure_trilinos_performance.log + +## Prevents re-configure after a new configure. +touch build.ninja rules.ninja + +ninja -j 32 +ninja -j 8 # NOTE(review): second pass at lower parallelism; presumably retries targets that failed above; confirm + +popd diff --git a/docs/50_miniem/trilinos--hops.sh b/docs/50_miniem/trilinos--hops.sh new file mode 100755 index 0000000..5231a89 --- /dev/null +++ b/docs/50_miniem/trilinos--hops.sh @@ -0,0 +1,152 @@ +#!/bin/sh + +# go into Spack environment +. "${SPACK_ROOT}/share/spack/setup-env.sh" +spack cd -e miniem-hops-env +spacktivate -p miniem-hops-env + +export TRILINOS_SRC_DIR="${BUILD_BASE_DIR}/Trilinos" +export TRILINOS_BUILD_DIR="${BUILD_BASE_DIR}/Trilinos-build" + +# get Trilinos if necessary +if test ! -d "${TRILINOS_SRC_DIR}" ; then + git clone --branch develop git@github.com:trilinos/Trilinos "${TRILINOS_SRC_DIR}" +fi + +# This is set in the load_spack_cuda.sh file.
+export OMPI_CXX="${TRILINOS_SRC_DIR}/packages/kokkos/bin/nvcc_wrapper" + +mkdir -p "${TRILINOS_BUILD_DIR}" +pushd "${TRILINOS_BUILD_DIR}" + +rm -rf CMake* # clear any CMake* entries already present in the build directory before configuring +cmake \ + -D Teuchos_ENABLE_DEBUG_RCP_NODE_TRACING=OFF \ + -G Ninja \ + -D Trilinos_ENABLE_Fortran:BOOL=OFF \ + -D PYTHON_EXECUTABLE:FILEPATH=python3 \ + -D CMAKE_INSTALL_PREFIX="$BUILD_BASE_DIR/install-trilinos" \ + -D Trilinos_ENABLE_EXPLICIT_INSTANTIATION:BOOL=ON \ + -D CMAKE_CXX_STANDARD="20" \ + -D Trilinos_ENABLE_CHECKED_STL:BOOL=OFF \ + -D Trilinos_ENABLE_TEUCHOS_TIME_MONITOR:BOOL=ON \ + -D Panzer_ENABLE_TEUCHOS_TIME_MONITOR:BOOL=ON \ + -D NOX_ENABLE_TEUCHOS_TIME_MONITOR:BOOL=ON \ + -D NOX_BUILD_PRERELEASE=ON \ + \ + -D NOX_ENABLE_TESTS=OFF \ + -D NOX_ENABLE_EXAMPLES=OFF \ + \ + -D Trilinos_ENABLE_INSTALL_CMAKE_CONFIG_FILES:BOOL=ON \ + -D Trilinos_ENABLE_ALL_PACKAGES:BOOL=OFF \ + -D Trilinos_ENABLE_ALL_OPTIONAL_PACKAGES:BOOL=OFF \ + -D Trilinos_ENABLE_EXAMPLES:BOOL=OFF \ + -D Trilinos_ENABLE_TESTS:BOOL=OFF \ + -D EpetraExt_ENABLE_HDF5:BOOL=OFF \ + -D Teuchos_ENABLE_FLOAT:BOOL=OFF \ + -D Teuchos_ENABLE_COMPLEX:BOOL=OFF \ + -D Teuchos_KOKKOS_PROFILING:BOOL=ON \ + -D Kokkos_ENABLE_PROFILING:BOOL=ON \ + -D Tpetra_INST_FLOAT:BOOL=OFF \ + -D Tpetra_INST_COMPLEX_FLOAT:BOOL=OFF \ + -D Tpetra_INST_COMPLEX_DOUBLE:BOOL=OFF \ + -D Tpetra_INST_INT_INT:BOOL=OFF \ + -D Xpetra_ENABLE_Epetra:BOOL=OFF \ + -D MueLu_ENABLE_Epetra:BOOL=OFF \ + -D Piro_ENABLE_MueLu:BOOL=OFF \ + -D SEACASExodus_ENABLE_MPI:BOOL=OFF \ + -D Trilinos_ENABLE_SEACASExodiff=ON \ + -D Trilinos_ENABLE_SEACASEpu=ON \ + -D Trilinos_ENABLE_SEACASNemspread=ON \ + -D Trilinos_ENABLE_SEACASNemslice=ON \ + -D Trilinos_ENABLE_SEACASAprepro:BOOL=ON \ + -D Trilinos_ENABLE_KokkosCore:BOOL=ON \ + -D Trilinos_ENABLE_KokkosAlgorithms:BOOL=ON \ + -D Trilinos_ENABLE_Tempus:BOOL=OFF \ + -D Trilinos_ENABLE_Zoltan2:BOOL=ON \ + -D Trilinos_ENABLE_Xpetra=ON \ + -D Trilinos_ENABLE_MueLu:BOOL=ON \ + -D MueLu_ENABLE_Kokkos_Refactor:BOOL=ON \ + -D
Xpetra_ENABLE_Kokkos_Refactor:BOOL=ON \ + -D MueLu_ENABLE_Kokkos_Refactor_Use_By_Default:BOOL=ON \ + -D Trilinos_ENABLE_Ifpack2:BOOL=ON \ + -D Trilinos_ENABLE_Amesos2:BOOL=ON \ + -D Amesos2_ENABLE_LAPACK:BOOL=ON \ + -D Amesos2_ENABLE_KLU2:BOOL=ON \ + -D Trilinos_ENABLE_Pamgen:BOOL=ON \ + -D Intrepid2_ENABLE_TESTS=OFF \ + -D Phalanx_SHOW_DEPRECATED_WARNINGS:BOOL=ON \ + -D Phalanx_ENABLE_DEVICE_DAG=OFF \ + -D Phalanx_ENABLE_TESTS=OFF \ + -D Trilinos_ENABLE_Panzer:BOOL=ON \ + -D Trilinos_ENABLE_PanzerExprEval=ON \ + -D Sacado_ENABLE_HIERARCHICAL_DFAD=ON \ + -D Panzer_ENABLE_HESSIAN_SUPPORT:BOOL=OFF \ + -D Panzer_ENABLE_TESTS:BOOL=ON \ + -D Panzer_ENABLE_EXAMPLES:BOOL=ON \ + -D Trilinos_ENABLE_Percept=ON \ + -D Trilinos_ENABLE_SECONDARY_TESTED_CODE:BOOL=ON \ + -D Trilinos_ENABLE_TriKota:BOOL=OFF \ + -D TPL_ENABLE_MPI:BOOL=ON \ + -D MPI_EXEC_POST_NUMPROCS_FLAGS="-bind-to;None" \ + -D TPL_ENABLE_Boost:BOOL=OFF \ + -D TPL_ENABLE_HDF5:BOOL=ON \ + -D HDF5_INCLUDE_DIRS="$(spack location -i hdf5)/include" \ + -D HDF5_LIBRARY_DIRS="$(spack location -i hdf5)/lib64" \ + -D TPL_ENABLE_Zlib:BOOL=ON \ + -D TPL_ENABLE_Netcdf:BOOL=ON \ + -DTPL_ENABLE_Matio=OFF \ + -DTPL_ENABLE_X11=OFF \ + -D CMAKE_CXX_COMPILER:FILEPATH="mpicxx" \ + -D CMAKE_C_COMPILER:FILEPATH="mpicc" \ + -D CMAKE_Fortran_COMPILER:FILEPATH="mpifort" \ + -D CMAKE_CXX_FLAGS:STRING="-g1 -Wshadow -Wall -fdiagnostics-color=always -Wno-deprecated-declarations" \ + -D CMAKE_C_FLAGS:STRING="-g1" \ + -D CMAKE_Fortran_FLAGS:STRING="-g1" \ + -D CMAKE_EXE_LINKER_FLAGS:STRING="-lgfortran" \ + -D CMAKE_VERBOSE_MAKEFILE:BOOL=OFF \ + -D Trilinos_VERBOSE_CONFIGURE:BOOL=OFF \ + -D CMAKE_BUILD_TYPE:STRING=Release \ + -D Trilinos_ENABLE_DEBUG=OFF \ + -D Trilinos_ENABLE_DEBUG_SYMBOLS:BOOL=OFF \ + -D Kokkos_ENABLE_DEBUG:BOOL=OFF \ + -D Phalanx_ENABLE_DEBUG=OFF \ + -D BUILD_SHARED_LIBS:BOOL=OFF \ + -D Trilinos_ENABLE_COVERAGE_TESTING:BOOL=OFF \ + -D Trilinos_ENABLE_OpenMP:BOOL=OFF \ + -D Tpetra_ENABLE_CUDA=ON \ + -D Tpetra_INST_CUDA=ON \ +
-D Tpetra_INST_SERIAL=ON \ + -D TPL_ENABLE_CUDA=ON \ + -D TPL_ENABLE_CUSPARSE=ON \ + -D CUDA_cublas_LIBRARY="${CUDA_LIBS}/libcublas.so" \ + -D CUDA_cusparse_LIBRARY="${CUDA_LIBS}/libcusparse.so" \ + -D CUDA_cusolver_LIBRARY="${CUDA_LIBS}/libcusolver.so" \ + -D CUDA_cufft_LIBRARY="${CUDA_LIBS}/libcufft.so" \ + -D Kokkos_ENABLE_CUDA=ON \ + -D Kokkos_ENABLE_DEBUG_BOUNDS_CHECK=OFF \ + -D Kokkos_ENABLE_CUDA_RELOCATABLE_DEVICE_CODE=ON \ + -D Kokkos_ARCH_HOPPER90=ON \ + \ + -D Trilinos_PARALLEL_LINK_JOBS_LIMIT=12 \ + \ + -D TPL_ENABLE_HDF5=ON \ + -D TPL_ENABLE_Netcdf:BOOL=ON \ + \ + -D Trilinos_AUTOGENERATE_TEST_RESOURCE_FILE=OFF \ + -D Trilinos_CUDA_NUM_GPUS=4 \ + -D Trilinos_CUDA_SLOTS_PER_GPU=3 \ + \ + -D Panzer_ADD_EXPENSIVE_CUDA_TESTS=ON \ + -D TPL_ENABLE_gtest=OFF \ + \ + "${TRILINOS_SRC_DIR}" + +## Prevents re-configure after a new configure. +touch build.ninja rules.ninja + +ninja -j 32 +ninja -j 8 # NOTE(review): second pass at lower parallelism; presumably retries targets that failed above; confirm + +popd +