***** Summary of parameters
ARCH : IBM
PLATFORM : SNOW_xlf90
TIMING_FACTOR : 3
NUM_TRY : 3
NUM_ITER : 256
DELAY : 10.00000 ms
WORK TIMER RES : 0.00100 ms
SCH_LOOP_CNT : 32
MIN_OVERHEAD(%) : 15
MIN_TIMING : 1 seconds
MY_LONG_MAX : 999999999
max_num_threads : 8
***** Start Testing : !$OMP atomic
-- iter_facotr : 500
-- try_count : 1
-- delay_time : 0.003333 ms
-- Running Reference case
WC Timing = 1.269667 second
Standard deviation = 0.010965 second
CPU Timing = 1.268333 second
Standard deviation = 0.010069 second
-- Testing 8 threads
WC Timing = 5.656667 second
Standard deviation = 0.007717 second
WC overhead = 4.387000 second
Standard deviation = 0.013408 second
WC overhead/iter = 0.034273 ms
WC overhead(%) wrt reference = 345.523755
CPU Timing = 5.644583 second
Standard deviation = 0.008186 second
CPU overhead = 4.376250 second
Standard deviation = 0.012977 second
CPU overhead/iter = 0.034189 ms
CPU overhead(%) wrt reference = 345.039446
-- Running Reference case
WC Timing = 1.290667 second
Standard deviation = 0.014267 second
CPU Timing = 1.291668 second
Standard deviation = 0.013592 second
-- Testing 4 threads
WC Timing = 1.691333 second
Standard deviation = 0.014704 second
WC overhead = 0.400667 second
Standard deviation = 0.020488 second
WC overhead/iter = 0.003130 ms
WC overhead(%) wrt reference = 31.043389
CPU Timing = 1.690000 second
Standard deviation = 0.014287 second
CPU overhead = 0.398332 second
Standard deviation = 0.019719 second
CPU overhead/iter = 0.003112 ms
CPU overhead(%) wrt reference = 30.838573
-- Running Reference case
WC Timing = 1.279000 second
Standard deviation = 0.001414 second
CPU Timing = 1.276667 second
Standard deviation = 0.002356 second
-- Testing 2 threads
WC Timing = 1.650667 second
Standard deviation = 0.006799 second
WC overhead = 0.371667 second
Standard deviation = 0.006944 second
WC overhead/iter = 0.002904 ms
WC overhead(%) wrt reference = 29.059161
CPU Timing = 1.649999 second
Standard deviation = 0.007069 second
CPU overhead = 0.373332 second
Standard deviation = 0.007451 second
CPU overhead/iter = 0.002917 ms
CPU overhead(%) wrt reference = 29.242678
-- Running Reference case
WC Timing = 1.298333 second
Standard deviation = 0.011842 second
CPU Timing = 1.293335 second
Standard deviation = 0.009430 second
-- Testing 1 threads
WC Timing = 1.359000 second
Standard deviation = 0.003742 second
WC overhead = 0.060667 second
Standard deviation = 0.012419 second
WC overhead/iter = 0.000474 ms
WC overhead(%) wrt reference = 4.672657
CPU Timing = 1.360001 second
Standard deviation = 0.000000 second
CPU overhead = 0.066666 second
Standard deviation = 0.009430 second
CPU overhead/iter = 0.000521 ms
CPU overhead(%) wrt reference = 5.154554
***** Finished


*******************************
* ELAPSE TIME = 46.498001
*******************************



***** Start Testing : !$OMP barrier
-- iter_facotr : 180
-- try_count : 1
-- delay_time : 0.016667 ms
-- Running Reference case
WC Timing = 1.152000 second
Standard deviation = 0.007257 second
CPU Timing = 9.209997 second
Standard deviation = 0.057149 second
-- Testing 8 threads
WC Timing = 2.111000 second
Standard deviation = 0.014445 second
WC overhead = 0.959000 second
Standard deviation = 0.016166 second
WC overhead/iter = 0.020812 ms
WC overhead(%) wrt reference = 83.246530
CPU Timing = 16.870010 second
Standard deviation = 0.104251 second
CPU overhead = 7.660014 second
Standard deviation = 0.118888 second
CPU overhead/iter = 0.166233 ms
CPU overhead(%) wrt reference = 83.170648
-- Running Reference case
WC Timing = 1.158000 second
Standard deviation = 0.005657 second
CPU Timing = 4.633331 second
Standard deviation = 0.026235 second
-- Testing 4 threads
WC Timing = 1.736667 second
Standard deviation = 0.018661 second
WC overhead = 0.578667 second
Standard deviation = 0.019499 second
WC overhead/iter = 0.012558 ms
WC overhead(%) wrt reference = 49.971213
CPU Timing = 6.943329 second
Standard deviation = 0.082620 second
CPU overhead = 2.309998 second
Standard deviation = 0.086685 second
CPU overhead/iter = 0.050130 ms
CPU overhead(%) wrt reference = 49.856084
-- Running Reference case
WC Timing = 1.132000 second
Standard deviation = 0.002160 second
CPU Timing = 2.263346 second
Standard deviation = 0.004719 second
-- Testing 2 threads
WC Timing = 1.540667 second
Standard deviation = 0.002625 second
WC overhead = 0.408667 second
Standard deviation = 0.003399 second
WC overhead/iter = 0.008869 ms
WC overhead(%) wrt reference = 36.101294
CPU Timing = 3.076660 second
Standard deviation = 0.012495 second
CPU overhead = 0.813314 second
Standard deviation = 0.013357 second
CPU overhead/iter = 0.017650 ms
CPU overhead(%) wrt reference = 35.934129
-- Running Reference case
WC Timing = 1.139000 second
Standard deviation = 0.002944 second
CPU Timing = 1.139994 second
Standard deviation = 0.000014 second
-- Testing 1 threads
WC Timing = 1.150000 second
Standard deviation = 0.007118 second
WC overhead = 0.011000 second
Standard deviation = 0.007703 second
WC overhead/iter = 0.000239 ms
WC overhead(%) wrt reference = 0.965758
CPU Timing = 1.150004 second
Standard deviation = 0.008173 second
CPU overhead = 0.010010 second
Standard deviation = 0.008173 second
CPU overhead/iter = 0.000217 ms
CPU overhead(%) wrt reference = 0.878054
***** Finished


*******************************
* ELAPSE TIME = 33.428001
*******************************



***** Start Testing : !$OMP critical
-- iter_facotr : 15000
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.271667 second
Standard deviation = 0.008014 second
CPU Timing = 10.163340 second
Standard deviation = 0.068477 second
-- Testing 8 threads
WC Timing = 7.465667 second
Standard deviation = 0.005907 second
WC overhead = 6.194000 second
Standard deviation = 0.009955 second
WC overhead/iter = 0.000538 ms
WC overhead(%) wrt reference = 487.077320
CPU Timing = 59.683350 second
Standard deviation = 0.047832 second
CPU overhead = 49.520009 second
Standard deviation = 0.083529 second
CPU overhead/iter = 0.004299 ms
CPU overhead(%) wrt reference = 487.241479
-- Running Reference case
WC Timing = 1.271000 second
Standard deviation = 0.007789 second
CPU Timing = 5.086629 second
Standard deviation = 0.030956 second
-- Testing 4 threads
WC Timing = 7.452333 second
Standard deviation = 0.000471 second
WC overhead = 6.181333 second
Standard deviation = 0.007803 second
WC overhead/iter = 0.000537 ms
WC overhead(%) wrt reference = 486.336211
CPU Timing = 29.806722 second
Standard deviation = 0.009437 second
CPU overhead = 24.720093 second
Standard deviation = 0.032362 second
CPU overhead/iter = 0.002146 ms
CPU overhead(%) wrt reference = 485.981809
-- Running Reference case
WC Timing = 1.271000 second
Standard deviation = 0.007789 second
CPU Timing = 2.540039 second
Standard deviation = 0.014156 second
-- Testing 2 threads
WC Timing = 7.461667 second
Standard deviation = 0.012970 second
WC overhead = 6.190667 second
Standard deviation = 0.015129 second
WC overhead/iter = 0.000537 ms
WC overhead(%) wrt reference = 487.070543
CPU Timing = 14.920003 second
Standard deviation = 0.028427 second
CPU overhead = 12.379964 second
Standard deviation = 0.031757 second
CPU overhead/iter = 0.001075 ms
CPU overhead(%) wrt reference = 487.392669
-- Running Reference case
WC Timing = 1.270333 second
Standard deviation = 0.008260 second
CPU Timing = 1.269938 second
Standard deviation = 0.008273 second
-- Testing 1 threads
WC Timing = 7.449333 second
Standard deviation = 0.000471 second
WC overhead = 6.179000 second
Standard deviation = 0.008273 second
WC overhead/iter = 0.000536 ms
WC overhead(%) wrt reference = 486.407769
CPU Timing = 7.450033 second
Standard deviation = 0.000115 second
CPU overhead = 6.180094 second
Standard deviation = 0.008274 second
CPU overhead/iter = 0.000536 ms
CPU overhead(%) wrt reference = 486.645306
***** Finished


*******************************
* ELAPSE TIME = 391.950989
*******************************



***** Start Testing : false sharing Note: overhead means comparision with pirvate ref.
-- iter_facotr : 1024000
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.371333 second
Standard deviation = 0.001247 second
CPU Timing = 10.966715 second
Standard deviation = 0.004604 second
-- Testing 8 threads
WC Timing = 8.801000 second
Standard deviation = 0.007348 second
WC overhead = 7.429667 second
Standard deviation = 0.007454 second
WC overhead/iter = 0.000028 ms
WC overhead(%) wrt reference = 541.784151
CPU Timing = 70.379964 second
Standard deviation = 0.069725 second
CPU overhead = 59.413249 second
Standard deviation = 0.069876 second
CPU overhead/iter = 0.000227 ms
CPU overhead(%) wrt reference = 541.759734
-- Running Reference case
WC Timing = 1.331667 second
Standard deviation = 0.000471 second
CPU Timing = 5.323324 second
Standard deviation = 0.009552 second
-- Testing 4 threads
WC Timing = 7.783333 second
Standard deviation = 0.051227 second
WC overhead = 6.451667 second
Standard deviation = 0.051229 second
WC overhead/iter = 0.000025 ms
WC overhead(%) wrt reference = 484.480601
CPU Timing = 31.123291 second
Standard deviation = 0.208148 second
CPU overhead = 25.799967 second
Standard deviation = 0.208367 second
CPU overhead/iter = 0.000098 ms
CPU overhead(%) wrt reference = 484.659013
-- Running Reference case
WC Timing = 1.331333 second
Standard deviation = 0.000471 second
CPU Timing = 2.663330 second
Standard deviation = 0.004662 second
-- Testing 2 threads
WC Timing = 7.765333 second
Standard deviation = 0.061266 second
WC overhead = 6.434000 second
Standard deviation = 0.061268 second
WC overhead/iter = 0.000025 ms
WC overhead(%) wrt reference = 483.274912
CPU Timing = 15.533366 second
Standard deviation = 0.123585 second
CPU overhead = 12.870036 second
Standard deviation = 0.123673 second
CPU overhead/iter = 0.000049 ms
CPU overhead(%) wrt reference = 483.230971
-- Running Reference case
WC Timing = 1.349333 second
Standard deviation = 0.000471 second
CPU Timing = 1.346680 second
Standard deviation = 0.004662 second
-- Testing 1 threads
WC Timing = 1.312333 second
Standard deviation = 0.012499 second
WC overhead = -0.037000 second
Standard deviation = 0.012508 second
WC overhead/iter = 0.000000 ms
WC overhead(%) wrt reference = -2.742095
CPU Timing = 1.306641 second
Standard deviation = 0.009322 second
CPU overhead = -0.040039 second
Standard deviation = 0.010423 second
CPU overhead/iter = 0.000000 ms
CPU overhead(%) wrt reference = -2.973169
***** Finished


*******************************
* ELAPSE TIME = 93.147003
*******************************



***** Start Testing : omp_set(unset)_lock
-- iter_facotr : 500
-- try_count : 1
-- delay_time : 0.001100 ms
-- Running Reference case
WC Timing = 1.329667 second
Standard deviation = 0.008179 second
CPU Timing = 10.633301 second
Standard deviation = 0.069412 second
-- Testing 8 threads
WC Timing = 1.555000 second
Standard deviation = 0.015253 second
WC overhead = 0.225333 second
Standard deviation = 0.017308 second
WC overhead/iter = 0.000587 ms
WC overhead(%) wrt reference = 16.946604
CPU Timing = 12.439941 second
Standard deviation = 0.125627 second
CPU overhead = 1.806641 second
Standard deviation = 0.143527 second
CPU overhead/iter = 0.004705 ms
CPU overhead(%) wrt reference = 16.990403
-- Running Reference case
WC Timing = 1.331667 second
Standard deviation = 0.003091 second
CPU Timing = 5.326660 second
Standard deviation = 0.009495 second
-- Testing 4 threads
WC Timing = 1.569333 second
Standard deviation = 0.010403 second
WC overhead = 0.237667 second
Standard deviation = 0.010853 second
WC overhead/iter = 0.000619 ms
WC overhead(%) wrt reference = 17.847309
CPU Timing = 6.266683 second
Standard deviation = 0.045013 second
CPU overhead = 0.940023 second
Standard deviation = 0.046004 second
CPU overhead/iter = 0.002448 ms
CPU overhead(%) wrt reference = 17.647508
-- Running Reference case
WC Timing = 1.335667 second
Standard deviation = 0.008219 second
CPU Timing = 2.676595 second
Standard deviation = 0.012616 second
-- Testing 2 threads
WC Timing = 1.585333 second
Standard deviation = 0.006600 second
WC overhead = 0.249667 second
Standard deviation = 0.010541 second
WC overhead/iter = 0.000650 ms
WC overhead(%) wrt reference = 18.692288
CPU Timing = 3.170085 second
Standard deviation = 0.014041 second
CPU overhead = 0.493490 second
Standard deviation = 0.018876 second
CPU overhead/iter = 0.001285 ms
CPU overhead(%) wrt reference = 18.437215
-- Running Reference case
WC Timing = 1.343667 second
Standard deviation = 0.007587 second
CPU Timing = 1.343262 second
Standard deviation = 0.009324 second
-- Testing 1 threads
WC Timing = 1.584333 second
Standard deviation = 0.010274 second
WC overhead = 0.240667 second
Standard deviation = 0.012772 second
WC overhead/iter = 0.000627 ms
WC overhead(%) wrt reference = 17.911188
CPU Timing = 1.586751 second
Standard deviation = 0.012616 second
CPU overhead = 0.243490 second
Standard deviation = 0.015688 second
CPU overhead/iter = 0.000634 ms
CPU overhead(%) wrt reference = 18.126742
***** Finished


*******************************
* ELAPSE TIME = 130.509995
*******************************



***** try failed *****
try_count = 1
REF Timing = 1.326333 second
TEST Timing = 1.507667 second
***** Start Testing : pingpong omp_set(unset)_lock
-- iter_facotr : 500
-- try_count : 2
-- delay_time : 0.003646 ms
-- Running Reference case
WC Timing = 1.309000 second
Standard deviation = 0.012028 second
CPU Timing = 2.613363 second
Standard deviation = 0.023536 second
-- Testing 2 threads
WC Timing = 1.536000 second
Standard deviation = 0.002449 second
WC overhead = 0.227000 second
Standard deviation = 0.012275 second
WC overhead/iter = 0.001773 ms
WC overhead(%) wrt reference = 17.341483
CPU Timing = 3.076660 second
Standard deviation = 0.004662 second
CPU overhead = 0.463298 second
Standard deviation = 0.023993 second
CPU overhead/iter = 0.003620 ms
CPU overhead(%) wrt reference = 17.728023
***** Finished


*******************************
* ELAPSE TIME = 17.044001
*******************************



***** Start Testing : !$OMP ordered
-- iter_facotr : 20000
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 4.456333 second
Standard deviation = 0.013021 second
CPU Timing = 35.626709 second
Standard deviation = 0.091753 second
-- Testing 8 threads
WC Timing = 13.597667 second
Standard deviation = 0.006600 second
WC overhead = 9.141333 second
Standard deviation = 0.014598 second
WC overhead/iter = 0.001785 ms
WC overhead(%) wrt reference = 205.131275
CPU Timing = 108.603271 second
Standard deviation = 0.020555 second
CPU overhead = 72.976562 second
Standard deviation = 0.094027 second
CPU overhead/iter = 0.014253 ms
CPU overhead(%) wrt reference = 204.836665
-- Running Reference case
WC Timing = 2.219333 second
Standard deviation = 0.000471 second
CPU Timing = 8.873372 second
Standard deviation = 0.004604 second
-- Testing 4 threads
WC Timing = 4.613667 second
Standard deviation = 0.021453 second
WC overhead = 2.394333 second
Standard deviation = 0.021458 second
WC overhead/iter = 0.000468 ms
WC overhead(%) wrt reference = 107.885251
CPU Timing = 18.443278 second
Standard deviation = 0.097506 second
CPU overhead = 9.569906 second
Standard deviation = 0.097615 second
CPU overhead/iter = 0.001869 ms
CPU overhead(%) wrt reference = 107.849701
-- Running Reference case
WC Timing = 1.109667 second
Standard deviation = 0.000471 second
CPU Timing = 2.216634 second
Standard deviation = 0.004723 second
-- Testing 2 threads
WC Timing = 4.590667 second
Standard deviation = 0.021453 second
WC overhead = 3.481000 second
Standard deviation = 0.021458 second
WC overhead/iter = 0.000680 ms
WC overhead(%) wrt reference = 313.697805
CPU Timing = 9.176595 second
Standard deviation = 0.051905 second
CPU overhead = 6.959961 second
Standard deviation = 0.052120 second
CPU overhead/iter = 0.001359 ms
CPU overhead(%) wrt reference = 313.987811
-- Running Reference case
WC Timing = 0.554667 second
Standard deviation = 0.000471 second
CPU Timing = 0.553385 second
Standard deviation = 0.005064 second
-- Testing 1 threads
WC Timing = 4.434333 second
Standard deviation = 0.000471 second
WC overhead = 3.879667 second
Standard deviation = 0.000667 second
WC overhead/iter = 0.000758 ms
WC overhead(%) wrt reference = 699.459143
CPU Timing = 4.433268 second
Standard deviation = 0.005064 second
CPU overhead = 3.879883 second
Standard deviation = 0.007161 second
CPU overhead/iter = 0.000758 ms
CPU overhead(%) wrt reference = 701.117647
***** Finished


*******************************
* ELAPSE TIME = 106.739998
*******************************



***** Start Testing : !$OMP parallel
-- iter_facotr : 50
-- try_count : 1
-- delay_time : 0.100000 ms
-- Running Reference case
WC Timing = 1.378000 second
Standard deviation = 0.000816 second
CPU Timing = 1.380046 second
Standard deviation = 0.000230 second
-- Testing 8 threads
WC Timing = 1.806333 second
Standard deviation = 0.039415 second
WC overhead = 0.428333 second
Standard deviation = 0.039424 second
WC overhead/iter = 0.033464 ms
WC overhead(%) wrt reference = 31.083696
CPU Timing = 1.789164 second
Standard deviation = 0.020958 second
CPU overhead = 0.409119 second
Standard deviation = 0.020959 second
CPU overhead/iter = 0.031962 ms
CPU overhead(%) wrt reference = 29.645300
-- Testing 4 threads
WC Timing = 1.663000 second
Standard deviation = 0.002828 second
WC overhead = 0.285000 second
Standard deviation = 0.002944 second
WC overhead/iter = 0.022266 ms
WC overhead(%) wrt reference = 20.682148
CPU Timing = 1.664144 second
Standard deviation = 0.003089 second
CPU overhead = 0.284098 second
Standard deviation = 0.003097 second
CPU overhead/iter = 0.022195 ms
CPU overhead(%) wrt reference = 20.586154
-- Testing 2 threads
WC Timing = 1.636333 second
Standard deviation = 0.002357 second
WC overhead = 0.258333 second
Standard deviation = 0.002494 second
WC overhead/iter = 0.020182 ms
WC overhead(%) wrt reference = 18.746976
CPU Timing = 1.638346 second
Standard deviation = 0.002187 second
CPU overhead = 0.258301 second
Standard deviation = 0.002199 second
CPU overhead/iter = 0.020180 ms
CPU overhead(%) wrt reference = 18.716830
-- Testing 1 threads
WC Timing = 1.385333 second
Standard deviation = 0.002055 second
WC overhead = 0.007333 second
Standard deviation = 0.002211 second
WC overhead/iter = 0.000573 ms
WC overhead(%) wrt reference = 0.532171
CPU Timing = 1.389974 second
Standard deviation = 0.000230 second
CPU overhead = 0.009928 second
Standard deviation = 0.000326 second
CPU overhead/iter = 0.000776 ms
CPU overhead(%) wrt reference = 0.719424
***** Finished


*******************************
* ELAPSE TIME = 23.613001
*******************************



***** Start Testing : !$OMP parallel do schedule(static)
-- iter_facotr : 1500
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.382333 second
Standard deviation = 0.000471 second
CPU Timing = 1.383301 second
Standard deviation = 0.004493 second
-- Testing 8 threads
WC Timing = 14.185000 second
Standard deviation = 0.093908 second
WC overhead = 12.802667 second
Standard deviation = 0.093909 second
WC overhead/iter = 0.033340 ms
WC overhead(%) wrt reference = 926.163491
CPU Timing = 14.120850 second
Standard deviation = 0.095423 second
CPU overhead = 12.737549 second
Standard deviation = 0.095529 second
CPU overhead/iter = 0.033171 ms
CPU overhead(%) wrt reference = 920.808330
-- Testing 4 threads
WC Timing = 10.052667 second
Standard deviation = 0.092557 second
WC overhead = 8.670333 second
Standard deviation = 0.092559 second
WC overhead/iter = 0.022579 ms
WC overhead(%) wrt reference = 627.224499
CPU Timing = 10.052490 second
Standard deviation = 0.096006 second
CPU overhead = 8.669189 second
Standard deviation = 0.096111 second
CPU overhead/iter = 0.022576 ms
CPU overhead(%) wrt reference = 626.703142
-- Testing 2 threads
WC Timing = 9.327000 second
Standard deviation = 0.081490 second
WC overhead = 7.944667 second
Standard deviation = 0.081492 second
WC overhead/iter = 0.020689 ms
WC overhead(%) wrt reference = 574.728718
CPU Timing = 9.318359 second
Standard deviation = 0.086193 second
CPU overhead = 7.935059 second
Standard deviation = 0.086310 second
CPU overhead/iter = 0.020664 ms
CPU overhead(%) wrt reference = 573.632192
-- Testing 1 threads
WC Timing = 1.633667 second
Standard deviation = 0.000471 second
WC overhead = 0.251333 second
Standard deviation = 0.000667 second
WC overhead/iter = 0.000655 ms
WC overhead(%) wrt reference = 18.181818
CPU Timing = 1.633464 second
Standard deviation = 0.004723 second
CPU overhead = 0.250163 second
Standard deviation = 0.006519 second
CPU overhead/iter = 0.000651 ms
CPU overhead(%) wrt reference = 18.084481
***** Finished


***** Start Testing : !$OMP parallel do schedule(dynamic)
-- iter_facotr : 1500
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.382333 second
Standard deviation = 0.000471 second
CPU Timing = 1.383301 second
Standard deviation = 0.004493 second
-- Testing 8 threads
WC Timing = 425.288000 second
Standard deviation = 0.139800 second
WC overhead = 423.905667 second
Standard deviation = 0.139801 second
WC overhead/iter = 1.103921 ms
WC overhead(%) wrt reference = 30665.951238
CPU Timing = 423.027913 second
Standard deviation = 0.300541 second
CPU overhead = 421.644613 second
Standard deviation = 0.300575 second
CPU overhead/iter = 1.098033 ms
CPU overhead(%) wrt reference = 30481.050712
-- Testing 4 threads
WC Timing = 102.452000 second
Standard deviation = 0.098796 second
WC overhead = 101.069667 second
Standard deviation = 0.098797 second
WC overhead/iter = 0.263202 ms
WC overhead(%) wrt reference = 7311.526391
CPU Timing = 102.325033 second
Standard deviation = 0.099468 second
CPU overhead = 100.941732 second
Standard deviation = 0.099569 second
CPU overhead/iter = 0.262869 ms
CPU overhead(%) wrt reference = 7297.164372
-- Testing 2 threads
WC Timing = 29.205667 second
Standard deviation = 0.014522 second
WC overhead = 27.823333 second
Standard deviation = 0.014530 second
WC overhead/iter = 0.072457 ms
WC overhead(%) wrt reference = 2012.780320
CPU Timing = 29.188151 second
Standard deviation = 0.015919 second
CPU overhead = 27.804850 second
Standard deviation = 0.016541 second
CPU overhead/iter = 0.072408 ms
CPU overhead(%) wrt reference = 2010.036475
-- Testing 1 threads
WC Timing = 1.634000 second
Standard deviation = 0.000817 second
WC overhead = 0.251667 second
Standard deviation = 0.000943 second
WC overhead/iter = 0.000655 ms
WC overhead(%) wrt reference = 18.205932
CPU Timing = 1.633464 second
Standard deviation = 0.005126 second
CPU overhead = 0.250163 second
Standard deviation = 0.006817 second
CPU overhead/iter = 0.000651 ms
CPU overhead(%) wrt reference = 18.084481
***** Finished


***** Start Testing : !$OMP parallel do schedule(guided)
-- iter_facotr : 1500
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.382333 second
Standard deviation = 0.000471 second
CPU Timing = 1.383301 second
Standard deviation = 0.004493 second
-- Testing 8 threads
WC Timing = 77.803667 second
Standard deviation = 0.150741 second
WC overhead = 76.421333 second
Standard deviation = 0.150742 second
WC overhead/iter = 0.199014 ms
WC overhead(%) wrt reference = 5528.430181
CPU Timing = 77.443766 second
Standard deviation = 0.126336 second
CPU overhead = 76.060465 second
Standard deviation = 0.126416 second
CPU overhead/iter = 0.198074 ms
CPU overhead(%) wrt reference = 5498.476291
-- Testing 4 threads
WC Timing = 25.701333 second
Standard deviation = 0.051149 second
WC overhead = 24.319000 second
Standard deviation = 0.051151 second
WC overhead/iter = 0.063331 ms
WC overhead(%) wrt reference = 1759.271759
CPU Timing = 25.665853 second
Standard deviation = 0.039518 second
CPU overhead = 24.282552 second
Standard deviation = 0.039773 second
CPU overhead/iter = 0.063236 ms
CPU overhead(%) wrt reference = 1755.406518
-- Testing 2 threads
WC Timing = 9.378333 second
Standard deviation = 0.459409 second
WC overhead = 7.996000 second
Standard deviation = 0.459409 second
WC overhead/iter = 0.020823 ms
WC overhead(%) wrt reference = 578.442246
CPU Timing = 9.389974 second
Standard deviation = 0.465501 second
CPU overhead = 8.006673 second
Standard deviation = 0.465523 second
CPU overhead/iter = 0.020851 ms
CPU overhead(%) wrt reference = 578.809272
-- Testing 1 threads
WC Timing = 1.633667 second
Standard deviation = 0.000471 second
WC overhead = 0.251333 second
Standard deviation = 0.000667 second
WC overhead/iter = 0.000655 ms
WC overhead(%) wrt reference = 18.181818
CPU Timing = 1.633464 second
Standard deviation = 0.003683 second
CPU overhead = 0.250163 second
Standard deviation = 0.005809 second
CPU overhead/iter = 0.000651 ms
CPU overhead(%) wrt reference = 18.084481
***** Finished


*******************************
* ELAPSE TIME = 2129.056885
*******************************



***** Start Testing : !$OMP parallel do schedule(static,chunk_size)
-- iter_facotr : 1500
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.327000 second
Standard deviation = 0.000000 second
CPU Timing = 1.326823 second
Standard deviation = 0.004604 second
CHUNK SIZE = 1
-- Testing 8 threads
WC Timing = 59.108667 second
Standard deviation = 0.082552 second
WC overhead = 57.781667 second
Standard deviation = 0.082552 second
WC overhead/iter = 0.150473 ms
WC overhead(%) wrt reference = 4354.307964
CPU Timing = 58.740804 second
Standard deviation = 0.074736 second
CPU overhead = 57.413981 second
Standard deviation = 0.074878 second
CPU overhead/iter = 0.149516 ms
CPU overhead(%) wrt reference = 4327.177380
CHUNK SIZE = 2
-- Testing 8 threads
WC Timing = 35.154667 second
Standard deviation = 0.106850 second
WC overhead = 33.827667 second
Standard deviation = 0.106850 second
WC overhead/iter = 0.088093 ms
WC overhead(%) wrt reference = 2549.183623
CPU Timing = 34.989583 second
Standard deviation = 0.105483 second
CPU overhead = 33.662760 second
Standard deviation = 0.105583 second
CPU overhead/iter = 0.087663 ms
CPU overhead(%) wrt reference = 2537.095191
CHUNK SIZE = 4
-- Testing 8 threads
WC Timing = 23.068000 second
Standard deviation = 0.074552 second
WC overhead = 21.741000 second
Standard deviation = 0.074552 second
WC overhead/iter = 0.056617 ms
WC overhead(%) wrt reference = 1638.357196
CPU Timing = 22.964193 second
Standard deviation = 0.076356 second
CPU overhead = 21.637370 second
Standard deviation = 0.076495 second
CPU overhead/iter = 0.056347 ms
CPU overhead(%) wrt reference = 1630.765456
CHUNK SIZE = 8
-- Testing 8 threads
WC Timing = 17.383000 second
Standard deviation = 0.094117 second
WC overhead = 16.056000 second
Standard deviation = 0.094117 second
WC overhead/iter = 0.041813 ms
WC overhead(%) wrt reference = 1209.947250
CPU Timing = 17.287028 second
Standard deviation = 0.091107 second
CPU overhead = 15.960205 second
Standard deviation = 0.091223 second
CPU overhead/iter = 0.041563 ms
CPU overhead(%) wrt reference = 1202.888862
CHUNK SIZE = 16
-- Testing 8 threads
WC Timing = 15.960000 second
Standard deviation = 0.063230 second
WC overhead = 14.633000 second
Standard deviation = 0.063230 second
WC overhead/iter = 0.038107 ms
WC overhead(%) wrt reference = 1102.712886
CPU Timing = 15.875488 second
Standard deviation = 0.048513 second
CPU overhead = 14.548665 second
Standard deviation = 0.048731 second
CPU overhead/iter = 0.037887 ms
CPU overhead(%) wrt reference = 1096.503925
CHUNK SIZE = 32
-- Testing 8 threads
WC Timing = 14.954333 second
Standard deviation = 0.028406 second
WC overhead = 13.627333 second
Standard deviation = 0.028406 second
WC overhead/iter = 0.035488 ms
WC overhead(%) wrt reference = 1026.927909
CPU Timing = 14.887858 second
Standard deviation = 0.025262 second
CPU overhead = 13.561035 second
Standard deviation = 0.025678 second
CPU overhead/iter = 0.035315 ms
CPU overhead(%) wrt reference = 1022.068204
CHUNK SIZE = 1
-- Testing 4 threads
WC Timing = 36.628667 second
Standard deviation = 0.110714 second
WC overhead = 35.301667 second
Standard deviation = 0.110714 second
WC overhead/iter = 0.091931 ms
WC overhead(%) wrt reference = 2660.261241
CPU Timing = 36.553548 second
Standard deviation = 0.121784 second
CPU overhead = 35.226725 second
Standard deviation = 0.121871 second
CPU overhead/iter = 0.091736 ms
CPU overhead(%) wrt reference = 2654.968106
CHUNK SIZE = 2
-- Testing 4 threads
WC Timing = 23.385333 second
Standard deviation = 0.110828 second
WC overhead = 22.058333 second
Standard deviation = 0.110828 second
WC overhead/iter = 0.057444 ms
WC overhead(%) wrt reference = 1662.270786
CPU Timing = 23.344076 second
Standard deviation = 0.090920 second
CPU overhead = 22.017253 second
Standard deviation = 0.091037 second
CPU overhead/iter = 0.057337 ms
CPU overhead(%) wrt reference = 1659.396467
CHUNK SIZE = 4
-- Testing 4 threads
WC Timing = 16.412333 second
Standard deviation = 0.031255 second
WC overhead = 15.085333 second
Standard deviation = 0.031255 second
WC overhead/iter = 0.039285 ms
WC overhead(%) wrt reference = 1136.799800
CPU Timing = 16.371582 second
Standard deviation = 0.022315 second
CPU overhead = 15.044759 second
Standard deviation = 0.022785 second
CPU overhead/iter = 0.039179 ms
CPU overhead(%) wrt reference = 1133.893523
CHUNK SIZE = 8
-- Testing 4 threads
WC Timing = 13.474667 second
Standard deviation = 0.012552 second
WC overhead = 12.147667 second
Standard deviation = 0.012552 second
WC overhead/iter = 0.031635 ms
WC overhead(%) wrt reference = 915.423261
CPU Timing = 13.463379 second
Standard deviation = 0.034736 second
CPU overhead = 12.136556 second
Standard deviation = 0.035039 second
CPU overhead/iter = 0.031606 ms
CPU overhead(%) wrt reference = 914.708047
CHUNK SIZE = 16
-- Testing 4 threads
WC Timing = 11.991000 second
Standard deviation = 0.006481 second
WC overhead = 10.664000 second
Standard deviation = 0.006481 second
WC overhead/iter = 0.027771 ms
WC overhead(%) wrt reference = 803.617182
CPU Timing = 11.973307 second
Standard deviation = 0.016846 second
CPU overhead = 10.646484 second
Standard deviation = 0.017463 second
CPU overhead/iter = 0.027725 ms
CPU overhead(%) wrt reference = 802.404318
CHUNK SIZE = 32
-- Testing 4 threads
WC Timing = 11.032000 second
Standard deviation = 0.007071 second
WC overhead = 9.705000 second
Standard deviation = 0.007071 second
WC overhead/iter = 0.025273 ms
WC overhead(%) wrt reference = 731.348908
CPU Timing = 11.025879 second
Standard deviation = 0.015691 second
CPU overhead = 9.699056 second
Standard deviation = 0.016352 second
CPU overhead/iter = 0.025258 ms
CPU overhead(%) wrt reference = 730.998528
CHUNK SIZE = 1
-- Testing 2 threads
WC Timing = 14.594667 second
Standard deviation = 0.020171 second
WC overhead = 13.267667 second
Standard deviation = 0.020171 second
WC overhead/iter = 0.034551 ms
WC overhead(%) wrt reference = 999.824165
CPU Timing = 14.583333 second
Standard deviation = 0.019602 second
CPU overhead = 13.256510 second
Standard deviation = 0.020135 second
CPU overhead/iter = 0.034522 ms
CPU overhead(%) wrt reference = 999.116781
CHUNK SIZE = 2
-- Testing 2 threads
WC Timing = 12.308000 second
Standard deviation = 0.255915 second
WC overhead = 10.981000 second
Standard deviation = 0.255915 second
WC overhead/iter = 0.028596 ms
WC overhead(%) wrt reference = 827.505652
CPU Timing = 12.283203 second
Standard deviation = 0.247281 second
CPU overhead = 10.956380 second
Standard deviation = 0.247323 second
CPU overhead/iter = 0.028532 ms
CPU overhead(%) wrt reference = 825.760550
CHUNK SIZE = 4
-- Testing 2 threads
WC Timing = 10.847667 second
Standard deviation = 0.063189 second
WC overhead = 9.520667 second
Standard deviation = 0.063189 second
WC overhead/iter = 0.024793 ms
WC overhead(%) wrt reference = 717.457925
CPU Timing = 10.851888 second
Standard deviation = 0.078508 second
CPU overhead = 9.525065 second
Standard deviation = 0.078643 second
CPU overhead/iter = 0.024805 ms
CPU overhead(%) wrt reference = 717.885182
CHUNK SIZE = 8
-- Testing 2 threads
WC Timing = 10.015000 second
Standard deviation = 0.027653 second
WC overhead = 8.688000 second
Standard deviation = 0.027653 second
WC overhead/iter = 0.022625 ms
WC overhead(%) wrt reference = 654.709872
CPU Timing = 10.008464 second
Standard deviation = 0.026449 second
CPU overhead = 8.681641 second
Standard deviation = 0.026847 second
CPU overhead/iter = 0.022608 ms
CPU overhead(%) wrt reference = 654.317959
CHUNK SIZE = 16
-- Testing 2 threads
WC Timing = 9.610667 second
Standard deviation = 0.013225 second
WC overhead = 8.283667 second
Standard deviation = 0.013225 second
WC overhead/iter = 0.021572 ms
WC overhead(%) wrt reference = 624.240142
CPU Timing = 9.598307 second
Standard deviation = 0.021341 second
CPU overhead = 8.271484 second
Standard deviation = 0.021832 second
CPU overhead/iter = 0.021540 ms
CPU overhead(%) wrt reference = 623.405299
CHUNK SIZE = 32
-- Testing 2 threads
WC Timing = 9.375000 second
Standard deviation = 0.011518 second
WC overhead = 8.048000 second
Standard deviation = 0.011518 second
WC overhead/iter = 0.020958 ms
WC overhead(%) wrt reference = 606.480783
CPU Timing = 9.376302 second
Standard deviation = 0.006445 second
CPU overhead = 8.049479 second
Standard deviation = 0.007920 second
CPU overhead/iter = 0.020962 ms
CPU overhead(%) wrt reference = 606.673209
CHUNK SIZE = 1
-- Testing 1 threads
WC Timing = 1.519333 second
Standard deviation = 0.000471 second
WC overhead = 0.192333 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000501 ms
WC overhead(%) wrt reference = 14.493846
CPU Timing = 1.520182 second
Standard deviation = 0.000921 second
CPU overhead = 0.193359 second
Standard deviation = 0.004695 second
CPU overhead/iter = 0.000504 ms
CPU overhead(%) wrt reference = 14.573111
CHUNK SIZE = 2
-- Testing 1 threads
WC Timing = 1.519667 second
Standard deviation = 0.000943 second
WC overhead = 0.192667 second
Standard deviation = 0.000943 second
WC overhead/iter = 0.000502 ms
WC overhead(%) wrt reference = 14.518965
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 4
-- Testing 1 threads
WC Timing = 1.519333 second
Standard deviation = 0.000471 second
WC overhead = 0.192333 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000501 ms
WC overhead(%) wrt reference = 14.493846
CPU Timing = 1.520182 second
Standard deviation = 0.000921 second
CPU overhead = 0.193359 second
Standard deviation = 0.004695 second
CPU overhead/iter = 0.000504 ms
CPU overhead(%) wrt reference = 14.573111
CHUNK SIZE = 8
-- Testing 1 threads
WC Timing = 1.528333 second
Standard deviation = 0.013199 second
WC overhead = 0.201333 second
Standard deviation = 0.013199 second
WC overhead/iter = 0.000524 ms
WC overhead(%) wrt reference = 15.172067
CPU Timing = 1.526693 second
Standard deviation = 0.008783 second
CPU overhead = 0.199870 second
Standard deviation = 0.009916 second
CPU overhead/iter = 0.000520 ms
CPU overhead(%) wrt reference = 15.063788
CHUNK SIZE = 16
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468727
CPU Timing = 1.516927 second
Standard deviation = 0.005126 second
CPU overhead = 0.190104 second
Standard deviation = 0.006890 second
CPU overhead/iter = 0.000495 ms
CPU overhead(%) wrt reference = 14.327772
CHUNK SIZE = 32
-- Testing 1 threads
WC Timing = 1.519667 second
Standard deviation = 0.000471 second
WC overhead = 0.192667 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000502 ms
WC overhead(%) wrt reference = 14.518965
CPU Timing = 1.520182 second
Standard deviation = 0.000921 second
CPU overhead = 0.193359 second
Standard deviation = 0.004695 second
CPU overhead/iter = 0.000504 ms
CPU overhead(%) wrt reference = 14.573111
***** Finished


***** Start Testing : !$OMP parallel do schedule(dynamic,chunk_size)
-- iter_facotr : 1500
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.327000 second
Standard deviation = 0.000000 second
CPU Timing = 1.326823 second
Standard deviation = 0.004604 second
CHUNK SIZE = 1
-- Testing 8 threads
WC Timing = 411.885333 second
Standard deviation = 0.257528 second
WC overhead = 410.558333 second
Standard deviation = 0.257528 second
WC overhead/iter = 1.069162 ms
WC overhead(%) wrt reference = 30938.834470
CPU Timing = 409.992513 second
Standard deviation = 0.324699 second
CPU overhead = 408.665690 second
Standard deviation = 0.324731 second
CPU overhead/iter = 1.064234 ms
CPU overhead(%) wrt reference = 30800.318940
CHUNK SIZE = 2
-- Testing 8 threads
WC Timing = 226.415667 second
Standard deviation = 0.201776 second
WC overhead = 225.088667 second
Standard deviation = 0.201776 second
WC overhead/iter = 0.586168 ms
WC overhead(%) wrt reference = 16962.220552
CPU Timing = 225.276204 second
Standard deviation = 0.264409 second
CPU overhead = 223.949382 second
Standard deviation = 0.264449 second
CPU overhead/iter = 0.583202 ms
CPU overhead(%) wrt reference = 16878.618744
CHUNK SIZE = 4
-- Testing 8 threads
WC Timing = 125.748667 second
Standard deviation = 0.042898 second
WC overhead = 124.421667 second
Standard deviation = 0.042898 second
WC overhead/iter = 0.324015 ms
WC overhead(%) wrt reference = 9376.161771
CPU Timing = 125.119629 second
Standard deviation = 0.097100 second
CPU overhead = 123.792806 second
Standard deviation = 0.097210 second
CPU overhead/iter = 0.322377 ms
CPU overhead(%) wrt reference = 9330.017174
CHUNK SIZE = 8
-- Testing 8 threads
WC Timing = 68.313667 second
Standard deviation = 0.029533 second
WC overhead = 66.986667 second
Standard deviation = 0.029533 second
WC overhead/iter = 0.174444 ms
WC overhead(%) wrt reference = 5047.977896
CPU Timing = 67.982585 second
Standard deviation = 0.008971 second
CPU overhead = 66.655762 second
Standard deviation = 0.010083 second
CPU overhead/iter = 0.173583 ms
CPU overhead(%) wrt reference = 5023.711973
CHUNK SIZE = 16
-- Testing 8 threads
WC Timing = 37.918667 second
Standard deviation = 0.059253 second
WC overhead = 36.591667 second
Standard deviation = 0.059253 second
WC overhead/iter = 0.095291 ms
WC overhead(%) wrt reference = 2757.472997
CPU Timing = 37.740885 second
Standard deviation = 0.056904 second
CPU overhead = 36.414062 second
Standard deviation = 0.057090 second
CPU overhead/iter = 0.094828 ms
CPU overhead(%) wrt reference = 2744.455348
CHUNK SIZE = 32
-- Testing 8 threads
WC Timing = 22.404000 second
Standard deviation = 0.176845 second
WC overhead = 21.077000 second
Standard deviation = 0.176845 second
WC overhead/iter = 0.054888 ms
WC overhead(%) wrt reference = 1588.319518
CPU Timing = 22.248210 second
Standard deviation = 0.097742 second
CPU overhead = 20.921387 second
Standard deviation = 0.097850 second
CPU overhead/iter = 0.054483 ms
CPU overhead(%) wrt reference = 1576.803238
CHUNK SIZE = 1
-- Testing 4 threads
WC Timing = 102.364000 second
Standard deviation = 0.053467 second
WC overhead = 101.037000 second
Standard deviation = 0.053467 second
WC overhead/iter = 0.263117 ms
WC overhead(%) wrt reference = 7613.941223
CPU Timing = 102.216471 second
Standard deviation = 0.037521 second
CPU overhead = 100.889648 second
Standard deviation = 0.037802 second
CPU overhead/iter = 0.262733 ms
CPU overhead(%) wrt reference = 7603.851816
CHUNK SIZE = 2
-- Testing 4 threads
WC Timing = 54.443000 second
Standard deviation = 0.023367 second
WC overhead = 53.116000 second
Standard deviation = 0.023367 second
WC overhead/iter = 0.138323 ms
WC overhead(%) wrt reference = 4002.712888
CPU Timing = 54.377604 second
Standard deviation = 0.020019 second
CPU overhead = 53.050781 second
Standard deviation = 0.020541 second
CPU overhead/iter = 0.138153 ms
CPU overhead(%) wrt reference = 3998.331698
CHUNK SIZE = 4
-- Testing 4 threads
WC Timing = 30.019667 second
Standard deviation = 0.085811 second
WC overhead = 28.692667 second
Standard deviation = 0.085811 second
WC overhead/iter = 0.074720 ms
WC overhead(%) wrt reference = 2162.220548
CPU Timing = 29.976562 second
Standard deviation = 0.102472 second
CPU overhead = 28.649740 second
Standard deviation = 0.102576 second
CPU overhead/iter = 0.074609 ms
CPU overhead(%) wrt reference = 2159.273798
CHUNK SIZE = 8
-- Testing 4 threads
WC Timing = 18.262667 second
Standard deviation = 0.096562 second
WC overhead = 16.935667 second
Standard deviation = 0.096562 second
WC overhead/iter = 0.044103 ms
WC overhead(%) wrt reference = 1276.237126
CPU Timing = 18.235026 second
Standard deviation = 0.077800 second
CPU overhead = 16.908203 second
Standard deviation = 0.077936 second
CPU overhead/iter = 0.044032 ms
CPU overhead(%) wrt reference = 1274.337586
CHUNK SIZE = 16
-- Testing 4 threads
WC Timing = 12.974333 second
Standard deviation = 0.088973 second
WC overhead = 11.647333 second
Standard deviation = 0.088973 second
WC overhead/iter = 0.030332 ms
WC overhead(%) wrt reference = 877.719166
CPU Timing = 12.959310 second
Standard deviation = 0.096666 second
CPU overhead = 11.632487 second
Standard deviation = 0.096776 second
CPU overhead/iter = 0.030293 ms
CPU overhead(%) wrt reference = 876.717370
CHUNK SIZE = 32
-- Testing 4 threads
WC Timing = 11.162667 second
Standard deviation = 0.127845 second
WC overhead = 9.835667 second
Standard deviation = 0.127845 second
WC overhead/iter = 0.025614 ms
WC overhead(%) wrt reference = 741.195679
CPU Timing = 11.158529 second
Standard deviation = 0.137165 second
CPU overhead = 9.831706 second
Standard deviation = 0.137242 second
CPU overhead/iter = 0.025603 ms
CPU overhead(%) wrt reference = 740.996075
CHUNK SIZE = 1
-- Testing 2 threads
WC Timing = 28.876000 second
Standard deviation = 0.023036 second
WC overhead = 27.549000 second
Standard deviation = 0.023036 second
WC overhead/iter = 0.071742 ms
WC overhead(%) wrt reference = 2076.036173
CPU Timing = 28.850260 second
Standard deviation = 0.022628 second
CPU overhead = 27.523437 second
Standard deviation = 0.023091 second
CPU overhead/iter = 0.071676 ms
CPU overhead(%) wrt reference = 2074.386654
CHUNK SIZE = 2
-- Testing 2 threads
WC Timing = 16.175333 second
Standard deviation = 0.063594 second
WC overhead = 14.848333 second
Standard deviation = 0.063594 second
WC overhead/iter = 0.038668 ms
WC overhead(%) wrt reference = 1118.939965
CPU Timing = 16.173177 second
Standard deviation = 0.068412 second
CPU overhead = 14.846354 second
Standard deviation = 0.068567 second
CPU overhead/iter = 0.038662 ms
CPU overhead(%) wrt reference = 1118.940137
CHUNK SIZE = 4
-- Testing 2 threads
WC Timing = 9.751000 second
Standard deviation = 0.100588 second
WC overhead = 8.424000 second
Standard deviation = 0.100588 second
WC overhead/iter = 0.021938 ms
WC overhead(%) wrt reference = 634.815373
CPU Timing = 9.761719 second
Standard deviation = 0.106154 second
CPU overhead = 8.434896 second
Standard deviation = 0.106254 second
CPU overhead/iter = 0.021966 ms
CPU overhead(%) wrt reference = 635.721295
CHUNK SIZE = 8
-- Testing 2 threads
WC Timing = 7.117000 second
Standard deviation = 0.030474 second
WC overhead = 5.790000 second
Standard deviation = 0.030474 second
WC overhead/iter = 0.015078 ms
WC overhead(%) wrt reference = 436.322533
CPU Timing = 7.116536 second
Standard deviation = 0.032264 second
CPU overhead = 5.789714 second
Standard deviation = 0.032591 second
CPU overhead/iter = 0.015077 ms
CPU overhead(%) wrt reference = 436.359176
CHUNK SIZE = 16
-- Testing 2 threads
WC Timing = 9.478333 second
Standard deviation = 0.197723 second
WC overhead = 8.151333 second
Standard deviation = 0.197723 second
WC overhead/iter = 0.021227 ms
WC overhead(%) wrt reference = 614.267771
CPU Timing = 9.475911 second
Standard deviation = 0.195484 second
CPU overhead = 8.149089 second
Standard deviation = 0.195538 second
CPU overhead/iter = 0.021222 ms
CPU overhead(%) wrt reference = 614.180569
CHUNK SIZE = 32
-- Testing 2 threads
WC Timing = 7.078000 second
Standard deviation = 0.074958 second
WC overhead = 5.751000 second
Standard deviation = 0.074958 second
WC overhead/iter = 0.014977 ms
WC overhead(%) wrt reference = 433.383572
CPU Timing = 7.068359 second
Standard deviation = 0.059391 second
CPU overhead = 5.741536 second
Standard deviation = 0.059569 second
CPU overhead/iter = 0.014952 ms
CPU overhead(%) wrt reference = 432.728165
CHUNK SIZE = 1
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468726
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 2
-- Testing 1 threads
WC Timing = 1.519333 second
Standard deviation = 0.000471 second
WC overhead = 0.192333 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000501 ms
WC overhead(%) wrt reference = 14.493846
CPU Timing = 1.520833 second
Standard deviation = 0.001841 second
CPU overhead = 0.194010 second
Standard deviation = 0.004958 second
CPU overhead/iter = 0.000505 ms
CPU overhead(%) wrt reference = 14.622179
CHUNK SIZE = 4
-- Testing 1 threads
WC Timing = 1.519667 second
Standard deviation = 0.000943 second
WC overhead = 0.192667 second
Standard deviation = 0.000943 second
WC overhead/iter = 0.000502 ms
WC overhead(%) wrt reference = 14.518965
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 8
-- Testing 1 threads
WC Timing = 1.519333 second
Standard deviation = 0.000471 second
WC overhead = 0.192333 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000501 ms
WC overhead(%) wrt reference = 14.493846
CPU Timing = 1.516927 second
Standard deviation = 0.006639 second
CPU overhead = 0.190104 second
Standard deviation = 0.008079 second
CPU overhead/iter = 0.000495 ms
CPU overhead(%) wrt reference = 14.327772
CHUNK SIZE = 16
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468726
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 32
-- Testing 1 threads
WC Timing = 1.519667 second
Standard deviation = 0.000471 second
WC overhead = 0.192667 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000502 ms
WC overhead(%) wrt reference = 14.518966
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
***** Finished


***** Start Testing : !$OMP parallel do schedule(guided,chunk_size)
-- iter_facotr : 1500
-- try_count : 1
-- delay_time : 0.000000 ms
-- Running Reference case
WC Timing = 1.327000 second
Standard deviation = 0.000000 second
CPU Timing = 1.326823 second
Standard deviation = 0.004604 second
CHUNK SIZE = 1
-- Testing 8 threads
WC Timing = 78.786333 second
Standard deviation = 0.038029 second
WC overhead = 77.459333 second
Standard deviation = 0.038029 second
WC overhead/iter = 0.201717 ms
WC overhead(%) wrt reference = 5837.176589
CPU Timing = 78.393717 second
Standard deviation = 0.049899 second
CPU overhead = 77.066895 second
Standard deviation = 0.050111 second
CPU overhead/iter = 0.200695 ms
CPU overhead(%) wrt reference = 5808.378312
CHUNK SIZE = 2
-- Testing 8 threads
WC Timing = 71.812667 second
Standard deviation = 0.069811 second
WC overhead = 70.485667 second
Standard deviation = 0.069811 second
WC overhead/iter = 0.183556 ms
WC overhead(%) wrt reference = 5311.655365
CPU Timing = 71.473796 second
Standard deviation = 0.101329 second
CPU overhead = 70.146973 second
Standard deviation = 0.101433 second
CPU overhead/iter = 0.182674 ms
CPU overhead(%) wrt reference = 5286.837586
CHUNK SIZE = 4
-- Testing 8 threads
WC Timing = 60.059000 second
Standard deviation = 0.069986 second
WC overhead = 58.732000 second
Standard deviation = 0.069986 second
WC overhead/iter = 0.152948 ms
WC overhead(%) wrt reference = 4425.923136
CPU Timing = 59.776367 second
Standard deviation = 0.075695 second
CPU overhead = 58.449544 second
Standard deviation = 0.075834 second
CPU overhead/iter = 0.152212 ms
CPU overhead(%) wrt reference = 4405.225711
CHUNK SIZE = 8
-- Testing 8 threads
WC Timing = 48.581667 second
Standard deviation = 0.056958 second
WC overhead = 47.254667 second
Standard deviation = 0.056958 second
WC overhead/iter = 0.123059 ms
WC overhead(%) wrt reference = 3561.014821
CPU Timing = 48.361654 second
Standard deviation = 0.053993 second
CPU overhead = 47.034831 second
Standard deviation = 0.054189 second
CPU overhead/iter = 0.122487 ms
CPU overhead(%) wrt reference = 3544.921492
CHUNK SIZE = 16
-- Testing 8 threads
WC Timing = 38.775000 second
Standard deviation = 0.113264 second
WC overhead = 37.448000 second
Standard deviation = 0.113264 second
WC overhead/iter = 0.097521 ms
WC overhead(%) wrt reference = 2822.004521
CPU Timing = 38.541667 second
Standard deviation = 0.049350 second
CPU overhead = 37.214844 second
Standard deviation = 0.049564 second
CPU overhead/iter = 0.096914 ms
CPU overhead(%) wrt reference = 2804.808636
CHUNK SIZE = 32
-- Testing 8 threads
WC Timing = 23.371000 second
Standard deviation = 0.040208 second
WC overhead = 22.044000 second
Standard deviation = 0.040208 second
WC overhead/iter = 0.057406 ms
WC overhead(%) wrt reference = 1661.190656
CPU Timing = 23.247884 second
Standard deviation = 0.023142 second
CPU overhead = 21.921061 second
Standard deviation = 0.023595 second
CPU overhead/iter = 0.057086 ms
CPU overhead(%) wrt reference = 1652.146712
CHUNK SIZE = 1
-- Testing 4 threads
WC Timing = 26.956000 second
Standard deviation = 0.022862 second
WC overhead = 25.629000 second
Standard deviation = 0.022862 second
WC overhead/iter = 0.066742 ms
WC overhead(%) wrt reference = 1931.348909
CPU Timing = 26.909831 second
Standard deviation = 0.011673 second
CPU overhead = 25.583008 second
Standard deviation = 0.012548 second
CPU overhead/iter = 0.066622 ms
CPU overhead(%) wrt reference = 1928.140334
CHUNK SIZE = 2
-- Testing 4 threads
WC Timing = 25.550667 second
Standard deviation = 0.025486 second
WC overhead = 24.223667 second
Standard deviation = 0.025486 second
WC overhead/iter = 0.063082 ms
WC overhead(%) wrt reference = 1825.445868
CPU Timing = 25.504232 second
Standard deviation = 0.011673 second
CPU overhead = 24.177409 second
Standard deviation = 0.012548 second
CPU overhead/iter = 0.062962 ms
CPU overhead(%) wrt reference = 1822.203140
CHUNK SIZE = 4
-- Testing 4 threads
WC Timing = 21.862333 second
Standard deviation = 0.021203 second
WC overhead = 20.535333 second
Standard deviation = 0.021203 second
WC overhead/iter = 0.053477 ms
WC overhead(%) wrt reference = 1547.500628
CPU Timing = 21.842448 second
Standard deviation = 0.002007 second
CPU overhead = 20.515625 second
Standard deviation = 0.005022 second
CPU overhead/iter = 0.053426 ms
CPU overhead(%) wrt reference = 1546.221786
CHUNK SIZE = 8
-- Testing 4 threads
WC Timing = 19.207667 second
Standard deviation = 0.013768 second
WC overhead = 17.880667 second
Standard deviation = 0.013768 second
WC overhead/iter = 0.046564 ms
WC overhead(%) wrt reference = 1347.450390
CPU Timing = 19.183268 second
Standard deviation = 0.006445 second
CPU overhead = 17.856445 second
Standard deviation = 0.007920 second
CPU overhead/iter = 0.046501 ms
CPU overhead(%) wrt reference = 1345.804711
CHUNK SIZE = 16
-- Testing 4 threads
WC Timing = 16.434333 second
Standard deviation = 0.009428 second
WC overhead = 15.107333 second
Standard deviation = 0.009428 second
WC overhead/iter = 0.039342 ms
WC overhead(%) wrt reference = 1138.457673
CPU Timing = 16.410156 second
Standard deviation = 0.025553 second
CPU overhead = 15.083333 second
Standard deviation = 0.025964 second
CPU overhead/iter = 0.039280 ms
CPU overhead(%) wrt reference = 1136.800785
CHUNK SIZE = 32
-- Testing 4 threads
WC Timing = 11.927667 second
Standard deviation = 0.036234 second
WC overhead = 10.600667 second
Standard deviation = 0.036234 second
WC overhead/iter = 0.027606 ms
WC overhead(%) wrt reference = 798.844513
CPU Timing = 11.900716 second
Standard deviation = 0.027854 second
CPU overhead = 10.573893 second
Standard deviation = 0.028232 second
CPU overhead/iter = 0.027536 ms
CPU overhead(%) wrt reference = 796.933268
CHUNK SIZE = 1
-- Testing 2 threads
WC Timing = 9.784333 second
Standard deviation = 0.042664 second
WC overhead = 8.457333 second
Standard deviation = 0.042664 second
WC overhead/iter = 0.022024 ms
WC overhead(%) wrt reference = 637.327304
CPU Timing = 9.777995 second
Standard deviation = 0.041900 second
CPU overhead = 8.451172 second
Standard deviation = 0.042152 second
CPU overhead/iter = 0.022008 ms
CPU overhead(%) wrt reference = 636.947988
CHUNK SIZE = 2
-- Testing 2 threads
WC Timing = 9.047333 second
Standard deviation = 0.000943 second
WC overhead = 7.720333 second
Standard deviation = 0.000943 second
WC overhead/iter = 0.020105 ms
WC overhead(%) wrt reference = 581.788496
CPU Timing = 9.048177 second
Standard deviation = 0.007536 second
CPU overhead = 7.721354 second
Standard deviation = 0.008831 second
CPU overhead/iter = 0.020108 ms
CPU overhead(%) wrt reference = 581.943081
CHUNK SIZE = 4
-- Testing 2 threads
WC Timing = 8.290667 second
Standard deviation = 0.024445 second
WC overhead = 6.963667 second
Standard deviation = 0.024445 second
WC overhead/iter = 0.018135 ms
WC overhead(%) wrt reference = 524.767646
CPU Timing = 8.296875 second
Standard deviation = 0.030758 second
CPU overhead = 6.970052 second
Standard deviation = 0.031100 second
CPU overhead/iter = 0.018151 ms
CPU overhead(%) wrt reference = 525.318940
CHUNK SIZE = 8
-- Testing 2 threads
WC Timing = 8.066333 second
Standard deviation = 0.044649 second
WC overhead = 6.739333 second
Standard deviation = 0.044649 second
WC overhead/iter = 0.017550 ms
WC overhead(%) wrt reference = 507.862347
CPU Timing = 8.072266 second
Standard deviation = 0.037365 second
CPU overhead = 6.745443 second
Standard deviation = 0.037648 second
CPU overhead/iter = 0.017566 ms
CPU overhead(%) wrt reference = 508.390579
CHUNK SIZE = 16
-- Testing 2 threads
WC Timing = 9.907667 second
Standard deviation = 0.081344 second
WC overhead = 8.580667 second
Standard deviation = 0.081344 second
WC overhead/iter = 0.022345 ms
WC overhead(%) wrt reference = 646.621452
CPU Timing = 9.911458 second
Standard deviation = 0.072104 second
CPU overhead = 8.584635 second
Standard deviation = 0.072251 second
CPU overhead/iter = 0.022356 ms
CPU overhead(%) wrt reference = 647.006869
CHUNK SIZE = 32
-- Testing 2 threads
WC Timing = 8.145333 second
Standard deviation = 0.028288 second
WC overhead = 6.818333 second
Standard deviation = 0.028288 second
WC overhead/iter = 0.017756 ms
WC overhead(%) wrt reference = 513.815625
CPU Timing = 8.139974 second
Standard deviation = 0.027126 second
CPU overhead = 6.813151 second
Standard deviation = 0.027514 second
CPU overhead/iter = 0.017743 ms
CPU overhead(%) wrt reference = 513.493621
CHUNK SIZE = 1
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468726
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 2
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468727
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 4
-- Testing 1 threads
WC Timing = 1.519333 second
Standard deviation = 0.000471 second
WC overhead = 0.192333 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000501 ms
WC overhead(%) wrt reference = 14.493845
CPU Timing = 1.520833 second
Standard deviation = 0.001841 second
CPU overhead = 0.194010 second
Standard deviation = 0.004958 second
CPU overhead/iter = 0.000505 ms
CPU overhead(%) wrt reference = 14.622179
CHUNK SIZE = 8
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468727
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
CHUNK SIZE = 16
-- Testing 1 threads
WC Timing = 1.519000 second
Standard deviation = 0.000000 second
WC overhead = 0.192000 second
Standard deviation = 0.000000 second
WC overhead/iter = 0.000500 ms
WC overhead(%) wrt reference = 14.468726
CPU Timing = 1.516927 second
Standard deviation = 0.003683 second
CPU overhead = 0.190104 second
Standard deviation = 0.005895 second
CPU overhead/iter = 0.000495 ms
CPU overhead(%) wrt reference = 14.327772
CHUNK SIZE = 32
-- Testing 1 threads
WC Timing = 1.519333 second
Standard deviation = 0.000471 second
WC overhead = 0.192333 second
Standard deviation = 0.000471 second
WC overhead/iter = 0.000501 ms
WC overhead(%) wrt reference = 14.493845
CPU Timing = 1.519531 second
Standard deviation = 0.000000 second
CPU overhead = 0.192708 second
Standard deviation = 0.004604 second
CPU overhead/iter = 0.000502 ms
CPU overhead(%) wrt reference = 14.524043
***** Finished


*******************************
* ELAPSE TIME = 6212.912109
*******************************



***** Start Testing : !$OMP do reduction
-- iter_facotr : 40
-- try_count : 1
-- delay_time : 0.008333 ms
-- Running Reference case
WC Timing = 1.237667 second
Standard deviation = 0.005185 second
CPU Timing = 9.873698 second
Standard deviation = 0.061708 second
-- Testing 8 threads
WC Timing = 1.945667 second
Standard deviation = 0.019293 second
WC overhead = 0.708000 second
Standard deviation = 0.019978 second
WC overhead/iter = 0.069141 ms
WC overhead(%) wrt reference = 57.204415
CPU Timing = 1.942383 second
Standard deviation = 0.018661 second
CPU overhead = -7.931315 second
Standard deviation = 0.064468 second
CPU overhead/iter = -0.774542 ms
CPU overhead(%) wrt reference = -80.327707
-- Running Reference case
WC Timing = 0.622667 second
Standard deviation = 0.000943 second
CPU Timing = 2.485677 second
Standard deviation = 0.004872 second
-- Testing 4 threads
WC Timing = 1.016667 second
Standard deviation = 0.009104 second
WC overhead = 0.394000 second
Standard deviation = 0.009153 second
WC overhead/iter = 0.038477 ms
WC overhead(%) wrt reference = 63.276232
CPU Timing = 1.017904 second
Standard deviation = 0.007987 second
CPU overhead = -1.467773 second
Standard deviation = 0.009356 second
CPU overhead/iter = -0.143337 ms
CPU overhead(%) wrt reference = -59.049240
-- Running Reference case
WC Timing = 0.315333 second
Standard deviation = 0.001247 second
CPU Timing = 0.632812 second
Standard deviation = 0.011500 second
-- Testing 2 threads
WC Timing = 0.543667 second
Standard deviation = 0.011441 second
WC overhead = 0.228333 second
Standard deviation = 0.011508 second
WC overhead/iter = 0.022298 ms
WC overhead(%) wrt reference = 72.410147
CPU Timing = 0.543620 second
Standard deviation = 0.012988 second
CPU overhead = -0.089193 second
Standard deviation = 0.017348 second
CPU overhead/iter = -0.008710 ms
CPU overhead(%) wrt reference = -14.094650
-- Running Reference case
WC Timing = 0.155000 second
Standard deviation = 0.000000 second
CPU Timing = 0.156250 second
Standard deviation = 0.005524 second
-- Testing 1 threads
WC Timing = 0.164333 second
Standard deviation = 0.002357 second
WC overhead = 0.009333 second
Standard deviation = 0.002357 second
WC overhead/iter = 0.000911 ms
WC overhead(%) wrt reference = 6.021495
CPU Timing = 0.162760 second
Standard deviation = 0.003683 second
CPU overhead = 0.006510 second
Standard deviation = 0.006639 second
CPU overhead/iter = 0.000636 ms
CPU overhead(%) wrt reference = 4.166667
***** Finished


*******************************
* ELAPSE TIME = 18.014999
*******************************



***** Start Testing : !$OMP single
-- iter_facotr : 500
-- try_count : 1
-- delay_time : 0.003333 ms
-- Running Reference case
WC Timing = 1.301000 second
Standard deviation = 0.006377 second
CPU Timing = 1.300944 second
Standard deviation = 0.005727 second
-- Testing 8 threads
WC Timing = 3.042333 second
Standard deviation = 0.013474 second
WC overhead = 1.741333 second
Standard deviation = 0.014907 second
WC overhead/iter = 0.013604 ms
WC overhead(%) wrt reference = 133.845756
CPU Timing = 24.316406 second
Standard deviation = 0.087753 second
CPU overhead = 23.015462 second
Standard deviation = 0.087940 second
CPU overhead/iter = 0.179808 ms
CPU overhead(%) wrt reference = 1769.135494
-- Running Reference case
WC Timing = 1.301333 second
Standard deviation = 0.007717 second
CPU Timing = 1.299805 second
Standard deviation = 0.009401 second
-- Testing 4 threads
WC Timing = 1.824333 second
Standard deviation = 0.001700 second
WC overhead = 0.523000 second
Standard deviation = 0.007902 second
WC overhead/iter = 0.004086 ms
WC overhead(%) wrt reference = 40.189550
CPU Timing = 7.279948 second
Standard deviation = 0.012075 second
CPU overhead = 5.980143 second
Standard deviation = 0.015303 second
CPU overhead/iter = 0.046720 ms
CPU overhead(%) wrt reference = 460.080140
-- Running Reference case
WC Timing = 1.310667 second
Standard deviation = 0.002055 second
CPU Timing = 1.309896 second
Standard deviation = 0.004872 second
-- Testing 2 threads
WC Timing = 1.679000 second
Standard deviation = 0.012754 second
WC overhead = 0.368333 second
Standard deviation = 0.012919 second
WC overhead/iter = 0.002878 ms
WC overhead(%) wrt reference = 28.102747
CPU Timing = 3.352865 second
Standard deviation = 0.025976 second
CPU overhead = 2.042969 second
Standard deviation = 0.026429 second
CPU overhead/iter = 0.015961 ms
CPU overhead(%) wrt reference = 155.964215
-- Running Reference case
WC Timing = 1.297667 second
Standard deviation = 0.004190 second
CPU Timing = 1.299479 second
Standard deviation = 0.001841 second
-- Testing 1 threads
WC Timing = 1.354667 second
Standard deviation = 0.001247 second
WC overhead = 0.057000 second
Standard deviation = 0.004372 second
WC overhead/iter = 0.000445 ms
WC overhead(%) wrt reference = 4.392500
CPU Timing = 1.354167 second
Standard deviation = 0.003683 second
CPU overhead = 0.054688 second
Standard deviation = 0.004118 second
CPU overhead/iter = 0.000427 ms
CPU overhead(%) wrt reference = 4.208417
***** Finished


*******************************
* ELAPSE TIME = 39.432999
*******************************