From ab7be96410c1ddefcd06818d16a15cb03438edb5 Mon Sep 17 00:00:00 2001 From: Sankalp Date: Tue, 10 Feb 2015 23:26:04 -0500 Subject: [PATCH 01/11] initial results --- sankalp/clang_output_100 | 190 +++++++++++----------- sankalp/clang_output_1000 | 210 ++++++++++++------------ sankalp/clang_output_3000 | 180 ++++++++++++++++++++ sankalp/clang_output_optimized_100 | 180 ++++++++++++++++++++ sankalp/clang_output_optimized_1000 | 180 ++++++++++++++++++++ sankalp/clang_output_optimized_3000 | 180 ++++++++++++++++++++ sankalp/gcc_output_100 | 184 ++++++++++----------- sankalp/gcc_output_1000 | 208 ++++++++++++------------ sankalp/gcc_output_3000 | 180 ++++++++++++++++++++ sankalp/gcc_output_optimized_100 | 180 ++++++++++++++++++++ sankalp/gcc_output_optimized_1000 | 180 ++++++++++++++++++++ sankalp/gcc_output_optimized_3000 | 180 ++++++++++++++++++++ sankalp/java_output_100 | 244 ++++++++++++++-------------- sankalp/java_output_1000 | 242 +++++++++++++-------------- sankalp/java_output_3000 | 180 ++++++++++++++++++++ sankalp/python_output_100 | 220 ++++++++++++------------- sankalp/python_output_1000 | 214 ++++++++++++------------ sankalp/python_output_3000 | 180 ++++++++++++++++++++ 18 files changed, 2656 insertions(+), 856 deletions(-) create mode 100644 sankalp/clang_output_3000 create mode 100644 sankalp/clang_output_optimized_100 create mode 100644 sankalp/clang_output_optimized_1000 create mode 100644 sankalp/clang_output_optimized_3000 create mode 100644 sankalp/gcc_output_3000 create mode 100644 sankalp/gcc_output_optimized_100 create mode 100644 sankalp/gcc_output_optimized_1000 create mode 100644 sankalp/gcc_output_optimized_3000 create mode 100644 sankalp/java_output_3000 create mode 100644 sankalp/python_output_3000 diff --git a/sankalp/clang_output_100 b/sankalp/clang_output_100 index b8581c8..62ab0c3 100644 --- a/sankalp/clang_output_100 +++ b/sankalp/clang_output_100 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for './matrixMultiply_clang 100': - 7.081909 task-clock # 0.296 CPUs utilized + 7.053268 task-clock # 0.907 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 159 page-faults # 0.022 M/sec - 21,539,725 cycles # 3.042 GHz [43.77%] - 10,064,535 stalled-cycles-frontend # 46.73% frontend cycles idle - 1,705,546 stalled-cycles-backend # 7.92% backend cycles idle - 26,014,618 instructions # 1.21 insns per cycle - # 0.39 stalled cycles per insn - 2,497,944 branches # 352.722 M/sec - 11,875 branch-misses # 0.48% of all branches [74.92%] + 158 page-faults # 0.022 M/sec + 21,542,512 cycles # 3.054 GHz [43.51%] + 10,448,377 stalled-cycles-frontend # 48.50% frontend cycles idle + 1,620,562 stalled-cycles-backend # 7.52% backend cycles idle + 26,010,263 instructions # 1.21 insns per cycle + # 0.40 stalled cycles per insn + 2,497,209 branches # 354.050 M/sec + 11,897 branch-misses # 0.48% of all branches [71.92%] - 0.023890850 seconds time elapsed + 0.007776978 seconds time elapsed Iteration 2 Performance counter stats for './matrixMultiply_clang 100': - 7.115157 task-clock # 0.390 CPUs utilized + 7.156865 task-clock # 0.912 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 158 page-faults # 0.022 M/sec - 21,621,287 cycles # 3.039 GHz [44.01%] - 11,198,669 stalled-cycles-frontend # 51.79% frontend cycles idle - 1,760,875 stalled-cycles-backend # 8.14% backend cycles idle - 26,010,939 instructions # 1.20 insns per cycle - # 0.43 stalled cycles per insn - 2,496,532 branches # 350.875 M/sec - 11,961 branch-misses # 0.48% of all branches [66.39%] + 21,858,485 cycles # 3.054 GHz [45.75%] + 6,691,620 stalled-cycles-frontend # 30.61% frontend cycles idle + 2,072,908 stalled-cycles-backend # 9.48% backend cycles idle + 26,016,488 instructions # 1.19 insns per cycle + # 0.26 stalled cycles per insn + 2,497,845 branches # 349.014 M/sec + 17,479 branch-misses # 0.70% of all branches - 0.018257320 seconds time elapsed + 0.007849703 seconds time elapsed Iteration 3 Performance counter stats for './matrixMultiply_clang 100': - 7.079986 task-clock # 0.347 CPUs utilized + 7.165353 task-clock # 0.909 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 158 page-faults # 0.022 M/sec - 10,701,717 cycles # 1.512 GHz - 12,488,960 stalled-cycles-frontend # 116.70% frontend cycles idle - 1,879,249 stalled-cycles-backend # 17.56% backend cycles idle - 26,014,281 instructions # 2.43 insns per cycle - # 0.48 stalled cycles per insn - 2,497,901 branches # 352.812 M/sec - 12,145 branch-misses # 0.49% of all branches [50.52%] + 21,780,583 cycles # 3.040 GHz [44.38%] + 7,179,660 stalled-cycles-frontend # 32.96% frontend cycles idle + 2,012,094 stalled-cycles-backend # 9.24% backend cycles idle + 26,010,882 instructions # 1.19 insns per cycle + # 0.28 stalled cycles per insn + 2,497,319 branches # 348.527 M/sec + 15,296 branch-misses # 0.61% of all branches [98.02%] - 0.020401132 seconds time elapsed + 0.007883982 seconds time elapsed Iteration 4 Performance counter stats for './matrixMultiply_clang 100': - 7.161954 task-clock # 0.349 CPUs utilized + 7.098440 task-clock # 0.923 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.022 M/sec - 21,783,309 cycles # 3.042 GHz [44.34%] - 7,013,348 stalled-cycles-frontend # 32.20% frontend cycles idle - 1,999,347 stalled-cycles-backend # 9.18% backend cycles idle - 26,014,845 instructions # 1.19 insns per cycle - # 0.27 stalled cycles per insn - 2,498,010 branches # 348.789 M/sec - 17,107 branch-misses # 0.68% of all branches [99.46%] + 21,662,885 cycles # 3.052 GHz [43.88%] + 8,869,299 stalled-cycles-frontend # 40.94% frontend cycles idle + 1,888,070 stalled-cycles-backend # 8.72% backend cycles idle + 26,015,267 instructions # 1.20 insns per cycle + # 0.34 stalled cycles per insn + 2,498,064 branches # 351.917 M/sec + 11,733 branch-misses # 0.47% of all branches [84.57%] - 0.020511924 seconds time elapsed + 0.007692507 seconds time elapsed Iteration 5 Performance counter stats for './matrixMultiply_clang 100': - 7.091759 task-clock # 0.382 CPUs utilized + 7.074668 task-clock # 0.881 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 158 page-faults # 0.022 M/sec - 21,631,594 cycles # 3.050 GHz [43.90%] - 8,052,137 stalled-cycles-frontend # 37.22% frontend cycles idle - 1,018,814 stalled-cycles-backend # 4.71% backend cycles idle - 26,016,589 instructions # 1.20 insns per cycle - # 0.31 stalled cycles per insn - 2,498,309 branches # 352.283 M/sec - 11,726 branch-misses # 0.47% of all branches [90.77%] + 159 page-faults # 0.022 M/sec + 9,777,089 cycles # 1.382 GHz + 12,454,494 stalled-cycles-frontend # 127.38% frontend cycles idle + 406,671 stalled-cycles-backend # 4.16% backend cycles idle + 26,021,599 instructions # 2.66 insns per cycle + # 0.48 stalled cycles per insn + 2,498,735 branches # 353.195 M/sec + 12,178 branch-misses # 0.49% of all branches [54.81%] - 0.018581414 seconds time elapsed + 0.008028569 seconds time elapsed Iteration 6 Performance counter stats for './matrixMultiply_clang 100': - 7.058442 task-clock # 0.403 CPUs utilized + 7.085217 task-clock # 0.921 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 159 page-faults # 0.023 M/sec - 10,308,729 cycles # 1.460 GHz - 12,432,356 stalled-cycles-frontend # 120.60% frontend cycles idle - 1,782,986 stalled-cycles-backend # 17.30% backend cycles idle - 26,009,608 instructions # 2.52 insns per cycle - # 0.48 stalled cycles per insn - 2,497,040 branches # 353.766 M/sec - 12,110 branch-misses # 0.48% of all branches [52.22%] + 159 page-faults # 0.022 M/sec + 21,555,105 cycles # 3.042 GHz [43.77%] + 7,800,102 stalled-cycles-frontend # 36.19% frontend cycles idle + 1,788,484 stalled-cycles-backend # 8.30% backend cycles idle + 26,025,558 instructions # 1.21 insns per cycle + # 0.30 stalled cycles per insn + 2,499,437 branches # 352.768 M/sec + 11,719 branch-misses # 0.47% of all branches [92.55%] - 0.017501458 seconds time elapsed + 0.007694468 seconds time elapsed Iteration 7 Performance counter stats for './matrixMultiply_clang 100': - 7.138612 task-clock # 0.384 CPUs utilized + 7.112728 task-clock # 0.634 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.022 M/sec - 10,763,929 cycles # 1.508 GHz - 12,648,274 stalled-cycles-frontend # 117.51% frontend cycles idle - 2,015,841 stalled-cycles-backend # 18.73% backend cycles idle - 26,010,962 instructions # 2.42 insns per cycle - # 0.49 stalled cycles per insn - 2,497,304 branches # 349.830 M/sec - 12,092 branch-misses # 0.48% of all branches [50.74%] + 21,725,477 cycles # 3.054 GHz [45.19%] + 6,733,958 stalled-cycles-frontend # 31.00% frontend cycles idle + 1,849,361 stalled-cycles-backend # 8.51% backend cycles idle + 26,024,358 instructions # 1.20 insns per cycle + # 0.26 stalled cycles per insn + 2,499,211 branches # 351.372 M/sec + 17,591 branch-misses # 0.70% of all branches - 0.018570746 seconds time elapsed + 0.011223178 seconds time elapsed Iteration 8 Performance counter stats for './matrixMultiply_clang 100': - 7.118796 task-clock # 0.324 CPUs utilized + 7.068877 task-clock # 0.921 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 158 page-faults # 0.022 M/sec - 21,667,171 cycles # 3.044 GHz [44.04%] - 12,063,028 stalled-cycles-frontend # 55.67% frontend cycles idle - 1,636,765 stalled-cycles-backend # 7.55% backend cycles idle - 26,017,653 instructions # 1.20 insns per cycle - # 0.46 stalled cycles per insn - 2,498,553 branches # 350.980 M/sec - 12,127 branch-misses # 0.49% of all branches [59.82%] + 159 page-faults # 0.022 M/sec + 21,592,249 cycles # 3.055 GHz [43.63%] + 7,807,904 stalled-cycles-frontend # 36.16% frontend cycles idle + 1,825,484 stalled-cycles-backend # 8.45% backend cycles idle + 26,012,472 instructions # 1.20 insns per cycle + # 0.30 stalled cycles per insn + 2,497,566 branches # 353.319 M/sec + 11,719 branch-misses # 0.47% of all branches [92.66%] - 0.021960130 seconds time elapsed + 0.007675305 seconds time elapsed Iteration 9 Performance counter stats for './matrixMultiply_clang 100': - 7.156216 task-clock # 0.405 CPUs utilized + 7.096350 task-clock # 0.916 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.022 M/sec - 21,827,960 cycles # 3.050 GHz [44.35%] - 11,521,800 stalled-cycles-frontend # 52.78% frontend cycles idle - 2,057,334 stalled-cycles-backend # 9.43% backend cycles idle - 26,022,933 instructions # 1.19 insns per cycle - # 0.44 stalled cycles per insn - 2,499,369 branches # 349.258 M/sec - 11,919 branch-misses # 0.48% of all branches [64.67%] + 21,606,442 cycles # 3.045 GHz [43.82%] + 9,785,352 stalled-cycles-frontend # 45.29% frontend cycles idle + 1,812,444 stalled-cycles-backend # 8.39% backend cycles idle + 26,027,894 instructions # 1.20 insns per cycle + # 0.38 stalled cycles per insn + 2,499,871 branches # 352.276 M/sec + 11,876 branch-misses # 0.48% of all branches [77.30%] - 0.017682175 seconds time elapsed + 0.007747817 seconds time elapsed Iteration 10 Performance counter stats for './matrixMultiply_clang 100': - 7.179453 task-clock # 0.347 CPUs utilized + 7.154863 task-clock # 0.920 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 158 page-faults # 0.022 M/sec - 21,825,556 cycles # 3.040 GHz [44.51%] - 11,949,081 stalled-cycles-frontend # 54.75% frontend cycles idle - 2,055,046 stalled-cycles-backend # 9.42% backend cycles idle - 26,016,430 instructions # 1.19 insns per cycle - # 0.46 stalled cycles per insn - 2,498,034 branches # 347.942 M/sec - 11,995 branch-misses # 0.48% of all branches [61.55%] - - 0.020701153 seconds time elapsed + 21,831,902 cycles # 3.051 GHz [44.34%] + 10,234,895 stalled-cycles-frontend # 46.88% frontend cycles idle + 2,001,267 stalled-cycles-backend # 9.17% backend cycles idle + 26,012,404 instructions # 1.19 insns per cycle + # 0.39 stalled cycles per insn + 2,497,750 branches # 349.098 M/sec + 11,843 branch-misses # 0.47% of all branches [74.43%] + + 0.007774080 seconds time elapsed diff --git a/sankalp/clang_output_1000 b/sankalp/clang_output_1000 index e8c639e..9a89831 100644 --- a/sankalp/clang_output_1000 +++ b/sankalp/clang_output_1000 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for './matrixMultiply_clang 1000': - 8769.076082 task-clock # 0.997 CPUs utilized + 8772.711871 task-clock # 0.997 CPUs utilized 11 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 3,074 page-faults # 0.000 M/sec - 26,838,781,079 cycles # 3.061 GHz [83.34%] - 18,717,658,625 stalled-cycles-frontend # 69.74% frontend cycles idle [83.35%] - 6,713,364,797 stalled-cycles-backend # 25.01% backend cycles idle [66.69%] - 24,147,234,143 instructions # 0.90 insns per cycle + 3,075 page-faults # 0.000 M/sec + 26,862,536,545 cycles # 3.062 GHz [83.32%] + 18,725,249,733 stalled-cycles-frontend # 69.71% frontend cycles idle [83.31%] + 6,721,535,337 stalled-cycles-backend # 25.02% backend cycles idle [66.69%] + 24,147,572,347 instructions # 0.90 insns per cycle # 0.78 stalled cycles per insn [83.35%] - 2,039,098,917 branches # 232.533 M/sec [83.35%] - 1,384,269 branch-misses # 0.07% of all branches [83.31%] + 2,039,094,766 branches # 232.436 M/sec [83.35%] + 1,418,553 branch-misses # 0.07% of all branches [83.35%] - 8.792196408 seconds time elapsed + 8.795813556 seconds time elapsed Iteration 2 Performance counter stats for './matrixMultiply_clang 1000': - 8707.169262 task-clock # 0.997 CPUs utilized - 11 context-switches # 0.000 M/sec - 0 CPU-migrations # 0.000 M/sec + 8729.146601 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec 3,074 page-faults # 0.000 M/sec - 26,661,371,630 cycles # 3.062 GHz [83.32%] - 18,528,714,106 stalled-cycles-frontend # 69.50% frontend cycles idle [83.32%] - 6,570,561,597 stalled-cycles-backend # 24.64% backend cycles idle [66.64%] - 24,147,474,932 instructions # 0.91 insns per cycle - # 0.77 stalled cycles per insn [83.32%] - 2,038,834,096 branches # 234.156 M/sec [83.36%] - 1,492,744 branch-misses # 0.07% of all branches [83.36%] + 26,728,257,650 cycles # 3.062 GHz [83.32%] + 18,598,831,843 stalled-cycles-frontend # 69.58% frontend cycles idle [83.32%] + 6,692,039,477 stalled-cycles-backend # 25.04% backend cycles idle [66.68%] + 24,143,696,220 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.36%] + 2,039,089,497 branches # 233.596 M/sec [83.36%] + 1,422,028 branch-misses # 0.07% of all branches [83.33%] - 8.729853429 seconds time elapsed + 8.751936365 seconds time elapsed Iteration 3 Performance counter stats for './matrixMultiply_clang 1000': - 8728.280704 task-clock # 0.996 CPUs utilized - 11 context-switches # 0.000 M/sec + 8743.005082 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,075 page-faults # 0.000 M/sec - 26,725,445,478 cycles # 3.062 GHz [83.31%] - 18,593,264,002 stalled-cycles-frontend # 69.57% frontend cycles idle [83.31%] - 6,414,166,461 stalled-cycles-backend # 24.00% backend cycles idle [66.67%] - 24,142,810,780 instructions # 0.90 insns per cycle - # 0.77 stalled cycles per insn [83.36%] - 2,039,114,540 branches # 233.622 M/sec [83.36%] - 1,470,269 branch-misses # 0.07% of all branches [83.35%] + 26,760,005,251 cycles # 3.061 GHz [83.34%] + 18,636,540,129 stalled-cycles-frontend # 69.64% frontend cycles idle [83.34%] + 6,696,730,595 stalled-cycles-backend # 25.03% backend cycles idle [66.69%] + 24,146,489,634 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.34%] + 2,039,117,188 branches # 233.228 M/sec [83.34%] + 1,512,869 branch-misses # 0.07% of all branches [83.32%] - 8.761864479 seconds time elapsed + 8.765745532 seconds time elapsed Iteration 4 Performance counter stats for './matrixMultiply_clang 1000': - 8739.132157 task-clock # 0.997 CPUs utilized - 11 context-switches # 0.000 M/sec + 8842.501415 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,074 page-faults # 0.000 M/sec - 26,758,988,652 cycles # 3.062 GHz [83.34%] - 18,625,435,877 stalled-cycles-frontend # 69.60% frontend cycles idle [83.34%] - 6,666,046,784 stalled-cycles-backend # 24.91% backend cycles idle [66.67%] - 24,146,277,825 instructions # 0.90 insns per cycle - # 0.77 stalled cycles per insn [83.34%] - 2,039,113,610 branches # 233.331 M/sec [83.33%] - 1,468,997 branch-misses # 0.07% of all branches [83.34%] + 27,075,333,912 cycles # 3.062 GHz [83.30%] + 18,932,760,043 stalled-cycles-frontend # 69.93% frontend cycles idle [83.34%] + 6,827,630,830 stalled-cycles-backend # 25.22% backend cycles idle [66.70%] + 24,145,756,817 instructions # 0.89 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,239,015 branches # 230.618 M/sec [83.35%] + 1,496,833 branch-misses # 0.07% of all branches [83.33%] - 8.762159807 seconds time elapsed + 8.865507756 seconds time elapsed Iteration 5 Performance counter stats for './matrixMultiply_clang 1000': - 8809.610617 task-clock # 0.997 CPUs utilized - 11 context-switches # 0.000 M/sec - 2 CPU-migrations # 0.000 M/sec - 3,075 page-faults # 0.000 M/sec - 26,973,625,450 cycles # 3.062 GHz [83.33%] - 18,839,441,332 stalled-cycles-frontend # 69.84% frontend cycles idle [83.33%] - 6,844,458,222 stalled-cycles-backend # 25.37% backend cycles idle [66.67%] - 24,146,135,534 instructions # 0.90 insns per cycle - # 0.78 stalled cycles per insn [83.33%] - 2,038,924,872 branches # 231.443 M/sec [83.33%] - 1,474,654 branch-misses # 0.07% of all branches [83.36%] + 8796.936234 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,935,212,998 cycles # 3.062 GHz [83.31%] + 18,792,486,212 stalled-cycles-frontend # 69.77% frontend cycles idle [83.31%] + 6,800,634,030 stalled-cycles-backend # 25.25% backend cycles idle [66.71%] + 24,146,395,655 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,272,337 branches # 231.816 M/sec [83.35%] + 1,994,410 branch-misses # 0.10% of all branches [83.32%] - 8.832521671 seconds time elapsed + 8.820084000 seconds time elapsed Iteration 6 Performance counter stats for './matrixMultiply_clang 1000': - 8731.664661 task-clock # 0.997 CPUs utilized - 11 context-switches # 0.000 M/sec + 8777.014189 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,075 page-faults # 0.000 M/sec - 26,734,991,494 cycles # 3.062 GHz [83.32%] - 18,600,205,731 stalled-cycles-frontend # 69.57% frontend cycles idle [83.32%] - 6,658,829,501 stalled-cycles-backend # 24.91% backend cycles idle [66.64%] - 24,146,710,783 instructions # 0.90 insns per cycle - # 0.77 stalled cycles per insn [83.32%] - 2,038,590,197 branches # 233.471 M/sec [83.36%] - 1,479,149 branch-misses # 0.07% of all branches [83.37%] + 26,875,307,479 cycles # 3.062 GHz [83.32%] + 18,740,496,292 stalled-cycles-frontend # 69.73% frontend cycles idle [83.32%] + 6,705,290,080 stalled-cycles-backend # 24.95% backend cycles idle [66.68%] + 24,144,531,987 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.36%] + 2,039,002,045 branches # 232.312 M/sec [83.36%] + 1,448,566 branch-misses # 0.07% of all branches [83.34%] - 8.754675160 seconds time elapsed + 8.799930149 seconds time elapsed Iteration 7 Performance counter stats for './matrixMultiply_clang 1000': - 8781.456874 task-clock # 0.997 CPUs utilized - 11 context-switches # 0.000 M/sec - 0 CPU-migrations # 0.000 M/sec - 3,074 page-faults # 0.000 M/sec - 26,887,726,132 cycles # 3.062 GHz [83.32%] - 18,751,149,081 stalled-cycles-frontend # 69.74% frontend cycles idle [83.32%] - 6,684,330,025 stalled-cycles-backend # 24.86% backend cycles idle [66.65%] - 24,149,943,484 instructions # 0.90 insns per cycle - # 0.78 stalled cycles per insn [83.32%] - 2,038,235,876 branches # 232.107 M/sec [83.36%] - 1,534,832 branch-misses # 0.08% of all branches [83.36%] + 8796.815931 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,935,093,613 cycles # 3.062 GHz [83.32%] + 18,796,887,746 stalled-cycles-frontend # 69.79% frontend cycles idle [83.31%] + 6,818,360,264 stalled-cycles-backend # 25.31% backend cycles idle [66.69%] + 24,148,095,266 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,005,393 branches # 231.789 M/sec [83.35%] + 1,638,652 branch-misses # 0.08% of all branches [83.35%] - 8.804251361 seconds time elapsed + 8.819932807 seconds time elapsed Iteration 8 Performance counter stats for './matrixMultiply_clang 1000': - 8795.785758 task-clock # 0.992 CPUs utilized + 8732.240674 task-clock # 0.997 CPUs utilized 10 context-switches # 0.000 M/sec - 1 CPU-migrations # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec 3,075 page-faults # 0.000 M/sec - 26,931,981,875 cycles # 3.062 GHz [83.31%] - 18,798,044,585 stalled-cycles-frontend # 69.80% frontend cycles idle [83.31%] - 6,712,144,445 stalled-cycles-backend # 24.92% backend cycles idle [66.70%] - 24,146,517,257 instructions # 0.90 insns per cycle - # 0.78 stalled cycles per insn [83.35%] - 2,039,265,646 branches # 231.846 M/sec [83.35%] - 1,412,000 branch-misses # 0.07% of all branches [83.33%] + 26,737,479,415 cycles # 3.062 GHz [83.32%] + 18,601,807,786 stalled-cycles-frontend # 69.57% frontend cycles idle [83.32%] + 6,561,397,504 stalled-cycles-backend # 24.54% backend cycles idle [66.64%] + 24,149,772,261 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.32%] + 2,038,395,170 branches # 233.433 M/sec [83.36%] + 1,485,301 branch-misses # 0.07% of all branches [83.36%] - 8.867892519 seconds time elapsed + 8.757509097 seconds time elapsed Iteration 9 Performance counter stats for './matrixMultiply_clang 1000': - 8791.557708 task-clock # 0.997 CPUs utilized - 10 context-switches # 0.000 M/sec + 8706.559421 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,075 page-faults # 0.000 M/sec - 26,912,031,887 cycles # 3.061 GHz [83.30%] - 18,778,586,140 stalled-cycles-frontend # 69.78% frontend cycles idle [83.34%] - 6,841,179,980 stalled-cycles-backend # 25.42% backend cycles idle [66.69%] - 24,147,072,411 instructions # 0.90 insns per cycle - # 0.78 stalled cycles per insn [83.34%] - 2,039,492,116 branches # 231.983 M/sec [83.34%] - 1,463,732 branch-misses # 0.07% of all branches [83.34%] + 26,659,676,782 cycles # 3.062 GHz [83.32%] + 18,523,302,399 stalled-cycles-frontend # 69.48% frontend cycles idle [83.32%] + 6,570,207,292 stalled-cycles-backend # 24.64% backend cycles idle [66.67%] + 24,136,767,039 instructions # 0.91 insns per cycle + # 0.77 stalled cycles per insn [83.36%] + 2,038,880,459 branches # 234.178 M/sec [83.36%] + 1,511,548 branch-misses # 0.07% of all branches [83.36%] - 8.814620354 seconds time elapsed + 8.729259859 seconds time elapsed Iteration 10 Performance counter stats for './matrixMultiply_clang 1000': - 8702.176014 task-clock # 0.997 CPUs utilized - 10 context-switches # 0.000 M/sec + 8744.544589 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,074 page-faults # 0.000 M/sec - 26,645,316,492 cycles # 3.062 GHz [83.31%] - 18,513,602,676 stalled-cycles-frontend # 69.48% frontend cycles idle [83.31%] - 6,473,846,309 stalled-cycles-backend # 24.30% backend cycles idle [66.71%] - 24,146,713,933 instructions # 0.91 insns per cycle - # 0.77 stalled cycles per insn [83.36%] - 2,039,226,629 branches # 234.335 M/sec [83.35%] - 1,443,603 branch-misses # 0.07% of all branches [83.32%] - - 8.725090631 seconds time elapsed + 26,775,031,633 cycles # 3.062 GHz [83.30%] + 18,640,605,103 stalled-cycles-frontend # 69.62% frontend cycles idle [83.34%] + 6,628,187,063 stalled-cycles-backend # 24.76% backend cycles idle [66.69%] + 24,147,316,203 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.35%] + 2,038,977,599 branches # 233.171 M/sec [83.35%] + 1,410,532 branch-misses # 0.07% of all branches [83.34%] + + 8.767426048 seconds time elapsed diff --git a/sankalp/clang_output_3000 b/sankalp/clang_output_3000 new file mode 100644 index 0000000..67b7ded --- /dev/null +++ b/sankalp/clang_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 3000': + + 435870.895044 task-clock # 0.997 CPUs utilized + 547 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,334,464,156,843 cycles # 3.062 GHz [83.33%] + 1,116,588,716,003 stalled-cycles-frontend # 83.67% frontend cycles idle [83.33%] + 760,549,402,793 stalled-cycles-backend # 56.99% backend cycles idle [66.67%] + 649,625,214,346 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,405,175,566 branches # 124.819 M/sec [83.33%] + 31,641,759 branch-misses # 0.06% of all branches [83.33%] + + 436.970014074 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436941.138626 task-clock # 0.997 CPUs utilized + 547 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,337,726,968,521 cycles # 3.062 GHz [83.33%] + 1,119,881,200,210 stalled-cycles-frontend # 83.72% frontend cycles idle [83.33%] + 763,263,721,765 stalled-cycles-backend # 57.06% backend cycles idle [66.67%] + 649,639,608,656 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,408,743,887 branches # 124.522 M/sec [83.33%] + 30,480,854 branch-misses # 0.06% of all branches [83.33%] + + 438.038257320 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436215.746174 task-clock # 0.997 CPUs utilized + 545 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,335,345,423,489 cycles # 3.061 GHz [83.33%] + 1,117,485,526,106 stalled-cycles-frontend # 83.69% frontend cycles idle [83.33%] + 759,502,326,023 stalled-cycles-backend # 56.88% backend cycles idle [66.67%] + 649,657,788,647 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,408,979,455 branches # 124.730 M/sec [83.33%] + 29,850,475 branch-misses # 0.05% of all branches [83.33%] + + 437.311297435 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 3000': + + 434660.839337 task-clock # 0.997 CPUs utilized + 544 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,330,746,441,063 cycles # 3.062 GHz [83.33%] + 1,112,865,667,103 stalled-cycles-frontend # 83.63% frontend cycles idle [83.33%] + 755,733,809,906 stalled-cycles-backend # 56.79% backend cycles idle [66.67%] + 649,629,467,424 instructions # 0.49 insns per cycle + # 1.71 stalled cycles per insn [83.33%] + 54,405,944,056 branches # 125.169 M/sec [83.33%] + 30,324,200 branch-misses # 0.06% of all branches [83.33%] + + 435.752964281 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 3000': + + 438781.815155 task-clock # 0.997 CPUs utilized + 550 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,343,359,727,224 cycles # 3.062 GHz [83.33%] + 1,125,419,926,576 stalled-cycles-frontend # 83.78% frontend cycles idle [83.33%] + 768,084,785,121 stalled-cycles-backend # 57.18% backend cycles idle [66.67%] + 649,665,121,934 instructions # 0.48 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,408,662,474 branches # 123.999 M/sec [83.33%] + 30,594,105 branch-misses # 0.06% of all branches [83.33%] + + 439.883691061 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436113.735318 task-clock # 0.997 CPUs utilized + 546 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,335,204,076,506 cycles # 3.062 GHz [83.33%] + 1,117,295,887,936 stalled-cycles-frontend # 83.68% frontend cycles idle [83.33%] + 749,322,042,821 stalled-cycles-backend # 56.12% backend cycles idle [66.67%] + 649,625,709,220 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,406,397,138 branches # 124.753 M/sec [83.33%] + 30,194,121 branch-misses # 0.06% of all branches [83.33%] + + 437.209951172 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436287.286674 task-clock # 0.997 CPUs utilized + 546 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,335,745,938,506 cycles # 3.062 GHz [83.33%] + 1,117,869,103,390 stalled-cycles-frontend # 83.69% frontend cycles idle [83.33%] + 758,032,143,399 stalled-cycles-backend # 56.75% backend cycles idle [66.67%] + 649,644,491,128 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,406,028,719 branches # 124.702 M/sec [83.33%] + 30,072,867 branch-misses # 0.06% of all branches [83.33%] + + 437.394865809 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 3000': + + 437543.330568 task-clock # 0.997 CPUs utilized + 546 context-switches # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,339,450,532,302 cycles # 3.061 GHz [83.33%] + 1,121,680,166,977 stalled-cycles-frontend # 83.74% frontend cycles idle [83.33%] + 764,834,662,020 stalled-cycles-backend # 57.10% backend cycles idle [66.67%] + 649,641,184,728 instructions # 0.49 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,409,529,224 branches # 124.352 M/sec [83.33%] + 30,174,500 branch-misses # 0.06% of all branches [83.33%] + + 438.656887155 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 3000': + + 437737.932628 task-clock # 0.997 CPUs utilized + 549 context-switches # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,340,168,475,305 cycles # 3.062 GHz [83.33%] + 1,122,266,697,544 stalled-cycles-frontend # 83.74% frontend cycles idle [83.33%] + 762,038,651,178 stalled-cycles-backend # 56.86% backend cycles idle [66.67%] + 649,657,223,429 instructions # 0.48 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,407,338,177 branches # 124.292 M/sec [83.33%] + 29,532,180 branch-misses # 0.05% of all branches [83.33%] + + 438.836735033 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 3000': + + 438463.682513 task-clock # 0.997 CPUs utilized + 548 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,342,374,344,170 cycles # 3.062 GHz [83.33%] + 1,124,481,215,389 stalled-cycles-frontend # 83.77% frontend cycles idle [83.33%] + 765,398,751,304 stalled-cycles-backend # 57.02% backend cycles idle [66.67%] + 649,726,904,426 instructions # 0.48 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,402,887,069 branches # 124.076 M/sec [83.33%] + 30,000,209 branch-misses # 0.06% of all branches [83.33%] + + 439.566853455 seconds time elapsed + diff --git a/sankalp/clang_output_optimized_100 b/sankalp/clang_output_optimized_100 new file mode 100644 index 0000000..0924dc0 --- /dev/null +++ b/sankalp/clang_output_optimized_100 @@ -0,0 +1,180 @@ +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.962034 task-clock # 0.665 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.081 M/sec + 6,010,763 cycles # 3.064 GHz + 884,158 stalled-cycles-frontend # 14.71% frontend cycles idle + 737,567 stalled-cycles-backend # 12.27% backend cycles idle + 11,047,971 instructions # 1.84 insns per cycle + # 0.08 stalled cycles per insn + 1,468,085 branches # 748.246 M/sec + branch-misses + + 0.002949295 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.948140 task-clock # 0.439 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,966,906 cycles # 3.063 GHz + 855,303 stalled-cycles-frontend # 14.33% frontend cycles idle + 694,676 stalled-cycles-backend # 11.64% backend cycles idle + 11,045,804 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,692 branches # 753.381 M/sec + branch-misses + + 0.004435255 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.947260 task-clock # 0.765 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,964,814 cycles # 3.063 GHz + 855,649 stalled-cycles-frontend # 14.34% frontend cycles idle + 710,245 stalled-cycles-backend # 11.91% backend cycles idle + 11,043,997 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,392 branches # 753.568 M/sec + branch-misses + + 0.002546083 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.947560 task-clock # 0.765 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,952,625 cycles # 3.056 GHz + 850,406 stalled-cycles-frontend # 14.29% frontend cycles idle + 375,296 stalled-cycles-backend # 6.30% backend cycles idle + 11,022,704 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,463,754 branches # 751.584 M/sec + branch-misses + + 0.002546145 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.943698 task-clock # 0.674 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,952,763 cycles # 3.063 GHz + 846,909 stalled-cycles-frontend # 14.23% frontend cycles idle + 708,785 stalled-cycles-backend # 11.91% backend cycles idle + 11,039,332 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,466,568 branches # 754.525 M/sec + branch-misses + + 0.002885840 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.949368 task-clock # 0.765 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,970,129 cycles # 3.063 GHz + 859,909 stalled-cycles-frontend # 14.40% frontend cycles idle + 722,803 stalled-cycles-backend # 12.11% backend cycles idle + 11,045,169 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,572 branches # 752.845 M/sec + branch-misses + + 0.002548488 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 2.021036 task-clock # 0.771 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.078 M/sec + 3,528,170 cycles # 1.746 GHz + 1,009,925 stalled-cycles-frontend # 28.62% frontend cycles idle + 726,356 stalled-cycles-backend # 20.59% backend cycles idle + 11,046,780 instructions # 3.13 insns per cycle + # 0.09 stalled cycles per insn + 1,467,943 branches # 726.332 M/sec + 14,164 branch-misses # 0.96% of all branches [42.61%] + + 0.002620696 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.959283 task-clock # 0.779 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,463,297 cycles # 2.788 GHz + 862,862 stalled-cycles-frontend # 15.79% frontend cycles idle + 699,735 stalled-cycles-backend # 12.81% backend cycles idle + 11,048,711 instructions # 2.02 insns per cycle + # 0.08 stalled cycles per insn + 1,468,247 branches # 749.380 M/sec + 17,826 branch-misses # 1.21% of all branches [ 8.79%] + + 0.002515733 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.948017 task-clock # 0.780 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,966,888 cycles # 3.063 GHz + 856,064 stalled-cycles-frontend # 14.35% frontend cycles idle + 711,299 stalled-cycles-backend # 11.92% backend cycles idle + 11,046,813 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,618 branches # 753.391 M/sec + branch-misses + + 0.002498457 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.949114 task-clock # 0.785 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,952,365 cycles # 3.054 GHz + 848,125 stalled-cycles-frontend # 14.25% frontend cycles idle + 694,927 stalled-cycles-backend # 11.67% backend cycles idle + 11,033,183 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,465,119 branches # 751.685 M/sec + branch-misses + + 0.002481376 seconds time elapsed + diff --git a/sankalp/clang_output_optimized_1000 b/sankalp/clang_output_optimized_1000 new file mode 100644 index 0000000..8ca645e --- /dev/null +++ b/sankalp/clang_output_optimized_1000 @@ -0,0 +1,180 @@ +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8514.301983 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,069,051,123 cycles # 3.062 GHz [83.32%] + 20,139,826,256 stalled-cycles-frontend # 77.26% frontend cycles idle [83.32%] + 10,074,406,315 stalled-cycles-backend # 38.65% backend cycles idle [66.68%] + 9,145,854,517 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.36%] + 1,035,460,914 branches # 121.614 M/sec [83.36%] + 1,085,246 branch-misses # 0.10% of all branches [83.34%] + + 8.536668414 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8533.423369 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,129,292,006 cycles # 3.062 GHz [83.31%] + 20,207,838,356 stalled-cycles-frontend # 77.34% frontend cycles idle [83.31%] + 9,007,753,681 stalled-cycles-backend # 34.47% backend cycles idle [66.71%] + 9,149,245,795 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.35%] + 1,035,427,362 branches # 121.338 M/sec [83.35%] + 1,083,353 branch-misses # 0.10% of all branches [83.33%] + + 8.555680250 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8524.533087 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,102,555,736 cycles # 3.062 GHz [83.34%] + 20,174,883,322 stalled-cycles-frontend # 77.29% frontend cycles idle [83.34%] + 9,795,587,822 stalled-cycles-backend # 37.53% backend cycles idle [66.67%] + 9,149,253,149 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.34%] + 1,035,420,531 branches # 121.464 M/sec [83.34%] + 1,081,429 branch-misses # 0.10% of all branches [83.35%] + + 8.546955580 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8558.061972 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,204,898,727 cycles # 3.062 GHz [83.31%] + 20,288,761,306 stalled-cycles-frontend # 77.42% frontend cycles idle [83.31%] + 9,856,648,639 stalled-cycles-backend # 37.61% backend cycles idle [66.71%] + 9,149,320,923 instructions # 0.35 insns per cycle + # 2.22 stalled cycles per insn [83.36%] + 1,035,453,678 branches # 120.992 M/sec [83.36%] + 1,081,282 branch-misses # 0.10% of all branches [83.32%] + + 8.580455767 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8513.464377 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,067,845,209 cycles # 3.062 GHz [83.32%] + 20,133,798,950 stalled-cycles-frontend # 77.24% frontend cycles idle [83.32%] + 8,624,644,078 stalled-cycles-backend # 33.09% backend cycles idle [66.67%] + 9,145,773,113 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.36%] + 1,035,458,509 branches # 121.626 M/sec [83.36%] + 1,089,716 branch-misses # 0.11% of all branches [83.35%] + + 8.535682415 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8519.104099 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,085,519,997 cycles # 3.062 GHz [83.33%] + 20,156,984,198 stalled-cycles-frontend # 77.27% frontend cycles idle [83.33%] + 8,787,917,469 stalled-cycles-backend # 33.69% backend cycles idle [66.65%] + 9,149,566,196 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.33%] + 1,034,627,980 branches # 121.448 M/sec [83.37%] + 1,113,417 branch-misses # 0.11% of all branches [83.36%] + + 8.541426918 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8525.969981 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,106,906,116 cycles # 3.062 GHz [83.30%] + 20,176,019,515 stalled-cycles-frontend # 77.28% frontend cycles idle [83.34%] + 8,065,406,321 stalled-cycles-backend # 30.89% backend cycles idle [66.68%] + 9,149,290,275 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.34%] + 1,035,439,656 branches # 121.445 M/sec [83.34%] + 1,090,091 branch-misses # 0.11% of all branches [83.34%] + + 8.548269885 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8530.756566 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,120,379,015 cycles # 3.062 GHz [83.30%] + 20,196,068,508 stalled-cycles-frontend # 77.32% frontend cycles idle [83.30%] + 9,181,947,822 stalled-cycles-backend # 35.15% backend cycles idle [66.70%] + 9,150,553,323 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.35%] + 1,035,656,501 branches # 121.403 M/sec [83.35%] + 1,099,565 branch-misses # 0.11% of all branches [83.35%] + + 8.553018234 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8537.180438 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,141,449,324 cycles # 3.062 GHz [83.31%] + 20,217,377,597 stalled-cycles-frontend # 77.34% frontend cycles idle [83.32%] + 7,883,092,404 stalled-cycles-backend # 30.16% backend cycles idle [66.67%] + 9,145,842,530 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.36%] + 1,035,464,658 branches # 121.289 M/sec [83.36%] + 1,094,606 branch-misses # 0.11% of all branches [83.35%] + + 8.561051194 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8521.967213 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,092,302,546 cycles # 3.062 GHz [83.33%] + 20,165,608,254 stalled-cycles-frontend # 77.29% frontend cycles idle [83.33%] + 9,103,949,656 stalled-cycles-backend # 34.89% backend cycles idle [66.66%] + 9,149,688,050 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.33%] + 1,035,529,349 branches # 121.513 M/sec [83.33%] + 1,095,002 branch-misses # 0.11% of all branches [83.36%] + + 8.544265295 seconds time elapsed + diff --git a/sankalp/clang_output_optimized_3000 b/sankalp/clang_output_optimized_3000 new file mode 100644 index 0000000..58371ab --- /dev/null +++ b/sankalp/clang_output_optimized_3000 @@ -0,0 +1,180 @@ +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 312664.887494 task-clock # 0.997 CPUs utilized + 392 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 957,194,643,582 cycles # 3.061 GHz [83.33%] + 801,278,508,780 stalled-cycles-frontend # 83.71% frontend cycles idle [83.33%] + 654,614,518,739 stalled-cycles-backend # 68.39% backend cycles idle [66.67%] + 244,566,461,305 instructions # 0.26 insns per cycle + # 3.28 stalled cycles per insn [83.33%] + 27,360,317,759 branches # 87.507 M/sec [83.33%] + 13,880,850 branch-misses # 0.05% of all branches [83.33%] + + 313.450793586 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 312283.288554 task-clock # 0.997 CPUs utilized + 391 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 955,893,620,144 cycles # 3.061 GHz [83.33%] + 799,959,307,996 stalled-cycles-frontend # 83.69% frontend cycles idle [83.33%] + 624,558,986,255 stalled-cycles-backend # 65.34% backend cycles idle [66.67%] + 244,567,518,923 instructions # 0.26 insns per cycle + # 3.27 stalled cycles per insn [83.33%] + 27,361,026,722 branches # 87.616 M/sec [83.33%] + 12,927,656 branch-misses # 0.05% of all branches [83.33%] + + 313.069529799 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 314069.326289 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 961,431,758,518 cycles # 3.061 GHz [83.33%] + 805,494,232,345 stalled-cycles-frontend # 83.78% frontend cycles idle [83.33%] + 630,365,211,190 stalled-cycles-backend # 65.57% backend cycles idle [66.67%] + 244,567,418,849 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,359,270,785 branches # 87.112 M/sec [83.33%] + 12,925,094 branch-misses # 0.05% of all branches [83.33%] + + 314.901173672 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313605.668691 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 960,099,341,079 cycles # 3.061 GHz [83.33%] + 804,209,745,312 stalled-cycles-frontend # 83.76% frontend cycles idle [83.33%] + 650,945,842,810 stalled-cycles-backend # 67.80% backend cycles idle [66.67%] + 244,552,833,312 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,360,236,458 branches # 87.244 M/sec [83.33%] + 13,471,738 branch-misses # 0.05% of all branches [83.33%] + + 314.393884834 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313966.377674 task-clock # 0.997 CPUs utilized + 394 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 961,182,730,314 cycles # 3.061 GHz [83.33%] + 805,474,890,245 stalled-cycles-frontend # 83.80% frontend cycles idle [83.33%] + 655,175,905,580 stalled-cycles-backend # 68.16% backend cycles idle [66.67%] + 244,546,839,813 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,360,307,420 branches # 87.144 M/sec [83.33%] + 13,625,821 branch-misses # 0.05% of all branches [83.33%] + + 314.755038625 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 315025.036094 task-clock # 0.997 CPUs utilized + 395 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 964,449,384,871 cycles # 3.062 GHz [83.33%] + 808,592,472,928 stalled-cycles-frontend # 83.84% frontend cycles idle [83.33%] + 646,222,264,512 stalled-cycles-backend # 67.00% backend cycles idle [66.67%] + 244,552,197,147 instructions # 0.25 insns per cycle + # 3.31 stalled cycles per insn [83.33%] + 27,358,770,723 branches # 86.846 M/sec [83.33%] + 13,799,312 branch-misses # 0.05% of all branches [83.33%] + + 315.816146040 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313884.082830 task-clock # 0.997 CPUs utilized + 394 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 960,938,455,254 cycles # 3.061 GHz [83.33%] + 804,967,633,007 stalled-cycles-frontend # 83.77% frontend cycles idle [83.33%] + 658,597,647,955 stalled-cycles-backend # 68.54% backend cycles idle [66.67%] + 244,565,187,191 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,361,335,010 branches # 87.170 M/sec [83.33%] + 13,868,957 branch-misses # 0.05% of all branches [83.33%] + + 314.672105390 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313070.788902 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 958,299,705,663 cycles # 3.061 GHz [83.33%] + 802,791,733,825 stalled-cycles-frontend # 83.77% frontend cycles idle [83.33%] + 620,995,884,839 stalled-cycles-backend # 64.80% backend cycles idle [66.67%] + 244,575,491,330 instructions # 0.26 insns per cycle + # 3.28 stalled cycles per insn [83.33%] + 27,361,827,022 branches # 87.398 M/sec [83.33%] + 13,026,877 branch-misses # 0.05% of all branches [83.33%] + + 313.856410059 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 315731.190936 task-clock # 0.997 CPUs utilized + 396 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 966,582,281,999 cycles # 3.061 GHz [83.33%] + 810,643,864,844 stalled-cycles-frontend # 83.87% frontend cycles idle [83.33%] + 653,645,811,041 stalled-cycles-backend # 67.62% backend cycles idle [66.67%] + 244,568,729,928 instructions # 0.25 insns per cycle + # 3.31 stalled cycles per insn [83.33%] + 27,361,596,499 branches # 86.661 M/sec [83.33%] + 13,710,796 branch-misses # 0.05% of all branches [83.33%] + + 316.523716704 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 312952.702244 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 957,972,776,248 cycles # 3.061 GHz [83.33%] + 802,443,920,049 stalled-cycles-frontend # 83.76% frontend cycles idle [83.33%] + 640,914,452,512 stalled-cycles-backend # 66.90% backend cycles idle [66.67%] + 244,578,176,924 instructions # 0.26 insns per cycle + # 3.28 stalled cycles per insn [83.33%] + 27,363,549,903 branches # 87.437 M/sec [83.33%] + 13,598,396 branch-misses # 0.05% of all branches [83.33%] + + 313.738715536 seconds time elapsed + diff --git a/sankalp/gcc_output_100 b/sankalp/gcc_output_100 index 0ae1a5c..cecefd4 100644 --- a/sankalp/gcc_output_100 +++ b/sankalp/gcc_output_100 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for './matrixMultiply 100': - 8.082594 task-clock # 0.229 CPUs utilized + 8.054504 task-clock # 0.903 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.020 M/sec - 24,637,996 cycles # 3.048 GHz [50.73%] - 6,986,651 stalled-cycles-frontend # 28.36% frontend cycles idle - 1,008,145 stalled-cycles-backend # 4.09% backend cycles idle - 52,133,562 instructions # 2.12 insns per cycle - # 0.13 stalled cycles per insn - 1,477,235 branches # 182.767 M/sec - 11,701 branch-misses # 0.79% of all branches [84.88%] + 24,610,696 cycles # 3.056 GHz [50.57%] + 7,909,722 stalled-cycles-frontend # 32.14% frontend cycles idle + 689,986 stalled-cycles-backend # 2.80% backend cycles idle + 52,144,755 instructions # 2.12 insns per cycle + # 0.15 stalled cycles per insn + 1,478,711 branches # 183.588 M/sec + 11,727 branch-misses # 0.79% of all branches [76.43%] - 0.035366218 seconds time elapsed + 0.008919947 seconds time elapsed Iteration 2 Performance counter stats for './matrixMultiply 100': - 8.050201 task-clock # 0.479 CPUs utilized + 8.117808 task-clock # 0.932 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.020 M/sec - 24,595,103 cycles # 3.055 GHz [50.55%] - 8,624,213 stalled-cycles-frontend # 35.06% frontend cycles idle - 689,549 stalled-cycles-backend # 2.80% backend cycles idle - 52,141,529 instructions # 2.12 insns per cycle - # 0.17 stalled cycles per insn - 1,478,633 branches # 183.677 M/sec - 11,859 branch-misses # 0.80% of all branches [69.94%] + 24,718,750 cycles # 3.045 GHz [50.92%] + 8,195,388 stalled-cycles-frontend # 33.15% frontend cycles idle + 897,551 stalled-cycles-backend # 3.63% backend cycles idle + 52,145,300 instructions # 2.11 insns per cycle + # 0.16 stalled cycles per insn + 1,478,850 branches # 182.174 M/sec + 11,724 branch-misses # 0.79% of all branches [74.58%] - 0.016799654 seconds time elapsed + 0.008711930 seconds time elapsed Iteration 3 Performance counter stats for './matrixMultiply 100': - 8.147851 task-clock # 0.375 CPUs utilized + 8.111482 task-clock # 0.927 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 158 page-faults # 0.019 M/sec - 24,820,799 cycles # 3.046 GHz [51.05%] - 8,571,190 stalled-cycles-frontend # 34.53% frontend cycles idle - 1,023,027 stalled-cycles-backend # 4.12% backend cycles idle - 52,141,396 instructions # 2.10 insns per cycle + 24,714,858 cycles # 3.047 GHz [50.88%] + 8,209,540 stalled-cycles-frontend # 33.22% frontend cycles idle + 698,504 stalled-cycles-backend # 2.83% backend cycles idle + 52,145,272 instructions # 2.11 insns per cycle # 0.16 stalled cycles per insn - 1,478,585 branches # 181.469 M/sec - 11,862 branch-misses # 0.80% of all branches [71.63%] + 1,478,847 branches # 182.315 M/sec + 11,726 branch-misses # 0.79% of all branches [74.46%] - 0.021745919 seconds time elapsed + 0.008749660 seconds time elapsed Iteration 4 Performance counter stats for './matrixMultiply 100': - 8.067087 task-clock # 0.404 CPUs utilized + 8.148961 task-clock # 0.917 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 159 page-faults # 0.020 M/sec - 24,615,481 cycles # 3.051 GHz [50.64%] - 7,610,015 stalled-cycles-frontend # 30.92% frontend cycles idle - 706,958 stalled-cycles-backend # 2.87% backend cycles idle - 52,143,297 instructions # 2.12 insns per cycle - # 0.15 stalled cycles per insn - 1,478,700 branches # 183.300 M/sec - 11,797 branch-misses # 0.80% of all branches [79.23%] + 158 page-faults # 0.019 M/sec + 24,818,324 cycles # 3.046 GHz [51.10%] + 6,387,176 stalled-cycles-frontend # 25.74% frontend cycles idle + 574,390 stalled-cycles-backend # 2.31% backend cycles idle + 52,168,459 instructions # 2.10 insns per cycle + # 0.12 stalled cycles per insn + 1,483,171 branches # 182.007 M/sec + 11,840 branch-misses # 0.80% of all branches [90.60%] - 0.019968319 seconds time elapsed + 0.008883245 seconds time elapsed Iteration 5 Performance counter stats for './matrixMultiply 100': - 8.073882 task-clock # 0.362 CPUs utilized + 8.087013 task-clock # 0.908 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.020 M/sec - 24,681,444 cycles # 3.057 GHz [77.01%] - 10,796,404 stalled-cycles-frontend # 43.74% frontend cycles idle [50.66%] - 655,582 stalled-cycles-backend # 2.66% backend cycles idle - 52,141,219 instructions # 2.11 insns per cycle - # 0.21 stalled cycles per insn - 1,478,123 branches # 183.075 M/sec - 17,389 branch-misses # 1.18% of all branches + 24,632,136 cycles # 3.046 GHz [50.73%] + 6,193,928 stalled-cycles-frontend # 25.15% frontend cycles idle + 772,134 stalled-cycles-backend # 3.13% backend cycles idle + 52,143,390 instructions # 2.12 insns per cycle + # 0.12 stalled cycles per insn + 1,478,507 branches # 182.825 M/sec + 11,557 branch-misses # 0.78% of all branches [91.88%] - 0.022306904 seconds time elapsed + 0.008906666 seconds time elapsed Iteration 6 Performance counter stats for './matrixMultiply 100': - 8.133306 task-clock # 0.422 CPUs utilized + 8.084764 task-clock # 0.930 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.020 M/sec - 24,829,473 cycles # 3.053 GHz [50.97%] - 9,317,416 stalled-cycles-frontend # 37.53% frontend cycles idle - 1,151,323 stalled-cycles-backend # 4.64% backend cycles idle - 52,140,727 instructions # 2.10 insns per cycle - # 0.18 stalled cycles per insn - 1,478,462 branches # 181.779 M/sec - 11,889 branch-misses # 0.80% of all branches [64.98%] + 24,635,382 cycles # 3.047 GHz [50.73%] + 10,318,247 stalled-cycles-frontend # 41.88% frontend cycles idle + 985,300 stalled-cycles-backend # 4.00% backend cycles idle + 52,144,339 instructions # 2.12 insns per cycle + # 0.20 stalled cycles per insn + 1,478,689 branches # 182.898 M/sec + 12,290 branch-misses # 0.83% of all branches [54.83%] - 0.019272832 seconds time elapsed + 0.008697934 seconds time elapsed Iteration 7 Performance counter stats for './matrixMultiply 100': - 8.088853 task-clock # 0.448 CPUs utilized + 8.080921 task-clock # 0.933 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 158 page-faults # 0.020 M/sec - 24,718,914 cycles # 3.056 GHz [50.73%] - 5,855,324 stalled-cycles-frontend # 23.69% frontend cycles idle - 800,691 stalled-cycles-backend # 3.24% backend cycles idle - 52,142,592 instructions # 2.11 insns per cycle - # 0.11 stalled cycles per insn - 1,478,383 branches # 182.768 M/sec - 11,526 branch-misses # 0.78% of all branches [95.44%] + 159 page-faults # 0.020 M/sec + 24,599,853 cycles # 3.044 GHz [50.70%] + 6,254,276 stalled-cycles-frontend # 25.42% frontend cycles idle + 871,510 stalled-cycles-backend # 3.54% backend cycles idle + 52,146,066 instructions # 2.12 insns per cycle + # 0.12 stalled cycles per insn + 1,479,020 branches # 183.026 M/sec + 11,596 branch-misses # 0.78% of all branches [91.42%] - 0.018044272 seconds time elapsed + 0.008656610 seconds time elapsed Iteration 8 Performance counter stats for './matrixMultiply 100': - 8.100240 task-clock # 0.402 CPUs utilized + 8.104023 task-clock # 0.910 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 158 page-faults # 0.020 M/sec - 24,651,938 cycles # 3.043 GHz [50.81%] - 9,684,842 stalled-cycles-frontend # 39.29% frontend cycles idle - 756,211 stalled-cycles-backend # 3.07% backend cycles idle - 52,135,360 instructions # 2.11 insns per cycle - # 0.19 stalled cycles per insn - 1,477,522 branches # 182.405 M/sec - 11,963 branch-misses # 0.81% of all branches [60.49%] + 159 page-faults # 0.020 M/sec + 24,721,453 cycles # 3.051 GHz [50.81%] + 7,609,755 stalled-cycles-frontend # 30.78% frontend cycles idle + 797,005 stalled-cycles-backend # 3.22% backend cycles idle + 52,152,265 instructions # 2.11 insns per cycle + # 0.15 stalled cycles per insn + 1,480,154 branches # 182.644 M/sec + 11,875 branch-misses # 0.80% of all branches [79.49%] - 0.020160354 seconds time elapsed + 0.008901112 seconds time elapsed Iteration 9 Performance counter stats for './matrixMultiply 100': - 8.053028 task-clock # 0.367 CPUs utilized + 8.105288 task-clock # 0.924 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 158 page-faults # 0.020 M/sec - 24,606,167 cycles # 3.056 GHz [50.56%] - 9,034,157 stalled-cycles-frontend # 36.72% frontend cycles idle - 623,010 stalled-cycles-backend # 2.53% backend cycles idle - 52,142,491 instructions # 2.12 insns per cycle + 159 page-faults # 0.020 M/sec + 24,710,843 cycles # 3.049 GHz [50.85%] + 8,609,115 stalled-cycles-frontend # 34.84% frontend cycles idle + 511,967 stalled-cycles-backend # 2.07% backend cycles idle + 52,146,432 instructions # 2.11 insns per cycle # 0.17 stalled cycles per insn - 1,478,373 branches # 183.580 M/sec - 11,952 branch-misses # 0.81% of all branches [66.29%] + 1,479,068 branches # 182.482 M/sec + 11,732 branch-misses # 0.79% of all branches [70.47%] - 0.021926602 seconds time elapsed + 0.008771563 seconds time elapsed Iteration 10 Performance counter stats for './matrixMultiply 100': - 8.095434 task-clock # 0.411 CPUs utilized + 8.104444 task-clock # 0.935 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 159 page-faults # 0.020 M/sec - 24,739,370 cycles # 3.056 GHz [50.82%] - 10,304,707 stalled-cycles-frontend # 41.65% frontend cycles idle - 719,320 stalled-cycles-backend # 2.91% backend cycles idle - 52,143,820 instructions # 2.11 insns per cycle - # 0.20 stalled cycles per insn - 1,478,991 branches # 182.694 M/sec - 12,024 branch-misses # 0.81% of all branches [55.52%] + 24,657,762 cycles # 3.042 GHz [50.84%] + 8,398,717 stalled-cycles-frontend # 34.06% frontend cycles idle + 1,004,334 stalled-cycles-backend # 4.07% backend cycles idle + 52,144,374 instructions # 2.11 insns per cycle + # 0.16 stalled cycles per insn + 1,478,685 branches # 182.454 M/sec + 11,712 branch-misses # 0.79% of all branches [72.47%] - 0.019719568 seconds time elapsed + 0.008664229 seconds time elapsed diff --git a/sankalp/gcc_output_1000 b/sankalp/gcc_output_1000 index cea6165..143e8fe 100644 --- a/sankalp/gcc_output_1000 +++ b/sankalp/gcc_output_1000 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for './matrixMultiply 1000': - 9989.170541 task-clock # 0.996 CPUs utilized - 11 context-switches # 0.000 M/sec - 0 CPU-migrations # 0.000 M/sec - 3,075 page-faults # 0.000 M/sec - 30,581,586,932 cycles # 3.061 GHz [83.30%] - 17,622,767,995 stalled-cycles-frontend # 57.63% frontend cycles idle [83.34%] - 4,193,237,081 stalled-cycles-backend # 13.71% backend cycles idle [66.69%] - 50,156,776,557 instructions # 1.64 insns per cycle - # 0.35 stalled cycles per insn [83.34%] - 1,037,731,568 branches # 103.886 M/sec [83.34%] - 1,104,588 branch-misses # 0.11% of all branches [83.34%] + 9926.708359 task-clock # 0.997 CPUs utilized + 13 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,395,895,247 cycles # 3.062 GHz [83.32%] + 17,442,111,645 stalled-cycles-frontend # 57.38% frontend cycles idle [83.32%] + 4,164,384,143 stalled-cycles-backend # 13.70% backend cycles idle [66.68%] + 50,155,717,267 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.36%] + 1,037,542,959 branches # 104.520 M/sec [83.36%] + 1,062,313 branch-misses # 0.10% of all branches [83.32%] - 10.027304870 seconds time elapsed + 9.952598326 seconds time elapsed Iteration 2 Performance counter stats for './matrixMultiply 1000': - 9968.053405 task-clock # 0.997 CPUs utilized - 13 context-switches # 0.000 M/sec + 9989.945693 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,074 page-faults # 0.000 M/sec - 30,521,267,945 cycles # 3.062 GHz [83.31%] - 17,556,447,969 stalled-cycles-frontend # 57.52% frontend cycles idle [83.34%] - 4,278,889,715 stalled-cycles-backend # 14.02% backend cycles idle [66.70%] - 50,162,132,165 instructions # 1.64 insns per cycle + 30,589,481,178 cycles # 3.062 GHz [83.31%] + 17,621,887,593 stalled-cycles-frontend # 57.61% frontend cycles idle [83.34%] + 4,027,488,464 stalled-cycles-backend # 13.17% backend cycles idle [66.69%] + 50,159,899,384 instructions # 1.64 insns per cycle # 0.35 stalled cycles per insn [83.35%] - 1,037,644,970 branches # 104.097 M/sec [83.35%] - 1,072,195 branch-misses # 0.10% of all branches [83.32%] + 1,037,610,140 branches # 103.865 M/sec [83.34%] + 1,072,230 branch-misses # 0.10% of all branches [83.34%] - 9.993975874 seconds time elapsed + 10.015847661 seconds time elapsed Iteration 3 Performance counter stats for './matrixMultiply 1000': - 9926.186121 task-clock # 0.997 CPUs utilized + 9872.782392 task-clock # 0.997 CPUs utilized 12 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,074 page-faults # 0.000 M/sec - 30,394,192,927 cycles # 3.062 GHz [83.32%] - 17,440,517,077 stalled-cycles-frontend # 57.38% frontend cycles idle [83.32%] - 4,145,893,695 stalled-cycles-backend # 13.64% backend cycles idle [66.67%] - 50,150,109,486 instructions # 1.65 insns per cycle - # 0.35 stalled cycles per insn [83.35%] - 1,037,595,495 branches # 104.531 M/sec [83.36%] - 1,078,895 branch-misses # 0.10% of all branches [83.35%] + 30,230,798,240 cycles # 3.062 GHz [83.31%] + 17,272,580,035 stalled-cycles-frontend # 57.14% frontend cycles idle [83.34%] + 3,944,001,447 stalled-cycles-backend # 13.05% backend cycles idle [66.70%] + 50,157,447,316 instructions # 1.66 insns per cycle + # 0.34 stalled cycles per insn [83.35%] + 1,037,562,856 branches # 105.093 M/sec [83.35%] + 1,070,768 branch-misses # 0.10% of all branches [83.33%] - 9.952122977 seconds time elapsed + 9.898330956 seconds time elapsed Iteration 4 Performance counter stats for './matrixMultiply 1000': - 9881.740024 task-clock # 0.997 CPUs utilized + 9960.652528 task-clock # 0.997 CPUs utilized 12 context-switches # 0.000 M/sec - 0 CPU-migrations # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec 3,075 page-faults # 0.000 M/sec - 30,257,682,330 cycles # 3.062 GHz [83.32%] - 17,304,847,964 stalled-cycles-frontend # 57.19% frontend cycles idle [83.32%] - 3,844,903,274 stalled-cycles-backend # 12.71% backend cycles idle [66.65%] - 50,164,214,193 instructions # 1.66 insns per cycle - # 0.34 stalled cycles per insn [83.32%] - 1,036,954,474 branches # 104.936 M/sec [83.36%] - 1,080,068 branch-misses # 0.10% of all branches [83.36%] + 30,442,315,955 cycles # 3.056 GHz [83.34%] + 17,495,255,191 stalled-cycles-frontend # 57.47% frontend cycles idle [83.34%] + 4,435,073,572 stalled-cycles-backend # 14.57% backend cycles idle [66.67%] + 50,158,527,538 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.34%] + 1,037,684,531 branches # 104.178 M/sec [83.34%] + 1,090,517 branch-misses # 0.11% of all branches [83.35%] - 9.907367067 seconds time elapsed + 9.986475787 seconds time elapsed Iteration 5 Performance counter stats for './matrixMultiply 1000': - 9885.426106 task-clock # 0.997 CPUs utilized - 13 context-switches # 0.000 M/sec + 9983.888308 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 3,075 page-faults # 0.000 M/sec - 30,269,280,501 cycles # 3.062 GHz [83.33%] - 17,313,520,355 stalled-cycles-frontend # 57.20% frontend cycles idle [83.33%] - 3,835,575,528 stalled-cycles-backend # 12.67% backend cycles idle [66.66%] - 50,153,925,918 instructions # 1.66 insns per cycle + 3,074 page-faults # 0.000 M/sec + 30,571,145,817 cycles # 3.062 GHz [83.33%] + 17,613,563,281 stalled-cycles-frontend # 57.61% frontend cycles idle [83.34%] + 4,138,212,697 stalled-cycles-backend # 13.54% backend cycles idle [66.67%] + 50,155,387,715 instructions # 1.64 insns per cycle # 0.35 stalled cycles per insn [83.33%] - 1,036,820,042 branches # 104.884 M/sec [83.37%] - 1,066,630 branch-misses # 0.10% of all branches [83.34%] + 1,037,567,984 branches # 103.924 M/sec [83.33%] + 1,068,596 branch-misses # 0.10% of all branches [83.35%] - 9.911252910 seconds time elapsed + 10.010151775 seconds time elapsed Iteration 6 Performance counter stats for './matrixMultiply 1000': - 9889.983104 task-clock # 0.997 CPUs utilized + 9853.437478 task-clock # 0.997 CPUs utilized 13 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 3,074 page-faults # 0.000 M/sec - 30,280,695,223 cycles # 3.062 GHz [83.34%] - 17,324,211,616 stalled-cycles-frontend # 57.21% frontend cycles idle [83.34%] - 4,051,759,479 stalled-cycles-backend # 13.38% backend cycles idle [66.68%] - 50,157,057,504 instructions # 1.66 insns per cycle - # 0.35 stalled cycles per insn [83.34%] - 1,037,558,475 branches # 104.910 M/sec [83.34%] - 1,070,979 branch-misses # 0.10% of all branches [83.32%] + 3,075 page-faults # 0.000 M/sec + 30,170,703,152 cycles # 3.062 GHz [83.32%] + 17,222,155,727 stalled-cycles-frontend # 57.08% frontend cycles idle [83.32%] + 4,055,670,788 stalled-cycles-backend # 13.44% backend cycles idle [66.67%] + 50,155,779,844 instructions # 1.66 insns per cycle + # 0.34 stalled cycles per insn [83.36%] + 1,037,560,137 branches # 105.299 M/sec [83.36%] + 1,074,365 branch-misses # 0.10% of all branches [83.35%] - 9.915589553 seconds time elapsed + 9.879197104 seconds time elapsed Iteration 7 Performance counter stats for './matrixMultiply 1000': - 9939.642605 task-clock # 0.997 CPUs utilized - 13 context-switches # 0.000 M/sec + 9885.285809 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 3,074 page-faults # 0.000 M/sec - 30,428,586,559 cycles # 3.061 GHz [83.34%] - 17,480,604,113 stalled-cycles-frontend # 57.45% frontend cycles idle [83.34%] - 4,012,801,621 stalled-cycles-backend # 13.19% backend cycles idle [66.68%] - 50,157,234,655 instructions # 1.65 insns per cycle - # 0.35 stalled cycles per insn [83.34%] - 1,037,647,811 branches # 104.395 M/sec [83.34%] - 1,069,193 branch-misses # 0.10% of all branches [83.32%] + 3,075 page-faults # 0.000 M/sec + 30,268,249,154 cycles # 3.062 GHz [83.34%] + 17,314,471,270 stalled-cycles-frontend # 57.20% frontend cycles idle [83.33%] + 4,082,457,570 stalled-cycles-backend # 13.49% backend cycles idle [66.66%] + 50,154,666,290 instructions # 1.66 insns per cycle + # 0.35 stalled cycles per insn [83.33%] + 1,037,650,375 branches # 104.969 M/sec [83.33%] + 1,085,196 branch-misses # 0.10% of all branches [83.37%] - 9.965459847 seconds time elapsed + 9.910950714 seconds time elapsed Iteration 8 Performance counter stats for './matrixMultiply 1000': - 9920.452250 task-clock # 0.997 CPUs utilized - 11 context-switches # 0.000 M/sec + 9914.407092 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 3,074 page-faults # 0.000 M/sec - 30,376,652,538 cycles # 3.062 GHz [83.31%] - 17,415,976,577 stalled-cycles-frontend # 57.33% frontend cycles idle [83.34%] - 3,998,906,672 stalled-cycles-backend # 13.16% backend cycles idle [66.70%] - 50,156,200,190 instructions # 1.65 insns per cycle - # 0.35 stalled cycles per insn [83.35%] - 1,037,605,358 branches # 104.593 M/sec [83.35%] - 1,072,587 branch-misses # 0.10% of all branches [83.32%] + 30,356,897,007 cycles # 3.062 GHz [83.34%] + 17,403,547,284 stalled-cycles-frontend # 57.33% frontend cycles idle [83.34%] + 4,191,887,997 stalled-cycles-backend # 13.81% backend cycles idle [66.68%] + 50,156,122,104 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.34%] + 1,037,539,929 branches # 104.650 M/sec [83.34%] + 1,065,113 branch-misses # 0.10% of all branches [83.31%] - 9.946187560 seconds time elapsed + 9.940317228 seconds time elapsed Iteration 9 Performance counter stats for './matrixMultiply 1000': - 9950.631435 task-clock # 0.997 CPUs utilized - 13 context-switches # 0.000 M/sec + 9937.674711 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 3,075 page-faults # 0.000 M/sec - 30,468,120,896 cycles # 3.062 GHz [83.32%] - 17,513,181,615 stalled-cycles-frontend # 57.48% frontend cycles idle [83.32%] - 4,285,615,016 stalled-cycles-backend # 14.07% backend cycles idle [66.67%] - 50,146,044,213 instructions # 1.65 insns per cycle - # 0.35 stalled cycles per insn [83.36%] - 1,037,530,014 branches # 104.268 M/sec [83.36%] - 1,082,040 branch-misses # 0.10% of all branches [83.35%] + 3,074 page-faults # 0.000 M/sec + 30,427,817,353 cycles # 3.062 GHz [83.34%] + 17,471,897,841 stalled-cycles-frontend # 57.42% frontend cycles idle [83.34%] + 4,027,974,555 stalled-cycles-backend # 13.24% backend cycles idle [66.68%] + 50,158,261,034 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.34%] + 1,037,803,159 branches # 104.431 M/sec [83.34%] + 1,088,832 branch-misses # 0.10% of all branches [83.32%] - 9.976606602 seconds time elapsed + 9.963562648 seconds time elapsed Iteration 10 Performance counter stats for './matrixMultiply 1000': - 9850.001597 task-clock # 0.997 CPUs utilized - 12 context-switches # 0.000 M/sec + 9878.683493 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 3,075 page-faults # 0.000 M/sec - 30,160,451,883 cycles # 3.062 GHz [83.31%] - 17,209,665,022 stalled-cycles-frontend # 57.06% frontend cycles idle [83.31%] - 3,830,145,916 stalled-cycles-backend # 12.70% backend cycles idle [66.69%] - 50,157,904,839 instructions # 1.66 insns per cycle - # 0.34 stalled cycles per insn [83.35%] - 1,037,634,480 branches # 105.344 M/sec [83.35%] - 1,087,305 branch-misses # 0.10% of all branches [83.35%] - - 9.875574586 seconds time elapsed + 3,074 page-faults # 0.000 M/sec + 30,249,098,352 cycles # 3.062 GHz [83.32%] + 17,298,067,630 stalled-cycles-frontend # 57.19% frontend cycles idle [83.32%] + 3,974,575,999 stalled-cycles-backend # 13.14% backend cycles idle [66.67%] + 50,150,796,611 instructions # 1.66 insns per cycle + # 0.34 stalled cycles per insn [83.36%] + 1,037,562,373 branches # 105.030 M/sec [83.36%] + 1,067,234 branch-misses # 0.10% of all branches [83.34%] + + 9.904228039 seconds time elapsed diff --git a/sankalp/gcc_output_3000 b/sankalp/gcc_output_3000 new file mode 100644 index 0000000..1da4004 --- /dev/null +++ b/sankalp/gcc_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 3000': + + 475300.257913 task-clock # 0.997 CPUs utilized + 594 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,455,206,821,524 cycles # 3.062 GHz [83.33%] + 1,096,016,878,004 stalled-cycles-frontend # 75.32% frontend cycles idle [83.33%] + 590,754,550,647 stalled-cycles-backend # 40.60% backend cycles idle [66.67%] + 1,351,742,482,872 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,393,869,687 branches # 57.635 M/sec [83.33%] + 14,090,789 branch-misses # 0.05% of all branches [83.33%] + + 476.494079626 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 3000': + + 476018.020595 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,457,356,444,320 cycles # 3.062 GHz [83.33%] + 1,097,887,781,677 stalled-cycles-frontend # 75.33% frontend cycles idle [83.33%] + 593,165,290,075 stalled-cycles-backend # 40.70% backend cycles idle [66.67%] + 1,351,747,334,373 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,936,581 branches # 57.554 M/sec [83.33%] + 14,020,326 branch-misses # 0.05% of all branches [83.33%] + + 477.213941232 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 3000': + + 474569.437761 task-clock # 0.997 CPUs utilized + 595 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,452,880,580,364 cycles # 3.061 GHz [83.33%] + 1,093,658,008,544 stalled-cycles-frontend # 75.28% frontend cycles idle [83.33%] + 598,953,855,484 stalled-cycles-backend # 41.23% backend cycles idle [66.67%] + 1,351,708,174,318 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,397,137,447 branches # 57.731 M/sec [83.33%] + 13,353,583 branch-misses # 0.05% of all branches [83.33%] + + 475.763890065 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 3000': + + 475646.500239 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,456,163,649,462 cycles # 3.061 GHz [83.33%] + 1,096,827,868,403 stalled-cycles-frontend # 75.32% frontend cycles idle [83.33%] + 604,183,182,642 stalled-cycles-backend # 41.49% backend cycles idle [66.67%] + 1,351,761,637,391 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,786,793 branches # 57.599 M/sec [83.33%] + 13,320,251 branch-misses # 0.05% of all branches [83.33%] + + 476.841596270 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 3000': + + 476211.404942 task-clock # 0.997 CPUs utilized + 597 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,457,959,876,543 cycles # 3.062 GHz [83.33%] + 1,098,411,393,007 stalled-cycles-frontend # 75.34% frontend cycles idle [83.33%] + 607,061,107,646 stalled-cycles-backend # 41.64% backend cycles idle [66.67%] + 1,351,758,909,796 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,397,007,312 branches # 57.531 M/sec [83.33%] + 13,916,373 branch-misses # 0.05% of all branches [83.33%] + + 477.407551808 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 3000': + + 475948.824921 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,457,196,407,185 cycles # 3.062 GHz [83.33%] + 1,097,491,418,801 stalled-cycles-frontend # 75.32% frontend cycles idle [83.33%] + 619,424,280,588 stalled-cycles-backend # 42.51% backend cycles idle [66.67%] + 1,351,752,463,467 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,395,156,718 branches # 57.559 M/sec [83.33%] + 13,646,100 branch-misses # 0.05% of all branches [83.33%] + + 477.144006180 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 3000': + + 476555.496544 task-clock # 0.997 CPUs utilized + 597 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,459,055,808,779 cycles # 3.062 GHz [83.33%] + 1,099,359,336,770 stalled-cycles-frontend # 75.35% frontend cycles idle [83.33%] + 605,859,886,112 stalled-cycles-backend # 41.52% backend cycles idle [66.67%] + 1,351,748,188,845 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,976,815 branches # 57.490 M/sec [83.33%] + 13,608,298 branch-misses # 0.05% of all branches [83.33%] + + 477.751263190 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 3000': + + 476550.619236 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,458,990,788,545 cycles # 3.062 GHz [83.33%] + 1,099,354,204,996 stalled-cycles-frontend # 75.35% frontend cycles idle [83.33%] + 605,327,241,764 stalled-cycles-backend # 41.49% backend cycles idle [66.67%] + 1,351,757,320,368 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,713,068 branches # 57.490 M/sec [83.33%] + 13,874,648 branch-misses # 0.05% of all branches [83.33%] + + 477.765602818 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 3000': + + 477530.594343 task-clock # 0.997 CPUs utilized + 597 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,461,959,826,317 cycles # 3.061 GHz [83.33%] + 1,102,192,822,811 stalled-cycles-frontend # 75.39% frontend cycles idle [83.33%] + 602,765,299,108 stalled-cycles-backend # 41.23% backend cycles idle [66.67%] + 1,351,757,093,932 instructions # 0.92 insns per cycle + # 0.82 stalled cycles per insn [83.33%] + 27,398,383,869 branches # 57.375 M/sec [83.33%] + 13,438,518 branch-misses # 0.05% of all branches [83.33%] + + 478.728380489 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 3000': + + 477246.288455 task-clock # 0.997 CPUs utilized + 598 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,461,142,413,968 cycles # 3.062 GHz [83.33%] + 1,101,548,208,648 stalled-cycles-frontend # 75.39% frontend cycles idle [83.33%] + 610,983,270,807 stalled-cycles-backend # 41.82% backend cycles idle [66.67%] + 1,351,767,194,355 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,397,222,382 branches # 57.407 M/sec [83.33%] + 14,071,841 branch-misses # 0.05% of all branches [83.33%] + + 478.444205849 seconds time elapsed + diff --git a/sankalp/gcc_output_optimized_100 b/sankalp/gcc_output_optimized_100 new file mode 100644 index 0000000..02b8d64 --- /dev/null +++ b/sankalp/gcc_output_optimized_100 @@ -0,0 +1,180 @@ +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.849608 task-clock # 0.769 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.086 M/sec + 5,664,275 cycles # 3.062 GHz + 732,765 stalled-cycles-frontend # 12.94% frontend cycles idle + 415,452 stalled-cycles-backend # 7.33% backend cycles idle + 10,010,514 instructions # 1.77 insns per cycle + # 0.07 stalled cycles per insn + 1,456,645 branches # 787.543 M/sec + branch-misses + + 0.002405004 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.839908 task-clock # 0.666 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.086 M/sec + 5,636,324 cycles # 3.063 GHz + 708,018 stalled-cycles-frontend # 12.56% frontend cycles idle + 1,488,676 stalled-cycles-backend # 26.41% backend cycles idle + 9,999,645 instructions # 1.77 insns per cycle + # 0.15 stalled cycles per insn + 1,455,193 branches # 790.905 M/sec + branch-misses + + 0.002762590 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.894950 task-clock # 0.768 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.084 M/sec + 2,365,633 cycles # 1.248 GHz + 815,107 stalled-cycles-frontend # 34.46% frontend cycles idle + 1,395,279 stalled-cycles-backend # 58.98% backend cycles idle + 10,005,259 instructions # 4.23 insns per cycle + # 0.14 stalled cycles per insn + 1,456,126 branches # 768.424 M/sec + 14,501 branch-misses # 1.00% of all branches [58.57%] + + 0.002468015 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.875375 task-clock # 0.766 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.085 M/sec + 4,882,424 cycles # 2.603 GHz + 752,488 stalled-cycles-frontend # 15.41% frontend cycles idle + 1,341,572 stalled-cycles-backend # 27.48% backend cycles idle + 10,020,521 instructions # 2.05 insns per cycle + # 0.13 stalled cycles per insn + 1,458,408 branches # 777.662 M/sec + 15,896 branch-misses # 1.09% of all branches [14.62%] + + 0.002449323 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.847871 task-clock # 0.723 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.086 M/sec + 5,660,288 cycles # 3.063 GHz + 727,224 stalled-cycles-frontend # 12.85% frontend cycles idle + 1,493,416 stalled-cycles-backend # 26.38% backend cycles idle + 10,014,309 instructions # 1.77 insns per cycle + # 0.15 stalled cycles per insn + 1,457,300 branches # 788.637 M/sec + branch-misses + + 0.002555472 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.879068 task-clock # 0.768 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.084 M/sec + 3,421,298 cycles # 1.821 GHz + 761,542 stalled-cycles-frontend # 22.26% frontend cycles idle + 1,433,667 stalled-cycles-backend # 41.90% backend cycles idle + 10,018,860 instructions # 2.93 insns per cycle + # 0.14 stalled cycles per insn + 1,458,144 branches # 775.993 M/sec + 14,789 branch-misses # 1.01% of all branches [40.00%] + + 0.002447307 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.883634 task-clock # 0.739 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.084 M/sec + 321,967 cycles # 0.171 GHz + 796,732 stalled-cycles-frontend # 247.46% frontend cycles idle + 443,941 stalled-cycles-backend # 137.88% backend cycles idle + 10,018,569 instructions # 31.12 insns per cycle + # 0.08 stalled cycles per insn + 1,458,017 branches # 774.045 M/sec + 16,126 branch-misses # 1.11% of all branches [93.59%] + + 0.002549813 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.869718 task-clock # 0.709 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.085 M/sec + 1,144,239 cycles # 0.612 GHz + 746,887 stalled-cycles-frontend # 65.27% frontend cycles idle + 1,506,395 stalled-cycles-backend # 131.65% backend cycles idle + 10,012,630 instructions # 8.75 insns per cycle + # 0.15 stalled cycles per insn + 1,457,200 branches # 779.369 M/sec + 13,662 branch-misses # 0.94% of all branches [79.35%] + + 0.002638744 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.919213 task-clock # 0.588 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.083 M/sec + 1,076,319 cycles # 0.561 GHz + 895,237 stalled-cycles-frontend # 83.18% frontend cycles idle + 1,645,401 stalled-cycles-backend # 152.87% backend cycles idle + 10,022,421 instructions # 9.31 insns per cycle + # 0.16 stalled cycles per insn + 1,458,721 branches # 760.062 M/sec + 13,434 branch-misses # 0.92% of all branches [80.97%] + + 0.003264739 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.883476 task-clock # 0.690 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.084 M/sec + 4,552,284 cycles # 2.417 GHz + 783,434 stalled-cycles-frontend # 17.21% frontend cycles idle + 1,317,945 stalled-cycles-backend # 28.95% backend cycles idle + 10,008,721 instructions # 2.20 insns per cycle + # 0.13 stalled cycles per insn + 1,456,761 branches # 773.443 M/sec + 14,949 branch-misses # 1.03% of all branches [20.70%] + + 0.002728343 seconds time elapsed + diff --git a/sankalp/gcc_output_optimized_1000 b/sankalp/gcc_output_optimized_1000 new file mode 100644 index 0000000..4da73bd --- /dev/null +++ b/sankalp/gcc_output_optimized_1000 @@ -0,0 +1,180 @@ +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8524.007146 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,101,094,636 cycles # 3.062 GHz [83.34%] + 21,174,291,573 stalled-cycles-frontend # 81.12% frontend cycles idle [83.34%] + 8,086,059,447 stalled-cycles-backend # 30.98% backend cycles idle [66.67%] + 8,147,023,966 instructions # 0.31 insns per cycle + # 2.60 stalled cycles per insn [83.34%] + 1,034,584,832 branches # 121.373 M/sec [83.34%] + 1,056,203 branch-misses # 0.10% of all branches [83.35%] + + 8.546169904 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8480.788072 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 25,968,524,213 cycles # 3.062 GHz [83.30%] + 21,026,920,732 stalled-cycles-frontend # 80.97% frontend cycles idle [83.35%] + 8,372,590,975 stalled-cycles-backend # 32.24% backend cycles idle [66.69%] + 8,146,964,730 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.35%] + 1,034,591,652 branches # 121.992 M/sec [83.34%] + 1,061,216 branch-misses # 0.10% of all branches [83.32%] + + 8.502870304 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8499.518119 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,025,909,327 cycles # 3.062 GHz [83.34%] + 21,094,624,277 stalled-cycles-frontend # 81.05% frontend cycles idle [83.33%] + 7,597,054,786 stalled-cycles-backend # 29.19% backend cycles idle [66.67%] + 8,146,986,115 instructions # 0.31 insns per cycle + # 2.59 stalled cycles per insn [83.34%] + 1,034,616,479 branches # 121.726 M/sec [83.33%] + 1,055,439 branch-misses # 0.10% of all branches [83.34%] + + 8.521753033 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8567.572363 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,233,696,728 cycles # 3.062 GHz [83.33%] + 21,318,293,997 stalled-cycles-frontend # 81.26% frontend cycles idle [83.33%] + 8,013,091,628 stalled-cycles-backend # 30.55% backend cycles idle [66.66%] + 8,147,236,780 instructions # 0.31 insns per cycle + # 2.62 stalled cycles per insn [83.33%] + 1,033,816,017 branches # 120.666 M/sec [83.37%] + 1,057,271 branch-misses # 0.10% of all branches [83.35%] + + 8.589968438 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8498.048583 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,020,348,975 cycles # 3.062 GHz [83.33%] + 21,088,844,072 stalled-cycles-frontend # 81.05% frontend cycles idle [83.33%] + 7,943,621,197 stalled-cycles-backend # 30.53% backend cycles idle [66.66%] + 8,146,770,884 instructions # 0.31 insns per cycle + # 2.59 stalled cycles per insn [83.33%] + 1,034,364,119 branches # 121.718 M/sec [83.33%] + 1,057,797 branch-misses # 0.10% of all branches [83.35%] + + 8.520236784 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8523.980835 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,099,105,396 cycles # 3.062 GHz [83.34%] + 21,174,457,333 stalled-cycles-frontend # 81.13% frontend cycles idle [83.34%] + 7,971,768,233 stalled-cycles-backend # 30.54% backend cycles idle [66.67%] + 8,147,071,539 instructions # 0.31 insns per cycle + # 2.60 stalled cycles per insn [83.34%] + 1,034,599,564 branches # 121.375 M/sec [83.34%] + 1,067,177 branch-misses # 0.10% of all branches [83.33%] + + 8.546194472 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8539.281197 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,147,787,605 cycles # 3.062 GHz [83.32%] + 21,232,515,363 stalled-cycles-frontend # 81.20% frontend cycles idle [83.32%] + 7,997,377,449 stalled-cycles-backend # 30.59% backend cycles idle [66.67%] + 8,142,040,940 instructions # 0.31 insns per cycle + # 2.61 stalled cycles per insn [83.36%] + 1,034,582,094 branches # 121.156 M/sec [83.37%] + 1,067,037 branch-misses # 0.10% of all branches [83.35%] + + 8.561577755 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8483.737252 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 25,976,418,040 cycles # 3.062 GHz [83.30%] + 21,031,895,833 stalled-cycles-frontend # 80.97% frontend cycles idle [83.35%] + 7,905,370,309 stalled-cycles-backend # 30.43% backend cycles idle [66.70%] + 8,147,671,922 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.35%] + 1,034,722,307 branches # 121.965 M/sec [83.35%] + 1,058,817 branch-misses # 0.10% of all branches [83.31%] + + 8.505817558 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8487.683539 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 25,989,385,640 cycles # 3.062 GHz [83.31%] + 21,054,478,049 stalled-cycles-frontend # 81.01% frontend cycles idle [83.31%] + 7,474,887,009 stalled-cycles-backend # 28.76% backend cycles idle [66.71%] + 8,146,958,745 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.36%] + 1,034,611,204 branches # 121.896 M/sec [83.36%] + 1,063,850 branch-misses # 0.10% of all branches [83.34%] + + 8.509833793 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8485.279076 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 25,980,743,845 cycles # 3.062 GHz [83.31%] + 21,043,200,703 stalled-cycles-frontend # 81.00% frontend cycles idle [83.31%] + 7,855,243,129 stalled-cycles-backend # 30.23% backend cycles idle [66.70%] + 8,147,134,514 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.35%] + 1,034,632,398 branches # 121.933 M/sec [83.35%] + 1,068,154 branch-misses # 0.10% of all branches [83.34%] + + 8.507968113 seconds time elapsed + diff --git a/sankalp/gcc_output_optimized_3000 b/sankalp/gcc_output_optimized_3000 new file mode 100644 index 0000000..bed3fc6 --- /dev/null +++ b/sankalp/gcc_output_optimized_3000 @@ -0,0 +1,180 @@ +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 307990.722698 task-clock # 0.997 CPUs utilized + 385 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 942,885,267,154 cycles # 3.061 GHz [83.33%] + 813,151,718,128 stalled-cycles-frontend # 86.24% frontend cycles idle [83.33%] + 479,110,721,206 stalled-cycles-backend # 50.81% backend cycles idle [66.67%] + 217,537,751,166 instructions # 0.23 insns per cycle + # 3.74 stalled cycles per insn [83.33%] + 27,350,281,815 branches # 88.802 M/sec [83.33%] + 13,416,834 branch-misses # 0.05% of all branches [83.33%] + + 308.764947876 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 309095.950256 task-clock # 0.997 CPUs utilized + 388 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 946,223,423,681 cycles # 3.061 GHz [83.33%] + 816,700,149,527 stalled-cycles-frontend # 86.31% frontend cycles idle [83.33%] + 478,184,484,905 stalled-cycles-backend # 50.54% backend cycles idle [66.67%] + 217,549,241,887 instructions # 0.23 insns per cycle + # 3.75 stalled cycles per insn [83.33%] + 27,352,134,829 branches # 88.491 M/sec [83.33%] + 12,496,243 branch-misses # 0.05% of all branches [83.33%] + + 309.874694599 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 308456.151399 task-clock # 0.997 CPUs utilized + 387 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 944,147,394,731 cycles # 3.061 GHz [83.33%] + 815,004,329,682 stalled-cycles-frontend # 86.32% frontend cycles idle [83.33%] + 492,153,218,620 stalled-cycles-backend # 52.13% backend cycles idle [66.67%] + 217,542,001,519 instructions # 0.23 insns per cycle + # 3.75 stalled cycles per insn [83.33%] + 27,351,929,959 branches # 88.674 M/sec [83.33%] + 12,737,640 branch-misses # 0.05% of all branches [83.33%] + + 309.231466001 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 308648.298096 task-clock # 0.997 CPUs utilized + 387 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 944,897,614,537 cycles # 3.061 GHz [83.33%] + 815,188,834,965 stalled-cycles-frontend # 86.27% frontend cycles idle [83.33%] + 485,379,940,869 stalled-cycles-backend # 51.37% backend cycles idle [66.67%] + 217,534,979,891 instructions # 0.23 insns per cycle + # 3.75 stalled cycles per insn [83.33%] + 27,351,527,278 branches # 88.617 M/sec [83.33%] + 13,388,415 branch-misses # 0.05% of all branches [83.33%] + + 309.423862273 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 309909.768801 task-clock # 0.997 CPUs utilized + 388 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 948,763,312,383 cycles # 3.061 GHz [83.33%] + 819,052,696,950 stalled-cycles-frontend # 86.33% frontend cycles idle [83.33%] + 482,990,679,317 stalled-cycles-backend # 50.91% backend cycles idle [66.67%] + 217,539,864,459 instructions # 0.23 insns per cycle + # 3.77 stalled cycles per insn [83.33%] + 27,352,050,126 branches # 88.258 M/sec [83.33%] + 13,177,647 branch-misses # 0.05% of all branches [83.33%] + + 310.688240232 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 309327.733528 task-clock # 0.997 CPUs utilized + 388 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 947,010,787,729 cycles # 3.062 GHz [83.33%] + 817,412,412,659 stalled-cycles-frontend # 86.32% frontend cycles idle [83.33%] + 488,015,320,106 stalled-cycles-backend # 51.53% backend cycles idle [66.67%] + 217,532,974,150 instructions # 0.23 insns per cycle + # 3.76 stalled cycles per insn [83.33%] + 27,349,693,081 branches # 88.417 M/sec [83.33%] + 13,212,984 branch-misses # 0.05% of all branches [83.33%] + + 310.105193532 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 310282.492791 task-clock # 0.997 CPUs utilized + 389 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 949,907,449,960 cycles # 3.061 GHz [83.33%] + 820,459,518,182 stalled-cycles-frontend # 86.37% frontend cycles idle [83.33%] + 471,778,705,376 stalled-cycles-backend # 49.67% backend cycles idle [66.67%] + 217,524,558,295 instructions # 0.23 insns per cycle + # 3.77 stalled cycles per insn [83.33%] + 27,351,609,383 branches # 88.151 M/sec [83.33%] + 13,344,766 branch-misses # 0.05% of all branches [83.33%] + + 311.104012259 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 310349.330476 task-clock # 0.997 CPUs utilized + 389 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 950,012,415,697 cycles # 3.061 GHz [83.33%] + 820,923,300,577 stalled-cycles-frontend # 86.41% frontend cycles idle [83.33%] + 468,957,637,855 stalled-cycles-backend # 49.36% backend cycles idle [66.67%] + 217,545,884,095 instructions # 0.23 insns per cycle + # 3.77 stalled cycles per insn [83.33%] + 27,353,566,509 branches # 88.138 M/sec [83.33%] + 12,597,801 branch-misses # 0.05% of all branches [83.33%] + + 311.146848527 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 310848.446781 task-clock # 0.997 CPUs utilized + 389 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 951,637,386,126 cycles # 3.061 GHz [83.33%] + 822,546,224,447 stalled-cycles-frontend # 86.43% frontend cycles idle [83.33%] + 495,897,697,137 stalled-cycles-backend # 52.11% backend cycles idle [66.67%] + 217,546,544,859 instructions # 0.23 insns per cycle + # 3.78 stalled cycles per insn [83.33%] + 27,353,133,771 branches # 87.995 M/sec [83.33%] + 13,283,333 branch-misses # 0.05% of all branches [83.33%] + + 311.629074931 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 312178.283971 task-clock # 0.997 CPUs utilized + 391 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 955,712,667,148 cycles # 3.061 GHz [83.33%] + 826,044,644,959 stalled-cycles-frontend # 86.43% frontend cycles idle [83.33%] + 499,061,986,949 stalled-cycles-backend # 52.22% backend cycles idle [66.67%] + 217,558,514,147 instructions # 0.23 insns per cycle + # 3.80 stalled cycles per insn [83.33%] + 27,352,241,903 branches # 87.617 M/sec [83.33%] + 13,193,839 branch-misses # 0.05% of all branches [83.33%] + + 312.962113204 seconds time elapsed + diff --git a/sankalp/java_output_100 b/sankalp/java_output_100 index e48a203..5ff2003 100644 --- a/sankalp/java_output_100 +++ b/sankalp/java_output_100 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for 'java MatrixMultiplier 100': - 104.746489 task-clock # 0.826 CPUs utilized - 169 context-switches # 0.002 M/sec - 44 CPU-migrations # 0.000 M/sec - 4,911 page-faults # 0.047 M/sec - 308,572,871 cycles # 2.946 GHz [85.84%] - 163,849,227 stalled-cycles-frontend # 53.10% frontend cycles idle [74.67%] - 110,314,966 stalled-cycles-backend # 35.75% backend cycles idle [65.15%] - 271,187,853 instructions # 0.88 insns per cycle - # 0.60 stalled cycles per insn [88.30%] - 55,037,045 branches # 525.431 M/sec [88.79%] - 2,958,690 branch-misses # 5.38% of all branches [86.56%] - - 0.126846272 seconds time elapsed + 103.321799 task-clock # 1.117 CPUs utilized + 175 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.000 M/sec + 4,909 page-faults # 0.048 M/sec + 301,216,233 cycles # 2.915 GHz [84.32%] + 163,477,231 stalled-cycles-frontend # 54.27% frontend cycles idle [75.05%] + 103,759,590 stalled-cycles-backend # 34.45% backend cycles idle [66.56%] + 297,736,573 instructions # 0.99 insns per cycle + # 0.55 stalled cycles per insn [88.51%] + 55,643,691 branches # 538.547 M/sec [88.33%] + 2,889,288 branch-misses # 5.19% of all branches [87.38%] + + 0.092533164 seconds time elapsed Iteration 2 Performance counter stats for 'java MatrixMultiplier 100': - 105.073416 task-clock # 0.870 CPUs utilized - 162 context-switches # 0.002 M/sec - 42 CPU-migrations # 0.000 M/sec - 4,910 page-faults # 0.047 M/sec - 311,169,627 cycles # 2.961 GHz [82.20%] - 166,008,039 stalled-cycles-frontend # 53.35% frontend cycles idle [86.19%] - 102,128,765 stalled-cycles-backend # 32.82% backend cycles idle [59.47%] - 284,206,036 instructions # 0.91 insns per cycle - # 0.58 stalled cycles per insn [80.84%] - 53,250,065 branches # 506.789 M/sec [86.90%] - 3,065,376 branch-misses # 5.76% of all branches [86.93%] + 103.759715 task-clock # 1.117 CPUs utilized + 160 context-switches # 0.002 M/sec + 47 CPU-migrations # 0.000 M/sec + 4,901 page-faults # 0.047 M/sec + 305,125,075 cycles # 2.941 GHz [84.89%] + 160,369,545 stalled-cycles-frontend # 52.56% frontend cycles idle [74.82%] + 101,259,462 stalled-cycles-backend # 33.19% backend cycles idle [66.10%] + 287,525,333 instructions # 0.94 insns per cycle + # 0.56 stalled cycles per insn [89.35%] + 54,463,632 branches # 524.902 M/sec [88.47%] + 3,052,971 branch-misses # 5.61% of all branches [87.52%] - 0.120828804 seconds time elapsed + 0.092870741 seconds time elapsed Iteration 3 Performance counter stats for 'java MatrixMultiplier 100': - 104.806678 task-clock # 0.827 CPUs utilized - 158 context-switches # 0.002 M/sec + 104.375659 task-clock # 1.059 CPUs utilized + 159 context-switches # 0.002 M/sec 44 CPU-migrations # 0.000 M/sec - 4,905 page-faults # 0.047 M/sec - 307,136,933 cycles # 2.931 GHz [83.58%] - 161,088,688 stalled-cycles-frontend # 52.45% frontend cycles idle [85.57%] - 110,906,935 stalled-cycles-backend # 36.11% backend cycles idle [60.44%] - 284,480,493 instructions # 0.93 insns per cycle - # 0.57 stalled cycles per insn [81.51%] - 53,693,355 branches # 512.309 M/sec [84.70%] - 2,776,226 branch-misses # 5.17% of all branches [87.10%] + 4,899 page-faults # 0.047 M/sec + 312,875,028 cycles # 2.998 GHz [77.06%] + 168,819,560 stalled-cycles-frontend # 53.96% frontend cycles idle [78.79%] + 101,445,345 stalled-cycles-backend # 32.42% backend cycles idle [71.36%] + 301,146,158 instructions # 0.96 insns per cycle + # 0.56 stalled cycles per insn [88.93%] + 55,088,281 branches # 527.789 M/sec [88.62%] + 2,998,976 branch-misses # 5.44% of all branches [85.92%] - 0.126797557 seconds time elapsed + 0.098543800 seconds time elapsed Iteration 4 Performance counter stats for 'java MatrixMultiplier 100': - 102.669223 task-clock # 0.804 CPUs utilized - 174 context-switches # 0.002 M/sec - 43 CPU-migrations # 0.000 M/sec - 4,902 page-faults # 0.048 M/sec - 302,708,684 cycles # 2.948 GHz [84.85%] - 162,212,866 stalled-cycles-frontend # 53.59% frontend cycles idle [75.03%] - 102,355,542 stalled-cycles-backend # 33.81% backend cycles idle [66.93%] - 291,250,018 instructions # 0.96 insns per cycle - # 0.56 stalled cycles per insn [88.35%] - 53,438,847 branches # 520.495 M/sec [88.52%] - 3,076,528 branch-misses # 5.76% of all branches [85.95%] + 106.506564 task-clock # 1.098 CPUs utilized + 150 context-switches # 0.001 M/sec + 44 CPU-migrations # 0.000 M/sec + 4,908 page-faults # 0.046 M/sec + 314,107,537 cycles # 2.949 GHz [80.00%] + 168,129,079 stalled-cycles-frontend # 53.53% frontend cycles idle [83.52%] + 110,233,792 stalled-cycles-backend # 35.09% backend cycles idle [61.34%] + 267,033,663 instructions # 0.85 insns per cycle + # 0.63 stalled cycles per insn [88.69%] + 54,684,767 branches # 513.440 M/sec [89.14%] + 3,034,135 branch-misses # 5.55% of all branches [87.76%] - 0.127664616 seconds time elapsed + 0.096957055 seconds time elapsed Iteration 5 Performance counter stats for 'java MatrixMultiplier 100': - 103.803424 task-clock # 0.776 CPUs utilized - 155 context-switches # 0.001 M/sec - 42 CPU-migrations # 0.000 M/sec - 4,904 page-faults # 0.047 M/sec - 305,255,769 cycles # 2.941 GHz [86.83%] - 162,227,950 stalled-cycles-frontend # 53.14% frontend cycles idle [76.48%] - 107,322,939 stalled-cycles-backend # 35.16% backend cycles idle [64.30%] - 288,359,451 instructions # 0.94 insns per cycle - # 0.56 stalled cycles per insn [87.61%] - 54,283,919 branches # 522.949 M/sec [88.61%] - 3,101,270 branch-misses # 5.71% of all branches [85.20%] + 103.919871 task-clock # 1.123 CPUs utilized + 172 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.000 M/sec + 4,916 page-faults # 0.047 M/sec + 302,840,737 cycles # 2.914 GHz [85.86%] + 156,296,630 stalled-cycles-frontend # 51.61% frontend cycles idle [83.16%] + 112,184,665 stalled-cycles-backend # 37.04% backend cycles idle [58.29%] + 266,462,000 instructions # 0.88 insns per cycle + # 0.59 stalled cycles per insn [80.55%] + 54,001,529 branches # 519.646 M/sec [87.11%] + 2,916,764 branch-misses # 5.40% of all branches [87.46%] - 0.133713233 seconds time elapsed + 0.092571453 seconds time elapsed Iteration 6 Performance counter stats for 'java MatrixMultiplier 100': - 104.215729 task-clock # 0.819 CPUs utilized - 176 context-switches # 0.002 M/sec - 43 CPU-migrations # 0.000 M/sec - 4,912 page-faults # 0.047 M/sec - 302,453,171 cycles # 2.902 GHz [87.65%] - 161,623,945 stalled-cycles-frontend # 53.44% frontend cycles idle [79.60%] - 111,110,021 stalled-cycles-backend # 36.74% backend cycles idle [60.70%] - 271,333,536 instructions # 0.90 insns per cycle - # 0.60 stalled cycles per insn [87.65%] - 53,593,260 branches # 514.253 M/sec [88.57%] - 3,160,617 branch-misses # 5.90% of all branches [85.11%] + 104.129244 task-clock # 1.110 CPUs utilized + 167 context-switches # 0.002 M/sec + 40 CPU-migrations # 0.000 M/sec + 4,901 page-faults # 0.047 M/sec + 305,068,140 cycles # 2.930 GHz [84.38%] + 160,683,594 stalled-cycles-frontend # 52.67% frontend cycles idle [83.04%] + 108,136,607 stalled-cycles-backend # 35.45% backend cycles idle [58.36%] + 262,531,379 instructions # 0.86 insns per cycle + # 0.61 stalled cycles per insn [84.17%] + 52,184,320 branches # 501.150 M/sec [87.66%] + 3,073,796 branch-misses # 5.89% of all branches [88.33%] - 0.127218799 seconds time elapsed + 0.093834708 seconds time elapsed Iteration 7 Performance counter stats for 'java MatrixMultiplier 100': - 104.762398 task-clock # 0.829 CPUs utilized - 156 context-switches # 0.001 M/sec - 46 CPU-migrations # 0.000 M/sec - 4,917 page-faults # 0.047 M/sec - 314,196,799 cycles # 2.999 GHz [70.14%] - 162,936,333 stalled-cycles-frontend # 51.86% frontend cycles idle [79.89%] - 104,204,007 stalled-cycles-backend # 33.17% backend cycles idle [76.48%] - 303,203,042 instructions # 0.97 insns per cycle - # 0.54 stalled cycles per insn [88.72%] - 55,501,074 branches # 529.780 M/sec [88.95%] - 2,874,787 branch-misses # 5.18% of all branches [86.15%] + 104.108239 task-clock # 1.125 CPUs utilized + 157 context-switches # 0.002 M/sec + 42 CPU-migrations # 0.000 M/sec + 4,898 page-faults # 0.047 M/sec + 307,017,870 cycles # 2.949 GHz [84.90%] + 164,306,170 stalled-cycles-frontend # 53.52% frontend cycles idle [77.93%] + 103,125,565 stalled-cycles-backend # 33.59% backend cycles idle [65.45%] + 288,379,192 instructions # 0.94 insns per cycle + # 0.57 stalled cycles per insn [85.16%] + 53,702,811 branches # 515.836 M/sec [86.05%] + 3,044,773 branch-misses # 5.67% of all branches [87.57%] - 0.126417299 seconds time elapsed + 0.092529815 seconds time elapsed Iteration 8 Performance counter stats for 'java MatrixMultiplier 100': - 104.286359 task-clock # 0.818 CPUs utilized - 159 context-switches # 0.002 M/sec - 41 CPU-migrations # 0.000 M/sec - 4,897 page-faults # 0.047 M/sec - 307,665,208 cycles # 2.950 GHz [82.64%] - 161,525,319 stalled-cycles-frontend # 52.50% frontend cycles idle [83.76%] - 104,838,283 stalled-cycles-backend # 34.08% backend cycles idle [60.68%] - 270,038,666 instructions # 0.88 insns per cycle - # 0.60 stalled cycles per insn [84.04%] - 53,152,819 branches # 509.681 M/sec [88.08%] - 3,059,602 branch-misses # 5.76% of all branches [86.23%] - - 0.127504121 seconds time elapsed + 104.765434 task-clock # 1.108 CPUs utilized + 169 context-switches # 0.002 M/sec + 45 CPU-migrations # 0.000 M/sec + 4,901 page-faults # 0.047 M/sec + 307,535,192 cycles # 2.935 GHz [84.82%] + 164,207,959 stalled-cycles-frontend # 53.39% frontend cycles idle [79.74%] + 106,454,679 stalled-cycles-backend # 34.62% backend cycles idle [60.71%] + 268,169,951 instructions # 0.87 insns per cycle + # 0.61 stalled cycles per insn [88.10%] + 54,860,528 branches # 523.651 M/sec [88.40%] + 2,968,193 branch-misses # 5.41% of all branches [87.39%] + + 0.094565311 seconds time elapsed Iteration 9 Performance counter stats for 'java MatrixMultiplier 100': - 103.018370 task-clock # 0.802 CPUs utilized - 172 context-switches # 0.002 M/sec - 47 CPU-migrations # 0.000 M/sec - 4,901 page-faults # 0.048 M/sec - 310,294,538 cycles # 3.012 GHz [75.30%] - 164,104,338 stalled-cycles-frontend # 52.89% frontend cycles idle [78.12%] - 99,758,390 stalled-cycles-backend # 32.15% backend cycles idle [74.32%] - 294,822,518 instructions # 0.95 insns per cycle - # 0.56 stalled cycles per insn [88.55%] - 54,467,883 branches # 528.720 M/sec [88.57%] - 3,033,202 branch-misses # 5.57% of all branches [85.17%] + 105.879995 task-clock # 1.108 CPUs utilized + 181 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.000 M/sec + 4,910 page-faults # 0.046 M/sec + 309,713,266 cycles # 2.925 GHz [86.13%] + 164,906,341 stalled-cycles-frontend # 53.24% frontend cycles idle [79.10%] + 111,500,921 stalled-cycles-backend # 36.00% backend cycles idle [61.51%] + 272,166,057 instructions # 0.88 insns per cycle + # 0.61 stalled cycles per insn [87.40%] + 53,079,383 branches # 501.316 M/sec [88.80%] + 3,046,810 branch-misses # 5.74% of all branches [86.44%] - 0.128460788 seconds time elapsed + 0.095518615 seconds time elapsed Iteration 10 Performance counter stats for 'java MatrixMultiplier 100': - 104.261775 task-clock # 0.826 CPUs utilized - 177 context-switches # 0.002 M/sec - 45 CPU-migrations # 0.000 M/sec - 4,899 page-faults # 0.047 M/sec - 308,568,212 cycles # 2.960 GHz [74.85%] - 166,638,943 stalled-cycles-frontend # 54.00% frontend cycles idle [77.71%] - 106,033,306 stalled-cycles-backend # 34.36% backend cycles idle [74.27%] - 294,497,423 instructions # 0.95 insns per cycle - # 0.57 stalled cycles per insn [88.55%] - 54,219,007 branches # 520.028 M/sec [88.63%] - 3,099,068 branch-misses # 5.72% of all branches [86.05%] - - 0.126175195 seconds time elapsed + 104.498642 task-clock # 1.120 CPUs utilized + 166 context-switches # 0.002 M/sec + 43 CPU-migrations # 0.000 M/sec + 4,912 page-faults # 0.047 M/sec + 306,585,731 cycles # 2.934 GHz [86.11%] + 157,952,036 stalled-cycles-frontend # 51.52% frontend cycles idle [76.53%] + 109,596,785 stalled-cycles-backend # 35.75% backend cycles idle [65.42%] + 284,918,343 instructions # 0.93 insns per cycle + # 0.55 stalled cycles per insn [88.44%] + 54,016,381 branches # 516.910 M/sec [88.80%] + 3,056,357 branch-misses # 5.66% of all branches [85.71%] + + 0.093262045 seconds time elapsed diff --git a/sankalp/java_output_1000 b/sankalp/java_output_1000 index 2676cb0..0e72482 100644 --- a/sankalp/java_output_1000 +++ b/sankalp/java_output_1000 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for 'java MatrixMultiplier 1000': - 8189.705765 task-clock # 0.996 CPUs utilized - 345 context-switches # 0.000 M/sec - 52 CPU-migrations # 0.000 M/sec - 7,923 page-faults # 0.001 M/sec - 25,046,613,587 cycles # 3.058 GHz [83.37%] - 19,626,824,372 stalled-cycles-frontend # 78.36% frontend cycles idle [83.30%] - 5,625,217,098 stalled-cycles-backend # 22.46% backend cycles idle [66.65%] - 11,498,998,059 instructions # 0.46 insns per cycle - # 1.71 stalled cycles per insn [83.32%] - 1,584,699,622 branches # 193.499 M/sec [83.30%] - 5,035,668 branch-misses # 0.32% of all branches [83.41%] + 8230.895013 task-clock # 1.000 CPUs utilized + 349 context-switches # 0.000 M/sec + 51 CPU-migrations # 0.000 M/sec + 7,924 page-faults # 0.001 M/sec + 25,179,610,041 cycles # 3.059 GHz [83.31%] + 19,733,923,171 stalled-cycles-frontend # 78.37% frontend cycles idle [83.35%] + 5,763,803,893 stalled-cycles-backend # 22.89% backend cycles idle [66.59%] + 11,489,775,504 instructions # 0.46 insns per cycle + # 1.72 stalled cycles per insn [83.39%] + 1,586,764,019 branches # 192.781 M/sec [83.37%] + 5,033,764 branch-misses # 0.32% of all branches [83.39%] - 8.224508473 seconds time elapsed + 8.231041043 seconds time elapsed Iteration 2 Performance counter stats for 'java MatrixMultiplier 1000': - 8201.366801 task-clock # 1.000 CPUs utilized - 356 context-switches # 0.000 M/sec - 59 CPU-migrations # 0.000 M/sec - 7,926 page-faults # 0.001 M/sec - 25,086,666,257 cycles # 3.059 GHz [83.37%] - 19,653,613,981 stalled-cycles-frontend # 78.34% frontend cycles idle [83.34%] - 6,044,554,119 stalled-cycles-backend # 24.09% backend cycles idle [66.54%] - 11,489,727,013 instructions # 0.46 insns per cycle - # 1.71 stalled cycles per insn [83.27%] - 1,583,699,875 branches # 193.102 M/sec [83.36%] - 4,928,257 branch-misses # 0.31% of all branches [83.41%] + 8259.814170 task-clock # 1.000 CPUs utilized + 348 context-switches # 0.000 M/sec + 49 CPU-migrations # 0.000 M/sec + 7,921 page-faults # 0.001 M/sec + 25,267,638,160 cycles # 3.059 GHz [83.34%] + 19,841,583,037 stalled-cycles-frontend # 78.53% frontend cycles idle [83.21%] + 6,527,775,541 stalled-cycles-backend # 25.83% backend cycles idle [66.69%] + 11,513,813,855 instructions # 0.46 insns per cycle + # 1.72 stalled cycles per insn [83.38%] + 1,587,852,465 branches # 192.238 M/sec [83.37%] + 5,136,172 branch-misses # 0.32% of all branches [83.43%] - 8.201853253 seconds time elapsed + 8.260232738 seconds time elapsed Iteration 3 Performance counter stats for 'java MatrixMultiplier 1000': - 8226.593365 task-clock # 1.000 CPUs utilized - 340 context-switches # 0.000 M/sec - 54 CPU-migrations # 0.000 M/sec + 8194.756476 task-clock # 1.000 CPUs utilized + 375 context-switches # 0.000 M/sec + 52 CPU-migrations # 0.000 M/sec 7,917 page-faults # 0.001 M/sec - 25,167,840,017 cycles # 3.059 GHz [83.36%] - 19,742,382,690 stalled-cycles-frontend # 78.44% frontend cycles idle [83.21%] - 5,920,768,984 stalled-cycles-backend # 23.53% backend cycles idle [66.67%] - 11,483,707,296 instructions # 0.46 insns per cycle - # 1.72 stalled cycles per insn [83.41%] - 1,588,778,433 branches # 193.127 M/sec [83.42%] - 5,038,893 branch-misses # 0.32% of all branches [83.37%] + 25,071,710,073 cycles # 3.059 GHz [83.35%] + 19,634,941,038 stalled-cycles-frontend # 78.32% frontend cycles idle [83.36%] + 5,481,936,492 stalled-cycles-backend # 21.87% backend cycles idle [66.57%] + 11,497,785,971 instructions # 0.46 insns per cycle + # 1.71 stalled cycles per insn [83.26%] + 1,585,354,953 branches # 193.460 M/sec [83.36%] + 4,624,130 branch-misses # 0.29% of all branches [83.37%] - 8.226387546 seconds time elapsed + 8.195429601 seconds time elapsed Iteration 4 Performance counter stats for 'java MatrixMultiplier 1000': - 8260.429550 task-clock # 0.999 CPUs utilized - 344 context-switches # 0.000 M/sec - 46 CPU-migrations # 0.000 M/sec - 7,927 page-faults # 0.001 M/sec - 25,262,443,048 cycles # 3.058 GHz [83.37%] - 19,840,033,810 stalled-cycles-frontend # 78.54% frontend cycles idle [83.39%] - 6,387,603,184 stalled-cycles-backend # 25.28% backend cycles idle [66.64%] - 11,499,888,815 instructions # 0.46 insns per cycle - # 1.73 stalled cycles per insn [83.25%] - 1,583,378,720 branches # 191.682 M/sec [83.26%] - 4,695,896 branch-misses # 0.30% of all branches [83.36%] - - 8.265790251 seconds time elapsed + 8289.424086 task-clock # 1.000 CPUs utilized + 351 context-switches # 0.000 M/sec + 50 CPU-migrations # 0.000 M/sec + 7,924 page-faults # 0.001 M/sec + 25,357,184,443 cycles # 3.059 GHz [83.40%] + 19,924,099,338 stalled-cycles-frontend # 78.57% frontend cycles idle [83.30%] + 5,665,731,789 stalled-cycles-backend # 22.34% backend cycles idle [66.62%] + 11,497,881,177 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.36%] + 1,586,295,230 branches # 191.364 M/sec [83.35%] + 4,864,960 branch-misses # 0.31% of all branches [83.36%] + + 8.289548645 seconds time elapsed Iteration 5 Performance counter stats for 'java MatrixMultiplier 1000': - 8232.352704 task-clock # 1.000 CPUs utilized - 355 context-switches # 0.000 M/sec - 46 CPU-migrations # 0.000 M/sec - 7,920 page-faults # 0.001 M/sec - 25,181,505,621 cycles # 3.059 GHz [83.38%] - 19,745,669,605 stalled-cycles-frontend # 78.41% frontend cycles idle [83.37%] - 5,924,168,083 stalled-cycles-backend # 23.53% backend cycles idle [66.59%] - 11,492,938,290 instructions # 0.46 insns per cycle - # 1.72 stalled cycles per insn [83.24%] - 1,584,816,005 branches # 192.511 M/sec [83.28%] - 4,682,747 branch-misses # 0.30% of all branches [83.40%] - - 8.233134328 seconds time elapsed + 8295.510219 task-clock # 1.000 CPUs utilized + 344 context-switches # 0.000 M/sec + 45 CPU-migrations # 0.000 M/sec + 7,914 page-faults # 0.001 M/sec + 25,375,983,015 cycles # 3.059 GHz [83.35%] + 19,927,717,481 stalled-cycles-frontend # 78.53% frontend cycles idle [83.38%] + 5,775,388,326 stalled-cycles-backend # 22.76% backend cycles idle [66.64%] + 11,510,303,341 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.34%] + 1,584,048,659 branches # 190.953 M/sec [83.33%] + 4,757,923 branch-misses # 0.30% of all branches [83.34%] + + 8.295597912 seconds time elapsed Iteration 6 Performance counter stats for 'java MatrixMultiplier 1000': - 8234.639802 task-clock # 1.000 CPUs utilized - 334 context-switches # 0.000 M/sec - 52 CPU-migrations # 0.000 M/sec - 7,915 page-faults # 0.001 M/sec - 25,205,280,543 cycles # 3.061 GHz [83.31%] - 19,763,735,705 stalled-cycles-frontend # 78.41% frontend cycles idle [83.26%] - 5,702,847,993 stalled-cycles-backend # 22.63% backend cycles idle [66.67%] - 11,500,159,783 instructions # 0.46 insns per cycle - # 1.72 stalled cycles per insn [83.38%] - 1,590,468,625 branches # 193.144 M/sec [83.43%] - 4,924,546 branch-misses # 0.31% of all branches [83.36%] + 8279.033166 task-clock # 1.000 CPUs utilized + 338 context-switches # 0.000 M/sec + 49 CPU-migrations # 0.000 M/sec + 7,921 page-faults # 0.001 M/sec + 25,325,475,010 cycles # 3.059 GHz [83.38%] + 19,889,516,972 stalled-cycles-frontend # 78.54% frontend cycles idle [83.24%] + 6,028,939,780 stalled-cycles-backend # 23.81% backend cycles idle [66.57%] + 11,486,000,036 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.42%] + 1,588,599,157 branches # 191.882 M/sec [83.43%] + 4,920,256 branch-misses # 0.31% of all branches [83.40%] - 8.235079008 seconds time elapsed + 8.280647843 seconds time elapsed Iteration 7 Performance counter stats for 'java MatrixMultiplier 1000': - 8194.075299 task-clock # 1.000 CPUs utilized - 342 context-switches # 0.000 M/sec - 52 CPU-migrations # 0.000 M/sec - 7,930 page-faults # 0.001 M/sec - 25,069,438,902 cycles # 3.059 GHz [83.31%] - 19,660,679,181 stalled-cycles-frontend # 78.42% frontend cycles idle [83.31%] - 5,702,572,352 stalled-cycles-backend # 22.75% backend cycles idle [66.64%] - 11,484,198,067 instructions # 0.46 insns per cycle - # 1.71 stalled cycles per insn [83.35%] - 1,587,837,333 branches # 193.779 M/sec [83.38%] - 5,038,709 branch-misses # 0.32% of all branches [83.39%] + 8238.691565 task-clock # 0.979 CPUs utilized + 350 context-switches # 0.000 M/sec + 60 CPU-migrations # 0.000 M/sec + 7,908 page-faults # 0.001 M/sec + 25,200,142,210 cycles # 3.059 GHz [83.36%] + 19,774,075,612 stalled-cycles-frontend # 78.47% frontend cycles idle [83.35%] + 5,690,178,267 stalled-cycles-backend # 22.58% backend cycles idle [66.56%] + 11,493,062,103 instructions # 0.46 insns per cycle + # 1.72 stalled cycles per insn [83.30%] + 1,590,593,567 branches # 193.064 M/sec [83.37%] + 4,824,786 branch-misses # 0.30% of all branches [83.40%] - 8.193395991 seconds time elapsed + 8.418598063 seconds time elapsed Iteration 8 Performance counter stats for 'java MatrixMultiplier 1000': - 8198.617619 task-clock # 1.000 CPUs utilized - 346 context-switches # 0.000 M/sec - 57 CPU-migrations # 0.000 M/sec - 7,921 page-faults # 0.001 M/sec - 25,080,914,449 cycles # 3.059 GHz [83.34%] - 19,639,873,745 stalled-cycles-frontend # 78.31% frontend cycles idle [83.40%] - 5,508,518,414 stalled-cycles-backend # 21.96% backend cycles idle [66.56%] - 11,499,212,780 instructions # 0.46 insns per cycle - # 1.71 stalled cycles per insn [83.33%] - 1,588,578,794 branches # 193.762 M/sec [83.36%] - 5,123,825 branch-misses # 0.32% of all branches [83.37%] + 8261.292085 task-clock # 1.000 CPUs utilized + 363 context-switches # 0.000 M/sec + 47 CPU-migrations # 0.000 M/sec + 7,924 page-faults # 0.001 M/sec + 25,267,234,464 cycles # 3.059 GHz [83.38%] + 19,828,388,563 stalled-cycles-frontend # 78.47% frontend cycles idle [83.37%] + 5,913,581,026 stalled-cycles-backend # 23.40% backend cycles idle [66.54%] + 11,491,742,369 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.26%] + 1,584,928,928 branches # 191.850 M/sec [83.35%] + 4,710,317 branch-misses # 0.30% of all branches [83.39%] - 8.199200929 seconds time elapsed + 8.263920402 seconds time elapsed Iteration 9 Performance counter stats for 'java MatrixMultiplier 1000': - 8309.905416 task-clock # 0.994 CPUs utilized - 342 context-switches # 0.000 M/sec - 55 CPU-migrations # 0.000 M/sec + 8159.608685 task-clock # 1.000 CPUs utilized + 352 context-switches # 0.000 M/sec + 44 CPU-migrations # 0.000 M/sec 7,922 page-faults # 0.001 M/sec - 25,422,985,224 cycles # 3.059 GHz [83.40%] - 19,982,855,266 stalled-cycles-frontend # 78.60% frontend cycles idle [83.28%] - 5,648,979,964 stalled-cycles-backend # 22.22% backend cycles idle [66.57%] - 11,501,679,926 instructions # 0.45 insns per cycle - # 1.74 stalled cycles per insn [83.39%] - 1,587,673,401 branches # 191.058 M/sec [83.39%] - 4,705,502 branch-misses # 0.30% of all branches [83.38%] + 24,966,244,868 cycles # 3.060 GHz [83.38%] + 19,528,618,282 stalled-cycles-frontend # 78.22% frontend cycles idle [83.38%] + 5,211,081,380 stalled-cycles-backend # 20.87% backend cycles idle [66.60%] + 11,505,569,740 instructions # 0.46 insns per cycle + # 1.70 stalled cycles per insn [83.31%] + 1,582,342,745 branches # 193.924 M/sec [83.29%] + 4,717,778 branch-misses # 0.30% of all branches [83.38%] - 8.363947305 seconds time elapsed + 8.161167189 seconds time elapsed Iteration 10 Performance counter stats for 'java MatrixMultiplier 1000': - 8272.681053 task-clock # 1.000 CPUs utilized - 364 context-switches # 0.000 M/sec - 53 CPU-migrations # 0.000 M/sec - 7,924 page-faults # 0.001 M/sec - 25,307,211,479 cycles # 3.059 GHz [83.31%] - 19,865,790,949 stalled-cycles-frontend # 78.50% frontend cycles idle [83.33%] - 6,055,880,576 stalled-cycles-backend # 23.93% backend cycles idle [66.64%] - 11,504,664,919 instructions # 0.45 insns per cycle - # 1.73 stalled cycles per insn [83.37%] - 1,586,728,612 branches # 191.803 M/sec [83.35%] - 4,551,682 branch-misses # 0.29% of all branches [83.37%] - - 8.273447669 seconds time elapsed + 8325.978080 task-clock # 1.000 CPUs utilized + 336 context-switches # 0.000 M/sec + 51 CPU-migrations # 0.000 M/sec + 7,920 page-faults # 0.001 M/sec + 25,465,415,040 cycles # 3.059 GHz [83.39%] + 20,014,451,796 stalled-cycles-frontend # 78.59% frontend cycles idle [83.35%] + 5,716,481,850 stalled-cycles-backend # 22.45% backend cycles idle [66.57%] + 11,496,878,405 instructions # 0.45 insns per cycle + # 1.74 stalled cycles per insn [83.29%] + 1,583,971,382 branches # 190.244 M/sec [83.35%] + 4,654,654 branch-misses # 0.29% of all branches [83.37%] + + 8.327184267 seconds time elapsed diff --git a/sankalp/java_output_3000 b/sankalp/java_output_3000 new file mode 100644 index 0000000..bcb0278 --- /dev/null +++ b/sankalp/java_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 570246.408556 task-clock # 0.998 CPUs utilized + 13,594 context-switches # 0.000 M/sec + 67 CPU-migrations # 0.000 M/sec + 55,723 page-faults # 0.000 M/sec + 1,745,855,585,043 cycles # 3.062 GHz [83.33%] + 1,586,556,006,830 stalled-cycles-frontend # 90.88% frontend cycles idle [83.33%] + 667,253,690,712 stalled-cycles-backend # 38.22% backend cycles idle [66.66%] + 299,663,523,851 instructions # 0.17 insns per cycle + # 5.29 stalled cycles per insn [83.33%] + 40,925,007,356 branches # 71.767 M/sec [83.34%] + 21,839,815 branch-misses # 0.05% of all branches [83.34%] + + 571.200174838 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 526618.685030 task-clock # 0.998 CPUs utilized + 12,618 context-switches # 0.000 M/sec + 65 CPU-migrations # 0.000 M/sec + 54,849 page-faults # 0.000 M/sec + 1,612,309,554,009 cycles # 3.062 GHz [83.33%] + 1,453,911,024,610 stalled-cycles-frontend # 90.18% frontend cycles idle [83.33%] + 604,419,114,381 stalled-cycles-backend # 37.49% backend cycles idle [66.67%] + 299,550,354,418 instructions # 0.19 insns per cycle + # 4.85 stalled cycles per insn [83.34%] + 40,909,432,652 branches # 77.683 M/sec [83.33%] + 21,245,062 branch-misses # 0.05% of all branches [83.33%] + + 527.548551694 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 535466.680458 task-clock # 0.998 CPUs utilized + 12,846 context-switches # 0.000 M/sec + 62 CPU-migrations # 0.000 M/sec + 54,956 page-faults # 0.000 M/sec + 1,639,046,450,367 cycles # 3.061 GHz [83.34%] + 1,480,430,768,242 stalled-cycles-frontend # 90.32% frontend cycles idle [83.33%] + 601,908,499,977 stalled-cycles-backend # 36.72% backend cycles idle [66.66%] + 299,553,327,633 instructions # 0.18 insns per cycle + # 4.94 stalled cycles per insn [83.34%] + 40,910,210,705 branches # 76.401 M/sec [83.33%] + 20,911,209 branch-misses # 0.05% of all branches [83.34%] + + 536.698723828 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 552650.707551 task-clock # 0.997 CPUs utilized + 12,976 context-switches # 0.000 M/sec + 77 CPU-migrations # 0.000 M/sec + 55,114 page-faults # 0.000 M/sec + 1,691,511,828,074 cycles # 3.061 GHz [83.33%] + 1,532,208,381,110 stalled-cycles-frontend # 90.58% frontend cycles idle [83.33%] + 621,744,344,523 stalled-cycles-backend # 36.76% backend cycles idle [66.67%] + 299,846,020,001 instructions # 0.18 insns per cycle + # 5.11 stalled cycles per insn [83.34%] + 40,958,238,817 branches # 74.112 M/sec [83.33%] + 21,459,929 branch-misses # 0.05% of all branches [83.33%] + + 554.276915012 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 556814.234121 task-clock # 0.998 CPUs utilized + 13,237 context-switches # 0.000 M/sec + 70 CPU-migrations # 0.000 M/sec + 55,552 page-faults # 0.000 M/sec + 1,704,664,130,406 cycles # 3.061 GHz [83.34%] + 1,545,675,582,807 stalled-cycles-frontend # 90.67% frontend cycles idle [83.33%] + 633,094,029,679 stalled-cycles-backend # 37.14% backend cycles idle [66.67%] + 299,667,160,749 instructions # 0.18 insns per cycle + # 5.16 stalled cycles per insn [83.33%] + 40,929,141,875 branches # 73.506 M/sec [83.33%] + 21,024,237 branch-misses # 0.05% of all branches [83.33%] + + 557.952865517 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 560832.876628 task-clock # 0.998 CPUs utilized + 12,793 context-switches # 0.000 M/sec + 77 CPU-migrations # 0.000 M/sec + 55,513 page-faults # 0.000 M/sec + 1,713,840,185,302 cycles # 3.056 GHz [83.34%] + 1,555,002,421,280 stalled-cycles-frontend # 90.73% frontend cycles idle [83.33%] + 637,113,380,734 stalled-cycles-backend # 37.17% backend cycles idle [66.66%] + 299,715,387,470 instructions # 0.17 insns per cycle + # 5.19 stalled cycles per insn [83.33%] + 40,932,284,030 branches # 72.985 M/sec [83.33%] + 21,650,917 branch-misses # 0.05% of all branches [83.34%] + + 561.996199196 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 550567.500826 task-clock # 0.998 CPUs utilized + 12,798 context-switches # 0.000 M/sec + 82 CPU-migrations # 0.000 M/sec + 55,289 page-faults # 0.000 M/sec + 1,684,502,992,534 cycles # 3.060 GHz [83.34%] + 1,525,773,333,416 stalled-cycles-frontend # 90.58% frontend cycles idle [83.34%] + 624,056,379,930 stalled-cycles-backend # 37.05% backend cycles idle [66.66%] + 299,717,851,374 instructions # 0.18 insns per cycle + # 5.09 stalled cycles per insn [83.33%] + 40,933,551,765 branches # 74.348 M/sec [83.33%] + 21,857,346 branch-misses # 0.05% of all branches [83.33%] + + 551.751018706 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 555494.391825 task-clock # 0.998 CPUs utilized + 12,852 context-switches # 0.000 M/sec + 58 CPU-migrations # 0.000 M/sec + 55,583 page-faults # 0.000 M/sec + 1,698,991,939,785 cycles # 3.059 GHz [83.34%] + 1,540,286,255,055 stalled-cycles-frontend # 90.66% frontend cycles idle [83.33%] + 640,738,068,956 stalled-cycles-backend # 37.71% backend cycles idle [66.66%] + 299,551,757,727 instructions # 0.18 insns per cycle + # 5.14 stalled cycles per insn [83.33%] + 40,913,471,509 branches # 73.652 M/sec [83.33%] + 20,264,283 branch-misses # 0.05% of all branches [83.34%] + + 556.645024828 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 546762.798329 task-clock # 0.998 CPUs utilized + 13,058 context-switches # 0.000 M/sec + 64 CPU-migrations # 0.000 M/sec + 55,257 page-faults # 0.000 M/sec + 1,673,716,383,400 cycles # 3.061 GHz [83.33%] + 1,514,986,220,797 stalled-cycles-frontend # 90.52% frontend cycles idle [83.33%] + 625,080,656,461 stalled-cycles-backend # 37.35% backend cycles idle [66.66%] + 299,613,800,760 instructions # 0.18 insns per cycle + # 5.06 stalled cycles per insn [83.33%] + 40,915,862,013 branches # 74.833 M/sec [83.34%] + 20,910,287 branch-misses # 0.05% of all branches [83.34%] + + 547.893249032 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 548287.545724 task-clock # 0.998 CPUs utilized + 12,824 context-switches # 0.000 M/sec + 78 CPU-migrations # 0.000 M/sec + 55,174 page-faults # 0.000 M/sec + 1,678,345,846,454 cycles # 3.061 GHz [83.33%] + 1,519,483,980,886 stalled-cycles-frontend # 90.53% frontend cycles idle [83.34%] + 617,643,582,895 stalled-cycles-backend # 36.80% backend cycles idle [66.66%] + 299,920,288,315 instructions # 0.18 insns per cycle + # 5.07 stalled cycles per insn [83.33%] + 40,977,709,387 branches # 74.738 M/sec [83.33%] + 22,271,141 branch-misses # 0.05% of all branches [83.34%] + + 549.477799232 seconds time elapsed + diff --git a/sankalp/python_output_100 b/sankalp/python_output_100 index 5ab3afa..7179958 100644 --- a/sankalp/python_output_100 +++ b/sankalp/python_output_100 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for 'python MatrixMultiplier.py 100': - 309.630672 task-clock # 0.901 CPUs utilized - 4 context-switches # 0.000 M/sec - 1 CPU-migrations # 0.000 M/sec - 1,676 page-faults # 0.005 M/sec - 946,757,404 cycles # 3.058 GHz [83.22%] - 212,867,613 stalled-cycles-frontend # 22.48% frontend cycles idle [83.24%] - 63,819,070 stalled-cycles-backend # 6.74% backend cycles idle [65.44%] - 1,884,057,121 instructions # 1.99 insns per cycle - # 0.11 stalled cycles per insn [83.30%] - 408,704,860 branches # 1319.975 M/sec [84.60%] - 7,928,681 branch-misses # 1.94% of all branches [83.55%] + 310.595374 task-clock # 0.995 CPUs utilized + 2 context-switches # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec + 1,677 page-faults # 0.005 M/sec + 950,305,447 cycles # 3.060 GHz [83.21%] + 208,977,194 stalled-cycles-frontend # 21.99% frontend cycles idle [83.21%] + 114,820,345 stalled-cycles-backend # 12.08% backend cycles idle [66.85%] + 1,889,541,274 instructions # 1.99 insns per cycle + # 0.11 stalled cycles per insn [83.50%] + 410,537,156 branches # 1321.775 M/sec [83.23%] + 7,787,667 branch-misses # 1.90% of all branches [84.54%] - 0.343684558 seconds time elapsed + 0.312207034 seconds time elapsed Iteration 2 Performance counter stats for 'python MatrixMultiplier.py 100': - 309.810240 task-clock # 0.939 CPUs utilized + 317.375154 task-clock # 0.995 CPUs utilized 2 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 1,677 page-faults # 0.005 M/sec - 946,679,912 cycles # 3.056 GHz [83.28%] - 211,551,237 stalled-cycles-frontend # 22.35% frontend cycles idle [83.28%] - 104,969,613 stalled-cycles-backend # 11.09% backend cycles idle [66.13%] - 1,892,945,019 instructions # 2.00 insns per cycle - # 0.11 stalled cycles per insn [82.89%] - 409,063,013 branches # 1320.366 M/sec [83.32%] - 7,892,268 branch-misses # 1.93% of all branches [84.40%] + 968,794,927 cycles # 3.053 GHz [82.10%] + 235,456,003 stalled-cycles-frontend # 24.30% frontend cycles idle [84.10%] + 126,450,464 stalled-cycles-backend # 13.05% backend cycles idle [67.22%] + 1,886,858,184 instructions # 1.95 insns per cycle + # 0.12 stalled cycles per insn [84.04%] + 410,592,651 branches # 1293.714 M/sec [83.56%] + 7,942,732 branch-misses # 1.93% of all branches [83.62%] - 0.329926008 seconds time elapsed + 0.319033877 seconds time elapsed Iteration 3 Performance counter stats for 'python MatrixMultiplier.py 100': - 307.754121 task-clock # 0.918 CPUs utilized - 3 context-switches # 0.000 M/sec - 2 CPU-migrations # 0.000 M/sec - 1,677 page-faults # 0.005 M/sec - 941,277,678 cycles # 3.059 GHz [83.12%] - 206,091,632 stalled-cycles-frontend # 21.89% frontend cycles idle [83.21%] - 73,096,393 stalled-cycles-backend # 7.77% backend cycles idle [67.02%] - 1,882,387,542 instructions # 2.00 insns per cycle - # 0.11 stalled cycles per insn [83.97%] - 409,667,607 branches # 1331.152 M/sec [83.26%] - 7,918,631 branch-misses # 1.93% of all branches [83.83%] + 314.206104 task-clock # 0.993 CPUs utilized + 2 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 1,676 page-faults # 0.005 M/sec + 952,191,165 cycles # 3.030 GHz [83.38%] + 226,100,081 stalled-cycles-frontend # 23.75% frontend cycles idle [83.56%] + 113,909,956 stalled-cycles-backend # 11.96% backend cycles idle [67.26%] + 1,888,342,829 instructions # 1.98 insns per cycle + # 0.12 stalled cycles per insn [83.75%] + 410,184,188 branches # 1305.462 M/sec [83.46%] + 7,930,634 branch-misses # 1.93% of all branches [83.01%] - 0.335373945 seconds time elapsed + 0.316389357 seconds time elapsed Iteration 4 Performance counter stats for 'python MatrixMultiplier.py 100': - 313.358990 task-clock # 0.925 CPUs utilized - 3 context-switches # 0.000 M/sec - 1 CPU-migrations # 0.000 M/sec + 318.647132 task-clock # 0.993 CPUs utilized + 2 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec 1,677 page-faults # 0.005 M/sec - 954,493,807 cycles # 3.046 GHz [83.43%] - 222,811,750 stalled-cycles-frontend # 23.34% frontend cycles idle [83.43%] - 111,393,953 stalled-cycles-backend # 11.67% backend cycles idle [67.06%] - 1,885,328,197 instructions # 1.98 insns per cycle - # 0.12 stalled cycles per insn [83.68%] - 410,549,506 branches # 1310.157 M/sec [83.30%] - 7,946,380 branch-misses # 1.94% of all branches [83.04%] + 970,010,198 cycles # 3.044 GHz [83.64%] + 249,031,275 stalled-cycles-frontend # 25.67% frontend cycles idle [83.85%] + 113,651,853 stalled-cycles-backend # 11.72% backend cycles idle [66.25%] + 1,881,454,144 instructions # 1.94 insns per cycle + # 0.13 stalled cycles per insn [83.70%] + 409,510,112 branches # 1285.152 M/sec [83.75%] + 7,919,968 branch-misses # 1.93% of all branches [82.85%] - 0.338875999 seconds time elapsed + 0.320770553 seconds time elapsed Iteration 5 Performance counter stats for 'python MatrixMultiplier.py 100': - 309.532625 task-clock # 0.940 CPUs utilized - 3 context-switches # 0.000 M/sec + 309.620454 task-clock # 0.995 CPUs utilized + 2 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 1,677 page-faults # 0.005 M/sec - 946,871,219 cycles # 3.059 GHz [83.28%] - 210,150,718 stalled-cycles-frontend # 22.19% frontend cycles idle [83.04%] - 101,615,670 stalled-cycles-backend # 10.73% backend cycles idle [67.32%] - 1,884,865,391 instructions # 1.99 insns per cycle - # 0.11 stalled cycles per insn [84.02%] - 409,424,874 branches # 1322.720 M/sec [83.44%] - 7,877,566 branch-misses # 1.92% of all branches [83.69%] + 1,676 page-faults # 0.005 M/sec + 946,532,189 cycles # 3.057 GHz [83.19%] + 210,553,105 stalled-cycles-frontend # 22.24% frontend cycles idle [83.23%] + 113,183,915 stalled-cycles-backend # 11.96% backend cycles idle [66.64%] + 1,893,323,130 instructions # 2.00 insns per cycle + # 0.11 stalled cycles per insn [83.24%] + 409,998,761 branches # 1324.198 M/sec [83.31%] + 7,838,513 branch-misses # 1.91% of all branches [84.37%] - 0.329377165 seconds time elapsed + 0.311134204 seconds time elapsed Iteration 6 Performance counter stats for 'python MatrixMultiplier.py 100': - 309.909108 task-clock # 0.916 CPUs utilized - 2 context-switches # 0.000 M/sec + 318.340423 task-clock # 0.994 CPUs utilized + 3 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 1,677 page-faults # 0.005 M/sec - 947,672,806 cycles # 3.058 GHz [83.16%] - 215,893,789 stalled-cycles-frontend # 22.78% frontend cycles idle [83.48%] - 92,382,477 stalled-cycles-backend # 9.75% backend cycles idle [66.10%] - 1,878,061,333 instructions # 1.98 insns per cycle - # 0.11 stalled cycles per insn [83.32%] - 406,940,873 branches # 1313.097 M/sec [84.42%] - 7,925,019 branch-misses # 1.95% of all branches [83.67%] + 971,951,980 cycles # 3.053 GHz [82.61%] + 234,448,727 stalled-cycles-frontend # 24.12% frontend cycles idle [83.63%] + 118,368,059 stalled-cycles-backend # 12.18% backend cycles idle [67.48%] + 1,893,410,464 instructions # 1.95 insns per cycle + # 0.12 stalled cycles per insn [83.70%] + 409,296,419 branches # 1285.719 M/sec [83.89%] + 7,987,643 branch-misses # 1.95% of all branches [83.04%] - 0.338324604 seconds time elapsed + 0.320257431 seconds time elapsed Iteration 7 Performance counter stats for 'python MatrixMultiplier.py 100': - 312.018739 task-clock # 0.927 CPUs utilized + 313.579500 task-clock # 0.991 CPUs utilized 2 context-switches # 0.000 M/sec - 1 CPU-migrations # 0.000 M/sec - 1,677 page-faults # 0.005 M/sec - 954,723,282 cycles # 3.060 GHz [83.46%] - 212,491,394 stalled-cycles-frontend # 22.26% frontend cycles idle [83.38%] - 85,512,351 stalled-cycles-backend # 8.96% backend cycles idle [66.64%] - 1,880,918,004 instructions # 1.97 insns per cycle - # 0.11 stalled cycles per insn [83.37%] - 409,713,240 branches # 1313.105 M/sec [83.32%] - 7,930,123 branch-misses # 1.94% of all branches [83.49%] + 0 CPU-migrations # 0.000 M/sec + 1,676 page-faults # 0.005 M/sec + 949,176,021 cycles # 3.027 GHz [83.01%] + 228,235,538 stalled-cycles-frontend # 24.05% frontend cycles idle [83.85%] + 114,803,497 stalled-cycles-backend # 12.10% backend cycles idle [67.14%] + 1,891,305,914 instructions # 1.99 insns per cycle + # 0.12 stalled cycles per insn [83.78%] + 410,801,526 branches # 1310.039 M/sec [83.50%] + 7,908,011 branch-misses # 1.93% of all branches [83.37%] - 0.336552045 seconds time elapsed + 0.316310514 seconds time elapsed Iteration 8 Performance counter stats for 'python MatrixMultiplier.py 100': - 311.949662 task-clock # 0.915 CPUs utilized + 311.678671 task-clock # 0.995 CPUs utilized 3 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 1,676 page-faults # 0.005 M/sec - 953,568,526 cycles # 3.057 GHz [83.29%] - 220,879,860 stalled-cycles-frontend # 23.16% frontend cycles idle [83.41%] - 95,581,611 stalled-cycles-backend # 10.02% backend cycles idle [66.64%] - 1,888,017,871 instructions # 1.98 insns per cycle - # 0.12 stalled cycles per insn [83.26%] - 409,626,977 branches # 1313.119 M/sec [83.40%] - 7,853,768 branch-misses # 1.92% of all branches [84.14%] + 1,677 page-faults # 0.005 M/sec + 952,970,698 cycles # 3.058 GHz [83.55%] + 219,662,189 stalled-cycles-frontend # 23.05% frontend cycles idle [83.21%] + 114,701,620 stalled-cycles-backend # 12.04% backend cycles idle [65.68%] + 1,881,293,638 instructions # 1.97 insns per cycle + # 0.12 stalled cycles per insn [83.24%] + 407,180,681 branches # 1306.412 M/sec [84.60%] + 7,910,731 branch-misses # 1.94% of all branches [83.53%] - 0.340900825 seconds time elapsed + 0.313387753 seconds time elapsed Iteration 9 Performance counter stats for 'python MatrixMultiplier.py 100': - 311.984667 task-clock # 0.939 CPUs utilized - 3 context-switches # 0.000 M/sec - 1 CPU-migrations # 0.000 M/sec - 1,677 page-faults # 0.005 M/sec - 948,431,759 cycles # 3.040 GHz [83.35%] - 222,625,163 stalled-cycles-frontend # 23.47% frontend cycles idle [83.45%] - 87,610,769 stalled-cycles-backend # 9.24% backend cycles idle [67.49%] - 1,883,279,034 instructions # 1.99 insns per cycle - # 0.12 stalled cycles per insn [84.22%] - 409,864,722 branches # 1313.734 M/sec [83.51%] - 7,971,632 branch-misses # 1.94% of all branches [82.71%] + 313.124990 task-clock # 0.994 CPUs utilized + 2 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 1,676 page-faults # 0.005 M/sec + 956,698,466 cycles # 3.055 GHz [83.50%] + 223,911,216 stalled-cycles-frontend # 23.40% frontend cycles idle [83.42%] + 115,882,792 stalled-cycles-backend # 12.11% backend cycles idle [67.14%] + 1,882,183,891 instructions # 1.97 insns per cycle + # 0.12 stalled cycles per insn [83.69%] + 410,823,001 branches # 1312.010 M/sec [83.30%] + 7,796,918 branch-misses # 1.90% of all branches [83.70%] - 0.332133520 seconds time elapsed + 0.314875304 seconds time elapsed Iteration 10 Performance counter stats for 'python MatrixMultiplier.py 100': - 312.281585 task-clock # 0.924 CPUs utilized - 2 context-switches # 0.000 M/sec + 312.917352 task-clock # 0.995 CPUs utilized + 3 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 1,677 page-faults # 0.005 M/sec - 953,498,584 cycles # 3.053 GHz [83.28%] - 219,264,614 stalled-cycles-frontend # 23.00% frontend cycles idle [83.50%] - 129,042,533 stalled-cycles-backend # 13.53% backend cycles idle [66.84%] - 1,888,368,126 instructions # 1.98 insns per cycle - # 0.12 stalled cycles per insn [83.48%] - 409,597,520 branches # 1311.629 M/sec [83.44%] - 7,947,842 branch-misses # 1.94% of all branches [83.03%] - - 0.337871973 seconds time elapsed + 1,676 page-faults # 0.005 M/sec + 953,503,523 cycles # 3.047 GHz [83.52%] + 221,432,711 stalled-cycles-frontend # 23.22% frontend cycles idle [83.33%] + 118,735,335 stalled-cycles-backend # 12.45% backend cycles idle [66.92%] + 1,895,676,857 instructions # 1.99 insns per cycle + # 0.12 stalled cycles per insn [83.27%] + 409,307,868 branches # 1308.038 M/sec [83.60%] + 7,932,060 branch-misses # 1.94% of all branches [82.88%] + + 0.314535722 seconds time elapsed diff --git a/sankalp/python_output_1000 b/sankalp/python_output_1000 index 297bd4b..daa13b6 100644 --- a/sankalp/python_output_1000 +++ b/sankalp/python_output_1000 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for 'python MatrixMultiplier.py 1000': - 267280.814532 task-clock # 0.997 CPUs utilized - 618 context-switches # 0.000 M/sec - 12 CPU-migrations # 0.000 M/sec + 269282.747218 task-clock # 0.997 CPUs utilized + 399 context-switches # 0.000 M/sec + 5 CPU-migrations # 0.000 M/sec 14,191 page-faults # 0.000 M/sec - 818,286,395,614 cycles # 3.062 GHz [83.33%] - 180,604,814,729 stalled-cycles-frontend # 22.07% frontend cycles idle [83.33%] - 105,054,409,109 stalled-cycles-backend # 12.84% backend cycles idle [66.67%] - 1,675,451,103,916 instructions # 2.05 insns per cycle + 824,332,821,090 cycles # 3.061 GHz [83.33%] + 184,047,857,986 stalled-cycles-frontend # 22.33% frontend cycles idle [83.33%] + 113,724,809,194 stalled-cycles-backend # 13.80% backend cycles idle [66.67%] + 1,675,622,016,239 instructions # 2.03 insns per cycle # 0.11 stalled cycles per insn [83.33%] - 368,032,473,888 branches # 1376.951 M/sec [83.33%] - 6,799,436,812 branch-misses # 1.85% of all branches [83.33%] + 368,064,088,818 branches # 1366.831 M/sec [83.33%] + 6,801,038,963 branch-misses # 1.85% of all branches [83.33%] - 267.974093315 seconds time elapsed + 269.959034322 seconds time elapsed Iteration 2 Performance counter stats for 'python MatrixMultiplier.py 1000': - 272457.321966 task-clock # 0.997 CPUs utilized - 394 context-switches # 0.000 M/sec - 8 CPU-migrations # 0.000 M/sec + 267375.571056 task-clock # 0.997 CPUs utilized + 630 context-switches # 0.000 M/sec + 3 CPU-migrations # 0.000 M/sec 14,192 page-faults # 0.000 M/sec - 834,049,245,426 cycles # 3.061 GHz [83.33%] - 196,463,689,527 stalled-cycles-frontend # 23.56% frontend cycles idle [83.33%] - 116,885,123,956 stalled-cycles-backend # 14.01% backend cycles idle [66.67%] - 1,675,713,892,162 instructions # 2.01 insns per cycle - # 0.12 stalled cycles per insn [83.33%] - 368,082,576,307 branches # 1350.973 M/sec [83.33%] - 6,809,192,349 branch-misses # 1.85% of all branches [83.33%] + 818,590,575,447 cycles # 3.062 GHz [83.33%] + 180,175,917,569 stalled-cycles-frontend # 22.01% frontend cycles idle [83.33%] + 98,729,139,584 stalled-cycles-backend # 12.06% backend cycles idle [66.67%] + 1,675,448,445,333 instructions # 2.05 insns per cycle + # 0.11 stalled cycles per insn [83.33%] + 368,047,151,115 branches # 1376.517 M/sec [83.33%] + 6,801,684,659 branch-misses # 1.85% of all branches [83.33%] - 273.141445282 seconds time elapsed + 268.052131536 seconds time elapsed Iteration 3 Performance counter stats for 'python MatrixMultiplier.py 1000': - 269214.913459 task-clock # 0.997 CPUs utilized - 377 context-switches # 0.000 M/sec - 16 CPU-migrations # 0.000 M/sec + 270536.297082 task-clock # 0.997 CPUs utilized + 385 context-switches # 0.000 M/sec + 7 CPU-migrations # 0.000 M/sec 14,192 page-faults # 0.000 M/sec - 824,184,535,691 cycles # 3.061 GHz [83.33%] - 185,016,771,239 stalled-cycles-frontend # 22.45% frontend cycles idle [83.33%] - 112,245,834,876 stalled-cycles-backend # 13.62% backend cycles idle [66.67%] - 1,675,618,159,052 instructions # 2.03 insns per cycle + 828,177,247,407 cycles # 3.061 GHz [83.33%] + 190,302,828,758 stalled-cycles-frontend # 22.98% frontend cycles idle [83.33%] + 111,509,216,863 stalled-cycles-backend # 13.46% backend cycles idle [66.67%] + 1,675,651,972,999 instructions # 2.02 insns per cycle # 0.11 stalled cycles per insn [83.33%] - 368,067,256,574 branches # 1367.187 M/sec [83.33%] - 6,792,464,919 branch-misses # 1.85% of all branches [83.33%] + 368,065,321,647 branches # 1360.503 M/sec [83.33%] + 6,802,010,625 branch-misses # 1.85% of all branches [83.33%] - 269.890848007 seconds time elapsed + 271.216315241 seconds time elapsed Iteration 4 Performance counter stats for 'python MatrixMultiplier.py 1000': - 270243.943203 task-clock # 0.997 CPUs utilized - 389 context-switches # 0.000 M/sec - 38 CPU-migrations # 0.000 M/sec + 267143.335703 task-clock # 0.997 CPUs utilized + 631 context-switches # 0.000 M/sec + 3 CPU-migrations # 0.000 M/sec 14,192 page-faults # 0.000 M/sec - 827,327,544,769 cycles # 3.061 GHz [83.33%] - 189,627,024,293 stalled-cycles-frontend # 22.92% frontend cycles idle [83.33%] - 112,487,969,169 stalled-cycles-backend # 13.60% backend cycles idle [66.67%] - 1,675,633,568,320 instructions # 2.03 insns per cycle + 817,877,099,883 cycles # 3.062 GHz [83.33%] + 177,863,330,934 stalled-cycles-frontend # 21.75% frontend cycles idle [83.33%] + 104,333,252,905 stalled-cycles-backend # 12.76% backend cycles idle [66.67%] + 1,675,414,737,246 instructions # 2.05 insns per cycle # 0.11 stalled cycles per insn [83.33%] - 368,073,749,361 branches # 1362.006 M/sec [83.33%] - 6,792,047,631 branch-misses # 1.85% of all branches [83.33%] + 368,030,482,689 branches # 1377.652 M/sec [83.33%] + 6,804,610,204 branch-misses # 1.85% of all branches [83.33%] - 270.923142149 seconds time elapsed + 267.820554414 seconds time elapsed Iteration 5 Performance counter stats for 'python MatrixMultiplier.py 1000': - 269233.488892 task-clock # 0.997 CPUs utilized - 391 context-switches # 0.000 M/sec - 7 CPU-migrations # 0.000 M/sec + 270786.976270 task-clock # 0.997 CPUs utilized + 392 context-switches # 0.000 M/sec + 8 CPU-migrations # 0.000 M/sec 14,192 page-faults # 0.000 M/sec - 824,229,800,983 cycles # 3.061 GHz [83.33%] - 184,441,623,933 stalled-cycles-frontend # 22.38% frontend cycles idle [83.33%] - 112,599,539,674 stalled-cycles-backend # 13.66% backend cycles idle [66.67%] - 1,675,645,540,946 instructions # 2.03 insns per cycle + 828,955,726,200 cycles # 3.061 GHz [83.33%] + 191,131,185,033 stalled-cycles-frontend # 23.06% frontend cycles idle [83.33%] + 110,784,470,024 stalled-cycles-backend # 13.36% backend cycles idle [66.66%] + 1,675,621,686,314 instructions # 2.02 insns per cycle # 0.11 stalled cycles per insn [83.33%] - 368,073,051,507 branches # 1367.115 M/sec [83.33%] - 6,801,591,839 branch-misses # 1.85% of all branches [83.33%] + 368,063,843,470 branches # 1359.238 M/sec [83.33%] + 6,796,925,570 branch-misses # 1.85% of all branches [83.33%] - 269.909263784 seconds time elapsed + 271.467826332 seconds time elapsed Iteration 6 Performance counter stats for 'python MatrixMultiplier.py 1000': - 270924.199539 task-clock # 0.997 CPUs utilized - 392 context-switches # 0.000 M/sec - 5 CPU-migrations # 0.000 M/sec + 266481.557526 task-clock # 0.997 CPUs utilized + 682 context-switches # 0.000 M/sec + 3 CPU-migrations # 0.000 M/sec 14,191 page-faults # 0.000 M/sec - 829,404,152,812 cycles # 3.061 GHz [83.33%] - 191,576,161,764 stalled-cycles-frontend # 23.10% frontend cycles idle [83.33%] - 109,757,553,847 stalled-cycles-backend # 13.23% backend cycles idle [66.67%] - 1,675,651,122,253 instructions # 2.02 insns per cycle - # 0.11 stalled cycles per insn [83.33%] - 368,061,317,346 branches # 1358.540 M/sec [83.33%] - 6,800,629,641 branch-misses # 1.85% of all branches [83.33%] + 815,865,288,439 cycles # 3.062 GHz [83.33%] + 174,967,867,583 stalled-cycles-frontend # 21.45% frontend cycles idle [83.33%] + 103,802,945,276 stalled-cycles-backend # 12.72% backend cycles idle [66.67%] + 1,675,408,073,433 instructions # 2.05 insns per cycle + # 0.10 stalled cycles per insn [83.33%] + 368,018,560,950 branches # 1381.028 M/sec [83.33%] + 6,808,676,461 branch-misses # 1.85% of all branches [83.33%] - 271.604913915 seconds time elapsed + 267.176207471 seconds time elapsed Iteration 7 Performance counter stats for 'python MatrixMultiplier.py 1000': - 267138.407719 task-clock # 0.997 CPUs utilized - 571 context-switches # 0.000 M/sec - 16 CPU-migrations # 0.000 M/sec - 14,192 page-faults # 0.000 M/sec - 817,746,930,697 cycles # 3.061 GHz [83.33%] - 179,545,380,139 stalled-cycles-frontend # 21.96% frontend cycles idle [83.33%] - 102,411,013,679 stalled-cycles-backend # 12.52% backend cycles idle [66.67%] - 1,675,464,943,177 instructions # 2.05 insns per cycle - # 0.11 stalled cycles per insn [83.33%] - 368,036,073,449 branches # 1377.698 M/sec [83.33%] - 6,799,103,875 branch-misses # 1.85% of all branches [83.33%] + 270991.243058 task-clock # 0.997 CPUs utilized + 394 context-switches # 0.000 M/sec + 5 CPU-migrations # 0.000 M/sec + 14,191 page-faults # 0.000 M/sec + 829,550,545,038 cycles # 3.061 GHz [83.33%] + 193,114,889,886 stalled-cycles-frontend # 23.28% frontend cycles idle [83.33%] + 104,913,989,265 stalled-cycles-backend # 12.65% backend cycles idle [66.67%] + 1,675,622,166,992 instructions # 2.02 insns per cycle + # 0.12 stalled cycles per insn [83.33%] + 368,073,492,609 branches # 1358.249 M/sec [83.33%] + 6,789,236,703 branch-misses # 1.84% of all branches [83.33%] - 267.813587562 seconds time elapsed + 271.673019731 seconds time elapsed Iteration 8 Performance counter stats for 'python MatrixMultiplier.py 1000': - 266004.784787 task-clock # 0.997 CPUs utilized - 2,997 context-switches # 0.000 M/sec - 9 CPU-migrations # 0.000 M/sec - 14,192 page-faults # 0.000 M/sec - 814,343,717,270 cycles # 3.061 GHz [83.33%] - 175,078,806,513 stalled-cycles-frontend # 21.50% frontend cycles idle [83.33%] - 102,777,765,524 stalled-cycles-backend # 12.62% backend cycles idle [66.67%] - 1,675,461,872,198 instructions # 2.06 insns per cycle - # 0.10 stalled cycles per insn [83.33%] - 368,038,416,864 branches # 1383.578 M/sec [83.33%] - 6,793,612,297 branch-misses # 1.85% of all branches [83.33%] + 269957.671129 task-clock # 0.997 CPUs utilized + 385 context-switches # 0.000 M/sec + 8 CPU-migrations # 0.000 M/sec + 14,191 page-faults # 0.000 M/sec + 826,371,949,154 cycles # 3.061 GHz [83.33%] + 186,319,358,104 stalled-cycles-frontend # 22.55% frontend cycles idle [83.33%] + 110,557,057,319 stalled-cycles-backend # 13.38% backend cycles idle [66.67%] + 1,675,653,988,579 instructions # 2.03 insns per cycle + # 0.11 stalled cycles per insn [83.33%] + 368,074,137,717 branches # 1363.451 M/sec [83.33%] + 6,801,014,501 branch-misses # 1.85% of all branches [83.33%] - 266.694441514 seconds time elapsed + 270.643451433 seconds time elapsed Iteration 9 Performance counter stats for 'python MatrixMultiplier.py 1000': - 266997.466078 task-clock # 0.997 CPUs utilized - 584 context-switches # 0.000 M/sec - 16 CPU-migrations # 0.000 M/sec + 266655.793295 task-clock # 0.997 CPUs utilized + 360 context-switches # 0.000 M/sec + 12 CPU-migrations # 0.000 M/sec 14,191 page-faults # 0.000 M/sec - 817,276,456,257 cycles # 3.061 GHz [83.33%] - 179,119,347,530 stalled-cycles-frontend # 21.92% frontend cycles idle [83.33%] - 105,092,501,446 stalled-cycles-backend # 12.86% backend cycles idle [66.67%] - 1,675,426,259,219 instructions # 2.05 insns per cycle - # 0.11 stalled cycles per insn [83.33%] - 368,045,895,215 branches # 1378.462 M/sec [83.33%] - 6,800,401,406 branch-misses # 1.85% of all branches [83.33%] + 814,924,829,284 cycles # 3.056 GHz [83.33%] + 175,516,485,947 stalled-cycles-frontend # 21.54% frontend cycles idle [83.33%] + 103,063,698,100 stalled-cycles-backend # 12.65% backend cycles idle [66.67%] + 1,675,341,118,528 instructions # 2.06 insns per cycle + # 0.10 stalled cycles per insn [83.33%] + 368,025,542,159 branches # 1380.152 M/sec [83.33%] + 6,794,780,148 branch-misses # 1.85% of all branches [83.33%] - 267.671841948 seconds time elapsed + 267.326775664 seconds time elapsed Iteration 10 Performance counter stats for 'python MatrixMultiplier.py 1000': - 268668.245846 task-clock # 0.997 CPUs utilized - 526 context-switches # 0.000 M/sec - 15 CPU-migrations # 0.000 M/sec + 267167.128601 task-clock # 0.997 CPUs utilized + 613 context-switches # 0.000 M/sec + 3 CPU-migrations # 0.000 M/sec 14,191 page-faults # 0.000 M/sec - 822,518,004,071 cycles # 3.061 GHz [83.33%] - 183,378,969,649 stalled-cycles-frontend # 22.29% frontend cycles idle [83.33%] - 111,191,115,504 stalled-cycles-backend # 13.52% backend cycles idle [66.67%] - 1,675,475,742,837 instructions # 2.04 insns per cycle + 817,945,425,517 cycles # 3.062 GHz [83.33%] + 177,423,498,342 stalled-cycles-frontend # 21.69% frontend cycles idle [83.33%] + 103,607,614,525 stalled-cycles-backend # 12.67% backend cycles idle [66.67%] + 1,675,455,127,498 instructions # 2.05 insns per cycle # 0.11 stalled cycles per insn [83.33%] - 368,056,693,946 branches # 1369.930 M/sec [83.33%] - 6,783,515,299 branch-misses # 1.84% of all branches [83.33%] + 368,044,081,352 branches # 1377.580 M/sec [83.33%] + 6,808,538,361 branch-misses # 1.85% of all branches [83.33%] - 269.345677227 seconds time elapsed + 267.844663061 seconds time elapsed diff --git a/sankalp/python_output_3000 b/sankalp/python_output_3000 new file mode 100644 index 0000000..fce7978 --- /dev/null +++ b/sankalp/python_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7523810.309535 task-clock # 0.997 CPUs utilized + 9,751 context-switches # 0.000 M/sec + 8 CPU-migrations # 0.000 M/sec + 114,447 page-faults # 0.000 M/sec +23,034,818,294,027 cycles # 3.062 GHz [83.33%] + 5,968,883,838,194 stalled-cycles-frontend # 25.91% frontend cycles idle [83.33%] + 4,880,944,759,305 stalled-cycles-backend # 21.19% backend cycles idle [66.67%] +44,998,941,716,288 instructions # 1.95 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,897,609,637,503 branches # 1315.505 M/sec [83.33%] + 183,578,089,307 branch-misses # 1.85% of all branches [83.33%] + + 7542.694127137 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7498643.490297 task-clock # 0.997 CPUs utilized + 19,051 context-switches # 0.000 M/sec + 31 CPU-migrations # 0.000 M/sec + 114,446 page-faults # 0.000 M/sec +22,951,558,904,261 cycles # 3.061 GHz [83.33%] + 5,832,251,128,139 stalled-cycles-frontend # 25.41% frontend cycles idle [83.33%] + 3,618,097,374,083 stalled-cycles-backend # 15.76% backend cycles idle [66.67%] +44,999,411,660,202 instructions # 1.96 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,897,544,359,143 branches # 1319.911 M/sec [83.33%] + 183,740,042,922 branch-misses # 1.86% of all branches [83.33%] + + 7517.591400120 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7483792.891740 task-clock # 0.997 CPUs utilized + 22,969 context-switches # 0.000 M/sec + 22 CPU-migrations # 0.000 M/sec + 114,446 page-faults # 0.000 M/sec +22,912,468,249,119 cycles # 3.062 GHz [83.33%] + 5,856,707,430,611 stalled-cycles-frontend # 25.56% frontend cycles idle [83.33%] + 3,455,911,751,229 stalled-cycles-backend # 15.08% backend cycles idle [66.67%] +44,999,614,162,598 instructions # 1.96 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,897,554,607,056 branches # 1322.532 M/sec [83.33%] + 183,410,877,949 branch-misses # 1.85% of all branches [83.33%] + + 7502.761384304 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7549522.903096 task-clock # 0.997 CPUs utilized + 23,441 context-switches # 0.000 M/sec + 32 CPU-migrations # 0.000 M/sec + 114,447 page-faults # 0.000 M/sec +23,113,526,053,863 cycles # 3.062 GHz [83.33%] + 6,255,990,972,442 stalled-cycles-frontend # 27.07% frontend cycles idle [83.33%] + 3,731,224,987,519 stalled-cycles-backend # 16.14% backend cycles idle [66.67%] +44,999,604,113,259 instructions # 1.95 insns per cycle + # 0.14 stalled cycles per insn [83.33%] + 9,897,591,589,417 branches # 1311.022 M/sec [83.33%] + 183,158,257,498 branch-misses # 1.85% of all branches [83.33%] + + 7568.657794504 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7555363.394251 task-clock # 0.997 CPUs utilized + 18,629 context-switches # 0.000 M/sec + 58 CPU-migrations # 0.000 M/sec + 114,447 page-faults # 0.000 M/sec +23,130,554,145,427 cycles # 3.061 GHz [83.33%] + 6,061,009,314,946 stalled-cycles-frontend # 26.20% frontend cycles idle [83.33%] + 3,605,997,031,545 stalled-cycles-backend # 15.59% backend cycles idle [66.67%] +45,002,350,539,512 instructions # 1.95 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,898,112,358,093 branches # 1310.078 M/sec [83.33%] + 183,597,319,733 branch-misses # 1.85% of all branches [83.33%] + + 7574.440265690 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7610335.221888 task-clock # 0.997 CPUs utilized + 105,302 context-switches # 0.000 M/sec + 108 CPU-migrations # 0.000 M/sec + 114,447 page-faults # 0.000 M/sec +23,293,714,648,979 cycles # 3.061 GHz [83.33%] + 6,206,749,761,668 stalled-cycles-frontend # 26.65% frontend cycles idle [83.33%] + 3,824,341,662,716 stalled-cycles-backend # 16.42% backend cycles idle [66.67%] +45,006,031,070,183 instructions # 1.93 insns per cycle + # 0.14 stalled cycles per insn [83.33%] + 9,898,867,944,732 branches # 1300.714 M/sec [83.33%] + 183,658,672,714 branch-misses # 1.86% of all branches [83.33%] + + 7631.555253916 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7464989.755747 task-clock # 0.998 CPUs utilized + 9,420 context-switches # 0.000 M/sec + 12 CPU-migrations # 0.000 M/sec + 114,446 page-faults # 0.000 M/sec +22,854,732,878,961 cycles # 3.062 GHz [83.33%] + 5,775,378,736,735 stalled-cycles-frontend # 25.27% frontend cycles idle [83.33%] + 3,825,353,159,613 stalled-cycles-backend # 16.74% backend cycles idle [66.67%] +44,999,115,833,895 instructions # 1.97 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,897,565,422,599 branches # 1325.865 M/sec [83.33%] + 183,420,495,811 branch-misses # 1.85% of all branches [83.33%] + + 7483.692644492 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7555610.198573 task-clock # 0.997 CPUs utilized + 89,590 context-switches # 0.000 M/sec + 642 CPU-migrations # 0.000 M/sec + 114,446 page-faults # 0.000 M/sec +23,099,935,439,113 cycles # 3.057 GHz [83.33%] + 6,057,433,380,007 stalled-cycles-frontend # 26.22% frontend cycles idle [83.33%] + 3,566,096,589,507 stalled-cycles-backend # 15.44% backend cycles idle [66.67%] +45,000,051,037,611 instructions # 1.95 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,897,877,108,270 branches # 1310.004 M/sec [83.33%] + 183,378,353,145 branch-misses # 1.85% of all branches [83.33%] + + 7576.476900949 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7493653.279874 task-clock # 0.997 CPUs utilized + 10,320 context-switches # 0.000 M/sec + 101 CPU-migrations # 0.000 M/sec + 114,447 page-faults # 0.000 M/sec +22,916,625,486,398 cycles # 3.058 GHz [83.33%] + 5,815,540,864,650 stalled-cycles-frontend # 25.38% frontend cycles idle [83.33%] + 3,618,177,935,613 stalled-cycles-backend # 15.79% backend cycles idle [66.67%] +45,002,457,894,219 instructions # 1.96 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,897,894,738,132 branches # 1320.837 M/sec [83.33%] + 183,576,494,427 branch-misses # 1.85% of all branches [83.33%] + + 7512.482340293 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'python MatrixMultiplier.py 3000': + + 7548991.984084 task-clock # 0.997 CPUs utilized + 9,907 context-switches # 0.000 M/sec + 65 CPU-migrations # 0.000 M/sec + 114,447 page-faults # 0.000 M/sec +23,084,767,596,054 cycles # 3.058 GHz [83.33%] + 5,979,164,330,026 stalled-cycles-frontend # 25.90% frontend cycles idle [83.33%] + 3,688,713,485,327 stalled-cycles-backend # 15.98% backend cycles idle [66.67%] +45,002,278,293,577 instructions # 1.95 insns per cycle + # 0.13 stalled cycles per insn [83.33%] + 9,898,235,501,388 branches # 1311.200 M/sec [83.33%] + 183,446,892,349 branch-misses # 1.85% of all branches [83.33%] + + 7567.915102659 seconds time elapsed + From 509014083323141b7c0d8f60784d2291e79cf1ea Mon Sep 17 00:00:00 2001 From: shrutir25 Date: Thu, 12 Feb 2015 17:16:52 -0500 Subject: [PATCH 02/11] Create MatrixMultiply.py --- MatrixMultiply.py | 47 +++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 47 insertions(+) create mode 100644 MatrixMultiply.py diff --git a/MatrixMultiply.py b/MatrixMultiply.py new file mode 100644 index 0000000..d567a9d --- /dev/null +++ b/MatrixMultiply.py @@ -0,0 +1,47 @@ +import sys +import random +import threading +from threading import Thread + +matrixDim = int(sys.argv[1]) +randomMaxValue = 100 +t1 = [0 for i in range(matrixDim)] + +## INITIALISING MATRICES A B C + +matrixA = [[0 for i in range(matrixDim)] for j in range(matrixDim)] +matrixB = [[0 for i in range(matrixDim)] for j in range(matrixDim)] +matrixC = [[0 for i in range(matrixDim)] for j in range(matrixDim)] + +for i in range (0,matrixDim): + for j in range (0,matrixDim): + + matrixA[i][j] = random.randint(0, randomMaxValue) + matrixB[i][j] = random.randint(0, randomMaxValue) + +## DEFINING THREAD + +def MyThread1(arg): + + + for j in range(0,matrixDim): + for k in range (0,matrixDim): + matrixC[arg][j] += matrixA[arg][k] * matrixB[k][j] + + + + pass + +def printMat(): + for i in range (0, matrixDim): + print "\n" + for j in range (0,matrixDim): + print str(matrixC[i][j]) + " ", + + +for i in range (0,matrixDim): + t1[i] = threading.Thread(target=MyThread1, args=(i, )) + t1[i].start() + +for i in range (0,matrixDim): + t1[i].join() From bc5e434b313acc2ca7903cb3a9b643077e3dc7d7 Mon Sep 17 00:00:00 2001 From: Sankalp Date: Thu, 12 Feb 2015 20:17:36 -0500 Subject: [PATCH 03/11] final --- MatrixMultiply.py | 23 +- finalExperimentRuns/MatrixMultiplier.class | Bin 0 -> 1877 bytes finalExperimentRuns/MatrixMultiplier.java | 134 ++++++++++ finalExperimentRuns/MatrixMultiplier.py | 73 ++++++ finalExperimentRuns/MatrixMultiplier_clean.py | 22 ++ finalExperimentRuns/README.MD | 1 + finalExperimentRuns/clang_output_10 | 180 +++++++++++++ finalExperimentRuns/clang_output_100 | 180 +++++++++++++ finalExperimentRuns/clang_output_1000 | 180 +++++++++++++ finalExperimentRuns/clang_output_3000 | 180 +++++++++++++ finalExperimentRuns/clang_output_optimized_10 | 180 +++++++++++++ .../clang_output_optimized_100 | 180 +++++++++++++ .../clang_output_optimized_1000 | 180 +++++++++++++ .../clang_output_optimized_3000 | 180 +++++++++++++ finalExperimentRuns/gcc_output_10 | 180 +++++++++++++ finalExperimentRuns/gcc_output_100 | 180 +++++++++++++ finalExperimentRuns/gcc_output_1000 | 180 +++++++++++++ finalExperimentRuns/gcc_output_3000 | 180 +++++++++++++ finalExperimentRuns/gcc_output_optimized_10 | 180 +++++++++++++ finalExperimentRuns/gcc_output_optimized_100 | 180 +++++++++++++ finalExperimentRuns/gcc_output_optimized_1000 | 180 +++++++++++++ finalExperimentRuns/gcc_output_optimized_3000 | 180 +++++++++++++ finalExperimentRuns/java_output_10 | 180 +++++++++++++ finalExperimentRuns/java_output_100 | 180 +++++++++++++ finalExperimentRuns/java_output_1000 | 180 +++++++++++++ finalExperimentRuns/java_output_3000 | 180 +++++++++++++ finalExperimentRuns/matrixMultiply | Bin 0 -> 13242 bytes finalExperimentRuns/matrixMultiply.c | 157 ++++++++++++ finalExperimentRuns/matrixMultiply_clang | Bin 0 -> 13277 bytes .../matrixMultiply_clang_optimized | Bin 0 -> 13285 bytes .../matrixMultiply_gcc_optimized | Bin 0 -> 13203 bytes finalExperimentRuns/matrixMultiply_mod.c | 157 ++++++++++++ finalExperimentRuns/python_output_10 | 180 +++++++++++++ finalExperimentRuns/python_output_100 | 180 +++++++++++++ finalExperimentRuns/python_output_1000 | 180 +++++++++++++ finalExperimentRuns/python_output_3000 | 180 +++++++++++++ finalExperimentRuns/script.sh | 35 +++ .../threading/.MatrixMultiplier.java.swp | Bin 0 -> 12288 bytes .../MatrixMultiplier$ThreadMultiply.class | Bin 0 -> 699 bytes .../threading/MatrixMultiplier.class | Bin 0 -> 2457 bytes .../threading/MatrixMultiplier.java | 181 +++++++++++++ .../MatrixMultiplierNew$ThreadMultiply.class | Bin 0 -> 736 bytes .../threading/MatrixMultiplierNew.class | Bin 0 -> 2675 bytes .../threading/MatrixMultiplierNew.java | 193 ++++++++++++++ finalExperimentRuns/threading/matrixMultiply | Bin 0 -> 13348 bytes .../threading/matrixMultiply.c | 203 +++++++++++++++ .../threading/matrixMultiply_clang | Bin 0 -> 13383 bytes .../threading/matrixMultiply_new | Bin 0 -> 13352 bytes .../threading/matrixMultiply_new.c | 240 +++++++++++++++++ sankalp/clang_output_10 | 170 ++++++------ sankalp/clang_output_10000 | 1 - sankalp/clang_output_optimized_10 | 180 +++++++++++++ sankalp/gcc_output_10 | 176 ++++++------- sankalp/gcc_output_10000 | 1 - sankalp/gcc_output_optimized_10 | 180 +++++++++++++ sankalp/java_output_10 | 242 +++++++++--------- sankalp/java_output_10000 | 1 - sankalp/matrixMultiply_clang_optimized | Bin 0 -> 13285 bytes sankalp/matrixMultiply_gcc_optimized | Bin 0 -> 13203 bytes sankalp/matrixMultiply_mod.c | 157 ++++++++++++ sankalp/python_output_10 | 204 +++++++-------- sankalp/python_output_10000 | 1 - sankalp/script.sh | 12 +- sankalp/threading/matrixMultiply_clang | Bin 0 -> 13383 bytes 64 files changed, 6653 insertions(+), 411 deletions(-) create mode 100644 finalExperimentRuns/MatrixMultiplier.class create mode 100644 finalExperimentRuns/MatrixMultiplier.java create mode 100644 finalExperimentRuns/MatrixMultiplier.py create mode 100644 finalExperimentRuns/MatrixMultiplier_clean.py create mode 100644 finalExperimentRuns/README.MD create mode 100644 finalExperimentRuns/clang_output_10 create mode 100644 finalExperimentRuns/clang_output_100 create mode 100644 finalExperimentRuns/clang_output_1000 create mode 100644 finalExperimentRuns/clang_output_3000 create mode 100644 finalExperimentRuns/clang_output_optimized_10 create mode 100644 finalExperimentRuns/clang_output_optimized_100 create mode 100644 finalExperimentRuns/clang_output_optimized_1000 create mode 100644 finalExperimentRuns/clang_output_optimized_3000 create mode 100644 finalExperimentRuns/gcc_output_10 create mode 100644 finalExperimentRuns/gcc_output_100 create mode 100644 finalExperimentRuns/gcc_output_1000 create mode 100644 finalExperimentRuns/gcc_output_3000 create mode 100644 finalExperimentRuns/gcc_output_optimized_10 create mode 100644 finalExperimentRuns/gcc_output_optimized_100 create mode 100644 finalExperimentRuns/gcc_output_optimized_1000 create mode 100644 finalExperimentRuns/gcc_output_optimized_3000 create mode 100644 finalExperimentRuns/java_output_10 create mode 100644 finalExperimentRuns/java_output_100 create mode 100644 finalExperimentRuns/java_output_1000 create mode 100644 finalExperimentRuns/java_output_3000 create mode 100755 finalExperimentRuns/matrixMultiply create mode 100644 finalExperimentRuns/matrixMultiply.c create mode 100755 finalExperimentRuns/matrixMultiply_clang create mode 100755 finalExperimentRuns/matrixMultiply_clang_optimized create mode 100755 finalExperimentRuns/matrixMultiply_gcc_optimized create mode 100644 finalExperimentRuns/matrixMultiply_mod.c create mode 100644 finalExperimentRuns/python_output_10 create mode 100644 finalExperimentRuns/python_output_100 create mode 100644 finalExperimentRuns/python_output_1000 create mode 100644 finalExperimentRuns/python_output_3000 create mode 100644 finalExperimentRuns/script.sh create mode 100644 finalExperimentRuns/threading/.MatrixMultiplier.java.swp create mode 100644 finalExperimentRuns/threading/MatrixMultiplier$ThreadMultiply.class create mode 100644 finalExperimentRuns/threading/MatrixMultiplier.class create mode 100644 finalExperimentRuns/threading/MatrixMultiplier.java create mode 100644 finalExperimentRuns/threading/MatrixMultiplierNew$ThreadMultiply.class create mode 100644 finalExperimentRuns/threading/MatrixMultiplierNew.class create mode 100644 finalExperimentRuns/threading/MatrixMultiplierNew.java create mode 100755 finalExperimentRuns/threading/matrixMultiply create mode 100644 finalExperimentRuns/threading/matrixMultiply.c create mode 100755 finalExperimentRuns/threading/matrixMultiply_clang create mode 100755 finalExperimentRuns/threading/matrixMultiply_new create mode 100644 finalExperimentRuns/threading/matrixMultiply_new.c delete mode 100644 sankalp/clang_output_10000 create mode 100644 sankalp/clang_output_optimized_10 delete mode 100644 sankalp/gcc_output_10000 create mode 100644 sankalp/gcc_output_optimized_10 delete mode 100644 sankalp/java_output_10000 create mode 100755 sankalp/matrixMultiply_clang_optimized create mode 100755 sankalp/matrixMultiply_gcc_optimized create mode 100644 sankalp/matrixMultiply_mod.c delete mode 100644 sankalp/python_output_10000 create mode 100755 sankalp/threading/matrixMultiply_clang diff --git a/MatrixMultiply.py b/MatrixMultiply.py index d567a9d..7e2979c 100644 --- a/MatrixMultiply.py +++ b/MatrixMultiply.py @@ -5,7 +5,9 @@ matrixDim = int(sys.argv[1]) randomMaxValue = 100 -t1 = [0 for i in range(matrixDim)] +#t1 = [0 for i in range(matrixDim)] + +t1 = [] ## INITIALISING MATRICES A B C @@ -22,15 +24,13 @@ ## DEFINING THREAD def MyThread1(arg): - + + print "Thread " + str(arg) for j in range(0,matrixDim): for k in range (0,matrixDim): matrixC[arg][j] += matrixA[arg][k] * matrixB[k][j] - - - - pass +# print "Thread " + str(arg) + " " + str(j) def printMat(): for i in range (0, matrixDim): @@ -40,8 +40,13 @@ def printMat(): for i in range (0,matrixDim): - t1[i] = threading.Thread(target=MyThread1, args=(i, )) - t1[i].start() - + t = threading.Thread(target=MyThread1, args=(i, )) + t1.append(t) + t.start() + for i in range (0,matrixDim): t1[i].join() + +#for temp in t: +# temp.join() + diff --git a/finalExperimentRuns/MatrixMultiplier.class b/finalExperimentRuns/MatrixMultiplier.class new file mode 100644 index 0000000000000000000000000000000000000000..1dc5df4a1cc369f460fc9fd0e429dfc68ee1003c GIT binary patch literal 1877 zcma)6-%}e^6#i~DVUuO~*#boprLCnYNJ3Ms%8%F*OPe-nC{(nAGrEuk7L!dTY#cf| zzR39GlMh;7^}%OxCOG2s%@_5>XZ=@-e)ldUW6LPBv*+GD_uO;7^L_X3uLnOp29Uzr z1_qGSF&IHFCZxG6O-jcV18qo3^Kt~Q;Hr*S4H!s<@tPc8mu6C$DFf4(ktVI<4FlJ3 z-C&AYX)@BhspE!#UbeiNvwdAaTVBpKzh|4Xj6i42a*LI6-r8QWN_AU6Ft8(2ako6n z^^{K|?4m&1wBtHnS|AwDURvUisT3LCm2+JCZoRx>*X~;@C3?EooKh*TN-wD7tRI&< zIu<=^^@F@sRe|hRpto9cTrcZZ>z>-NYHu+?xnA;|YUyFi)uZAT>@BYNsR^KLIj%r| zd^xvieP|_1mb;!@WXJCMlq_c~R_e7?d(M%d`utsaKeJ=k5^|4;VO%hA27@M^lV%8m ztgq75J*SlP8!$14n>ucp$l|uZz|-Ys>rSa?*GS&5i95(ilQ(e}1s(Gy?qR{iA}%oV z(QOY;-X>L?Nd+jAkJE4a;g)BYNpz*o^*)~v zr;?nP^pX?XDo;^Dt6H^PYB?T1hO%c|hi!3Vlm-7|IqX$@-UUv_pABS!Q>vYR0}==+ zRf+dFI8;zq>m`cZ)1re6*z1z)aMh}9*@}>36J&9gS7CssH;Ay*n6t2yS&dYh;~7K| zgTV8g2k-)~o{&n=o}=d$eF2Wcqk9lTL%$#p_yO9{BzQClea{$y^R)d4(YCW<2cJ%U zcQI=ZS1Ijb)-SmlWYo=lv_05^p3`Quv^Epnh4%OxT+z}oe|DZjG!+}`E;bM@>>}9u z*wMsyfB(4?p#4o252)g!{541jVYX(lQIpN}v$bJ9<7{e@^K10YVT2C|FnEAY9T$a& zTnrIiyovD%5z2f2wKh$3(?dR@OcUk!E+YFd2*178Y@mbdL#b$@fll?=Kvx6Z3f~`$ zY@laH5bOSlG6hePsnvCw6a!=A;3a}ikn{=4n&QuK0<*YE5fi+LlX!=o6{PVQ$IrR) z1$~cjLov~b@DsF=hRf~pB^A7chjM+(Lm}mwS5%~%EzCB_NHrxpw~G+bznf5e#5e?F zq-Ep%f>P`+#mMi9i=SH^BzR!JUrPYDS?Lbz< branch-misses + + 0.001226038 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.263159 task-clock # 0.297 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.483 M/sec + 791,625 cycles # 3.008 GHz + 482,299 stalled-cycles-frontend # 60.93% frontend cycles idle + 319,678 stalled-cycles-backend # 40.38% backend cycles idle + 550,734 instructions # 0.70 insns per cycle + # 0.88 stalled cycles per insn + 106,158 branches # 403.399 M/sec + branch-misses + + 0.000886637 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.263879 task-clock # 0.315 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.481 M/sec + 801,437 cycles # 3.037 GHz + 489,881 stalled-cycles-frontend # 61.13% frontend cycles idle + 298,681 stalled-cycles-backend # 37.27% backend cycles idle + 552,821 instructions # 0.69 insns per cycle + # 0.89 stalled cycles per insn + 106,287 branches # 402.787 M/sec + branch-misses + + 0.000838731 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.261170 task-clock # 0.325 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.486 M/sec + 794,662 cycles # 3.043 GHz + 483,324 stalled-cycles-frontend # 60.82% frontend cycles idle + 324,726 stalled-cycles-backend # 40.86% backend cycles idle + 552,409 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 106,457 branches # 407.616 M/sec + branch-misses + + 0.000802414 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.259817 task-clock # 0.203 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.489 M/sec + 789,490 cycles # 3.039 GHz + 480,273 stalled-cycles-frontend # 60.83% frontend cycles idle + 338,648 stalled-cycles-backend # 42.89% backend cycles idle + 549,001 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 105,856 branches # 407.425 M/sec + branch-misses + + 0.001277214 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.259312 task-clock # 0.237 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.490 M/sec + 788,093 cycles # 3.039 GHz + 480,367 stalled-cycles-frontend # 60.95% frontend cycles idle + 337,791 stalled-cycles-backend # 42.86% backend cycles idle + 542,295 instructions # 0.69 insns per cycle + # 0.89 stalled cycles per insn + 104,332 branches # 402.342 M/sec + branch-misses + + 0.001092917 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.291974 task-clock # 0.199 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.432 M/sec + 202,297 cycles # 0.693 GHz + 553,682 stalled-cycles-frontend # 273.70% frontend cycles idle + 387,858 stalled-cycles-backend # 191.73% backend cycles idle + 548,059 instructions # 2.71 insns per cycle + # 1.01 stalled cycles per insn + 105,755 branches # 362.207 M/sec + 7,631 branch-misses # 7.22% of all branches [73.27%] + + 0.001464449 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.260737 task-clock # 0.142 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.487 M/sec + 791,866 cycles # 3.037 GHz + 481,917 stalled-cycles-frontend # 60.86% frontend cycles idle + 338,794 stalled-cycles-backend # 42.78% backend cycles idle + 554,114 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 106,770 branches # 409.493 M/sec + branch-misses + + 0.001834688 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.265581 task-clock # 0.269 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.478 M/sec + 798,282 cycles # 3.006 GHz + 486,961 stalled-cycles-frontend # 61.00% frontend cycles idle + 343,026 stalled-cycles-backend # 42.97% backend cycles idle + 555,199 instructions # 0.70 insns per cycle + # 0.88 stalled cycles per insn + 106,951 branches # 402.706 M/sec + branch-misses + + 0.000988402 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 10': + + 0.260504 task-clock # 0.180 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.484 M/sec + 792,825 cycles # 3.043 GHz + 482,255 stalled-cycles-frontend # 60.83% frontend cycles idle + 333,878 stalled-cycles-backend # 42.11% backend cycles idle + 551,967 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 106,390 branches # 408.401 M/sec + branch-misses + + 0.001444313 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_100 b/finalExperimentRuns/clang_output_100 new file mode 100644 index 0000000..62ab0c3 --- /dev/null +++ b/finalExperimentRuns/clang_output_100 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.053268 task-clock # 0.907 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.022 M/sec + 21,542,512 cycles # 3.054 GHz [43.51%] + 10,448,377 stalled-cycles-frontend # 48.50% frontend cycles idle + 1,620,562 stalled-cycles-backend # 7.52% backend cycles idle + 26,010,263 instructions # 1.21 insns per cycle + # 0.40 stalled cycles per insn + 2,497,209 branches # 354.050 M/sec + 11,897 branch-misses # 0.48% of all branches [71.92%] + + 0.007776978 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.156865 task-clock # 0.912 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.022 M/sec + 21,858,485 cycles # 3.054 GHz [45.75%] + 6,691,620 stalled-cycles-frontend # 30.61% frontend cycles idle + 2,072,908 stalled-cycles-backend # 9.48% backend cycles idle + 26,016,488 instructions # 1.19 insns per cycle + # 0.26 stalled cycles per insn + 2,497,845 branches # 349.014 M/sec + 17,479 branch-misses # 0.70% of all branches + + 0.007849703 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.165353 task-clock # 0.909 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.022 M/sec + 21,780,583 cycles # 3.040 GHz [44.38%] + 7,179,660 stalled-cycles-frontend # 32.96% frontend cycles idle + 2,012,094 stalled-cycles-backend # 9.24% backend cycles idle + 26,010,882 instructions # 1.19 insns per cycle + # 0.28 stalled cycles per insn + 2,497,319 branches # 348.527 M/sec + 15,296 branch-misses # 0.61% of all branches [98.02%] + + 0.007883982 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.098440 task-clock # 0.923 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.022 M/sec + 21,662,885 cycles # 3.052 GHz [43.88%] + 8,869,299 stalled-cycles-frontend # 40.94% frontend cycles idle + 1,888,070 stalled-cycles-backend # 8.72% backend cycles idle + 26,015,267 instructions # 1.20 insns per cycle + # 0.34 stalled cycles per insn + 2,498,064 branches # 351.917 M/sec + 11,733 branch-misses # 0.47% of all branches [84.57%] + + 0.007692507 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.074668 task-clock # 0.881 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.022 M/sec + 9,777,089 cycles # 1.382 GHz + 12,454,494 stalled-cycles-frontend # 127.38% frontend cycles idle + 406,671 stalled-cycles-backend # 4.16% backend cycles idle + 26,021,599 instructions # 2.66 insns per cycle + # 0.48 stalled cycles per insn + 2,498,735 branches # 353.195 M/sec + 12,178 branch-misses # 0.49% of all branches [54.81%] + + 0.008028569 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.085217 task-clock # 0.921 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.022 M/sec + 21,555,105 cycles # 3.042 GHz [43.77%] + 7,800,102 stalled-cycles-frontend # 36.19% frontend cycles idle + 1,788,484 stalled-cycles-backend # 8.30% backend cycles idle + 26,025,558 instructions # 1.21 insns per cycle + # 0.30 stalled cycles per insn + 2,499,437 branches # 352.768 M/sec + 11,719 branch-misses # 0.47% of all branches [92.55%] + + 0.007694468 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.112728 task-clock # 0.634 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.022 M/sec + 21,725,477 cycles # 3.054 GHz [45.19%] + 6,733,958 stalled-cycles-frontend # 31.00% frontend cycles idle + 1,849,361 stalled-cycles-backend # 8.51% backend cycles idle + 26,024,358 instructions # 1.20 insns per cycle + # 0.26 stalled cycles per insn + 2,499,211 branches # 351.372 M/sec + 17,591 branch-misses # 0.70% of all branches + + 0.011223178 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.068877 task-clock # 0.921 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.022 M/sec + 21,592,249 cycles # 3.055 GHz [43.63%] + 7,807,904 stalled-cycles-frontend # 36.16% frontend cycles idle + 1,825,484 stalled-cycles-backend # 8.45% backend cycles idle + 26,012,472 instructions # 1.20 insns per cycle + # 0.30 stalled cycles per insn + 2,497,566 branches # 353.319 M/sec + 11,719 branch-misses # 0.47% of all branches [92.66%] + + 0.007675305 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.096350 task-clock # 0.916 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.022 M/sec + 21,606,442 cycles # 3.045 GHz [43.82%] + 9,785,352 stalled-cycles-frontend # 45.29% frontend cycles idle + 1,812,444 stalled-cycles-backend # 8.39% backend cycles idle + 26,027,894 instructions # 1.20 insns per cycle + # 0.38 stalled cycles per insn + 2,499,871 branches # 352.276 M/sec + 11,876 branch-misses # 0.48% of all branches [77.30%] + + 0.007747817 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 100': + + 7.154863 task-clock # 0.920 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.022 M/sec + 21,831,902 cycles # 3.051 GHz [44.34%] + 10,234,895 stalled-cycles-frontend # 46.88% frontend cycles idle + 2,001,267 stalled-cycles-backend # 9.17% backend cycles idle + 26,012,404 instructions # 1.19 insns per cycle + # 0.39 stalled cycles per insn + 2,497,750 branches # 349.098 M/sec + 11,843 branch-misses # 0.47% of all branches [74.43%] + + 0.007774080 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_1000 b/finalExperimentRuns/clang_output_1000 new file mode 100644 index 0000000..9a89831 --- /dev/null +++ b/finalExperimentRuns/clang_output_1000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8772.711871 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,862,536,545 cycles # 3.062 GHz [83.32%] + 18,725,249,733 stalled-cycles-frontend # 69.71% frontend cycles idle [83.31%] + 6,721,535,337 stalled-cycles-backend # 25.02% backend cycles idle [66.69%] + 24,147,572,347 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,094,766 branches # 232.436 M/sec [83.35%] + 1,418,553 branch-misses # 0.07% of all branches [83.35%] + + 8.795813556 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8729.146601 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,728,257,650 cycles # 3.062 GHz [83.32%] + 18,598,831,843 stalled-cycles-frontend # 69.58% frontend cycles idle [83.32%] + 6,692,039,477 stalled-cycles-backend # 25.04% backend cycles idle [66.68%] + 24,143,696,220 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.36%] + 2,039,089,497 branches # 233.596 M/sec [83.36%] + 1,422,028 branch-misses # 0.07% of all branches [83.33%] + + 8.751936365 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8743.005082 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,760,005,251 cycles # 3.061 GHz [83.34%] + 18,636,540,129 stalled-cycles-frontend # 69.64% frontend cycles idle [83.34%] + 6,696,730,595 stalled-cycles-backend # 25.03% backend cycles idle [66.69%] + 24,146,489,634 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.34%] + 2,039,117,188 branches # 233.228 M/sec [83.34%] + 1,512,869 branch-misses # 0.07% of all branches [83.32%] + + 8.765745532 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8842.501415 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 27,075,333,912 cycles # 3.062 GHz [83.30%] + 18,932,760,043 stalled-cycles-frontend # 69.93% frontend cycles idle [83.34%] + 6,827,630,830 stalled-cycles-backend # 25.22% backend cycles idle [66.70%] + 24,145,756,817 instructions # 0.89 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,239,015 branches # 230.618 M/sec [83.35%] + 1,496,833 branch-misses # 0.07% of all branches [83.33%] + + 8.865507756 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8796.936234 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,935,212,998 cycles # 3.062 GHz [83.31%] + 18,792,486,212 stalled-cycles-frontend # 69.77% frontend cycles idle [83.31%] + 6,800,634,030 stalled-cycles-backend # 25.25% backend cycles idle [66.71%] + 24,146,395,655 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,272,337 branches # 231.816 M/sec [83.35%] + 1,994,410 branch-misses # 0.10% of all branches [83.32%] + + 8.820084000 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8777.014189 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,875,307,479 cycles # 3.062 GHz [83.32%] + 18,740,496,292 stalled-cycles-frontend # 69.73% frontend cycles idle [83.32%] + 6,705,290,080 stalled-cycles-backend # 24.95% backend cycles idle [66.68%] + 24,144,531,987 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.36%] + 2,039,002,045 branches # 232.312 M/sec [83.36%] + 1,448,566 branch-misses # 0.07% of all branches [83.34%] + + 8.799930149 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8796.815931 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,935,093,613 cycles # 3.062 GHz [83.32%] + 18,796,887,746 stalled-cycles-frontend # 69.79% frontend cycles idle [83.31%] + 6,818,360,264 stalled-cycles-backend # 25.31% backend cycles idle [66.69%] + 24,148,095,266 instructions # 0.90 insns per cycle + # 0.78 stalled cycles per insn [83.35%] + 2,039,005,393 branches # 231.789 M/sec [83.35%] + 1,638,652 branch-misses # 0.08% of all branches [83.35%] + + 8.819932807 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8732.240674 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,737,479,415 cycles # 3.062 GHz [83.32%] + 18,601,807,786 stalled-cycles-frontend # 69.57% frontend cycles idle [83.32%] + 6,561,397,504 stalled-cycles-backend # 24.54% backend cycles idle [66.64%] + 24,149,772,261 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.32%] + 2,038,395,170 branches # 233.433 M/sec [83.36%] + 1,485,301 branch-misses # 0.07% of all branches [83.36%] + + 8.757509097 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8706.559421 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,659,676,782 cycles # 3.062 GHz [83.32%] + 18,523,302,399 stalled-cycles-frontend # 69.48% frontend cycles idle [83.32%] + 6,570,207,292 stalled-cycles-backend # 24.64% backend cycles idle [66.67%] + 24,136,767,039 instructions # 0.91 insns per cycle + # 0.77 stalled cycles per insn [83.36%] + 2,038,880,459 branches # 234.178 M/sec [83.36%] + 1,511,548 branch-misses # 0.07% of all branches [83.36%] + + 8.729259859 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 1000': + + 8744.544589 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,775,031,633 cycles # 3.062 GHz [83.30%] + 18,640,605,103 stalled-cycles-frontend # 69.62% frontend cycles idle [83.34%] + 6,628,187,063 stalled-cycles-backend # 24.76% backend cycles idle [66.69%] + 24,147,316,203 instructions # 0.90 insns per cycle + # 0.77 stalled cycles per insn [83.35%] + 2,038,977,599 branches # 233.171 M/sec [83.35%] + 1,410,532 branch-misses # 0.07% of all branches [83.34%] + + 8.767426048 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_3000 b/finalExperimentRuns/clang_output_3000 new file mode 100644 index 0000000..67b7ded --- /dev/null +++ b/finalExperimentRuns/clang_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 3000': + + 435870.895044 task-clock # 0.997 CPUs utilized + 547 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,334,464,156,843 cycles # 3.062 GHz [83.33%] + 1,116,588,716,003 stalled-cycles-frontend # 83.67% frontend cycles idle [83.33%] + 760,549,402,793 stalled-cycles-backend # 56.99% backend cycles idle [66.67%] + 649,625,214,346 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,405,175,566 branches # 124.819 M/sec [83.33%] + 31,641,759 branch-misses # 0.06% of all branches [83.33%] + + 436.970014074 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436941.138626 task-clock # 0.997 CPUs utilized + 547 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,337,726,968,521 cycles # 3.062 GHz [83.33%] + 1,119,881,200,210 stalled-cycles-frontend # 83.72% frontend cycles idle [83.33%] + 763,263,721,765 stalled-cycles-backend # 57.06% backend cycles idle [66.67%] + 649,639,608,656 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,408,743,887 branches # 124.522 M/sec [83.33%] + 30,480,854 branch-misses # 0.06% of all branches [83.33%] + + 438.038257320 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436215.746174 task-clock # 0.997 CPUs utilized + 545 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,335,345,423,489 cycles # 3.061 GHz [83.33%] + 1,117,485,526,106 stalled-cycles-frontend # 83.69% frontend cycles idle [83.33%] + 759,502,326,023 stalled-cycles-backend # 56.88% backend cycles idle [66.67%] + 649,657,788,647 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,408,979,455 branches # 124.730 M/sec [83.33%] + 29,850,475 branch-misses # 0.05% of all branches [83.33%] + + 437.311297435 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 3000': + + 434660.839337 task-clock # 0.997 CPUs utilized + 544 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,330,746,441,063 cycles # 3.062 GHz [83.33%] + 1,112,865,667,103 stalled-cycles-frontend # 83.63% frontend cycles idle [83.33%] + 755,733,809,906 stalled-cycles-backend # 56.79% backend cycles idle [66.67%] + 649,629,467,424 instructions # 0.49 insns per cycle + # 1.71 stalled cycles per insn [83.33%] + 54,405,944,056 branches # 125.169 M/sec [83.33%] + 30,324,200 branch-misses # 0.06% of all branches [83.33%] + + 435.752964281 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 3000': + + 438781.815155 task-clock # 0.997 CPUs utilized + 550 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,343,359,727,224 cycles # 3.062 GHz [83.33%] + 1,125,419,926,576 stalled-cycles-frontend # 83.78% frontend cycles idle [83.33%] + 768,084,785,121 stalled-cycles-backend # 57.18% backend cycles idle [66.67%] + 649,665,121,934 instructions # 0.48 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,408,662,474 branches # 123.999 M/sec [83.33%] + 30,594,105 branch-misses # 0.06% of all branches [83.33%] + + 439.883691061 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436113.735318 task-clock # 0.997 CPUs utilized + 546 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,335,204,076,506 cycles # 3.062 GHz [83.33%] + 1,117,295,887,936 stalled-cycles-frontend # 83.68% frontend cycles idle [83.33%] + 749,322,042,821 stalled-cycles-backend # 56.12% backend cycles idle [66.67%] + 649,625,709,220 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,406,397,138 branches # 124.753 M/sec [83.33%] + 30,194,121 branch-misses # 0.06% of all branches [83.33%] + + 437.209951172 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 3000': + + 436287.286674 task-clock # 0.997 CPUs utilized + 546 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,335,745,938,506 cycles # 3.062 GHz [83.33%] + 1,117,869,103,390 stalled-cycles-frontend # 83.69% frontend cycles idle [83.33%] + 758,032,143,399 stalled-cycles-backend # 56.75% backend cycles idle [66.67%] + 649,644,491,128 instructions # 0.49 insns per cycle + # 1.72 stalled cycles per insn [83.33%] + 54,406,028,719 branches # 124.702 M/sec [83.33%] + 30,072,867 branch-misses # 0.06% of all branches [83.33%] + + 437.394865809 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 3000': + + 437543.330568 task-clock # 0.997 CPUs utilized + 546 context-switches # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,339,450,532,302 cycles # 3.061 GHz [83.33%] + 1,121,680,166,977 stalled-cycles-frontend # 83.74% frontend cycles idle [83.33%] + 764,834,662,020 stalled-cycles-backend # 57.10% backend cycles idle [66.67%] + 649,641,184,728 instructions # 0.49 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,409,529,224 branches # 124.352 M/sec [83.33%] + 30,174,500 branch-misses # 0.06% of all branches [83.33%] + + 438.656887155 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 3000': + + 437737.932628 task-clock # 0.997 CPUs utilized + 549 context-switches # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,340,168,475,305 cycles # 3.062 GHz [83.33%] + 1,122,266,697,544 stalled-cycles-frontend # 83.74% frontend cycles idle [83.33%] + 762,038,651,178 stalled-cycles-backend # 56.86% backend cycles idle [66.67%] + 649,657,223,429 instructions # 0.48 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,407,338,177 branches # 124.292 M/sec [83.33%] + 29,532,180 branch-misses # 0.05% of all branches [83.33%] + + 438.836735033 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 3000': + + 438463.682513 task-clock # 0.997 CPUs utilized + 548 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,342,374,344,170 cycles # 3.062 GHz [83.33%] + 1,124,481,215,389 stalled-cycles-frontend # 83.77% frontend cycles idle [83.33%] + 765,398,751,304 stalled-cycles-backend # 57.02% backend cycles idle [66.67%] + 649,726,904,426 instructions # 0.48 insns per cycle + # 1.73 stalled cycles per insn [83.33%] + 54,402,887,069 branches # 124.076 M/sec [83.33%] + 30,000,209 branch-misses # 0.06% of all branches [83.33%] + + 439.566853455 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_optimized_10 b/finalExperimentRuns/clang_output_optimized_10 new file mode 100644 index 0000000..62f3d83 --- /dev/null +++ b/finalExperimentRuns/clang_output_optimized_10 @@ -0,0 +1,180 @@ +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.254738 task-clock # 0.186 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.499 M/sec + 773,561 cycles # 3.037 GHz + 467,851 stalled-cycles-frontend # 60.48% frontend cycles idle + 310,294 stalled-cycles-backend # 40.11% backend cycles idle + 535,991 instructions # 0.69 insns per cycle + # 0.87 stalled cycles per insn + 104,877 branches # 411.705 M/sec + branch-misses + + 0.001369651 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.253462 task-clock # 0.312 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.501 M/sec + 770,150 cycles # 3.039 GHz + 467,124 stalled-cycles-frontend # 60.65% frontend cycles idle + 321,201 stalled-cycles-backend # 41.71% backend cycles idle + 537,198 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 105,085 branches # 414.599 M/sec + branch-misses + + 0.000812752 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.252371 task-clock # 0.313 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.503 M/sec + 767,605 cycles # 3.042 GHz + 462,629 stalled-cycles-frontend # 60.27% frontend cycles idle + 328,909 stalled-cycles-backend # 42.85% backend cycles idle + 536,671 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 104,982 branches # 415.983 M/sec + branch-misses + + 0.000806311 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.255736 task-clock # 0.336 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.493 M/sec + 762,557 cycles # 2.982 GHz + 460,565 stalled-cycles-frontend # 60.40% frontend cycles idle + 323,600 stalled-cycles-backend # 42.44% backend cycles idle + 538,377 instructions # 0.71 insns per cycle + # 0.86 stalled cycles per insn + 105,324 branches # 411.847 M/sec + branch-misses + + 0.000760748 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.256619 task-clock # 0.325 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.495 M/sec + 772,169 cycles # 3.009 GHz + 465,669 stalled-cycles-frontend # 60.31% frontend cycles idle + 306,523 stalled-cycles-backend # 39.70% backend cycles idle + 541,471 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,836 branches # 412.425 M/sec + branch-misses + + 0.000790370 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.252237 task-clock # 0.135 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.503 M/sec + 766,577 cycles # 3.039 GHz + 463,314 stalled-cycles-frontend # 60.44% frontend cycles idle + 326,037 stalled-cycles-backend # 42.53% backend cycles idle + 538,054 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,236 branches # 417.211 M/sec + branch-misses + + 0.001870156 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.260936 task-clock # 0.320 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.487 M/sec + 779,990 cycles # 2.989 GHz + 473,885 stalled-cycles-frontend # 60.76% frontend cycles idle + 324,297 stalled-cycles-backend # 41.58% backend cycles idle + 539,619 instructions # 0.69 insns per cycle + # 0.88 stalled cycles per insn + 105,485 branches # 404.256 M/sec + branch-misses + + 0.000815701 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.246294 task-clock # 0.338 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.516 M/sec + cycles + 443,508 stalled-cycles-frontend # 0.00% frontend cycles idle + 317,155 stalled-cycles-backend # 0.00% backend cycles idle + 542,075 instructions # 0.00 insns per cycle + # 0.82 stalled cycles per insn + 105,925 branches # 430.075 M/sec + 6,517 branch-misses # 6.15% of all branches + + 0.000728607 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.242933 task-clock # 0.293 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.523 M/sec + 727,267 cycles # 2.994 GHz + 425,098 stalled-cycles-frontend # 58.45% frontend cycles idle + 304,182 stalled-cycles-backend # 41.83% backend cycles idle + 537,280 instructions # 0.74 insns per cycle + # 0.79 stalled cycles per insn + 105,121 branches # 432.716 M/sec + branch-misses + + 0.000830440 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.256732 task-clock # 0.216 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.491 M/sec + 768,563 cycles # 2.994 GHz + 464,524 stalled-cycles-frontend # 60.44% frontend cycles idle + 330,887 stalled-cycles-backend # 43.05% backend cycles idle + 536,485 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 104,979 branches # 408.905 M/sec + branch-misses + + 0.001186233 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_optimized_100 b/finalExperimentRuns/clang_output_optimized_100 new file mode 100644 index 0000000..0924dc0 --- /dev/null +++ b/finalExperimentRuns/clang_output_optimized_100 @@ -0,0 +1,180 @@ +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.962034 task-clock # 0.665 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.081 M/sec + 6,010,763 cycles # 3.064 GHz + 884,158 stalled-cycles-frontend # 14.71% frontend cycles idle + 737,567 stalled-cycles-backend # 12.27% backend cycles idle + 11,047,971 instructions # 1.84 insns per cycle + # 0.08 stalled cycles per insn + 1,468,085 branches # 748.246 M/sec + branch-misses + + 0.002949295 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.948140 task-clock # 0.439 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,966,906 cycles # 3.063 GHz + 855,303 stalled-cycles-frontend # 14.33% frontend cycles idle + 694,676 stalled-cycles-backend # 11.64% backend cycles idle + 11,045,804 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,692 branches # 753.381 M/sec + branch-misses + + 0.004435255 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.947260 task-clock # 0.765 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,964,814 cycles # 3.063 GHz + 855,649 stalled-cycles-frontend # 14.34% frontend cycles idle + 710,245 stalled-cycles-backend # 11.91% backend cycles idle + 11,043,997 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,392 branches # 753.568 M/sec + branch-misses + + 0.002546083 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.947560 task-clock # 0.765 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,952,625 cycles # 3.056 GHz + 850,406 stalled-cycles-frontend # 14.29% frontend cycles idle + 375,296 stalled-cycles-backend # 6.30% backend cycles idle + 11,022,704 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,463,754 branches # 751.584 M/sec + branch-misses + + 0.002546145 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.943698 task-clock # 0.674 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,952,763 cycles # 3.063 GHz + 846,909 stalled-cycles-frontend # 14.23% frontend cycles idle + 708,785 stalled-cycles-backend # 11.91% backend cycles idle + 11,039,332 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,466,568 branches # 754.525 M/sec + branch-misses + + 0.002885840 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.949368 task-clock # 0.765 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,970,129 cycles # 3.063 GHz + 859,909 stalled-cycles-frontend # 14.40% frontend cycles idle + 722,803 stalled-cycles-backend # 12.11% backend cycles idle + 11,045,169 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,572 branches # 752.845 M/sec + branch-misses + + 0.002548488 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 2.021036 task-clock # 0.771 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.078 M/sec + 3,528,170 cycles # 1.746 GHz + 1,009,925 stalled-cycles-frontend # 28.62% frontend cycles idle + 726,356 stalled-cycles-backend # 20.59% backend cycles idle + 11,046,780 instructions # 3.13 insns per cycle + # 0.09 stalled cycles per insn + 1,467,943 branches # 726.332 M/sec + 14,164 branch-misses # 0.96% of all branches [42.61%] + + 0.002620696 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.959283 task-clock # 0.779 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,463,297 cycles # 2.788 GHz + 862,862 stalled-cycles-frontend # 15.79% frontend cycles idle + 699,735 stalled-cycles-backend # 12.81% backend cycles idle + 11,048,711 instructions # 2.02 insns per cycle + # 0.08 stalled cycles per insn + 1,468,247 branches # 749.380 M/sec + 17,826 branch-misses # 1.21% of all branches [ 8.79%] + + 0.002515733 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.948017 task-clock # 0.780 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.081 M/sec + 5,966,888 cycles # 3.063 GHz + 856,064 stalled-cycles-frontend # 14.35% frontend cycles idle + 711,299 stalled-cycles-backend # 11.92% backend cycles idle + 11,046,813 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,467,618 branches # 753.391 M/sec + branch-misses + + 0.002498457 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_clang_optimized 100': + + 1.949114 task-clock # 0.785 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.082 M/sec + 5,952,365 cycles # 3.054 GHz + 848,125 stalled-cycles-frontend # 14.25% frontend cycles idle + 694,927 stalled-cycles-backend # 11.67% backend cycles idle + 11,033,183 instructions # 1.85 insns per cycle + # 0.08 stalled cycles per insn + 1,465,119 branches # 751.685 M/sec + branch-misses + + 0.002481376 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_optimized_1000 b/finalExperimentRuns/clang_output_optimized_1000 new file mode 100644 index 0000000..8ca645e --- /dev/null +++ b/finalExperimentRuns/clang_output_optimized_1000 @@ -0,0 +1,180 @@ +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8514.301983 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,069,051,123 cycles # 3.062 GHz [83.32%] + 20,139,826,256 stalled-cycles-frontend # 77.26% frontend cycles idle [83.32%] + 10,074,406,315 stalled-cycles-backend # 38.65% backend cycles idle [66.68%] + 9,145,854,517 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.36%] + 1,035,460,914 branches # 121.614 M/sec [83.36%] + 1,085,246 branch-misses # 0.10% of all branches [83.34%] + + 8.536668414 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8533.423369 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,129,292,006 cycles # 3.062 GHz [83.31%] + 20,207,838,356 stalled-cycles-frontend # 77.34% frontend cycles idle [83.31%] + 9,007,753,681 stalled-cycles-backend # 34.47% backend cycles idle [66.71%] + 9,149,245,795 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.35%] + 1,035,427,362 branches # 121.338 M/sec [83.35%] + 1,083,353 branch-misses # 0.10% of all branches [83.33%] + + 8.555680250 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8524.533087 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,102,555,736 cycles # 3.062 GHz [83.34%] + 20,174,883,322 stalled-cycles-frontend # 77.29% frontend cycles idle [83.34%] + 9,795,587,822 stalled-cycles-backend # 37.53% backend cycles idle [66.67%] + 9,149,253,149 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.34%] + 1,035,420,531 branches # 121.464 M/sec [83.34%] + 1,081,429 branch-misses # 0.10% of all branches [83.35%] + + 8.546955580 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8558.061972 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,204,898,727 cycles # 3.062 GHz [83.31%] + 20,288,761,306 stalled-cycles-frontend # 77.42% frontend cycles idle [83.31%] + 9,856,648,639 stalled-cycles-backend # 37.61% backend cycles idle [66.71%] + 9,149,320,923 instructions # 0.35 insns per cycle + # 2.22 stalled cycles per insn [83.36%] + 1,035,453,678 branches # 120.992 M/sec [83.36%] + 1,081,282 branch-misses # 0.10% of all branches [83.32%] + + 8.580455767 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8513.464377 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,067,845,209 cycles # 3.062 GHz [83.32%] + 20,133,798,950 stalled-cycles-frontend # 77.24% frontend cycles idle [83.32%] + 8,624,644,078 stalled-cycles-backend # 33.09% backend cycles idle [66.67%] + 9,145,773,113 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.36%] + 1,035,458,509 branches # 121.626 M/sec [83.36%] + 1,089,716 branch-misses # 0.11% of all branches [83.35%] + + 8.535682415 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8519.104099 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,085,519,997 cycles # 3.062 GHz [83.33%] + 20,156,984,198 stalled-cycles-frontend # 77.27% frontend cycles idle [83.33%] + 8,787,917,469 stalled-cycles-backend # 33.69% backend cycles idle [66.65%] + 9,149,566,196 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.33%] + 1,034,627,980 branches # 121.448 M/sec [83.37%] + 1,113,417 branch-misses # 0.11% of all branches [83.36%] + + 8.541426918 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8525.969981 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,106,906,116 cycles # 3.062 GHz [83.30%] + 20,176,019,515 stalled-cycles-frontend # 77.28% frontend cycles idle [83.34%] + 8,065,406,321 stalled-cycles-backend # 30.89% backend cycles idle [66.68%] + 9,149,290,275 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.34%] + 1,035,439,656 branches # 121.445 M/sec [83.34%] + 1,090,091 branch-misses # 0.11% of all branches [83.34%] + + 8.548269885 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8530.756566 task-clock # 0.997 CPUs utilized + 10 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,120,379,015 cycles # 3.062 GHz [83.30%] + 20,196,068,508 stalled-cycles-frontend # 77.32% frontend cycles idle [83.30%] + 9,181,947,822 stalled-cycles-backend # 35.15% backend cycles idle [66.70%] + 9,150,553,323 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.35%] + 1,035,656,501 branches # 121.403 M/sec [83.35%] + 1,099,565 branch-misses # 0.11% of all branches [83.35%] + + 8.553018234 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8537.180438 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,141,449,324 cycles # 3.062 GHz [83.31%] + 20,217,377,597 stalled-cycles-frontend # 77.34% frontend cycles idle [83.32%] + 7,883,092,404 stalled-cycles-backend # 30.16% backend cycles idle [66.67%] + 9,145,842,530 instructions # 0.35 insns per cycle + # 2.21 stalled cycles per insn [83.36%] + 1,035,464,658 branches # 121.289 M/sec [83.36%] + 1,094,606 branch-misses # 0.11% of all branches [83.35%] + + 8.561051194 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_clang_optimized 1000': + + 8521.967213 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,092,302,546 cycles # 3.062 GHz [83.33%] + 20,165,608,254 stalled-cycles-frontend # 77.29% frontend cycles idle [83.33%] + 9,103,949,656 stalled-cycles-backend # 34.89% backend cycles idle [66.66%] + 9,149,688,050 instructions # 0.35 insns per cycle + # 2.20 stalled cycles per insn [83.33%] + 1,035,529,349 branches # 121.513 M/sec [83.33%] + 1,095,002 branch-misses # 0.11% of all branches [83.36%] + + 8.544265295 seconds time elapsed + diff --git a/finalExperimentRuns/clang_output_optimized_3000 b/finalExperimentRuns/clang_output_optimized_3000 new file mode 100644 index 0000000..58371ab --- /dev/null +++ b/finalExperimentRuns/clang_output_optimized_3000 @@ -0,0 +1,180 @@ +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 312664.887494 task-clock # 0.997 CPUs utilized + 392 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 957,194,643,582 cycles # 3.061 GHz [83.33%] + 801,278,508,780 stalled-cycles-frontend # 83.71% frontend cycles idle [83.33%] + 654,614,518,739 stalled-cycles-backend # 68.39% backend cycles idle [66.67%] + 244,566,461,305 instructions # 0.26 insns per cycle + # 3.28 stalled cycles per insn [83.33%] + 27,360,317,759 branches # 87.507 M/sec [83.33%] + 13,880,850 branch-misses # 0.05% of all branches [83.33%] + + 313.450793586 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 312283.288554 task-clock # 0.997 CPUs utilized + 391 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 955,893,620,144 cycles # 3.061 GHz [83.33%] + 799,959,307,996 stalled-cycles-frontend # 83.69% frontend cycles idle [83.33%] + 624,558,986,255 stalled-cycles-backend # 65.34% backend cycles idle [66.67%] + 244,567,518,923 instructions # 0.26 insns per cycle + # 3.27 stalled cycles per insn [83.33%] + 27,361,026,722 branches # 87.616 M/sec [83.33%] + 12,927,656 branch-misses # 0.05% of all branches [83.33%] + + 313.069529799 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 314069.326289 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 961,431,758,518 cycles # 3.061 GHz [83.33%] + 805,494,232,345 stalled-cycles-frontend # 83.78% frontend cycles idle [83.33%] + 630,365,211,190 stalled-cycles-backend # 65.57% backend cycles idle [66.67%] + 244,567,418,849 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,359,270,785 branches # 87.112 M/sec [83.33%] + 12,925,094 branch-misses # 0.05% of all branches [83.33%] + + 314.901173672 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313605.668691 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 960,099,341,079 cycles # 3.061 GHz [83.33%] + 804,209,745,312 stalled-cycles-frontend # 83.76% frontend cycles idle [83.33%] + 650,945,842,810 stalled-cycles-backend # 67.80% backend cycles idle [66.67%] + 244,552,833,312 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,360,236,458 branches # 87.244 M/sec [83.33%] + 13,471,738 branch-misses # 0.05% of all branches [83.33%] + + 314.393884834 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313966.377674 task-clock # 0.997 CPUs utilized + 394 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 961,182,730,314 cycles # 3.061 GHz [83.33%] + 805,474,890,245 stalled-cycles-frontend # 83.80% frontend cycles idle [83.33%] + 655,175,905,580 stalled-cycles-backend # 68.16% backend cycles idle [66.67%] + 244,546,839,813 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,360,307,420 branches # 87.144 M/sec [83.33%] + 13,625,821 branch-misses # 0.05% of all branches [83.33%] + + 314.755038625 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 315025.036094 task-clock # 0.997 CPUs utilized + 395 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 964,449,384,871 cycles # 3.062 GHz [83.33%] + 808,592,472,928 stalled-cycles-frontend # 83.84% frontend cycles idle [83.33%] + 646,222,264,512 stalled-cycles-backend # 67.00% backend cycles idle [66.67%] + 244,552,197,147 instructions # 0.25 insns per cycle + # 3.31 stalled cycles per insn [83.33%] + 27,358,770,723 branches # 86.846 M/sec [83.33%] + 13,799,312 branch-misses # 0.05% of all branches [83.33%] + + 315.816146040 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313884.082830 task-clock # 0.997 CPUs utilized + 394 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 960,938,455,254 cycles # 3.061 GHz [83.33%] + 804,967,633,007 stalled-cycles-frontend # 83.77% frontend cycles idle [83.33%] + 658,597,647,955 stalled-cycles-backend # 68.54% backend cycles idle [66.67%] + 244,565,187,191 instructions # 0.25 insns per cycle + # 3.29 stalled cycles per insn [83.33%] + 27,361,335,010 branches # 87.170 M/sec [83.33%] + 13,868,957 branch-misses # 0.05% of all branches [83.33%] + + 314.672105390 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 313070.788902 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 958,299,705,663 cycles # 3.061 GHz [83.33%] + 802,791,733,825 stalled-cycles-frontend # 83.77% frontend cycles idle [83.33%] + 620,995,884,839 stalled-cycles-backend # 64.80% backend cycles idle [66.67%] + 244,575,491,330 instructions # 0.26 insns per cycle + # 3.28 stalled cycles per insn [83.33%] + 27,361,827,022 branches # 87.398 M/sec [83.33%] + 13,026,877 branch-misses # 0.05% of all branches [83.33%] + + 313.856410059 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 315731.190936 task-clock # 0.997 CPUs utilized + 396 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 966,582,281,999 cycles # 3.061 GHz [83.33%] + 810,643,864,844 stalled-cycles-frontend # 83.87% frontend cycles idle [83.33%] + 653,645,811,041 stalled-cycles-backend # 67.62% backend cycles idle [66.67%] + 244,568,729,928 instructions # 0.25 insns per cycle + # 3.31 stalled cycles per insn [83.33%] + 27,361,596,499 branches # 86.661 M/sec [83.33%] + 13,710,796 branch-misses # 0.05% of all branches [83.33%] + + 316.523716704 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_clang_optimized 3000': + + 312952.702244 task-clock # 0.997 CPUs utilized + 393 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 957,972,776,248 cycles # 3.061 GHz [83.33%] + 802,443,920,049 stalled-cycles-frontend # 83.76% frontend cycles idle [83.33%] + 640,914,452,512 stalled-cycles-backend # 66.90% backend cycles idle [66.67%] + 244,578,176,924 instructions # 0.26 insns per cycle + # 3.28 stalled cycles per insn [83.33%] + 27,363,549,903 branches # 87.437 M/sec [83.33%] + 13,598,396 branch-misses # 0.05% of all branches [83.33%] + + 313.738715536 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_10 b/finalExperimentRuns/gcc_output_10 new file mode 100644 index 0000000..d533c09 --- /dev/null +++ b/finalExperimentRuns/gcc_output_10 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 10': + + 0.264216 task-clock # 0.234 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.481 M/sec + 801,618 cycles # 3.034 GHz + 485,598 stalled-cycles-frontend # 60.58% frontend cycles idle + 331,763 stalled-cycles-backend # 41.39% backend cycles idle + 579,543 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 105,217 branches # 398.223 M/sec + branch-misses + + 0.001130275 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 10': + + 0.260784 task-clock # 0.312 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.487 M/sec + 793,277 cycles # 3.042 GHz + 476,100 stalled-cycles-frontend # 60.02% frontend cycles idle + 334,152 stalled-cycles-backend # 42.12% backend cycles idle + 582,916 instructions # 0.73 insns per cycle + # 0.82 stalled cycles per insn + 105,800 branches # 405.700 M/sec + branch-misses + + 0.000836036 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 10': + + 0.260142 task-clock # 0.341 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.488 M/sec + cycles + 469,818 stalled-cycles-frontend # 0.00% frontend cycles idle + 330,664 stalled-cycles-backend # 0.00% backend cycles idle + 581,476 instructions # 0.00 insns per cycle + # 0.81 stalled cycles per insn + 105,525 branches # 405.644 M/sec + 6,383 branch-misses # 6.05% of all branches + + 0.000763764 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 10': + + 0.265972 task-clock # 0.264 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.477 M/sec + 783,856 cycles # 2.947 GHz + 469,562 stalled-cycles-frontend # 59.90% frontend cycles idle + 316,315 stalled-cycles-backend # 40.35% backend cycles idle + 579,399 instructions # 0.74 insns per cycle + # 0.81 stalled cycles per insn + 105,152 branches # 395.350 M/sec + branch-misses + + 0.001005965 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 10': + + 0.262319 task-clock # 0.287 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.480 M/sec + 798,897 cycles # 3.046 GHz + 481,149 stalled-cycles-frontend # 60.23% frontend cycles idle + 294,473 stalled-cycles-backend # 36.86% backend cycles idle + 584,326 instructions # 0.73 insns per cycle + # 0.82 stalled cycles per insn + 105,770 branches # 403.211 M/sec + branch-misses + + 0.000915591 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 10': + + 0.261447 task-clock # 0.150 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.486 M/sec + 795,646 cycles # 3.043 GHz + 481,327 stalled-cycles-frontend # 60.50% frontend cycles idle + 341,767 stalled-cycles-backend # 42.95% backend cycles idle + 574,374 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 103,651 branches # 396.451 M/sec + branch-misses + + 0.001741528 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 10': + + 0.264455 task-clock # 0.300 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.480 M/sec + 790,618 cycles # 2.990 GHz + 478,470 stalled-cycles-frontend # 60.52% frontend cycles idle + 330,579 stalled-cycles-backend # 41.81% backend cycles idle + 568,364 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 102,901 branches # 389.106 M/sec + branch-misses + + 0.000881953 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 10': + + 0.259611 task-clock # 0.320 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.485 M/sec + 789,701 cycles # 3.042 GHz + 474,512 stalled-cycles-frontend # 60.09% frontend cycles idle + 332,633 stalled-cycles-backend # 42.12% backend cycles idle + 576,821 instructions # 0.73 insns per cycle + # 0.82 stalled cycles per insn + 104,740 branches # 403.450 M/sec + branch-misses + + 0.000811846 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 10': + + 0.261265 task-clock # 0.147 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.482 M/sec + 793,438 cycles # 3.037 GHz + 479,473 stalled-cycles-frontend # 60.43% frontend cycles idle + 320,606 stalled-cycles-backend # 40.41% backend cycles idle + 572,808 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 104,034 branches # 398.193 M/sec + branch-misses + + 0.001780051 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 10': + + 0.261124 task-clock # 0.302 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.486 M/sec + 794,602 cycles # 3.043 GHz + 476,906 stalled-cycles-frontend # 60.02% frontend cycles idle + 329,122 stalled-cycles-backend # 41.42% backend cycles idle + 583,923 instructions # 0.73 insns per cycle + # 0.82 stalled cycles per insn + 105,965 branches # 405.803 M/sec + branch-misses + + 0.000863590 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_100 b/finalExperimentRuns/gcc_output_100 new file mode 100644 index 0000000..cecefd4 --- /dev/null +++ b/finalExperimentRuns/gcc_output_100 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 100': + + 8.054504 task-clock # 0.903 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,610,696 cycles # 3.056 GHz [50.57%] + 7,909,722 stalled-cycles-frontend # 32.14% frontend cycles idle + 689,986 stalled-cycles-backend # 2.80% backend cycles idle + 52,144,755 instructions # 2.12 insns per cycle + # 0.15 stalled cycles per insn + 1,478,711 branches # 183.588 M/sec + 11,727 branch-misses # 0.79% of all branches [76.43%] + + 0.008919947 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 100': + + 8.117808 task-clock # 0.932 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,718,750 cycles # 3.045 GHz [50.92%] + 8,195,388 stalled-cycles-frontend # 33.15% frontend cycles idle + 897,551 stalled-cycles-backend # 3.63% backend cycles idle + 52,145,300 instructions # 2.11 insns per cycle + # 0.16 stalled cycles per insn + 1,478,850 branches # 182.174 M/sec + 11,724 branch-misses # 0.79% of all branches [74.58%] + + 0.008711930 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 100': + + 8.111482 task-clock # 0.927 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.019 M/sec + 24,714,858 cycles # 3.047 GHz [50.88%] + 8,209,540 stalled-cycles-frontend # 33.22% frontend cycles idle + 698,504 stalled-cycles-backend # 2.83% backend cycles idle + 52,145,272 instructions # 2.11 insns per cycle + # 0.16 stalled cycles per insn + 1,478,847 branches # 182.315 M/sec + 11,726 branch-misses # 0.79% of all branches [74.46%] + + 0.008749660 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 100': + + 8.148961 task-clock # 0.917 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.019 M/sec + 24,818,324 cycles # 3.046 GHz [51.10%] + 6,387,176 stalled-cycles-frontend # 25.74% frontend cycles idle + 574,390 stalled-cycles-backend # 2.31% backend cycles idle + 52,168,459 instructions # 2.10 insns per cycle + # 0.12 stalled cycles per insn + 1,483,171 branches # 182.007 M/sec + 11,840 branch-misses # 0.80% of all branches [90.60%] + + 0.008883245 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 100': + + 8.087013 task-clock # 0.908 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,632,136 cycles # 3.046 GHz [50.73%] + 6,193,928 stalled-cycles-frontend # 25.15% frontend cycles idle + 772,134 stalled-cycles-backend # 3.13% backend cycles idle + 52,143,390 instructions # 2.12 insns per cycle + # 0.12 stalled cycles per insn + 1,478,507 branches # 182.825 M/sec + 11,557 branch-misses # 0.78% of all branches [91.88%] + + 0.008906666 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 100': + + 8.084764 task-clock # 0.930 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,635,382 cycles # 3.047 GHz [50.73%] + 10,318,247 stalled-cycles-frontend # 41.88% frontend cycles idle + 985,300 stalled-cycles-backend # 4.00% backend cycles idle + 52,144,339 instructions # 2.12 insns per cycle + # 0.20 stalled cycles per insn + 1,478,689 branches # 182.898 M/sec + 12,290 branch-misses # 0.83% of all branches [54.83%] + + 0.008697934 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 100': + + 8.080921 task-clock # 0.933 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,599,853 cycles # 3.044 GHz [50.70%] + 6,254,276 stalled-cycles-frontend # 25.42% frontend cycles idle + 871,510 stalled-cycles-backend # 3.54% backend cycles idle + 52,146,066 instructions # 2.12 insns per cycle + # 0.12 stalled cycles per insn + 1,479,020 branches # 183.026 M/sec + 11,596 branch-misses # 0.78% of all branches [91.42%] + + 0.008656610 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 100': + + 8.104023 task-clock # 0.910 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,721,453 cycles # 3.051 GHz [50.81%] + 7,609,755 stalled-cycles-frontend # 30.78% frontend cycles idle + 797,005 stalled-cycles-backend # 3.22% backend cycles idle + 52,152,265 instructions # 2.11 insns per cycle + # 0.15 stalled cycles per insn + 1,480,154 branches # 182.644 M/sec + 11,875 branch-misses # 0.80% of all branches [79.49%] + + 0.008901112 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 100': + + 8.105288 task-clock # 0.924 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,710,843 cycles # 3.049 GHz [50.85%] + 8,609,115 stalled-cycles-frontend # 34.84% frontend cycles idle + 511,967 stalled-cycles-backend # 2.07% backend cycles idle + 52,146,432 instructions # 2.11 insns per cycle + # 0.17 stalled cycles per insn + 1,479,068 branches # 182.482 M/sec + 11,732 branch-misses # 0.79% of all branches [70.47%] + + 0.008771563 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 100': + + 8.104444 task-clock # 0.935 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.020 M/sec + 24,657,762 cycles # 3.042 GHz [50.84%] + 8,398,717 stalled-cycles-frontend # 34.06% frontend cycles idle + 1,004,334 stalled-cycles-backend # 4.07% backend cycles idle + 52,144,374 instructions # 2.11 insns per cycle + # 0.16 stalled cycles per insn + 1,478,685 branches # 182.454 M/sec + 11,712 branch-misses # 0.79% of all branches [72.47%] + + 0.008664229 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_1000 b/finalExperimentRuns/gcc_output_1000 new file mode 100644 index 0000000..143e8fe --- /dev/null +++ b/finalExperimentRuns/gcc_output_1000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 1000': + + 9926.708359 task-clock # 0.997 CPUs utilized + 13 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,395,895,247 cycles # 3.062 GHz [83.32%] + 17,442,111,645 stalled-cycles-frontend # 57.38% frontend cycles idle [83.32%] + 4,164,384,143 stalled-cycles-backend # 13.70% backend cycles idle [66.68%] + 50,155,717,267 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.36%] + 1,037,542,959 branches # 104.520 M/sec [83.36%] + 1,062,313 branch-misses # 0.10% of all branches [83.32%] + + 9.952598326 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 1000': + + 9989.945693 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,589,481,178 cycles # 3.062 GHz [83.31%] + 17,621,887,593 stalled-cycles-frontend # 57.61% frontend cycles idle [83.34%] + 4,027,488,464 stalled-cycles-backend # 13.17% backend cycles idle [66.69%] + 50,159,899,384 instructions # 1.64 insns per cycle + # 0.35 stalled cycles per insn [83.35%] + 1,037,610,140 branches # 103.865 M/sec [83.34%] + 1,072,230 branch-misses # 0.10% of all branches [83.34%] + + 10.015847661 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 1000': + + 9872.782392 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,230,798,240 cycles # 3.062 GHz [83.31%] + 17,272,580,035 stalled-cycles-frontend # 57.14% frontend cycles idle [83.34%] + 3,944,001,447 stalled-cycles-backend # 13.05% backend cycles idle [66.70%] + 50,157,447,316 instructions # 1.66 insns per cycle + # 0.34 stalled cycles per insn [83.35%] + 1,037,562,856 branches # 105.093 M/sec [83.35%] + 1,070,768 branch-misses # 0.10% of all branches [83.33%] + + 9.898330956 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 1000': + + 9960.652528 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 2 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 30,442,315,955 cycles # 3.056 GHz [83.34%] + 17,495,255,191 stalled-cycles-frontend # 57.47% frontend cycles idle [83.34%] + 4,435,073,572 stalled-cycles-backend # 14.57% backend cycles idle [66.67%] + 50,158,527,538 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.34%] + 1,037,684,531 branches # 104.178 M/sec [83.34%] + 1,090,517 branch-misses # 0.11% of all branches [83.35%] + + 9.986475787 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 1000': + + 9983.888308 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,571,145,817 cycles # 3.062 GHz [83.33%] + 17,613,563,281 stalled-cycles-frontend # 57.61% frontend cycles idle [83.34%] + 4,138,212,697 stalled-cycles-backend # 13.54% backend cycles idle [66.67%] + 50,155,387,715 instructions # 1.64 insns per cycle + # 0.35 stalled cycles per insn [83.33%] + 1,037,567,984 branches # 103.924 M/sec [83.33%] + 1,068,596 branch-misses # 0.10% of all branches [83.35%] + + 10.010151775 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 1000': + + 9853.437478 task-clock # 0.997 CPUs utilized + 13 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 30,170,703,152 cycles # 3.062 GHz [83.32%] + 17,222,155,727 stalled-cycles-frontend # 57.08% frontend cycles idle [83.32%] + 4,055,670,788 stalled-cycles-backend # 13.44% backend cycles idle [66.67%] + 50,155,779,844 instructions # 1.66 insns per cycle + # 0.34 stalled cycles per insn [83.36%] + 1,037,560,137 branches # 105.299 M/sec [83.36%] + 1,074,365 branch-misses # 0.10% of all branches [83.35%] + + 9.879197104 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 1000': + + 9885.285809 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 30,268,249,154 cycles # 3.062 GHz [83.34%] + 17,314,471,270 stalled-cycles-frontend # 57.20% frontend cycles idle [83.33%] + 4,082,457,570 stalled-cycles-backend # 13.49% backend cycles idle [66.66%] + 50,154,666,290 instructions # 1.66 insns per cycle + # 0.35 stalled cycles per insn [83.33%] + 1,037,650,375 branches # 104.969 M/sec [83.33%] + 1,085,196 branch-misses # 0.10% of all branches [83.37%] + + 9.910950714 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 1000': + + 9914.407092 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,356,897,007 cycles # 3.062 GHz [83.34%] + 17,403,547,284 stalled-cycles-frontend # 57.33% frontend cycles idle [83.34%] + 4,191,887,997 stalled-cycles-backend # 13.81% backend cycles idle [66.68%] + 50,156,122,104 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.34%] + 1,037,539,929 branches # 104.650 M/sec [83.34%] + 1,065,113 branch-misses # 0.10% of all branches [83.31%] + + 9.940317228 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 1000': + + 9937.674711 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,427,817,353 cycles # 3.062 GHz [83.34%] + 17,471,897,841 stalled-cycles-frontend # 57.42% frontend cycles idle [83.34%] + 4,027,974,555 stalled-cycles-backend # 13.24% backend cycles idle [66.68%] + 50,158,261,034 instructions # 1.65 insns per cycle + # 0.35 stalled cycles per insn [83.34%] + 1,037,803,159 branches # 104.431 M/sec [83.34%] + 1,088,832 branch-misses # 0.10% of all branches [83.32%] + + 9.963562648 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 1000': + + 9878.683493 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 30,249,098,352 cycles # 3.062 GHz [83.32%] + 17,298,067,630 stalled-cycles-frontend # 57.19% frontend cycles idle [83.32%] + 3,974,575,999 stalled-cycles-backend # 13.14% backend cycles idle [66.67%] + 50,150,796,611 instructions # 1.66 insns per cycle + # 0.34 stalled cycles per insn [83.36%] + 1,037,562,373 branches # 105.030 M/sec [83.36%] + 1,067,234 branch-misses # 0.10% of all branches [83.34%] + + 9.904228039 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_3000 b/finalExperimentRuns/gcc_output_3000 new file mode 100644 index 0000000..1da4004 --- /dev/null +++ b/finalExperimentRuns/gcc_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 3000': + + 475300.257913 task-clock # 0.997 CPUs utilized + 594 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,455,206,821,524 cycles # 3.062 GHz [83.33%] + 1,096,016,878,004 stalled-cycles-frontend # 75.32% frontend cycles idle [83.33%] + 590,754,550,647 stalled-cycles-backend # 40.60% backend cycles idle [66.67%] + 1,351,742,482,872 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,393,869,687 branches # 57.635 M/sec [83.33%] + 14,090,789 branch-misses # 0.05% of all branches [83.33%] + + 476.494079626 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 3000': + + 476018.020595 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,457,356,444,320 cycles # 3.062 GHz [83.33%] + 1,097,887,781,677 stalled-cycles-frontend # 75.33% frontend cycles idle [83.33%] + 593,165,290,075 stalled-cycles-backend # 40.70% backend cycles idle [66.67%] + 1,351,747,334,373 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,936,581 branches # 57.554 M/sec [83.33%] + 14,020,326 branch-misses # 0.05% of all branches [83.33%] + + 477.213941232 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 3000': + + 474569.437761 task-clock # 0.997 CPUs utilized + 595 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,452,880,580,364 cycles # 3.061 GHz [83.33%] + 1,093,658,008,544 stalled-cycles-frontend # 75.28% frontend cycles idle [83.33%] + 598,953,855,484 stalled-cycles-backend # 41.23% backend cycles idle [66.67%] + 1,351,708,174,318 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,397,137,447 branches # 57.731 M/sec [83.33%] + 13,353,583 branch-misses # 0.05% of all branches [83.33%] + + 475.763890065 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 3000': + + 475646.500239 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 1 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,456,163,649,462 cycles # 3.061 GHz [83.33%] + 1,096,827,868,403 stalled-cycles-frontend # 75.32% frontend cycles idle [83.33%] + 604,183,182,642 stalled-cycles-backend # 41.49% backend cycles idle [66.67%] + 1,351,761,637,391 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,786,793 branches # 57.599 M/sec [83.33%] + 13,320,251 branch-misses # 0.05% of all branches [83.33%] + + 476.841596270 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 3000': + + 476211.404942 task-clock # 0.997 CPUs utilized + 597 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,457,959,876,543 cycles # 3.062 GHz [83.33%] + 1,098,411,393,007 stalled-cycles-frontend # 75.34% frontend cycles idle [83.33%] + 607,061,107,646 stalled-cycles-backend # 41.64% backend cycles idle [66.67%] + 1,351,758,909,796 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,397,007,312 branches # 57.531 M/sec [83.33%] + 13,916,373 branch-misses # 0.05% of all branches [83.33%] + + 477.407551808 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 3000': + + 475948.824921 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,457,196,407,185 cycles # 3.062 GHz [83.33%] + 1,097,491,418,801 stalled-cycles-frontend # 75.32% frontend cycles idle [83.33%] + 619,424,280,588 stalled-cycles-backend # 42.51% backend cycles idle [66.67%] + 1,351,752,463,467 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,395,156,718 branches # 57.559 M/sec [83.33%] + 13,646,100 branch-misses # 0.05% of all branches [83.33%] + + 477.144006180 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 3000': + + 476555.496544 task-clock # 0.997 CPUs utilized + 597 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,459,055,808,779 cycles # 3.062 GHz [83.33%] + 1,099,359,336,770 stalled-cycles-frontend # 75.35% frontend cycles idle [83.33%] + 605,859,886,112 stalled-cycles-backend # 41.52% backend cycles idle [66.67%] + 1,351,748,188,845 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,976,815 branches # 57.490 M/sec [83.33%] + 13,608,298 branch-misses # 0.05% of all branches [83.33%] + + 477.751263190 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 3000': + + 476550.619236 task-clock # 0.997 CPUs utilized + 596 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 1,458,990,788,545 cycles # 3.062 GHz [83.33%] + 1,099,354,204,996 stalled-cycles-frontend # 75.35% frontend cycles idle [83.33%] + 605,327,241,764 stalled-cycles-backend # 41.49% backend cycles idle [66.67%] + 1,351,757,320,368 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,396,713,068 branches # 57.490 M/sec [83.33%] + 13,874,648 branch-misses # 0.05% of all branches [83.33%] + + 477.765602818 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 3000': + + 477530.594343 task-clock # 0.997 CPUs utilized + 597 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,461,959,826,317 cycles # 3.061 GHz [83.33%] + 1,102,192,822,811 stalled-cycles-frontend # 75.39% frontend cycles idle [83.33%] + 602,765,299,108 stalled-cycles-backend # 41.23% backend cycles idle [66.67%] + 1,351,757,093,932 instructions # 0.92 insns per cycle + # 0.82 stalled cycles per insn [83.33%] + 27,398,383,869 branches # 57.375 M/sec [83.33%] + 13,438,518 branch-misses # 0.05% of all branches [83.33%] + + 478.728380489 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 3000': + + 477246.288455 task-clock # 0.997 CPUs utilized + 598 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 1,461,142,413,968 cycles # 3.062 GHz [83.33%] + 1,101,548,208,648 stalled-cycles-frontend # 75.39% frontend cycles idle [83.33%] + 610,983,270,807 stalled-cycles-backend # 41.82% backend cycles idle [66.67%] + 1,351,767,194,355 instructions # 0.93 insns per cycle + # 0.81 stalled cycles per insn [83.33%] + 27,397,222,382 branches # 57.407 M/sec [83.33%] + 14,071,841 branch-misses # 0.05% of all branches [83.33%] + + 478.444205849 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_optimized_10 b/finalExperimentRuns/gcc_output_optimized_10 new file mode 100644 index 0000000..ac95581 --- /dev/null +++ b/finalExperimentRuns/gcc_output_optimized_10 @@ -0,0 +1,180 @@ +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.248266 task-clock # 0.177 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.512 M/sec + cycles + 456,214 stalled-cycles-frontend # 0.00% frontend cycles idle + 322,343 stalled-cycles-backend # 0.00% backend cycles idle + 525,274 instructions # 0.00 insns per cycle + # 0.87 stalled cycles per insn + 102,761 branches # 413.915 M/sec + 6,305 branch-misses # 6.14% of all branches + + 0.001399414 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.250526 task-clock # 0.158 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.503 M/sec + 761,374 cycles # 3.039 GHz + 460,669 stalled-cycles-frontend # 60.50% frontend cycles idle + 278,379 stalled-cycles-backend # 36.56% backend cycles idle + 531,203 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 104,155 branches # 415.745 M/sec + branch-misses + + 0.001584906 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.256776 task-clock # 0.261 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.495 M/sec + 769,126 cycles # 2.995 GHz + 464,343 stalled-cycles-frontend # 60.37% frontend cycles idle + 305,155 stalled-cycles-backend # 39.68% backend cycles idle + 537,950 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,335 branches # 410.221 M/sec + branch-misses + + 0.000984387 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.252672 task-clock # 0.303 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.503 M/sec + 758,151 cycles # 3.001 GHz + 456,805 stalled-cycles-frontend # 60.25% frontend cycles idle + 312,114 stalled-cycles-backend # 41.17% backend cycles idle + 535,170 instructions # 0.71 insns per cycle + # 0.85 stalled cycles per insn + 104,829 branches # 414.882 M/sec + branch-misses + + 0.000834122 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.256107 task-clock # 0.319 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.496 M/sec + 777,635 cycles # 3.036 GHz + 471,077 stalled-cycles-frontend # 60.58% frontend cycles idle + 311,009 stalled-cycles-backend # 39.99% backend cycles idle + 537,745 instructions # 0.69 insns per cycle + # 0.88 stalled cycles per insn + 105,304 branches # 411.172 M/sec + branch-misses + + 0.000803563 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.253460 task-clock # 0.266 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.501 M/sec + 770,539 cycles # 3.040 GHz + 464,693 stalled-cycles-frontend # 60.31% frontend cycles idle + 320,075 stalled-cycles-backend # 41.54% backend cycles idle + 535,462 instructions # 0.69 insns per cycle + # 0.87 stalled cycles per insn + 104,877 branches # 413.781 M/sec + branch-misses + + 0.000953846 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.257419 task-clock # 0.307 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.493 M/sec + 771,110 cycles # 2.996 GHz + 466,926 stalled-cycles-frontend # 60.55% frontend cycles idle + 338,319 stalled-cycles-backend # 43.87% backend cycles idle + 536,400 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 105,084 branches # 408.222 M/sec + branch-misses + + 0.000837879 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.251920 task-clock # 0.292 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.504 M/sec + 765,830 cycles # 3.040 GHz + 460,303 stalled-cycles-frontend # 60.11% frontend cycles idle + 311,031 stalled-cycles-backend # 40.61% backend cycles idle + 536,633 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,101 branches # 417.200 M/sec + branch-misses + + 0.000862143 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.251167 task-clock # 0.329 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.506 M/sec + 765,608 cycles # 3.048 GHz + 463,671 stalled-cycles-frontend # 60.56% frontend cycles idle + 321,814 stalled-cycles-backend # 42.03% backend cycles idle + 534,394 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 104,724 branches # 416.950 M/sec + branch-misses + + 0.000763382 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.257385 task-clock # 0.271 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.493 M/sec + 781,086 cycles # 3.035 GHz + 474,101 stalled-cycles-frontend # 60.70% frontend cycles idle + 323,675 stalled-cycles-backend # 41.44% backend cycles idle + 537,279 instructions # 0.69 insns per cycle + # 0.88 stalled cycles per insn + 105,124 branches # 408.431 M/sec + branch-misses + + 0.000949143 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_optimized_100 b/finalExperimentRuns/gcc_output_optimized_100 new file mode 100644 index 0000000..02b8d64 --- /dev/null +++ b/finalExperimentRuns/gcc_output_optimized_100 @@ -0,0 +1,180 @@ +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.849608 task-clock # 0.769 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.086 M/sec + 5,664,275 cycles # 3.062 GHz + 732,765 stalled-cycles-frontend # 12.94% frontend cycles idle + 415,452 stalled-cycles-backend # 7.33% backend cycles idle + 10,010,514 instructions # 1.77 insns per cycle + # 0.07 stalled cycles per insn + 1,456,645 branches # 787.543 M/sec + branch-misses + + 0.002405004 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.839908 task-clock # 0.666 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.086 M/sec + 5,636,324 cycles # 3.063 GHz + 708,018 stalled-cycles-frontend # 12.56% frontend cycles idle + 1,488,676 stalled-cycles-backend # 26.41% backend cycles idle + 9,999,645 instructions # 1.77 insns per cycle + # 0.15 stalled cycles per insn + 1,455,193 branches # 790.905 M/sec + branch-misses + + 0.002762590 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.894950 task-clock # 0.768 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.084 M/sec + 2,365,633 cycles # 1.248 GHz + 815,107 stalled-cycles-frontend # 34.46% frontend cycles idle + 1,395,279 stalled-cycles-backend # 58.98% backend cycles idle + 10,005,259 instructions # 4.23 insns per cycle + # 0.14 stalled cycles per insn + 1,456,126 branches # 768.424 M/sec + 14,501 branch-misses # 1.00% of all branches [58.57%] + + 0.002468015 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.875375 task-clock # 0.766 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.085 M/sec + 4,882,424 cycles # 2.603 GHz + 752,488 stalled-cycles-frontend # 15.41% frontend cycles idle + 1,341,572 stalled-cycles-backend # 27.48% backend cycles idle + 10,020,521 instructions # 2.05 insns per cycle + # 0.13 stalled cycles per insn + 1,458,408 branches # 777.662 M/sec + 15,896 branch-misses # 1.09% of all branches [14.62%] + + 0.002449323 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.847871 task-clock # 0.723 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.086 M/sec + 5,660,288 cycles # 3.063 GHz + 727,224 stalled-cycles-frontend # 12.85% frontend cycles idle + 1,493,416 stalled-cycles-backend # 26.38% backend cycles idle + 10,014,309 instructions # 1.77 insns per cycle + # 0.15 stalled cycles per insn + 1,457,300 branches # 788.637 M/sec + branch-misses + + 0.002555472 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.879068 task-clock # 0.768 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.084 M/sec + 3,421,298 cycles # 1.821 GHz + 761,542 stalled-cycles-frontend # 22.26% frontend cycles idle + 1,433,667 stalled-cycles-backend # 41.90% backend cycles idle + 10,018,860 instructions # 2.93 insns per cycle + # 0.14 stalled cycles per insn + 1,458,144 branches # 775.993 M/sec + 14,789 branch-misses # 1.01% of all branches [40.00%] + + 0.002447307 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.883634 task-clock # 0.739 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.084 M/sec + 321,967 cycles # 0.171 GHz + 796,732 stalled-cycles-frontend # 247.46% frontend cycles idle + 443,941 stalled-cycles-backend # 137.88% backend cycles idle + 10,018,569 instructions # 31.12 insns per cycle + # 0.08 stalled cycles per insn + 1,458,017 branches # 774.045 M/sec + 16,126 branch-misses # 1.11% of all branches [93.59%] + + 0.002549813 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.869718 task-clock # 0.709 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.085 M/sec + 1,144,239 cycles # 0.612 GHz + 746,887 stalled-cycles-frontend # 65.27% frontend cycles idle + 1,506,395 stalled-cycles-backend # 131.65% backend cycles idle + 10,012,630 instructions # 8.75 insns per cycle + # 0.15 stalled cycles per insn + 1,457,200 branches # 779.369 M/sec + 13,662 branch-misses # 0.94% of all branches [79.35%] + + 0.002638744 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.919213 task-clock # 0.588 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 159 page-faults # 0.083 M/sec + 1,076,319 cycles # 0.561 GHz + 895,237 stalled-cycles-frontend # 83.18% frontend cycles idle + 1,645,401 stalled-cycles-backend # 152.87% backend cycles idle + 10,022,421 instructions # 9.31 insns per cycle + # 0.16 stalled cycles per insn + 1,458,721 branches # 760.062 M/sec + 13,434 branch-misses # 0.92% of all branches [80.97%] + + 0.003264739 seconds time elapsed + +Iteration 100 + + Performance counter stats for './matrixMultiply_gcc_optimized 100': + + 1.883476 task-clock # 0.690 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 158 page-faults # 0.084 M/sec + 4,552,284 cycles # 2.417 GHz + 783,434 stalled-cycles-frontend # 17.21% frontend cycles idle + 1,317,945 stalled-cycles-backend # 28.95% backend cycles idle + 10,008,721 instructions # 2.20 insns per cycle + # 0.13 stalled cycles per insn + 1,456,761 branches # 773.443 M/sec + 14,949 branch-misses # 1.03% of all branches [20.70%] + + 0.002728343 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_optimized_1000 b/finalExperimentRuns/gcc_output_optimized_1000 new file mode 100644 index 0000000..4da73bd --- /dev/null +++ b/finalExperimentRuns/gcc_output_optimized_1000 @@ -0,0 +1,180 @@ +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8524.007146 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,101,094,636 cycles # 3.062 GHz [83.34%] + 21,174,291,573 stalled-cycles-frontend # 81.12% frontend cycles idle [83.34%] + 8,086,059,447 stalled-cycles-backend # 30.98% backend cycles idle [66.67%] + 8,147,023,966 instructions # 0.31 insns per cycle + # 2.60 stalled cycles per insn [83.34%] + 1,034,584,832 branches # 121.373 M/sec [83.34%] + 1,056,203 branch-misses # 0.10% of all branches [83.35%] + + 8.546169904 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8480.788072 task-clock # 0.997 CPUs utilized + 12 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 25,968,524,213 cycles # 3.062 GHz [83.30%] + 21,026,920,732 stalled-cycles-frontend # 80.97% frontend cycles idle [83.35%] + 8,372,590,975 stalled-cycles-backend # 32.24% backend cycles idle [66.69%] + 8,146,964,730 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.35%] + 1,034,591,652 branches # 121.992 M/sec [83.34%] + 1,061,216 branch-misses # 0.10% of all branches [83.32%] + + 8.502870304 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8499.518119 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,025,909,327 cycles # 3.062 GHz [83.34%] + 21,094,624,277 stalled-cycles-frontend # 81.05% frontend cycles idle [83.33%] + 7,597,054,786 stalled-cycles-backend # 29.19% backend cycles idle [66.67%] + 8,146,986,115 instructions # 0.31 insns per cycle + # 2.59 stalled cycles per insn [83.34%] + 1,034,616,479 branches # 121.726 M/sec [83.33%] + 1,055,439 branch-misses # 0.10% of all branches [83.34%] + + 8.521753033 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8567.572363 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,233,696,728 cycles # 3.062 GHz [83.33%] + 21,318,293,997 stalled-cycles-frontend # 81.26% frontend cycles idle [83.33%] + 8,013,091,628 stalled-cycles-backend # 30.55% backend cycles idle [66.66%] + 8,147,236,780 instructions # 0.31 insns per cycle + # 2.62 stalled cycles per insn [83.33%] + 1,033,816,017 branches # 120.666 M/sec [83.37%] + 1,057,271 branch-misses # 0.10% of all branches [83.35%] + + 8.589968438 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8498.048583 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,020,348,975 cycles # 3.062 GHz [83.33%] + 21,088,844,072 stalled-cycles-frontend # 81.05% frontend cycles idle [83.33%] + 7,943,621,197 stalled-cycles-backend # 30.53% backend cycles idle [66.66%] + 8,146,770,884 instructions # 0.31 insns per cycle + # 2.59 stalled cycles per insn [83.33%] + 1,034,364,119 branches # 121.718 M/sec [83.33%] + 1,057,797 branch-misses # 0.10% of all branches [83.35%] + + 8.520236784 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8523.980835 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 26,099,105,396 cycles # 3.062 GHz [83.34%] + 21,174,457,333 stalled-cycles-frontend # 81.13% frontend cycles idle [83.34%] + 7,971,768,233 stalled-cycles-backend # 30.54% backend cycles idle [66.67%] + 8,147,071,539 instructions # 0.31 insns per cycle + # 2.60 stalled cycles per insn [83.34%] + 1,034,599,564 branches # 121.375 M/sec [83.34%] + 1,067,177 branch-misses # 0.10% of all branches [83.33%] + + 8.546194472 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8539.281197 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 26,147,787,605 cycles # 3.062 GHz [83.32%] + 21,232,515,363 stalled-cycles-frontend # 81.20% frontend cycles idle [83.32%] + 7,997,377,449 stalled-cycles-backend # 30.59% backend cycles idle [66.67%] + 8,142,040,940 instructions # 0.31 insns per cycle + # 2.61 stalled cycles per insn [83.36%] + 1,034,582,094 branches # 121.156 M/sec [83.37%] + 1,067,037 branch-misses # 0.10% of all branches [83.35%] + + 8.561577755 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8483.737252 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 25,976,418,040 cycles # 3.062 GHz [83.30%] + 21,031,895,833 stalled-cycles-frontend # 80.97% frontend cycles idle [83.35%] + 7,905,370,309 stalled-cycles-backend # 30.43% backend cycles idle [66.70%] + 8,147,671,922 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.35%] + 1,034,722,307 branches # 121.965 M/sec [83.35%] + 1,058,817 branch-misses # 0.10% of all branches [83.31%] + + 8.505817558 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8487.683539 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,075 page-faults # 0.000 M/sec + 25,989,385,640 cycles # 3.062 GHz [83.31%] + 21,054,478,049 stalled-cycles-frontend # 81.01% frontend cycles idle [83.31%] + 7,474,887,009 stalled-cycles-backend # 28.76% backend cycles idle [66.71%] + 8,146,958,745 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.36%] + 1,034,611,204 branches # 121.896 M/sec [83.36%] + 1,063,850 branch-misses # 0.10% of all branches [83.34%] + + 8.509833793 seconds time elapsed + +Iteration 1000 + + Performance counter stats for './matrixMultiply_gcc_optimized 1000': + + 8485.279076 task-clock # 0.997 CPUs utilized + 11 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 3,074 page-faults # 0.000 M/sec + 25,980,743,845 cycles # 3.062 GHz [83.31%] + 21,043,200,703 stalled-cycles-frontend # 81.00% frontend cycles idle [83.31%] + 7,855,243,129 stalled-cycles-backend # 30.23% backend cycles idle [66.70%] + 8,147,134,514 instructions # 0.31 insns per cycle + # 2.58 stalled cycles per insn [83.35%] + 1,034,632,398 branches # 121.933 M/sec [83.35%] + 1,068,154 branch-misses # 0.10% of all branches [83.34%] + + 8.507968113 seconds time elapsed + diff --git a/finalExperimentRuns/gcc_output_optimized_3000 b/finalExperimentRuns/gcc_output_optimized_3000 new file mode 100644 index 0000000..bed3fc6 --- /dev/null +++ b/finalExperimentRuns/gcc_output_optimized_3000 @@ -0,0 +1,180 @@ +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 307990.722698 task-clock # 0.997 CPUs utilized + 385 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 942,885,267,154 cycles # 3.061 GHz [83.33%] + 813,151,718,128 stalled-cycles-frontend # 86.24% frontend cycles idle [83.33%] + 479,110,721,206 stalled-cycles-backend # 50.81% backend cycles idle [66.67%] + 217,537,751,166 instructions # 0.23 insns per cycle + # 3.74 stalled cycles per insn [83.33%] + 27,350,281,815 branches # 88.802 M/sec [83.33%] + 13,416,834 branch-misses # 0.05% of all branches [83.33%] + + 308.764947876 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 309095.950256 task-clock # 0.997 CPUs utilized + 388 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 946,223,423,681 cycles # 3.061 GHz [83.33%] + 816,700,149,527 stalled-cycles-frontend # 86.31% frontend cycles idle [83.33%] + 478,184,484,905 stalled-cycles-backend # 50.54% backend cycles idle [66.67%] + 217,549,241,887 instructions # 0.23 insns per cycle + # 3.75 stalled cycles per insn [83.33%] + 27,352,134,829 branches # 88.491 M/sec [83.33%] + 12,496,243 branch-misses # 0.05% of all branches [83.33%] + + 309.874694599 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 308456.151399 task-clock # 0.997 CPUs utilized + 387 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 944,147,394,731 cycles # 3.061 GHz [83.33%] + 815,004,329,682 stalled-cycles-frontend # 86.32% frontend cycles idle [83.33%] + 492,153,218,620 stalled-cycles-backend # 52.13% backend cycles idle [66.67%] + 217,542,001,519 instructions # 0.23 insns per cycle + # 3.75 stalled cycles per insn [83.33%] + 27,351,929,959 branches # 88.674 M/sec [83.33%] + 12,737,640 branch-misses # 0.05% of all branches [83.33%] + + 309.231466001 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 308648.298096 task-clock # 0.997 CPUs utilized + 387 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 944,897,614,537 cycles # 3.061 GHz [83.33%] + 815,188,834,965 stalled-cycles-frontend # 86.27% frontend cycles idle [83.33%] + 485,379,940,869 stalled-cycles-backend # 51.37% backend cycles idle [66.67%] + 217,534,979,891 instructions # 0.23 insns per cycle + # 3.75 stalled cycles per insn [83.33%] + 27,351,527,278 branches # 88.617 M/sec [83.33%] + 13,388,415 branch-misses # 0.05% of all branches [83.33%] + + 309.423862273 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 309909.768801 task-clock # 0.997 CPUs utilized + 388 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 948,763,312,383 cycles # 3.061 GHz [83.33%] + 819,052,696,950 stalled-cycles-frontend # 86.33% frontend cycles idle [83.33%] + 482,990,679,317 stalled-cycles-backend # 50.91% backend cycles idle [66.67%] + 217,539,864,459 instructions # 0.23 insns per cycle + # 3.77 stalled cycles per insn [83.33%] + 27,352,050,126 branches # 88.258 M/sec [83.33%] + 13,177,647 branch-misses # 0.05% of all branches [83.33%] + + 310.688240232 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 309327.733528 task-clock # 0.997 CPUs utilized + 388 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 947,010,787,729 cycles # 3.062 GHz [83.33%] + 817,412,412,659 stalled-cycles-frontend # 86.32% frontend cycles idle [83.33%] + 488,015,320,106 stalled-cycles-backend # 51.53% backend cycles idle [66.67%] + 217,532,974,150 instructions # 0.23 insns per cycle + # 3.76 stalled cycles per insn [83.33%] + 27,349,693,081 branches # 88.417 M/sec [83.33%] + 13,212,984 branch-misses # 0.05% of all branches [83.33%] + + 310.105193532 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 310282.492791 task-clock # 0.997 CPUs utilized + 389 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 949,907,449,960 cycles # 3.061 GHz [83.33%] + 820,459,518,182 stalled-cycles-frontend # 86.37% frontend cycles idle [83.33%] + 471,778,705,376 stalled-cycles-backend # 49.67% backend cycles idle [66.67%] + 217,524,558,295 instructions # 0.23 insns per cycle + # 3.77 stalled cycles per insn [83.33%] + 27,351,609,383 branches # 88.151 M/sec [83.33%] + 13,344,766 branch-misses # 0.05% of all branches [83.33%] + + 311.104012259 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 310349.330476 task-clock # 0.997 CPUs utilized + 389 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,356 page-faults # 0.000 M/sec + 950,012,415,697 cycles # 3.061 GHz [83.33%] + 820,923,300,577 stalled-cycles-frontend # 86.41% frontend cycles idle [83.33%] + 468,957,637,855 stalled-cycles-backend # 49.36% backend cycles idle [66.67%] + 217,545,884,095 instructions # 0.23 insns per cycle + # 3.77 stalled cycles per insn [83.33%] + 27,353,566,509 branches # 88.138 M/sec [83.33%] + 12,597,801 branch-misses # 0.05% of all branches [83.33%] + + 311.146848527 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 310848.446781 task-clock # 0.997 CPUs utilized + 389 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 951,637,386,126 cycles # 3.061 GHz [83.33%] + 822,546,224,447 stalled-cycles-frontend # 86.43% frontend cycles idle [83.33%] + 495,897,697,137 stalled-cycles-backend # 52.11% backend cycles idle [66.67%] + 217,546,544,859 instructions # 0.23 insns per cycle + # 3.78 stalled cycles per insn [83.33%] + 27,353,133,771 branches # 87.995 M/sec [83.33%] + 13,283,333 branch-misses # 0.05% of all branches [83.33%] + + 311.629074931 seconds time elapsed + +Iteration 3000 + + Performance counter stats for './matrixMultiply_gcc_optimized 3000': + + 312178.283971 task-clock # 0.997 CPUs utilized + 391 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 32,357 page-faults # 0.000 M/sec + 955,712,667,148 cycles # 3.061 GHz [83.33%] + 826,044,644,959 stalled-cycles-frontend # 86.43% frontend cycles idle [83.33%] + 499,061,986,949 stalled-cycles-backend # 52.22% backend cycles idle [66.67%] + 217,558,514,147 instructions # 0.23 insns per cycle + # 3.80 stalled cycles per insn [83.33%] + 27,352,241,903 branches # 87.617 M/sec [83.33%] + 13,193,839 branch-misses # 0.05% of all branches [83.33%] + + 312.962113204 seconds time elapsed + diff --git a/finalExperimentRuns/java_output_10 b/finalExperimentRuns/java_output_10 new file mode 100644 index 0000000..e2ed670 --- /dev/null +++ b/finalExperimentRuns/java_output_10 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 10': + + 72.815106 task-clock # 0.984 CPUs utilized + 139 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.001 M/sec + 4,253 page-faults # 0.058 M/sec + 212,160,742 cycles # 2.914 GHz [83.64%] + 114,430,847 stalled-cycles-frontend # 53.94% frontend cycles idle [83.36%] + 80,787,912 stalled-cycles-backend # 38.08% backend cycles idle [62.53%] + 182,410,561 instructions # 0.86 insns per cycle + # 0.63 stalled cycles per insn [79.34%] + 34,469,054 branches # 473.378 M/sec [86.37%] + 2,054,782 branch-misses # 5.96% of all branches [86.95%] + + 0.073987229 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 10': + + 74.167240 task-clock # 0.981 CPUs utilized + 146 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.057 M/sec + 217,762,691 cycles # 2.936 GHz [79.75%] + 119,247,170 stalled-cycles-frontend # 54.76% frontend cycles idle [82.58%] + 81,455,743 stalled-cycles-backend # 37.41% backend cycles idle [68.10%] + 183,508,037 instructions # 0.84 insns per cycle + # 0.65 stalled cycles per insn [84.40%] + 35,369,835 branches # 476.893 M/sec [85.66%] + 2,040,142 branch-misses # 5.77% of all branches [86.07%] + + 0.075620599 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 10': + + 75.588706 task-clock # 0.981 CPUs utilized + 148 context-switches # 0.002 M/sec + 47 CPU-migrations # 0.001 M/sec + 4,233 page-faults # 0.056 M/sec + 219,952,171 cycles # 2.910 GHz [83.32%] + 123,320,418 stalled-cycles-frontend # 56.07% frontend cycles idle [85.04%] + 82,988,638 stalled-cycles-backend # 37.73% backend cycles idle [68.62%] + 183,258,921 instructions # 0.83 insns per cycle + # 0.67 stalled cycles per insn [85.04%] + 34,664,677 branches # 458.596 M/sec [83.94%] + 2,046,911 branch-misses # 5.90% of all branches [81.13%] + + 0.077076913 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 10': + + 73.785766 task-clock # 0.983 CPUs utilized + 156 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.058 M/sec + 213,783,464 cycles # 2.897 GHz [83.60%] + 116,799,942 stalled-cycles-frontend # 54.63% frontend cycles idle [78.27%] + 77,769,074 stalled-cycles-backend # 36.38% backend cycles idle [68.20%] + 182,198,452 instructions # 0.85 insns per cycle + # 0.64 stalled cycles per insn [84.73%] + 35,172,437 branches # 476.683 M/sec [84.90%] + 2,002,118 branch-misses # 5.69% of all branches [87.69%] + + 0.075044359 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 10': + + 75.848184 task-clock # 0.963 CPUs utilized + 177 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.001 M/sec + 4,256 page-faults # 0.056 M/sec + 222,550,625 cycles # 2.934 GHz [75.92%] + 122,058,241 stalled-cycles-frontend # 54.85% frontend cycles idle [83.66%] + 82,982,505 stalled-cycles-backend # 37.29% backend cycles idle [68.71%] + 183,204,443 instructions # 0.82 insns per cycle + # 0.67 stalled cycles per insn [84.97%] + 35,265,600 branches # 464.950 M/sec [85.01%] + 2,010,327 branch-misses # 5.70% of all branches [88.69%] + + 0.078736540 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 10': + + 74.552674 task-clock # 0.978 CPUs utilized + 146 context-switches # 0.002 M/sec + 45 CPU-migrations # 0.001 M/sec + 4,252 page-faults # 0.057 M/sec + 220,109,964 cycles # 2.952 GHz [78.21%] + 119,486,246 stalled-cycles-frontend # 54.28% frontend cycles idle [84.59%] + 80,845,000 stalled-cycles-backend # 36.73% backend cycles idle [68.08%] + 184,366,056 instructions # 0.84 insns per cycle + # 0.65 stalled cycles per insn [84.04%] + 34,909,548 branches # 468.253 M/sec [84.14%] + 2,006,308 branch-misses # 5.75% of all branches [87.11%] + + 0.076255589 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 10': + + 74.919822 task-clock # 0.945 CPUs utilized + 136 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.001 M/sec + 4,232 page-faults # 0.056 M/sec + 215,665,200 cycles # 2.879 GHz [79.71%] + 122,784,131 stalled-cycles-frontend # 56.93% frontend cycles idle [86.01%] + 83,019,995 stalled-cycles-backend # 38.49% backend cycles idle [68.15%] + 184,014,109 instructions # 0.85 insns per cycle + # 0.67 stalled cycles per insn [84.43%] + 34,335,055 branches # 458.291 M/sec [85.30%] + 2,017,824 branch-misses # 5.88% of all branches [83.15%] + + 0.079275197 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 10': + + 72.325490 task-clock # 0.978 CPUs utilized + 136 context-switches # 0.002 M/sec + 48 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.059 M/sec + 211,331,070 cycles # 2.922 GHz [83.78%] + 115,877,185 stalled-cycles-frontend # 54.83% frontend cycles idle [77.28%] + 75,513,035 stalled-cycles-backend # 35.73% backend cycles idle [67.46%] + 182,895,864 instructions # 0.87 insns per cycle + # 0.63 stalled cycles per insn [83.79%] + 35,178,485 branches # 486.391 M/sec [85.16%] + 2,003,949 branch-misses # 5.70% of all branches [88.08%] + + 0.073979011 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 10': + + 74.615253 task-clock # 0.984 CPUs utilized + 136 context-switches # 0.002 M/sec + 41 CPU-migrations # 0.001 M/sec + 4,233 page-faults # 0.057 M/sec + 221,217,036 cycles # 2.965 GHz [78.81%] + 120,264,263 stalled-cycles-frontend # 54.36% frontend cycles idle [83.70%] + 80,040,282 stalled-cycles-backend # 36.18% backend cycles idle [68.39%] + 183,237,659 instructions # 0.83 insns per cycle + # 0.66 stalled cycles per insn [85.00%] + 35,439,125 branches # 474.958 M/sec [85.72%] + 2,039,792 branch-misses # 5.76% of all branches [85.90%] + + 0.075848324 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 10': + + 74.492689 task-clock # 0.973 CPUs utilized + 150 context-switches # 0.002 M/sec + 41 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.057 M/sec + 216,573,426 cycles # 2.907 GHz [84.20%] + 120,115,088 stalled-cycles-frontend # 55.46% frontend cycles idle [79.15%] + 81,505,498 stalled-cycles-backend # 37.63% backend cycles idle [67.75%] + 184,181,901 instructions # 0.85 insns per cycle + # 0.65 stalled cycles per insn [84.02%] + 35,341,758 branches # 474.433 M/sec [84.88%] + 2,031,210 branch-misses # 5.75% of all branches [86.54%] + + 0.076539126 seconds time elapsed + diff --git a/finalExperimentRuns/java_output_100 b/finalExperimentRuns/java_output_100 new file mode 100644 index 0000000..5ff2003 --- /dev/null +++ b/finalExperimentRuns/java_output_100 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 100': + + 103.321799 task-clock # 1.117 CPUs utilized + 175 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.000 M/sec + 4,909 page-faults # 0.048 M/sec + 301,216,233 cycles # 2.915 GHz [84.32%] + 163,477,231 stalled-cycles-frontend # 54.27% frontend cycles idle [75.05%] + 103,759,590 stalled-cycles-backend # 34.45% backend cycles idle [66.56%] + 297,736,573 instructions # 0.99 insns per cycle + # 0.55 stalled cycles per insn [88.51%] + 55,643,691 branches # 538.547 M/sec [88.33%] + 2,889,288 branch-misses # 5.19% of all branches [87.38%] + + 0.092533164 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 100': + + 103.759715 task-clock # 1.117 CPUs utilized + 160 context-switches # 0.002 M/sec + 47 CPU-migrations # 0.000 M/sec + 4,901 page-faults # 0.047 M/sec + 305,125,075 cycles # 2.941 GHz [84.89%] + 160,369,545 stalled-cycles-frontend # 52.56% frontend cycles idle [74.82%] + 101,259,462 stalled-cycles-backend # 33.19% backend cycles idle [66.10%] + 287,525,333 instructions # 0.94 insns per cycle + # 0.56 stalled cycles per insn [89.35%] + 54,463,632 branches # 524.902 M/sec [88.47%] + 3,052,971 branch-misses # 5.61% of all branches [87.52%] + + 0.092870741 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 100': + + 104.375659 task-clock # 1.059 CPUs utilized + 159 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.000 M/sec + 4,899 page-faults # 0.047 M/sec + 312,875,028 cycles # 2.998 GHz [77.06%] + 168,819,560 stalled-cycles-frontend # 53.96% frontend cycles idle [78.79%] + 101,445,345 stalled-cycles-backend # 32.42% backend cycles idle [71.36%] + 301,146,158 instructions # 0.96 insns per cycle + # 0.56 stalled cycles per insn [88.93%] + 55,088,281 branches # 527.789 M/sec [88.62%] + 2,998,976 branch-misses # 5.44% of all branches [85.92%] + + 0.098543800 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 100': + + 106.506564 task-clock # 1.098 CPUs utilized + 150 context-switches # 0.001 M/sec + 44 CPU-migrations # 0.000 M/sec + 4,908 page-faults # 0.046 M/sec + 314,107,537 cycles # 2.949 GHz [80.00%] + 168,129,079 stalled-cycles-frontend # 53.53% frontend cycles idle [83.52%] + 110,233,792 stalled-cycles-backend # 35.09% backend cycles idle [61.34%] + 267,033,663 instructions # 0.85 insns per cycle + # 0.63 stalled cycles per insn [88.69%] + 54,684,767 branches # 513.440 M/sec [89.14%] + 3,034,135 branch-misses # 5.55% of all branches [87.76%] + + 0.096957055 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 100': + + 103.919871 task-clock # 1.123 CPUs utilized + 172 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.000 M/sec + 4,916 page-faults # 0.047 M/sec + 302,840,737 cycles # 2.914 GHz [85.86%] + 156,296,630 stalled-cycles-frontend # 51.61% frontend cycles idle [83.16%] + 112,184,665 stalled-cycles-backend # 37.04% backend cycles idle [58.29%] + 266,462,000 instructions # 0.88 insns per cycle + # 0.59 stalled cycles per insn [80.55%] + 54,001,529 branches # 519.646 M/sec [87.11%] + 2,916,764 branch-misses # 5.40% of all branches [87.46%] + + 0.092571453 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 100': + + 104.129244 task-clock # 1.110 CPUs utilized + 167 context-switches # 0.002 M/sec + 40 CPU-migrations # 0.000 M/sec + 4,901 page-faults # 0.047 M/sec + 305,068,140 cycles # 2.930 GHz [84.38%] + 160,683,594 stalled-cycles-frontend # 52.67% frontend cycles idle [83.04%] + 108,136,607 stalled-cycles-backend # 35.45% backend cycles idle [58.36%] + 262,531,379 instructions # 0.86 insns per cycle + # 0.61 stalled cycles per insn [84.17%] + 52,184,320 branches # 501.150 M/sec [87.66%] + 3,073,796 branch-misses # 5.89% of all branches [88.33%] + + 0.093834708 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 100': + + 104.108239 task-clock # 1.125 CPUs utilized + 157 context-switches # 0.002 M/sec + 42 CPU-migrations # 0.000 M/sec + 4,898 page-faults # 0.047 M/sec + 307,017,870 cycles # 2.949 GHz [84.90%] + 164,306,170 stalled-cycles-frontend # 53.52% frontend cycles idle [77.93%] + 103,125,565 stalled-cycles-backend # 33.59% backend cycles idle [65.45%] + 288,379,192 instructions # 0.94 insns per cycle + # 0.57 stalled cycles per insn [85.16%] + 53,702,811 branches # 515.836 M/sec [86.05%] + 3,044,773 branch-misses # 5.67% of all branches [87.57%] + + 0.092529815 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 100': + + 104.765434 task-clock # 1.108 CPUs utilized + 169 context-switches # 0.002 M/sec + 45 CPU-migrations # 0.000 M/sec + 4,901 page-faults # 0.047 M/sec + 307,535,192 cycles # 2.935 GHz [84.82%] + 164,207,959 stalled-cycles-frontend # 53.39% frontend cycles idle [79.74%] + 106,454,679 stalled-cycles-backend # 34.62% backend cycles idle [60.71%] + 268,169,951 instructions # 0.87 insns per cycle + # 0.61 stalled cycles per insn [88.10%] + 54,860,528 branches # 523.651 M/sec [88.40%] + 2,968,193 branch-misses # 5.41% of all branches [87.39%] + + 0.094565311 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 100': + + 105.879995 task-clock # 1.108 CPUs utilized + 181 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.000 M/sec + 4,910 page-faults # 0.046 M/sec + 309,713,266 cycles # 2.925 GHz [86.13%] + 164,906,341 stalled-cycles-frontend # 53.24% frontend cycles idle [79.10%] + 111,500,921 stalled-cycles-backend # 36.00% backend cycles idle [61.51%] + 272,166,057 instructions # 0.88 insns per cycle + # 0.61 stalled cycles per insn [87.40%] + 53,079,383 branches # 501.316 M/sec [88.80%] + 3,046,810 branch-misses # 5.74% of all branches [86.44%] + + 0.095518615 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 100': + + 104.498642 task-clock # 1.120 CPUs utilized + 166 context-switches # 0.002 M/sec + 43 CPU-migrations # 0.000 M/sec + 4,912 page-faults # 0.047 M/sec + 306,585,731 cycles # 2.934 GHz [86.11%] + 157,952,036 stalled-cycles-frontend # 51.52% frontend cycles idle [76.53%] + 109,596,785 stalled-cycles-backend # 35.75% backend cycles idle [65.42%] + 284,918,343 instructions # 0.93 insns per cycle + # 0.55 stalled cycles per insn [88.44%] + 54,016,381 branches # 516.910 M/sec [88.80%] + 3,056,357 branch-misses # 5.66% of all branches [85.71%] + + 0.093262045 seconds time elapsed + diff --git a/finalExperimentRuns/java_output_1000 b/finalExperimentRuns/java_output_1000 new file mode 100644 index 0000000..0e72482 --- /dev/null +++ b/finalExperimentRuns/java_output_1000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8230.895013 task-clock # 1.000 CPUs utilized + 349 context-switches # 0.000 M/sec + 51 CPU-migrations # 0.000 M/sec + 7,924 page-faults # 0.001 M/sec + 25,179,610,041 cycles # 3.059 GHz [83.31%] + 19,733,923,171 stalled-cycles-frontend # 78.37% frontend cycles idle [83.35%] + 5,763,803,893 stalled-cycles-backend # 22.89% backend cycles idle [66.59%] + 11,489,775,504 instructions # 0.46 insns per cycle + # 1.72 stalled cycles per insn [83.39%] + 1,586,764,019 branches # 192.781 M/sec [83.37%] + 5,033,764 branch-misses # 0.32% of all branches [83.39%] + + 8.231041043 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8259.814170 task-clock # 1.000 CPUs utilized + 348 context-switches # 0.000 M/sec + 49 CPU-migrations # 0.000 M/sec + 7,921 page-faults # 0.001 M/sec + 25,267,638,160 cycles # 3.059 GHz [83.34%] + 19,841,583,037 stalled-cycles-frontend # 78.53% frontend cycles idle [83.21%] + 6,527,775,541 stalled-cycles-backend # 25.83% backend cycles idle [66.69%] + 11,513,813,855 instructions # 0.46 insns per cycle + # 1.72 stalled cycles per insn [83.38%] + 1,587,852,465 branches # 192.238 M/sec [83.37%] + 5,136,172 branch-misses # 0.32% of all branches [83.43%] + + 8.260232738 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8194.756476 task-clock # 1.000 CPUs utilized + 375 context-switches # 0.000 M/sec + 52 CPU-migrations # 0.000 M/sec + 7,917 page-faults # 0.001 M/sec + 25,071,710,073 cycles # 3.059 GHz [83.35%] + 19,634,941,038 stalled-cycles-frontend # 78.32% frontend cycles idle [83.36%] + 5,481,936,492 stalled-cycles-backend # 21.87% backend cycles idle [66.57%] + 11,497,785,971 instructions # 0.46 insns per cycle + # 1.71 stalled cycles per insn [83.26%] + 1,585,354,953 branches # 193.460 M/sec [83.36%] + 4,624,130 branch-misses # 0.29% of all branches [83.37%] + + 8.195429601 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8289.424086 task-clock # 1.000 CPUs utilized + 351 context-switches # 0.000 M/sec + 50 CPU-migrations # 0.000 M/sec + 7,924 page-faults # 0.001 M/sec + 25,357,184,443 cycles # 3.059 GHz [83.40%] + 19,924,099,338 stalled-cycles-frontend # 78.57% frontend cycles idle [83.30%] + 5,665,731,789 stalled-cycles-backend # 22.34% backend cycles idle [66.62%] + 11,497,881,177 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.36%] + 1,586,295,230 branches # 191.364 M/sec [83.35%] + 4,864,960 branch-misses # 0.31% of all branches [83.36%] + + 8.289548645 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8295.510219 task-clock # 1.000 CPUs utilized + 344 context-switches # 0.000 M/sec + 45 CPU-migrations # 0.000 M/sec + 7,914 page-faults # 0.001 M/sec + 25,375,983,015 cycles # 3.059 GHz [83.35%] + 19,927,717,481 stalled-cycles-frontend # 78.53% frontend cycles idle [83.38%] + 5,775,388,326 stalled-cycles-backend # 22.76% backend cycles idle [66.64%] + 11,510,303,341 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.34%] + 1,584,048,659 branches # 190.953 M/sec [83.33%] + 4,757,923 branch-misses # 0.30% of all branches [83.34%] + + 8.295597912 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8279.033166 task-clock # 1.000 CPUs utilized + 338 context-switches # 0.000 M/sec + 49 CPU-migrations # 0.000 M/sec + 7,921 page-faults # 0.001 M/sec + 25,325,475,010 cycles # 3.059 GHz [83.38%] + 19,889,516,972 stalled-cycles-frontend # 78.54% frontend cycles idle [83.24%] + 6,028,939,780 stalled-cycles-backend # 23.81% backend cycles idle [66.57%] + 11,486,000,036 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.42%] + 1,588,599,157 branches # 191.882 M/sec [83.43%] + 4,920,256 branch-misses # 0.31% of all branches [83.40%] + + 8.280647843 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8238.691565 task-clock # 0.979 CPUs utilized + 350 context-switches # 0.000 M/sec + 60 CPU-migrations # 0.000 M/sec + 7,908 page-faults # 0.001 M/sec + 25,200,142,210 cycles # 3.059 GHz [83.36%] + 19,774,075,612 stalled-cycles-frontend # 78.47% frontend cycles idle [83.35%] + 5,690,178,267 stalled-cycles-backend # 22.58% backend cycles idle [66.56%] + 11,493,062,103 instructions # 0.46 insns per cycle + # 1.72 stalled cycles per insn [83.30%] + 1,590,593,567 branches # 193.064 M/sec [83.37%] + 4,824,786 branch-misses # 0.30% of all branches [83.40%] + + 8.418598063 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8261.292085 task-clock # 1.000 CPUs utilized + 363 context-switches # 0.000 M/sec + 47 CPU-migrations # 0.000 M/sec + 7,924 page-faults # 0.001 M/sec + 25,267,234,464 cycles # 3.059 GHz [83.38%] + 19,828,388,563 stalled-cycles-frontend # 78.47% frontend cycles idle [83.37%] + 5,913,581,026 stalled-cycles-backend # 23.40% backend cycles idle [66.54%] + 11,491,742,369 instructions # 0.45 insns per cycle + # 1.73 stalled cycles per insn [83.26%] + 1,584,928,928 branches # 191.850 M/sec [83.35%] + 4,710,317 branch-misses # 0.30% of all branches [83.39%] + + 8.263920402 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8159.608685 task-clock # 1.000 CPUs utilized + 352 context-switches # 0.000 M/sec + 44 CPU-migrations # 0.000 M/sec + 7,922 page-faults # 0.001 M/sec + 24,966,244,868 cycles # 3.060 GHz [83.38%] + 19,528,618,282 stalled-cycles-frontend # 78.22% frontend cycles idle [83.38%] + 5,211,081,380 stalled-cycles-backend # 20.87% backend cycles idle [66.60%] + 11,505,569,740 instructions # 0.46 insns per cycle + # 1.70 stalled cycles per insn [83.31%] + 1,582,342,745 branches # 193.924 M/sec [83.29%] + 4,717,778 branch-misses # 0.30% of all branches [83.38%] + + 8.161167189 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 8325.978080 task-clock # 1.000 CPUs utilized + 336 context-switches # 0.000 M/sec + 51 CPU-migrations # 0.000 M/sec + 7,920 page-faults # 0.001 M/sec + 25,465,415,040 cycles # 3.059 GHz [83.39%] + 20,014,451,796 stalled-cycles-frontend # 78.59% frontend cycles idle [83.35%] + 5,716,481,850 stalled-cycles-backend # 22.45% backend cycles idle [66.57%] + 11,496,878,405 instructions # 0.45 insns per cycle + # 1.74 stalled cycles per insn [83.29%] + 1,583,971,382 branches # 190.244 M/sec [83.35%] + 4,654,654 branch-misses # 0.29% of all branches [83.37%] + + 8.327184267 seconds time elapsed + diff --git a/finalExperimentRuns/java_output_3000 b/finalExperimentRuns/java_output_3000 new file mode 100644 index 0000000..bcb0278 --- /dev/null +++ b/finalExperimentRuns/java_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 570246.408556 task-clock # 0.998 CPUs utilized + 13,594 context-switches # 0.000 M/sec + 67 CPU-migrations # 0.000 M/sec + 55,723 page-faults # 0.000 M/sec + 1,745,855,585,043 cycles # 3.062 GHz [83.33%] + 1,586,556,006,830 stalled-cycles-frontend # 90.88% frontend cycles idle [83.33%] + 667,253,690,712 stalled-cycles-backend # 38.22% backend cycles idle [66.66%] + 299,663,523,851 instructions # 0.17 insns per cycle + # 5.29 stalled cycles per insn [83.33%] + 40,925,007,356 branches # 71.767 M/sec [83.34%] + 21,839,815 branch-misses # 0.05% of all branches [83.34%] + + 571.200174838 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 526618.685030 task-clock # 0.998 CPUs utilized + 12,618 context-switches # 0.000 M/sec + 65 CPU-migrations # 0.000 M/sec + 54,849 page-faults # 0.000 M/sec + 1,612,309,554,009 cycles # 3.062 GHz [83.33%] + 1,453,911,024,610 stalled-cycles-frontend # 90.18% frontend cycles idle [83.33%] + 604,419,114,381 stalled-cycles-backend # 37.49% backend cycles idle [66.67%] + 299,550,354,418 instructions # 0.19 insns per cycle + # 4.85 stalled cycles per insn [83.34%] + 40,909,432,652 branches # 77.683 M/sec [83.33%] + 21,245,062 branch-misses # 0.05% of all branches [83.33%] + + 527.548551694 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 535466.680458 task-clock # 0.998 CPUs utilized + 12,846 context-switches # 0.000 M/sec + 62 CPU-migrations # 0.000 M/sec + 54,956 page-faults # 0.000 M/sec + 1,639,046,450,367 cycles # 3.061 GHz [83.34%] + 1,480,430,768,242 stalled-cycles-frontend # 90.32% frontend cycles idle [83.33%] + 601,908,499,977 stalled-cycles-backend # 36.72% backend cycles idle [66.66%] + 299,553,327,633 instructions # 0.18 insns per cycle + # 4.94 stalled cycles per insn [83.34%] + 40,910,210,705 branches # 76.401 M/sec [83.33%] + 20,911,209 branch-misses # 0.05% of all branches [83.34%] + + 536.698723828 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 552650.707551 task-clock # 0.997 CPUs utilized + 12,976 context-switches # 0.000 M/sec + 77 CPU-migrations # 0.000 M/sec + 55,114 page-faults # 0.000 M/sec + 1,691,511,828,074 cycles # 3.061 GHz [83.33%] + 1,532,208,381,110 stalled-cycles-frontend # 90.58% frontend cycles idle [83.33%] + 621,744,344,523 stalled-cycles-backend # 36.76% backend cycles idle [66.67%] + 299,846,020,001 instructions # 0.18 insns per cycle + # 5.11 stalled cycles per insn [83.34%] + 40,958,238,817 branches # 74.112 M/sec [83.33%] + 21,459,929 branch-misses # 0.05% of all branches [83.33%] + + 554.276915012 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 556814.234121 task-clock # 0.998 CPUs utilized + 13,237 context-switches # 0.000 M/sec + 70 CPU-migrations # 0.000 M/sec + 55,552 page-faults # 0.000 M/sec + 1,704,664,130,406 cycles # 3.061 GHz [83.34%] + 1,545,675,582,807 stalled-cycles-frontend # 90.67% frontend cycles idle [83.33%] + 633,094,029,679 stalled-cycles-backend # 37.14% backend cycles idle [66.67%] + 299,667,160,749 instructions # 0.18 insns per cycle + # 5.16 stalled cycles per insn [83.33%] + 40,929,141,875 branches # 73.506 M/sec [83.33%] + 21,024,237 branch-misses # 0.05% of all branches [83.33%] + + 557.952865517 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 560832.876628 task-clock # 0.998 CPUs utilized + 12,793 context-switches # 0.000 M/sec + 77 CPU-migrations # 0.000 M/sec + 55,513 page-faults # 0.000 M/sec + 1,713,840,185,302 cycles # 3.056 GHz [83.34%] + 1,555,002,421,280 stalled-cycles-frontend # 90.73% frontend cycles idle [83.33%] + 637,113,380,734 stalled-cycles-backend # 37.17% backend cycles idle [66.66%] + 299,715,387,470 instructions # 0.17 insns per cycle + # 5.19 stalled cycles per insn [83.33%] + 40,932,284,030 branches # 72.985 M/sec [83.33%] + 21,650,917 branch-misses # 0.05% of all branches [83.34%] + + 561.996199196 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 550567.500826 task-clock # 0.998 CPUs utilized + 12,798 context-switches # 0.000 M/sec + 82 CPU-migrations # 0.000 M/sec + 55,289 page-faults # 0.000 M/sec + 1,684,502,992,534 cycles # 3.060 GHz [83.34%] + 1,525,773,333,416 stalled-cycles-frontend # 90.58% frontend cycles idle [83.34%] + 624,056,379,930 stalled-cycles-backend # 37.05% backend cycles idle [66.66%] + 299,717,851,374 instructions # 0.18 insns per cycle + # 5.09 stalled cycles per insn [83.33%] + 40,933,551,765 branches # 74.348 M/sec [83.33%] + 21,857,346 branch-misses # 0.05% of all branches [83.33%] + + 551.751018706 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 555494.391825 task-clock # 0.998 CPUs utilized + 12,852 context-switches # 0.000 M/sec + 58 CPU-migrations # 0.000 M/sec + 55,583 page-faults # 0.000 M/sec + 1,698,991,939,785 cycles # 3.059 GHz [83.34%] + 1,540,286,255,055 stalled-cycles-frontend # 90.66% frontend cycles idle [83.33%] + 640,738,068,956 stalled-cycles-backend # 37.71% backend cycles idle [66.66%] + 299,551,757,727 instructions # 0.18 insns per cycle + # 5.14 stalled cycles per insn [83.33%] + 40,913,471,509 branches # 73.652 M/sec [83.33%] + 20,264,283 branch-misses # 0.05% of all branches [83.34%] + + 556.645024828 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 546762.798329 task-clock # 0.998 CPUs utilized + 13,058 context-switches # 0.000 M/sec + 64 CPU-migrations # 0.000 M/sec + 55,257 page-faults # 0.000 M/sec + 1,673,716,383,400 cycles # 3.061 GHz [83.33%] + 1,514,986,220,797 stalled-cycles-frontend # 90.52% frontend cycles idle [83.33%] + 625,080,656,461 stalled-cycles-backend # 37.35% backend cycles idle [66.66%] + 299,613,800,760 instructions # 0.18 insns per cycle + # 5.06 stalled cycles per insn [83.33%] + 40,915,862,013 branches # 74.833 M/sec [83.34%] + 20,910,287 branch-misses # 0.05% of all branches [83.34%] + + 547.893249032 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 548287.545724 task-clock # 0.998 CPUs utilized + 12,824 context-switches # 0.000 M/sec + 78 CPU-migrations # 0.000 M/sec + 55,174 page-faults # 0.000 M/sec + 1,678,345,846,454 cycles # 3.061 GHz [83.33%] + 1,519,483,980,886 stalled-cycles-frontend # 90.53% frontend cycles idle [83.34%] + 617,643,582,895 stalled-cycles-backend # 36.80% backend cycles idle [66.66%] + 299,920,288,315 instructions # 0.18 insns per cycle + # 5.07 stalled cycles per insn [83.33%] + 40,977,709,387 branches # 74.738 M/sec [83.33%] + 22,271,141 branch-misses # 0.05% of all branches [83.34%] + + 549.477799232 seconds time elapsed + diff --git a/finalExperimentRuns/matrixMultiply b/finalExperimentRuns/matrixMultiply new file mode 100755 index 0000000000000000000000000000000000000000..70e131108c590ee77d158a3ad52523d196fc36d3 GIT binary patch literal 13242 zcmeHNeQ;b=6~DWiw1IwP8(K&ynpL+mEt;jJrIS*@mnLan>b4CfMYJt1+s&p~+$1}@ zZ#9LgbppuF28@Udq7FEYALAFGj8>hI#EP+uIz=6eRl4ns^ihvhqhxnq61^f^P{=Z(W%Gl^c&!aH;9N< zd9F~>rPlF+-A(;FmPi)VkR7J`6)c#t-3_p#IA3eyIQM9ObLHifo*z@qimOt|gPS&9 zmFjLxCHr%Oje|{_8aHi>WCtQw%XtS82{>|gJuYKF1wXI~!2fDAh?SW?9EZVE*z#HeljXChk=fEk}5Dsq(0hleGjdS2z z=D=6YfeXtz)Hl#?W$jqTwk(0m5~r)MNn|sz{%&C>`w}9Zv*W$7j7Vpa{dSM&i=|Qn zaS^izk}xL=ZQd74_KTiOA|bX%+qbq@S4XanTm#3#U;eA~38!o16LhWVpq9Hlc@gQn zOR-|2p-c8?ZMxQHNZ|{CQ|`FcIPmhV2w~8H)4JhS@4)$9AX&(PJNJt<4xD^*Tj#*} z-XK|%1INV5&2Zosmr)_iq3N399{?0Hm{#$p@L>-9u;w_cl&-n$@{lO4K7w;?gMl9L zy(FHTD50&+5Kk$YJSq8GiKkRdj!OO@@d4r=ll*&#r>RdqBKbYU)08JiB)@}rO8w+f z$!{f|raqaL{I$f>lqb8uum4MX{+V0M{PX6}A5V95wvUg7umhRnVG)WOrTqGWa3CcHJ=vA-0+WPnvL4nmBNLWQ1d?A8(r`g+lcQY2XLVv5A10A20s+ z)lvz*Zva@Rj=Mx(Q=;po$aIPBQ=+#5)Z2-eZldz z88w^pib!s%YrIYJQ`aM&gEF2O&s5GU-f#L&7J|o);9kf-iz{}FhACR-$@h8qzE1i+ zf8^Uw(q>THBn2}Ngr#8S$R~6JZl7l_r5wC2pHnZh&l51-+*bDa11TV%k4XW1o{-mf zyzPu*(t64ooO})<9opom?8}TyeinTs<$w(Ej3+5NU`mQvSh1OOc0%WbIrjU2>3iBN z)D?C@hj{2bUAP!p0n*Ar>#RBUCuqGyS~;Ybcxb&;xEfk7tbo=BfR@a$KSS#rX?*}= z5f80%g}T~DpY=VR530OB1%2e8cDO?>1DgFeBs5byyk0_Q06i?BGquBYfYhRYjf>&{ z#q;_u(2jF_f!3(tcu~Ab3Mj-{6(V0C6^mY(YC*=3`)8JuZ@mDK3%a*xvpDfD+`fhC z@6I9qvJ!u84siiumAgDNX#L!e!4l}x*nP_Q7R}zG*mr4mH(0f%DC9h@Q$BavEVP}* zZjC2_9N|;Y$yYbRLfs=D#jI6t1PfI4dT?K>-YeM5PGCzeH#46KpNi(Y!xQE`jYG>q zB6`p2BSe4~qj@`gI+{Nco-yU;)pwnNsd=`U$0;mBqhO zZ0gs555JK@tGh$w!?!B1`@K0edK-5Sth2v4g zJpo$Q+X202DthGeejJA|FZsid$Me4|l}P>sj_sK53a7t7&_@a+|0RyMBM-x%Wk3Fp zl49sU>J_GX^n9sm`2L4|& zfY%AKar|DMar&2?8h;O3tXR=eZOESftSNf+cg=siS{fk1gMNcZ`P=SjK=J&|=$K#e z{H-MpU22OI5%rp`(3A;%D4|wt=#rHGS3f1W%KH)i7Ic}$2dfO(W4ufA{Jw+z@i!sn z@ft?X$I$x7ljJ!sr!^nea_#PaPWXGZ*U?@2x;&ui7c~8rra#j3Sxx_>=~+z|EHJ!7 zO1>NC?JX_WhSuyonCrK5S4ETkvCKedV`NigL*x3K1g}}Ecp)O$!+mz_AgG;Dw3mDM zWSPjMMWlbgPDGlwwl~_bLz+9(pNkyKCGinD*)1Z(^~SQjBGP@hALA)%XO!f9iA*** z(C=a_$TEpkj0|)yow7wF*`LJOP7LDQ0|v5z?wB1DkwmZ6lZo{utlnoI*Vgj>gxIp;2^5MK5MIr_mvd=ijC6 z_lK0mIz`H7ul+wDq4>ReY=33hQguj|8q;Oyvu`QTr@KO`^Qsd>pY0eXp6?yTh}NuC z+++IweFNAHge$oGyN~X#+58{V6Y_h6UjKTySxErVHu;SUWC29X&q=2+fJpfH=fmCRzw_OAt>FF9jR(v1j&6LJ;Qh>v*Om7vH+~8Boh~ON`vH8l<9)>`42Tt| z@0?Bl(sKQpTmQ21{}XP!UhsYE##aiyAKf@r6S|wa50;3xFECsJy1%N#-%2hJ4E-+h zp~8?pKsy`VuRd{M9-1V6VIJCm`^6H`R00D`{q`S_v(Fy@5ezs&PmTWbH#s$ z9H&mK^Thu#i7yi!wFY{X_At7>S+3((fK&YI^mC6b#?YB9Z$FpgtQ2Wa{J+uopa*|m z<3~NX+P7DVyER?~J!;c9eAu0C_TVo|X`Kjr=DQe)_06&l{wg>X^X-*`Rj06tqC@P3Ie5ma7DEiccgrIriUoU@T?Hf8DKEZcyOg@^mU;C%Pk>uGz3&kibfI4-&Tl)zS3de|N60 z?=bsm+tn)FY}?bkv&~|T+;G3*MZPDHUixBoCONn>m$H-T)L}%efM!j%YTAPTY^jiY zpl@ev@TOQQmw;P(KVii(nb=_~ff{eC_1(Lgceb~C$u-P^X^*w$%v zHgAo#QBGvlcRZW3 +#include +#include +#include +#include + +static int **matrixA; +static int **matrixB; +static int **matrixC; +static int N; + +static int randomMaxValue = 100; + +void setUpMatrices() { + + int i = 0; + + matrixA = malloc(sizeof(int *) * N); + matrixB = malloc(sizeof(int *) * N); + matrixC = malloc(sizeof(int *) * N); + + + + for (i=0 ; iOxsxl28NFXGFG&+9|LdcEUe2yF@kSrXJ%n!c6KxK zMi+||1gzr}#iq4rOr(uAM*Bh3SXymef-Q+nincW+5ff@8nFUPO6lGO#`aAdCGxO%{ zj2}(-hJo3y>q_j53F)jR0u8(akC(9u-Ydf^De}xuSr&6UNJ%V z#I<6!7zd;pmru43HET>qRM$*vlw2if6)vyC1iTKPtT3Hp!h$JVNR-Aa6rZY^bVjYo zG8Mul0n#H|=UppV&@NeFxvZ_Q5$_`+ zTI9VzNtR0cStBg-cSag zT?QArzO}b6t|yIP!q9aA_lL;aD?~C8jE990?Tv{3L^N*nh~8i<))x{%qb~|Il2mHF z!Dw9cBq9;9I?&qGtS|K}^(@DL!lC{OwF-Ejo*`XSQnR8HsCAvmiZgS&WR2f{1;aTe zJ{|!1ic5_J&%a`5bXss)4_xXjIInSPb6IffdY@;(X>2ZwEjX`vYV%rfOe|lty%%b- ze*>HChWXjI(U-RO)tcihkX!z{SuT;Qe;N1Mxjxj0-$uj z9vYPV&xo%i{)prsBc7%>bXf8~B%VUt&_T&RKs-%#Xt(6=C7z}@)DM2id#&j=Zr9T9 zXnWrsZtrY8F*rQgC$tmCx+FQ_1j*h7!HWkE(%iI6_0UY0(Dn}+j@;{VY6q=lgO)zK zo&uEPb#&&=PR@uP9@zvwR2kpoHSUWrK_hvC^zGe zQYcfMqmgbnm3Ze*)#p*Ipy6)Ya=fRf$5T6ZAErQhHw|8cacEp)`cVnNwwf)kXc#DW zX3KG_bq5cU9L#f`@L!g)p{n|Ac$C_)GnHEUME3We=5kuPs=l8vTiZ`n+dzr7{iO8YMl8F+YboO8=@T5mjm?G>6nmF#b?66*Rs3_x4_(!O%#8k-b zsx{*u$=tyb=WLRF z2rdr&xUdKcD5ZQ}O=x2_U;)3l5Vedw>7^uWu$ zC|)Vvj4>y&O~lK%VvWb_?=%8iIyJ0i=-O42H6V?+O0hOO0AFO2Sf|-IfXa5iPyhjos*iH!%NfWBN*K z`a|v5mCDxiKeF3LVCMe!j5$l*qWBj`e;i1E*pmKNV{XQ2ZSQgHLFZHFw9IBVwzint z8OVg)bpg~|fsEmv7s%{%FUBmr2%fv)c=7KN`-$A|u*22CE^Y5f&Y1ZU{ac{+wevOD zCo|aZMslh5(G~4r=3bgTNw%3^2Nn1>a@B`jVj{kKW>?-wPZ?El`cf`ufNqBW9w!Rl zy$rel?mJC9;tnm506aMdA^$SyO3;_FD{Kax4Cn3yeH`>jQ2K7BQgL^Os2Ffo%$_{H zhW__(1Dk`Z3*#LmfvL__Q|s2$PP(gRxA@kq8?SG0f1O~G!FDZedF}0zP;lgay(dhpvtjnDt!l%9|MpZhMe_#lvKvbmJ+_NQ6`nDlAYTn zYy7|dpu+h)g?><>a*atudzDYt822ike?#K&__rhGacm>!Q>WzNC&{y4h816>+SPFX zbHcw@+Xq^up36o>dlbD>(fbsAMA4rs`l6!t{=xuOH#dLNHE%1 zPh(T-LiDS+t?`tnI~B!m+R?D^5VtLu+$KEX9dYz$QX^ruC}WEl9c_t7EJzBf)*my3 zCmN69ZbSxfht*NE^@W2*P2^oEfBnC9e9U(NL&tPvfgaP}| z4Q?LUx7km364If*-rh*uus@Oij-L%RTC@DVcpW})g?tShOWXxugPyC1>V_(A-&{6nj{oi#!0eO70)wGrCMCt6;s=rvptHnxRo{?J=c)w!$ zBbz?wLk%kZ0a~1v!g>rnhKhB3-tW9>1Dwi&iYm9{(Zi^bKKox&`=zGzdEa9NyZ+NQ zea;{1RQj7)QBk}8i#GiuYWyQgKTO713O_%F22mjq-hVmIit~)@{<7h^zd+VHK4lY7(UiV@JUdS*Ahh<_e%?Ph4~+A@czv=y+jSbc*6}%C=FD6)ps>8j z6?n$~i3Y1af4^jv{w7vbl=YaNv+4U>T~gBLk|h5-lF1duXMPwJ>Wk;UN$GdGOo_!N z$=`Wg20lQA?6=FY{vH-olw_$eorXG(EgRJBO_y2u)C!``dJGfK?+#-`H{t7m$|3ds zeie1f#bWz8uF!W~squ%^gx<4tZXX}&WlJTj^*Vf`+ACpkXGy$L7$xzl{CBgpvr0tO zqb23X3Eqc_<;M%&UyAV>!TUxrK0)w)P>fH^e>WH7lk)Mq7@sUSE*Ild^7*I5_|*LW z4aIn^;P_aKI|awRVtkt5cvg&0&*y~}<5wZ>bXg%;uf$u#amCtLDXvDoXes%xe5T;{u^6YU#o}VV2UElawf}J|yAR=`nT#B-8NXiQ zqy6BO_-H@)fjh($;T-2ftx)K@r$Q9$=lA9gg?Fhq!|&q&aO!8bt)FuC@00yZ7mIEF ze^}zvgtOL%TA@6FYDJ0X_$+W5SEzlDHIAWD%5Q&_{mc}UAVG!q)4!um^Q9CjDm*W9 zf0!vKJHv{<3x?z=OT&s^ka(S-)GR98|0j~0F5I^HPKIMEO02`HrNc+d&y(__*Wt~; zr^64FRY--y-dc%EsOZ)O+=c(f?dx{C>gVu8pOk+}Y25?diFMei=Ea@ulk%hA_Xkuz zN5-4|oKy-wkvMA?=(9?Gca148a~9D22jJ5jR|!gPw3a`Y>E~P-{0eYqiTO^1qg>XG zRedJ#X^uLf+2(s4;i3@7`1vjeKD|Ugt0g`~P?{$d`rf7Toig&k&7NIKp1*sQxY)1c?a%9BB~SULRGQ>nh)00CRNYFRQS$ARd=h>^H9jYCtE5?f zRmmTj;FG{vCGw`kNAE9hmFY)>kQ{AEr52%tku*}s;0hsEy18>*haPBM--!%sU2iGk z)-+q1!hQPISYLNArpy1)^=}kdV6>9 zIR3RQa+p;ejctCNIU0uRg;C^zfE=YaXe6QoZK;?M?T_t%)oYROO;DqvO^P-PN(}Go zZ3_-;48~Fs3`++QdN7d)?$9I18P{8GUEA2!+FaZsGt7m)I+L<|9U)J5%#{0LnPkM+(4U{7>2c*;9S1hbOEM>4UvsD45!o6|;%urp7EC5F*HA1H YjBn_dY5c_<_o|0q=v&%AkGoj#KV^V#Gynhq literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/matrixMultiply_clang_optimized b/finalExperimentRuns/matrixMultiply_clang_optimized new file mode 100755 index 0000000000000000000000000000000000000000..cec7923b87ebd9fe40a0fb7c27d0b3b70bc80e0a GIT binary patch literal 13285 zcmeHNeQ;FQb-%l-1!1I>z}OZBM_X59AQKjZ1QkJ)w?cvyUO))pLcxAoNh?@qC9QYg zI>J#29$BQ@1)}tmq)zP4q@B(r9@FWJhlxX3ECO*S%|Oz$N<~^~>||w}7Efy`o8ay5 z+;`9J+b1a>o#}tNn)l8zR_~q9wFI|09S*_8DSlfJS2<6Uka-tk{5K@4 zum-U}XyRjHnV1K}jZ2d)M9mu0DP@{zsgiSnmf&h|nm~h7lNF}RO;|8x4~bHLg`%md zNw0fMmZ=b436LK7y7FU^1?`j-rfZcSoruq|LnbVkvfdu(k)OY6VL#hdf3wA9T#b*ZV#S(h zq-#U{nrP4JXrwOq1u6` zH~q=yUH>wE;pM;ht^LNk?Zc0fE?=nr%B2I6i)WBtF$=zW7QAT|{NY(}^3{vWUg`nN zxcUW`t^hniW|Bv@L0O(DQpmlc&NWe7?HlPh$W5gBcZs6#UuSj zuSghiV<0N}Lec0zHw=)DGSC-_^o!njI4rgYTbs7(>wN2c>(RAv=Kl(H!X5adXH6HC zhU|$5j%8EGg6q3oSl7EVL3dLkb@?FHch(9a&-zA=gKKYX5+li+kPmW4{ z2k{j8$>Wl5BA$jm8I$~{h^HY>c7m_{S!?RrlY!Kmf#J7qw{^5$$z;kj5x8=3tt3~j z-lvJ|XCV0BqoXv|K-&GKrCt#j$r#SuRXNmAYuOh_y}g$Nk8jRGP9z_DO~V!nwKqxa zxmyjyUA*fG4Bv7DHjXE1dMm1%1%j4w1XAwv5Xvq2wiHUcUm=x^x6&sr1kh3L#uH;!??y-czvF-0-?6tX*uD7x zOzt?f{GQZF{ag0hN4Z>U>T)o(emnIGlr789-*xHGmBZSohJGOV%shaboeyf80 z38vRCKvOXF)9iE7Udg{wJxP|*<#(#caLJDd>N25Q3JT=Lnm67Zx**5sKjeSXua8w! z3;*ML+gfVx)aJ5}LOyjRd-q;0mv(;zS|gc?(|?H05spGUMl!FFL&stj)yJulT}a)W z2}HhAJ#uSLAocfwi|=d+T>M~#n`(s%D#nN>JX}Fwr z-w%G{*wCM~<}Uj;UamO#SSnNMN-Tn!- z-(s;JV*6{^K99@d|K9ZGMQ9$$Rh<4kI2BC0?*ki5KeAAg@-mQ?+V5kMoAY%fcdV^8 zV|iY=V;dh!FS+_yy8c?a>_qJZJxz=K)^y`Uy7BWBuQYzy@j0wFAFlyeoRV)Q4l4 zYtw#EnoU8tZ-8Eh=nJ4H@xU(;j=B66=qEA5N-&eY1-cxx5gTYD=r=$+K+CWl8lW$L zz5u!eI#e9bwhPB#rDIvy{8IW~q6XMcn_{I72)6`3+oNjPo?L`#qJzO79ZbGr*ICqkpSi(t8Wn6xw6dZqfTW*fzxJ zAjWIgqj6FEMiI9Z>SE7H_lbGBM;o611?OqksS@XY5B+E%`^}J>f*k!wnk#b=n2W$% z1m+?z7lFA5%tc@>0&@|Vi@;n2<{~f`fw>6$-y?w66|%4eJI^@%D^I1;B%(~wHn%2g z>a(UORo^w=|0p*=4QHGhk^HyajLYQto6$L^$@90CFl4DLG>NEE^Z`Yg(1#K#+3HS7 z`5nQy9J3Lh-dWR3Ao#nU?nD%>A`6Jj23%;b19C672sp5t;`@gG<1rnUe7 zJAbdX_jE!%mp@hXuM~Y%(aVbdlcGOS^p2wQ=4p15lHa~{>!-Xc_jM)vjpUkOq(2lN z@Yee_`07^ICMCFjmB|ZJ#@ihY^&j>=6OJb$1O47QUp))f9gD@o-H}9iop+@XI-FS3 z-V$u_?`_fR>euwbaCDV-WmhN>?(sq|7<_yuDX$X3mpIyIgt|cSxl__3T*Ft;a6Be_ z{R2kW=Wl9V4ZDgv+@JJyB_sH*9qAE1;*Nw8M})8EXg}ox}B33OvuRcaD{vbujC51l0sG1YH_#f8%|B)hB8R+2d%}f-;BmPSZmz>8K)-2&nSTX=WoNj zuB8xeyKvFo!usc&8aN@&DWFshcpfmSvOezvj{~EB_b-UZVvpaGKxyw_ zecmrVt_J#`(qsQwj_Ie-PJ0paydP;w->dZP{wr8KiwcRdKJR~>N}tEc{oBX?yiK3? z(?O*_t~w%pIwS1*^p2TgLjFd%W!WS8V!}0YIfe znh-;1XK>$6|ip=<4*^I&dNqXC8G zO|HN*{_kk8>htfHtkUmfMMYVU={q+4fY;OrcufWN)8q>MGk+Tuvc==yuk`nOO^LN8 z$=|tO2Hr=7{I|=o{&Os-D9KV`x(IddTQ;cMkGy8(BP)nH>oH6`uN}sS?#C|!Dre|$ zL3sq%I$Z2O?<=&vX6pa88qoVTVMb?MGvV_EpD$J=7owt-%p|`+bk2z1CwQMPwzDw5e;4Crg7@WOygZ+O zT8w-0|2Gul6@vH2V!Se+KUs_~61<-kh&v7_Sn%Zj14yg4bg)PT7gY#asvFqH&&9)IjU2M7)RMlA_p=S zdB5iNPe^=v92z7(Jq|6vouXWH+WI{xa44>mL;!vyIC< zAC`(i8~&D(KW@X{mG%~k8r!(;N%`sXZJrG5bor&g9b)=?TLXMC#!K0LRCs&aB5?^7 z-S*6a_X79gzhnEneOk(wiyI3xX-DP?pf(J=67$eLpZ`G0PhanJ?vkHp=bLuUOKU=W zMdFIFkiSv#u~Jk1hpO!o@I}u11tlX|%e7hT+@1w@AyAbwjJFcF*J@bRtAWpy4_pU) zk+Vv)sprnB8sVa_zwx}gfr;?AU_U|gZP0gRv3jeXhr=Kr3 zC2liLY&Wu=Eh*EYJ8mS5Br>EZ6MAdM?sh%cy0-(F)VkhW#O>H>Y3do!4@U>OLQ!4* zf3Am;g9871$D&~)+~eD@zOGhKgC6M_B(4rQ)$}iZPqMG?DEHH{t66rlt=+$~MQ4t> z;d-GL`7%KE(ibw~k-?qGs1b=pkHYI+NaQBSuV|B^ThR}_blXKH>GNi4{51K*fPMto^wF@;TX$n%J&}GriC0cCz1}XJkC=StV`kYG%Ot|azF1*6 z^3kZLpyM@;ik!^F*LOUlw}%f$5_n^^H5y7J5T@>EIMlx{Ci>JQC|Hs`Qr>@YfBy>t C>raXR literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/matrixMultiply_gcc_optimized b/finalExperimentRuns/matrixMultiply_gcc_optimized new file mode 100755 index 0000000000000000000000000000000000000000..42919cf32e32d7a6ed36a855e2fd8ece469f4c68 GIT binary patch literal 13203 zcmeHNeQ;FQb-&tO31MI*h-?cC(Z*dI;aF>luS&+Qcf|_c(gkFY91?>ci*|+9UVUWu ztqmCpN`z=PD-mVdnNkm#YTCNvX{KXOr{iH7JC=fN(oCksjwfZt*rq8sD+2?WHW(Y@ z?eE-o&+gkNDNQ@m|8zC)oqK-woO{ka_v5YJJ4f2Wn;d0jf{R1^fgmnX;g^tk7h>>B zl2ur5;GXUz9B9URhz_M7uJo9WDaV-d_-Jf&b*TP2 z9DZ=b`-zC4yca3SQfa?rM5%5plq{%UR+#QKVZoI39)lkF`MVbObBD4wTU^em@iA4b zcrX#)w|?z|iD*M2-j_bmaG-g8!}_(pRKIVv9CtMwA=%B_I;Be-$69dYa}6$91JwS? zvcLFb#l7>d?|g6J&#(OK(a&Gmn4U+ve4+X~m#;%|$qdq~XTh~u@GsATlTRL8_VN&b znd~;qf(K^7m(7CL&w>kG-{0Hcr>Bfa($IB*Y3ZU_SdWH*WW3Ml*1LM17O7;UFDi_9 zZ%hoNjjoIPVo|^H^}}zNxq1WSdK)1?Rm(ZOs-O11l821;3+!3ZV^Msm#@3 zM7h7B+xKBx8+yI+G>hcdeSMiniGNA*4-rp8pBk6^YU1e#of?z;{lrrUrUoT{FYz?=sR79^Bc6slwHG}3uVoKc z{u2$V=|=7(uuS=VkZGF8ho`Y>U#IdHUq0C!PYMEbZLl>{NcZAMN zRO58h&P)z2AabU$!Y^`PL5Ke}HfGu>e`KjgXu}hRBY)QHqf^UV+DVOrkBp;Dr2p`T zejLeKw){B~{nq7X;wEo7wV}&pTFbeVx4Wt?DB!_FnU*O}LnvSKh7`({?t0=cF3-=26>W6+RjHi$AonMqBaWF5LYX(<(XCpK$UVczn?ODxBnqT$_+lt? z2FS-i4sXyVFFBgtt*RR|`?;3$ORa06Oz=ICTf>a&{oI#P4`o~*XhWyV0xjo{yloCF zusg6P@MJ*801M*_e6=ZW@whhk?rluyncP2uWXrd~@bE;{@qd8Hpox(Q$zM6NOwe077S68qhO-ZNo8ApO*VREi>};q9;dq8J=eIiV%RNt4 zCO^KK`N`zXy2($=SN-@@6#Z1acy`rWfy_d$6pM-6A4$0%Q5y#1vMN-)_={CHPF%4bkUrlZ241|UK-=8u+fb* z+Vt-5#NqYqFBaCCER_bfC>k!f{S(hhUQ{Ob94ZY#Y{q(bZzGa0MLPy?yjdn#~ z=#8=vR#L7VE!pxr&=PFP9eEzz?uK31uc{Nujt~9M|Ly%hCHsHzeWB39a^aW zzb{VmY0La}2D6L)7$O++@IQC%Jp6QEG>{Kx8~z$tIJ@$YBrAqNnyzAz4!badt=ZsJ z+-j~g-3VkCHa1NZ`wL|sJ{`!`e4F-D)r&R1U-nj@WfD`+c;u2c^rlN|c|ZL#gaylP z>c}ZG_$B*kdi+1Slj46kV(!x!;{OQ*eoOqfAPOxj{suz!_@Dih;`1G}$oS73pU1=5 zbWe;K3?UA*I&(luJwS#GS z@5uRZ=Hpxt^>F4|?qSd;_JlLPGMC}h1K_O(hL%Zq&xJEl?*(nN;ZK)fPDWRb5CNVG zXAJN4aORNrrk2_5#R+(&IlSspAagsExuH$oc7`(lmixgcI827G8q4Wu@I&v@aOOrZ zb1jgskzQ#nm(w3<+1<1|65i@?HtMYnqvi=`4R3uod&t{}z%-v$R_YUz;&TA9O_Lwqvk_;OR!c3p^{M9;_}=c8_zz zE>PMm%i+EO`U+?bo?_>rauWOqX7wWIA*}ufuh_GfTHW;{s{ z6k6St)Xxa6arAS!&`)soe%c*pXXq_+^`7Kq=`f?lXp&(UYmAR!@0F9^L|&^tx|hBKqR{!)7nL-Y{zUV@&X z^o~1VZ`2ubdq!NEyZ%`DW_ROI1%gSQVhCoWNZ6dWSD-)saX!C+fS|kj8F!_eH=5^j z=r=?7V0&@}gKSThpS7c#TJI^@&1($`t|ESNHVxZhF@kM5{*rmQ}{^s+1 zKS3uPej%*70=&(*dBlLVIHrg~n$H>-AK?*EMQ(%^Np94-{V{CGFuFzF)?Y1H#wWZ^V3o)=+~H*{`_$eQDpmbQ~X`<5A%w zt|yY}5x(fbKJ;f&BWbog6HBJz{e2~jj<#eh5g`Rt8%P+!7w?PXZp04Y-VFwA{n3aK z5x!WD-kpr}#`K;jbeR*rE~7u0fhExZmH`#n_V;bQ#`haX%qZ^0wE;>}g8%32fd zR(-?am$;!i^h&OHv+D=ZbOU>W?VoV?rSJ&_u>YL%!TV1N;kFGIodK+W%Han`=Y=Gq zQVqBQELB;b_v_=p=!{@}K6fV6!NKPYL}anY?@6Gv$625Eb+a1iT}qGrXE~u9 zbEsJL`MI=9J-FN~sHh4{0Ubw;^f~@L>bcgV^!fR~3U>V$Z2Fw%!}&kESy55D{>wJ~ zv&#NiWuLyOSPRb|V-u*5|NNZfd??Nb;yAOsUH^pXO=_BkKrLLC}VSl;A{Jmde42CF{*&d4eK zy{xDx>oNVvrmuNS4b5XJu%9MZw9ou?RH!c=|6ZlP%VSDtCMn$Q{rv_lh^7qS^3-wqRx5@6K`9hX45K@oS=sb$_iYR!^LsqbA|TTO!iNx z0o}57ZnqEhS&I|iHaq;&+9}hCpOe-`Cp_WjUn%Y?{Jt&4%L~72OYsUZ;q+S}S$E<| z%g+~UqZ3i#=SC?$U-0vw6u(38IbVt|D4gG=_(H+waw)zD=d9lf$+}ax3%~EJjZRS| z_#T^ihlv;&R#1d>rVX2=X1r{=oEJ%uX85(y9#+}rSf+d z{*NfdYX$GyQhcf4{aA`qmS1Tx_rW4@!WK{3UoP=$%B(6W^t-4G8Hapcb0h87GBG_4 z%@Us;hc@62u}HjRv-^aUFZ$2><|&2usB?z*;{nx=XPzImVwuhVqYxqg8*TCbp2Qc6 z3vPe06V(1v;?w>A0dVr)qn>-LG>OVgaeG_#vs4Ty|6NMq9fc3t#$`SqmWnYOeo@Jf z+wd#0za_$J8`o_qKYhJb$iPmQUkbcTOkZyg0$+mhQsx{LKHeUcxP(e>kIjO21NY#+ zX8XGRhLm3<2JZ07evYZ$hJaUN9qv-&Wh38_^3(S_J$K1ZQEB#bSt)#9;nx-Zp~7DR zzS!{vLCJj9@~V`#B4+*kEci9x)iaEXasxcmyAcZzz?t%P>wqtI)QWc7cq!LpvE>}& z^|N7?ezr<{k)RYuDj9hfV$Uq{-%#@HY9BqX%`3RQ^Na)1NO>5;tW^?p?@B zwxl+TuB4GN(#Tw-T;+`&+jr>U(9RBIJnMR}gxj*w(iH92_b2-IMH0IF_gs&p4+#A0 zJ&=eQv8ZqTx;0IL8uWPd0C8)O^-TZaN7KE%2iZ>BwxBe#X-8mdo6a1W;d;@Ed>0_C z^hS(i{J_?9!iWzf4#MkgNVO&?plGY28)1iDI_QyPGICIlAx~Qmer;P|Ysl6jQ@n+~ zIlR3!5Z1SE+O)H+L+=Q*hTA9zGJU%%mDc4;3rgPh`#F1?GPYIPcPU6OB+Q&|A(O>- z#8Pm0tMpUoG5Nkibr?@1B;FNEnX;iibXkDZEO10@$>gP0Wiomxr0W(}Y$@$#qWU!X zRKMPXr1nHi=%MWxL^R%~r&BRA%iS(rh>m={W9Gb<%A{gO=Rk2davD^`b-b}rQIeVQ z*39~1CzK+uZ+S-F5!)Y6;kDJqL?o3$u(}elNMGlG=v7OhXhZr!iTTA&Xr}%fRebti literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/matrixMultiply_mod.c b/finalExperimentRuns/matrixMultiply_mod.c new file mode 100644 index 0000000..99c3b69 --- /dev/null +++ b/finalExperimentRuns/matrixMultiply_mod.c @@ -0,0 +1,157 @@ +#include +#include +#include +#include +#include + +static int **matrixA; +static int **matrixB; +static int **matrixC; +static int N; + +static int randomMaxValue = 100; + +void setUpMatrices() { + + int i = 0; + + matrixA = malloc(sizeof(int *) * N); + matrixB = malloc(sizeof(int *) * N); + matrixC = malloc(sizeof(int *) * N); + + + + for (i=0 ; i " + exit +fi + + + +STR_C_GCC="gcc_output_$1" +STR_JAVA="java_output_$1" +STR_PYTHON="python_output_$1" +STR_C_CLANG="clang_output_$1" +STR_C_GCC_OPTIMIZED="gcc_output_optimized_$1" +STR_C_CLANG_OPTIMIZED="clang_output_optimized_$1" + +for i in {1..10} +do + + echo "Iteration $i" >> $STR_C_GCC + echo "Iteration $i" >> $STR_JAVA + echo "Iteration $i" >> $STR_PYTHON + echo "Iteration $i" >> $STR_C_CLANG + echo "Iteration $1" >> $STR_C_GCC_OPTIMIZED + echo "Iteration $1" >> $STR_C_CLANG_OPTIMIZED + + 3>>$STR_C_GCC perf stat --log-fd 3 ./$2 $1 > /dev/null + 3>>$STR_JAVA perf stat --log-fd 3 java $3 $1 > /dev/null + 3>>$STR_PYTHON perf stat --log-fd 3 python $4 $1 > /dev/null + 3>>$STR_C_CLANG perf stat --log-fd 3 ./$5 $1 > /dev/null + 3>>$STR_C_GCC_OPTIMIZED perf stat --log-fd 3 ./$6 $1 > /dev/null + 3>>$STR_C_CLANG_OPTIMIZED perf stat --log-fd 3 ./$7 $1 > /dev/null +done + + diff --git a/finalExperimentRuns/threading/.MatrixMultiplier.java.swp b/finalExperimentRuns/threading/.MatrixMultiplier.java.swp new file mode 100644 index 0000000000000000000000000000000000000000..774971d29b67580d1a7c19addfe63d3be6a2e291 GIT binary patch literal 12288 zcmeI2dx#ZP9LJB*!<(65(H}u@GK0Hr-My}w*}BrM8f>x~u3JX8Yu())cjrFlUS{UH zF8Lse0uw{bd?XtcWKog*VSn_%0trkE1*ss2iY!Vg`lEjmvd=j)_r0$BhY7~H%!hI2 zJm&nq^ZlJOi>E*Sa96in7@H^f-5^B&*{}KzzPCc$zexzso4>I29#t^$Z#cCs<)kLA zqe?dg9k!(0f#H_nk-07Yuxq6TZD**ZJLS9f`tD-Zw+mU@a${-wyl{`EhEc#MFnI;0 zi+Qbc+lNfgFWyP?11gyKnB*pO6Y+mxC72b7$+Qo!*B>bg4bXS_QEcB z5w^oN*a}-<3ADlQQ-$~qK7oC(8+Jkg)<6Q5!F|vQvq8eCYlL_g_QMnKDD=UD@Bl1_ z4rqr(umD;i4lVHO)k6FXJHZDJZiSz&65CKzQ2ss!=J$VAV51O`jUp1^P^XA*(;JVZD!y0xP4Yl?w;WMy;Cu!rP-0_RA}ZR6TdCoy`W)^roD_d@c~YUMyK@aUMCNU5;-Jv2(1D zay^TSXv!V(67gh{)>1?Y#r~{4AbG1kr*(OIQ07uNV--8koFPI}^_x_H`4La5-dwj> z@U6k+>j$iYkH*+U;11;y?G(<+ESj=)g3HiKx`=S~yIPtUD7voY_`Ug&q%u@Puw(oiO}FEQ^x}Gv8a-C!wIi9;*u58Ga>(w-4iF0?AT!Z@a^zojcz zM%q_x$R zOU*zfZw29(6yO|LHR>@{#qvczR=})&wrV~Lou;Za)QirNvt)DVrKK1NJ8{k3V1CiB zR!@kbqjG^AV_C}?@`v$Q*+2BJE85C>Ohk1R%Wk1wjaO={Qcgl`6dg*hRM3yN_@ZYJGDP`7Vr3+`nQLWp6 z!<5CTKvTsbAy~`;S1Fu)Tv$_SP%HlzimEJ(Rbe)*Pq|(LO zHa8w-aF~c;xZ~F$i-P36R9UVvC0NZFbGTktR(GA()hkBhCqOVADk;iSMleN$ldJmh zsP;SosvrX~%HKphxksmYaDQny5?)!NC&^J&);U30$9QEEj7wRfM=uZ}60Q&GR^8y* zq?+$5<%uMpAmKn6*ti9q=PT%-K!lP8Yf-nJpsVEK+l6%}@3M}wwLVt#?QCpLoA?(E CYPrV% literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/MatrixMultiplier$ThreadMultiply.class b/finalExperimentRuns/threading/MatrixMultiplier$ThreadMultiply.class new file mode 100644 index 0000000000000000000000000000000000000000..6e53c73c7e53f21c3c34417e4d501aa9830123a9 GIT binary patch literal 699 zcmZXR%WD%+6vn?hlV+MY?bO=FM@Fl))-;6_BI2T{&_;wnW1%f>>cZRfVn-)8WisPq zBPvBu6t}M3xHeb>7p}#Bz`w@Fcc(!mZhrTibI(1G?|%FF`3rz5=JLqlL=M9^X>ck> zw`eTi;IzRR2U8BF9h?^!i+3X>cbZ8U2YX?lB7yPMri`QD;osPzK)#hkk<#&c=YfD| z2xM!44&ti+tSw(d3MUjHt? z(Mh6~x*nLs$-zM?cjbNQ!o!4%BXC`eVAREo!3E5^xM)zqtiaUZ)0xeG7kwl!Iv8*p zTC1oY%5GP6smx#nDr4F&gi_yGSWmP*+{SCCYF!K3N_T?}H**dnb?&&eMXCD!@*isj zXZZ~|P*zy{HLgO!Y(rX%dl(~+(z`_8=INC`L6qkYV3qv?*dG|;K;$?w`$-b?m<#lc^rfH%0zbCLcs-eQs&d1QVdE5z{p5OWLZ`{Ov5 K-iTBJ3h^5N_LRH; literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/MatrixMultiplier.class b/finalExperimentRuns/threading/MatrixMultiplier.class new file mode 100644 index 0000000000000000000000000000000000000000..889ccffbcb44e637a2aea56e6a660e1d41943452 GIT binary patch literal 2457 zcma)8TT@e46#h=mNlrK%5Yd1b5J9U51~e#bxv9ikED!{$Qmpkrj&LA3Npop+rcW)? zC!hMz%S$_@9ea7`v^WzwrS+{ZZD%@tZht}lK>H&0+dG&jGSx}4*4}Hcz1O$Cwf2Tz z)_=GMAdJ@yG@(yNO9ghIUx)!A28B4Gx{eL|e7zz`xjP8+C1pC4z0J}bmIARJf>DD<#Do~raZ$&(fqG0B*o8?UUKZk#j>`(FC+9P^6(7kba!xvNOMw}6 zT{{y=SlO(dRiG!WT*kS1N`X2(9WBj=N~4H^ZAG8cPSSR>PRdoF(9_rNxK3_Rfz}p1 zbcrgGiraJ^c3gWjpPaEXlh#av7PU<**W7Rti4hrW+;Zcoq=Kr6oHe^RVx^@c2~kj+ z&Nyx^>ZbEK={qYh)+9I3mrdKH-?*LSO7TzvNLmiD)wN9zFIaC_T?xyb>zZJ8?p)s? zvT=pv>6p^-iUQ-z%~?C0V=`GC)0|JF@|juttRnyiiYIPx=Gd7|ah{0-Xg9GJEhbup z*eAq(JV$^sUOwj}x{A4(xQbVGTr=?+t}CeDjAtnCB;t04MD8_VVMd5q6LHu&ZkU+E zya@;GJb5z|9SbHFkq~GOn&=Qt&6}O}Z!UTfpd_TYB(^7oa80B{T4@=rj59W~V9(|h z?AU@#1+CM=Pl?&LX=^bot$WHbqHfO4Wb)~p9WRxGedpRY*#V3#8jFqg2>6Lx*__SJ zQB!%Y2a0ueQe9)BYglUAN-~7cN~di%t{~L5MJGIA+9(D$HZtJC`$D(Rq|@oQ=W553s*| z6-qGpGd!NVP#+GohXZf$E_~n7Pr)I|-SAOXGFlZs)u_WZG^2(Ws#c!fzHxdBwL(v? zIK8~xkRf++dmWc~12){>r$wXtxi#ohtMCu21L~kU(6|Ei-ZHw?!KUJ9A5~+xsiVdy zpdz*ctvp#$l`kIrx#XezRRr`%yzMYJ4w92S95urvBXvZ(myCqSMlZ)FX*)|Whv``b zZ5`D*LW)vx&`WfkC5-opP^HU9YCqBS2aAXzC6u8R7;C5`e6zNyfNHJ>!;PHqHtE)eA!lT-|rQWz?c5iXUibp>9c zzuGDJXrj`ZNXz{7n5@`el9Ase7eAIW=wy$97(IwF(ir27v&$ygf0y`fU%>!%g!3rv zF+RS<+WFSuR|vV{fLGM+ND1%<8?}o)bL|A?r`E2F_W&x0cb<41hFT=!Niv=y<4H1} zCF6_C=9a{1Kzqn6cOB(_8yGb)#oLDbY0Y0Yugjf7iUZrIg;B!7BcW?|}GP$pC5nr<; zcW@2g;7xpsx2WI7U72hvv*uO=;6cAy$(Z+lz(Moiswtg3nb!2M)UAm OHd7n4)$@7V1OI<@@)?l; literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/MatrixMultiplier.java b/finalExperimentRuns/threading/MatrixMultiplier.java new file mode 100644 index 0000000..2a5204f --- /dev/null +++ b/finalExperimentRuns/threading/MatrixMultiplier.java @@ -0,0 +1,181 @@ +import java.util.*; + +public class MatrixMultiplier { + + static int[][] matrixA; + static int[][] matrixB; + static int[][] matrixC; + + static int matrixDimension; + + public MatrixMultiplier (int N) { + + matrixA = new int[N][N]; + matrixB = new int[N][N]; + matrixC = new int[N][N]; + matrixDimension = N; + + } + + public MatrixMultiplier () { + + } + + public void fillMatrixRandom() { + + + Random rn = new Random(); + + + int i = 0; + int j = 0; + + for (i=0; i20qU%3Ewf5mDQVDUp@NYN9nJO(-Tn+`xjNOl0(SF1ZiUl~Gx0 zh)cI_TuW?BT=)ar`Gb6%xg}yqH{Y4_o!5M4=Ev`E-vKP)nga)=0tzS_m^Ls|VD7v* zT`(|f;G&H=8<%ZdAq>a6p%go<#E;dUuVhG=SZ;|pRL@Vi6}f+l;Ixx4lsaAw_6gKH zAsT^C$kmlr@f|{`(zm|ZtUe-S8^Mkw6ql8jD@kWthU;S6XT}N>%~&x>gKM#9KW&M< zTMSgfMDuvgix_cyTq+x~Hw!N%whQb)=3|z&h<7(_qCL8@$P5 z|L(ujJg)TDQbQhL4(?#|( z^MrB6NenQ)*85e7b@c7&Yw1=bQnc9T6j z^~!w8ms7H~yY=vZ=+mE{W?Uv6SK?N{TlU`Z$U~O#o`32gZr}sXawLz;FXV`>bH-F! Pbq@1vjdZhsOUVBPegT}j literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/MatrixMultiplierNew.class b/finalExperimentRuns/threading/MatrixMultiplierNew.class new file mode 100644 index 0000000000000000000000000000000000000000..97e20685a5d5b2019612f3fddd91b9c8a1a18f46 GIT binary patch literal 2675 zcma)8OH&+G6#ja8W_qS+2#-u)0+@s#Aw11!FyUnaNz5d?0(l`((?AEB%=C=&P~y^} zEEkpwH)@qtrpO}dA}T3|lqgkM#6>Eb=+ez#B4g3A5K#vf;LcAfwF%8FcXy_KA&yRkb&~Q>m5xRXiCB`>}I4wk2 z#~GXzVnD;7jv)-|bTJ~tISr#4#x$JQ5yS-z7j;zQk`R}L7}xNYf|B#I3Co-wOh;07 zJaR*U5q2Ca(H}9BNh_&9i<+r~J%3z*Ix!K>ulw?|eg!+SHYe<;PB4eXf zo>Aqh#e+2r_&?jeR4nU+JU2dTNCy=%xvhW{cw{#d?{;u_cQm;lVRM&lC1*zTkS}f~ zl9nW7TL)xlcjI>5(G`{#w{mmT(X``;Ys(u$T*;J~5IoPtYzO=J=P85vjh4l5uc1UkyQ26Hd5H6sJlZG3s?y{uwVOD*tFzep z^LU9;UqKNQG0KZGDB*r}sHQE09demLX$EBy-(y;4P`;oL>&gpxa=(bDLe{;k5pakc zgb4aIR;>e7ID&4DeUzuE8^SSM=4z50e9ZAvYCos$OPrNVl)(1{UO_{V_#+jE@>JYn zKZwGONGf{sDfH#Z2<3}cw*(K-Uulzk)N*jwl9t)4!?I$3Nk$$?E`BX!(8dogFw6`_ z80j42jj`u0uoEw_V&mxH*w1yC`e9hP+IiRDQwZ7L;1RV8`H!wF@3`jTYRLcUn8WLGNmZrgr!OzJRuf!$EJr7wYr} z{hfMHU+pMTJB)x4C|X1ys0WNtXK|4I|I&iN(|<4cC?6Jx8sd`ye8WUOaHJw94Q z(4nDHLzTjJ$oLn>J!{bAa-IK}6>qhWdJV7hSD3G}V*YI`fPeT<9U*Kto9Za5)ycUF QT?7xlDhfSU@I~?c2L$#?cmMzZ literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/MatrixMultiplierNew.java b/finalExperimentRuns/threading/MatrixMultiplierNew.java new file mode 100644 index 0000000..64871be --- /dev/null +++ b/finalExperimentRuns/threading/MatrixMultiplierNew.java @@ -0,0 +1,193 @@ + +import java.util.*; + +public class MatrixMultiplierNew { + + static int[][] matrixA; + static int[][] matrixB; + static int[][] matrixC; + + static int matrixDimension; + + public MatrixMultiplierNew (int N) { + + matrixA = new int[N][N]; + matrixB = new int[N][N]; + matrixC = new int[N][N]; + matrixDimension = N; + + } + + public MatrixMultiplierNew () { + + } + + public void fillMatrixRandom() { + + + Random rn = new Random(); + + + int i = 0; + int j = 0; + + for (i=0; iV_q(C+cCW`HxOm0wLUM~V30Y?$Mn1_B zLTI8%EXMg0;s&u0a0L#Q(^QS=v@*@KQkn6AF2K>`wSXqCCM!&Dv|z!MBP2@xN<~vu zizaF4{ykfN+dEa_=VPg8nKkE_6#a{s7rbhImb?OqKW z@fs1aO`c1XWT~`WFr!pA{gMUMWQA$ef(297+YLR6^P?7ybC2>@E-!i2Kcz_hkmw4m539yJb@_oeXY}{ig6q_Ksa0G9=DpJvfTF4hM|^YX9ta2M0F( z;hr2uoU@rUjl)(kAXTRB#ibbMy5!VT0$Nk2h*nxQ3jHOx8d6hC$}K$j}y%PDT2n!i@JqA!By+L{g$Z74I{< zMQx*PfodTV*LKxZSQfb506qikY8&2b! zOT7)}IZJH;8*X3MR@-pDh)R`TB=o>De3 zD)}df_Ywc+lK&dAD0W~jJ{i~C!i5vUCrw>nh z^jpuR8@p>7wh1J2)T3uB{tdPZb$=^`auxqTo^CytdgFA(v#5H=-97tGb$53MYZ?xr z3#9kC{_Eg}{F=2VC4|^2_dVAHM}_nIPK}IkO!ecTizJY%_$C=XrjMQX>Dlr8$qx$! z_>Ke2RXpfu`a`SfZrRl7XnNRcY5}P1PCN$V=xKnYJ1**7FY9A(`1B(;`g0YHtm`F@ z+oi4#vNJ1Y%T5E6(Mj3si?ZkDkbTJ^`>U(e6W?&?q9<4J7ihXQbg|}e9G4HNt4HdJ zsd$bOk^dp&5zegTJpLaQeKkoYL~KeEy|0 zO+HUT`PNX;=fR@SCuIYCz90v}c<8dN)5R1>aN-v-D>5Auqp~hDH1QPbNJcv(ENik%@M2li89SwWfU}i24oa7gGXVk9d)wZXesYh z>~f3UuGocOtudu%AIdxDl%5Oa^=xQLp%bTVgXw8Gn3fl6;UpKDLN}~MSuHB1;q<(o ztNQ0zQfFxCu??s*IozK%KQ&8kisWoVYAUx5UHdBJ>_cjrq-;ZKIwxv=blP(!>$Qed z1oCo7?I;eZT@u2O`V1gB^^1dOUG|~Z^lS##CWPDMC<2ptOiW`jtGEt&YQE(v7K16> zj6MSaq${7RcxS1?!F7<~?fW&4(KNi%B65O_f6}R$D=9rzRJvU$y<%PT@%*LtX-I~q zXb8QIx)pN(E4r+`a7xc68qbBZ(Z=)ok+s9s0TDj3YLE!tG?FkKjpi~!y}i>8`u9UJ%5F>SHju%w`JdMF4VoI51+y_#$@I# zJ$G*-u0W#EAI?P^>%*u8!a1{XbvQTJxDNNmrc*TyLzIO7#Pfo^@C_5%75OS$km2cq zx$;?hZC1}Mla+W5%Hertx{!HCJ)v07O8K`bHhM~=XJ@YntcnK6hvx?0ZJnUk;&|!3 zLSYcJA36LJ&sxho|(@_7`;W9XlJ zkzjk?52O&aKZBzO{a$Xj4PO5hPhVjS3D)bIXrQRZ9xuQ(y z!vd9jL#L$tPEx4?ruP*p{LN>D#fm_MCTomWDxTl_*dKpuVIF^0%l@2E@gr}NXTMX5 zKcU){yZ>{-->cn@?pD{OThaR!eN@qJD*8P|f1>DVMPF6)O-0{V)a~bvmX_ZNtnS#K z=`%C8gyVgYR5GwBxFxu8?fQ%aH?OgHA%f|Hy=G)TsF|{857+S7FqY~U!M>y!3pQ_U zU28@TDDFUCCb&Nn#|P_RM%aw>#=GD! z2{SkarESa3{xqb!lD)mLKGU7HkImlz4I0`!-kQ7`xY9lg`X9kwc-}JhX;f&;vwpi* z16SI|5RhEyw4hX#we>jL^-ZrPaZ?#=lw9fL*58IE{N<8l|Hr(V6h5W^j=#80$kx(n z7pk--u>MJ}1`hv6D4o%|Zs};a<5RpZ7i&;VcE!p+8g_>;Bl>VsXN+-XnGCd03t}hm8 zmV{c!_ws`6(o?MX4k~tizEAB{4ysvDQFr{ul|JXcN8RUol)lToyjFIT-*@Trz8~HX z6txSZ?)Lu^m;O2B|D5uFlsacCeEk?2MTJE8zRCNecz+P*ndRO3<1T&rl1*i`+CTNb z>Hj@s?f&U2HkBr&@Al{B{}Hk@R5*UV@A3Yv-~XKWg5vY86R*I1 zO0z?7LhH zTZ2zj3tmTUFtSr4cztx@{^GtzC%#nhdgjDyi~Bj9_%f_JopwmpefUbj>x#Y6hqnh_ zFP!*wg4Y2jzM}YE;l%3&&s!(HQt*6q;@8_*S-0jvmAKiJPnur~#5)DI0zFrFu;Y){ zYi_6c>JhW^&?NEMc?bdbiYn3O@=N;$J)#sp&zt)c-mlgfo{s~{&Zx^yx%dxBJGCO< zx?bOq_)^hRtD#mZPonCX<2wEsaEd>m?t82;hRR%dds*69DF$5e|BJ$hT=*Lbf6Rqj z>-I`9qHw-1UxYmE#H@4m>#DRfd%VeSb92bAM8Z8{_ISGmcrE%%yVj`i+WC2jOUQBB zT?X$igFg&BfVXS+cs?TKt3=fjP1={=BvE@3xF6%wJL*`dy?9k1d#`E+w znzSUpg`>7q;9`<~{VA%i(`!}XFE`JaOH(i<^T@qwM0gc(5&cI zMO(x!_@O^9j7TaKIcUVN3ESBA+q;@~wzfE1P zk|4Kbccn9i{PTl0Wow#!SGL;I?EZ)-DU7O0C>T+kg6EX~2c&;t&XiF!J9_(gM#Dvj$ zCpr<0_ZgXV%-Y`Wwp7fV{0qt2?Cz9F$IOoYQt0v$sjFe&Um=wxxf`Ch-qT)tr;)if i>USk#k-m<8xwYOY-Kz#p$*UEe1;=A4LEH76I{yv4q@@r5 literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/matrixMultiply.c b/finalExperimentRuns/threading/matrixMultiply.c new file mode 100644 index 0000000..9f69324 --- /dev/null +++ b/finalExperimentRuns/threading/matrixMultiply.c @@ -0,0 +1,203 @@ +#include +#include +#include +#include +#include +#include + +#define RANDOM_MAX_VALUE 100 + +static int **matrixA; +static int **matrixB; +static int **matrixC; +static int N; + +void setUpMatrices() { + + int i = 0; + + matrixA = malloc(sizeof(int *) * N); + matrixB = malloc(sizeof(int *) * N); + matrixC = malloc(sizeof(int *) * N); + + + + for (i=0 ; i8cy2pxvfT=maVH(qzjEZb~RE0|LHmcQ?)AW;e6@ z7E=UFZ9&$h5*R=5yQAo!j$=m|t)h}pG>oEvIAc}*2oBYajbj)JjaXQJ=e~P(-+S2= z`NO}=-Pw2U`Q3BQJ@>r(?tLHUqoMG2PhFkh;t}r^#7!*GBxD_hn0}jN71k-12~Aum zE)YwAG~lnv7NS;->AW({v{A`uq|m<0=_taml^$j|?_u%A0sf3@OLRO4f+Sg|pg*t4Z$V=}fO znMmbEH;i^}*|4P}m`w*a%W;$YBzwh<-O?qFV+%O)xfy?&1Js^+qV%rae{FrS(Ddvx zqG^2X;g25BNtgeq{@3LbkW^E^q0?FekJrFQYv3QKfp-D-<9icXGoI;AMzYy>Rww}@3NbTYW^Ya> zQo=Cy4yRK_){JCK!yt1}GPFfxGm%tGn2BL1WD+TJPz*^TbmqW(FjGKk*cTnSSt_{@$B^=7W0v&-#HE=K6Q_PEAa# z)Pz1Y*(S-<^m0uU_d@X0__&U->xG7y7QfK%oG?A5r{&Pc?Pa%~KXDBSj$N*yBawUm zBW+mnq4plI`u>yaiJSbFS3hvFPQUbcHZZtyU5`KzC+hTk!#NNtHUC@+6&jY3%B9CM zfBr?oOX#$Yy1U_~V}pZ(!IkR{VhE&n`H^$c5A|!VJ}M#j)_BvSo#?1EebX_!cjMzE z2lsqap)*o8THiW?Q>{-wcU+2Wx5bLbD3p) z<)Pci(~3C{b+wIDqPL&X3r$vc`TBplWiFI5eURDOD!a|sKjoHr^)<3%$x!!j|0(p{ zKvOIqIx}P9ywqcI4OpB1dNbgCpOT5=FNom;ruVIWk`ESe>HyR`K-v z)kF4i2}`9y=u~+I(2j`+o~jZ-71&c0SRT*H?{@6B2V72F8t2yib*J-N_rtWB1gB;` zU6}-xnUSb~mC1fNKw2Qm>jTes_n76?k06!Zf0L)B?5><2TV8#m`Oz#T7R(Rp!u(JE zE^w5tGz6})ZWQV#X+63BpR^8GxD{jzztx6YUR(Gc;PzQUSDLOaR=GZr9(ZXB_BSiu zT4Sb)Zzo=^EB5tR#yfxe{8UKIsyVoe<^T41J%4*qq4sHW2+dO=DOCu~l}|^+8s(f` z=qu{cWv)vSG>S`rT-m`#V^g{#9OQURA`oz^k|3LQT~D*<#h1|Na*>{w0qg^w(#S{n-Rxi9MeM? zD1>IqQMjHA{*260(GNAZ`mi5E0)wALP><*9?^V@lee!v)UWe_WZ#G;A9S7^_t$QMz zpDf;enr7$kpr%GYJM&o#v`T+L>ZQ_O6de`%rm_1>7QZHqJZ(4fn4B>f8fHf`nsw?H z^+wc-?O5k!Br!+YD!Z_rPX>;M^Rd9RerUt9EBqpSsP#!Az>DF$8JG*_ZwnyEHwJKb zG20ow=tNikwch+I`s8cg-u&;2A9)2G-T8NO?WRA`eiqKZ8qUAclmACosrfnmz%krY zoXq`AFWeZwtx7WB3m0O6mN07maKQ|$4;O9=w85iJY=&bL)0e8;AISR`+_7}RFa5xL z$z1aYJ?5(Wl#`9P?smdH2jZmGnC)m_lEv~e7G0N7gmhtTg45?JBezM|#Im1lpraZJ4L{L3zG z54@dVlIg*J8bgpvPS*=Ur z`{RK7G5)XDXnz6tG}<4o(O!>!#}K#Q)MyW&y$x}c563S51JLO~`vBsbC;hAMX}D{N zu|hkr^j^;=y@%>O*R7zNXo_!mc&2Rs^)^0(bNuf_B8 z+fk3j<8f4$FDT02JX#cgj-pJws#07xAZz^0BVX76;pa~N26LX07s_A8i}jjp;cqhB zAAN|R!aQDh%key<-j#CS{S8;n&x!|5$0^he2F%cwg zD3To#!PveO>{-;zSS`v~2VvFoQ!-+P3WM$wE4s9v+UTO!wJ%^ZW%+ zp=+DxZ>L8CSIOI;_bT?n>i}c#K!vU$*5BpPz*X`h{F192>MK=Q+k~TC-}Gn_HF+~M?D%iA&x4bQw^BbDXOwQ zuLsuxqcw>2d0m@R3lpzn5Rt_lzYhYXHH7tf-MB{$^n9hq{<9p@522mbB<6WtdPwPO zN}v2E8TMbn;#O2hl=XQXEGm5-C-=|#j30FA^Sa6lJ+H&0PkV)1|C7KdCgdL#-bdzC zhun|VYWd1_qVz7zuJ2o-5iESlpnRt&5$oVnb*7&JZ`Yqt`V&fD=MBK6r&#fMmp<=% zjjDqcEU2goYZ*O^8uicdZ&CYZi_+))j}_ed54rR?kBIY&VyvjBTmJ_x{kv8FcdPyn zl5@7g=Z~QYR7iyPVa~VWd?SuC%e(cbT>A87oyvNZkM&0S^e)xjKYdlF(y8>_{ki#P zAxo#4{pWp@^T7_Q@$>v-efH})=-T_|Je28mXh30ki>vUAKaU2xKHtX_mHrSbD$06H z|K`%~_YX+Pe!nE;d>M+F^|70PYN^JfUvz-irEW{MmnASLpJt*8h6im{8Wa z8r}U{Qq_-MjIz_CEoh`1DBdUSjb3=d`=1l9FW)~q@doTunjMmLFJ?6FL-s~5c3R$F zoOq+)eZz?_6TBZdaonXhXm&`}z1T^4{kAuHvGVh}?8KLs^H81m3c>5B6JIHKeRSf! zavr4v0Th9(JCNnbbZx}7fTKh4BZ#iA+wOzYi_?-;tS)@De;AI z2mz;leM>deD&+=L>qNzWzHV+-_>fv>_<9@#PIkszc53;5P}*57{I2-lC-GIHakYk8 zrF;d|x+>@K+rX*cr;$!(FOy)Z#qGDiXsq0$=565!b2n%OdTB zi^@92^Jg3I)huMAlwVHgi_#sbAuZ`yGhIJfrONH)#@hSjqgMhMkj2{>WLD{0Sw0 zM&b+i9go+F1LdPoq5DKC%O!5r9mgn=nQf`hBAPL?W)7K8QRFsv@49NI5$?Ta7c!y^ zqsPHr*==izrH#GG^qxr4kk9i*BsVJXtUi*AoAFq1%O&lb1T`3m*eG%B$daa40~t7}_0L_v`0-qCE% zkZ(CC*;~`>+1}0^b7vd9$gonytyJ=z@htrAlkN&5F5hz~yNP5{;!#RlmucrtQxfY< zjpQtK5>qFLgXPLgcdE;zb|+*QHuqfF@Mz1XjUgn$C*#8Cy$XYfB~nHXZ>3~ryxUSa zNb;6ywlDAV7m^KYhDcZUD~ literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/matrixMultiply_new b/finalExperimentRuns/threading/matrixMultiply_new new file mode 100755 index 0000000000000000000000000000000000000000..1bdd9f3fc5a6c1a4fab3b06f72c303572a51f038 GIT binary patch literal 13352 zcmeHNeQ;FQb-%ldKzwQu5M&@>TMG|P!fJ9#qMQ6apOWHNpHs|DGZ?b(N*(?q(NM}z z4Qe{>pHPd{RKQiZM93BED?+#FIQDBQcEpmMq3sN9C-j&OOsMpa`bJla_SfP!z!7f{ zQ5*SQp`=S?+j%QN^_S-|3uk%wh7=;K0%GaxonEj54Z}>A+_>@NEu!wgWf&E>sua z1yKAN(ol@dgp0nPSDz@|_@iq=sDe4 z!2A*71H?bU{MU%56pb8X{wu^&YDNw-e;@Ibl9Bz)XNafAGt$HSZsI95BW=v@Af8e( zvW@vWh^JJH7~ogE(VTzji)Q{6v+vc5+gh53270jKnnQ!bK_Wxz=NPKE3yPNxAEq3b zg{mLcg_QZ#0n1-H!znoIEUjk#{H>(8|FhL-NageufZR_1(`mprO+6-6swomYC{>A{R)ZQ1wl6eAFBq4w(6&V*mT4 z6537yEL45TCHk%{x{XC`F40$PQ4>JzcjQ4hM^8hf-Fm@n{}*%cm4JC@Nw82=FSdSa zaTD7HpnGNE)w*NAI6Br{RMtH=j_zrf?r-0to&@?L7kq`Pe}HIx8@yQgw&*W$52Pa8#s!h^v-w2EL3{yr{1!^{NS^@@SyT1 z|M2?YWq9k*u68E^!!$S)8AG?w$165rZnRDFqn|^Fw{VDKo(^BJdB5p9Qwa8-#-z!g z#iQjBSiJ5EwS5I`e~R0_viF(iY04Gfc$WlY5X@u2*xqmG2;6O+UqEU3NNxTjyQVh# zVZ1(4ZgWq$%|}^)HecX@Fci7u=yW*+437LKXNA)-GQf4t(8%{tM^d72RcO8BNs11b zl42GXEGL~U(0Rce{7u00oiYoxg)Pt_9y+HAGoba>d}!sM^^Q6C8noUbtsK%zJha{_ ztcKRhq_q!d$sGJ|Xk8|)eegv*v@REFYySSM?^Hf$=lv<@BL_7HY0)a3_c$D&6jlhHVG zKLD*ls~&*J1lYga|7ty z05&mfkesgrV_3AR!Z36%tc9vYz$$yspF$5wLe6;k9sLs|OQa{vz}@ExRU>nq1~b_J zOFXS?FG93FQrvs0P<6tkb^Z_Rc6cJU!-c9NE`z7oK)bzH+}f+zb7<18{S?nxwuWbT zQQ!@Ab2#hnSbfo=xjs% z6GGu9aO54DRkRU47Njg;Bm4qSd`jFm7{ZqDX+V;sX1&vmu5yOKEmd}No^9nu4wV~e zvK!g^bNk7xwHw&`xHw&HuI8cLMKl zqq*13!d>+k`RV##w2-K;i=q~a7OeW^(Zb&Pl@!y7nx*^c$^5<&8pkLvB=lnW;4BRE zzOj;Z&2jp-gnlm^t;Tz10q=`rrQDnP4bXlU<^B_Lf_|I$RcKivL~ZyM2R_pVig$FC zzEmph1r6ds{Qz_^#`$T`dW>n>=xAM=kGJ#nSe(~_{sOcGv=<4rK$FVlio&L38Z%>>{R2N;Qjul*;DWA3;0Lj3=kF4OXJ#%_@_JdZi3$BiXOH32(IPm zAOBDjfBtt_iR4e=sz$#TIQ;~IK2jk0%edZy{2*vK9{&Sn`%8dR$k&rD`A^F7`S5!M z@;6-aBFm{CYaxFD`TcA9^&|1!(H97O+0Qy;MtXNa&!m?=0&Y22b^p}Z9HVdA*ZmI# z4o&gjK8JEMAJ+lsJpn!E?@uzBERz|S%)n#@CNnUZfyoR^W?(V{lNtD^8Nh2k7qRp5 zg5wpGiTIGGXexw0EKn&fZDT6$%GEkxdXJ_e-+UI@tO`{bTob%n^YXhy+LLcB!sDOS+@F&= ze&mgLY4@V$AJ=l--2Xd~@73OhZqv_Yr>6I4dcUUM)b#H(eOl9BYI;`F*ED@cQ*S$) zo0>iyTHd-N*Jb5yh^D&YneNcq@VfAt6{~U#-gv#uD;3V}>9pcIK&^~TJEVrshRIBi z3U_r|$#CO_<`q_am*#eL<-$91DSVJlB~+NWj(E01g%f+a;LoO3#+KZZ%w$vDT`ndD zStgl|lYy@Fq%9Rrb)|5(lD)X^1Or)jB5uW1IN1@~nTdBMV;u?D3a7&DR(B?g25qvt z9YXkwcc$9WU^m?07G~eJpB-6fw|94TCc7+e+CDPB7#1|NWxO@`4RDon7W6yUS!CV{ zb}cG2=Ec6nZ-A?uV+b);dgdxOul+`d@Ke8A+CSwU`!P3fYE2^|6h<(4`0H;*H2Da%A)4D=c?|i-u7_Av%FY8dX4pi11sBrP-?~6cb z&WpXw^T)NlH-6C*`sc8xHAHw>M^0*cgIl%Fq>zrpuVHl`Dx@m*<#kIZOx7uH{sceZ zv6po)qzz=B%RD)%PwjW@watrFJ z&_}>K?bS5H*3b)izic2LJI$(ZqvEueeX4)1tuaRwHTA}S3^>_K{!i+C?xePt{X(1b zvywW|$8b6A<=l^)2TC}VQTMk0w8y@o)?kZ z^u6{&9(($dO=Y=0KlMTOFGAPZK7GZe(xC0V?Roisg)R*hiC^|TIlpyG_g}`R*h^f$ zhOM)GITtd#6ao~{x48;0_-`O^+RJ-KQQP;3p{8Od^mUK@?V&c-ygkIEe165|D(wq@ z5f$T2xYyYC|P=iP4ZQpKX{Cfb=Hu#OJgmfZF_DQEO zfJkKjbK_IW@4Ifi3j37dgt#8Sh?afGDGXqzmHowyS1Z{!-1u}Q`+*yuQGVZb<1>}4 z-)?-Cl6BdQjrK$$I9-Ys=?3-S|ALJ8e#g z>jC`tT-Ft*Fo0hVvR=6Hk11IP-1x%s?+Q0wr)1u`@oSXKM>oF6$#UJE2eZ|uJo%*g zHATHy@*2>4g%2nGWW5$S%~zkgIu8wuU!8{taKDJ#;uSI|9 z)EX68JDV71$aQO-0N*_Uen0RKeqDRV^TVt^Tg{$juz&t$hT8Xm2Qfaq zg!c2hYTFNguN_|Eiu} z{0$X0j{>LsAN9oZ1Fi2}pMR|Nz0d0ztxxA4sqi;T(B~Lu$aOmlJmf-b=5_7oFZDQi zQtP}mfuAV>dpwWLFj$kn)uOh5@vHZv#af?^K2YIrub|g4&XD`ojzhaT)Qr?Ct?>U8xRuVhl}Yt( z$)&ASPkK+RD|s&>x4}kDH)z_VwxTWi2SzNO$;9`>k~oMR+xUg8ja!DEX~tfg^7G(w5squK4*T#Ww#LI<-A!+A1WpX>I3_Gxl`Sllh6e|*?y zz3sE$+ml&zXbX2u#ghDg5#3lSoo2k9&Y$zSakneRn!6A}SxrAV$)e|Ax!asir@Nt8 z%n_dFSUY6d?pOy-w5O9Q)_gNMkw|sLa@nMP#NF$uoH_nCl6~Oat&>e!tv!{{`4Q=- z5yO9mbe8x;yd1x$^Y(5h;~my-PbcGDtv!6a-mTrK2T!F{J31RqB{PbS?7MCL7YvC` AE&u=k literal 0 HcmV?d00001 diff --git a/finalExperimentRuns/threading/matrixMultiply_new.c b/finalExperimentRuns/threading/matrixMultiply_new.c new file mode 100644 index 0000000..f20713e --- /dev/null +++ b/finalExperimentRuns/threading/matrixMultiply_new.c @@ -0,0 +1,240 @@ +#include +#include +#include +#include +#include +#include +#include + +#define RANDOM_MAX_VALUE 10 + +static int **matrixA; +static int **matrixB; +static int **matrixC; +static int N; + +struct threadArguments { + + int row; + int column; +}; + +void setUpMatrices() { + + int i = 0; + + matrixA = malloc(sizeof(int *) * N); + matrixB = malloc(sizeof(int *) * N); + matrixC = malloc(sizeof(int *) * N); + + + + for (i=0 ; irow; + int currentColumn = threadArgs->column; + + + for (i=0; i branch-misses - 0.001220843 seconds time elapsed + 0.001226038 seconds time elapsed Iteration 2 Performance counter stats for './matrixMultiply_clang 10': - 0.260170 task-clock # 0.323 CPUs utilized + 0.263159 task-clock # 0.297 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.484 M/sec - 791,246 cycles # 3.041 GHz - 483,075 stalled-cycles-frontend # 61.05% frontend cycles idle - 321,165 stalled-cycles-backend # 40.59% backend cycles idle - 546,129 instructions # 0.69 insns per cycle + 127 page-faults # 0.483 M/sec + 791,625 cycles # 3.008 GHz + 482,299 stalled-cycles-frontend # 60.93% frontend cycles idle + 319,678 stalled-cycles-backend # 40.38% backend cycles idle + 550,734 instructions # 0.70 insns per cycle # 0.88 stalled cycles per insn - 105,385 branches # 405.062 M/sec + 106,158 branches # 403.399 M/sec branch-misses - 0.000804638 seconds time elapsed + 0.000886637 seconds time elapsed Iteration 3 Performance counter stats for './matrixMultiply_clang 10': - 0.265903 task-clock # 0.296 CPUs utilized + 0.263879 task-clock # 0.315 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.478 M/sec - 800,185 cycles # 3.009 GHz - 489,441 stalled-cycles-frontend # 61.17% frontend cycles idle - 292,939 stalled-cycles-backend # 36.61% backend cycles idle - 553,591 instructions # 0.69 insns per cycle - # 0.88 stalled cycles per insn - 106,658 branches # 401.116 M/sec + 127 page-faults # 0.481 M/sec + 801,437 cycles # 3.037 GHz + 489,881 stalled-cycles-frontend # 61.13% frontend cycles idle + 298,681 stalled-cycles-backend # 37.27% backend cycles idle + 552,821 instructions # 0.69 insns per cycle + # 0.89 stalled cycles per insn + 106,287 branches # 402.787 M/sec branch-misses - 0.000897592 seconds time elapsed + 0.000838731 seconds time elapsed Iteration 4 Performance counter stats for './matrixMultiply_clang 10': - 0.261262 task-clock # 0.266 CPUs utilized + 0.261170 task-clock # 0.325 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.482 M/sec - 793,774 cycles # 3.038 GHz - 483,727 stalled-cycles-frontend # 60.94% frontend cycles idle - 330,050 stalled-cycles-backend # 41.58% backend cycles idle - 550,492 instructions # 0.69 insns per cycle - # 0.88 stalled cycles per insn - 106,129 branches # 406.217 M/sec + 127 page-faults # 0.486 M/sec + 794,662 cycles # 3.043 GHz + 483,324 stalled-cycles-frontend # 60.82% frontend cycles idle + 324,726 stalled-cycles-backend # 40.86% backend cycles idle + 552,409 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 106,457 branches # 407.616 M/sec branch-misses - 0.000982477 seconds time elapsed + 0.000802414 seconds time elapsed Iteration 5 Performance counter stats for './matrixMultiply_clang 10': - 0.262448 task-clock # 0.325 CPUs utilized + 0.259817 task-clock # 0.203 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.480 M/sec - 798,906 cycles # 3.044 GHz - 488,680 stalled-cycles-frontend # 61.17% frontend cycles idle - 331,857 stalled-cycles-backend # 41.54% backend cycles idle - 551,880 instructions # 0.69 insns per cycle - # 0.89 stalled cycles per insn - 106,196 branches # 404.636 M/sec + 127 page-faults # 0.489 M/sec + 789,490 cycles # 3.039 GHz + 480,273 stalled-cycles-frontend # 60.83% frontend cycles idle + 338,648 stalled-cycles-backend # 42.89% backend cycles idle + 549,001 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 105,856 branches # 407.425 M/sec branch-misses - 0.000806293 seconds time elapsed + 0.001277214 seconds time elapsed Iteration 6 Performance counter stats for './matrixMultiply_clang 10': - 0.262853 task-clock # 0.198 CPUs utilized + 0.259312 task-clock # 0.237 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.479 M/sec - 799,558 cycles # 3.042 GHz - 487,996 stalled-cycles-frontend # 61.03% frontend cycles idle - 325,493 stalled-cycles-backend # 40.71% backend cycles idle - 550,468 instructions # 0.69 insns per cycle + 127 page-faults # 0.490 M/sec + 788,093 cycles # 3.039 GHz + 480,367 stalled-cycles-frontend # 60.95% frontend cycles idle + 337,791 stalled-cycles-backend # 42.86% backend cycles idle + 542,295 instructions # 0.69 insns per cycle # 0.89 stalled cycles per insn - 106,139 branches # 403.796 M/sec + 104,332 branches # 402.342 M/sec branch-misses - 0.001325592 seconds time elapsed + 0.001092917 seconds time elapsed Iteration 7 Performance counter stats for './matrixMultiply_clang 10': - 0.261662 task-clock # 0.194 CPUs utilized + 0.291974 task-clock # 0.199 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.485 M/sec - 795,241 cycles # 3.039 GHz - 484,709 stalled-cycles-frontend # 60.95% frontend cycles idle - 318,825 stalled-cycles-backend # 40.09% backend cycles idle - 552,907 instructions # 0.70 insns per cycle - # 0.88 stalled cycles per insn - 106,529 branches # 407.124 M/sec - branch-misses + 126 page-faults # 0.432 M/sec + 202,297 cycles # 0.693 GHz + 553,682 stalled-cycles-frontend # 273.70% frontend cycles idle + 387,858 stalled-cycles-backend # 191.73% backend cycles idle + 548,059 instructions # 2.71 insns per cycle + # 1.01 stalled cycles per insn + 105,755 branches # 362.207 M/sec + 7,631 branch-misses # 7.22% of all branches [73.27%] - 0.001346394 seconds time elapsed + 0.001464449 seconds time elapsed Iteration 8 Performance counter stats for './matrixMultiply_clang 10': - 0.260743 task-clock # 0.229 CPUs utilized + 0.260737 task-clock # 0.142 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 127 page-faults # 0.487 M/sec - 792,813 cycles # 3.041 GHz - 482,015 stalled-cycles-frontend # 60.80% frontend cycles idle - 325,041 stalled-cycles-backend # 41.00% backend cycles idle - 553,391 instructions # 0.70 insns per cycle + 791,866 cycles # 3.037 GHz + 481,917 stalled-cycles-frontend # 60.86% frontend cycles idle + 338,794 stalled-cycles-backend # 42.78% backend cycles idle + 554,114 instructions # 0.70 insns per cycle # 0.87 stalled cycles per insn - 106,659 branches # 409.058 M/sec + 106,770 branches # 409.493 M/sec branch-misses - 0.001138278 seconds time elapsed + 0.001834688 seconds time elapsed Iteration 9 Performance counter stats for './matrixMultiply_clang 10': - 0.261250 task-clock # 0.323 CPUs utilized + 0.265581 task-clock # 0.269 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.482 M/sec - 794,471 cycles # 3.041 GHz - 483,254 stalled-cycles-frontend # 60.83% frontend cycles idle - 299,255 stalled-cycles-backend # 37.67% backend cycles idle - 556,212 instructions # 0.70 insns per cycle - # 0.87 stalled cycles per insn - 107,136 branches # 410.090 M/sec + 127 page-faults # 0.478 M/sec + 798,282 cycles # 3.006 GHz + 486,961 stalled-cycles-frontend # 61.00% frontend cycles idle + 343,026 stalled-cycles-backend # 42.97% backend cycles idle + 555,199 instructions # 0.70 insns per cycle + # 0.88 stalled cycles per insn + 106,951 branches # 402.706 M/sec branch-misses - 0.000808962 seconds time elapsed + 0.000988402 seconds time elapsed Iteration 10 Performance counter stats for './matrixMultiply_clang 10': - 0.260392 task-clock # 0.312 CPUs utilized + 0.260504 task-clock # 0.180 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec 126 page-faults # 0.484 M/sec - 791,548 cycles # 3.040 GHz - 480,852 stalled-cycles-frontend # 60.75% frontend cycles idle - 335,540 stalled-cycles-backend # 42.39% backend cycles idle - 553,631 instructions # 0.70 insns per cycle + 792,825 cycles # 3.043 GHz + 482,255 stalled-cycles-frontend # 60.83% frontend cycles idle + 333,878 stalled-cycles-backend # 42.11% backend cycles idle + 551,967 instructions # 0.70 insns per cycle # 0.87 stalled cycles per insn - 106,679 branches # 409.686 M/sec + 106,390 branches # 408.401 M/sec branch-misses - 0.000835158 seconds time elapsed + 0.001444313 seconds time elapsed diff --git a/sankalp/clang_output_10000 b/sankalp/clang_output_10000 deleted file mode 100644 index 78f379f..0000000 --- a/sankalp/clang_output_10000 +++ /dev/null @@ -1 +0,0 @@ -Iteration 1 diff --git a/sankalp/clang_output_optimized_10 b/sankalp/clang_output_optimized_10 new file mode 100644 index 0000000..62f3d83 --- /dev/null +++ b/sankalp/clang_output_optimized_10 @@ -0,0 +1,180 @@ +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.254738 task-clock # 0.186 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.499 M/sec + 773,561 cycles # 3.037 GHz + 467,851 stalled-cycles-frontend # 60.48% frontend cycles idle + 310,294 stalled-cycles-backend # 40.11% backend cycles idle + 535,991 instructions # 0.69 insns per cycle + # 0.87 stalled cycles per insn + 104,877 branches # 411.705 M/sec + branch-misses + + 0.001369651 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.253462 task-clock # 0.312 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.501 M/sec + 770,150 cycles # 3.039 GHz + 467,124 stalled-cycles-frontend # 60.65% frontend cycles idle + 321,201 stalled-cycles-backend # 41.71% backend cycles idle + 537,198 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 105,085 branches # 414.599 M/sec + branch-misses + + 0.000812752 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.252371 task-clock # 0.313 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.503 M/sec + 767,605 cycles # 3.042 GHz + 462,629 stalled-cycles-frontend # 60.27% frontend cycles idle + 328,909 stalled-cycles-backend # 42.85% backend cycles idle + 536,671 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 104,982 branches # 415.983 M/sec + branch-misses + + 0.000806311 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.255736 task-clock # 0.336 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.493 M/sec + 762,557 cycles # 2.982 GHz + 460,565 stalled-cycles-frontend # 60.40% frontend cycles idle + 323,600 stalled-cycles-backend # 42.44% backend cycles idle + 538,377 instructions # 0.71 insns per cycle + # 0.86 stalled cycles per insn + 105,324 branches # 411.847 M/sec + branch-misses + + 0.000760748 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.256619 task-clock # 0.325 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.495 M/sec + 772,169 cycles # 3.009 GHz + 465,669 stalled-cycles-frontend # 60.31% frontend cycles idle + 306,523 stalled-cycles-backend # 39.70% backend cycles idle + 541,471 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,836 branches # 412.425 M/sec + branch-misses + + 0.000790370 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.252237 task-clock # 0.135 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.503 M/sec + 766,577 cycles # 3.039 GHz + 463,314 stalled-cycles-frontend # 60.44% frontend cycles idle + 326,037 stalled-cycles-backend # 42.53% backend cycles idle + 538,054 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,236 branches # 417.211 M/sec + branch-misses + + 0.001870156 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.260936 task-clock # 0.320 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.487 M/sec + 779,990 cycles # 2.989 GHz + 473,885 stalled-cycles-frontend # 60.76% frontend cycles idle + 324,297 stalled-cycles-backend # 41.58% backend cycles idle + 539,619 instructions # 0.69 insns per cycle + # 0.88 stalled cycles per insn + 105,485 branches # 404.256 M/sec + branch-misses + + 0.000815701 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.246294 task-clock # 0.338 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.516 M/sec + cycles + 443,508 stalled-cycles-frontend # 0.00% frontend cycles idle + 317,155 stalled-cycles-backend # 0.00% backend cycles idle + 542,075 instructions # 0.00 insns per cycle + # 0.82 stalled cycles per insn + 105,925 branches # 430.075 M/sec + 6,517 branch-misses # 6.15% of all branches + + 0.000728607 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.242933 task-clock # 0.293 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.523 M/sec + 727,267 cycles # 2.994 GHz + 425,098 stalled-cycles-frontend # 58.45% frontend cycles idle + 304,182 stalled-cycles-backend # 41.83% backend cycles idle + 537,280 instructions # 0.74 insns per cycle + # 0.79 stalled cycles per insn + 105,121 branches # 432.716 M/sec + branch-misses + + 0.000830440 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang_optimized 10': + + 0.256732 task-clock # 0.216 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.491 M/sec + 768,563 cycles # 2.994 GHz + 464,524 stalled-cycles-frontend # 60.44% frontend cycles idle + 330,887 stalled-cycles-backend # 43.05% backend cycles idle + 536,485 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 104,979 branches # 408.905 M/sec + branch-misses + + 0.001186233 seconds time elapsed + diff --git a/sankalp/gcc_output_10 b/sankalp/gcc_output_10 index de1da14..d533c09 100644 --- a/sankalp/gcc_output_10 +++ b/sankalp/gcc_output_10 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for './matrixMultiply 10': - 0.266541 task-clock # 0.194 CPUs utilized + 0.264216 task-clock # 0.234 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.476 M/sec - 807,616 cycles # 3.030 GHz - 489,993 stalled-cycles-frontend # 60.67% frontend cycles idle - 346,852 stalled-cycles-backend # 42.95% backend cycles idle - 583,105 instructions # 0.72 insns per cycle + 127 page-faults # 0.481 M/sec + 801,618 cycles # 3.034 GHz + 485,598 stalled-cycles-frontend # 60.58% frontend cycles idle + 331,763 stalled-cycles-backend # 41.39% backend cycles idle + 579,543 instructions # 0.72 insns per cycle # 0.84 stalled cycles per insn - 105,807 branches # 396.963 M/sec + 105,217 branches # 398.223 M/sec branch-misses - 0.001377109 seconds time elapsed + 0.001130275 seconds time elapsed Iteration 2 Performance counter stats for './matrixMultiply 10': - 0.260838 task-clock # 0.259 CPUs utilized + 0.260784 task-clock # 0.312 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.483 M/sec - 792,688 cycles # 3.039 GHz - 477,943 stalled-cycles-frontend # 60.29% frontend cycles idle - 321,946 stalled-cycles-backend # 40.61% backend cycles idle - 575,323 instructions # 0.73 insns per cycle - # 0.83 stalled cycles per insn - 104,469 branches # 400.513 M/sec + 127 page-faults # 0.487 M/sec + 793,277 cycles # 3.042 GHz + 476,100 stalled-cycles-frontend # 60.02% frontend cycles idle + 334,152 stalled-cycles-backend # 42.12% backend cycles idle + 582,916 instructions # 0.73 insns per cycle + # 0.82 stalled cycles per insn + 105,800 branches # 405.700 M/sec branch-misses - 0.001007969 seconds time elapsed + 0.000836036 seconds time elapsed Iteration 3 Performance counter stats for './matrixMultiply 10': - 0.261618 task-clock # 0.283 CPUs utilized + 0.260142 task-clock # 0.341 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.485 M/sec - 795,541 cycles # 3.041 GHz - 477,412 stalled-cycles-frontend # 60.01% frontend cycles idle - 337,422 stalled-cycles-backend # 42.41% backend cycles idle - 582,806 instructions # 0.73 insns per cycle - # 0.82 stalled cycles per insn - 105,752 branches # 404.223 M/sec - branch-misses + 127 page-faults # 0.488 M/sec + cycles + 469,818 stalled-cycles-frontend # 0.00% frontend cycles idle + 330,664 stalled-cycles-backend # 0.00% backend cycles idle + 581,476 instructions # 0.00 insns per cycle + # 0.81 stalled cycles per insn + 105,525 branches # 405.644 M/sec + 6,383 branch-misses # 6.05% of all branches - 0.000924018 seconds time elapsed + 0.000763764 seconds time elapsed Iteration 4 Performance counter stats for './matrixMultiply 10': - 0.261609 task-clock # 0.274 CPUs utilized + 0.265972 task-clock # 0.264 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.485 M/sec - 795,911 cycles # 3.042 GHz - 479,407 stalled-cycles-frontend # 60.23% frontend cycles idle - 329,890 stalled-cycles-backend # 41.45% backend cycles idle - 576,865 instructions # 0.72 insns per cycle - # 0.83 stalled cycles per insn - 104,737 branches # 400.357 M/sec + 127 page-faults # 0.477 M/sec + 783,856 cycles # 2.947 GHz + 469,562 stalled-cycles-frontend # 59.90% frontend cycles idle + 316,315 stalled-cycles-backend # 40.35% backend cycles idle + 579,399 instructions # 0.74 insns per cycle + # 0.81 stalled cycles per insn + 105,152 branches # 395.350 M/sec branch-misses - 0.000954734 seconds time elapsed + 0.001005965 seconds time elapsed Iteration 5 Performance counter stats for './matrixMultiply 10': - 0.264603 task-clock # 0.306 CPUs utilized + 0.262319 task-clock # 0.287 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.480 M/sec - 804,473 cycles # 3.040 GHz - 485,108 stalled-cycles-frontend # 60.30% frontend cycles idle - 323,522 stalled-cycles-backend # 40.22% backend cycles idle - 588,043 instructions # 0.73 insns per cycle + 126 page-faults # 0.480 M/sec + 798,897 cycles # 3.046 GHz + 481,149 stalled-cycles-frontend # 60.23% frontend cycles idle + 294,473 stalled-cycles-backend # 36.86% backend cycles idle + 584,326 instructions # 0.73 insns per cycle # 0.82 stalled cycles per insn - 106,407 branches # 402.138 M/sec + 105,770 branches # 403.211 M/sec branch-misses - 0.000864057 seconds time elapsed + 0.000915591 seconds time elapsed Iteration 6 Performance counter stats for './matrixMultiply 10': - 0.260205 task-clock # 0.112 CPUs utilized + 0.261447 task-clock # 0.150 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.484 M/sec - 790,756 cycles # 3.039 GHz - 477,383 stalled-cycles-frontend # 60.37% frontend cycles idle - 310,137 stalled-cycles-backend # 39.22% backend cycles idle - 579,178 instructions # 0.73 insns per cycle - # 0.82 stalled cycles per insn - 105,108 branches # 403.943 M/sec + 127 page-faults # 0.486 M/sec + 795,646 cycles # 3.043 GHz + 481,327 stalled-cycles-frontend # 60.50% frontend cycles idle + 341,767 stalled-cycles-backend # 42.95% backend cycles idle + 574,374 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 103,651 branches # 396.451 M/sec branch-misses - 0.002318265 seconds time elapsed + 0.001741528 seconds time elapsed Iteration 7 Performance counter stats for './matrixMultiply 10': - 0.259797 task-clock # 0.330 CPUs utilized + 0.264455 task-clock # 0.300 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 126 page-faults # 0.485 M/sec - 789,876 cycles # 3.040 GHz - 473,244 stalled-cycles-frontend # 59.91% frontend cycles idle - 312,912 stalled-cycles-backend # 39.62% backend cycles idle - 580,156 instructions # 0.73 insns per cycle - # 0.82 stalled cycles per insn - 105,308 branches # 405.347 M/sec + 127 page-faults # 0.480 M/sec + 790,618 cycles # 2.990 GHz + 478,470 stalled-cycles-frontend # 60.52% frontend cycles idle + 330,579 stalled-cycles-backend # 41.81% backend cycles idle + 568,364 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 102,901 branches # 389.106 M/sec branch-misses - 0.000787977 seconds time elapsed + 0.000881953 seconds time elapsed Iteration 8 Performance counter stats for './matrixMultiply 10': - 0.260692 task-clock # 0.343 CPUs utilized + 0.259611 task-clock # 0.320 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.487 M/sec - 792,954 cycles # 3.042 GHz - 475,780 stalled-cycles-frontend # 60.00% frontend cycles idle - 345,732 stalled-cycles-backend # 43.60% backend cycles idle - 582,379 instructions # 0.73 insns per cycle + 126 page-faults # 0.485 M/sec + 789,701 cycles # 3.042 GHz + 474,512 stalled-cycles-frontend # 60.09% frontend cycles idle + 332,633 stalled-cycles-backend # 42.12% backend cycles idle + 576,821 instructions # 0.73 insns per cycle # 0.82 stalled cycles per insn - 105,697 branches # 405.448 M/sec + 104,740 branches # 403.450 M/sec branch-misses - 0.000759952 seconds time elapsed + 0.000811846 seconds time elapsed Iteration 9 Performance counter stats for './matrixMultiply 10': - 0.260917 task-clock # 0.268 CPUs utilized + 0.261265 task-clock # 0.147 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.487 M/sec - 793,729 cycles # 3.042 GHz - 477,328 stalled-cycles-frontend # 60.14% frontend cycles idle - 328,501 stalled-cycles-backend # 41.39% backend cycles idle - 578,107 instructions # 0.73 insns per cycle - # 0.83 stalled cycles per insn - 104,943 branches # 402.208 M/sec + 126 page-faults # 0.482 M/sec + 793,438 cycles # 3.037 GHz + 479,473 stalled-cycles-frontend # 60.43% frontend cycles idle + 320,606 stalled-cycles-backend # 40.41% backend cycles idle + 572,808 instructions # 0.72 insns per cycle + # 0.84 stalled cycles per insn + 104,034 branches # 398.193 M/sec branch-misses - 0.000975280 seconds time elapsed + 0.001780051 seconds time elapsed Iteration 10 Performance counter stats for './matrixMultiply 10': - 0.263182 task-clock # 0.237 CPUs utilized + 0.261124 task-clock # 0.302 CPUs utilized 0 context-switches # 0.000 M/sec 0 CPU-migrations # 0.000 M/sec - 127 page-faults # 0.483 M/sec - 791,537 cycles # 3.008 GHz - 478,876 stalled-cycles-frontend # 60.50% frontend cycles idle - 307,587 stalled-cycles-backend # 38.86% backend cycles idle - 569,014 instructions # 0.72 insns per cycle - # 0.84 stalled cycles per insn - 102,992 branches # 391.334 M/sec + 127 page-faults # 0.486 M/sec + 794,602 cycles # 3.043 GHz + 476,906 stalled-cycles-frontend # 60.02% frontend cycles idle + 329,122 stalled-cycles-backend # 41.42% backend cycles idle + 583,923 instructions # 0.73 insns per cycle + # 0.82 stalled cycles per insn + 105,965 branches # 405.803 M/sec branch-misses - 0.001110128 seconds time elapsed + 0.000863590 seconds time elapsed diff --git a/sankalp/gcc_output_10000 b/sankalp/gcc_output_10000 deleted file mode 100644 index 78f379f..0000000 --- a/sankalp/gcc_output_10000 +++ /dev/null @@ -1 +0,0 @@ -Iteration 1 diff --git a/sankalp/gcc_output_optimized_10 b/sankalp/gcc_output_optimized_10 new file mode 100644 index 0000000..ac95581 --- /dev/null +++ b/sankalp/gcc_output_optimized_10 @@ -0,0 +1,180 @@ +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.248266 task-clock # 0.177 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.512 M/sec + cycles + 456,214 stalled-cycles-frontend # 0.00% frontend cycles idle + 322,343 stalled-cycles-backend # 0.00% backend cycles idle + 525,274 instructions # 0.00 insns per cycle + # 0.87 stalled cycles per insn + 102,761 branches # 413.915 M/sec + 6,305 branch-misses # 6.14% of all branches + + 0.001399414 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.250526 task-clock # 0.158 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 126 page-faults # 0.503 M/sec + 761,374 cycles # 3.039 GHz + 460,669 stalled-cycles-frontend # 60.50% frontend cycles idle + 278,379 stalled-cycles-backend # 36.56% backend cycles idle + 531,203 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 104,155 branches # 415.745 M/sec + branch-misses + + 0.001584906 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.256776 task-clock # 0.261 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.495 M/sec + 769,126 cycles # 2.995 GHz + 464,343 stalled-cycles-frontend # 60.37% frontend cycles idle + 305,155 stalled-cycles-backend # 39.68% backend cycles idle + 537,950 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,335 branches # 410.221 M/sec + branch-misses + + 0.000984387 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.252672 task-clock # 0.303 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.503 M/sec + 758,151 cycles # 3.001 GHz + 456,805 stalled-cycles-frontend # 60.25% frontend cycles idle + 312,114 stalled-cycles-backend # 41.17% backend cycles idle + 535,170 instructions # 0.71 insns per cycle + # 0.85 stalled cycles per insn + 104,829 branches # 414.882 M/sec + branch-misses + + 0.000834122 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.256107 task-clock # 0.319 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.496 M/sec + 777,635 cycles # 3.036 GHz + 471,077 stalled-cycles-frontend # 60.58% frontend cycles idle + 311,009 stalled-cycles-backend # 39.99% backend cycles idle + 537,745 instructions # 0.69 insns per cycle + # 0.88 stalled cycles per insn + 105,304 branches # 411.172 M/sec + branch-misses + + 0.000803563 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.253460 task-clock # 0.266 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.501 M/sec + 770,539 cycles # 3.040 GHz + 464,693 stalled-cycles-frontend # 60.31% frontend cycles idle + 320,075 stalled-cycles-backend # 41.54% backend cycles idle + 535,462 instructions # 0.69 insns per cycle + # 0.87 stalled cycles per insn + 104,877 branches # 413.781 M/sec + branch-misses + + 0.000953846 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.257419 task-clock # 0.307 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.493 M/sec + 771,110 cycles # 2.996 GHz + 466,926 stalled-cycles-frontend # 60.55% frontend cycles idle + 338,319 stalled-cycles-backend # 43.87% backend cycles idle + 536,400 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 105,084 branches # 408.222 M/sec + branch-misses + + 0.000837879 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.251920 task-clock # 0.292 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.504 M/sec + 765,830 cycles # 3.040 GHz + 460,303 stalled-cycles-frontend # 60.11% frontend cycles idle + 311,031 stalled-cycles-backend # 40.61% backend cycles idle + 536,633 instructions # 0.70 insns per cycle + # 0.86 stalled cycles per insn + 105,101 branches # 417.200 M/sec + branch-misses + + 0.000862143 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.251167 task-clock # 0.329 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.506 M/sec + 765,608 cycles # 3.048 GHz + 463,671 stalled-cycles-frontend # 60.56% frontend cycles idle + 321,814 stalled-cycles-backend # 42.03% backend cycles idle + 534,394 instructions # 0.70 insns per cycle + # 0.87 stalled cycles per insn + 104,724 branches # 416.950 M/sec + branch-misses + + 0.000763382 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_gcc_optimized 10': + + 0.257385 task-clock # 0.271 CPUs utilized + 0 context-switches # 0.000 M/sec + 0 CPU-migrations # 0.000 M/sec + 127 page-faults # 0.493 M/sec + 781,086 cycles # 3.035 GHz + 474,101 stalled-cycles-frontend # 60.70% frontend cycles idle + 323,675 stalled-cycles-backend # 41.44% backend cycles idle + 537,279 instructions # 0.69 insns per cycle + # 0.88 stalled cycles per insn + 105,124 branches # 408.431 M/sec + branch-misses + + 0.000949143 seconds time elapsed + diff --git a/sankalp/java_output_10 b/sankalp/java_output_10 index 4bde1f1..e2ed670 100644 --- a/sankalp/java_output_10 +++ b/sankalp/java_output_10 @@ -2,179 +2,179 @@ Iteration 1 Performance counter stats for 'java MatrixMultiplier 10': - 73.814756 task-clock # 0.948 CPUs utilized - 157 context-switches # 0.002 M/sec - 44 CPU-migrations # 0.001 M/sec - 4,254 page-faults # 0.058 M/sec - 211,869,891 cycles # 2.870 GHz [83.29%] - 118,128,398 stalled-cycles-frontend # 55.76% frontend cycles idle [79.91%] - 79,711,925 stalled-cycles-backend # 37.62% backend cycles idle [71.12%] - 182,350,254 instructions # 0.86 insns per cycle - # 0.65 stalled cycles per insn [84.54%] - 35,144,284 branches # 476.115 M/sec [87.90%] - 2,037,718 branch-misses # 5.80% of all branches [80.29%] + 72.815106 task-clock # 0.984 CPUs utilized + 139 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.001 M/sec + 4,253 page-faults # 0.058 M/sec + 212,160,742 cycles # 2.914 GHz [83.64%] + 114,430,847 stalled-cycles-frontend # 53.94% frontend cycles idle [83.36%] + 80,787,912 stalled-cycles-backend # 38.08% backend cycles idle [62.53%] + 182,410,561 instructions # 0.86 insns per cycle + # 0.63 stalled cycles per insn [79.34%] + 34,469,054 branches # 473.378 M/sec [86.37%] + 2,054,782 branch-misses # 5.96% of all branches [86.95%] - 0.077889679 seconds time elapsed + 0.073987229 seconds time elapsed Iteration 2 Performance counter stats for 'java MatrixMultiplier 10': - 75.426543 task-clock # 0.977 CPUs utilized - 153 context-switches # 0.002 M/sec - 46 CPU-migrations # 0.001 M/sec - 4,254 page-faults # 0.056 M/sec - 220,055,780 cycles # 2.917 GHz [81.76%] - 122,029,915 stalled-cycles-frontend # 55.45% frontend cycles idle [87.61%] - 83,438,109 stalled-cycles-backend # 37.92% backend cycles idle [63.25%] - 184,216,236 instructions # 0.84 insns per cycle - # 0.66 stalled cycles per insn [80.25%] - 34,523,087 branches # 457.705 M/sec [86.17%] - 2,081,771 branch-misses # 6.03% of all branches [84.51%] + 74.167240 task-clock # 0.981 CPUs utilized + 146 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.057 M/sec + 217,762,691 cycles # 2.936 GHz [79.75%] + 119,247,170 stalled-cycles-frontend # 54.76% frontend cycles idle [82.58%] + 81,455,743 stalled-cycles-backend # 37.41% backend cycles idle [68.10%] + 183,508,037 instructions # 0.84 insns per cycle + # 0.65 stalled cycles per insn [84.40%] + 35,369,835 branches # 476.893 M/sec [85.66%] + 2,040,142 branch-misses # 5.77% of all branches [86.07%] - 0.077238487 seconds time elapsed + 0.075620599 seconds time elapsed Iteration 3 Performance counter stats for 'java MatrixMultiplier 10': - 74.246438 task-clock # 0.981 CPUs utilized - 145 context-switches # 0.002 M/sec - 46 CPU-migrations # 0.001 M/sec - 4,255 page-faults # 0.057 M/sec - 214,968,414 cycles # 2.895 GHz [83.94%] - 119,504,714 stalled-cycles-frontend # 55.59% frontend cycles idle [84.70%] - 82,353,595 stalled-cycles-backend # 38.31% backend cycles idle [66.94%] - 184,093,021 instructions # 0.86 insns per cycle - # 0.65 stalled cycles per insn [84.65%] - 34,534,006 branches # 465.127 M/sec [83.49%] - 2,022,065 branch-misses # 5.86% of all branches [83.13%] + 75.588706 task-clock # 0.981 CPUs utilized + 148 context-switches # 0.002 M/sec + 47 CPU-migrations # 0.001 M/sec + 4,233 page-faults # 0.056 M/sec + 219,952,171 cycles # 2.910 GHz [83.32%] + 123,320,418 stalled-cycles-frontend # 56.07% frontend cycles idle [85.04%] + 82,988,638 stalled-cycles-backend # 37.73% backend cycles idle [68.62%] + 183,258,921 instructions # 0.83 insns per cycle + # 0.67 stalled cycles per insn [85.04%] + 34,664,677 branches # 458.596 M/sec [83.94%] + 2,046,911 branch-misses # 5.90% of all branches [81.13%] - 0.075715403 seconds time elapsed + 0.077076913 seconds time elapsed Iteration 4 Performance counter stats for 'java MatrixMultiplier 10': - 75.395700 task-clock # 0.977 CPUs utilized - 138 context-switches # 0.002 M/sec - 41 CPU-migrations # 0.001 M/sec - 4,255 page-faults # 0.056 M/sec - 219,917,317 cycles # 2.917 GHz [78.13%] - 121,004,839 stalled-cycles-frontend # 55.02% frontend cycles idle [85.20%] - 81,215,365 stalled-cycles-backend # 36.93% backend cycles idle [68.88%] - 185,224,171 instructions # 0.84 insns per cycle - # 0.65 stalled cycles per insn [84.46%] - 34,656,814 branches # 459.666 M/sec [84.82%] - 2,077,280 branch-misses # 5.99% of all branches [85.34%] + 73.785766 task-clock # 0.983 CPUs utilized + 156 context-switches # 0.002 M/sec + 44 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.058 M/sec + 213,783,464 cycles # 2.897 GHz [83.60%] + 116,799,942 stalled-cycles-frontend # 54.63% frontend cycles idle [78.27%] + 77,769,074 stalled-cycles-backend # 36.38% backend cycles idle [68.20%] + 182,198,452 instructions # 0.85 insns per cycle + # 0.64 stalled cycles per insn [84.73%] + 35,172,437 branches # 476.683 M/sec [84.90%] + 2,002,118 branch-misses # 5.69% of all branches [87.69%] - 0.077180782 seconds time elapsed + 0.075044359 seconds time elapsed Iteration 5 Performance counter stats for 'java MatrixMultiplier 10': - 72.910525 task-clock # 0.962 CPUs utilized - 139 context-switches # 0.002 M/sec - 39 CPU-migrations # 0.001 M/sec - 4,253 page-faults # 0.058 M/sec - 214,855,398 cycles # 2.947 GHz [68.96%] - 117,804,486 stalled-cycles-frontend # 54.83% frontend cycles idle [84.19%] - 78,255,771 stalled-cycles-backend # 36.42% backend cycles idle [71.08%] - 182,706,403 instructions # 0.85 insns per cycle - # 0.64 stalled cycles per insn [89.11%] - 34,836,400 branches # 477.797 M/sec [89.82%] - 2,026,736 branch-misses # 5.82% of all branches [87.97%] + 75.848184 task-clock # 0.963 CPUs utilized + 177 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.001 M/sec + 4,256 page-faults # 0.056 M/sec + 222,550,625 cycles # 2.934 GHz [75.92%] + 122,058,241 stalled-cycles-frontend # 54.85% frontend cycles idle [83.66%] + 82,982,505 stalled-cycles-backend # 37.29% backend cycles idle [68.71%] + 183,204,443 instructions # 0.82 insns per cycle + # 0.67 stalled cycles per insn [84.97%] + 35,265,600 branches # 464.950 M/sec [85.01%] + 2,010,327 branch-misses # 5.70% of all branches [88.69%] - 0.075795774 seconds time elapsed + 0.078736540 seconds time elapsed Iteration 6 Performance counter stats for 'java MatrixMultiplier 10': - 75.648039 task-clock # 0.965 CPUs utilized - 168 context-switches # 0.002 M/sec - 46 CPU-migrations # 0.001 M/sec - 4,235 page-faults # 0.056 M/sec - 218,965,621 cycles # 2.895 GHz [85.82%] - 121,200,611 stalled-cycles-frontend # 55.35% frontend cycles idle [79.76%] - 84,094,158 stalled-cycles-backend # 38.41% backend cycles idle [68.13%] - 185,778,627 instructions # 0.85 insns per cycle - # 0.65 stalled cycles per insn [83.98%] - 34,528,645 branches # 456.438 M/sec [85.01%] - 2,049,866 branch-misses # 5.94% of all branches [83.50%] + 74.552674 task-clock # 0.978 CPUs utilized + 146 context-switches # 0.002 M/sec + 45 CPU-migrations # 0.001 M/sec + 4,252 page-faults # 0.057 M/sec + 220,109,964 cycles # 2.952 GHz [78.21%] + 119,486,246 stalled-cycles-frontend # 54.28% frontend cycles idle [84.59%] + 80,845,000 stalled-cycles-backend # 36.73% backend cycles idle [68.08%] + 184,366,056 instructions # 0.84 insns per cycle + # 0.65 stalled cycles per insn [84.04%] + 34,909,548 branches # 468.253 M/sec [84.14%] + 2,006,308 branch-misses # 5.75% of all branches [87.11%] - 0.078417437 seconds time elapsed + 0.076255589 seconds time elapsed Iteration 7 Performance counter stats for 'java MatrixMultiplier 10': - 74.829798 task-clock # 0.981 CPUs utilized - 157 context-switches # 0.002 M/sec - 41 CPU-migrations # 0.001 M/sec - 4,254 page-faults # 0.057 M/sec - 216,250,673 cycles # 2.890 GHz [84.46%] - 118,790,030 stalled-cycles-frontend # 54.93% frontend cycles idle [77.62%] - 78,834,710 stalled-cycles-backend # 36.46% backend cycles idle [68.42%] - 185,004,511 instructions # 0.86 insns per cycle - # 0.64 stalled cycles per insn [83.84%] - 35,127,218 branches # 469.428 M/sec [85.23%] - 2,014,756 branch-misses # 5.74% of all branches [86.76%] + 74.919822 task-clock # 0.945 CPUs utilized + 136 context-switches # 0.002 M/sec + 49 CPU-migrations # 0.001 M/sec + 4,232 page-faults # 0.056 M/sec + 215,665,200 cycles # 2.879 GHz [79.71%] + 122,784,131 stalled-cycles-frontend # 56.93% frontend cycles idle [86.01%] + 83,019,995 stalled-cycles-backend # 38.49% backend cycles idle [68.15%] + 184,014,109 instructions # 0.85 insns per cycle + # 0.67 stalled cycles per insn [84.43%] + 34,335,055 branches # 458.291 M/sec [85.30%] + 2,017,824 branch-misses # 5.88% of all branches [83.15%] - 0.076248085 seconds time elapsed + 0.079275197 seconds time elapsed Iteration 8 Performance counter stats for 'java MatrixMultiplier 10': - 74.739696 task-clock # 0.980 CPUs utilized - 149 context-switches # 0.002 M/sec - 56 CPU-migrations # 0.001 M/sec - 4,252 page-faults # 0.057 M/sec - 220,490,767 cycles # 2.950 GHz [82.19%] - 121,004,653 stalled-cycles-frontend # 54.88% frontend cycles idle [85.74%] - 81,908,614 stalled-cycles-backend # 37.15% backend cycles idle [67.71%] - 183,789,555 instructions # 0.83 insns per cycle - # 0.66 stalled cycles per insn [84.33%] - 34,221,793 branches # 457.880 M/sec [84.40%] - 2,058,395 branch-misses # 6.01% of all branches [81.97%] + 72.325490 task-clock # 0.978 CPUs utilized + 136 context-switches # 0.002 M/sec + 48 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.059 M/sec + 211,331,070 cycles # 2.922 GHz [83.78%] + 115,877,185 stalled-cycles-frontend # 54.83% frontend cycles idle [77.28%] + 75,513,035 stalled-cycles-backend # 35.73% backend cycles idle [67.46%] + 182,895,864 instructions # 0.87 insns per cycle + # 0.63 stalled cycles per insn [83.79%] + 35,178,485 branches # 486.391 M/sec [85.16%] + 2,003,949 branch-misses # 5.70% of all branches [88.08%] - 0.076228013 seconds time elapsed + 0.073979011 seconds time elapsed Iteration 9 Performance counter stats for 'java MatrixMultiplier 10': - 75.068830 task-clock # 0.977 CPUs utilized - 162 context-switches # 0.002 M/sec - 47 CPU-migrations # 0.001 M/sec - 4,255 page-faults # 0.057 M/sec - 215,412,368 cycles # 2.870 GHz [80.58%] - 121,493,936 stalled-cycles-frontend # 56.40% frontend cycles idle [81.92%] - 81,065,739 stalled-cycles-backend # 37.63% backend cycles idle [71.00%] - 182,646,249 instructions # 0.85 insns per cycle - # 0.67 stalled cycles per insn [84.17%] - 34,559,117 branches # 460.366 M/sec [84.07%] - 1,927,007 branch-misses # 5.58% of all branches [84.32%] + 74.615253 task-clock # 0.984 CPUs utilized + 136 context-switches # 0.002 M/sec + 41 CPU-migrations # 0.001 M/sec + 4,233 page-faults # 0.057 M/sec + 221,217,036 cycles # 2.965 GHz [78.81%] + 120,264,263 stalled-cycles-frontend # 54.36% frontend cycles idle [83.70%] + 80,040,282 stalled-cycles-backend # 36.18% backend cycles idle [68.39%] + 183,237,659 instructions # 0.83 insns per cycle + # 0.66 stalled cycles per insn [85.00%] + 35,439,125 branches # 474.958 M/sec [85.72%] + 2,039,792 branch-misses # 5.76% of all branches [85.90%] - 0.076856148 seconds time elapsed + 0.075848324 seconds time elapsed Iteration 10 Performance counter stats for 'java MatrixMultiplier 10': - 74.789082 task-clock # 0.983 CPUs utilized - 140 context-switches # 0.002 M/sec - 43 CPU-migrations # 0.001 M/sec - 4,233 page-faults # 0.057 M/sec - 221,271,457 cycles # 2.959 GHz [81.80%] - 120,519,135 stalled-cycles-frontend # 54.47% frontend cycles idle [84.80%] - 83,902,857 stalled-cycles-backend # 37.92% backend cycles idle [68.31%] - 183,981,689 instructions # 0.83 insns per cycle - # 0.66 stalled cycles per insn [84.58%] - 34,659,362 branches # 463.428 M/sec [84.13%] - 2,036,761 branch-misses # 5.88% of all branches [82.59%] - - 0.076072401 seconds time elapsed + 74.492689 task-clock # 0.973 CPUs utilized + 150 context-switches # 0.002 M/sec + 41 CPU-migrations # 0.001 M/sec + 4,255 page-faults # 0.057 M/sec + 216,573,426 cycles # 2.907 GHz [84.20%] + 120,115,088 stalled-cycles-frontend # 55.46% frontend cycles idle [79.15%] + 81,505,498 stalled-cycles-backend # 37.63% backend cycles idle [67.75%] + 184,181,901 instructions # 0.85 insns per cycle + # 0.65 stalled cycles per insn [84.02%] + 35,341,758 branches # 474.433 M/sec [84.88%] + 2,031,210 branch-misses # 5.75% of all branches [86.54%] + + 0.076539126 seconds time elapsed diff --git a/sankalp/java_output_10000 b/sankalp/java_output_10000 deleted file mode 100644 index 78f379f..0000000 --- a/sankalp/java_output_10000 +++ /dev/null @@ -1 +0,0 @@ -Iteration 1 diff --git a/sankalp/matrixMultiply_clang_optimized b/sankalp/matrixMultiply_clang_optimized new file mode 100755 index 0000000000000000000000000000000000000000..cec7923b87ebd9fe40a0fb7c27d0b3b70bc80e0a GIT binary patch literal 13285 zcmeHNeQ;FQb-%l-1!1I>z}OZBM_X59AQKjZ1QkJ)w?cvyUO))pLcxAoNh?@qC9QYg zI>J#29$BQ@1)}tmq)zP4q@B(r9@FWJhlxX3ECO*S%|Oz$N<~^~>||w}7Efy`o8ay5 z+;`9J+b1a>o#}tNn)l8zR_~q9wFI|09S*_8DSlfJS2<6Uka-tk{5K@4 zum-U}XyRjHnV1K}jZ2d)M9mu0DP@{zsgiSnmf&h|nm~h7lNF}RO;|8x4~bHLg`%md zNw0fMmZ=b436LK7y7FU^1?`j-rfZcSoruq|LnbVkvfdu(k)OY6VL#hdf3wA9T#b*ZV#S(h zq-#U{nrP4JXrwOq1u6` zH~q=yUH>wE;pM;ht^LNk?Zc0fE?=nr%B2I6i)WBtF$=zW7QAT|{NY(}^3{vWUg`nN zxcUW`t^hniW|Bv@L0O(DQpmlc&NWe7?HlPh$W5gBcZs6#UuSj zuSghiV<0N}Lec0zHw=)DGSC-_^o!njI4rgYTbs7(>wN2c>(RAv=Kl(H!X5adXH6HC zhU|$5j%8EGg6q3oSl7EVL3dLkb@?FHch(9a&-zA=gKKYX5+li+kPmW4{ z2k{j8$>Wl5BA$jm8I$~{h^HY>c7m_{S!?RrlY!Kmf#J7qw{^5$$z;kj5x8=3tt3~j z-lvJ|XCV0BqoXv|K-&GKrCt#j$r#SuRXNmAYuOh_y}g$Nk8jRGP9z_DO~V!nwKqxa zxmyjyUA*fG4Bv7DHjXE1dMm1%1%j4w1XAwv5Xvq2wiHUcUm=x^x6&sr1kh3L#uH;!??y-czvF-0-?6tX*uD7x zOzt?f{GQZF{ag0hN4Z>U>T)o(emnIGlr789-*xHGmBZSohJGOV%shaboeyf80 z38vRCKvOXF)9iE7Udg{wJxP|*<#(#caLJDd>N25Q3JT=Lnm67Zx**5sKjeSXua8w! z3;*ML+gfVx)aJ5}LOyjRd-q;0mv(;zS|gc?(|?H05spGUMl!FFL&stj)yJulT}a)W z2}HhAJ#uSLAocfwi|=d+T>M~#n`(s%D#nN>JX}Fwr z-w%G{*wCM~<}Uj;UamO#SSnNMN-Tn!- z-(s;JV*6{^K99@d|K9ZGMQ9$$Rh<4kI2BC0?*ki5KeAAg@-mQ?+V5kMoAY%fcdV^8 zV|iY=V;dh!FS+_yy8c?a>_qJZJxz=K)^y`Uy7BWBuQYzy@j0wFAFlyeoRV)Q4l4 zYtw#EnoU8tZ-8Eh=nJ4H@xU(;j=B66=qEA5N-&eY1-cxx5gTYD=r=$+K+CWl8lW$L zz5u!eI#e9bwhPB#rDIvy{8IW~q6XMcn_{I72)6`3+oNjPo?L`#qJzO79ZbGr*ICqkpSi(t8Wn6xw6dZqfTW*fzxJ zAjWIgqj6FEMiI9Z>SE7H_lbGBM;o611?OqksS@XY5B+E%`^}J>f*k!wnk#b=n2W$% z1m+?z7lFA5%tc@>0&@|Vi@;n2<{~f`fw>6$-y?w66|%4eJI^@%D^I1;B%(~wHn%2g z>a(UORo^w=|0p*=4QHGhk^HyajLYQto6$L^$@90CFl4DLG>NEE^Z`Yg(1#K#+3HS7 z`5nQy9J3Lh-dWR3Ao#nU?nD%>A`6Jj23%;b19C672sp5t;`@gG<1rnUe7 zJAbdX_jE!%mp@hXuM~Y%(aVbdlcGOS^p2wQ=4p15lHa~{>!-Xc_jM)vjpUkOq(2lN z@Yee_`07^ICMCFjmB|ZJ#@ihY^&j>=6OJb$1O47QUp))f9gD@o-H}9iop+@XI-FS3 z-V$u_?`_fR>euwbaCDV-WmhN>?(sq|7<_yuDX$X3mpIyIgt|cSxl__3T*Ft;a6Be_ z{R2kW=Wl9V4ZDgv+@JJyB_sH*9qAE1;*Nw8M})8EXg}ox}B33OvuRcaD{vbujC51l0sG1YH_#f8%|B)hB8R+2d%}f-;BmPSZmz>8K)-2&nSTX=WoNj zuB8xeyKvFo!usc&8aN@&DWFshcpfmSvOezvj{~EB_b-UZVvpaGKxyw_ zecmrVt_J#`(qsQwj_Ie-PJ0paydP;w->dZP{wr8KiwcRdKJR~>N}tEc{oBX?yiK3? z(?O*_t~w%pIwS1*^p2TgLjFd%W!WS8V!}0YIfe znh-;1XK>$6|ip=<4*^I&dNqXC8G zO|HN*{_kk8>htfHtkUmfMMYVU={q+4fY;OrcufWN)8q>MGk+Tuvc==yuk`nOO^LN8 z$=|tO2Hr=7{I|=o{&Os-D9KV`x(IddTQ;cMkGy8(BP)nH>oH6`uN}sS?#C|!Dre|$ zL3sq%I$Z2O?<=&vX6pa88qoVTVMb?MGvV_EpD$J=7owt-%p|`+bk2z1CwQMPwzDw5e;4Crg7@WOygZ+O zT8w-0|2Gul6@vH2V!Se+KUs_~61<-kh&v7_Sn%Zj14yg4bg)PT7gY#asvFqH&&9)IjU2M7)RMlA_p=S zdB5iNPe^=v92z7(Jq|6vouXWH+WI{xa44>mL;!vyIC< zAC`(i8~&D(KW@X{mG%~k8r!(;N%`sXZJrG5bor&g9b)=?TLXMC#!K0LRCs&aB5?^7 z-S*6a_X79gzhnEneOk(wiyI3xX-DP?pf(J=67$eLpZ`G0PhanJ?vkHp=bLuUOKU=W zMdFIFkiSv#u~Jk1hpO!o@I}u11tlX|%e7hT+@1w@AyAbwjJFcF*J@bRtAWpy4_pU) zk+Vv)sprnB8sVa_zwx}gfr;?AU_U|gZP0gRv3jeXhr=Kr3 zC2liLY&Wu=Eh*EYJ8mS5Br>EZ6MAdM?sh%cy0-(F)VkhW#O>H>Y3do!4@U>OLQ!4* zf3Am;g9871$D&~)+~eD@zOGhKgC6M_B(4rQ)$}iZPqMG?DEHH{t66rlt=+$~MQ4t> z;d-GL`7%KE(ibw~k-?qGs1b=pkHYI+NaQBSuV|B^ThR}_blXKH>GNi4{51K*fPMto^wF@;TX$n%J&}GriC0cCz1}XJkC=StV`kYG%Ot|azF1*6 z^3kZLpyM@;ik!^F*LOUlw}%f$5_n^^H5y7J5T@>EIMlx{Ci>JQC|Hs`Qr>@YfBy>t C>raXR literal 0 HcmV?d00001 diff --git a/sankalp/matrixMultiply_gcc_optimized b/sankalp/matrixMultiply_gcc_optimized new file mode 100755 index 0000000000000000000000000000000000000000..42919cf32e32d7a6ed36a855e2fd8ece469f4c68 GIT binary patch literal 13203 zcmeHNeQ;FQb-&tO31MI*h-?cC(Z*dI;aF>luS&+Qcf|_c(gkFY91?>ci*|+9UVUWu ztqmCpN`z=PD-mVdnNkm#YTCNvX{KXOr{iH7JC=fN(oCksjwfZt*rq8sD+2?WHW(Y@ z?eE-o&+gkNDNQ@m|8zC)oqK-woO{ka_v5YJJ4f2Wn;d0jf{R1^fgmnX;g^tk7h>>B zl2ur5;GXUz9B9URhz_M7uJo9WDaV-d_-Jf&b*TP2 z9DZ=b`-zC4yca3SQfa?rM5%5plq{%UR+#QKVZoI39)lkF`MVbObBD4wTU^em@iA4b zcrX#)w|?z|iD*M2-j_bmaG-g8!}_(pRKIVv9CtMwA=%B_I;Be-$69dYa}6$91JwS? zvcLFb#l7>d?|g6J&#(OK(a&Gmn4U+ve4+X~m#;%|$qdq~XTh~u@GsATlTRL8_VN&b znd~;qf(K^7m(7CL&w>kG-{0Hcr>Bfa($IB*Y3ZU_SdWH*WW3Ml*1LM17O7;UFDi_9 zZ%hoNjjoIPVo|^H^}}zNxq1WSdK)1?Rm(ZOs-O11l821;3+!3ZV^Msm#@3 zM7h7B+xKBx8+yI+G>hcdeSMiniGNA*4-rp8pBk6^YU1e#of?z;{lrrUrUoT{FYz?=sR79^Bc6slwHG}3uVoKc z{u2$V=|=7(uuS=VkZGF8ho`Y>U#IdHUq0C!PYMEbZLl>{NcZAMN zRO58h&P)z2AabU$!Y^`PL5Ke}HfGu>e`KjgXu}hRBY)QHqf^UV+DVOrkBp;Dr2p`T zejLeKw){B~{nq7X;wEo7wV}&pTFbeVx4Wt?DB!_FnU*O}LnvSKh7`({?t0=cF3-=26>W6+RjHi$AonMqBaWF5LYX(<(XCpK$UVczn?ODxBnqT$_+lt? z2FS-i4sXyVFFBgtt*RR|`?;3$ORa06Oz=ICTf>a&{oI#P4`o~*XhWyV0xjo{yloCF zusg6P@MJ*801M*_e6=ZW@whhk?rluyncP2uWXrd~@bE;{@qd8Hpox(Q$zM6NOwe077S68qhO-ZNo8ApO*VREi>};q9;dq8J=eIiV%RNt4 zCO^KK`N`zXy2($=SN-@@6#Z1acy`rWfy_d$6pM-6A4$0%Q5y#1vMN-)_={CHPF%4bkUrlZ241|UK-=8u+fb* z+Vt-5#NqYqFBaCCER_bfC>k!f{S(hhUQ{Ob94ZY#Y{q(bZzGa0MLPy?yjdn#~ z=#8=vR#L7VE!pxr&=PFP9eEzz?uK31uc{Nujt~9M|Ly%hCHsHzeWB39a^aW zzb{VmY0La}2D6L)7$O++@IQC%Jp6QEG>{Kx8~z$tIJ@$YBrAqNnyzAz4!badt=ZsJ z+-j~g-3VkCHa1NZ`wL|sJ{`!`e4F-D)r&R1U-nj@WfD`+c;u2c^rlN|c|ZL#gaylP z>c}ZG_$B*kdi+1Slj46kV(!x!;{OQ*eoOqfAPOxj{suz!_@Dih;`1G}$oS73pU1=5 zbWe;K3?UA*I&(luJwS#GS z@5uRZ=Hpxt^>F4|?qSd;_JlLPGMC}h1K_O(hL%Zq&xJEl?*(nN;ZK)fPDWRb5CNVG zXAJN4aORNrrk2_5#R+(&IlSspAagsExuH$oc7`(lmixgcI827G8q4Wu@I&v@aOOrZ zb1jgskzQ#nm(w3<+1<1|65i@?HtMYnqvi=`4R3uod&t{}z%-v$R_YUz;&TA9O_Lwqvk_;OR!c3p^{M9;_}=c8_zz zE>PMm%i+EO`U+?bo?_>rauWOqX7wWIA*}ufuh_GfTHW;{s{ z6k6St)Xxa6arAS!&`)soe%c*pXXq_+^`7Kq=`f?lXp&(UYmAR!@0F9^L|&^tx|hBKqR{!)7nL-Y{zUV@&X z^o~1VZ`2ubdq!NEyZ%`DW_ROI1%gSQVhCoWNZ6dWSD-)saX!C+fS|kj8F!_eH=5^j z=r=?7V0&@}gKSThpS7c#TJI^@&1($`t|ESNHVxZhF@kM5{*rmQ}{^s+1 zKS3uPej%*70=&(*dBlLVIHrg~n$H>-AK?*EMQ(%^Np94-{V{CGFuFzF)?Y1H#wWZ^V3o)=+~H*{`_$eQDpmbQ~X`<5A%w zt|yY}5x(fbKJ;f&BWbog6HBJz{e2~jj<#eh5g`Rt8%P+!7w?PXZp04Y-VFwA{n3aK z5x!WD-kpr}#`K;jbeR*rE~7u0fhExZmH`#n_V;bQ#`haX%qZ^0wE;>}g8%32fd zR(-?am$;!i^h&OHv+D=ZbOU>W?VoV?rSJ&_u>YL%!TV1N;kFGIodK+W%Han`=Y=Gq zQVqBQELB;b_v_=p=!{@}K6fV6!NKPYL}anY?@6Gv$625Eb+a1iT}qGrXE~u9 zbEsJL`MI=9J-FN~sHh4{0Ubw;^f~@L>bcgV^!fR~3U>V$Z2Fw%!}&kESy55D{>wJ~ zv&#NiWuLyOSPRb|V-u*5|NNZfd??Nb;yAOsUH^pXO=_BkKrLLC}VSl;A{Jmde42CF{*&d4eK zy{xDx>oNVvrmuNS4b5XJu%9MZw9ou?RH!c=|6ZlP%VSDtCMn$Q{rv_lh^7qS^3-wqRx5@6K`9hX45K@oS=sb$_iYR!^LsqbA|TTO!iNx z0o}57ZnqEhS&I|iHaq;&+9}hCpOe-`Cp_WjUn%Y?{Jt&4%L~72OYsUZ;q+S}S$E<| z%g+~UqZ3i#=SC?$U-0vw6u(38IbVt|D4gG=_(H+waw)zD=d9lf$+}ax3%~EJjZRS| z_#T^ihlv;&R#1d>rVX2=X1r{=oEJ%uX85(y9#+}rSf+d z{*NfdYX$GyQhcf4{aA`qmS1Tx_rW4@!WK{3UoP=$%B(6W^t-4G8Hapcb0h87GBG_4 z%@Us;hc@62u}HjRv-^aUFZ$2><|&2usB?z*;{nx=XPzImVwuhVqYxqg8*TCbp2Qc6 z3vPe06V(1v;?w>A0dVr)qn>-LG>OVgaeG_#vs4Ty|6NMq9fc3t#$`SqmWnYOeo@Jf z+wd#0za_$J8`o_qKYhJb$iPmQUkbcTOkZyg0$+mhQsx{LKHeUcxP(e>kIjO21NY#+ zX8XGRhLm3<2JZ07evYZ$hJaUN9qv-&Wh38_^3(S_J$K1ZQEB#bSt)#9;nx-Zp~7DR zzS!{vLCJj9@~V`#B4+*kEci9x)iaEXasxcmyAcZzz?t%P>wqtI)QWc7cq!LpvE>}& z^|N7?ezr<{k)RYuDj9hfV$Uq{-%#@HY9BqX%`3RQ^Na)1NO>5;tW^?p?@B zwxl+TuB4GN(#Tw-T;+`&+jr>U(9RBIJnMR}gxj*w(iH92_b2-IMH0IF_gs&p4+#A0 zJ&=eQv8ZqTx;0IL8uWPd0C8)O^-TZaN7KE%2iZ>BwxBe#X-8mdo6a1W;d;@Ed>0_C z^hS(i{J_?9!iWzf4#MkgNVO&?plGY28)1iDI_QyPGICIlAx~Qmer;P|Ysl6jQ@n+~ zIlR3!5Z1SE+O)H+L+=Q*hTA9zGJU%%mDc4;3rgPh`#F1?GPYIPcPU6OB+Q&|A(O>- z#8Pm0tMpUoG5Nkibr?@1B;FNEnX;iibXkDZEO10@$>gP0Wiomxr0W(}Y$@$#qWU!X zRKMPXr1nHi=%MWxL^R%~r&BRA%iS(rh>m={W9Gb<%A{gO=Rk2davD^`b-b}rQIeVQ z*39~1CzK+uZ+S-F5!)Y6;kDJqL?o3$u(}elNMGlG=v7OhXhZr!iTTA&Xr}%fRebti literal 0 HcmV?d00001 diff --git a/sankalp/matrixMultiply_mod.c b/sankalp/matrixMultiply_mod.c new file mode 100644 index 0000000..99c3b69 --- /dev/null +++ b/sankalp/matrixMultiply_mod.c @@ -0,0 +1,157 @@ +#include +#include +#include +#include +#include + +static int **matrixA; +static int **matrixB; +static int **matrixC; +static int N; + +static int randomMaxValue = 100; + +void setUpMatrices() { + + int i = 0; + + matrixA = malloc(sizeof(int *) * N); + matrixB = malloc(sizeof(int *) * N); + matrixC = malloc(sizeof(int *) * N); + + + + for (i=0 ; i " +if [ "$#" -ne 7 ]; then + echo "Usage: bash $0 <# of integers> " exit fi @@ -11,6 +11,9 @@ STR_C_GCC="gcc_output_$1" STR_JAVA="java_output_$1" STR_PYTHON="python_output_$1" STR_C_CLANG="clang_output_$1" +STR_C_GCC_OPTIMIZED="gcc_output_optimized_$1" +STR_C_CLANG_OPTIMIZED="clang_output_optimized_$1" + for i in {1..10} do @@ -18,10 +21,15 @@ do echo "Iteration $i" >> $STR_JAVA echo "Iteration $i" >> $STR_PYTHON echo "Iteration $i" >> $STR_C_CLANG + echo "Iteration $1" >> $STR_C_GCC_OPTIMIZED + echo "Iteration $1" >> $STR_C_CLANG_OPTIMIZED + 3>>$STR_C_GCC perf stat --log-fd 3 ./$2 $1 > /dev/null 3>>$STR_JAVA perf stat --log-fd 3 java $3 $1 > /dev/null 3>>$STR_PYTHON perf stat --log-fd 3 python $4 $1 > /dev/null 3>>$STR_C_CLANG perf stat --log-fd 3 ./$5 $1 > /dev/null + 3>>$STR_C_GCC_OPTIMIZED perf stat --log-fd 3 ./$6 $1 > /dev/null + 3>>$STR_C_CLANG_OPTIMIZED perf stat --log-fd 3 ./$7 $1 > /dev/null done diff --git a/sankalp/threading/matrixMultiply_clang b/sankalp/threading/matrixMultiply_clang new file mode 100755 index 0000000000000000000000000000000000000000..fc4eb797f4f09842fb272d3380998f286c93f76e GIT binary patch literal 13383 zcmeHNeQ;b=6~Ea{+7!}uTLYv}>8cy2pxvfT=maVH(qzjEZb~RE0|LHmcQ?)AW;e6@ z7E=UFZ9&$h5*R=5yQAo!j$=m|t)h}pG>oEvIAc}*2oBYajbj)JjaXQJ=e~P(-+S2= z`NO}=-Pw2U`Q3BQJ@>r(?tLHUqoMG2PhFkh;t}r^#7!*GBxD_hn0}jN71k-12~Aum zE)YwAG~lnv7NS;->AW({v{A`uq|m<0=_taml^$j|?_u%A0sf3@OLRO4f+Sg|pg*t4Z$V=}fO znMmbEH;i^}*|4P}m`w*a%W;$YBzwh<-O?qFV+%O)xfy?&1Js^+qV%rae{FrS(Ddvx zqG^2X;g25BNtgeq{@3LbkW^E^q0?FekJrFQYv3QKfp-D-<9icXGoI;AMzYy>Rww}@3NbTYW^Ya> zQo=Cy4yRK_){JCK!yt1}GPFfxGm%tGn2BL1WD+TJPz*^TbmqW(FjGKk*cTnSSt_{@$B^=7W0v&-#HE=K6Q_PEAa# z)Pz1Y*(S-<^m0uU_d@X0__&U->xG7y7QfK%oG?A5r{&Pc?Pa%~KXDBSj$N*yBawUm zBW+mnq4plI`u>yaiJSbFS3hvFPQUbcHZZtyU5`KzC+hTk!#NNtHUC@+6&jY3%B9CM zfBr?oOX#$Yy1U_~V}pZ(!IkR{VhE&n`H^$c5A|!VJ}M#j)_BvSo#?1EebX_!cjMzE z2lsqap)*o8THiW?Q>{-wcU+2Wx5bLbD3p) z<)Pci(~3C{b+wIDqPL&X3r$vc`TBplWiFI5eURDOD!a|sKjoHr^)<3%$x!!j|0(p{ zKvOIqIx}P9ywqcI4OpB1dNbgCpOT5=FNom;ruVIWk`ESe>HyR`K-v z)kF4i2}`9y=u~+I(2j`+o~jZ-71&c0SRT*H?{@6B2V72F8t2yib*J-N_rtWB1gB;` zU6}-xnUSb~mC1fNKw2Qm>jTes_n76?k06!Zf0L)B?5><2TV8#m`Oz#T7R(Rp!u(JE zE^w5tGz6})ZWQV#X+63BpR^8GxD{jzztx6YUR(Gc;PzQUSDLOaR=GZr9(ZXB_BSiu zT4Sb)Zzo=^EB5tR#yfxe{8UKIsyVoe<^T41J%4*qq4sHW2+dO=DOCu~l}|^+8s(f` z=qu{cWv)vSG>S`rT-m`#V^g{#9OQURA`oz^k|3LQT~D*<#h1|Na*>{w0qg^w(#S{n-Rxi9MeM? zD1>IqQMjHA{*260(GNAZ`mi5E0)wALP><*9?^V@lee!v)UWe_WZ#G;A9S7^_t$QMz zpDf;enr7$kpr%GYJM&o#v`T+L>ZQ_O6de`%rm_1>7QZHqJZ(4fn4B>f8fHf`nsw?H z^+wc-?O5k!Br!+YD!Z_rPX>;M^Rd9RerUt9EBqpSsP#!Az>DF$8JG*_ZwnyEHwJKb zG20ow=tNikwch+I`s8cg-u&;2A9)2G-T8NO?WRA`eiqKZ8qUAclmACosrfnmz%krY zoXq`AFWeZwtx7WB3m0O6mN07maKQ|$4;O9=w85iJY=&bL)0e8;AISR`+_7}RFa5xL z$z1aYJ?5(Wl#`9P?smdH2jZmGnC)m_lEv~e7G0N7gmhtTg45?JBezM|#Im1lpraZJ4L{L3zG z54@dVlIg*J8bgpvPS*=Ur z`{RK7G5)XDXnz6tG}<4o(O!>!#}K#Q)MyW&y$x}c563S51JLO~`vBsbC;hAMX}D{N zu|hkr^j^;=y@%>O*R7zNXo_!mc&2Rs^)^0(bNuf_B8 z+fk3j<8f4$FDT02JX#cgj-pJws#07xAZz^0BVX76;pa~N26LX07s_A8i}jjp;cqhB zAAN|R!aQDh%key<-j#CS{S8;n&x!|5$0^he2F%cwg zD3To#!PveO>{-;zSS`v~2VvFoQ!-+P3WM$wE4s9v+UTO!wJ%^ZW%+ zp=+DxZ>L8CSIOI;_bT?n>i}c#K!vU$*5BpPz*X`h{F192>MK=Q+k~TC-}Gn_HF+~M?D%iA&x4bQw^BbDXOwQ zuLsuxqcw>2d0m@R3lpzn5Rt_lzYhYXHH7tf-MB{$^n9hq{<9p@522mbB<6WtdPwPO zN}v2E8TMbn;#O2hl=XQXEGm5-C-=|#j30FA^Sa6lJ+H&0PkV)1|C7KdCgdL#-bdzC zhun|VYWd1_qVz7zuJ2o-5iESlpnRt&5$oVnb*7&JZ`Yqt`V&fD=MBK6r&#fMmp<=% zjjDqcEU2goYZ*O^8uicdZ&CYZi_+))j}_ed54rR?kBIY&VyvjBTmJ_x{kv8FcdPyn zl5@7g=Z~QYR7iyPVa~VWd?SuC%e(cbT>A87oyvNZkM&0S^e)xjKYdlF(y8>_{ki#P zAxo#4{pWp@^T7_Q@$>v-efH})=-T_|Je28mXh30ki>vUAKaU2xKHtX_mHrSbD$06H z|K`%~_YX+Pe!nE;d>M+F^|70PYN^JfUvz-irEW{MmnASLpJt*8h6im{8Wa z8r}U{Qq_-MjIz_CEoh`1DBdUSjb3=d`=1l9FW)~q@doTunjMmLFJ?6FL-s~5c3R$F zoOq+)eZz?_6TBZdaonXhXm&`}z1T^4{kAuHvGVh}?8KLs^H81m3c>5B6JIHKeRSf! zavr4v0Th9(JCNnbbZx}7fTKh4BZ#iA+wOzYi_?-;tS)@De;AI z2mz;leM>deD&+=L>qNzWzHV+-_>fv>_<9@#PIkszc53;5P}*57{I2-lC-GIHakYk8 zrF;d|x+>@K+rX*cr;$!(FOy)Z#qGDiXsq0$=565!b2n%OdTB zi^@92^Jg3I)huMAlwVHgi_#sbAuZ`yGhIJfrONH)#@hSjqgMhMkj2{>WLD{0Sw0 zM&b+i9go+F1LdPoq5DKC%O!5r9mgn=nQf`hBAPL?W)7K8QRFsv@49NI5$?Ta7c!y^ zqsPHr*==izrH#GG^qxr4kk9i*BsVJXtUi*AoAFq1%O&lb1T`3m*eG%B$daa40~t7}_0L_v`0-qCE% zkZ(CC*;~`>+1}0^b7vd9$gonytyJ=z@htrAlkN&5F5hz~yNP5{;!#RlmucrtQxfY< zjpQtK5>qFLgXPLgcdE;zb|+*QHuqfF@Mz1XjUgn$C*#8Cy$XYfB~nHXZ>3~ryxUSa zNb;6ywlDAV7m^KYhDcZUD~ literal 0 HcmV?d00001 From f2b668081af218716d1678178e927919069f443f Mon Sep 17 00:00:00 2001 From: Nachiket N Rau Date: Thu, 12 Feb 2015 23:43:28 -0500 Subject: [PATCH 04/11] Threading results --- nachi/clang_output_100 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/clang_output_1000 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/clang_output_3000 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/gcc_output_100 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/gcc_output_1000 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/gcc_output_3000 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/java_output_100 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/java_output_1000 | 180 ++++++++++++++++++++++++++++++++++++++++ nachi/java_output_3000 | 180 ++++++++++++++++++++++++++++++++++++++++ 9 files changed, 1620 insertions(+) create mode 100644 nachi/clang_output_100 create mode 100644 nachi/clang_output_1000 create mode 100644 nachi/clang_output_3000 create mode 100644 nachi/gcc_output_100 create mode 100644 nachi/gcc_output_1000 create mode 100644 nachi/gcc_output_3000 create mode 100644 nachi/java_output_100 create mode 100644 nachi/java_output_1000 create mode 100644 nachi/java_output_3000 diff --git a/nachi/clang_output_100 b/nachi/clang_output_100 new file mode 100644 index 0000000..8613750 --- /dev/null +++ b/nachi/clang_output_100 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 100': + + 15.071694 task-clock # 2.628 CPUs utilized + 127 context-switches # 0.008 M/sec + 100 CPU-migrations # 0.007 M/sec + 399 page-faults # 0.026 M/sec + 31,101,001 cycles # 2.064 GHz [ 4.30%] + 28,337,526 stalled-cycles-frontend # 91.11% frontend cycles idle [99.25%] + 10,734,719 stalled-cycles-backend # 34.52% backend cycles idle + 34,618,612 instructions # 1.11 insns per cycle + # 0.82 stalled cycles per insn + 3,822,365 branches # 253.612 M/sec + 41,811 branch-misses # 1.09% of all branches [97.78%] + + 0.005735029 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 100': + + 14.593209 task-clock # 2.494 CPUs utilized + 102 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.007 M/sec + 399 page-faults # 0.027 M/sec + 28,783,921 cycles # 1.972 GHz [48.38%] + 27,903,223 stalled-cycles-frontend # 96.94% frontend cycles idle + 10,382,581 stalled-cycles-backend # 36.07% backend cycles idle + 34,516,366 instructions # 1.20 insns per cycle + # 0.81 stalled cycles per insn + 3,810,205 branches # 261.094 M/sec + 33,301 branch-misses # 0.87% of all branches [72.66%] + + 0.005852332 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 100': + + 14.345599 task-clock # 2.691 CPUs utilized + 97 context-switches # 0.007 M/sec + 102 CPU-migrations # 0.007 M/sec + 398 page-faults # 0.028 M/sec + 32,425,568 cycles # 2.260 GHz [69.19%] + 27,432,781 stalled-cycles-frontend # 84.60% frontend cycles idle + 10,667,385 stalled-cycles-backend # 32.90% backend cycles idle + 34,542,622 instructions # 1.07 insns per cycle + # 0.79 stalled cycles per insn + 3,817,996 branches # 266.144 M/sec + 31,758 branch-misses # 0.83% of all branches [52.88%] + + 0.005331603 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 100': + + 15.279836 task-clock # 2.976 CPUs utilized + 90 context-switches # 0.006 M/sec + 100 CPU-migrations # 0.007 M/sec + 398 page-faults # 0.026 M/sec + 20,673,626 cycles # 1.353 GHz [ 3.15%] + 28,411,948 stalled-cycles-frontend # 137.43% frontend cycles idle [99.00%] + 10,904,807 stalled-cycles-backend # 52.75% backend cycles idle + 34,701,052 instructions # 1.68 insns per cycle + # 0.82 stalled cycles per insn + 3,857,795 branches # 252.476 M/sec + 44,207 branch-misses # 1.15% of all branches [99.32%] + + 0.005133844 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 100': + + 15.031845 task-clock # 2.751 CPUs utilized + 99 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.007 M/sec + 399 page-faults # 0.027 M/sec + 31,971,840 cycles # 2.127 GHz [ 6.04%] + 27,963,708 stalled-cycles-frontend # 87.46% frontend cycles idle + 10,453,352 stalled-cycles-backend # 32.70% backend cycles idle + 34,769,282 instructions # 1.09 insns per cycle + # 0.80 stalled cycles per insn + 3,877,105 branches # 257.926 M/sec + 41,565 branch-misses # 1.07% of all branches [97.98%] + + 0.005463449 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 100': + + 15.359790 task-clock # 2.957 CPUs utilized + 91 context-switches # 0.006 M/sec + 100 CPU-migrations # 0.007 M/sec + 398 page-faults # 0.026 M/sec + 28,618,862 cycles # 1.863 GHz [39.98%] + 28,431,317 stalled-cycles-frontend # 99.34% frontend cycles idle + 10,648,456 stalled-cycles-backend # 37.21% backend cycles idle + 34,519,354 instructions # 1.21 insns per cycle + # 0.82 stalled cycles per insn + 3,813,770 branches # 248.296 M/sec + 35,097 branch-misses # 0.92% of all branches [81.22%] + + 0.005194823 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 100': + + 15.317013 task-clock # 2.470 CPUs utilized + 120 context-switches # 0.008 M/sec + 100 CPU-migrations # 0.007 M/sec + 408 page-faults # 0.027 M/sec + 30,267,289 cycles # 1.976 GHz [10.27%] + 28,537,036 stalled-cycles-frontend # 94.28% frontend cycles idle [98.68%] + 11,180,217 stalled-cycles-backend # 36.94% backend cycles idle + 34,766,298 instructions # 1.15 insns per cycle + # 0.82 stalled cycles per insn + 3,860,893 branches # 252.066 M/sec + 42,126 branch-misses # 1.09% of all branches [96.90%] + + 0.006200448 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 100': + + 14.798275 task-clock # 2.732 CPUs utilized + 107 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.007 M/sec + 397 page-faults # 0.027 M/sec + 31,455,395 cycles # 2.126 GHz [61.20%] + 27,765,095 stalled-cycles-frontend # 88.27% frontend cycles idle + 10,711,491 stalled-cycles-backend # 34.05% backend cycles idle + 34,767,136 instructions # 1.11 insns per cycle + # 0.80 stalled cycles per insn + 3,874,184 branches # 261.800 M/sec + 33,155 branch-misses # 0.86% of all branches [59.28%] + + 0.005416411 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 100': + + 14.519964 task-clock # 2.835 CPUs utilized + 99 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.007 M/sec + 401 page-faults # 0.028 M/sec + 27,900,765 cycles # 1.922 GHz [ 6.07%] + 27,230,344 stalled-cycles-frontend # 97.60% frontend cycles idle + 10,481,084 stalled-cycles-backend # 37.57% backend cycles idle + 34,637,637 instructions # 1.24 insns per cycle + # 0.79 stalled cycles per insn + 3,842,227 branches # 264.617 M/sec + 37,938 branch-misses # 0.99% of all branches [97.21%] + + 0.005121954 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 100': + + 15.061104 task-clock # 2.691 CPUs utilized + 111 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.007 M/sec + 397 page-faults # 0.026 M/sec + 40,602,016 cycles # 2.696 GHz [98.68%] + 28,505,449 stalled-cycles-frontend # 70.21% frontend cycles idle + 10,731,646 stalled-cycles-backend # 26.43% backend cycles idle + 34,830,384 instructions # 0.86 insns per cycle + # 0.82 stalled cycles per insn + 3,889,367 branches # 258.239 M/sec + 30,932 branch-misses # 0.80% of all branches [ 2.38%] + + 0.005597097 seconds time elapsed + diff --git a/nachi/clang_output_1000 b/nachi/clang_output_1000 new file mode 100644 index 0000000..2e934cc --- /dev/null +++ b/nachi/clang_output_1000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18396.287875 task-clock # 15.476 CPUs utilized + 5,329 context-switches # 0.000 M/sec + 2,069 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 53,349,914,221 cycles # 2.900 GHz [84.90%] + 45,724,619,380 stalled-cycles-frontend # 85.71% frontend cycles idle [84.09%] + 9,423,771,208 stalled-cycles-backend # 17.66% backend cycles idle [66.08%] + 26,043,932,314 instructions # 0.49 insns per cycle + # 1.76 stalled cycles per insn [83.60%] + 2,043,110,731 branches # 111.061 M/sec [83.96%] + 1,822,446 branch-misses # 0.09% of all branches [84.58%] + + 1.188702842 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18835.885586 task-clock # 15.515 CPUs utilized + 5,599 context-switches # 0.000 M/sec + 2,228 CPU-migrations # 0.000 M/sec + 5,181 page-faults # 0.000 M/sec + 54,659,225,975 cycles # 2.902 GHz [83.43%] + 47,004,345,518 stalled-cycles-frontend # 86.00% frontend cycles idle [83.16%] + 9,931,049,071 stalled-cycles-backend # 18.17% backend cycles idle [67.47%] + 26,085,984,878 instructions # 0.48 insns per cycle + # 1.80 stalled cycles per insn [84.53%] + 2,047,829,944 branches # 108.720 M/sec [84.28%] + 1,818,376 branch-misses # 0.09% of all branches [84.42%] + + 1.214018383 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18349.744926 task-clock # 15.483 CPUs utilized + 5,281 context-switches # 0.000 M/sec + 2,379 CPU-migrations # 0.000 M/sec + 5,182 page-faults # 0.000 M/sec + 53,488,227,542 cycles # 2.915 GHz [85.07%] + 45,809,055,421 stalled-cycles-frontend # 85.64% frontend cycles idle [85.24%] + 9,330,085,107 stalled-cycles-backend # 17.44% backend cycles idle [66.96%] + 25,885,880,720 instructions # 0.48 insns per cycle + # 1.77 stalled cycles per insn [82.53%] + 2,029,368,491 branches # 110.594 M/sec [82.03%] + 1,800,665 branch-misses # 0.09% of all branches [83.98%] + + 1.185121953 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18377.494558 task-clock # 15.456 CPUs utilized + 5,591 context-switches # 0.000 M/sec + 2,447 CPU-migrations # 0.000 M/sec + 5,179 page-faults # 0.000 M/sec + 53,652,351,697 cycles # 2.919 GHz [84.19%] + 45,821,210,425 stalled-cycles-frontend # 85.40% frontend cycles idle [83.41%] + 9,458,937,540 stalled-cycles-backend # 17.63% backend cycles idle [66.14%] + 25,964,104,996 instructions # 0.48 insns per cycle + # 1.76 stalled cycles per insn [83.85%] + 2,050,532,931 branches # 111.578 M/sec [84.23%] + 1,840,610 branch-misses # 0.09% of all branches [83.96%] + + 1.189050216 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18582.968211 task-clock # 15.459 CPUs utilized + 5,598 context-switches # 0.000 M/sec + 2,314 CPU-migrations # 0.000 M/sec + 5,179 page-faults # 0.000 M/sec + 54,087,449,650 cycles # 2.911 GHz [83.56%] + 46,413,498,667 stalled-cycles-frontend # 85.81% frontend cycles idle [82.71%] + 9,631,910,593 stalled-cycles-backend # 17.81% backend cycles idle [66.94%] + 26,059,275,705 instructions # 0.48 insns per cycle + # 1.78 stalled cycles per insn [84.17%] + 2,052,254,573 branches # 110.437 M/sec [84.51%] + 1,814,430 branch-misses # 0.09% of all branches [84.49%] + + 1.202079615 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18506.448315 task-clock # 15.451 CPUs utilized + 5,891 context-switches # 0.000 M/sec + 2,220 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 54,050,865,680 cycles # 2.921 GHz [84.36%] + 46,330,742,406 stalled-cycles-frontend # 85.72% frontend cycles idle [83.54%] + 9,786,155,885 stalled-cycles-backend # 18.11% backend cycles idle [66.06%] + 26,060,272,982 instructions # 0.48 insns per cycle + # 1.78 stalled cycles per insn [83.54%] + 2,054,510,777 branches # 111.016 M/sec [83.21%] + 1,861,805 branch-misses # 0.09% of all branches [83.79%] + + 1.197731831 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18630.834955 task-clock # 15.481 CPUs utilized + 5,309 context-switches # 0.000 M/sec + 2,335 CPU-migrations # 0.000 M/sec + 5,181 page-faults # 0.000 M/sec + 54,252,758,893 cycles # 2.912 GHz [84.69%] + 46,551,150,266 stalled-cycles-frontend # 85.80% frontend cycles idle [83.33%] + 9,696,696,720 stalled-cycles-backend # 17.87% backend cycles idle [66.37%] + 25,966,694,333 instructions # 0.48 insns per cycle + # 1.79 stalled cycles per insn [84.15%] + 2,047,371,966 branches # 109.892 M/sec [83.93%] + 1,842,127 branch-misses # 0.09% of all branches [84.14%] + + 1.203491446 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18471.836002 task-clock # 15.474 CPUs utilized + 5,642 context-switches # 0.000 M/sec + 2,357 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 53,882,889,065 cycles # 2.917 GHz [84.18%] + 46,160,739,219 stalled-cycles-frontend # 85.67% frontend cycles idle [83.07%] + 9,725,193,069 stalled-cycles-backend # 18.05% backend cycles idle [65.87%] + 26,026,994,638 instructions # 0.48 insns per cycle + # 1.77 stalled cycles per insn [83.46%] + 2,048,276,811 branches # 110.886 M/sec [84.33%] + 1,813,793 branch-misses # 0.09% of all branches [84.31%] + + 1.193724889 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18392.390099 task-clock # 15.478 CPUs utilized + 5,486 context-switches # 0.000 M/sec + 1,903 CPU-migrations # 0.000 M/sec + 5,182 page-faults # 0.000 M/sec + 53,630,048,548 cycles # 2.916 GHz [84.22%] + 45,852,620,885 stalled-cycles-frontend # 85.50% frontend cycles idle [84.02%] + 9,484,042,119 stalled-cycles-backend # 17.68% backend cycles idle [67.16%] + 25,920,042,284 instructions # 0.48 insns per cycle + # 1.77 stalled cycles per insn [83.50%] + 2,040,023,559 branches # 110.917 M/sec [83.30%] + 1,819,577 branch-misses # 0.09% of all branches [84.02%] + + 1.188283145 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 1000': + + 18399.857023 task-clock # 15.462 CPUs utilized + 5,734 context-switches # 0.000 M/sec + 2,071 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 53,564,351,453 cycles # 2.911 GHz [84.27%] + 45,867,324,666 stalled-cycles-frontend # 85.63% frontend cycles idle [83.26%] + 9,547,362,193 stalled-cycles-backend # 17.82% backend cycles idle [65.78%] + 26,037,577,838 instructions # 0.49 insns per cycle + # 1.76 stalled cycles per insn [83.50%] + 2,049,506,105 branches # 111.387 M/sec [83.90%] + 1,855,088 branch-misses # 0.09% of all branches [84.71%] + + 1.190042345 seconds time elapsed + diff --git a/nachi/clang_output_3000 b/nachi/clang_output_3000 new file mode 100644 index 0000000..0b8f544 --- /dev/null +++ b/nachi/clang_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply_clang 3000': + + 683602.290403 task-clock # 15.450 CPUs utilized + 188,550 context-switches # 0.000 M/sec + 124,825 CPU-migrations # 0.000 M/sec + 38,610 page-faults # 0.000 M/sec + 1,999,462,444,454 cycles # 2.925 GHz [83.42%] + 1,792,201,743,624 stalled-cycles-frontend # 89.63% frontend cycles idle [83.39%] + 732,108,261,478 stalled-cycles-backend # 36.62% backend cycles idle [66.64%] + 704,703,744,949 instructions # 0.35 insns per cycle + # 2.54 stalled cycles per insn [83.36%] + 54,751,821,576 branches # 80.093 M/sec [83.31%] + 28,992,325 branch-misses # 0.05% of all branches [83.36%] + + 44.246815535 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply_clang 3000': + + 656346.268253 task-clock # 15.808 CPUs utilized + 180,684 context-switches # 0.000 M/sec + 60,920 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 1,920,078,756,344 cycles # 2.925 GHz [83.35%] + 1,713,914,650,003 stalled-cycles-frontend # 89.26% frontend cycles idle [83.40%] + 673,492,997,060 stalled-cycles-backend # 35.08% backend cycles idle [66.69%] + 704,563,852,613 instructions # 0.37 insns per cycle + # 2.43 stalled cycles per insn [83.40%] + 54,680,965,978 branches # 83.311 M/sec [83.33%] + 23,359,720 branch-misses # 0.04% of all branches [83.36%] + + 41.519713143 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply_clang 3000': + + 650472.372196 task-clock # 15.842 CPUs utilized + 179,054 context-switches # 0.000 M/sec + 51,924 CPU-migrations # 0.000 M/sec + 38,667 page-faults # 0.000 M/sec + 1,902,954,424,195 cycles # 2.925 GHz [83.39%] + 1,697,271,920,745 stalled-cycles-frontend # 89.19% frontend cycles idle [83.34%] + 657,960,307,195 stalled-cycles-backend # 34.58% backend cycles idle [66.66%] + 704,440,174,470 instructions # 0.37 insns per cycle + # 2.41 stalled cycles per insn [83.40%] + 54,675,514,763 branches # 84.055 M/sec [83.33%] + 22,892,161 branch-misses # 0.04% of all branches [83.40%] + + 41.059065184 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply_clang 3000': + + 651631.525229 task-clock # 15.824 CPUs utilized + 182,372 context-switches # 0.000 M/sec + 52,036 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 1,906,309,513,113 cycles # 2.925 GHz [83.26%] + 1,700,558,939,253 stalled-cycles-frontend # 89.21% frontend cycles idle [83.34%] + 661,130,828,448 stalled-cycles-backend # 34.68% backend cycles idle [66.77%] + 704,518,430,975 instructions # 0.37 insns per cycle + # 2.41 stalled cycles per insn [83.44%] + 54,700,285,137 branches # 83.944 M/sec [83.42%] + 23,179,824 branch-misses # 0.04% of all branches [83.35%] + + 41.179632917 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply_clang 3000': + + 645090.508110 task-clock # 15.842 CPUs utilized + 177,144 context-switches # 0.000 M/sec + 37,511 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 1,887,230,872,785 cycles # 2.926 GHz [83.46%] + 1,681,916,680,900 stalled-cycles-frontend # 89.12% frontend cycles idle [83.33%] + 643,726,007,507 stalled-cycles-backend # 34.11% backend cycles idle [66.56%] + 704,240,725,796 instructions # 0.37 insns per cycle + # 2.39 stalled cycles per insn [83.38%] + 54,650,770,111 branches # 84.718 M/sec [83.37%] + 22,788,180 branch-misses # 0.04% of all branches [83.40%] + + 40.720662136 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply_clang 3000': + + 654735.637357 task-clock # 15.838 CPUs utilized + 178,992 context-switches # 0.000 M/sec + 57,843 CPU-migrations # 0.000 M/sec + 38,676 page-faults # 0.000 M/sec + 1,915,287,511,362 cycles # 2.925 GHz [83.36%] + 1,709,570,929,231 stalled-cycles-frontend # 89.26% frontend cycles idle [83.45%] + 666,106,751,593 stalled-cycles-backend # 34.78% backend cycles idle [66.80%] + 704,465,971,543 instructions # 0.37 insns per cycle + # 2.43 stalled cycles per insn [83.46%] + 54,674,026,380 branches # 83.505 M/sec [83.27%] + 22,966,114 branch-misses # 0.04% of all branches [83.27%] + + 41.339847085 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply_clang 3000': + + 651946.916267 task-clock # 15.840 CPUs utilized + 178,727 context-switches # 0.000 M/sec + 58,382 CPU-migrations # 0.000 M/sec + 38,612 page-faults # 0.000 M/sec + 1,907,272,880,774 cycles # 2.926 GHz [83.35%] + 1,701,658,946,649 stalled-cycles-frontend # 89.22% frontend cycles idle [83.38%] + 662,579,277,388 stalled-cycles-backend # 34.74% backend cycles idle [66.68%] + 704,411,723,866 instructions # 0.37 insns per cycle + # 2.42 stalled cycles per insn [83.39%] + 54,682,387,688 branches # 83.876 M/sec [83.33%] + 23,006,900 branch-misses # 0.04% of all branches [83.36%] + + 41.157774093 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply_clang 3000': + + 658702.116455 task-clock # 15.831 CPUs utilized + 180,021 context-switches # 0.000 M/sec + 65,424 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 1,927,171,386,102 cycles # 2.926 GHz [83.37%] + 1,721,331,876,817 stalled-cycles-frontend # 89.32% frontend cycles idle [83.37%] + 680,225,081,166 stalled-cycles-backend # 35.30% backend cycles idle [66.65%] + 704,546,852,605 instructions # 0.37 insns per cycle + # 2.44 stalled cycles per insn [83.38%] + 54,713,327,269 branches # 83.062 M/sec [83.33%] + 23,170,747 branch-misses # 0.04% of all branches [83.36%] + + 41.607310118 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply_clang 3000': + + 655546.843395 task-clock # 15.839 CPUs utilized + 179,504 context-switches # 0.000 M/sec + 48,274 CPU-migrations # 0.000 M/sec + 38,633 page-faults # 0.000 M/sec + 1,917,585,435,185 cycles # 2.925 GHz [83.48%] + 1,711,878,739,585 stalled-cycles-frontend # 89.27% frontend cycles idle [83.44%] + 670,847,756,771 stalled-cycles-backend # 34.98% backend cycles idle [66.53%] + 704,441,322,711 instructions # 0.37 insns per cycle + # 2.43 stalled cycles per insn [83.27%] + 54,673,205,128 branches # 83.401 M/sec [83.31%] + 22,751,239 branch-misses # 0.04% of all branches [83.41%] + + 41.388974142 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply_clang 3000': + + 654964.010122 task-clock # 15.837 CPUs utilized + 177,750 context-switches # 0.000 M/sec + 55,614 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 1,915,850,649,855 cycles # 2.925 GHz [83.41%] + 1,710,329,479,237 stalled-cycles-frontend # 89.27% frontend cycles idle [83.45%] + 669,851,934,369 stalled-cycles-backend # 34.96% backend cycles idle [66.78%] + 704,428,294,267 instructions # 0.37 insns per cycle + # 2.43 stalled cycles per insn [83.35%] + 54,682,454,453 branches # 83.489 M/sec [83.26%] + 22,859,901 branch-misses # 0.04% of all branches [83.27%] + + 41.355687125 seconds time elapsed + diff --git a/nachi/gcc_output_100 b/nachi/gcc_output_100 new file mode 100644 index 0000000..01762c8 --- /dev/null +++ b/nachi/gcc_output_100 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 100': + + 16.526964 task-clock # 3.146 CPUs utilized + 104 context-switches # 0.006 M/sec + 100 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.024 M/sec + 36,453,917 cycles # 2.206 GHz [69.79%] + 26,162,628 stalled-cycles-frontend # 71.77% frontend cycles idle + 9,686,357 stalled-cycles-backend # 26.57% backend cycles idle + 62,112,652 instructions # 1.70 insns per cycle + # 0.42 stalled cycles per insn + 2,865,529 branches # 173.385 M/sec + 36,638 branch-misses # 1.28% of all branches [51.54%] + + 0.005252944 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 100': + + 16.487582 task-clock # 2.873 CPUs utilized + 119 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.024 M/sec + 28,029,197 cycles # 1.700 GHz [17.05%] + 25,904,797 stalled-cycles-frontend # 92.42% frontend cycles idle + 9,941,702 stalled-cycles-backend # 35.47% backend cycles idle + 62,135,429 instructions # 2.22 insns per cycle + # 0.42 stalled cycles per insn + 2,870,676 branches # 174.111 M/sec + 40,771 branch-misses # 1.42% of all branches [88.98%] + + 0.005739271 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 100': + + 15.581824 task-clock # 3.007 CPUs utilized + 121 context-switches # 0.008 M/sec + 101 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.026 M/sec + 39,399,884 cycles # 2.529 GHz [81.89%] + 25,020,285 stalled-cycles-frontend # 63.50% frontend cycles idle + 9,474,898 stalled-cycles-backend # 24.05% backend cycles idle + 62,002,884 instructions # 1.57 insns per cycle + # 0.40 stalled cycles per insn + 2,835,542 branches # 181.978 M/sec + 33,644 branch-misses # 1.19% of all branches [33.57%] + + 0.005182704 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 100': + + 15.996230 task-clock # 3.122 CPUs utilized + 111 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.025 M/sec + 33,421,613 cycles # 2.089 GHz [ 5.64%] + 25,280,416 stalled-cycles-frontend # 75.64% frontend cycles idle + 9,395,885 stalled-cycles-backend # 28.11% backend cycles idle + 62,037,017 instructions # 1.86 insns per cycle + # 0.41 stalled cycles per insn + 2,846,710 branches # 177.961 M/sec + 38,797 branch-misses # 1.36% of all branches [98.10%] + + 0.005124444 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 100': + + 16.851912 task-clock # 3.227 CPUs utilized + 96 context-switches # 0.006 M/sec + 100 CPU-migrations # 0.006 M/sec + 398 page-faults # 0.024 M/sec + 33,311,860 cycles # 1.977 GHz [35.15%] + 27,000,368 stalled-cycles-frontend # 81.05% frontend cycles idle + 9,238,737 stalled-cycles-backend # 27.73% backend cycles idle + 62,062,439 instructions # 1.86 insns per cycle + # 0.44 stalled cycles per insn + 2,856,031 branches # 169.478 M/sec + 34,865 branch-misses # 1.22% of all branches [82.37%] + + 0.005221378 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 100': + + 16.155562 task-clock # 3.110 CPUs utilized + 118 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.025 M/sec + 31,345,899 cycles # 1.940 GHz [12.53%] + 24,728,314 stalled-cycles-frontend # 78.89% frontend cycles idle [95.24%] + 9,425,647 stalled-cycles-backend # 30.07% backend cycles idle + 62,014,321 instructions # 1.98 insns per cycle + # 0.40 stalled cycles per insn + 2,836,967 branches # 175.603 M/sec + 48,434 branch-misses # 1.71% of all branches + + 0.005195433 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 100': + + 15.929430 task-clock # 3.082 CPUs utilized + 96 context-switches # 0.006 M/sec + 100 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.025 M/sec + 31,810,590 cycles # 1.997 GHz [47.91%] + 25,710,626 stalled-cycles-frontend # 80.82% frontend cycles idle + 9,458,253 stalled-cycles-backend # 29.73% backend cycles idle + 61,868,247 instructions # 1.94 insns per cycle + # 0.42 stalled cycles per insn + 2,804,292 branches # 176.045 M/sec + 34,165 branch-misses # 1.22% of all branches [73.62%] + + 0.005168431 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 100': + + 16.602924 task-clock # 3.231 CPUs utilized + 109 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.006 M/sec + 398 page-faults # 0.024 M/sec + 44,344,904 cycles # 2.671 GHz [99.55%] + 25,951,364 stalled-cycles-frontend # 58.52% frontend cycles idle + 8,793,077 stalled-cycles-backend # 19.83% backend cycles idle + 62,102,026 instructions # 1.40 insns per cycle + # 0.42 stalled cycles per insn + 2,865,263 branches # 172.576 M/sec + 62,286 branch-misses # 2.17% of all branches [ 1.20%] + + 0.005138379 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 100': + + 16.110245 task-clock # 3.122 CPUs utilized + 105 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.006 M/sec + 401 page-faults # 0.025 M/sec + 27,924,498 cycles # 1.733 GHz [25.42%] + 24,404,014 stalled-cycles-frontend # 87.39% frontend cycles idle [88.13%] + 9,187,331 stalled-cycles-backend # 32.90% backend cycles idle + 61,917,705 instructions # 2.22 insns per cycle + # 0.39 stalled cycles per insn + 2,814,112 branches # 174.678 M/sec + 46,487 branch-misses # 1.65% of all branches + + 0.005159764 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 100': + + 16.366322 task-clock # 3.210 CPUs utilized + 112 context-switches # 0.007 M/sec + 100 CPU-migrations # 0.006 M/sec + 399 page-faults # 0.024 M/sec + 42,830,254 cycles # 2.617 GHz [97.59%] + 25,580,641 stalled-cycles-frontend # 59.73% frontend cycles idle + 8,832,468 stalled-cycles-backend # 20.62% backend cycles idle + 62,013,287 instructions # 1.45 insns per cycle + # 0.41 stalled cycles per insn + 2,837,106 branches # 173.350 M/sec + 39,891 branch-misses # 1.41% of all branches [ 7.17%] + + 0.005098681 seconds time elapsed + diff --git a/nachi/gcc_output_1000 b/nachi/gcc_output_1000 new file mode 100644 index 0000000..d958bd2 --- /dev/null +++ b/nachi/gcc_output_1000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 1000': + + 21759.987600 task-clock # 15.556 CPUs utilized + 6,481 context-switches # 0.000 M/sec + 2,665 CPU-migrations # 0.000 M/sec + 5,179 page-faults # 0.000 M/sec + 63,429,892,465 cycles # 2.915 GHz [83.23%] + 49,367,792,493 stalled-cycles-frontend # 77.83% frontend cycles idle [82.77%] + 6,604,925,305 stalled-cycles-backend # 10.41% backend cycles idle [67.78%] + 53,053,790,943 instructions # 0.84 insns per cycle + # 0.93 stalled cycles per insn [84.29%] + 1,053,913,894 branches # 48.434 M/sec [84.06%] + 1,988,565 branch-misses # 0.19% of all branches [83.87%] + + 1.398773861 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 1000': + + 21894.620421 task-clock # 15.505 CPUs utilized + 6,398 context-switches # 0.000 M/sec + 1,823 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 63,609,698,331 cycles # 2.905 GHz [83.12%] + 49,851,579,001 stalled-cycles-frontend # 78.37% frontend cycles idle [83.36%] + 6,602,385,045 stalled-cycles-backend # 10.38% backend cycles idle [68.41%] + 52,938,537,510 instructions # 0.83 insns per cycle + # 0.94 stalled cycles per insn [84.59%] + 1,054,775,480 branches # 48.175 M/sec [83.96%] + 1,927,116 branch-misses # 0.18% of all branches [83.13%] + + 1.412111503 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 1000': + + 22043.617028 task-clock # 15.553 CPUs utilized + 6,153 context-switches # 0.000 M/sec + 2,272 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 64,173,061,402 cycles # 2.911 GHz [84.03%] + 50,266,809,847 stalled-cycles-frontend # 78.33% frontend cycles idle [83.75%] + 7,014,131,878 stalled-cycles-backend # 10.93% backend cycles idle [67.34%] + 52,936,825,652 instructions # 0.82 insns per cycle + # 0.95 stalled cycles per insn [83.62%] + 1,048,455,744 branches # 47.563 M/sec [83.34%] + 1,984,549 branch-misses # 0.19% of all branches [83.86%] + + 1.417367737 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 1000': + + 21777.939104 task-clock # 15.565 CPUs utilized + 6,330 context-switches # 0.000 M/sec + 1,992 CPU-migrations # 0.000 M/sec + 5,179 page-faults # 0.000 M/sec + 63,551,374,319 cycles # 2.918 GHz [84.78%] + 49,438,624,981 stalled-cycles-frontend # 77.79% frontend cycles idle [84.27%] + 6,528,975,952 stalled-cycles-backend # 10.27% backend cycles idle [66.11%] + 52,810,033,203 instructions # 0.83 insns per cycle + # 0.94 stalled cycles per insn [82.89%] + 1,051,573,786 branches # 48.286 M/sec [82.83%] + 1,978,837 branch-misses # 0.19% of all branches [84.06%] + + 1.399185690 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 1000': + + 21761.865117 task-clock # 15.553 CPUs utilized + 6,094 context-switches # 0.000 M/sec + 2,149 CPU-migrations # 0.000 M/sec + 5,181 page-faults # 0.000 M/sec + 63,479,203,754 cycles # 2.917 GHz [84.38%] + 49,378,720,984 stalled-cycles-frontend # 77.79% frontend cycles idle [83.74%] + 6,477,708,666 stalled-cycles-backend # 10.20% backend cycles idle [66.28%] + 52,776,416,740 instructions # 0.83 insns per cycle + # 0.94 stalled cycles per insn [83.58%] + 1,049,396,297 branches # 48.222 M/sec [83.90%] + 1,987,217 branch-misses # 0.19% of all branches [84.29%] + + 1.399180433 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 1000': + + 22204.242397 task-clock # 15.573 CPUs utilized + 6,320 context-switches # 0.000 M/sec + 2,059 CPU-migrations # 0.000 M/sec + 5,179 page-faults # 0.000 M/sec + 64,588,153,302 cycles # 2.909 GHz [83.86%] + 50,539,262,151 stalled-cycles-frontend # 78.25% frontend cycles idle [83.35%] + 7,212,614,272 stalled-cycles-backend # 11.17% backend cycles idle [66.98%] + 52,844,422,587 instructions # 0.82 insns per cycle + # 0.96 stalled cycles per insn [84.03%] + 1,053,775,012 branches # 47.458 M/sec [84.05%] + 1,916,621 branch-misses # 0.18% of all branches [84.11%] + + 1.425771983 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 1000': + + 22045.653567 task-clock # 15.567 CPUs utilized + 6,182 context-switches # 0.000 M/sec + 2,397 CPU-migrations # 0.000 M/sec + 5,181 page-faults # 0.000 M/sec + 64,260,596,853 cycles # 2.915 GHz [84.27%] + 50,027,251,096 stalled-cycles-frontend # 77.85% frontend cycles idle [83.07%] + 6,941,098,071 stalled-cycles-backend # 10.80% backend cycles idle [66.48%] + 52,706,233,989 instructions # 0.82 insns per cycle + # 0.95 stalled cycles per insn [84.15%] + 1,051,008,488 branches # 47.674 M/sec [84.36%] + 1,868,622 branch-misses # 0.18% of all branches [84.50%] + + 1.416151975 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 1000': + + 21750.280495 task-clock # 15.565 CPUs utilized + 6,411 context-switches # 0.000 M/sec + 1,987 CPU-migrations # 0.000 M/sec + 5,181 page-faults # 0.000 M/sec + 63,249,133,857 cycles # 2.908 GHz [83.30%] + 49,462,677,649 stalled-cycles-frontend # 78.20% frontend cycles idle [83.90%] + 6,482,133,844 stalled-cycles-backend # 10.25% backend cycles idle [67.59%] + 52,955,706,253 instructions # 0.84 insns per cycle + # 0.93 stalled cycles per insn [83.95%] + 1,052,780,102 branches # 48.403 M/sec [84.16%] + 1,912,232 branch-misses # 0.18% of all branches [83.08%] + + 1.397370694 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 1000': + + 21740.348672 task-clock # 15.569 CPUs utilized + 6,535 context-switches # 0.000 M/sec + 2,098 CPU-migrations # 0.000 M/sec + 5,180 page-faults # 0.000 M/sec + 63,456,817,523 cycles # 2.919 GHz [83.70%] + 49,356,070,441 stalled-cycles-frontend # 77.78% frontend cycles idle [83.18%] + 6,457,644,708 stalled-cycles-backend # 10.18% backend cycles idle [66.90%] + 52,944,698,361 instructions # 0.83 insns per cycle + # 0.93 stalled cycles per insn [84.19%] + 1,053,467,394 branches # 48.457 M/sec [83.89%] + 1,998,667 branch-misses # 0.19% of all branches [83.76%] + + 1.396364487 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 1000': + + 21851.753067 task-clock # 15.553 CPUs utilized + 5,992 context-switches # 0.000 M/sec + 2,186 CPU-migrations # 0.000 M/sec + 5,181 page-faults # 0.000 M/sec + 63,679,830,358 cycles # 2.914 GHz [84.73%] + 49,469,602,085 stalled-cycles-frontend # 77.68% frontend cycles idle [84.59%] + 6,666,706,967 stalled-cycles-backend # 10.47% backend cycles idle [66.33%] + 52,737,810,072 instructions # 0.83 insns per cycle + # 0.94 stalled cycles per insn [83.30%] + 1,051,670,417 branches # 48.128 M/sec [83.39%] + 1,886,049 branch-misses # 0.18% of all branches [84.03%] + + 1.405030068 seconds time elapsed + diff --git a/nachi/gcc_output_3000 b/nachi/gcc_output_3000 new file mode 100644 index 0000000..3fdec9e --- /dev/null +++ b/nachi/gcc_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for './matrixMultiply 3000': + + 860205.810931 task-clock # 15.849 CPUs utilized + 234,510 context-switches # 0.000 M/sec + 70,354 CPU-migrations # 0.000 M/sec + 38,611 page-faults # 0.000 M/sec + 2,516,822,235,355 cycles # 2.926 GHz [83.42%] + 2,114,479,764,565 stalled-cycles-frontend # 84.01% frontend cycles idle [83.37%] + 790,618,924,042 stalled-cycles-backend # 31.41% backend cycles idle [66.59%] + 1,433,763,926,057 instructions # 0.57 insns per cycle + # 1.47 stalled cycles per insn [83.35%] + 27,720,667,138 branches # 32.226 M/sec [83.29%] + 28,519,942 branch-misses # 0.10% of all branches [83.42%] + + 54.276120649 seconds time elapsed + +Iteration 2 + + Performance counter stats for './matrixMultiply 3000': + + 882515.006472 task-clock # 15.430 CPUs utilized + 227,863 context-switches # 0.000 M/sec + 126,644 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 2,580,962,745,542 cycles # 2.925 GHz [83.45%] + 2,177,625,159,135 stalled-cycles-frontend # 84.37% frontend cycles idle [83.33%] + 859,801,396,498 stalled-cycles-backend # 33.31% backend cycles idle [66.66%] + 1,433,457,377,962 instructions # 0.56 insns per cycle + # 1.52 stalled cycles per insn [83.39%] + 27,762,808,794 branches # 31.459 M/sec [83.39%] + 28,465,567 branch-misses # 0.10% of all branches [83.42%] + + 57.193802752 seconds time elapsed + +Iteration 3 + + Performance counter stats for './matrixMultiply 3000': + + 854264.765174 task-clock # 15.871 CPUs utilized + 230,580 context-switches # 0.000 M/sec + 76,576 CPU-migrations # 0.000 M/sec + 38,611 page-faults # 0.000 M/sec + 2,499,416,883,824 cycles # 2.926 GHz [83.37%] + 2,096,498,739,190 stalled-cycles-frontend # 83.88% frontend cycles idle [83.40%] + 782,605,462,912 stalled-cycles-backend # 31.31% backend cycles idle [66.69%] + 1,433,878,355,477 instructions # 0.57 insns per cycle + # 1.46 stalled cycles per insn [83.37%] + 27,730,091,575 branches # 32.461 M/sec [83.30%] + 26,719,814 branch-misses # 0.10% of all branches [83.34%] + + 53.825933410 seconds time elapsed + +Iteration 4 + + Performance counter stats for './matrixMultiply 3000': + + 858505.869421 task-clock # 15.870 CPUs utilized + 231,124 context-switches # 0.000 M/sec + 80,180 CPU-migrations # 0.000 M/sec + 38,660 page-faults # 0.000 M/sec + 2,511,605,766,623 cycles # 2.926 GHz [83.35%] + 2,109,221,164,800 stalled-cycles-frontend # 83.98% frontend cycles idle [83.41%] + 786,062,347,244 stalled-cycles-backend # 31.30% backend cycles idle [66.70%] + 1,433,565,203,990 instructions # 0.57 insns per cycle + # 1.47 stalled cycles per insn [83.35%] + 27,733,411,713 branches # 32.304 M/sec [83.32%] + 26,318,172 branch-misses # 0.09% of all branches [83.36%] + + 54.097194945 seconds time elapsed + +Iteration 5 + + Performance counter stats for './matrixMultiply 3000': + + 860441.294798 task-clock # 15.863 CPUs utilized + 230,922 context-switches # 0.000 M/sec + 108,948 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 2,517,063,934,337 cycles # 2.925 GHz [83.26%] + 2,113,756,857,333 stalled-cycles-frontend # 83.98% frontend cycles idle [83.36%] + 801,321,762,168 stalled-cycles-backend # 31.84% backend cycles idle [66.77%] + 1,433,674,478,670 instructions # 0.57 insns per cycle + # 1.47 stalled cycles per insn [83.40%] + 27,762,467,992 branches # 32.265 M/sec [83.43%] + 26,886,576 branch-misses # 0.10% of all branches [83.31%] + + 54.243632261 seconds time elapsed + +Iteration 6 + + Performance counter stats for './matrixMultiply 3000': + + 856399.807280 task-clock # 15.866 CPUs utilized + 230,812 context-switches # 0.000 M/sec + 78,590 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 2,505,658,591,134 cycles # 2.926 GHz [83.37%] + 2,102,572,425,641 stalled-cycles-frontend # 83.91% frontend cycles idle [83.35%] + 789,308,853,316 stalled-cycles-backend # 31.50% backend cycles idle [66.66%] + 1,433,495,093,882 instructions # 0.57 insns per cycle + # 1.47 stalled cycles per insn [83.38%] + 27,717,954,377 branches # 32.366 M/sec [83.35%] + 26,736,752 branch-misses # 0.10% of all branches [83.39%] + + 53.976446689 seconds time elapsed + +Iteration 7 + + Performance counter stats for './matrixMultiply 3000': + + 868141.868761 task-clock # 15.866 CPUs utilized + 233,574 context-switches # 0.000 M/sec + 128,584 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 2,540,079,445,525 cycles # 2.926 GHz [83.33%] + 2,136,275,085,706 stalled-cycles-frontend # 84.10% frontend cycles idle [83.32%] + 820,148,490,377 stalled-cycles-backend # 32.29% backend cycles idle [66.70%] + 1,433,896,448,048 instructions # 0.56 insns per cycle + # 1.49 stalled cycles per insn [83.39%] + 27,773,516,427 branches # 31.992 M/sec [83.37%] + 26,879,804 branch-misses # 0.10% of all branches [83.35%] + + 54.717140316 seconds time elapsed + +Iteration 8 + + Performance counter stats for './matrixMultiply 3000': + + 855862.319539 task-clock # 15.862 CPUs utilized + 228,776 context-switches # 0.000 M/sec + 61,235 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 2,503,713,416,489 cycles # 2.925 GHz [83.39%] + 2,100,939,156,723 stalled-cycles-frontend # 83.91% frontend cycles idle [83.38%] + 786,888,683,406 stalled-cycles-backend # 31.43% backend cycles idle [66.77%] + 1,433,385,300,767 instructions # 0.57 insns per cycle + # 1.47 stalled cycles per insn [83.39%] + 27,702,826,813 branches # 32.368 M/sec [83.31%] + 26,354,787 branch-misses # 0.10% of all branches [83.32%] + + 53.957777043 seconds time elapsed + +Iteration 9 + + Performance counter stats for './matrixMultiply 3000': + + 852778.721646 task-clock # 15.870 CPUs utilized + 230,420 context-switches # 0.000 M/sec + 78,270 CPU-migrations # 0.000 M/sec + 38,609 page-faults # 0.000 M/sec + 2,495,232,336,534 cycles # 2.926 GHz [83.40%] + 2,092,343,344,322 stalled-cycles-frontend # 83.85% frontend cycles idle [83.40%] + 777,115,946,059 stalled-cycles-backend # 31.14% backend cycles idle [66.60%] + 1,433,546,934,907 instructions # 0.57 insns per cycle + # 1.46 stalled cycles per insn [83.32%] + 27,725,994,034 branches # 32.513 M/sec [83.32%] + 26,644,251 branch-misses # 0.10% of all branches [83.35%] + + 53.735780919 seconds time elapsed + +Iteration 10 + + Performance counter stats for './matrixMultiply 3000': + + 858392.389037 task-clock # 15.864 CPUs utilized + 231,489 context-switches # 0.000 M/sec + 97,281 CPU-migrations # 0.000 M/sec + 38,611 page-faults # 0.000 M/sec + 2,511,541,413,765 cycles # 2.926 GHz [83.35%] + 2,108,405,510,692 stalled-cycles-frontend # 83.95% frontend cycles idle [83.38%] + 794,482,610,456 stalled-cycles-backend # 31.63% backend cycles idle [66.64%] + 1,433,654,552,499 instructions # 0.57 insns per cycle + # 1.47 stalled cycles per insn [83.35%] + 27,737,245,944 branches # 32.313 M/sec [83.35%] + 26,708,999 branch-misses # 0.10% of all branches [83.37%] + + 54.107802245 seconds time elapsed + diff --git a/nachi/java_output_100 b/nachi/java_output_100 new file mode 100644 index 0000000..3c00152 --- /dev/null +++ b/nachi/java_output_100 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 100': + + 283.354441 task-clock # 2.145 CPUs utilized + 1,996 context-switches # 0.007 M/sec + 327 CPU-migrations # 0.001 M/sec + 6,725 page-faults # 0.024 M/sec + 757,684,865 cycles # 2.674 GHz [94.55%] + 601,008,093 stalled-cycles-frontend # 79.32% frontend cycles idle [66.66%] + 368,681,319 stalled-cycles-backend # 48.66% backend cycles idle [52.15%] + 325,081,879 instructions # 0.43 insns per cycle + # 1.85 stalled cycles per insn [90.10%] + 62,748,470 branches # 221.449 M/sec [92.86%] + 3,322,751 branch-misses # 5.30% of all branches [94.71%] + + 0.132115786 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 100': + + 338.088850 task-clock # 2.509 CPUs utilized + 2,106 context-switches # 0.006 M/sec + 363 CPU-migrations # 0.001 M/sec + 6,757 page-faults # 0.020 M/sec + 911,763,181 cycles # 2.697 GHz [93.04%] + 712,594,242 stalled-cycles-frontend # 78.16% frontend cycles idle [85.89%] + 456,617,220 stalled-cycles-backend # 50.08% backend cycles idle [54.26%] + 341,933,515 instructions # 0.38 insns per cycle + # 2.08 stalled cycles per insn [86.11%] + 69,819,614 branches # 206.513 M/sec [81.09%] + 3,657,203 branch-misses # 5.24% of all branches [86.68%] + + 0.134743537 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 100': + + 268.245880 task-clock # 2.303 CPUs utilized + 2,005 context-switches # 0.007 M/sec + 336 CPU-migrations # 0.001 M/sec + 6,727 page-faults # 0.025 M/sec + 763,576,936 cycles # 2.847 GHz [93.65%] + 577,455,623 stalled-cycles-frontend # 75.63% frontend cycles idle [84.35%] + 386,997,172 stalled-cycles-backend # 50.68% backend cycles idle [39.23%] + 313,757,058 instructions # 0.41 insns per cycle + # 1.84 stalled cycles per insn [78.64%] + 63,043,597 branches # 235.022 M/sec [89.57%] + 3,332,056 branch-misses # 5.29% of all branches [94.03%] + + 0.116471144 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 100': + + 280.450477 task-clock # 2.256 CPUs utilized + 1,949 context-switches # 0.007 M/sec + 319 CPU-migrations # 0.001 M/sec + 6,736 page-faults # 0.024 M/sec + 759,302,803 cycles # 2.707 GHz [93.55%] + 591,418,156 stalled-cycles-frontend # 77.89% frontend cycles idle [92.39%] + 380,043,335 stalled-cycles-backend # 50.05% backend cycles idle [39.39%] + 368,571,468 instructions # 0.49 insns per cycle + # 1.60 stalled cycles per insn [74.79%] + 63,949,851 branches # 228.025 M/sec [80.46%] + 3,356,008 branch-misses # 5.25% of all branches [95.20%] + + 0.124339154 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 100': + + 293.770032 task-clock # 2.301 CPUs utilized + 1,953 context-switches # 0.007 M/sec + 352 CPU-migrations # 0.001 M/sec + 6,782 page-faults # 0.023 M/sec + 804,373,299 cycles # 2.738 GHz [90.22%] + 630,742,200 stalled-cycles-frontend # 78.41% frontend cycles idle [93.44%] + 422,195,526 stalled-cycles-backend # 52.49% backend cycles idle [71.92%] + 378,129,558 instructions # 0.47 insns per cycle + # 1.67 stalled cycles per insn [79.63%] + 75,350,522 branches # 256.495 M/sec [71.36%] + 3,597,886 branch-misses # 4.77% of all branches [74.10%] + + 0.127679668 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 100': + + 242.775518 task-clock # 1.922 CPUs utilized + 1,874 context-switches # 0.008 M/sec + 304 CPU-migrations # 0.001 M/sec + 6,714 page-faults # 0.028 M/sec + 644,332,032 cycles # 2.654 GHz [90.98%] + 467,888,070 stalled-cycles-frontend # 72.62% frontend cycles idle [73.19%] + 321,306,239 stalled-cycles-backend # 49.87% backend cycles idle [57.02%] + 321,581,664 instructions # 0.50 insns per cycle + # 1.45 stalled cycles per insn [88.59%] + 62,690,569 branches # 258.224 M/sec [89.76%] + 3,292,013 branch-misses # 5.25% of all branches [91.18%] + + 0.126314213 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 100': + + 323.610399 task-clock # 2.501 CPUs utilized + 2,068 context-switches # 0.006 M/sec + 347 CPU-migrations # 0.001 M/sec + 6,754 page-faults # 0.021 M/sec + 888,192,688 cycles # 2.745 GHz [94.02%] + 728,669,291 stalled-cycles-frontend # 82.04% frontend cycles idle [69.68%] + 435,937,233 stalled-cycles-backend # 49.08% backend cycles idle [48.98%] + 343,965,630 instructions # 0.39 insns per cycle + # 2.12 stalled cycles per insn [85.53%] + 65,793,733 branches # 203.312 M/sec [92.89%] + 3,416,021 branch-misses # 5.19% of all branches [95.79%] + + 0.129381639 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 100': + + 273.971717 task-clock # 2.096 CPUs utilized + 1,802 context-switches # 0.007 M/sec + 296 CPU-migrations # 0.001 M/sec + 6,723 page-faults # 0.025 M/sec + 727,064,381 cycles # 2.654 GHz [80.14%] + 522,523,220 stalled-cycles-frontend # 71.87% frontend cycles idle [69.62%] + 434,702,589 stalled-cycles-backend # 59.79% backend cycles idle [60.80%] + 300,057,996 instructions # 0.41 insns per cycle + # 1.74 stalled cycles per insn [91.04%] + 63,443,400 branches # 231.569 M/sec [95.34%] + 3,330,994 branch-misses # 5.25% of all branches [94.94%] + + 0.130718321 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 100': + + 282.056510 task-clock # 2.229 CPUs utilized + 2,094 context-switches # 0.007 M/sec + 340 CPU-migrations # 0.001 M/sec + 6,752 page-faults # 0.024 M/sec + 769,116,910 cycles # 2.727 GHz [93.06%] + 596,936,505 stalled-cycles-frontend # 77.61% frontend cycles idle [90.56%] + 343,706,833 stalled-cycles-backend # 44.69% backend cycles idle [43.33%] + 366,040,953 instructions # 0.48 insns per cycle + # 1.63 stalled cycles per insn [81.06%] + 68,732,974 branches # 243.685 M/sec [81.13%] + 3,348,250 branch-misses # 4.87% of all branches [92.96%] + + 0.126540647 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 100': + + 299.855978 task-clock # 2.392 CPUs utilized + 1,848 context-switches # 0.006 M/sec + 329 CPU-migrations # 0.001 M/sec + 6,745 page-faults # 0.022 M/sec + 808,730,353 cycles # 2.697 GHz [94.81%] + 653,295,569 stalled-cycles-frontend # 80.78% frontend cycles idle [67.35%] + 394,780,343 stalled-cycles-backend # 48.81% backend cycles idle [48.92%] + 300,769,692 instructions # 0.37 insns per cycle + # 2.17 stalled cycles per insn [91.90%] + 63,824,979 branches # 212.852 M/sec [94.60%] + 3,336,194 branch-misses # 5.23% of all branches [95.28%] + + 0.125348658 seconds time elapsed + diff --git a/nachi/java_output_1000 b/nachi/java_output_1000 new file mode 100644 index 0000000..a35834b --- /dev/null +++ b/nachi/java_output_1000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15463.497643 task-clock # 10.876 CPUs utilized + 22,306 context-switches # 0.001 M/sec + 6,881 CPU-migrations # 0.000 M/sec + 24,766 page-faults # 0.002 M/sec + 45,169,805,707 cycles # 2.921 GHz [82.46%] + 38,887,899,493 stalled-cycles-frontend # 86.09% frontend cycles idle [83.54%] + 18,094,789,687 stalled-cycles-backend # 40.06% backend cycles idle [68.64%] + 11,723,814,904 instructions # 0.26 insns per cycle + # 3.32 stalled cycles per insn [85.25%] + 1,664,427,035 branches # 107.636 M/sec [83.22%] + 9,666,208 branch-misses # 0.58% of all branches [83.29%] + + 1.421771575 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15536.291359 task-clock # 10.865 CPUs utilized + 21,152 context-switches # 0.001 M/sec + 6,832 CPU-migrations # 0.000 M/sec + 24,637 page-faults # 0.002 M/sec + 45,329,423,308 cycles # 2.918 GHz [84.03%] + 39,153,854,215 stalled-cycles-frontend # 86.38% frontend cycles idle [82.57%] + 18,069,588,087 stalled-cycles-backend # 39.86% backend cycles idle [65.30%] + 11,749,027,673 instructions # 0.26 insns per cycle + # 3.33 stalled cycles per insn [84.47%] + 1,668,791,692 branches # 107.412 M/sec [84.86%] + 9,303,055 branch-misses # 0.56% of all branches [84.41%] + + 1.429977275 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15551.541367 task-clock # 11.253 CPUs utilized + 21,717 context-switches # 0.001 M/sec + 7,276 CPU-migrations # 0.000 M/sec + 24,689 page-faults # 0.002 M/sec + 45,371,967,474 cycles # 2.918 GHz [82.47%] + 39,193,073,684 stalled-cycles-frontend # 86.38% frontend cycles idle [83.09%] + 18,065,558,844 stalled-cycles-backend # 39.82% backend cycles idle [68.32%] + 11,733,606,524 instructions # 0.26 insns per cycle + # 3.34 stalled cycles per insn [85.53%] + 1,659,102,181 branches # 106.684 M/sec [84.64%] + 9,154,605 branch-misses # 0.55% of all branches [82.88%] + + 1.381995838 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15735.397801 task-clock # 11.167 CPUs utilized + 22,145 context-switches # 0.001 M/sec + 7,299 CPU-migrations # 0.000 M/sec + 24,778 page-faults # 0.002 M/sec + 45,902,129,052 cycles # 2.917 GHz [84.69%] + 39,710,801,032 stalled-cycles-frontend # 86.51% frontend cycles idle [83.40%] + 18,310,819,764 stalled-cycles-backend # 39.89% backend cycles idle [66.97%] + 11,782,579,345 instructions # 0.26 insns per cycle + # 3.37 stalled cycles per insn [84.25%] + 1,669,509,926 branches # 106.099 M/sec [83.07%] + 9,358,463 branch-misses # 0.56% of all branches [83.28%] + + 1.409036472 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15335.872318 task-clock # 11.047 CPUs utilized + 21,225 context-switches # 0.001 M/sec + 6,691 CPU-migrations # 0.000 M/sec + 24,636 page-faults # 0.002 M/sec + 44,731,915,650 cycles # 2.917 GHz [84.01%] + 38,543,076,947 stalled-cycles-frontend # 86.16% frontend cycles idle [83.84%] + 17,989,972,378 stalled-cycles-backend # 40.22% backend cycles idle [65.38%] + 11,623,305,279 instructions # 0.26 insns per cycle + # 3.32 stalled cycles per insn [84.46%] + 1,658,274,295 branches # 108.130 M/sec [85.07%] + 8,698,301 branch-misses # 0.52% of all branches [83.01%] + + 1.388207432 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15592.311662 task-clock # 11.263 CPUs utilized + 19,832 context-switches # 0.001 M/sec + 5,753 CPU-migrations # 0.000 M/sec + 24,815 page-faults # 0.002 M/sec + 45,452,158,085 cycles # 2.915 GHz [82.89%] + 39,138,858,277 stalled-cycles-frontend # 86.11% frontend cycles idle [83.53%] + 17,898,884,103 stalled-cycles-backend # 39.38% backend cycles idle [69.08%] + 11,710,820,480 instructions # 0.26 insns per cycle + # 3.34 stalled cycles per insn [85.76%] + 1,651,684,642 branches # 105.929 M/sec [83.26%] + 9,078,967 branch-misses # 0.55% of all branches [83.24%] + + 1.384377412 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15654.331781 task-clock # 11.479 CPUs utilized + 20,227 context-switches # 0.001 M/sec + 6,349 CPU-migrations # 0.000 M/sec + 24,741 page-faults # 0.002 M/sec + 45,657,141,163 cycles # 2.917 GHz [83.36%] + 39,401,435,093 stalled-cycles-frontend # 86.30% frontend cycles idle [84.03%] + 17,745,380,441 stalled-cycles-backend # 38.87% backend cycles idle [67.68%] + 11,706,300,347 instructions # 0.26 insns per cycle + # 3.37 stalled cycles per insn [85.12%] + 1,653,571,188 branches # 105.630 M/sec [83.28%] + 9,246,034 branch-misses # 0.56% of all branches [83.29%] + + 1.363755206 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15455.435348 task-clock # 10.921 CPUs utilized + 21,811 context-switches # 0.001 M/sec + 6,659 CPU-migrations # 0.000 M/sec + 24,630 page-faults # 0.002 M/sec + 45,133,225,981 cycles # 2.920 GHz [85.80%] + 38,989,293,367 stalled-cycles-frontend # 86.39% frontend cycles idle [82.88%] + 17,921,589,451 stalled-cycles-backend # 39.71% backend cycles idle [63.48%] + 11,713,626,557 instructions # 0.26 insns per cycle + # 3.33 stalled cycles per insn [83.36%] + 1,673,323,324 branches # 108.268 M/sec [84.28%] + 9,168,563 branch-misses # 0.55% of all branches [84.64%] + + 1.415227686 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15538.632158 task-clock # 11.416 CPUs utilized + 22,666 context-switches # 0.001 M/sec + 7,372 CPU-migrations # 0.000 M/sec + 24,687 page-faults # 0.002 M/sec + 45,347,372,190 cycles # 2.918 GHz [83.45%] + 39,169,333,472 stalled-cycles-frontend # 86.38% frontend cycles idle [83.37%] + 17,940,245,903 stalled-cycles-backend # 39.56% backend cycles idle [68.00%] + 11,723,294,261 instructions # 0.26 insns per cycle + # 3.34 stalled cycles per insn [84.83%] + 1,671,077,921 branches # 107.543 M/sec [83.62%] + 9,236,837 branch-misses # 0.55% of all branches [82.75%] + + 1.361126626 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 1000': + + 15792.455525 task-clock # 11.248 CPUs utilized + 20,135 context-switches # 0.001 M/sec + 6,314 CPU-migrations # 0.000 M/sec + 24,724 page-faults # 0.002 M/sec + 46,090,703,603 cycles # 2.919 GHz [84.12%] + 39,815,476,619 stalled-cycles-frontend # 86.39% frontend cycles idle [85.13%] + 18,256,298,976 stalled-cycles-backend # 39.61% backend cycles idle [65.38%] + 11,751,190,874 instructions # 0.25 insns per cycle + # 3.39 stalled cycles per insn [83.29%] + 1,665,700,655 branches # 105.474 M/sec [82.53%] + 9,526,366 branch-misses # 0.57% of all branches [84.23%] + + 1.403973693 seconds time elapsed + diff --git a/nachi/java_output_3000 b/nachi/java_output_3000 new file mode 100644 index 0000000..4303492 --- /dev/null +++ b/nachi/java_output_3000 @@ -0,0 +1,180 @@ +Iteration 1 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1098229.495232 task-clock # 15.810 CPUs utilized + 283,933 context-switches # 0.000 M/sec + 14,301 CPU-migrations # 0.000 M/sec + 108,174 page-faults # 0.000 M/sec + 3,213,068,817,618 cycles # 2.926 GHz [83.34%] + 3,044,819,074,741 stalled-cycles-frontend # 94.76% frontend cycles idle [83.35%] + 1,918,427,858,676 stalled-cycles-backend # 59.71% backend cycles idle [66.69%] + 301,226,849,351 instructions # 0.09 insns per cycle + # 10.11 stalled cycles per insn [83.35%] + 41,257,136,015 branches # 37.567 M/sec [83.35%] + 41,574,782 branch-misses # 0.10% of all branches [83.34%] + + 69.463141367 seconds time elapsed + +Iteration 2 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1095733.540371 task-clock # 15.833 CPUs utilized + 285,563 context-switches # 0.000 M/sec + 15,217 CPU-migrations # 0.000 M/sec + 108,138 page-faults # 0.000 M/sec + 3,205,643,537,535 cycles # 2.926 GHz [83.35%] + 3,037,250,231,623 stalled-cycles-frontend # 94.75% frontend cycles idle [83.34%] + 1,923,617,163,998 stalled-cycles-backend # 60.01% backend cycles idle [66.67%] + 301,261,892,754 instructions # 0.09 insns per cycle + # 10.08 stalled cycles per insn [83.35%] + 41,265,413,266 branches # 37.660 M/sec [83.34%] + 40,906,179 branch-misses # 0.10% of all branches [83.37%] + + 69.207783278 seconds time elapsed + +Iteration 3 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1118977.992693 task-clock # 15.834 CPUs utilized + 289,818 context-switches # 0.000 M/sec + 16,778 CPU-migrations # 0.000 M/sec + 108,758 page-faults # 0.000 M/sec + 3,273,695,989,903 cycles # 2.926 GHz [83.35%] + 3,105,261,402,539 stalled-cycles-frontend # 94.85% frontend cycles idle [83.34%] + 1,969,326,796,304 stalled-cycles-backend # 60.16% backend cycles idle [66.69%] + 301,362,486,909 instructions # 0.09 insns per cycle + # 10.30 stalled cycles per insn [83.36%] + 41,293,973,902 branches # 36.903 M/sec [83.35%] + 41,342,242 branch-misses # 0.10% of all branches [83.34%] + + 70.671154426 seconds time elapsed + +Iteration 4 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1107212.571510 task-clock # 15.831 CPUs utilized + 292,284 context-switches # 0.000 M/sec + 15,069 CPU-migrations # 0.000 M/sec + 107,633 page-faults # 0.000 M/sec + 3,239,218,642,983 cycles # 2.926 GHz [83.37%] + 3,070,910,582,536 stalled-cycles-frontend # 94.80% frontend cycles idle [83.33%] + 1,946,392,137,462 stalled-cycles-backend # 60.09% backend cycles idle [66.67%] + 301,303,292,829 instructions # 0.09 insns per cycle + # 10.19 stalled cycles per insn [83.36%] + 41,266,660,187 branches # 37.271 M/sec [83.35%] + 41,265,327 branch-misses # 0.10% of all branches [83.36%] + + 69.940252820 seconds time elapsed + +Iteration 5 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1090520.324067 task-clock # 15.832 CPUs utilized + 285,305 context-switches # 0.000 M/sec + 14,134 CPU-migrations # 0.000 M/sec + 108,387 page-faults # 0.000 M/sec + 3,190,358,410,683 cycles # 2.926 GHz [83.36%] + 3,022,101,893,539 stalled-cycles-frontend # 94.73% frontend cycles idle [83.34%] + 1,902,324,866,447 stalled-cycles-backend # 59.63% backend cycles idle [66.68%] + 301,179,982,830 instructions # 0.09 insns per cycle + # 10.03 stalled cycles per insn [83.37%] + 41,243,427,689 branches # 37.820 M/sec [83.35%] + 41,371,527 branch-misses # 0.10% of all branches [83.33%] + + 68.881409184 seconds time elapsed + +Iteration 6 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1109467.608506 task-clock # 15.818 CPUs utilized + 289,661 context-switches # 0.000 M/sec + 16,182 CPU-migrations # 0.000 M/sec + 107,866 page-faults # 0.000 M/sec + 3,245,869,342,157 cycles # 2.926 GHz [83.35%] + 3,077,573,759,564 stalled-cycles-frontend # 94.82% frontend cycles idle [83.35%] + 1,945,681,194,886 stalled-cycles-backend # 59.94% backend cycles idle [66.65%] + 301,341,373,348 instructions # 0.09 insns per cycle + # 10.21 stalled cycles per insn [83.35%] + 41,279,475,336 branches # 37.207 M/sec [83.37%] + 41,170,012 branch-misses # 0.10% of all branches [83.34%] + + 70.140477125 seconds time elapsed + +Iteration 7 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1106925.344375 task-clock # 15.831 CPUs utilized + 288,953 context-switches # 0.000 M/sec + 14,985 CPU-migrations # 0.000 M/sec + 107,010 page-faults # 0.000 M/sec + 3,238,328,486,255 cycles # 2.926 GHz [83.34%] + 3,069,946,411,387 stalled-cycles-frontend # 94.80% frontend cycles idle [83.36%] + 1,955,237,041,454 stalled-cycles-backend # 60.38% backend cycles idle [66.68%] + 301,139,640,713 instructions # 0.09 insns per cycle + # 10.19 stalled cycles per insn [83.37%] + 41,244,125,655 branches # 37.260 M/sec [83.34%] + 40,845,997 branch-misses # 0.10% of all branches [83.35%] + + 69.920967418 seconds time elapsed + +Iteration 8 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1133007.332365 task-clock # 15.849 CPUs utilized + 298,339 context-switches # 0.000 M/sec + 16,592 CPU-migrations # 0.000 M/sec + 108,263 page-faults # 0.000 M/sec + 3,314,692,749,448 cycles # 2.926 GHz [83.35%] + 3,146,436,215,319 stalled-cycles-frontend # 94.92% frontend cycles idle [83.34%] + 2,000,489,659,309 stalled-cycles-backend # 60.35% backend cycles idle [66.67%] + 301,342,529,373 instructions # 0.09 insns per cycle + # 10.44 stalled cycles per insn [83.35%] + 41,266,633,341 branches # 36.422 M/sec [83.36%] + 41,410,662 branch-misses # 0.10% of all branches [83.35%] + + 71.488854647 seconds time elapsed + +Iteration 9 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1096714.839110 task-clock # 15.846 CPUs utilized + 287,766 context-switches # 0.000 M/sec + 14,751 CPU-migrations # 0.000 M/sec + 107,237 page-faults # 0.000 M/sec + 3,208,458,988,986 cycles # 2.926 GHz [83.34%] + 3,040,183,290,594 stalled-cycles-frontend # 94.76% frontend cycles idle [83.35%] + 1,919,430,795,918 stalled-cycles-backend # 59.82% backend cycles idle [66.69%] + 301,295,082,840 instructions # 0.09 insns per cycle + # 10.09 stalled cycles per insn [83.36%] + 41,257,749,770 branches # 37.619 M/sec [83.32%] + 40,759,321 branch-misses # 0.10% of all branches [83.36%] + + 69.211665980 seconds time elapsed + +Iteration 10 + + Performance counter stats for 'java MatrixMultiplier 3000': + + 1091514.137386 task-clock # 15.847 CPUs utilized + 284,874 context-switches # 0.000 M/sec + 14,917 CPU-migrations # 0.000 M/sec + 108,210 page-faults # 0.000 M/sec + 3,193,314,030,878 cycles # 2.926 GHz [83.36%] + 3,024,871,428,578 stalled-cycles-frontend # 94.73% frontend cycles idle [83.35%] + 1,912,217,350,173 stalled-cycles-backend # 59.88% backend cycles idle [66.69%] + 301,179,963,863 instructions # 0.09 insns per cycle + # 10.04 stalled cycles per insn [83.37%] + 41,255,242,230 branches # 37.796 M/sec [83.33%] + 40,674,138 branch-misses # 0.10% of all branches [83.34%] + + 68.880153973 seconds time elapsed + From dc87507ad37499a4982a018435673a0f38a770ee Mon Sep 17 00:00:00 2001 From: Nachiket N Rau Date: Thu, 12 Feb 2015 23:50:30 -0500 Subject: [PATCH 05/11] threading rsults --- MatrixMultiplier$ThreadMultiply.class | Bin 0 -> 699 bytes MatrixMultiplier.class | Bin 0 -> 2457 bytes MatrixMultiplier.java | 181 +++++++++++++++++++++++ matrixMultiply | Bin 0 -> 13348 bytes matrixMultiply.c | 203 ++++++++++++++++++++++++++ matrixMultiply_clang | Bin 0 -> 13383 bytes script.sh | 24 +++ 7 files changed, 408 insertions(+) create mode 100644 MatrixMultiplier$ThreadMultiply.class create mode 100644 MatrixMultiplier.class create mode 100644 MatrixMultiplier.java create mode 100755 matrixMultiply create mode 100644 matrixMultiply.c create mode 100755 matrixMultiply_clang create mode 100644 script.sh diff --git a/MatrixMultiplier$ThreadMultiply.class b/MatrixMultiplier$ThreadMultiply.class new file mode 100644 index 0000000000000000000000000000000000000000..6e53c73c7e53f21c3c34417e4d501aa9830123a9 GIT binary patch literal 699 zcmZXR%WD%+6vn?hlV+MY?bO=FM@Fl))-;6_BI2T{&_;wnW1%f>>cZRfVn-)8WisPq zBPvBu6t}M3xHeb>7p}#Bz`w@Fcc(!mZhrTibI(1G?|%FF`3rz5=JLqlL=M9^X>ck> zw`eTi;IzRR2U8BF9h?^!i+3X>cbZ8U2YX?lB7yPMri`QD;osPzK)#hkk<#&c=YfD| z2xM!44&ti+tSw(d3MUjHt? z(Mh6~x*nLs$-zM?cjbNQ!o!4%BXC`eVAREo!3E5^xM)zqtiaUZ)0xeG7kwl!Iv8*p zTC1oY%5GP6smx#nDr4F&gi_yGSWmP*+{SCCYF!K3N_T?}H**dnb?&&eMXCD!@*isj zXZZ~|P*zy{HLgO!Y(rX%dl(~+(z`_8=INC`L6qkYV3qv?*dG|;K;$?w`$-b?m<#lc^rfH%0zbCLcs-eQs&d1QVdE5z{p5OWLZ`{Ov5 K-iTBJ3h^5N_LRH; literal 0 HcmV?d00001 diff --git a/MatrixMultiplier.class b/MatrixMultiplier.class new file mode 100644 index 0000000000000000000000000000000000000000..889ccffbcb44e637a2aea56e6a660e1d41943452 GIT binary patch literal 2457 zcma)8TT@e46#h=mNlrK%5Yd1b5J9U51~e#bxv9ikED!{$Qmpkrj&LA3Npop+rcW)? zC!hMz%S$_@9ea7`v^WzwrS+{ZZD%@tZht}lK>H&0+dG&jGSx}4*4}Hcz1O$Cwf2Tz z)_=GMAdJ@yG@(yNO9ghIUx)!A28B4Gx{eL|e7zz`xjP8+C1pC4z0J}bmIARJf>DD<#Do~raZ$&(fqG0B*o8?UUKZk#j>`(FC+9P^6(7kba!xvNOMw}6 zT{{y=SlO(dRiG!WT*kS1N`X2(9WBj=N~4H^ZAG8cPSSR>PRdoF(9_rNxK3_Rfz}p1 zbcrgGiraJ^c3gWjpPaEXlh#av7PU<**W7Rti4hrW+;Zcoq=Kr6oHe^RVx^@c2~kj+ z&Nyx^>ZbEK={qYh)+9I3mrdKH-?*LSO7TzvNLmiD)wN9zFIaC_T?xyb>zZJ8?p)s? zvT=pv>6p^-iUQ-z%~?C0V=`GC)0|JF@|juttRnyiiYIPx=Gd7|ah{0-Xg9GJEhbup z*eAq(JV$^sUOwj}x{A4(xQbVGTr=?+t}CeDjAtnCB;t04MD8_VVMd5q6LHu&ZkU+E zya@;GJb5z|9SbHFkq~GOn&=Qt&6}O}Z!UTfpd_TYB(^7oa80B{T4@=rj59W~V9(|h z?AU@#1+CM=Pl?&LX=^bot$WHbqHfO4Wb)~p9WRxGedpRY*#V3#8jFqg2>6Lx*__SJ zQB!%Y2a0ueQe9)BYglUAN-~7cN~di%t{~L5MJGIA+9(D$HZtJC`$D(Rq|@oQ=W553s*| z6-qGpGd!NVP#+GohXZf$E_~n7Pr)I|-SAOXGFlZs)u_WZG^2(Ws#c!fzHxdBwL(v? zIK8~xkRf++dmWc~12){>r$wXtxi#ohtMCu21L~kU(6|Ei-ZHw?!KUJ9A5~+xsiVdy zpdz*ctvp#$l`kIrx#XezRRr`%yzMYJ4w92S95urvBXvZ(myCqSMlZ)FX*)|Whv``b zZ5`D*LW)vx&`WfkC5-opP^HU9YCqBS2aAXzC6u8R7;C5`e6zNyfNHJ>!;PHqHtE)eA!lT-|rQWz?c5iXUibp>9c zzuGDJXrj`ZNXz{7n5@`el9Ase7eAIW=wy$97(IwF(ir27v&$ygf0y`fU%>!%g!3rv zF+RS<+WFSuR|vV{fLGM+ND1%<8?}o)bL|A?r`E2F_W&x0cb<41hFT=!Niv=y<4H1} zCF6_C=9a{1Kzqn6cOB(_8yGb)#oLDbY0Y0Yugjf7iUZrIg;B!7BcW?|}GP$pC5nr<; zcW@2g;7xpsx2WI7U72hvv*uO=;6cAy$(Z+lz(Moiswtg3nb!2M)UAm OHd7n4)$@7V1OI<@@)?l; literal 0 HcmV?d00001 diff --git a/MatrixMultiplier.java b/MatrixMultiplier.java new file mode 100644 index 0000000..2a5204f --- /dev/null +++ b/MatrixMultiplier.java @@ -0,0 +1,181 @@ +import java.util.*; + +public class MatrixMultiplier { + + static int[][] matrixA; + static int[][] matrixB; + static int[][] matrixC; + + static int matrixDimension; + + public MatrixMultiplier (int N) { + + matrixA = new int[N][N]; + matrixB = new int[N][N]; + matrixC = new int[N][N]; + matrixDimension = N; + + } + + public MatrixMultiplier () { + + } + + public void fillMatrixRandom() { + + + Random rn = new Random(); + + + int i = 0; + int j = 0; + + for (i=0; iV_q(C+cCW`HxOm0wLUM~V30Y?$Mn1_B zLTI8%EXMg0;s&u0a0L#Q(^QS=v@*@KQkn6AF2K>`wSXqCCM!&Dv|z!MBP2@xN<~vu zizaF4{ykfN+dEa_=VPg8nKkE_6#a{s7rbhImb?OqKW z@fs1aO`c1XWT~`WFr!pA{gMUMWQA$ef(297+YLR6^P?7ybC2>@E-!i2Kcz_hkmw4m539yJb@_oeXY}{ig6q_Ksa0G9=DpJvfTF4hM|^YX9ta2M0F( z;hr2uoU@rUjl)(kAXTRB#ibbMy5!VT0$Nk2h*nxQ3jHOx8d6hC$}K$j}y%PDT2n!i@JqA!By+L{g$Z74I{< zMQx*PfodTV*LKxZSQfb506qikY8&2b! zOT7)}IZJH;8*X3MR@-pDh)R`TB=o>De3 zD)}df_Ywc+lK&dAD0W~jJ{i~C!i5vUCrw>nh z^jpuR8@p>7wh1J2)T3uB{tdPZb$=^`auxqTo^CytdgFA(v#5H=-97tGb$53MYZ?xr z3#9kC{_Eg}{F=2VC4|^2_dVAHM}_nIPK}IkO!ecTizJY%_$C=XrjMQX>Dlr8$qx$! z_>Ke2RXpfu`a`SfZrRl7XnNRcY5}P1PCN$V=xKnYJ1**7FY9A(`1B(;`g0YHtm`F@ z+oi4#vNJ1Y%T5E6(Mj3si?ZkDkbTJ^`>U(e6W?&?q9<4J7ihXQbg|}e9G4HNt4HdJ zsd$bOk^dp&5zegTJpLaQeKkoYL~KeEy|0 zO+HUT`PNX;=fR@SCuIYCz90v}c<8dN)5R1>aN-v-D>5Auqp~hDH1QPbNJcv(ENik%@M2li89SwWfU}i24oa7gGXVk9d)wZXesYh z>~f3UuGocOtudu%AIdxDl%5Oa^=xQLp%bTVgXw8Gn3fl6;UpKDLN}~MSuHB1;q<(o ztNQ0zQfFxCu??s*IozK%KQ&8kisWoVYAUx5UHdBJ>_cjrq-;ZKIwxv=blP(!>$Qed z1oCo7?I;eZT@u2O`V1gB^^1dOUG|~Z^lS##CWPDMC<2ptOiW`jtGEt&YQE(v7K16> zj6MSaq${7RcxS1?!F7<~?fW&4(KNi%B65O_f6}R$D=9rzRJvU$y<%PT@%*LtX-I~q zXb8QIx)pN(E4r+`a7xc68qbBZ(Z=)ok+s9s0TDj3YLE!tG?FkKjpi~!y}i>8`u9UJ%5F>SHju%w`JdMF4VoI51+y_#$@I# zJ$G*-u0W#EAI?P^>%*u8!a1{XbvQTJxDNNmrc*TyLzIO7#Pfo^@C_5%75OS$km2cq zx$;?hZC1}Mla+W5%Hertx{!HCJ)v07O8K`bHhM~=XJ@YntcnK6hvx?0ZJnUk;&|!3 zLSYcJA36LJ&sxho|(@_7`;W9XlJ zkzjk?52O&aKZBzO{a$Xj4PO5hPhVjS3D)bIXrQRZ9xuQ(y z!vd9jL#L$tPEx4?ruP*p{LN>D#fm_MCTomWDxTl_*dKpuVIF^0%l@2E@gr}NXTMX5 zKcU){yZ>{-->cn@?pD{OThaR!eN@qJD*8P|f1>DVMPF6)O-0{V)a~bvmX_ZNtnS#K z=`%C8gyVgYR5GwBxFxu8?fQ%aH?OgHA%f|Hy=G)TsF|{857+S7FqY~U!M>y!3pQ_U zU28@TDDFUCCb&Nn#|P_RM%aw>#=GD! z2{SkarESa3{xqb!lD)mLKGU7HkImlz4I0`!-kQ7`xY9lg`X9kwc-}JhX;f&;vwpi* z16SI|5RhEyw4hX#we>jL^-ZrPaZ?#=lw9fL*58IE{N<8l|Hr(V6h5W^j=#80$kx(n z7pk--u>MJ}1`hv6D4o%|Zs};a<5RpZ7i&;VcE!p+8g_>;Bl>VsXN+-XnGCd03t}hm8 zmV{c!_ws`6(o?MX4k~tizEAB{4ysvDQFr{ul|JXcN8RUol)lToyjFIT-*@Trz8~HX z6txSZ?)Lu^m;O2B|D5uFlsacCeEk?2MTJE8zRCNecz+P*ndRO3<1T&rl1*i`+CTNb z>Hj@s?f&U2HkBr&@Al{B{}Hk@R5*UV@A3Yv-~XKWg5vY86R*I1 zO0z?7LhH zTZ2zj3tmTUFtSr4cztx@{^GtzC%#nhdgjDyi~Bj9_%f_JopwmpefUbj>x#Y6hqnh_ zFP!*wg4Y2jzM}YE;l%3&&s!(HQt*6q;@8_*S-0jvmAKiJPnur~#5)DI0zFrFu;Y){ zYi_6c>JhW^&?NEMc?bdbiYn3O@=N;$J)#sp&zt)c-mlgfo{s~{&Zx^yx%dxBJGCO< zx?bOq_)^hRtD#mZPonCX<2wEsaEd>m?t82;hRR%dds*69DF$5e|BJ$hT=*Lbf6Rqj z>-I`9qHw-1UxYmE#H@4m>#DRfd%VeSb92bAM8Z8{_ISGmcrE%%yVj`i+WC2jOUQBB zT?X$igFg&BfVXS+cs?TKt3=fjP1={=BvE@3xF6%wJL*`dy?9k1d#`E+w znzSUpg`>7q;9`<~{VA%i(`!}XFE`JaOH(i<^T@qwM0gc(5&cI zMO(x!_@O^9j7TaKIcUVN3ESBA+q;@~wzfE1P zk|4Kbccn9i{PTl0Wow#!SGL;I?EZ)-DU7O0C>T+kg6EX~2c&;t&XiF!J9_(gM#Dvj$ zCpr<0_ZgXV%-Y`Wwp7fV{0qt2?Cz9F$IOoYQt0v$sjFe&Um=wxxf`Ch-qT)tr;)if i>USk#k-m<8xwYOY-Kz#p$*UEe1;=A4LEH76I{yv4q@@r5 literal 0 HcmV?d00001 diff --git a/matrixMultiply.c b/matrixMultiply.c new file mode 100644 index 0000000..9f69324 --- /dev/null +++ b/matrixMultiply.c @@ -0,0 +1,203 @@ +#include +#include +#include +#include +#include +#include + +#define RANDOM_MAX_VALUE 100 + +static int **matrixA; +static int **matrixB; +static int **matrixC; +static int N; + +void setUpMatrices() { + + int i = 0; + + matrixA = malloc(sizeof(int *) * N); + matrixB = malloc(sizeof(int *) * N); + matrixC = malloc(sizeof(int *) * N); + + + + for (i=0 ; i8cy2pxvfT=maVH(qzjEZb~RE0|LHmcQ?)AW;e6@ z7E=UFZ9&$h5*R=5yQAo!j$=m|t)h}pG>oEvIAc}*2oBYajbj)JjaXQJ=e~P(-+S2= z`NO}=-Pw2U`Q3BQJ@>r(?tLHUqoMG2PhFkh;t}r^#7!*GBxD_hn0}jN71k-12~Aum zE)YwAG~lnv7NS;->AW({v{A`uq|m<0=_taml^$j|?_u%A0sf3@OLRO4f+Sg|pg*t4Z$V=}fO znMmbEH;i^}*|4P}m`w*a%W;$YBzwh<-O?qFV+%O)xfy?&1Js^+qV%rae{FrS(Ddvx zqG^2X;g25BNtgeq{@3LbkW^E^q0?FekJrFQYv3QKfp-D-<9icXGoI;AMzYy>Rww}@3NbTYW^Ya> zQo=Cy4yRK_){JCK!yt1}GPFfxGm%tGn2BL1WD+TJPz*^TbmqW(FjGKk*cTnSSt_{@$B^=7W0v&-#HE=K6Q_PEAa# z)Pz1Y*(S-<^m0uU_d@X0__&U->xG7y7QfK%oG?A5r{&Pc?Pa%~KXDBSj$N*yBawUm zBW+mnq4plI`u>yaiJSbFS3hvFPQUbcHZZtyU5`KzC+hTk!#NNtHUC@+6&jY3%B9CM zfBr?oOX#$Yy1U_~V}pZ(!IkR{VhE&n`H^$c5A|!VJ}M#j)_BvSo#?1EebX_!cjMzE z2lsqap)*o8THiW?Q>{-wcU+2Wx5bLbD3p) z<)Pci(~3C{b+wIDqPL&X3r$vc`TBplWiFI5eURDOD!a|sKjoHr^)<3%$x!!j|0(p{ zKvOIqIx}P9ywqcI4OpB1dNbgCpOT5=FNom;ruVIWk`ESe>HyR`K-v z)kF4i2}`9y=u~+I(2j`+o~jZ-71&c0SRT*H?{@6B2V72F8t2yib*J-N_rtWB1gB;` zU6}-xnUSb~mC1fNKw2Qm>jTes_n76?k06!Zf0L)B?5><2TV8#m`Oz#T7R(Rp!u(JE zE^w5tGz6})ZWQV#X+63BpR^8GxD{jzztx6YUR(Gc;PzQUSDLOaR=GZr9(ZXB_BSiu zT4Sb)Zzo=^EB5tR#yfxe{8UKIsyVoe<^T41J%4*qq4sHW2+dO=DOCu~l}|^+8s(f` z=qu{cWv)vSG>S`rT-m`#V^g{#9OQURA`oz^k|3LQT~D*<#h1|Na*>{w0qg^w(#S{n-Rxi9MeM? zD1>IqQMjHA{*260(GNAZ`mi5E0)wALP><*9?^V@lee!v)UWe_WZ#G;A9S7^_t$QMz zpDf;enr7$kpr%GYJM&o#v`T+L>ZQ_O6de`%rm_1>7QZHqJZ(4fn4B>f8fHf`nsw?H z^+wc-?O5k!Br!+YD!Z_rPX>;M^Rd9RerUt9EBqpSsP#!Az>DF$8JG*_ZwnyEHwJKb zG20ow=tNikwch+I`s8cg-u&;2A9)2G-T8NO?WRA`eiqKZ8qUAclmACosrfnmz%krY zoXq`AFWeZwtx7WB3m0O6mN07maKQ|$4;O9=w85iJY=&bL)0e8;AISR`+_7}RFa5xL z$z1aYJ?5(Wl#`9P?smdH2jZmGnC)m_lEv~e7G0N7gmhtTg45?JBezM|#Im1lpraZJ4L{L3zG z54@dVlIg*J8bgpvPS*=Ur z`{RK7G5)XDXnz6tG}<4o(O!>!#}K#Q)MyW&y$x}c563S51JLO~`vBsbC;hAMX}D{N zu|hkr^j^;=y@%>O*R7zNXo_!mc&2Rs^)^0(bNuf_B8 z+fk3j<8f4$FDT02JX#cgj-pJws#07xAZz^0BVX76;pa~N26LX07s_A8i}jjp;cqhB zAAN|R!aQDh%key<-j#CS{S8;n&x!|5$0^he2F%cwg zD3To#!PveO>{-;zSS`v~2VvFoQ!-+P3WM$wE4s9v+UTO!wJ%^ZW%+ zp=+DxZ>L8CSIOI;_bT?n>i}c#K!vU$*5BpPz*X`h{F192>MK=Q+k~TC-}Gn_HF+~M?D%iA&x4bQw^BbDXOwQ zuLsuxqcw>2d0m@R3lpzn5Rt_lzYhYXHH7tf-MB{$^n9hq{<9p@522mbB<6WtdPwPO zN}v2E8TMbn;#O2hl=XQXEGm5-C-=|#j30FA^Sa6lJ+H&0PkV)1|C7KdCgdL#-bdzC zhun|VYWd1_qVz7zuJ2o-5iESlpnRt&5$oVnb*7&JZ`Yqt`V&fD=MBK6r&#fMmp<=% zjjDqcEU2goYZ*O^8uicdZ&CYZi_+))j}_ed54rR?kBIY&VyvjBTmJ_x{kv8FcdPyn zl5@7g=Z~QYR7iyPVa~VWd?SuC%e(cbT>A87oyvNZkM&0S^e)xjKYdlF(y8>_{ki#P zAxo#4{pWp@^T7_Q@$>v-efH})=-T_|Je28mXh30ki>vUAKaU2xKHtX_mHrSbD$06H z|K`%~_YX+Pe!nE;d>M+F^|70PYN^JfUvz-irEW{MmnASLpJt*8h6im{8Wa z8r}U{Qq_-MjIz_CEoh`1DBdUSjb3=d`=1l9FW)~q@doTunjMmLFJ?6FL-s~5c3R$F zoOq+)eZz?_6TBZdaonXhXm&`}z1T^4{kAuHvGVh}?8KLs^H81m3c>5B6JIHKeRSf! zavr4v0Th9(JCNnbbZx}7fTKh4BZ#iA+wOzYi_?-;tS)@De;AI z2mz;leM>deD&+=L>qNzWzHV+-_>fv>_<9@#PIkszc53;5P}*57{I2-lC-GIHakYk8 zrF;d|x+>@K+rX*cr;$!(FOy)Z#qGDiXsq0$=565!b2n%OdTB zi^@92^Jg3I)huMAlwVHgi_#sbAuZ`yGhIJfrONH)#@hSjqgMhMkj2{>WLD{0Sw0 zM&b+i9go+F1LdPoq5DKC%O!5r9mgn=nQf`hBAPL?W)7K8QRFsv@49NI5$?Ta7c!y^ zqsPHr*==izrH#GG^qxr4kk9i*BsVJXtUi*AoAFq1%O&lb1T`3m*eG%B$daa40~t7}_0L_v`0-qCE% zkZ(CC*;~`>+1}0^b7vd9$gonytyJ=z@htrAlkN&5F5hz~yNP5{;!#RlmucrtQxfY< zjpQtK5>qFLgXPLgcdE;zb|+*QHuqfF@Mz1XjUgn$C*#8Cy$XYfB~nHXZ>3~ryxUSa zNb;6ywlDAV7m^KYhDcZUD~ literal 0 HcmV?d00001 diff --git a/script.sh b/script.sh new file mode 100644 index 0000000..d780eec --- /dev/null +++ b/script.sh @@ -0,0 +1,24 @@ +#! /bin/bash + +if [ "$#" -ne 4 ]; then + echo "Usage: bash $0 <# of integers> " + exit +fi + + + +STR_C_GCC="gcc_output_$1" +STR_JAVA="java_output_$1" +#STR_PYTHON="python_output_$1" +STR_C_CLANG="clang_output_$1" +for i in {1..10} +do + + echo "Iteration $i" >> $STR_C_GCC + echo "Iteration $i" >> $STR_JAVA + #echo "Iteration $i" >> $STR_PYTHON + echo "Iteration $i" >> $STR_C_CLANG + 3>>$STR_C_GCC perf stat --log-fd 3 ./$2 $1 > /dev/null + 3>>$STR_JAVA perf stat --log-fd 3 java $3 $1 > /dev/null + 3>>$STR_C_CLANG perf stat --log-fd 3 ./$4 $1 > /dev/null +done From 173227f1f28be65d44de1f16e9342bcd4a4ed1d0 Mon Sep 17 00:00:00 2001 From: Nachiket Rau Date: Thu, 12 Feb 2015 23:53:38 -0500 Subject: [PATCH 06/11] Delete MatrixMultiplier$ThreadMultiply.class --- MatrixMultiplier$ThreadMultiply.class | Bin 699 -> 0 bytes 1 file changed, 0 insertions(+), 0 deletions(-) delete mode 100644 MatrixMultiplier$ThreadMultiply.class diff --git a/MatrixMultiplier$ThreadMultiply.class b/MatrixMultiplier$ThreadMultiply.class deleted file mode 100644 index 6e53c73c7e53f21c3c34417e4d501aa9830123a9..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 699 zcmZXR%WD%+6vn?hlV+MY?bO=FM@Fl))-;6_BI2T{&_;wnW1%f>>cZRfVn-)8WisPq zBPvBu6t}M3xHeb>7p}#Bz`w@Fcc(!mZhrTibI(1G?|%FF`3rz5=JLqlL=M9^X>ck> zw`eTi;IzRR2U8BF9h?^!i+3X>cbZ8U2YX?lB7yPMri`QD;osPzK)#hkk<#&c=YfD| z2xM!44&ti+tSw(d3MUjHt? z(Mh6~x*nLs$-zM?cjbNQ!o!4%BXC`eVAREo!3E5^xM)zqtiaUZ)0xeG7kwl!Iv8*p zTC1oY%5GP6smx#nDr4F&gi_yGSWmP*+{SCCYF!K3N_T?}H**dnb?&&eMXCD!@*isj zXZZ~|P*zy{HLgO!Y(rX%dl(~+(z`_8=INC`L6qkYV3qv?*dG|;K;$?w`$-b?m<#lc^rfH%0zbCLcs-eQs&d1QVdE5z{p5OWLZ`{Ov5 K-iTBJ3h^5N_LRH; From e0b4a9bfd12329ecd780015c9099c1e4771b7893 Mon Sep 17 00:00:00 2001 From: Nachiket Rau Date: Fri, 13 Feb 2015 00:15:32 -0500 Subject: [PATCH 07/11] Delete MatrixMultiplier.class --- MatrixMultiplier.class | Bin 2457 -> 0 bytes 1 file changed, 0 insertions(+), 0 deletions(-) delete mode 100644 MatrixMultiplier.class diff --git a/MatrixMultiplier.class b/MatrixMultiplier.class deleted file mode 100644 index 889ccffbcb44e637a2aea56e6a660e1d41943452..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 2457 zcma)8TT@e46#h=mNlrK%5Yd1b5J9U51~e#bxv9ikED!{$Qmpkrj&LA3Npop+rcW)? zC!hMz%S$_@9ea7`v^WzwrS+{ZZD%@tZht}lK>H&0+dG&jGSx}4*4}Hcz1O$Cwf2Tz z)_=GMAdJ@yG@(yNO9ghIUx)!A28B4Gx{eL|e7zz`xjP8+C1pC4z0J}bmIARJf>DD<#Do~raZ$&(fqG0B*o8?UUKZk#j>`(FC+9P^6(7kba!xvNOMw}6 zT{{y=SlO(dRiG!WT*kS1N`X2(9WBj=N~4H^ZAG8cPSSR>PRdoF(9_rNxK3_Rfz}p1 zbcrgGiraJ^c3gWjpPaEXlh#av7PU<**W7Rti4hrW+;Zcoq=Kr6oHe^RVx^@c2~kj+ z&Nyx^>ZbEK={qYh)+9I3mrdKH-?*LSO7TzvNLmiD)wN9zFIaC_T?xyb>zZJ8?p)s? zvT=pv>6p^-iUQ-z%~?C0V=`GC)0|JF@|juttRnyiiYIPx=Gd7|ah{0-Xg9GJEhbup z*eAq(JV$^sUOwj}x{A4(xQbVGTr=?+t}CeDjAtnCB;t04MD8_VVMd5q6LHu&ZkU+E zya@;GJb5z|9SbHFkq~GOn&=Qt&6}O}Z!UTfpd_TYB(^7oa80B{T4@=rj59W~V9(|h z?AU@#1+CM=Pl?&LX=^bot$WHbqHfO4Wb)~p9WRxGedpRY*#V3#8jFqg2>6Lx*__SJ zQB!%Y2a0ueQe9)BYglUAN-~7cN~di%t{~L5MJGIA+9(D$HZtJC`$D(Rq|@oQ=W553s*| z6-qGpGd!NVP#+GohXZf$E_~n7Pr)I|-SAOXGFlZs)u_WZG^2(Ws#c!fzHxdBwL(v? zIK8~xkRf++dmWc~12){>r$wXtxi#ohtMCu21L~kU(6|Ei-ZHw?!KUJ9A5~+xsiVdy zpdz*ctvp#$l`kIrx#XezRRr`%yzMYJ4w92S95urvBXvZ(myCqSMlZ)FX*)|Whv``b zZ5`D*LW)vx&`WfkC5-opP^HU9YCqBS2aAXzC6u8R7;C5`e6zNyfNHJ>!;PHqHtE)eA!lT-|rQWz?c5iXUibp>9c zzuGDJXrj`ZNXz{7n5@`el9Ase7eAIW=wy$97(IwF(ir27v&$ygf0y`fU%>!%g!3rv zF+RS<+WFSuR|vV{fLGM+ND1%<8?}o)bL|A?r`E2F_W&x0cb<41hFT=!Niv=y<4H1} zCF6_C=9a{1Kzqn6cOB(_8yGb)#oLDbY0Y0Yugjf7iUZrIg;B!7BcW?|}GP$pC5nr<; zcW@2g;7xpsx2WI7U72hvv*uO=;6cAy$(Z+lz(Moiswtg3nb!2M)UAm OHd7n4)$@7V1OI<@@)?l; From d4d8163a52ed737e81f18568d459c7838052581c Mon Sep 17 00:00:00 2001 From: Nachiket Rau Date: Fri, 13 Feb 2015 00:15:43 -0500 Subject: [PATCH 08/11] Delete MatrixMultiplier.java --- MatrixMultiplier.java | 181 ------------------------------------------ 1 file changed, 181 deletions(-) delete mode 100644 MatrixMultiplier.java diff --git a/MatrixMultiplier.java b/MatrixMultiplier.java deleted file mode 100644 index 2a5204f..0000000 --- a/MatrixMultiplier.java +++ /dev/null @@ -1,181 +0,0 @@ -import java.util.*; - -public class MatrixMultiplier { - - static int[][] matrixA; - static int[][] matrixB; - static int[][] matrixC; - - static int matrixDimension; - - public MatrixMultiplier (int N) { - - matrixA = new int[N][N]; - matrixB = new int[N][N]; - matrixC = new int[N][N]; - matrixDimension = N; - - } - - public MatrixMultiplier () { - - } - - public void fillMatrixRandom() { - - - Random rn = new Random(); - - - int i = 0; - int j = 0; - - for (i=0; i Date: Fri, 13 Feb 2015 00:15:56 -0500 Subject: [PATCH 09/11] Delete matrixMultiply --- matrixMultiply | Bin 13348 -> 0 bytes 1 file changed, 0 insertions(+), 0 deletions(-) delete mode 100755 matrixMultiply diff --git a/matrixMultiply b/matrixMultiply deleted file mode 100755 index 5007b232c0bc6beb7dd957e0c214e76be30ed95a..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 13348 zcmeHNe{dYteSddn*)mwtS(dR3G`b{m$0qpj?-3;-E6ZnA&e_ODB5uH0opmSc$VsQU z+oLjwse%mUayC&IH*u17Fl{F!ttV+4CUwJ1k#K4mhPDo6sN2%UFflzLI|yosYGkgT z@7wpi+g<5e_@guZL+@ty`@Wy|{q?^4-rL>V_q(C+cCW`HxOm0wLUM~V30Y?$Mn1_B zLTI8%EXMg0;s&u0a0L#Q(^QS=v@*@KQkn6AF2K>`wSXqCCM!&Dv|z!MBP2@xN<~vu zizaF4{ykfN+dEa_=VPg8nKkE_6#a{s7rbhImb?OqKW z@fs1aO`c1XWT~`WFr!pA{gMUMWQA$ef(297+YLR6^P?7ybC2>@E-!i2Kcz_hkmw4m539yJb@_oeXY}{ig6q_Ksa0G9=DpJvfTF4hM|^YX9ta2M0F( z;hr2uoU@rUjl)(kAXTRB#ibbMy5!VT0$Nk2h*nxQ3jHOx8d6hC$}K$j}y%PDT2n!i@JqA!By+L{g$Z74I{< zMQx*PfodTV*LKxZSQfb506qikY8&2b! zOT7)}IZJH;8*X3MR@-pDh)R`TB=o>De3 zD)}df_Ywc+lK&dAD0W~jJ{i~C!i5vUCrw>nh z^jpuR8@p>7wh1J2)T3uB{tdPZb$=^`auxqTo^CytdgFA(v#5H=-97tGb$53MYZ?xr z3#9kC{_Eg}{F=2VC4|^2_dVAHM}_nIPK}IkO!ecTizJY%_$C=XrjMQX>Dlr8$qx$! z_>Ke2RXpfu`a`SfZrRl7XnNRcY5}P1PCN$V=xKnYJ1**7FY9A(`1B(;`g0YHtm`F@ z+oi4#vNJ1Y%T5E6(Mj3si?ZkDkbTJ^`>U(e6W?&?q9<4J7ihXQbg|}e9G4HNt4HdJ zsd$bOk^dp&5zegTJpLaQeKkoYL~KeEy|0 zO+HUT`PNX;=fR@SCuIYCz90v}c<8dN)5R1>aN-v-D>5Auqp~hDH1QPbNJcv(ENik%@M2li89SwWfU}i24oa7gGXVk9d)wZXesYh z>~f3UuGocOtudu%AIdxDl%5Oa^=xQLp%bTVgXw8Gn3fl6;UpKDLN}~MSuHB1;q<(o ztNQ0zQfFxCu??s*IozK%KQ&8kisWoVYAUx5UHdBJ>_cjrq-;ZKIwxv=blP(!>$Qed z1oCo7?I;eZT@u2O`V1gB^^1dOUG|~Z^lS##CWPDMC<2ptOiW`jtGEt&YQE(v7K16> zj6MSaq${7RcxS1?!F7<~?fW&4(KNi%B65O_f6}R$D=9rzRJvU$y<%PT@%*LtX-I~q zXb8QIx)pN(E4r+`a7xc68qbBZ(Z=)ok+s9s0TDj3YLE!tG?FkKjpi~!y}i>8`u9UJ%5F>SHju%w`JdMF4VoI51+y_#$@I# zJ$G*-u0W#EAI?P^>%*u8!a1{XbvQTJxDNNmrc*TyLzIO7#Pfo^@C_5%75OS$km2cq zx$;?hZC1}Mla+W5%Hertx{!HCJ)v07O8K`bHhM~=XJ@YntcnK6hvx?0ZJnUk;&|!3 zLSYcJA36LJ&sxho|(@_7`;W9XlJ zkzjk?52O&aKZBzO{a$Xj4PO5hPhVjS3D)bIXrQRZ9xuQ(y z!vd9jL#L$tPEx4?ruP*p{LN>D#fm_MCTomWDxTl_*dKpuVIF^0%l@2E@gr}NXTMX5 zKcU){yZ>{-->cn@?pD{OThaR!eN@qJD*8P|f1>DVMPF6)O-0{V)a~bvmX_ZNtnS#K z=`%C8gyVgYR5GwBxFxu8?fQ%aH?OgHA%f|Hy=G)TsF|{857+S7FqY~U!M>y!3pQ_U zU28@TDDFUCCb&Nn#|P_RM%aw>#=GD! z2{SkarESa3{xqb!lD)mLKGU7HkImlz4I0`!-kQ7`xY9lg`X9kwc-}JhX;f&;vwpi* z16SI|5RhEyw4hX#we>jL^-ZrPaZ?#=lw9fL*58IE{N<8l|Hr(V6h5W^j=#80$kx(n z7pk--u>MJ}1`hv6D4o%|Zs};a<5RpZ7i&;VcE!p+8g_>;Bl>VsXN+-XnGCd03t}hm8 zmV{c!_ws`6(o?MX4k~tizEAB{4ysvDQFr{ul|JXcN8RUol)lToyjFIT-*@Trz8~HX z6txSZ?)Lu^m;O2B|D5uFlsacCeEk?2MTJE8zRCNecz+P*ndRO3<1T&rl1*i`+CTNb z>Hj@s?f&U2HkBr&@Al{B{}Hk@R5*UV@A3Yv-~XKWg5vY86R*I1 zO0z?7LhH zTZ2zj3tmTUFtSr4cztx@{^GtzC%#nhdgjDyi~Bj9_%f_JopwmpefUbj>x#Y6hqnh_ zFP!*wg4Y2jzM}YE;l%3&&s!(HQt*6q;@8_*S-0jvmAKiJPnur~#5)DI0zFrFu;Y){ zYi_6c>JhW^&?NEMc?bdbiYn3O@=N;$J)#sp&zt)c-mlgfo{s~{&Zx^yx%dxBJGCO< zx?bOq_)^hRtD#mZPonCX<2wEsaEd>m?t82;hRR%dds*69DF$5e|BJ$hT=*Lbf6Rqj z>-I`9qHw-1UxYmE#H@4m>#DRfd%VeSb92bAM8Z8{_ISGmcrE%%yVj`i+WC2jOUQBB zT?X$igFg&BfVXS+cs?TKt3=fjP1={=BvE@3xF6%wJL*`dy?9k1d#`E+w znzSUpg`>7q;9`<~{VA%i(`!}XFE`JaOH(i<^T@qwM0gc(5&cI zMO(x!_@O^9j7TaKIcUVN3ESBA+q;@~wzfE1P zk|4Kbccn9i{PTl0Wow#!SGL;I?EZ)-DU7O0C>T+kg6EX~2c&;t&XiF!J9_(gM#Dvj$ zCpr<0_ZgXV%-Y`Wwp7fV{0qt2?Cz9F$IOoYQt0v$sjFe&Um=wxxf`Ch-qT)tr;)if i>USk#k-m<8xwYOY-Kz#p$*UEe1;=A4LEH76I{yv4q@@r5 From cdbc3850765e4ba299d74c88c2a079a0802c4881 Mon Sep 17 00:00:00 2001 From: Nachiket Rau Date: Fri, 13 Feb 2015 00:16:09 -0500 Subject: [PATCH 10/11] Delete matrixMultiply_clang --- matrixMultiply_clang | Bin 13383 -> 0 bytes 1 file changed, 0 insertions(+), 0 deletions(-) delete mode 100755 matrixMultiply_clang diff --git a/matrixMultiply_clang b/matrixMultiply_clang deleted file mode 100755 index fc4eb797f4f09842fb272d3380998f286c93f76e..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 13383 zcmeHNeQ;b=6~Ea{+7!}uTLYv}>8cy2pxvfT=maVH(qzjEZb~RE0|LHmcQ?)AW;e6@ z7E=UFZ9&$h5*R=5yQAo!j$=m|t)h}pG>oEvIAc}*2oBYajbj)JjaXQJ=e~P(-+S2= z`NO}=-Pw2U`Q3BQJ@>r(?tLHUqoMG2PhFkh;t}r^#7!*GBxD_hn0}jN71k-12~Aum zE)YwAG~lnv7NS;->AW({v{A`uq|m<0=_taml^$j|?_u%A0sf3@OLRO4f+Sg|pg*t4Z$V=}fO znMmbEH;i^}*|4P}m`w*a%W;$YBzwh<-O?qFV+%O)xfy?&1Js^+qV%rae{FrS(Ddvx zqG^2X;g25BNtgeq{@3LbkW^E^q0?FekJrFQYv3QKfp-D-<9icXGoI;AMzYy>Rww}@3NbTYW^Ya> zQo=Cy4yRK_){JCK!yt1}GPFfxGm%tGn2BL1WD+TJPz*^TbmqW(FjGKk*cTnSSt_{@$B^=7W0v&-#HE=K6Q_PEAa# z)Pz1Y*(S-<^m0uU_d@X0__&U->xG7y7QfK%oG?A5r{&Pc?Pa%~KXDBSj$N*yBawUm zBW+mnq4plI`u>yaiJSbFS3hvFPQUbcHZZtyU5`KzC+hTk!#NNtHUC@+6&jY3%B9CM zfBr?oOX#$Yy1U_~V}pZ(!IkR{VhE&n`H^$c5A|!VJ}M#j)_BvSo#?1EebX_!cjMzE z2lsqap)*o8THiW?Q>{-wcU+2Wx5bLbD3p) z<)Pci(~3C{b+wIDqPL&X3r$vc`TBplWiFI5eURDOD!a|sKjoHr^)<3%$x!!j|0(p{ zKvOIqIx}P9ywqcI4OpB1dNbgCpOT5=FNom;ruVIWk`ESe>HyR`K-v z)kF4i2}`9y=u~+I(2j`+o~jZ-71&c0SRT*H?{@6B2V72F8t2yib*J-N_rtWB1gB;` zU6}-xnUSb~mC1fNKw2Qm>jTes_n76?k06!Zf0L)B?5><2TV8#m`Oz#T7R(Rp!u(JE zE^w5tGz6})ZWQV#X+63BpR^8GxD{jzztx6YUR(Gc;PzQUSDLOaR=GZr9(ZXB_BSiu zT4Sb)Zzo=^EB5tR#yfxe{8UKIsyVoe<^T41J%4*qq4sHW2+dO=DOCu~l}|^+8s(f` z=qu{cWv)vSG>S`rT-m`#V^g{#9OQURA`oz^k|3LQT~D*<#h1|Na*>{w0qg^w(#S{n-Rxi9MeM? zD1>IqQMjHA{*260(GNAZ`mi5E0)wALP><*9?^V@lee!v)UWe_WZ#G;A9S7^_t$QMz zpDf;enr7$kpr%GYJM&o#v`T+L>ZQ_O6de`%rm_1>7QZHqJZ(4fn4B>f8fHf`nsw?H z^+wc-?O5k!Br!+YD!Z_rPX>;M^Rd9RerUt9EBqpSsP#!Az>DF$8JG*_ZwnyEHwJKb zG20ow=tNikwch+I`s8cg-u&;2A9)2G-T8NO?WRA`eiqKZ8qUAclmACosrfnmz%krY zoXq`AFWeZwtx7WB3m0O6mN07maKQ|$4;O9=w85iJY=&bL)0e8;AISR`+_7}RFa5xL z$z1aYJ?5(Wl#`9P?smdH2jZmGnC)m_lEv~e7G0N7gmhtTg45?JBezM|#Im1lpraZJ4L{L3zG z54@dVlIg*J8bgpvPS*=Ur z`{RK7G5)XDXnz6tG}<4o(O!>!#}K#Q)MyW&y$x}c563S51JLO~`vBsbC;hAMX}D{N zu|hkr^j^;=y@%>O*R7zNXo_!mc&2Rs^)^0(bNuf_B8 z+fk3j<8f4$FDT02JX#cgj-pJws#07xAZz^0BVX76;pa~N26LX07s_A8i}jjp;cqhB zAAN|R!aQDh%key<-j#CS{S8;n&x!|5$0^he2F%cwg zD3To#!PveO>{-;zSS`v~2VvFoQ!-+P3WM$wE4s9v+UTO!wJ%^ZW%+ zp=+DxZ>L8CSIOI;_bT?n>i}c#K!vU$*5BpPz*X`h{F192>MK=Q+k~TC-}Gn_HF+~M?D%iA&x4bQw^BbDXOwQ zuLsuxqcw>2d0m@R3lpzn5Rt_lzYhYXHH7tf-MB{$^n9hq{<9p@522mbB<6WtdPwPO zN}v2E8TMbn;#O2hl=XQXEGm5-C-=|#j30FA^Sa6lJ+H&0PkV)1|C7KdCgdL#-bdzC zhun|VYWd1_qVz7zuJ2o-5iESlpnRt&5$oVnb*7&JZ`Yqt`V&fD=MBK6r&#fMmp<=% zjjDqcEU2goYZ*O^8uicdZ&CYZi_+))j}_ed54rR?kBIY&VyvjBTmJ_x{kv8FcdPyn zl5@7g=Z~QYR7iyPVa~VWd?SuC%e(cbT>A87oyvNZkM&0S^e)xjKYdlF(y8>_{ki#P zAxo#4{pWp@^T7_Q@$>v-efH})=-T_|Je28mXh30ki>vUAKaU2xKHtX_mHrSbD$06H z|K`%~_YX+Pe!nE;d>M+F^|70PYN^JfUvz-irEW{MmnASLpJt*8h6im{8Wa z8r}U{Qq_-MjIz_CEoh`1DBdUSjb3=d`=1l9FW)~q@doTunjMmLFJ?6FL-s~5c3R$F zoOq+)eZz?_6TBZdaonXhXm&`}z1T^4{kAuHvGVh}?8KLs^H81m3c>5B6JIHKeRSf! zavr4v0Th9(JCNnbbZx}7fTKh4BZ#iA+wOzYi_?-;tS)@De;AI z2mz;leM>deD&+=L>qNzWzHV+-_>fv>_<9@#PIkszc53;5P}*57{I2-lC-GIHakYk8 zrF;d|x+>@K+rX*cr;$!(FOy)Z#qGDiXsq0$=565!b2n%OdTB zi^@92^Jg3I)huMAlwVHgi_#sbAuZ`yGhIJfrONH)#@hSjqgMhMkj2{>WLD{0Sw0 zM&b+i9go+F1LdPoq5DKC%O!5r9mgn=nQf`hBAPL?W)7K8QRFsv@49NI5$?Ta7c!y^ zqsPHr*==izrH#GG^qxr4kk9i*BsVJXtUi*AoAFq1%O&lb1T`3m*eG%B$daa40~t7}_0L_v`0-qCE% zkZ(CC*;~`>+1}0^b7vd9$gonytyJ=z@htrAlkN&5F5hz~yNP5{;!#RlmucrtQxfY< zjpQtK5>qFLgXPLgcdE;zb|+*QHuqfF@Mz1XjUgn$C*#8Cy$XYfB~nHXZ>3~ryxUSa zNb;6ywlDAV7m^KYhDcZUD~ From ac1d86f7245518a53ee7a694b8353c081d159c2c Mon Sep 17 00:00:00 2001 From: Nachiket Rau Date: Fri, 13 Feb 2015 00:16:17 -0500 Subject: [PATCH 11/11] Delete matrixMultiply.c --- matrixMultiply.c | 203 ----------------------------------------------- 1 file changed, 203 deletions(-) delete mode 100644 matrixMultiply.c diff --git a/matrixMultiply.c b/matrixMultiply.c deleted file mode 100644 index 9f69324..0000000 --- a/matrixMultiply.c +++ /dev/null @@ -1,203 +0,0 @@ -#include -#include -#include -#include -#include -#include - -#define RANDOM_MAX_VALUE 100 - -static int **matrixA; -static int **matrixB; -static int **matrixC; -static int N; - -void setUpMatrices() { - - int i = 0; - - matrixA = malloc(sizeof(int *) * N); - matrixB = malloc(sizeof(int *) * N); - matrixC = malloc(sizeof(int *) * N); - - - - for (i=0 ; i