blob: 55ee31cad25411076bd944a0f050c40ffba227f0 [file] [log] [blame]
bart8785c122008-05-29 08:34:27 +00001#!/bin/bash
2
3########################
4# Function definitions #
5########################
6
bartf33ce892008-06-07 11:40:14 +00007source "$(dirname $0)/measurement-functions"
bart8785c122008-05-29 08:34:27 +00008
9function run_test {
bart8a2cd9b2008-06-19 07:49:49 +000010 local tmp avg1 stddev1 avg2 stddev2 avg4 stddev4 p
bart8785c122008-05-29 08:34:27 +000011
12 tmp="/tmp/test-timing.$$"
bart334db5e2008-06-05 10:14:53 +000013 rm -f "${tmp}"
14
bart8a2cd9b2008-06-19 07:49:49 +000015 p=1
bart3b7e2e32008-07-10 14:07:22 +000016 test_output="${1}-p${p}.out" measure_runtime "$@" -p${psep}${p} "${test_args}" | avgstddev > "$tmp"
barta5a95dd2008-06-18 14:15:11 +000017 read avg1 stddev1 vsz1 vszdev1 < "$tmp"
18 echo "Average time: ${avg1} +/- ${stddev1} seconds." \
19 " VSZ: ${vsz1} +/- ${vszdev1} KB"
bart8785c122008-05-29 08:34:27 +000020
bart8a2cd9b2008-06-19 07:49:49 +000021 p=2
bart3b7e2e32008-07-10 14:07:22 +000022 test_output="${1}-p${p}.out" measure_runtime "$@" -p${psep}${p} "${test_args}" | avgstddev > "$tmp"
barta5a95dd2008-06-18 14:15:11 +000023 read avg2 stddev2 vsz2 vszdev2 < "$tmp"
24 echo "Average time: ${avg2} +/- ${stddev2} seconds." \
25 " VSZ: ${vsz2} +/- ${vszdev2} KB"
bart0d4e5c22008-06-07 10:42:52 +000026
bart8a2cd9b2008-06-19 07:49:49 +000027 p=4
bart3b7e2e32008-07-10 14:07:22 +000028 test_output="${1}-p${p}.out" measure_runtime "$@" -p${psep}${p} "${test_args}" | avgstddev > "$tmp"
barta5a95dd2008-06-18 14:15:11 +000029 read avg4 stddev4 vsz4 vszdev4 < "$tmp"
30 echo "Average time: ${avg4} +/- ${stddev4} seconds." \
31 " VSZ: ${vsz4} +/- ${vszdev4} KB"
bartd1763bc2008-06-08 14:44:41 +000032
bart8a2cd9b2008-06-19 07:49:49 +000033 p=1
bartf16de382008-06-18 08:47:06 +000034 test_output="/dev/null" \
bart8a2cd9b2008-06-19 07:49:49 +000035 print_runtime_ratio ${avg1} ${stddev1} ${vsz1} ${vszdev1} $VG --tool=none "$@" -p${psep}${p} "${test_args}"
bartf16de382008-06-18 08:47:06 +000036
bart8a2cd9b2008-06-19 07:49:49 +000037 p=4
bartf16de382008-06-18 08:47:06 +000038 test_output="/dev/null" \
bart8a2cd9b2008-06-19 07:49:49 +000039 print_runtime_ratio ${avg4} ${stddev4} ${vsz4} ${vszdev4} $VG --tool=none "$@" -p${psep}${p} "${test_args}"
barta9952832008-06-17 14:20:26 +000040
bart8a2cd9b2008-06-19 07:49:49 +000041 p=4
42 test_output="${1}-drd-with-stack-var-4.out" \
barta5a95dd2008-06-18 14:15:11 +000043 print_runtime_ratio ${avg4} ${stddev4} ${vsz4} ${vszdev4} \
bartef1b9722008-07-04 15:34:23 +000044 $VG --tool=drd --check-stack-var=yes "$@" -p${psep}${p} "${test_args}"
bartcf801352008-06-15 09:13:28 +000045
bart8a2cd9b2008-06-19 07:49:49 +000046 p=4
47 test_output="${1}-drd-without-stack-var-4.out" \
barta5a95dd2008-06-18 14:15:11 +000048 print_runtime_ratio ${avg4} ${stddev4} ${vsz4} ${vszdev4} \
bartef1b9722008-07-04 15:34:23 +000049 $VG --tool=drd --check-stack-var=no "$@" -p${psep}${p} "${test_args}"
bartcf801352008-06-15 09:13:28 +000050
bart8a2cd9b2008-06-19 07:49:49 +000051 p=4
52 test_output="${1}-helgrind-4.out" \
53 print_runtime_ratio ${avg4} ${stddev4} ${vsz4} ${vszdev4} $VG --tool=helgrind "$@" -p${psep}${p} "${test_args}"
bart8785c122008-05-29 08:34:27 +000054
bart3b7e2e32008-07-10 14:07:22 +000055 if [ -e $HGDEV_VG ]; then
56 p=4
57 test_output="${1}-helgrind-hb-4.out" \
58 print_runtime_ratio ${avg4} ${stddev4} ${vsz4} ${vszdev4} $HGDEV_VG --tool=helgrind --pure-happens-before=yes "$@" -p${psep}${p} "${test_args}"
59 fi
60
bart8785c122008-05-29 08:34:27 +000061 echo ''
62
63 rm -f "$tmp"
64}
65
66
bart9cdd1782008-06-08 11:22:23 +000067########################
68# Script body #
69########################
bart8785c122008-05-29 08:34:27 +000070
bart32811502008-06-03 15:12:59 +000071DRD_SCRIPTS_DIR="$(dirname $0)"
bart7acf3802008-06-06 10:17:26 +000072if [ "${DRD_SCRIPTS_DIR:0:1}" != "/" ]; then
73 DRD_SCRIPTS_DIR="$PWD/$DRD_SCRIPTS_DIR"
bart32811502008-06-03 15:12:59 +000074fi
75
76SPLASH2="${DRD_SCRIPTS_DIR}/../splash2"
bartc4a174f2008-06-03 11:41:19 +000077if [ ! -e "${SPLASH2}" ]; then
78 echo "Error: splash2 directory not found (${SPLASH2})."
bart8785c122008-05-29 08:34:27 +000079 exit 1
80fi
81
82if [ "$VG" = "" ]; then
bart32811502008-06-03 15:12:59 +000083 VG="${DRD_SCRIPTS_DIR}/../../vg-in-place"
bart8785c122008-05-29 08:34:27 +000084fi
85
bart3b7e2e32008-07-10 14:07:22 +000086if [ "$HGDEV_VG" = "" ]; then
87 HGDEV_VG="${DRD_SCRIPTS_DIR}/../../../valgrind-hgdev/vg-in-place"
88fi
89
bart8785c122008-05-29 08:34:27 +000090if [ ! -e "$VG" ]; then
91 echo "Could not find $VG."
92 exit 1
93fi
94
bartee17ad62008-06-18 13:31:05 +000095######################################################################################################################
barta5a95dd2008-06-18 14:15:11 +000096# Meaning of the different colums:
97# 1. SPLASH2 test name.
98# 2. Execution time in seconds for native run with argument -p1.
99# 3. Virtual memory size in KB for the native run with argument -p1.
100# 4. Execution time in seconds for native run with argument -p2.
101# 5. Virtual memory size in KB for the native run with argument -p2.
102# 6. Execution time in seconds for native run with argument -p4.
103# 7. Virtual memory size in KB for the native run with argument -p4.
104# 8. Execution time ratio for --tool=none -p1 versus -p1.
105# 9. Virtual memory size ratio for --tool=none -p1 versus -p1.
106# 10. Execution time ratio for --tool=none -p4 versus -p4.
107# 11. Virtual memory size ratio for --tool=none -p4 versus -p4.
bartef1b9722008-07-04 15:34:23 +0000108# 12. Execution time ratio for --tool=drd --check-stack-var=yes -p4 versus -p4.
109# 13. Virtual memory size ratio for --tool=drd --check-stack-var=yes -p4 versus -p4.
110# 14. Execution time ratio for --tool=drd --check-stack-var=no -p4 versus -p4.
111# 15. Virtual memory size ratio for --tool=drd --check-stack-var=no -p4 versus -p4.
barta5a95dd2008-06-18 14:15:11 +0000112# 16. Execution time ratio for --tool=helgrind -p4 versus -p4.
113# 17. Virtual memory size ratio for --tool=helgrind -p4 versus -p4.
bart3b7e2e32008-07-10 14:07:22 +0000114# 18. Execution time ratio for --tool=helgrind --pure-happens-before=yes -p4 versus -p4.
115# 19. Virtual memory size ratio for --tool=helgrind --pure-happens-before=yes -p4 versus -p4.
116# 20. Execution time ratio for Intel Thread Checker -p4 versus -p4.
117# 21. Execution time ratio for Intel Thread Checker -p4 versus -p4.
barta5a95dd2008-06-18 14:15:11 +0000118#
bart3b7e2e32008-07-10 14:07:22 +0000119# Note: Helgrind uses a granularity of four bytes for data race detection, and DRD a granularity of one byte.
120#
121# 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
122####################################################################################################################################
123# Results: native native native none none DRD DRD HG HG-hb ITC ITC
124# -p1 -p2 -p4 -p1 -p4 -p4 -p4+f -p4 -p4 -p4 -p4+f
125# ..................................................................................................................................
126# Cholesky 0.37 45867 0.25 55965 0.20 74944 8.8 2.08 28.9 1.66 171 1.96 114 2.85 54 3.13 ... .... 239 82
127# FFT 0.20 23976 0.13 54026 0.09 114112 8.2 3.02 18.4 0.85 130 1.20 85 1.27 416 1.65 ... .... 90 41
128# LU, contiguous 0.95 16784 0.64 24984 0.43 41392 8.0 3.88 19.3 2.17 120 2.84 113 3.04 223 4.36 ... .... 428 128
129# LU, non-contiguous 1.06 16792 0.67 24984 0.40 41376 7.5 3.88 20.0 2.17 210 3.04 190 3.24 166 4.26 ... .... - -
130# Ocean, contiguous 24.25 918016 14.57 927732 9.09 945664 2.4 1.05 6.6 1.05 89 1.92 77 1.93 149 1.88 ... .... 90 28
131# Ocean, non-contiguous 0.36 32120 0.18 40320 0.16 56728 4.2 2.51 10.4 1.86 58 2.27 71 2.43 127 3.54 ... .... - -
132# Radiosity 4.73 56120 .... ..... .... ..... 16.6 1.86 .... .... ... .... .. .... .. .... ... .... 485 163
133# Radix 4.98 279744 2.55 287936 1.36 304448 6.1 1.17 22.4 1.16 57 1.90 52 1.92 208 2.09 ... .... 222 56
134# Raytrace 2.76 320526 1.44 328448 0.77 344832 8.3 1.15 28.6 1.14 2324 1.31 326 1.34 420 0.60 ... .... 172 53
135# Water-n2 0.19 17304 0.12 33680 0.12 66432 12.0 3.85 20.2 3.53 2789 2.78 562 2.84 121 3.32 ... .... 189 39
136# Water-sp 0.21 10976 0.11 19176 0.07 35568 11.0 5.41 33.3 2.37 475 2.85 147 3.08 196 4.61 ... .... 183 34
137# ..................................................................................................................................
138# Hardware: Two quad-core Intel Xeon L5130, 1.6 GHz, 4 MB L2 cache, 16 GB RAM.
139# Software: Ubuntu 8.04 server, 64-bit, gcc 4.3.1.
140####################################################################################################################################
141# Results: native native native none none DRD DRD HG HG-hb ITC ITC
142# -p1 -p2 -p4 -p1 -p4 -p4 -p4+f -p4 -p4 -p4 -p4+f
143# ..................................................................................................................................
144# Cholesky 0.29 45835 0.21 55933 4.51 74944 8.8 2.21 1.0 1.75 6 2.05 4 2.16 2 3.22 ... .... 239 82
145# FFT 0.17 23949 0.12 32144 0.11 48536 7.8 3.28 12.0 2.13 85 2.96 56 3.13 282 4.02 ... .... 90 41
146# LU, contiguous 0.78 16752 0.53 24957 0.53 41365 7.9 4.27 11.7 2.33 78 3.00 74 3.20 146 4.51 ... .... 428 128
147# LU, non-contiguous 0.86 16760 0.47 24957 0.50 41352 7.0 4.26 12.2 2.33 135 3.20 125 3.40 107 4.41 ... .... - -
148# Ocean, contiguous 19.47 918016 12.59 927232 12.61 945664 2.4 1.06 3.8 1.06 53 1.92 47 1.93 86 1.88 ... .... 90 28
149# Ocean, non-contiguous 0.31 32088 0.17 40291 0.19 56696 3.9 2.71 6.8 1.97 38 2.38 47 2.55 84 3.66 ... .... - -
150# Radiosity 3.85 56088 .... ..... .... ..... 16.4 1.98 .... .... ... .... .. .... .. .... ... .... 485 163
151# Radix 4.05 279680 2.12 287872 2.14 304405 6.0 1.20 11.4 1.18 29 1.92 27 1.94 157 2.12 ... .... 222 56
152# Raytrace 2.22 320192 .... ..... 2.20 ...... 7.4 1.17 ... .... ... .... .. .... .. .... ... .... 172 53
153# Water-n2 0.15 17272 0.10 33651 0.11 66432 12.3 4.22 17.5 1.84 2320 2.90 583 2.92 105 3.41 ... .... 189 39
154# Water-sp 0.16 10947 0.09 19144 0.09 35536 11.4 6.00 20.7 2.55 251 3.03 91 3.26 123 4.79 ... .... 183 34
155# ..................................................................................................................................
156# Hardware: dual-core Intel Xeon 5130, 2.0 GHz, 4 MB L2 cache, 4 GB RAM.
157# Software: Ubuntu 7.10 server, 64-bit, gcc 4.3.1, xload -update 1 running.
158####################################################################################################################################
159# Results: native native native none none DRD DRD HG HG-hb ITC ITC
160# -p1 -p2 -p4 -p1 -p4 -p4 -p4+f -p4 -p4 -p4 -p4+f
161# ..................................................................................................................................
162# Cholesky 0.08 21760 0.05 31728 0.56 50148 13.6 3.62 3.8 2.14 16 2.51 14 2.68 9 4.03 15 5.01 239 82
163# FFT 0.02 13024 0.02 64931 0.01 81317 17.5 5.37 36.0 1.16 248 1.35 219 1.45 704 2.19 182 2.50 90 41
164# LU, contiguous 0.08 10440 0.06 18640 0.06 35048 9.9 6.45 13.0 2.63 81 2.89 88 3.13 156 4.92 125 5.63 428 128
165# Ocean, contiguous 0.19 23208 0.18 31744 0.13 48888 4.8 3.45 7.6 2.17 59 2.58 50 2.75 77 4.01 72 4.96 90 28
166# Radiosity 0.43 55912 .... ..... .... ..... .... .... .... .... ... .... .. .... .. .... ... .... 485 163
167# Radix 0.17 33760 0.10 41952 0.10 58488 7.2 2.68 14.0 1.98 28 2.52 41 2.66 159 3.70 34 4.12 222 56
168# Raytrace 0.21 320064 0.21 320064 0.21 320064 13.3 1.18 13.2 1.18 169 1.25 58 1.25 105 2.10 71 2.96 172 53
169# Water-n2 0.11 17104 0.07 33480 0.08 66240 12.4 4.38 17.5 1.88 1877 2.93 525 2.97 106 3.47 105 4.15 189 39
170# Water-sp 0.12 10784 0.06 84352 0.06 100835 11.0 6.27 22.7 0.92 257 1.09 91 1.17 129 1.72 139 1.97 183 34
171# ..................................................................................................................................
172# Hardware: dual-core Intel Core2 Duo E6750, 2.66 GHz, 4 MB L2 cache, 2 GB RAM.
173# Software: openSUSE 11.0, 64-bit, gcc 4.3.1, runlevel 3.
174####################################################################################################################################
175
176####
177# Note: the input parameters for benchmarks below originate from table 1 in the
178# following paper:
179# The SPLASH-2 programs: characterization and methodological considerations
180# Woo, S.C.; Ohara, M.; Torrie, E.; Singh, J.P.; Gupta, A.
181# Computer Architecture, 1995. Proceedings. 22nd Annual International Symposium
182# on Volume , Issue , 22-24 Jun 1995 Page(s): 24 - 36.
183# ftp://www-flash.stanford.edu/pub/splash2/splash2_isca95.ps.Z
184####
bart8785c122008-05-29 08:34:27 +0000185
bart66bb75c2008-06-17 06:19:29 +0000186cache_size=$(get_cache_size)
bart32811502008-06-03 15:12:59 +0000187log2_cache_size=$(log2 ${cache_size})
188
189# Cholesky
bart32811502008-06-03 15:12:59 +0000190(
bart868d73a2008-06-04 13:02:22 +0000191 cd ${SPLASH2}/codes/kernels/cholesky/inputs
192 for f in *Z
193 do
194 gzip -cd <$f >${f%.Z}
195 done
bart3b7e2e32008-07-10 14:07:22 +0000196 test_args=tk15.O run_test ../CHOLESKY -C$((cache_size))
bart32811502008-06-03 15:12:59 +0000197)
bart32811502008-06-03 15:12:59 +0000198
199# FFT
bart3b7e2e32008-07-10 14:07:22 +0000200run_test ${SPLASH2}/codes/kernels/fft/FFT -t -l$((log2_cache_size/2)) -m16
bart32811502008-06-03 15:12:59 +0000201
202# LU, contiguous blocks.
bart3b7e2e32008-07-10 14:07:22 +0000203run_test ${SPLASH2}/codes/kernels/lu/contiguous_blocks/LU -n512
bart8785c122008-05-29 08:34:27 +0000204
bart32811502008-06-03 15:12:59 +0000205# LU, non-contiguous blocks.
bart3b7e2e32008-07-10 14:07:22 +0000206#run_test ${SPLASH2}/codes/kernels/lu/non_contiguous_blocks/LU -n512
bart8785c122008-05-29 08:34:27 +0000207
bart868d73a2008-06-04 13:02:22 +0000208# Ocean
bart3b7e2e32008-07-10 14:07:22 +0000209run_test ${SPLASH2}/codes/apps/ocean/contiguous_partitions/OCEAN -n258
210#run_test ${SPLASH2}/codes/apps/ocean/non_contiguous_partitions/OCEAN -n258
bart868d73a2008-06-04 13:02:22 +0000211
bart3b7e2e32008-07-10 14:07:22 +0000212# Radiosity. Disabled this benchmark because it deadlocks.
bart3f56f872008-06-20 07:52:28 +0000213if false; then
bart3b7e2e32008-07-10 14:07:22 +0000214psep=' ' run_test ${SPLASH2}/codes/apps/radiosity/RADIOSITY -batch -room -ae 5000.0 -en 0.050 -bf 0.10
bart3f56f872008-06-20 07:52:28 +0000215fi
bartc4a174f2008-06-03 11:41:19 +0000216
bart868d73a2008-06-04 13:02:22 +0000217# Radix
bart3b7e2e32008-07-10 14:07:22 +0000218run_test ${SPLASH2}/codes/kernels/radix/RADIX -n$((2**20)) -r1024
bart868d73a2008-06-04 13:02:22 +0000219
220# Raytrace
221(
222 cd ${SPLASH2}/codes/apps/raytrace/inputs
223 rm -f *.env *.geo *.rl
224 for f in *Z
225 do
226 gzip -cd <$f >${f%.Z}
227 done
bart3b7e2e32008-07-10 14:07:22 +0000228 cd ..
229 test_args=inputs/car.env psep=' ' run_test ./RAYTRACE
bart868d73a2008-06-04 13:02:22 +0000230)
bart334db5e2008-06-05 10:14:53 +0000231
bart868d73a2008-06-04 13:02:22 +0000232# Water-n2
bart334db5e2008-06-05 10:14:53 +0000233(
234 cd ${SPLASH2}/codes/apps/water-nsquared
bart8a2cd9b2008-06-19 07:49:49 +0000235 test_input=${DRD_SCRIPTS_DIR}/run-splash2-water-input psep=' ' run_test ./WATER-NSQUARED
bart334db5e2008-06-05 10:14:53 +0000236)
bart868d73a2008-06-04 13:02:22 +0000237
238# Water-sp
bart334db5e2008-06-05 10:14:53 +0000239(
240 cd ${SPLASH2}/codes/apps/water-spatial
bart8a2cd9b2008-06-19 07:49:49 +0000241 test_input=${DRD_SCRIPTS_DIR}/run-splash2-water-input psep=' ' run_test ./WATER-SPATIAL
bart334db5e2008-06-05 10:14:53 +0000242)
bart868d73a2008-06-04 13:02:22 +0000243
244
bartc4a174f2008-06-03 11:41:19 +0000245
246# Local variables:
247# compile-command: "./run-splash2"
248# End: