bart | 8785c12 | 2008-05-29 08:34:27 +0000 | [diff] [blame] | 1 | #!/bin/bash |
| 2 | |
| 3 | ######################## |
| 4 | # Function definitions # |
| 5 | ######################## |
| 6 | |
# Print the base-2 logarithm of $1 if $1 is an exact power of two.
#
# Arguments: $1 - a positive decimal integer, written without leading zeros,
#                 sign or whitespace (the comparison is textual).
# Outputs:   the exponent on stdout, or an empty line if $1 is not a power of
#            two that fits in a signed 64-bit integer.
# Returns:   0 when an exponent was printed, 1 otherwise.
function log2 {
  local i n=${1-}

  # Stop at 2**62: 2**63 overflows bash's signed 64-bit arithmetic and would
  # yield a negative number instead of a power of two.
  for ((i = 0; i < 63; i++)); do
    # The argument is quoted so that an empty or missing argument simply does
    # not match instead of producing a syntax error from the test.
    if [[ $((2**i)) == "$n" ]]; then
      echo "$i"
      return 0
    fi
  done
  echo ""
  return 1
}
| 20 | |
# Print a cache size in bytes, read from a sysfs-style size file.
#
# Arguments: $1 - (optional) file holding the size, either as a plain number
#                 or as a number followed by K or M. Defaults to
#                 /sys/devices/system/cpu/cpu0/cache/index2/size.
# Outputs:   the size in bytes on stdout; a diagnostic on stderr on failure.
# Returns:   0 on success, 1 if the file cannot be read.
function get_cache_size {
  local size_file=${1:-/sys/devices/system/cpu/cpu0/cache/index2/size}
  local s

  if [[ ! -r "$size_file" ]]; then
    echo "get_cache_size: cannot read ${size_file}" >&2
    return 1
  fi

  s=$(<"$size_file")
  case "$s" in
    *M) echo $((${s%M} * 1024 * 1024)) ;;
    *K) echo $((${s%K} * 1024)) ;;
    *)  echo "$s" ;;
  esac
}
| 32 | |
# Read a stream of numbers from stdin (one per line), and print the average
# and standard deviation, separated by a space.
#
# Outputs: "<average> <stddev>" on stdout. With no input lines nothing is
#          printed on stdout and a diagnostic goes to stderr.
# Returns: awk's exit status: 0 on success, 1 when there was no input.
function avgstddev {
  awk '
    { n++; sum += $1; sumsq += $1 * $1 }
    END {
      # Without this guard an empty stream would divide by zero.
      if (n == 0) {
        print "avgstddev: no input" > "/dev/stderr"
        exit 1
      }
      d = sumsq / n - sum * sum / n / n
      # Rounding can make the variance slightly negative; clamp it to zero.
      print sum / n, (d > 0 ? sqrt(d) : 0)
    }'
}
| 38 | |
# Helper for run_test: run the command given as arguments three times under
# /usr/bin/time, feeding it ${test_input} (or /dev/null) on stdin, and print
# the average and standard deviation of the elapsed times via avgstddev.
function _run_test_timings {
  local i

  for ((i = 0; i < 3; i++)); do
    # /usr/bin/time writes the elapsed time to stderr after the program's own
    # output, so only the last line of the merged stream is kept.
    /usr/bin/time --format="%e" "$@" 2>&1 < "${test_input:-/dev/null}" \
      | tail -n 1
  done | avgstddev
}

# Time a command natively and under "$VG --tool=exp-drd" with -p1, -p2 and
# -p4 appended, and print the averages and the slowdown ratio for each.
#
# Globals:   VG (read)         - command used to start Valgrind.
#            test_input (read) - optional file fed to the command on stdin.
# Arguments: the command to benchmark, followed by its arguments.
# Outputs:   the command lines, average times and ratios on stdout.
function run_test {
  local p avg1=1 stddev1=1 avg2=1 stddev2=1

  echo "$@"
  # Process substitution keeps "read" in the current shell and avoids a
  # temporary file with a predictable name in /tmp.
  read -r avg1 stddev1 < <(_run_test_timings "$@")
  echo "Average time: ${avg1} +/- ${stddev1} seconds"

  for p in 1 2 4; do
    echo "$VG --tool=exp-drd $* -p$p"
    read -r avg2 stddev2 < <(_run_test_timings "$VG" --tool=exp-drd "$@" "-p$p")
    echo "Average time: ${avg2} +/- ${stddev2} seconds"
    # Values are passed with -v rather than pasted into the awk program, and
    # a zero or missing average no longer triggers a division by zero.
    awk -v avg1="$avg1" -v stddev1="$stddev1" \
        -v avg2="$avg2" -v stddev2="$stddev2" '
      BEGIN {
        if (avg1 + 0 == 0 || avg2 + 0 == 0) {
          print "Ratio = n/a"
        } else {
          print "Ratio =", avg2 / avg1, "+/-",
                avg2 / avg1 * (stddev1 / avg1 + stddev2 / avg2)
        }
      }'
  done

  echo ''
}
| 73 | |
| 74 | |
| 75 | # Script body |
| 76 | |
# Directory containing this script, made absolute so that it stays valid
# after the "cd" commands further down.
DRD_SCRIPTS_DIR="$(dirname -- "$0")"
if [ "${DRD_SCRIPTS_DIR:0:1}" != "/" ]; then
  DRD_SCRIPTS_DIR="$PWD/$DRD_SCRIPTS_DIR"
fi

# Location of the SPLASH-2 tree, relative to the script directory.
SPLASH2="${DRD_SCRIPTS_DIR}/../splash2"
if [ ! -e "${SPLASH2}" ]; then
  echo "Error: splash2 directory not found (${SPLASH2})." >&2
  exit 1
fi

# VG may be preset in the environment; otherwise fall back to vg-in-place
# two directories above the script directory.
if [ "$VG" = "" ]; then
  VG="${DRD_SCRIPTS_DIR}/../../vg-in-place"
fi

if [ ! -e "$VG" ]; then
  echo "Could not find $VG." >&2
  exit 1
fi
| 96 | |
bart | 3281150 | 2008-06-03 15:12:59 +0000 | [diff] [blame] | 97 | # Results: (-p1) (-p2) (-p3) (-p4) ITC (-p4) ITC (-p4) |
| 98 | # original w/ filter |
| 99 | # ......................................................................... |
bart | 0886562 | 2008-06-06 14:31:36 +0000 | [diff] [blame] | 100 | # Cholesky 40 47 ? 82 239 82 |
| 101 | # FFT 16 17 N/A 47 90 41 |
| 102 | # LU, contiguous blocks 39 41 ? 45 428 128 |
| 103 | # LU, non-contiguous blocks 39 41 ? 49 428 128 |
| 104 | # Ocean, contiguous partitions 17 19 N/A 25 90 28 |
| 105 | # Ocean, non-contiguous partns 18 21 N/A 30 90 28 |
| 106 | # Radiosity 78 78 ? 78 485 163 |
| 107 | # Radix 10 12 ? 15 222 56 |
| 108 | # Raytrace 56 56 ? 56 172 53 |
| 109 | # Water-n2 34 34 ? 34 189 39 |
| 110 | # Water-sp 33 33 ? 33 183 34 |
bart | 0ce652f | 2008-06-05 13:47:15 +0000 | [diff] [blame] | 111 | # |
| 112 | # Hardware: dual-core Intel Xeon 5130, 1.995 GHz, 4 MB L2 cache, 4 GB RAM. |
bart | 7acf380 | 2008-06-06 10:17:26 +0000 | [diff] [blame] | 113 | # Software: Ubuntu 7.10 server, 64-bit (includes gcc 4.1.3). |
bart | 8785c12 | 2008-05-29 08:34:27 +0000 | [diff] [blame] | 114 | |
# Cache size in bytes as reported by get_cache_size, and its base-2
# logarithm. Either value is empty when it could not be determined; the
# benchmarks still run, but the cache-related options will then be incomplete.
cache_size=$(get_cache_size)
if [ -z "${cache_size}" ]; then
  echo "Warning: could not determine the cache size." >&2
fi
log2_cache_size=$(log2 "${cache_size}")
if [ -z "${log2_cache_size}" ]; then
  echo "Warning: cache size '${cache_size}' is not a power of two." >&2
fi
| 117 | |
# Cholesky
(
  # Leave the subshell if the inputs directory is missing, so that nothing
  # below runs in the wrong directory.
  cd "${SPLASH2}/codes/kernels/cholesky/inputs" || exit 1
  # Match only "*.Z": for a name ending in "Z" without the dot, ${f%.Z} would
  # equal $f and the redirection would truncate the input file itself.
  for f in *.Z; do
    [ -e "$f" ] || continue   # the glob matched nothing
    gzip -cd < "$f" > "${f%.Z}"
  done
  run_test ../CHOLESKY "-C${cache_size}" -n1024 tk29.O
)
bart | 3281150 | 2008-06-03 15:12:59 +0000 | [diff] [blame] | 127 | |
# Program paths are quoted so that a SPLASH2 directory containing whitespace
# is still passed to run_test as a single argument.

# FFT
run_test "${SPLASH2}/codes/kernels/fft/FFT" -t "-l${log2_cache_size}" -m20

# LU, contiguous blocks.
run_test "${SPLASH2}/codes/kernels/lu/contiguous_blocks/LU" -n1024

# LU, non-contiguous blocks.
run_test "${SPLASH2}/codes/kernels/lu/non_contiguous_blocks/LU" -n1024

# Ocean
run_test "${SPLASH2}/codes/apps/ocean/contiguous_partitions/OCEAN" -n2050
run_test "${SPLASH2}/codes/apps/ocean/non_contiguous_partitions/OCEAN" -n258

# Radiosity.
run_test "${SPLASH2}/codes/apps/radiosity/RADIOSITY" -batch -room

# Radix
run_test "${SPLASH2}/codes/kernels/radix/RADIX" "-n$((2**24))"
| 146 | |
# Raytrace
(
  # Leave the subshell if the inputs directory is missing; otherwise the rm
  # below would delete matching files from the current directory instead.
  cd "${SPLASH2}/codes/apps/raytrace/inputs" || exit 1
  rm -f -- *.env *.geo *.rl
  # Match only "*.Z": for a name ending in "Z" without the dot, ${f%.Z} would
  # equal $f and the redirection would truncate the input file itself.
  for f in *.Z; do
    [ -e "$f" ] || continue   # the glob matched nothing
    gzip -cd < "$f" > "${f%.Z}"
  done
  run_test ../RAYTRACE balls4.env
)
bart | 334db5e | 2008-06-05 10:14:53 +0000 | [diff] [blame] | 157 | |
# Water-n2
(
  # Skip the benchmark if its directory is missing, rather than running it
  # from the wrong place. The file named "input" is fed to the program on
  # stdin by run_test.
  cd "${SPLASH2}/codes/apps/water-nsquared" || exit 1
  test_input=input run_test ./WATER-NSQUARED
)

# Water-sp
(
  cd "${SPLASH2}/codes/apps/water-spatial" || exit 1
  test_input=input run_test ./WATER-SPATIAL
)
bart | 868d73a | 2008-06-04 13:02:22 +0000 | [diff] [blame] | 169 | |
| 170 | |
bart | c4a174f | 2008-06-03 11:41:19 +0000 | [diff] [blame] | 171 | |
| 172 | # Local variables: |
| 173 | # compile-command: "./run-splash2" |
| 174 | # End: |