Kostya Serebryany | b415032 | 2013-11-15 11:51:08 +0000 | [diff] [blame] | 1 | #!/usr/bin/env python |
# Merge or print the coverage data collected by asan's coverage.
# Input files are sequences of 32-bit or 64-bit integers; the width is
# selected by the first command-line argument (32 or 64).
# We need to merge these integers into a set and then
# either print them (as hex) or dump them into another file.
| 6 | import array |
Sergey Matveev | 6cb47a08 | 2014-05-19 12:53:03 +0000 | [diff] [blame] | 7 | import struct |
Kostya Serebryany | b415032 | 2013-11-15 11:51:08 +0000 | [diff] [blame] | 8 | import sys |
Evgeniy Stepanov | 567e516 | 2014-05-27 12:37:52 +0000 | [diff] [blame] | 9 | import bisect |
| 10 | import os.path |
Kostya Serebryany | b415032 | 2013-11-15 11:51:08 +0000 | [diff] [blame] | 11 | |
# Name used as a prefix in diagnostics and in the usage text.  It is replaced
# by sys.argv[0] when the file is executed as a script.
prog_name = ""


def Usage():
    """Write the command-line synopsis to stderr and exit with status 1.

    Never returns: always raises SystemExit(1).
    """
    lines = [
        "Usage: ",
        " " + prog_name + " [32|64] merge file1 [file2 ...] > output",
        " " + prog_name + " [32|64] print file1 [file2 ...]",
        " " + prog_name + " [32|64] unpack file1 [file2 ...]",
        " " + prog_name + " [32|64] rawunpack file1 [file2 ...]",
        "",  # the synopsis is followed by one empty line
    ]
    sys.stderr.write("\n".join(lines) + "\n")
    # sys.exit() rather than the bare exit(): the latter is injected by the
    # `site` module for interactive use and is missing under `python -S`.
    sys.exit(1)
| 21 | |
def TypeCodeForBits(bits):
    """Return an `array` typecode for unsigned integers of the given width.

    bits: 64 selects 8-byte items; any other value selects 4-byte items
      (the same two-way split as before).

    The sizes of 'I' and 'L' depend on the platform's C types ('L' is only
    4 bytes on Windows and on 32-bit builds), so the candidates are probed
    for their actual item size instead of assuming 'L' is 64 bits wide.

    Raises ValueError if the interpreter has no typecode of that width.
    """
    wanted_size = 8 if bits == 64 else 4
    for code in ('I', 'L', 'Q'):
        try:
            if array.array(code).itemsize == wanted_size:
                return code
        except ValueError:
            # Typecode unknown to this interpreter (e.g. 'Q' on Python 2).
            continue
    raise ValueError('No array typecode with %d-byte items' % wanted_size)
| 27 | |
def ReadOneFile(path, bits):
    """Read one coverage file and return the set of integers it contains.

    path: file holding a flat sequence of fixed-width integers.
    bits: integer width, passed to TypeCodeForBits to pick the array type.

    A one-line summary with the number of items read goes to stderr.
    """
    with open(path, mode="rb") as stream:
        # Measure the file by seeking to its end, then rewind and read it all.
        stream.seek(0, os.SEEK_END)
        byte_count = stream.tell()
        stream.seek(0, os.SEEK_SET)
        raw = stream.read(byte_count)
        pcs = set(array.array(TypeCodeForBits(bits), raw))
    pc_count = byte_count * 8 // bits
    sys.stderr.write("%s: read %d PCs from %s\n" % (prog_name, pc_count, path))
    return pcs
| 36 | |
def Merge(files, bits):
    """Return the sorted union of the integers found in all given files.

    files: sequence of paths, each read with ReadOneFile.
    bits: integer width forwarded to ReadOneFile.

    A summary (file count and number of distinct values) goes to stderr.
    """
    merged = set()
    for path in files:
        merged |= ReadOneFile(path, bits)
    summary = "%s: %d files merged; %d PCs total" % (
        prog_name, len(files), len(merged))
    sys.stderr.write(summary + "\n")
    return sorted(merged)
| 44 | |
def PrintFiles(files, bits):
    """Merge the given files and print every value to stdout as hex.

    One "0x..." value is written per line, in ascending order.
    """
    for pc in Merge(files, bits):
        sys.stdout.write("0x%x\n" % pc)
| 49 | |
def MergeAndPrint(files, bits):
    """Merge the given files and dump the result to stdout in binary form.

    The output is raw array data, so it is refused (usage message, exit)
    when stdout is a terminal; redirect it to a file instead.
    """
    if sys.stdout.isatty():
        Usage()
    merged = Merge(files, bits)
    array.array(TypeCodeForBits(bits), merged).tofile(sys.stdout)
| 56 | |
Sergey Matveev | 6cb47a08 | 2014-05-19 12:53:03 +0000 | [diff] [blame] | 57 | |
def UnpackOneFile(path):
    """Split a packed coverage file into one file per (module, pid) pair.

    The packed file is a sequence of records.  Each record is a header of
    three native-order fields (int pid, unsigned module_length, unsigned
    blob_size) followed by module_length bytes of module name and blob_size
    bytes of data.  Each blob is appended to "<module>.<pid>.sancov".

    Raises Exception if the file ends in the middle of a record.  Truncated
    module/blob data used to be caught only by `assert`, which disappears
    under `python -O`; it is now always reported.
    """
    header_format = struct.Struct('iII')
    with open(path, mode="rb") as f:
        sys.stderr.write("%s: unpacking %s\n" % (prog_name, path))
        while True:
            header = f.read(header_format.size)
            if not header:
                # Clean end of file, exactly on a record boundary.
                return
            if len(header) < header_format.size:
                raise Exception('Error reading file %s' % path)
            pid, module_length, blob_size = header_format.unpack(header)
            module = f.read(module_length)
            blob = f.read(blob_size)
            if len(module) != module_length or len(blob) != blob_size:
                raise Exception('Error reading file %s' % path)
            if not isinstance(module, str):
                # On Python 3 the name is read as bytes; without decoding,
                # "%s" would format it as "b'...'".
                module = module.decode()
            extracted_file = "%s.%d.sancov" % (module, pid)
            sys.stderr.write("%s: extracting %s\n"
                             % (prog_name, extracted_file))
            # The packed file may contain multiple blobs for the same
            # pid/module pair. Append to the end of the file instead of
            # overwriting.
            with open(extracted_file, 'ab') as f2:
                f2.write(blob)
| 80 | |
| 81 | |
def Unpack(files):
    """Run UnpackOneFile on each packed coverage file, in the order given."""
    for packed_path in files:
        UnpackOneFile(packed_path)
| 85 | |
def UnpackOneRawFile(path, map_path, bits):
    """Split a raw PC dump into per-module files using its memory map.

    path: raw file holding a flat sequence of `bits`-wide integers (PCs);
      its name must end in '.sancov.raw'.
    map_path: text file whose first line is the bit width in decimal and
      whose remaining lines are "<start> <end> <base> <module path>" with
      the three numbers in hex.
    bits: expected integer width; must match the first line of the map.

    For each mapping that contains at least one PC, the PCs are rebased
    (pc - base), sorted and appended to
    "<module path>.<basename of path without '.raw'>".  Zero PCs are
    skipped.  PCs that fall in no mapping are reported on stderr and
    skipped.

    Raises Exception if the map's bit width differs from `bits`.
    """
    mem_map = []
    with open(map_path, mode="rt") as f_map:
        sys.stderr.write("%s: reading map %s\n" % (prog_name, map_path))
        if bits != int(f_map.readline()):
            raise Exception('Wrong bits size in the map')
        for line in f_map:
            parts = line.rstrip().split()
            # The module path may itself contain spaces; re-join the rest.
            mem_map.append((int(parts[0], 16),
                            int(parts[1], 16),
                            int(parts[2], 16),
                            ' '.join(parts[3:])))
    mem_map.sort(key=lambda m: m[0])
    mem_map_keys = [m[0] for m in mem_map]

    with open(path, mode="rb") as f:
        sys.stderr.write("%s: unpacking %s\n" % (prog_name, path))

        f.seek(0, 2)
        size = f.tell()
        f.seek(0, 0)
        pcs = array.array(TypeCodeForBits(bits), f.read(size))

    mem_map_pcs = [[] for _ in mem_map]
    for pc in pcs:
        if pc == 0:
            continue
        # Index of the last mapping whose start is <= pc, or -1 if none.
        map_idx = bisect.bisect(mem_map_keys, pc) - 1
        # map_idx == -1 means pc lies below every mapping (or the map is
        # empty).  It must not be used as an index: -1 would silently pick
        # the last mapping.
        if map_idx < 0 or pc >= mem_map[map_idx][1]:
            sys.stderr.write(
                "warning: %s: pc %x outside of any known mapping\n"
                % (prog_name, pc))
            continue
        base = mem_map[map_idx][2]
        mem_map_pcs[map_idx].append(pc - base)

    for (start, end, base, module_path), pc_list in zip(mem_map, mem_map_pcs):
        if len(pc_list) == 0:
            continue
        assert path.endswith('.sancov.raw')
        # Drop the trailing '.raw' so the output name ends in '.sancov'.
        dst_path = module_path + '.' + os.path.basename(path)[:-4]
        sys.stderr.write("%s: writing %d PCs to %s\n"
                         % (prog_name, len(pc_list), dst_path))
        arr = array.array(TypeCodeForBits(bits))
        arr.fromlist(sorted(pc_list))
        with open(dst_path, 'ab') as f2:
            arr.tofile(f2)
| 129 | |
def RawUnpack(files, bits):
    """Unpack each '*.sancov.raw' file using its sibling '*.sancov.map'.

    Files are handled in order; the first name without the '.sancov.raw'
    suffix raises Exception (earlier files have already been unpacked).
    """
    for raw_path in files:
        if raw_path.endswith('.sancov.raw'):
            # Swap the trailing 'raw' for 'map' to get the map file name.
            map_path = raw_path[:-len('raw')] + 'map'
            UnpackOneRawFile(raw_path, map_path, bits)
        else:
            raise Exception('Unexpected raw file name %s' % raw_path)
Sergey Matveev | 6cb47a08 | 2014-05-19 12:53:03 +0000 | [diff] [blame] | 136 | |
if __name__ == '__main__':
    # Command line: <prog> <32|64> <command> file1 [file2 ...]
    prog_name = sys.argv[0]
    if len(sys.argv) <= 3:
        Usage()

    bits = {"32": 32, "64": 64}.get(sys.argv[1])
    if bits is None:
        Usage()

    command = sys.argv[2]
    inputs = sys.argv[3:]
    # "unpack" ignores the bit width; every other command needs it.
    handlers = {
        "print": lambda: PrintFiles(inputs, bits),
        "merge": lambda: MergeAndPrint(inputs, bits),
        "unpack": lambda: Unpack(inputs),
        "rawunpack": lambda: RawUnpack(inputs, bits),
    }
    # Unknown commands fall through to the usage message (which exits).
    handlers.get(command, Usage)()