Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 1 | """ttLib/sfnt.py -- low-level module to deal with the sfnt file format. |
| 2 | |
| 3 | Defines two public classes: |
| 4 | SFNTReader |
| 5 | SFNTWriter |
| 6 | |
| 7 | (Normally you don't have to use these classes explicitly; they are |
| 8 | used automatically by ttLib.TTFont.) |
| 9 | |
| 10 | The reading and writing of sfnt files is separated in two distinct |
| 11 | classes, since whenever to number of tables changes or whenever |
| 12 | a table's length chages you need to rewrite the whole file anyway. |
| 13 | """ |
| 14 | |
jvr | 9be387c | 2008-03-01 11:43:01 +0000 | [diff] [blame] | 15 | import sys |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 16 | import struct, sstruct |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 17 | import os |
| 18 | |
jvr | 04b3204 | 2002-05-14 12:09:10 +0000 | [diff] [blame] | 19 | |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 20 | class SFNTReader: |
| 21 | |
pabs3 | 7e91e77 | 2009-02-22 08:55:00 +0000 | [diff] [blame] | 22 | def __init__(self, file, checkChecksums=1, fontNumber=-1): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 23 | self.file = file |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 24 | self.checkChecksums = checkChecksums |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 25 | data = self.file.read(sfntDirectorySize) |
| 26 | if len(data) <> sfntDirectorySize: |
| 27 | from fontTools import ttLib |
| 28 | raise ttLib.TTLibError, "Not a TrueType or OpenType font (not enough data)" |
| 29 | sstruct.unpack(sfntDirectoryFormat, data, self) |
pabs3 | 7e91e77 | 2009-02-22 08:55:00 +0000 | [diff] [blame] | 30 | if self.sfntVersion == "ttcf": |
| 31 | assert ttcHeaderSize == sfntDirectorySize |
| 32 | sstruct.unpack(ttcHeaderFormat, data, self) |
| 33 | assert self.Version == 0x00010000 or self.Version == 0x00020000, "unrecognized TTC version 0x%08x" % self.Version |
| 34 | if not 0 <= fontNumber < self.numFonts: |
| 35 | from fontTools import ttLib |
| 36 | raise ttLib.TTLibError, "specify a font number between 0 and %d (inclusive)" % (self.numFonts - 1) |
| 37 | offsetTable = struct.unpack(">%dL" % self.numFonts, self.file.read(self.numFonts * 4)) |
| 38 | if self.Version == 0x00020000: |
| 39 | pass # ignoring version 2.0 signatures |
| 40 | self.file.seek(offsetTable[fontNumber]) |
| 41 | data = self.file.read(sfntDirectorySize) |
| 42 | sstruct.unpack(sfntDirectoryFormat, data, self) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 43 | if self.sfntVersion not in ("\000\001\000\000", "OTTO", "true"): |
| 44 | from fontTools import ttLib |
| 45 | raise ttLib.TTLibError, "Not a TrueType or OpenType font (bad sfntVersion)" |
| 46 | self.tables = {} |
| 47 | for i in range(self.numTables): |
| 48 | entry = SFNTDirectoryEntry() |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 49 | entry.fromFile(self.file) |
jvr | ce1d50a | 2002-05-12 17:02:50 +0000 | [diff] [blame] | 50 | if entry.length > 0: |
| 51 | self.tables[entry.tag] = entry |
| 52 | else: |
| 53 | # Ignore zero-length tables. This doesn't seem to be documented, |
| 54 | # yet it's apparently how the Windows TT rasterizer behaves. |
| 55 | # Besides, at least one font has been sighted which actually |
| 56 | # *has* a zero-length table. |
| 57 | pass |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 58 | |
| 59 | def has_key(self, tag): |
| 60 | return self.tables.has_key(tag) |
| 61 | |
| 62 | def keys(self): |
| 63 | return self.tables.keys() |
| 64 | |
| 65 | def __getitem__(self, tag): |
| 66 | """Fetch the raw table data.""" |
| 67 | entry = self.tables[tag] |
| 68 | self.file.seek(entry.offset) |
| 69 | data = self.file.read(entry.length) |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 70 | if self.checkChecksums: |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 71 | if tag == 'head': |
| 72 | # Beh: we have to special-case the 'head' table. |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 73 | checksum = calcChecksum(data[:8] + '\0\0\0\0' + data[12:]) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 74 | else: |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 75 | checksum = calcChecksum(data) |
| 76 | if self.checkChecksums > 1: |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 77 | # Be obnoxious, and barf when it's wrong |
| 78 | assert checksum == entry.checksum, "bad checksum for '%s' table" % tag |
| 79 | elif checksum <> entry.checkSum: |
| 80 | # Be friendly, and just print a warning. |
| 81 | print "bad checksum for '%s' table" % tag |
| 82 | return data |
| 83 | |
jvr | f707463 | 2002-05-04 22:04:02 +0000 | [diff] [blame] | 84 | def __delitem__(self, tag): |
| 85 | del self.tables[tag] |
| 86 | |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 87 | def close(self): |
| 88 | self.file.close() |
| 89 | |
| 90 | |
| 91 | class SFNTWriter: |
| 92 | |
| 93 | def __init__(self, file, numTables, sfntVersion="\000\001\000\000"): |
| 94 | self.file = file |
| 95 | self.numTables = numTables |
| 96 | self.sfntVersion = sfntVersion |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 97 | self.searchRange, self.entrySelector, self.rangeShift = getSearchRange(numTables) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 98 | self.nextTableOffset = sfntDirectorySize + numTables * sfntDirectoryEntrySize |
| 99 | # clear out directory area |
| 100 | self.file.seek(self.nextTableOffset) |
| 101 | # make sure we're actually where we want to be. (XXX old cStringIO bug) |
| 102 | self.file.write('\0' * (self.nextTableOffset - self.file.tell())) |
| 103 | self.tables = {} |
| 104 | |
| 105 | def __setitem__(self, tag, data): |
| 106 | """Write raw table data to disk.""" |
| 107 | if self.tables.has_key(tag): |
| 108 | # We've written this table to file before. If the length |
jvr | 04b3204 | 2002-05-14 12:09:10 +0000 | [diff] [blame] | 109 | # of the data is still the same, we allow overwriting it. |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 110 | entry = self.tables[tag] |
| 111 | if len(data) <> entry.length: |
| 112 | from fontTools import ttLib |
| 113 | raise ttLib.TTLibError, "cannot rewrite '%s' table: length does not match directory entry" % tag |
| 114 | else: |
| 115 | entry = SFNTDirectoryEntry() |
| 116 | entry.tag = tag |
| 117 | entry.offset = self.nextTableOffset |
| 118 | entry.length = len(data) |
| 119 | self.nextTableOffset = self.nextTableOffset + ((len(data) + 3) & ~3) |
| 120 | self.file.seek(entry.offset) |
| 121 | self.file.write(data) |
jvr | c63ac64 | 2008-06-17 20:41:15 +0000 | [diff] [blame] | 122 | # Add NUL bytes to pad the table data to a 4-byte boundary. |
| 123 | # Don't depend on f.seek() as we need to add the padding even if no |
| 124 | # subsequent write follows (seek is lazy), ie. after the final table |
| 125 | # in the font. |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 126 | self.file.write('\0' * (self.nextTableOffset - self.file.tell())) |
jvr | c63ac64 | 2008-06-17 20:41:15 +0000 | [diff] [blame] | 127 | assert self.nextTableOffset == self.file.tell() |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 128 | |
| 129 | if tag == 'head': |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 130 | entry.checkSum = calcChecksum(data[:8] + '\0\0\0\0' + data[12:]) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 131 | else: |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 132 | entry.checkSum = calcChecksum(data) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 133 | self.tables[tag] = entry |
| 134 | |
jvr | 28ae196 | 2004-11-16 10:37:59 +0000 | [diff] [blame] | 135 | def close(self): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 136 | """All tables must have been written to disk. Now write the |
| 137 | directory. |
| 138 | """ |
| 139 | tables = self.tables.items() |
| 140 | tables.sort() |
| 141 | if len(tables) <> self.numTables: |
| 142 | from fontTools import ttLib |
| 143 | raise ttLib.TTLibError, "wrong number of tables; expected %d, found %d" % (self.numTables, len(tables)) |
| 144 | |
| 145 | directory = sstruct.pack(sfntDirectoryFormat, self) |
| 146 | |
| 147 | self.file.seek(sfntDirectorySize) |
jvr | f509c0f | 2003-08-22 19:38:37 +0000 | [diff] [blame] | 148 | seenHead = 0 |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 149 | for tag, entry in tables: |
jvr | f509c0f | 2003-08-22 19:38:37 +0000 | [diff] [blame] | 150 | if tag == "head": |
| 151 | seenHead = 1 |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 152 | directory = directory + entry.toString() |
jvr | f509c0f | 2003-08-22 19:38:37 +0000 | [diff] [blame] | 153 | if seenHead: |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 154 | self.writeMasterChecksum(directory) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 155 | self.file.seek(0) |
| 156 | self.file.write(directory) |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 157 | |
| 158 | def _calcMasterChecksum(self, directory): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 159 | # calculate checkSumAdjustment |
| 160 | tags = self.tables.keys() |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 161 | checksums = [] |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 162 | for i in range(len(tags)): |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 163 | checksums.append(self.tables[tags[i]].checkSum) |
| 164 | |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 165 | directory_end = sfntDirectorySize + len(self.tables) * sfntDirectoryEntrySize |
| 166 | assert directory_end == len(directory) |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 167 | |
| 168 | checksums.append(calcChecksum(directory)) |
| 169 | checksum = sum(checksums) & 0xffffffff |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 170 | # BiboAfba! |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 171 | checksumadjustment = (0xB1B0AFBA - checksum) & 0xffffffff |
| 172 | return checksumadjustment |
| 173 | |
| 174 | def writeMasterChecksum(self, directory): |
| 175 | checksumadjustment = self._calcMasterChecksum(directory) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 176 | # write the checksum to the file |
| 177 | self.file.seek(self.tables['head'].offset + 8) |
pabs3 | 0e2aece | 2009-03-24 09:42:15 +0000 | [diff] [blame] | 178 | self.file.write(struct.pack(">L", checksumadjustment)) |
jvr | 1ebda67 | 2008-03-08 20:29:30 +0000 | [diff] [blame] | 179 | |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 180 | |
| 181 | # -- sfnt directory helpers and cruft |
| 182 | |
pabs3 | 7e91e77 | 2009-02-22 08:55:00 +0000 | [diff] [blame] | 183 | ttcHeaderFormat = """ |
| 184 | > # big endian |
| 185 | TTCTag: 4s # "ttcf" |
| 186 | Version: L # 0x00010000 or 0x00020000 |
| 187 | numFonts: L # number of fonts |
| 188 | # OffsetTable[numFonts]: L # array with offsets from beginning of file |
| 189 | # ulDsigTag: L # version 2.0 only |
| 190 | # ulDsigLength: L # version 2.0 only |
| 191 | # ulDsigOffset: L # version 2.0 only |
| 192 | """ |
| 193 | |
| 194 | ttcHeaderSize = sstruct.calcsize(ttcHeaderFormat) |
| 195 | |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 196 | sfntDirectoryFormat = """ |
| 197 | > # big endian |
jvr | b0e5f29 | 2002-05-13 11:21:48 +0000 | [diff] [blame] | 198 | sfntVersion: 4s |
| 199 | numTables: H # number of tables |
| 200 | searchRange: H # (max2 <= numTables)*16 |
| 201 | entrySelector: H # log2(max2 <= numTables) |
| 202 | rangeShift: H # numTables*16-searchRange |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 203 | """ |
| 204 | |
| 205 | sfntDirectorySize = sstruct.calcsize(sfntDirectoryFormat) |
| 206 | |
| 207 | sfntDirectoryEntryFormat = """ |
| 208 | > # big endian |
jvr | b0e5f29 | 2002-05-13 11:21:48 +0000 | [diff] [blame] | 209 | tag: 4s |
pabs3 | 0e2aece | 2009-03-24 09:42:15 +0000 | [diff] [blame] | 210 | checkSum: L |
| 211 | offset: L |
| 212 | length: L |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 213 | """ |
| 214 | |
| 215 | sfntDirectoryEntrySize = sstruct.calcsize(sfntDirectoryEntryFormat) |
| 216 | |
| 217 | class SFNTDirectoryEntry: |
| 218 | |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 219 | def fromFile(self, file): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 220 | sstruct.unpack(sfntDirectoryEntryFormat, |
| 221 | file.read(sfntDirectoryEntrySize), self) |
| 222 | |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 223 | def fromString(self, str): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 224 | sstruct.unpack(sfntDirectoryEntryFormat, str, self) |
| 225 | |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 226 | def toString(self): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 227 | return sstruct.pack(sfntDirectoryEntryFormat, self) |
| 228 | |
| 229 | def __repr__(self): |
| 230 | if hasattr(self, "tag"): |
| 231 | return "<SFNTDirectoryEntry '%s' at %x>" % (self.tag, id(self)) |
| 232 | else: |
| 233 | return "<SFNTDirectoryEntry at %x>" % id(self) |
| 234 | |
| 235 | |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 236 | def calcChecksum(data): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 237 | """Calculate the checksum for an arbitrary block of data. |
| 238 | Optionally takes a 'start' argument, which allows you to |
| 239 | calculate a checksum in chunks by feeding it a previous |
| 240 | result. |
| 241 | |
| 242 | If the data length is not a multiple of four, it assumes |
| 243 | it is to be padded with null byte. |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 244 | |
| 245 | >>> print calcChecksum("abcd") |
| 246 | 1633837924 |
| 247 | >>> print calcChecksum("abcdxyz") |
| 248 | 3655064932 |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 249 | """ |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 250 | remainder = len(data) % 4 |
| 251 | if remainder: |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 252 | data += "\0" * (4 - remainder) |
| 253 | value = 0 |
| 254 | blockSize = 4096 |
| 255 | assert blockSize % 4 == 0 |
| 256 | for i in xrange(0, len(data), blockSize): |
| 257 | block = data[i:i+blockSize] |
| 258 | longs = struct.unpack(">%dL" % (len(block) // 4), block) |
| 259 | value = (value + sum(longs)) & 0xffffffff |
| 260 | return value |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 261 | |
| 262 | |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 263 | def maxPowerOfTwo(x): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 264 | """Return the highest exponent of two, so that |
| 265 | (2 ** exponent) <= x |
| 266 | """ |
| 267 | exponent = 0 |
| 268 | while x: |
| 269 | x = x >> 1 |
| 270 | exponent = exponent + 1 |
Just | fdea99d | 2000-08-23 12:34:44 +0000 | [diff] [blame] | 271 | return max(exponent - 1, 0) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 272 | |
| 273 | |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 274 | def getSearchRange(n): |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 275 | """Calculate searchRange, entrySelector, rangeShift for the |
| 276 | sfnt directory. 'n' is the number of tables. |
| 277 | """ |
| 278 | # This stuff needs to be stored in the file, because? |
| 279 | import math |
jvr | ea9dfa9 | 2002-05-12 17:14:50 +0000 | [diff] [blame] | 280 | exponent = maxPowerOfTwo(n) |
Just | 7842e56 | 1999-12-16 21:34:53 +0000 | [diff] [blame] | 281 | searchRange = (2 ** exponent) * 16 |
| 282 | entrySelector = exponent |
| 283 | rangeShift = n * 16 - searchRange |
| 284 | return searchRange, entrySelector, rangeShift |
| 285 | |
jvr | 91bca42 | 2012-10-18 12:49:22 +0000 | [diff] [blame^] | 286 | |
| 287 | if __name__ == "__main__": |
| 288 | import doctest |
| 289 | doctest.testmod() |