maruel@chromium.org | 1f144a3 | 2011-11-24 04:13:44 +0900 | [diff] [blame] | 1 | #!/usr/bin/env python |
tony@chromium.org | dfc65a9 | 2011-09-15 12:35:53 +0900 | [diff] [blame] | 2 | # Copyright (c) 2011 The Chromium Authors. All rights reserved. |
| 3 | # Use of this source code is governed by a BSD-style license that can be |
| 4 | # found in the LICENSE file. |
| 5 | |
| 6 | """Escape non-ASCII characters in a UTF-8 input file as C hex escapes.""" |
| 7 | |
| 8 | import codecs |
| 9 | import optparse |
| 10 | import os |
| 11 | import sys |
| 12 | |
maruel@chromium.org | 1f144a3 | 2011-11-24 04:13:44 +0900 | [diff] [blame] | 13 | |
def main(argv):
  """Parse the command line and write the escaped copy of the input file.

  The output file is placed in the directory given by -o and is named after
  the input file with its final extension (which must be '.utf8') removed.

  Args:
    argv: Full argument vector including the program name at index 0, in the
        same shape as sys.argv.

  Returns:
    0 on success, 1 when a required argument is missing or invalid.
  """
  parser = optparse.OptionParser()
  usage = 'Usage: %prog -o <output_dir> <input_file>'
  parser.set_usage(usage)
  parser.add_option('-o', dest='output_dir')

  # argv still contains the program name, so a valid invocation leaves exactly
  # two positional entries: [program, input_file].
  options, arglist = parser.parse_args(argv)

  # print(...) with a single parenthesized argument emits the same text on
  # Python 2 (print statement) and Python 3 (print function).
  if not options.output_dir:
    print("output_dir required")
    return 1

  if len(arglist) != 2:
    print("input_file required")
    return 1

  in_filename = arglist[1]

  if not in_filename.endswith('.utf8'):
    print("input_file should end in .utf8")
    return 1

  # Drop the directory part and the trailing '.utf8' to form the output name.
  out_filename = os.path.join(options.output_dir, os.path.basename(
      os.path.splitext(in_filename)[0]))

  WriteEscapedFile(in_filename, out_filename)
  return 0
tony@chromium.org | dfc65a9 | 2011-09-15 12:35:53 +0900 | [diff] [blame] | 41 | |
| 42 | |
def WriteEscapedFile(in_filename, out_filename):
  """Copy a UTF-8 file to an ASCII file, hex-escaping non-ASCII characters.

  Every character above code point 127 is replaced by the '\\xNN' escapes of
  its UTF-8 bytes (lowercase hex). All other characters are copied unchanged.

  Args:
    in_filename: Path of the UTF-8 encoded file to read.
    out_filename: Path of the ASCII file to create or overwrite.
  """
  hex_digits = frozenset('0123456789abcdefABCDEF')

  # Close the input handle deterministically instead of leaking it.
  with codecs.open(in_filename, 'r', 'utf8') as in_file:
    input_data = in_file.read()

  pieces = []
  for i, char in enumerate(input_data):
    if ord(char) <= 127:
      pieces.append(char)
      continue

    # Format the escapes from the raw bytes rather than slicing repr(), whose
    # output differs between Python 2 ('...') and Python 3 (b'...').
    utf8_bytes = bytearray(char.encode('utf8'))
    pieces.append(''.join('\\x%02x' % byte for byte in utf8_bytes))

    # A C hex escape absorbs every hex digit that follows it, so when the next
    # character is a hex digit, emit "" to end and reopen the string literal.
    # The slice is empty at end of input; set membership keeps that case from
    # matching (an empty string is a substring of any string).
    if input_data[i + 1:i + 2] in hex_digits:
      pieces.append('""')

  with codecs.open(out_filename, 'w', 'ascii') as out_file:
    out_file.write(''.join(pieces))
| 53 | |
| 54 | |
if __name__ == '__main__':
  # Run as a script: pass the full argument vector to main() and use its
  # return value as the process exit status.
  exit_status = main(sys.argv)
  sys.exit(exit_status)