Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 1 | #! /usr/bin/env python |
| 2 | |
| 3 | """Combine similar index entries into an entry and subentries. |
| 4 | |
| 5 | For example: |
| 6 | |
| 7 | \item {foobar} (in module flotz), 23 |
| 8 | \item {foobar} (in module whackit), 4323 |
| 9 | |
| 10 | becomes |
| 11 | |
| 12 | \item {foobar} |
| 13 | \subitem in module flotz, 23 |
| 14 | \subitem in module whackit, 4323 |
| 15 | |
| 16 | Note that an item which matches the format of a collapsable item but which |
| 17 | isn't part of a group of similar items is not modified. |
| 18 | """ |
| 19 | __version__ = '$Revision$' |
| 20 | |
| 21 | import re |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 22 | import StringIO |
| 23 | import sys |
| 24 | |
| 25 | |
Fred Drake | 071972e | 2002-10-16 15:30:17 +0000 | [diff] [blame] | 26 | def cmp_entries(e1, e2): |
| 27 | return cmp(e1[1].lower(), e2[1].lower()) or cmp(e1, e2) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 28 | |
| 29 | |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 30 | def dump_entries(write, entries): |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 31 | if len(entries) == 1: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 32 | write(" \\item %s (%s)%s\n" % entries[0]) |
| 33 | return |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 34 | write(" \item %s\n" % entries[0][0]) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 35 | # now sort these in a case insensitive manner: |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 36 | if len(entries) > 0: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 37 | entries.sort(cmp_entries) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 38 | for xxx, subitem, pages in entries: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 39 | write(" \subitem %s%s\n" % (subitem, pages)) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 40 | |
| 41 | |
Fred Drake | c02fbe5 | 1998-02-19 06:05:29 +0000 | [diff] [blame] | 42 | breakable_re = re.compile( |
| 43 | r" \\item (.*) [(](.*)[)]((?:(?:, \d+)|(?:, \\[a-z]*\{\d+\}))+)") |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 44 | |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 45 | |
| 46 | def process(ifn, ofn=None): |
| 47 | if ifn == "-": |
| 48 | ifp = sys.stdin |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 49 | else: |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 50 | ifp = open(ifn) |
| 51 | if ofn is None: |
| 52 | ofn = ifn |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 53 | ofp = StringIO.StringIO() |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 54 | entries = [] |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 55 | match = breakable_re.match |
| 56 | write = ofp.write |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 57 | while 1: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 58 | line = ifp.readline() |
| 59 | if not line: |
| 60 | break |
| 61 | m = match(line) |
| 62 | if m: |
| 63 | entry = m.group(1, 2, 3) |
| 64 | if entries and entries[-1][0] != entry[0]: |
| 65 | dump_entries(write, entries) |
| 66 | entries = [] |
| 67 | entries.append(entry) |
| 68 | elif entries: |
| 69 | dump_entries(write, entries) |
| 70 | entries = [] |
| 71 | write(line) |
| 72 | else: |
| 73 | write(line) |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 74 | del write |
| 75 | del match |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 76 | ifp.close() |
| 77 | data = ofp.getvalue() |
| 78 | ofp.close() |
| 79 | if ofn == "-": |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 80 | ofp = sys.stdout |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 81 | else: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 82 | ofp = open(ofn, "w") |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 83 | ofp.write(data) |
| 84 | ofp.close() |
| 85 | |
| 86 | |
| 87 | def main(): |
| 88 | import getopt |
| 89 | outfile = None |
| 90 | opts, args = getopt.getopt(sys.argv[1:], "o:") |
| 91 | for opt, val in opts: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame] | 92 | if opt in ("-o", "--output"): |
| 93 | outfile = val |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 94 | filename = args[0] |
| 95 | outfile = outfile or filename |
| 96 | process(filename, outfile) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 97 | |
| 98 | |
| 99 | if __name__ == "__main__": |
| 100 | main() |