Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 1 | #! /usr/bin/env python |
| 2 | |
| 3 | """Combine similar index entries into an entry and subentries. |
| 4 | |
| 5 | For example: |
| 6 | |
| 7 | \item {foobar} (in module flotz), 23 |
| 8 | \item {foobar} (in module whackit), 4323 |
| 9 | |
| 10 | becomes |
| 11 | |
| 12 | \item {foobar} |
| 13 | \subitem in module flotz, 23 |
| 14 | \subitem in module whackit, 4323 |
| 15 | |
| 16 | Note that an item which matches the format of a collapsable item but which |
| 17 | isn't part of a group of similar items is not modified. |
| 18 | """ |
| 19 | __version__ = '$Revision$' |
| 20 | |
| 21 | import re |
| 22 | import string |
| 23 | import StringIO |
| 24 | import sys |
| 25 | |
| 26 | |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 27 | def cmp_entries(e1, e2, lower=string.lower): |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 28 | return cmp(lower(e1[1]), lower(e2[1])) or cmp(e1, e2) |
| 29 | |
| 30 | |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 31 | def dump_entries(write, entries): |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 32 | if len(entries) == 1: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 33 | write(" \\item %s (%s)%s\n" % entries[0]) |
| 34 | return |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 35 | write(" \item %s\n" % entries[0][0]) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 36 | # now sort these in a case insensitive manner: |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 37 | if len(entries) > 0: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 38 | entries.sort(cmp_entries) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 39 | for xxx, subitem, pages in entries: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 40 | write(" \subitem %s%s\n" % (subitem, pages)) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 41 | |
| 42 | |
Fred Drake | c02fbe5 | 1998-02-19 06:05:29 +0000 | [diff] [blame] | 43 | breakable_re = re.compile( |
| 44 | r" \\item (.*) [(](.*)[)]((?:(?:, \d+)|(?:, \\[a-z]*\{\d+\}))+)") |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 45 | |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 46 | |
| 47 | def process(ifn, ofn=None): |
| 48 | if ifn == "-": |
| 49 | ifp = sys.stdin |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 50 | else: |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 51 | ifp = open(ifn) |
| 52 | if ofn is None: |
| 53 | ofn = ifn |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 54 | ofp = StringIO.StringIO() |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 55 | entries = [] |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 56 | match = breakable_re.match |
| 57 | write = ofp.write |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 58 | while 1: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 59 | line = ifp.readline() |
| 60 | if not line: |
| 61 | break |
| 62 | m = match(line) |
| 63 | if m: |
| 64 | entry = m.group(1, 2, 3) |
| 65 | if entries and entries[-1][0] != entry[0]: |
| 66 | dump_entries(write, entries) |
| 67 | entries = [] |
| 68 | entries.append(entry) |
| 69 | elif entries: |
| 70 | dump_entries(write, entries) |
| 71 | entries = [] |
| 72 | write(line) |
| 73 | else: |
| 74 | write(line) |
Fred Drake | a94d21f | 1998-02-10 21:35:49 +0000 | [diff] [blame] | 75 | del write |
| 76 | del match |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 77 | ifp.close() |
| 78 | data = ofp.getvalue() |
| 79 | ofp.close() |
| 80 | if ofn == "-": |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 81 | ofp = sys.stdout |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 82 | else: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 83 | ofp = open(ofn, "w") |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 84 | ofp.write(data) |
| 85 | ofp.close() |
| 86 | |
| 87 | |
| 88 | def main(): |
| 89 | import getopt |
| 90 | outfile = None |
| 91 | opts, args = getopt.getopt(sys.argv[1:], "o:") |
| 92 | for opt, val in opts: |
Fred Drake | 7787841 | 2000-10-07 12:50:05 +0000 | [diff] [blame^] | 93 | if opt in ("-o", "--output"): |
| 94 | outfile = val |
Fred Drake | 749f943 | 1999-03-03 19:36:23 +0000 | [diff] [blame] | 95 | filename = args[0] |
| 96 | outfile = outfile or filename |
| 97 | process(filename, outfile) |
Fred Drake | dd244a0 | 1998-02-09 22:17:52 +0000 | [diff] [blame] | 98 | |
| 99 | |
| 100 | if __name__ == "__main__": |
| 101 | main() |