Tim Peters | 4f109c1 | 2002-04-19 18:41:46 +0000 | [diff] [blame] | 1 | """ |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 2 | Makes the necessary files to convert from plain html of |
| 3 | Python 1.5 and 1.5.x Documentation to |
| 4 | Microsoft HTML Help format version 1.1 |
| 5 | Doesn't change the html's docs. |
| 6 | |
| 7 | by hernan.foffani@iname.com |
| 8 | no copyright and no responsibilities. |
| 9 | |
| 10 | modified by Dale Nagata for Python 1.5.2 |
| 11 | |
| 12 | Renamed from make_chm.py to prechm.py, and checked into the Python |
| 13 | project, 19-Apr-2002 by Tim Peters. Assorted modifications by Tim |
| 14 | and Fred Drake. Obtained from Robin Dunn's .chm packaging of the |
| 15 | Python 2.2 docs, at <http://alldunn.com/python/>. |
Tim Peters | 4f109c1 | 2002-04-19 18:41:46 +0000 | [diff] [blame] | 16 | """ |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 17 | |
| 18 | import sys |
| 19 | import os |
Tim Peters | e21095e | 2002-04-20 08:36:42 +0000 | [diff] [blame] | 20 | from formatter import NullWriter, AbstractFormatter |
| 21 | from htmllib import HTMLParser |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 22 | import getopt |
Tim Peters | 4545407 | 2002-04-20 20:26:26 +0000 | [diff] [blame] | 23 | import cgi |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 24 | |
# Command-line help text printed by usage().
# -v is mandatory: do_it() bails out through usage() when it is missing,
# so the text must not advertise a default version.  The version list
# mirrors the keys of supported_libraries.
usage_mode = '''
Usage: prechm.py [-c] [-k] [-p] -v version filename
    -c: does not build filename.hhc (Table of Contents)
    -k: does not build filename.hhk (Index)
    -p: does not build filename.hhp (Project File) nor filename.stp
        (full text search stop list)
    -v version: makes help for the python <version> docs (required);
        one of 1.5, 1.5.1, 1.5.2, 2.0.0, 2.1.1, 2.2, 2.3, 2.4, 2.5
'''
| 33 | |
# Project file (*.hhp) template.  'arch' is the file basename (like
# the pythlp in pythlp.hhp); 'version' is the doc version number (like
# the 2.2 in Python 2.2).  do_project() fills the template in with the
# % operator and then appends one line per file after [FILES].
# The magical numbers in the long line under [WINDOWS] set most of the
# user-visible features (visible buttons, tabs, etc).
# About 0x10384e:  This defines the buttons in the help viewer.  The
# following defns are taken from htmlhelp.h.  Not all possibilities
# actually work, and not all those that work are available from the Help
# Workshop GUI.  In particular, the Zoom/Font button works and is not
# available from the GUI.  The ones we're using are marked with 'x'
# (OR-ing the marked values together gives 0x10384e):
#
#    0x000002   Hide/Show   x
#    0x000004   Back        x
#    0x000008   Forward     x
#    0x000010   Stop
#    0x000020   Refresh
#    0x000040   Home        x
#    0x000080   Forward
#    0x000100   Back
#    0x000200   Notes
#    0x000400   Contents
#    0x000800   Locate      x
#    0x001000   Options     x
#    0x002000   Print       x
#    0x004000   Index
#    0x008000   Search
#    0x010000   History
#    0x020000   Favorites
#    0x040000   Jump 1
#    0x080000   Jump 2
#    0x100000   Zoom/Font   x
#    0x200000   TOC Next
#    0x400000   TOC Prev
#
# Note the backslash-newline inside the literal: it joins the two
# [WINDOWS] source lines into a single line of output.

project_template = '''
[OPTIONS]
Compiled file=%(arch)s.chm
Contents file=%(arch)s.hhc
Default Window=%(arch)s
Default topic=index.html
Display compile progress=No
Full text search stop list file=%(arch)s.stp
Full-text search=Yes
Index file=%(arch)s.hhk
Language=0x409
Title=Python %(version)s Documentation

[WINDOWS]
%(arch)s="Python %(version)s Documentation","%(arch)s.hhc","%(arch)s.hhk",\
"index.html","index.html",,,,,0x63520,220,0x10384e,[0,0,1024,768],,,,,,,0

[FILES]
'''
| 87 | |
# Fixed preamble of the table-of-contents (.hhc) file; do_content()
# writes it before the per-book entries.  It opens the outermost <UL>,
# which contents_footer closes again.
# The registered-trademark sign is spelled as the HTML entity &reg; so
# that this source file stays pure ASCII: a raw non-ASCII character in a
# file without an encoding declaration is rejected by Python (PEP 263).
contents_header = '''\
<!DOCTYPE HTML PUBLIC "-//IETF//DTD HTML//EN">
<HTML>
<HEAD>
<meta name="GENERATOR" content="Microsoft&reg; HTML Help Workshop 4.1">
<!-- Sitemap 1.0 -->
</HEAD><BODY>
<OBJECT type="text/site properties">
<param name="Window Styles" value="0x801227">
<param name="ImageType" value="Folder">
</OBJECT>
<UL>
'''
| 101 | |
# Closing counterpart of contents_header: ends the outermost <UL> and
# the document.  Written last by do_content().
contents_footer = '''\
</UL></BODY></HTML>
'''

# One sitemap entry.  Filled in with a (name, local) pair via the %
# operator: the first %s is the text shown for the entry, the second is
# the page it points at.
object_sitemap = '''\
<OBJECT type="text/sitemap">
<param name="Name" value="%s">
<param name="Local" value="%s">
</OBJECT>
'''
| 112 | |
# List of words the full text search facility shouldn't index.  This
# becomes file ARCH.stp.  Note that this list must be pretty small!
# Different versions of the MS docs claim the file has a maximum size of
# 256 or 512 bytes (including \r\n at the end of each line).
# Note that "and", "or", "not" and "near" are operators in the search
# language, so no point indexing them even if we wanted to.
# The layout of the literal is only for readability: do_it() splits it
# on whitespace, sorts the words and writes them one per line.
stop_list = '''
a  and  are  as  at
be  but  by
for
if  in  into  is  it
near  no  not
of  on  or
such
that  the  their  then  there  these  they  this  to
was  will  with
'''
| 130 | |
# Normalize a page name.  s is a string or None.  A false value (None or
# the empty string) is handed back unchanged; any other string comes back
# with '.html' appended, unless it already ends that way.
def addhtml(s):
    if not s or s.endswith('.html'):
        return s
    return s + '.html'
| 138 | |
# A "book" in HTMLHelp terms, i.e. one doc directory in Python terms.
# Plain record holding the directory, the display title, and the names
# of the first, contents and index pages.  Page names are passed through
# addhtml(), so callers may leave off the '.html' suffix; the contents
# and index pages are optional.
class Book:
    def __init__(self, directory, title, firstpage,
                 contentpage=None, indexpage=None):
        self.directory, self.title = directory, title
        pages = (firstpage, contentpage, indexpage)
        self.firstpage, self.contentpage, self.indexpage = map(addhtml, pages)
| 149 | |
# Library Doc list of books, keyed by the docs version string given to
# the -v option (do_it() looks the version up here).  Each value is the
# list of books making up that version of the docs, in the order they
# are processed.
# each 'book' : Book(Dir, Title, First page, Content page, Index page)
# Content page and Index page are optional; page names are given without
# the '.html' suffix, which Book adds.
supported_libraries = {
    '2.5':
    [
        Book('.', 'Main page', 'index'),
        Book('.', 'Global Module Index', 'modindex'),
        Book('whatsnew', "What's New", 'index', 'contents'),
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents'),
        Book('inst','Installing Python Modules', 'inst', 'index'),
        Book('dist','Distributing Python Modules', 'dist', 'index', 'genindex'),
    ],

    '2.4':
    [
        Book('.', 'Main page', 'index'),
        Book('.', 'Global Module Index', 'modindex'),
        Book('whatsnew', "What's New", 'index', 'contents'),
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents'),
        Book('inst','Installing Python Modules', 'inst', 'index'),
        Book('dist','Distributing Python Modules', 'dist', 'index', 'genindex'),
    ],

    '2.3':
    [
        Book('.', 'Main page', 'index'),
        Book('.', 'Global Module Index', 'modindex'),
        Book('whatsnew', "What's New", 'index', 'contents'),
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents'),
        Book('inst','Installing Python Modules', 'inst', 'index'),
        Book('dist','Distributing Python Modules', 'dist', 'index'),
    ],

    '2.2':
    [
        Book('.', 'Main page', 'index'),
        Book('.', 'Global Module Index', 'modindex'),
        Book('whatsnew', "What's New", 'index', 'contents'),
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents'),
        Book('inst','Installing Python Modules', 'inst', 'index'),
        Book('dist','Distributing Python Modules', 'dist', 'index'),
    ],

    '2.1.1':
    [
        Book('.', 'Main page', 'index'),
        Book('.', 'Global Module Index', 'modindex'),
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents'),
        Book('inst','Installing Python Modules', 'inst', 'index'),
        Book('dist','Distributing Python Modules', 'dist', 'index'),
    ],

    '2.0.0':
    [
        Book('.', 'Global Module Index', 'modindex'),
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents'),
        Book('inst','Installing Python Modules', 'inst', 'contents'),
        Book('dist','Distributing Python Modules', 'dist', 'contents'),
    ],

    # <dnagata@creo.com> Apr 17/99: library for 1.5.2 version:
    # <hernan.foffani@iname.com> May 01/99: library for 1.5.2 (04/30/99):
    '1.5.2':
    [
        Book('tut','Tutorial','tut','node2'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref','contents','genindex'),
        Book('mac','Macintosh Reference','mac','contents','genindex'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex'),
        Book('doc','Documenting Python','doc','contents')
    ],

    # library for 1.5.1 version:
    '1.5.1':
    [
        Book('tut','Tutorial','tut','contents'),
        Book('lib','Library Reference','lib','contents','genindex'),
        Book('ref','Language Reference','ref-1','ref-2','ref-11'),
        Book('ext','Extending and Embedding','ext','contents'),
        Book('api','Python/C API','api','contents','genindex')
    ],

    # library for 1.5 version:
    '1.5':
    [
        Book('tut','Tutorial','tut','node1'),
        Book('lib','Library Reference','lib','node1','node268'),
        Book('ref','Language Reference','ref-1','ref-2','ref-11'),
        Book('ext','Extending and Embedding','ext','node1'),
        Book('api','Python/C API','api','node1','node48')
    ]
}
| 279 | |
# AlmostNullWriter produces no output at all.  Its only job is to
# remember the text handed to send_flowing_data(), so that the text
# found between an anchor begin/end pair can be retrieved afterwards
# (e.g. to build TOC entries).

class AlmostNullWriter(NullWriter):

    def __init__(self):
        NullWriter.__init__(self)
        self.saved_clear()

    # Remember a piece of text, minus surrounding whitespace.  Pieces
    # that are nothing but whitespace are dropped.
    def send_flowing_data(self, data):
        text = data.strip()
        if not text:
            return
        self.saved.append(text)

    # Throw away everything remembered so far.
    def saved_clear(self):
        self.saved = []

    # Return the remembered pieces as one string, joined by single
    # spaces.
    def saved_get(self):
        separator = ' '
        return separator.join(self.saved)
| 302 | |
# Shared base of the contents and index page parsers.  While inside at
# least one "group" (see begin_group/finish_group) every anchor that is
# found is turned into an object_sitemap entry written to the output
# file; anchors outside any group (headers, footers, etc) are ignored.
class HelpHtmlParser(HTMLParser):

    def __init__(self, formatter, path, output):
        HTMLParser.__init__(self, formatter)
        self.path = path    # relative path
        self.ft = output    # output file
        self.indent = 0     # number of tabs for pretty printing of files
        self.proc = False   # True when actively processing, else False
                            # (headers, footers, etc)
        # XXX This shouldn't need to be a stack -- anchors shouldn't nest.
        # XXX See SF bug <http://www.python.org/sf/546579>.
        self.hrefstack = [] # stack of hrefs from anchor begins

    # Enter one more nesting level and switch processing on.
    def begin_group(self):
        self.indent += 1
        self.proc = True

    # Leave one nesting level.
    def finish_group(self):
        self.indent -= 1
        # stop processing when back to top level
        self.proc = (self.indent > 0)

    def anchor_bgn(self, href, name, type):
        # XXX See SF bug <http://www.python.org/sf/546579>.
        # XXX index.html for the 2.2.1 language reference manual contains
        # XXX nested <a></a> tags in the entry for the section on blank
        # XXX lines.  We want to ignore the nested part completely, so
        # XXX an anchor opened while another is still pending is skipped.
        if not self.proc or self.hrefstack:
            return
        self.saved_clear()
        self.hrefstack.append(href)

    def anchor_end(self):
        # XXX See XXX above:  nothing to do unless an anchor is pending.
        if not (self.proc and self.hrefstack):
            return
        title = cgi.escape(self.saved_get(), True)
        href = self.hrefstack.pop()
        path = self.path + '/' + href
        self.tab(object_sitemap % (title, path))

    def start_dl(self, atr_val):
        self.begin_group()

    def end_dl(self):
        self.finish_group()

    def do_dt(self, atr_val):
        # no trailing newline on purpose!
        self.tab("<LI>")

    # Write text to output file.
    def write(self, text):
        self.ft.write(text)

    # Write self.indent tabs to the output file, followed by text (if
    # there is any).
    def tab(self, text=''):
        self.write('\t' * self.indent)
        if not text:
            return
        self.write(text)

    # Forget all saved text.
    def saved_clear(self):
        writer = self.formatter.writer
        writer.saved_clear()

    # Return all saved text as a string.
    def saved_get(self):
        writer = self.formatter.writer
        return writer.saved_get()
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 370 | |
# Parser for index pages.  The behaviour inherited from HelpHtmlParser
# is all that is needed, so nothing is overridden here.
class IdxHlpHtmlParser(HelpHtmlParser):
    """Index page parser; identical in behaviour to HelpHtmlParser."""
| 374 | |
# Parser for table-of-contents pages.  Both <dl> and <ul> lists in the
# input become nested <UL> lists in the output, and <li> items (as well
# as the <dt> items handled by the base class) become <LI> items.
class TocHlpHtmlParser(HelpHtmlParser):

    # Opening a list: go one level deeper first, so that the <UL> tag is
    # written at the new indentation.
    def start_dl(self, atr_val):
        self.begin_group()
        self.tab('<UL>\n')

    # Closing a list: go back up one level first, so that the </UL> tag
    # is written at the outer indentation.
    def end_dl(self):
        self.finish_group()
        self.tab('</UL>\n')

    # <ul> lists are treated exactly like <dl> lists.
    start_ul = start_dl
    end_ul = end_dl

    def do_li(self, atr_val):
        # no trailing newline on purpose!
        self.tab("<LI>")
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 396 | |
# Parse one book's index page and write the entries found to 'output'.
# 'path' is the book's directory (also used as the prefix of the links
# written), 'indexpage' is the page's file name inside that directory,
# 'output' is the open index (.hhk) file.
def index(path, indexpage, output):
    parser = IdxHlpHtmlParser(AbstractFormatter(AlmostNullWriter()),
                              path, output)
    f = open(path + '/' + indexpage)
    # try/finally so the input file is closed even if parsing blows up.
    try:
        parser.feed(f.read())
        parser.close()
    finally:
        f.close()
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 404 | |
# Parse one book's contents page and write the entries found to
# 'output'.  'path' is the book's directory (also used as the prefix of
# the links written), 'contentpage' is the page's file name inside that
# directory, 'output' is the open table-of-contents (.hhc) file.
def content(path, contentpage, output):
    parser = TocHlpHtmlParser(AbstractFormatter(AlmostNullWriter()),
                              path, output)
    f = open(path + '/' + contentpage)
    # try/finally so the input file is closed even if parsing blows up.
    try:
        parser.feed(f.read())
        parser.close()
    finally:
        f.close()
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 412 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 413 | def do_index(library, output): |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 414 | output.write('<UL>\n') |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 415 | for book in library: |
Tim Peters | d9a1050 | 2002-04-20 03:25:02 +0000 | [diff] [blame] | 416 | print '\t', book.title, '-', book.indexpage |
| 417 | if book.indexpage: |
| 418 | index(book.directory, book.indexpage, output) |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 419 | output.write('</UL>\n') |
| 420 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 421 | def do_content(library, version, output): |
Tim Peters | c8490c7 | 2002-04-20 21:34:34 +0000 | [diff] [blame] | 422 | output.write(contents_header) |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 423 | for book in library: |
Tim Peters | d9a1050 | 2002-04-20 03:25:02 +0000 | [diff] [blame] | 424 | print '\t', book.title, '-', book.firstpage |
Tim Peters | 4545407 | 2002-04-20 20:26:26 +0000 | [diff] [blame] | 425 | path = book.directory + "/" + book.firstpage |
| 426 | output.write('<LI>') |
| 427 | output.write(object_sitemap % (book.title, path)) |
Tim Peters | d9a1050 | 2002-04-20 03:25:02 +0000 | [diff] [blame] | 428 | if book.contentpage: |
| 429 | content(book.directory, book.contentpage, output) |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 430 | output.write(contents_footer) |
| 431 | |
# Write the project (.hhp) file to 'output': the filled-in
# project_template followed by the [FILES] section.
# 'library' is the list of Book objects from supported_libraries for the
# version of the docs getting generated; 'arch' and 'version' are
# substituted into the template.  Every .html and .css file found in a
# book's directory is listed once, as directory\file.
def do_project(library, output, arch, version):
    output.write(project_template % {'arch': arch, 'version': version})
    listed = {}     # entries already written; books may share a directory
    for book in library:
        folder = book.directory
        entry_format = folder + '\\%s\n'
        for page in os.listdir(folder):
            if not (page.endswith('.html') or page.endswith('.css')):
                continue
            entry = entry_format % page
            if entry in listed:
                continue
            output.write(entry)
            listed[entry] = True
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 447 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 448 | def openfile(file): |
| 449 | try: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 450 | p = open(file, "w") |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 451 | except IOError, msg: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 452 | print file, ":", msg |
| 453 | sys.exit(1) |
| 454 | return p |
| 455 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 456 | def usage(): |
Tim Peters | 3d7d372 | 2004-07-18 06:25:50 +0000 | [diff] [blame] | 457 | print usage_mode |
| 458 | sys.exit(0) |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 459 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 460 | def do_it(args = None): |
| 461 | if not args: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 462 | args = sys.argv[1:] |
| 463 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 464 | if not args: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 465 | usage() |
| 466 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 467 | try: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 468 | optlist, args = getopt.getopt(args, 'ckpv:') |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 469 | except getopt.error, msg: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 470 | print msg |
| 471 | usage() |
| 472 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 473 | if not args or len(args) > 1: |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 474 | usage() |
| 475 | arch = args[0] |
| 476 | |
| 477 | version = None |
| 478 | for opt in optlist: |
| 479 | if opt[0] == '-v': |
| 480 | version = opt[1] |
| 481 | break |
| 482 | if not version: |
| 483 | usage() |
| 484 | |
Tim Peters | d9a1050 | 2002-04-20 03:25:02 +0000 | [diff] [blame] | 485 | library = supported_libraries[version] |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 486 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 487 | if not (('-p','') in optlist): |
Tim Peters | 4f109c1 | 2002-04-19 18:41:46 +0000 | [diff] [blame] | 488 | fname = arch + '.stp' |
| 489 | f = openfile(fname) |
| 490 | print "Building stoplist", fname, "..." |
| 491 | words = stop_list.split() |
| 492 | words.sort() |
| 493 | for word in words: |
| 494 | print >> f, word |
| 495 | f.close() |
| 496 | |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 497 | f = openfile(arch + '.hhp') |
| 498 | print "Building Project..." |
| 499 | do_project(library, f, arch, version) |
| 500 | if version == '2.0.0': |
| 501 | for image in os.listdir('icons'): |
| 502 | f.write('icons'+ '\\' + image + '\n') |
| 503 | |
| 504 | f.close() |
| 505 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 506 | if not (('-c','') in optlist): |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 507 | f = openfile(arch + '.hhc') |
| 508 | print "Building Table of Content..." |
| 509 | do_content(library, version, f) |
| 510 | f.close() |
| 511 | |
Tim Peters | 661e492 | 2002-04-20 02:39:44 +0000 | [diff] [blame] | 512 | if not (('-k','') in optlist): |
Tim Peters | 52cfa33 | 2002-04-19 16:09:26 +0000 | [diff] [blame] | 513 | f = openfile(arch + '.hhk') |
| 514 | print "Building Index..." |
| 515 | do_index(library, f) |
| 516 | f.close() |
| 517 | |
# Run the command-line driver only when executed as a script, not when
# imported as a module.
if __name__ == '__main__':
    do_it()