# blob: c25a5a43bc49e1ce821793979b87d39fbbd05d18 [file] [log] [blame]
""" Python Character Mapping Codec cp875 generated from 'MAPPINGS/VENDORS/MICSFT/EBCDIC/CP875.TXT' with gencodec.py.

"""#"

import codecs

### Codec APIs

class Codec(codecs.Codec):
    """Stateless cp875 codec driven by this module's charmap tables."""

    def encode(self, input, errors='strict'):
        """Encode ``input`` through ``encoding_table``.

        ``errors`` is handed to ``codecs.charmap_encode`` unchanged, and
        that function's return value is returned as-is.
        """
        return codecs.charmap_encode(input, errors, encoding_table)

    def decode(self, input, errors='strict'):
        """Decode ``input`` through ``decoding_table``.

        ``errors`` is handed to ``codecs.charmap_decode`` unchanged, and
        that function's return value is returned as-is.
        """
        return codecs.charmap_decode(input, errors, decoding_table)

class IncrementalEncoder(codecs.IncrementalEncoder):
    """Incremental cp875 encoder built on ``codecs.charmap_encode``."""

    def encode(self, input, final=False):
        """Encode one chunk of ``input`` using ``self.errors``.

        ``final`` is accepted for interface compatibility and is not used.
        Only the first item of the ``charmap_encode`` result is returned.
        """
        return codecs.charmap_encode(input, self.errors, encoding_table)[0]

class IncrementalDecoder(codecs.IncrementalDecoder):
    """Incremental cp875 decoder built on ``codecs.charmap_decode``."""

    def decode(self, input, final=False):
        """Decode one chunk of ``input`` using ``self.errors``.

        ``final`` is accepted for interface compatibility and is not used.
        Only the first item of the ``charmap_decode`` result is returned.
        """
        return codecs.charmap_decode(input, self.errors, decoding_table)[0]

class StreamWriter(Codec, codecs.StreamWriter):
    """cp875 stream writer; adds nothing beyond its two base classes."""
    pass

class StreamReader(Codec, codecs.StreamReader):
    """cp875 stream reader; adds nothing beyond its two base classes."""
    pass

### encodings module API

def getregentry():
    """Return the ``codecs.CodecInfo`` record for the cp875 codec.

    The stateless ``encode``/``decode`` entries are bound methods of two
    separate, freshly created ``Codec`` instances; the incremental and
    stream entries are the classes themselves.
    """
    return codecs.CodecInfo(
        name='cp875',
        encode=Codec().encode,
        decode=Codec().decode,
        incrementalencoder=IncrementalEncoder,
        incrementaldecoder=IncrementalDecoder,
        streamreader=StreamReader,
        streamwriter=StreamWriter,
    )


### Decoding Table

# One character per byte value: decoding_table[b] is the text that byte b
# decodes to.  The table is a single 256-character string assembled from
# adjacent string literals.
# Seven byte values (0x3F, 0xDC, 0xE1, 0xEC, 0xED, 0xFC, 0xFD) all decode to
# '\x1a', so decoding is not one-to-one; which of those bytes '\x1a' encodes
# back to is decided by codecs.charmap_build below.
decoding_table = (
    '\x00'     #  0x00 -> NULL
    '\x01'     #  0x01 -> START OF HEADING
    '\x02'     #  0x02 -> START OF TEXT
    '\x03'     #  0x03 -> END OF TEXT
    '\x9c'     #  0x04 -> CONTROL
    '\t'       #  0x05 -> HORIZONTAL TABULATION
    '\x86'     #  0x06 -> CONTROL
    '\x7f'     #  0x07 -> DELETE
    '\x97'     #  0x08 -> CONTROL
    '\x8d'     #  0x09 -> CONTROL
    '\x8e'     #  0x0A -> CONTROL
    '\x0b'     #  0x0B -> VERTICAL TABULATION
    '\x0c'     #  0x0C -> FORM FEED
    '\r'       #  0x0D -> CARRIAGE RETURN
    '\x0e'     #  0x0E -> SHIFT OUT
    '\x0f'     #  0x0F -> SHIFT IN
    '\x10'     #  0x10 -> DATA LINK ESCAPE
    '\x11'     #  0x11 -> DEVICE CONTROL ONE
    '\x12'     #  0x12 -> DEVICE CONTROL TWO
    '\x13'     #  0x13 -> DEVICE CONTROL THREE
    '\x9d'     #  0x14 -> CONTROL
    '\x85'     #  0x15 -> CONTROL
    '\x08'     #  0x16 -> BACKSPACE
    '\x87'     #  0x17 -> CONTROL
    '\x18'     #  0x18 -> CANCEL
    '\x19'     #  0x19 -> END OF MEDIUM
    '\x92'     #  0x1A -> CONTROL
    '\x8f'     #  0x1B -> CONTROL
    '\x1c'     #  0x1C -> FILE SEPARATOR
    '\x1d'     #  0x1D -> GROUP SEPARATOR
    '\x1e'     #  0x1E -> RECORD SEPARATOR
    '\x1f'     #  0x1F -> UNIT SEPARATOR
    '\x80'     #  0x20 -> CONTROL
    '\x81'     #  0x21 -> CONTROL
    '\x82'     #  0x22 -> CONTROL
    '\x83'     #  0x23 -> CONTROL
    '\x84'     #  0x24 -> CONTROL
    '\n'       #  0x25 -> LINE FEED
    '\x17'     #  0x26 -> END OF TRANSMISSION BLOCK
    '\x1b'     #  0x27 -> ESCAPE
    '\x88'     #  0x28 -> CONTROL
    '\x89'     #  0x29 -> CONTROL
    '\x8a'     #  0x2A -> CONTROL
    '\x8b'     #  0x2B -> CONTROL
    '\x8c'     #  0x2C -> CONTROL
    '\x05'     #  0x2D -> ENQUIRY
    '\x06'     #  0x2E -> ACKNOWLEDGE
    '\x07'     #  0x2F -> BELL
    '\x90'     #  0x30 -> CONTROL
    '\x91'     #  0x31 -> CONTROL
    '\x16'     #  0x32 -> SYNCHRONOUS IDLE
    '\x93'     #  0x33 -> CONTROL
    '\x94'     #  0x34 -> CONTROL
    '\x95'     #  0x35 -> CONTROL
    '\x96'     #  0x36 -> CONTROL
    '\x04'     #  0x37 -> END OF TRANSMISSION
    '\x98'     #  0x38 -> CONTROL
    '\x99'     #  0x39 -> CONTROL
    '\x9a'     #  0x3A -> CONTROL
    '\x9b'     #  0x3B -> CONTROL
    '\x14'     #  0x3C -> DEVICE CONTROL FOUR
    '\x15'     #  0x3D -> NEGATIVE ACKNOWLEDGE
    '\x9e'     #  0x3E -> CONTROL
    '\x1a'     #  0x3F -> SUBSTITUTE
    ' '        #  0x40 -> SPACE
    '\u0391'   #  0x41 -> GREEK CAPITAL LETTER ALPHA
    '\u0392'   #  0x42 -> GREEK CAPITAL LETTER BETA
    '\u0393'   #  0x43 -> GREEK CAPITAL LETTER GAMMA
    '\u0394'   #  0x44 -> GREEK CAPITAL LETTER DELTA
    '\u0395'   #  0x45 -> GREEK CAPITAL LETTER EPSILON
    '\u0396'   #  0x46 -> GREEK CAPITAL LETTER ZETA
    '\u0397'   #  0x47 -> GREEK CAPITAL LETTER ETA
    '\u0398'   #  0x48 -> GREEK CAPITAL LETTER THETA
    '\u0399'   #  0x49 -> GREEK CAPITAL LETTER IOTA
    '['        #  0x4A -> LEFT SQUARE BRACKET
    '.'        #  0x4B -> FULL STOP
    '<'        #  0x4C -> LESS-THAN SIGN
    '('        #  0x4D -> LEFT PARENTHESIS
    '+'        #  0x4E -> PLUS SIGN
    '!'        #  0x4F -> EXCLAMATION MARK
    '&'        #  0x50 -> AMPERSAND
    '\u039a'   #  0x51 -> GREEK CAPITAL LETTER KAPPA
    '\u039b'   #  0x52 -> GREEK CAPITAL LETTER LAMDA
    '\u039c'   #  0x53 -> GREEK CAPITAL LETTER MU
    '\u039d'   #  0x54 -> GREEK CAPITAL LETTER NU
    '\u039e'   #  0x55 -> GREEK CAPITAL LETTER XI
    '\u039f'   #  0x56 -> GREEK CAPITAL LETTER OMICRON
    '\u03a0'   #  0x57 -> GREEK CAPITAL LETTER PI
    '\u03a1'   #  0x58 -> GREEK CAPITAL LETTER RHO
    '\u03a3'   #  0x59 -> GREEK CAPITAL LETTER SIGMA
    ']'        #  0x5A -> RIGHT SQUARE BRACKET
    '$'        #  0x5B -> DOLLAR SIGN
    '*'        #  0x5C -> ASTERISK
    ')'        #  0x5D -> RIGHT PARENTHESIS
    ';'        #  0x5E -> SEMICOLON
    '^'        #  0x5F -> CIRCUMFLEX ACCENT
    '-'        #  0x60 -> HYPHEN-MINUS
    '/'        #  0x61 -> SOLIDUS
    '\u03a4'   #  0x62 -> GREEK CAPITAL LETTER TAU
    '\u03a5'   #  0x63 -> GREEK CAPITAL LETTER UPSILON
    '\u03a6'   #  0x64 -> GREEK CAPITAL LETTER PHI
    '\u03a7'   #  0x65 -> GREEK CAPITAL LETTER CHI
    '\u03a8'   #  0x66 -> GREEK CAPITAL LETTER PSI
    '\u03a9'   #  0x67 -> GREEK CAPITAL LETTER OMEGA
    '\u03aa'   #  0x68 -> GREEK CAPITAL LETTER IOTA WITH DIALYTIKA
    '\u03ab'   #  0x69 -> GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA
    '|'        #  0x6A -> VERTICAL LINE
    ','        #  0x6B -> COMMA
    '%'        #  0x6C -> PERCENT SIGN
    '_'        #  0x6D -> LOW LINE
    '>'        #  0x6E -> GREATER-THAN SIGN
    '?'        #  0x6F -> QUESTION MARK
    '\xa8'     #  0x70 -> DIAERESIS
    '\u0386'   #  0x71 -> GREEK CAPITAL LETTER ALPHA WITH TONOS
    '\u0388'   #  0x72 -> GREEK CAPITAL LETTER EPSILON WITH TONOS
    '\u0389'   #  0x73 -> GREEK CAPITAL LETTER ETA WITH TONOS
    '\xa0'     #  0x74 -> NO-BREAK SPACE
    '\u038a'   #  0x75 -> GREEK CAPITAL LETTER IOTA WITH TONOS
    '\u038c'   #  0x76 -> GREEK CAPITAL LETTER OMICRON WITH TONOS
    '\u038e'   #  0x77 -> GREEK CAPITAL LETTER UPSILON WITH TONOS
    '\u038f'   #  0x78 -> GREEK CAPITAL LETTER OMEGA WITH TONOS
    '`'        #  0x79 -> GRAVE ACCENT
    ':'        #  0x7A -> COLON
    '#'        #  0x7B -> NUMBER SIGN
    '@'        #  0x7C -> COMMERCIAL AT
    "'"        #  0x7D -> APOSTROPHE
    '='        #  0x7E -> EQUALS SIGN
    '"'        #  0x7F -> QUOTATION MARK
    '\u0385'   #  0x80 -> GREEK DIALYTIKA TONOS
    'a'        #  0x81 -> LATIN SMALL LETTER A
    'b'        #  0x82 -> LATIN SMALL LETTER B
    'c'        #  0x83 -> LATIN SMALL LETTER C
    'd'        #  0x84 -> LATIN SMALL LETTER D
    'e'        #  0x85 -> LATIN SMALL LETTER E
    'f'        #  0x86 -> LATIN SMALL LETTER F
    'g'        #  0x87 -> LATIN SMALL LETTER G
    'h'        #  0x88 -> LATIN SMALL LETTER H
    'i'        #  0x89 -> LATIN SMALL LETTER I
    '\u03b1'   #  0x8A -> GREEK SMALL LETTER ALPHA
    '\u03b2'   #  0x8B -> GREEK SMALL LETTER BETA
    '\u03b3'   #  0x8C -> GREEK SMALL LETTER GAMMA
    '\u03b4'   #  0x8D -> GREEK SMALL LETTER DELTA
    '\u03b5'   #  0x8E -> GREEK SMALL LETTER EPSILON
    '\u03b6'   #  0x8F -> GREEK SMALL LETTER ZETA
    '\xb0'     #  0x90 -> DEGREE SIGN
    'j'        #  0x91 -> LATIN SMALL LETTER J
    'k'        #  0x92 -> LATIN SMALL LETTER K
    'l'        #  0x93 -> LATIN SMALL LETTER L
    'm'        #  0x94 -> LATIN SMALL LETTER M
    'n'        #  0x95 -> LATIN SMALL LETTER N
    'o'        #  0x96 -> LATIN SMALL LETTER O
    'p'        #  0x97 -> LATIN SMALL LETTER P
    'q'        #  0x98 -> LATIN SMALL LETTER Q
    'r'        #  0x99 -> LATIN SMALL LETTER R
    '\u03b7'   #  0x9A -> GREEK SMALL LETTER ETA
    '\u03b8'   #  0x9B -> GREEK SMALL LETTER THETA
    '\u03b9'   #  0x9C -> GREEK SMALL LETTER IOTA
    '\u03ba'   #  0x9D -> GREEK SMALL LETTER KAPPA
    '\u03bb'   #  0x9E -> GREEK SMALL LETTER LAMDA
    '\u03bc'   #  0x9F -> GREEK SMALL LETTER MU
    '\xb4'     #  0xA0 -> ACUTE ACCENT
    '~'        #  0xA1 -> TILDE
    's'        #  0xA2 -> LATIN SMALL LETTER S
    't'        #  0xA3 -> LATIN SMALL LETTER T
    'u'        #  0xA4 -> LATIN SMALL LETTER U
    'v'        #  0xA5 -> LATIN SMALL LETTER V
    'w'        #  0xA6 -> LATIN SMALL LETTER W
    'x'        #  0xA7 -> LATIN SMALL LETTER X
    'y'        #  0xA8 -> LATIN SMALL LETTER Y
    'z'        #  0xA9 -> LATIN SMALL LETTER Z
    '\u03bd'   #  0xAA -> GREEK SMALL LETTER NU
    '\u03be'   #  0xAB -> GREEK SMALL LETTER XI
    '\u03bf'   #  0xAC -> GREEK SMALL LETTER OMICRON
    '\u03c0'   #  0xAD -> GREEK SMALL LETTER PI
    '\u03c1'   #  0xAE -> GREEK SMALL LETTER RHO
    '\u03c3'   #  0xAF -> GREEK SMALL LETTER SIGMA
    '\xa3'     #  0xB0 -> POUND SIGN
    '\u03ac'   #  0xB1 -> GREEK SMALL LETTER ALPHA WITH TONOS
    '\u03ad'   #  0xB2 -> GREEK SMALL LETTER EPSILON WITH TONOS
    '\u03ae'   #  0xB3 -> GREEK SMALL LETTER ETA WITH TONOS
    '\u03ca'   #  0xB4 -> GREEK SMALL LETTER IOTA WITH DIALYTIKA
    '\u03af'   #  0xB5 -> GREEK SMALL LETTER IOTA WITH TONOS
    '\u03cc'   #  0xB6 -> GREEK SMALL LETTER OMICRON WITH TONOS
    '\u03cd'   #  0xB7 -> GREEK SMALL LETTER UPSILON WITH TONOS
    '\u03cb'   #  0xB8 -> GREEK SMALL LETTER UPSILON WITH DIALYTIKA
    '\u03ce'   #  0xB9 -> GREEK SMALL LETTER OMEGA WITH TONOS
    '\u03c2'   #  0xBA -> GREEK SMALL LETTER FINAL SIGMA
    '\u03c4'   #  0xBB -> GREEK SMALL LETTER TAU
    '\u03c5'   #  0xBC -> GREEK SMALL LETTER UPSILON
    '\u03c6'   #  0xBD -> GREEK SMALL LETTER PHI
    '\u03c7'   #  0xBE -> GREEK SMALL LETTER CHI
    '\u03c8'   #  0xBF -> GREEK SMALL LETTER PSI
    '{'        #  0xC0 -> LEFT CURLY BRACKET
    'A'        #  0xC1 -> LATIN CAPITAL LETTER A
    'B'        #  0xC2 -> LATIN CAPITAL LETTER B
    'C'        #  0xC3 -> LATIN CAPITAL LETTER C
    'D'        #  0xC4 -> LATIN CAPITAL LETTER D
    'E'        #  0xC5 -> LATIN CAPITAL LETTER E
    'F'        #  0xC6 -> LATIN CAPITAL LETTER F
    'G'        #  0xC7 -> LATIN CAPITAL LETTER G
    'H'        #  0xC8 -> LATIN CAPITAL LETTER H
    'I'        #  0xC9 -> LATIN CAPITAL LETTER I
    '\xad'     #  0xCA -> SOFT HYPHEN
    '\u03c9'   #  0xCB -> GREEK SMALL LETTER OMEGA
    '\u0390'   #  0xCC -> GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
    '\u03b0'   #  0xCD -> GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
    '\u2018'   #  0xCE -> LEFT SINGLE QUOTATION MARK
    '\u2015'   #  0xCF -> HORIZONTAL BAR
    '}'        #  0xD0 -> RIGHT CURLY BRACKET
    'J'        #  0xD1 -> LATIN CAPITAL LETTER J
    'K'        #  0xD2 -> LATIN CAPITAL LETTER K
    'L'        #  0xD3 -> LATIN CAPITAL LETTER L
    'M'        #  0xD4 -> LATIN CAPITAL LETTER M
    'N'        #  0xD5 -> LATIN CAPITAL LETTER N
    'O'        #  0xD6 -> LATIN CAPITAL LETTER O
    'P'        #  0xD7 -> LATIN CAPITAL LETTER P
    'Q'        #  0xD8 -> LATIN CAPITAL LETTER Q
    'R'        #  0xD9 -> LATIN CAPITAL LETTER R
    '\xb1'     #  0xDA -> PLUS-MINUS SIGN
    '\xbd'     #  0xDB -> VULGAR FRACTION ONE HALF
    '\x1a'     #  0xDC -> SUBSTITUTE
    '\u0387'   #  0xDD -> GREEK ANO TELEIA
    '\u2019'   #  0xDE -> RIGHT SINGLE QUOTATION MARK
    '\xa6'     #  0xDF -> BROKEN BAR
    '\\'       #  0xE0 -> REVERSE SOLIDUS
    '\x1a'     #  0xE1 -> SUBSTITUTE
    'S'        #  0xE2 -> LATIN CAPITAL LETTER S
    'T'        #  0xE3 -> LATIN CAPITAL LETTER T
    'U'        #  0xE4 -> LATIN CAPITAL LETTER U
    'V'        #  0xE5 -> LATIN CAPITAL LETTER V
    'W'        #  0xE6 -> LATIN CAPITAL LETTER W
    'X'        #  0xE7 -> LATIN CAPITAL LETTER X
    'Y'        #  0xE8 -> LATIN CAPITAL LETTER Y
    'Z'        #  0xE9 -> LATIN CAPITAL LETTER Z
    '\xb2'     #  0xEA -> SUPERSCRIPT TWO
    '\xa7'     #  0xEB -> SECTION SIGN
    '\x1a'     #  0xEC -> SUBSTITUTE
    '\x1a'     #  0xED -> SUBSTITUTE
    '\xab'     #  0xEE -> LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
    '\xac'     #  0xEF -> NOT SIGN
    '0'        #  0xF0 -> DIGIT ZERO
    '1'        #  0xF1 -> DIGIT ONE
    '2'        #  0xF2 -> DIGIT TWO
    '3'        #  0xF3 -> DIGIT THREE
    '4'        #  0xF4 -> DIGIT FOUR
    '5'        #  0xF5 -> DIGIT FIVE
    '6'        #  0xF6 -> DIGIT SIX
    '7'        #  0xF7 -> DIGIT SEVEN
    '8'        #  0xF8 -> DIGIT EIGHT
    '9'        #  0xF9 -> DIGIT NINE
    '\xb3'     #  0xFA -> SUPERSCRIPT THREE
    '\xa9'     #  0xFB -> COPYRIGHT SIGN
    '\x1a'     #  0xFC -> SUBSTITUTE
    '\x1a'     #  0xFD -> SUBSTITUTE
    '\xbb'     #  0xFE -> RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
    '\x9f'     #  0xFF -> CONTROL
)

### Encoding table
# Derived from decoding_table so the two directions cannot drift apart.
encoding_table = codecs.charmap_build(decoding_table)