blob: 3e7e065fb84f79faf417fd4cb56312fa690f0520 [file] [log] [blame]
Guido van Rossum667d7041995-08-04 04:20:48 +00001/* Python interpreter main program */
2
3#include "Python.h"
Guido van Rossuma075ce11997-12-05 21:56:45 +00004#include "osdefs.h"
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +00005#include "import.h"
Guido van Rossum667d7041995-08-04 04:20:48 +00006
Antoine Pitrou5651eaa2008-09-06 20:46:58 +00007#include <locale.h>
8
Martin v. Löwis79acb9e2002-12-06 12:48:53 +00009#ifdef __VMS
Martin v. Löwis7a924e62003-03-05 14:15:21 +000010#include <unixlib.h>
Martin v. Löwis79acb9e2002-12-06 12:48:53 +000011#endif
12
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +000013#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Martin v. Löwis945362c2007-08-30 14:57:25 +000014#include <windows.h>
Thomas Wouters477c8d52006-05-27 19:21:47 +000015#ifdef HAVE_FCNTL_H
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000016#include <fcntl.h>
Martin v. Löwis790465f2008-04-05 20:41:37 +000017#define PATH_MAX MAXPATHLEN
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000018#endif
Thomas Wouters477c8d52006-05-27 19:21:47 +000019#endif
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000020
Martin v. Löwis945362c2007-08-30 14:57:25 +000021#ifdef _MSC_VER
22#include <crtdbg.h>
23#endif
24
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000025#if (defined(PYOS_OS2) && !defined(PYCC_GCC)) || defined(MS_WINDOWS)
Guido van Rossuma075ce11997-12-05 21:56:45 +000026#define PYTHONHOMEHELP "<prefix>\\lib"
27#else
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000028#if defined(PYOS_OS2) && defined(PYCC_GCC)
29#define PYTHONHOMEHELP "<prefix>/Lib"
30#else
Marc-André Lemburgda4dbc32001-06-12 16:13:51 +000031#define PYTHONHOMEHELP "<prefix>/pythonX.X"
Guido van Rossuma075ce11997-12-05 21:56:45 +000032#endif
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000033#endif
Guido van Rossuma075ce11997-12-05 21:56:45 +000034
Thomas Wouters2cffc7d2000-11-03 08:18:37 +000035#include "pygetopt.h"
36
Guido van Rossuma22865e2000-09-05 04:41:18 +000037#define COPYRIGHT \
Guido van Rossum36002d72001-07-18 16:59:46 +000038 "Type \"help\", \"copyright\", \"credits\" or \"license\" " \
39 "for more information."
Guido van Rossuma22865e2000-09-05 04:41:18 +000040
Thomas Wouters49fd7fa2006-04-21 10:40:58 +000041#ifdef __cplusplus
42extern "C" {
43#endif
44
Guido van Rossumac56b031996-07-21 02:33:38 +000045/* For Py_GetArgcArgv(); set by main() */
Martin v. Löwis790465f2008-04-05 20:41:37 +000046static wchar_t **orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +000047static int orig_argc;
48
Guido van Rossumbceccf52001-04-10 22:07:43 +000049/* command line options */
Christian Heimes8dc226f2008-05-06 23:45:46 +000050#define BASE_OPTS L"bBc:dEhiJm:OsStuvVW:xX?"
Guido van Rossumbceccf52001-04-10 22:07:43 +000051
Guido van Rossumbceccf52001-04-10 22:07:43 +000052#define PROGRAM_OPTS BASE_OPTS
Guido van Rossum3ed4c152001-03-02 06:18:03 +000053
Guido van Rossum667d7041995-08-04 04:20:48 +000054/* Short usage message (with %s for argv0) */
55static char *usage_line =
Martin v. Löwis790465f2008-04-05 20:41:37 +000056"usage: %ls [option] ... [-c cmd | -m mod | file | -] [arg] ...\n";
Guido van Rossum667d7041995-08-04 04:20:48 +000057
58/* Long usage message, split into parts < 512 bytes */
Guido van Rossum393661d2001-08-31 17:40:15 +000059static char *usage_1 = "\
Guido van Rossum667d7041995-08-04 04:20:48 +000060Options and arguments (and corresponding environment variables):\n\
Christian Heimes2ab34442008-09-03 20:31:07 +000061-b : issue warnings about str(bytes_instance), str(bytearray_instance)\n\
62 and comparing bytes/bytearray with str. (-bb: issue errors)\n\
Christian Heimes790c8232008-01-07 21:14:23 +000063-B : don't write .py[co] files on import; also PYTHONDONTWRITEBYTECODE=x\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000064-c cmd : program passed in as string (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000065-d : debug output from parser; also PYTHONDEBUG=x\n\
Christian Heimes790c8232008-01-07 21:14:23 +000066-E : ignore PYTHON* environment variables (such as PYTHONPATH)\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000067-h : print this help message and exit (also --help)\n\
Guido van Rossum61c345f2001-09-04 03:26:15 +000068";
69static char *usage_2 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000070-i : inspect interactively after running script; forces a prompt even\n\
71 if stdin does not appear to be a terminal; also PYTHONINSPECT=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000072-m mod : run library module as a script (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000073-O : optimize generated bytecode slightly; also PYTHONOPTIMIZE=x\n\
Guido van Rossum6b86a421999-01-28 15:07:47 +000074-OO : remove doc-strings in addition to the -O optimizations\n\
Christian Heimes8dc226f2008-05-06 23:45:46 +000075-s : don't add user site directory to sys.path; also PYTHONNOUSERSITE\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000076-S : don't imply 'import site' on initialization\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000077";
78static char *usage_3 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000079-u : unbuffered binary stdout and stderr; also PYTHONUNBUFFERED=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000080 see man page for details on internal buffering relating to '-u'\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000081-v : verbose (trace import statements); also PYTHONVERBOSE=x\n\
82 can be supplied multiple times to increase verbosity\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000083-V : print the Python version number and exit (also --version)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000084-W arg : warning control; arg is action:message:category:module:lineno\n\
Philip Jenvey0805ca32010-04-07 04:04:10 +000085 also PYTHONWARNINGS=arg\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000086-x : skip first line of source, allowing use of non-Unix forms of #!cmd\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000087";
Guido van Rossum393661d2001-08-31 17:40:15 +000088static char *usage_4 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000089file : program read from script file\n\
90- : program read from stdin (default; interactive mode if a tty)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000091arg ...: arguments passed to program in sys.argv[1:]\n\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000092Other environment variables:\n\
93PYTHONSTARTUP: file executed on interactive startup (no default)\n\
Guido van Rossuma075ce11997-12-05 21:56:45 +000094PYTHONPATH : '%c'-separated list of directories prefixed to the\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000095 default module search path. The result is sys.path.\n\
Christian Heimes790c8232008-01-07 21:14:23 +000096";
97static char *usage_5 = "\
Guido van Rossuma075ce11997-12-05 21:56:45 +000098PYTHONHOME : alternate <prefix> directory (or <prefix>%c<exec_prefix>).\n\
99 The default module search path uses %s.\n\
Tim Peters793de092001-02-22 00:39:47 +0000100PYTHONCASEOK : ignore case in 'import' statements (Windows).\n\
Martin v. Löwis0f599892008-06-02 11:13:03 +0000101PYTHONIOENCODING: Encoding[:errors] used for stdin/stdout/stderr.\n\
Guido van Rossum667d7041995-08-04 04:20:48 +0000102";
103
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000104FILE *
105_Py_wfopen(const wchar_t *path, const wchar_t *mode)
Martin v. Löwis790465f2008-04-05 20:41:37 +0000106{
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000107#ifndef MS_WINDOWS
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000108 FILE *f;
109 char *cpath;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000110 char cmode[10];
111 size_t r;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000112 r = wcstombs(cmode, mode, 10);
113 if (r == (size_t)-1 || r >= 10) {
114 errno = EINVAL;
115 return NULL;
116 }
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000117 cpath = _Py_wchar2char(path);
118 if (cpath == NULL)
119 return NULL;
120 f = fopen(cpath, cmode);
121 PyMem_Free(cpath);
122 return f;
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000123#else
124 return _wfopen(path, mode);
Martin v. Löwis790465f2008-04-05 20:41:37 +0000125#endif
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000126}
Martin v. Löwis790465f2008-04-05 20:41:37 +0000127
Guido van Rossum667d7041995-08-04 04:20:48 +0000128
Martin v. Löwis852ba7e2003-03-30 17:09:58 +0000129static int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000130usage(int exitcode, wchar_t* program)
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000131{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000132 FILE *f = exitcode ? stderr : stdout;
Guido van Rossum393661d2001-08-31 17:40:15 +0000133
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000134 fprintf(f, usage_line, program);
135 if (exitcode)
136 fprintf(f, "Try `python -h' for more information.\n");
137 else {
138 fputs(usage_1, f);
139 fputs(usage_2, f);
140 fputs(usage_3, f);
141 fprintf(f, usage_4, DELIM);
142 fprintf(f, usage_5, DELIM, PYTHONHOMEHELP);
143 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000144#if defined(__VMS)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000145 if (exitcode == 0) {
146 /* suppress 'error' message */
147 return 1;
148 }
149 else {
150 /* STS$M_INHIB_MSG + SS$_ABORT */
151 return 0x1000002c;
152 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000153#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000154 return exitcode;
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000155#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000156 /*NOTREACHED*/
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000157}
158
Martin v. Löwis6caea372003-11-18 19:46:25 +0000159static void RunStartupFile(PyCompilerFlags *cf)
160{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000161 char *startup = Py_GETENV("PYTHONSTARTUP");
162 if (startup != NULL && startup[0] != '\0') {
163 FILE *fp = fopen(startup, "r");
164 if (fp != NULL) {
165 (void) PyRun_SimpleFileExFlags(fp, startup, 0, cf);
166 PyErr_Clear();
167 fclose(fp);
168 } else {
169 int save_errno;
170
171 save_errno = errno;
172 PySys_WriteStderr("Could not open PYTHONSTARTUP\n");
173 errno = save_errno;
174 PyErr_SetFromErrnoWithFilename(PyExc_IOError,
175 startup);
176 PyErr_Print();
177 PyErr_Clear();
178 }
179 }
Martin v. Löwis6caea372003-11-18 19:46:25 +0000180}
181
Thomas Woutersa9773292006-04-21 09:43:23 +0000182
Antoine Pitrou5651eaa2008-09-06 20:46:58 +0000183static int RunModule(wchar_t *modname, int set_argv0)
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000184{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000185 PyObject *module, *runpy, *runmodule, *runargs, *result;
186 runpy = PyImport_ImportModule("runpy");
187 if (runpy == NULL) {
188 fprintf(stderr, "Could not import runpy module\n");
189 return -1;
190 }
191 runmodule = PyObject_GetAttrString(runpy, "_run_module_as_main");
192 if (runmodule == NULL) {
193 fprintf(stderr, "Could not access runpy._run_module_as_main\n");
194 Py_DECREF(runpy);
195 return -1;
196 }
197 module = PyUnicode_FromWideChar(modname, wcslen(modname));
198 if (module == NULL) {
199 fprintf(stderr, "Could not convert module name to unicode\n");
200 Py_DECREF(runpy);
201 Py_DECREF(runmodule);
202 return -1;
203 }
204 runargs = Py_BuildValue("(Oi)", module, set_argv0);
205 if (runargs == NULL) {
206 fprintf(stderr,
207 "Could not create arguments for runpy._run_module_as_main\n");
208 Py_DECREF(runpy);
209 Py_DECREF(runmodule);
210 Py_DECREF(module);
211 return -1;
212 }
213 result = PyObject_Call(runmodule, runargs, NULL);
214 if (result == NULL) {
215 PyErr_Print();
216 }
217 Py_DECREF(runpy);
218 Py_DECREF(runmodule);
219 Py_DECREF(module);
220 Py_DECREF(runargs);
221 if (result == NULL) {
222 return -1;
223 }
224 Py_DECREF(result);
225 return 0;
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000226}
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000227
Martin v. Löwis790465f2008-04-05 20:41:37 +0000228static int RunMainFromImporter(wchar_t *filename)
Christian Heimes9cd17752007-11-18 19:35:23 +0000229{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000230 PyObject *argv0 = NULL, *importer = NULL;
Christian Heimes9cd17752007-11-18 19:35:23 +0000231
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000232 if ((argv0 = PyUnicode_FromWideChar(filename,wcslen(filename))) &&
233 (importer = PyImport_GetImporter(argv0)) &&
234 (importer->ob_type != &PyNullImporter_Type))
235 {
236 /* argv0 is usable as an import source, so
237 put it in sys.path[0] and import __main__ */
238 PyObject *sys_path = NULL;
239 if ((sys_path = PySys_GetObject("path")) &&
240 !PyList_SetItem(sys_path, 0, argv0))
241 {
242 Py_INCREF(argv0);
243 Py_DECREF(importer);
244 sys_path = NULL;
245 return RunModule(L"__main__", 0) != 0;
Guido van Rossum74c29c72007-11-19 18:36:41 +0000246 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000247 }
248 Py_XDECREF(argv0);
249 Py_XDECREF(importer);
250 if (PyErr_Occurred()) {
251 PyErr_Print();
252 return 1;
253 }
254 else {
255 return -1;
256 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000257}
258
Victor Stinnera62207c2010-08-07 10:57:17 +0000259static int
260run_command(wchar_t *command, PyCompilerFlags *cf)
261{
262 PyObject *unicode, *bytes;
263 int ret;
264
265 unicode = PyUnicode_FromWideChar(command, -1);
266 if (unicode == NULL)
267 goto error;
268 bytes = PyUnicode_AsUTF8String(unicode);
269 Py_DECREF(unicode);
270 if (bytes == NULL)
271 goto error;
272 ret = PyRun_SimpleStringFlags(PyBytes_AsString(bytes), cf);
273 Py_DECREF(bytes);
274 return ret != 0;
275
276error:
277 PyErr_Print();
278 return 1;
279}
280
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000281static int
282run_file(FILE *fp, const wchar_t *filename, PyCompilerFlags *p_cf)
283{
284 PyObject *unicode, *bytes = NULL;
285 char *filename_str;
286 int run;
287
288 /* call pending calls like signal handlers (SIGINT) */
289 if (Py_MakePendingCalls() == -1) {
290 PyErr_Print();
291 return 1;
292 }
293
294 if (filename) {
295 unicode = PyUnicode_FromWideChar(filename, wcslen(filename));
296 if (unicode != NULL) {
297 bytes = PyUnicode_AsUTF8String(unicode);
298 Py_DECREF(unicode);
299 }
300 if (bytes != NULL)
301 filename_str = PyBytes_AsString(bytes);
302 else {
303 PyErr_Clear();
304 filename_str = "<decoding error>";
305 }
306 }
307 else
308 filename_str = "<stdin>";
309
310 run = PyRun_AnyFileExFlags(fp, filename_str, filename != NULL, p_cf);
311 Py_XDECREF(bytes);
312 return run != 0;
313}
314
Christian Heimes9cd17752007-11-18 19:35:23 +0000315
Guido van Rossum667d7041995-08-04 04:20:48 +0000316/* Main program */
317
Mark Hammondfe51c6d2002-08-02 02:27:13 +0000318int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000319Py_Main(int argc, wchar_t **argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000320{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000321 int c;
322 int sts;
323 wchar_t *command = NULL;
324 wchar_t *filename = NULL;
325 wchar_t *module = NULL;
326 FILE *fp = stdin;
327 char *p;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000328#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000329 wchar_t *wp;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000330#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000331 int skipfirstline = 0;
332 int stdin_is_interactive = 0;
333 int help = 0;
334 int version = 0;
335 int saw_unbuffered_flag = 0;
336 PyCompilerFlags cf;
Guido van Rossum667d7041995-08-04 04:20:48 +0000337
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000338 cf.cf_flags = 0;
Guido van Rossum393661d2001-08-31 17:40:15 +0000339
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000340 orig_argc = argc; /* For Py_GetArgcArgv() */
341 orig_argv = argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000342
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000343 PySys_ResetWarnOptions();
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000344
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000345 while ((c = _PyOS_GetOpt(argc, argv, PROGRAM_OPTS)) != EOF) {
346 if (c == 'c') {
347 size_t len;
348 /* -c is the last option; following arguments
349 that look like options are left for the
350 command to interpret. */
Amaury Forgeot d'Arc9a5499b2008-11-11 23:04:59 +0000351
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000352 len = wcslen(_PyOS_optarg) + 1 + 1;
353 command = (wchar_t *)malloc(sizeof(wchar_t) * len);
354 if (command == NULL)
355 Py_FatalError(
356 "not enough memory to copy -c argument");
357 wcscpy(command, _PyOS_optarg);
358 command[len - 2] = '\n';
359 command[len - 1] = 0;
360 break;
361 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000362
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000363 if (c == 'm') {
364 /* -m is the last option; following arguments
365 that look like options are left for the
366 module to interpret. */
367 module = _PyOS_optarg;
368 break;
369 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000370
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000371 switch (c) {
372 case 'b':
373 Py_BytesWarningFlag++;
374 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000375
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000376 case 'd':
377 Py_DebugFlag++;
378 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000379
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000380 case 'i':
381 Py_InspectFlag++;
382 Py_InteractiveFlag++;
383 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000384
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000385 /* case 'J': reserved for Jython */
Christian Heimes33fe8092008-04-13 13:53:33 +0000386
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000387 case 'O':
388 Py_OptimizeFlag++;
389 break;
Guido van Rossum7614da61997-03-03 19:14:45 +0000390
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000391 case 'B':
392 Py_DontWriteBytecodeFlag++;
393 break;
Christian Heimes790c8232008-01-07 21:14:23 +0000394
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000395 case 's':
396 Py_NoUserSiteDirectory++;
397 break;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000398
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000399 case 'S':
400 Py_NoSiteFlag++;
401 break;
Guido van Rossum7922bd71997-08-29 22:34:47 +0000402
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000403 case 'E':
404 Py_IgnoreEnvironmentFlag++;
405 break;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000406
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000407 case 't':
408 /* ignored for backwards compatibility */
409 break;
Guido van Rossumbba92ca1998-04-10 19:39:15 +0000410
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000411 case 'u':
412 Py_UnbufferedStdioFlag = 1;
413 saw_unbuffered_flag = 1;
414 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000415
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000416 case 'v':
417 Py_VerboseFlag++;
418 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000419
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000420 case 'x':
421 skipfirstline = 1;
422 break;
Guido van Rossuma075ce11997-12-05 21:56:45 +0000423
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000424 /* case 'X': reserved for implementation-specific arguments */
Christian Heimes33fe8092008-04-13 13:53:33 +0000425
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000426 case 'h':
427 case '?':
428 help++;
429 break;
Guido van Rossum45aecf42006-03-15 04:58:47 +0000430
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000431 case 'V':
432 version++;
433 break;
Guido van Rossumc15a9a12000-05-01 17:54:33 +0000434
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000435 case 'W':
436 PySys_AddWarnOption(_PyOS_optarg);
437 break;
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000438
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000439 /* This space reserved for other options */
Guido van Rossum667d7041995-08-04 04:20:48 +0000440
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000441 default:
442 return usage(2, argv[0]);
443 /*NOTREACHED*/
Guido van Rossum667d7041995-08-04 04:20:48 +0000444
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000445 }
446 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000447
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000448 if (help)
449 return usage(0, argv[0]);
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000450
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000451 if (version) {
452 fprintf(stderr, "Python %s\n", PY_VERSION);
453 return 0;
454 }
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000455
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000456 if (!Py_InspectFlag &&
457 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
458 Py_InspectFlag = 1;
459 if (!saw_unbuffered_flag &&
460 (p = Py_GETENV("PYTHONUNBUFFERED")) && *p != '\0')
461 Py_UnbufferedStdioFlag = 1;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000462
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000463 if (!Py_NoUserSiteDirectory &&
464 (p = Py_GETENV("PYTHONNOUSERSITE")) && *p != '\0')
465 Py_NoUserSiteDirectory = 1;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000466
Philip Jenveye53de3d2010-04-14 03:01:39 +0000467#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000468 if (!Py_IgnoreEnvironmentFlag && (wp = _wgetenv(L"PYTHONWARNINGS")) &&
469 *wp != L'\0') {
470 wchar_t *buf, *warning;
Philip Jenvey0805ca32010-04-07 04:04:10 +0000471
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000472 buf = (wchar_t *)malloc((wcslen(wp) + 1) * sizeof(wchar_t));
473 if (buf == NULL)
474 Py_FatalError(
475 "not enough memory to copy PYTHONWARNINGS");
476 wcscpy(buf, wp);
477 for (warning = wcstok(buf, L",");
478 warning != NULL;
479 warning = wcstok(NULL, L",")) {
480 PySys_AddWarnOption(warning);
481 }
482 free(buf);
483 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000484#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000485 if ((p = Py_GETENV("PYTHONWARNINGS")) && *p != '\0') {
486 char *buf, *oldloc;
Victor Stinner9ca9c252010-05-19 16:53:30 +0000487 PyObject *warning;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000488
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000489 /* settle for strtok here as there's no one standard
490 C89 wcstok */
491 buf = (char *)malloc(strlen(p) + 1);
492 if (buf == NULL)
493 Py_FatalError(
494 "not enough memory to copy PYTHONWARNINGS");
495 strcpy(buf, p);
496 oldloc = strdup(setlocale(LC_ALL, NULL));
497 setlocale(LC_ALL, "");
498 for (p = strtok(buf, ","); p != NULL; p = strtok(NULL, ",")) {
Victor Stinner9ca9c252010-05-19 16:53:30 +0000499 warning = PyUnicode_DecodeFSDefault(p);
500 if (warning != NULL) {
501 PySys_AddWarnOptionUnicode(warning);
502 Py_DECREF(warning);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000503 }
504 }
505 setlocale(LC_ALL, oldloc);
506 free(oldloc);
507 free(buf);
508 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000509#endif
Philip Jenvey0805ca32010-04-07 04:04:10 +0000510
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000511 if (command == NULL && module == NULL && _PyOS_optind < argc &&
512 wcscmp(argv[_PyOS_optind], L"-") != 0)
513 {
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000514#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000515 filename = decc$translate_vms(argv[_PyOS_optind]);
516 if (filename == (char *)0 || filename == (char *)-1)
517 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000518
519#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000520 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000521#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000522 }
Guido van Rossum775af911997-02-14 19:50:32 +0000523
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000524 stdin_is_interactive = Py_FdIsInteractive(stdin, (char *)0);
Guido van Rossum775af911997-02-14 19:50:32 +0000525
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000526 if (Py_UnbufferedStdioFlag) {
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +0000527#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000528 _setmode(fileno(stdin), O_BINARY);
529 _setmode(fileno(stdout), O_BINARY);
Guido van Rossumf22d7e21997-01-11 19:28:55 +0000530#endif
Guido van Rossum22ffac11998-03-06 15:30:39 +0000531#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000532 setvbuf(stdin, (char *)NULL, _IONBF, BUFSIZ);
533 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
534 setvbuf(stderr, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000535#else /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000536 setbuf(stdin, (char *)NULL);
537 setbuf(stdout, (char *)NULL);
538 setbuf(stderr, (char *)NULL);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000539#endif /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000540 }
541 else if (Py_InteractiveFlag) {
Guido van Rossumb31c7dc1997-04-11 22:19:12 +0000542#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000543 /* Doesn't have to have line-buffered -- use unbuffered */
544 /* Any set[v]buf(stdin, ...) screws up Tkinter :-( */
545 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000546#else /* !MS_WINDOWS */
547#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000548 setvbuf(stdin, (char *)NULL, _IOLBF, BUFSIZ);
549 setvbuf(stdout, (char *)NULL, _IOLBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000550#endif /* HAVE_SETVBUF */
551#endif /* !MS_WINDOWS */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000552 /* Leave stderr alone - it should be unbuffered anyway. */
553 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000554#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000555 else {
556 setvbuf (stdout, (char *)NULL, _IOLBF, BUFSIZ);
557 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000558#endif /* __VMS */
Guido van Rossum667d7041995-08-04 04:20:48 +0000559
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000560#ifdef __APPLE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000561 /* On MacOS X, when the Python interpreter is embedded in an
562 application bundle, it gets executed by a bootstrapping script
563 that does os.execve() with an argv[0] that's different from the
564 actual Python executable. This is needed to keep the Finder happy,
565 or rather, to work around Apple's overly strict requirements of
566 the process name. However, we still need a usable sys.executable,
567 so the actual executable path is passed in an environment variable.
568 See Lib/plat-mac/bundlebuiler.py for details about the bootstrap
569 script. */
570 if ((p = Py_GETENV("PYTHONEXECUTABLE")) && *p != '\0') {
571 wchar_t* buffer;
572 size_t len = strlen(p);
573 size_t r;
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000574
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000575 buffer = malloc(len * sizeof(wchar_t));
576 if (buffer == NULL) {
577 Py_FatalError(
578 "not enough memory to copy PYTHONEXECUTABLE");
579 }
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000580
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000581 r = mbstowcs(buffer, p, len);
582 Py_SetProgramName(buffer);
583 /* buffer is now handed off - do not free */
584 } else {
585 Py_SetProgramName(argv[0]);
586 }
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000587#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000588 Py_SetProgramName(argv[0]);
Jack Jansenfbd861b2003-03-05 16:00:15 +0000589#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000590 Py_Initialize();
Guido van Rossumed52aac1997-07-19 19:20:32 +0000591
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000592 if (Py_VerboseFlag ||
593 (command == NULL && filename == NULL && module == NULL && stdin_is_interactive)) {
594 fprintf(stderr, "Python %s on %s\n",
595 Py_GetVersion(), Py_GetPlatform());
596 if (!Py_NoSiteFlag)
597 fprintf(stderr, "%s\n", COPYRIGHT);
598 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000599
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000600 if (command != NULL) {
601 /* Backup _PyOS_optind and force sys.argv[0] = '-c' */
602 _PyOS_optind--;
603 argv[_PyOS_optind] = L"-c";
604 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000605
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000606 if (module != NULL) {
Nick Coghland26c18a2010-08-17 13:06:11 +0000607 /* Backup _PyOS_optind and force sys.argv[0] = '-m'*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000608 _PyOS_optind--;
Nick Coghland26c18a2010-08-17 13:06:11 +0000609 argv[_PyOS_optind] = L"-m";
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000610 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000611
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000612 PySys_SetArgv(argc-_PyOS_optind, argv+_PyOS_optind);
Guido van Rossum667d7041995-08-04 04:20:48 +0000613
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000614 if ((Py_InspectFlag || (command == NULL && filename == NULL && module == NULL)) &&
615 isatty(fileno(stdin))) {
616 PyObject *v;
617 v = PyImport_ImportModule("readline");
618 if (v == NULL)
619 PyErr_Clear();
620 else
621 Py_DECREF(v);
622 }
Guido van Rossum3d26cc91997-09-16 16:11:28 +0000623
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000624 if (command) {
Victor Stinnera62207c2010-08-07 10:57:17 +0000625 sts = run_command(command, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000626 free(command);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000627 } else if (module) {
628 sts = RunModule(module, 1);
629 }
630 else {
Christian Heimes9cd17752007-11-18 19:35:23 +0000631
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000632 if (filename == NULL && stdin_is_interactive) {
633 Py_InspectFlag = 0; /* do exit on SystemExit */
634 RunStartupFile(&cf);
635 }
636 /* XXX */
Christian Heimes9cd17752007-11-18 19:35:23 +0000637
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000638 sts = -1; /* keep track of whether we've already run __main__ */
Christian Heimes9cd17752007-11-18 19:35:23 +0000639
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000640 if (filename != NULL) {
641 sts = RunMainFromImporter(filename);
642 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000643
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000644 if (sts==-1 && filename!=NULL) {
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000645 if ((fp = _Py_wfopen(filename, L"r")) == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000646 char cfilename[PATH_MAX];
647 size_t r = wcstombs(cfilename, filename, PATH_MAX);
648 if (r == PATH_MAX)
649 /* cfilename is not null-terminated;
650 * forcefully null-terminating it
651 * might break the shift state */
652 strcpy(cfilename, "<file name too long>");
653 if (r == ((size_t)-1))
654 strcpy(cfilename, "<unprintable file name>");
655 fprintf(stderr, "%ls: can't open file '%s': [Errno %d] %s\n",
656 argv[0], cfilename, errno, strerror(errno));
Christian Heimesada8c3b2008-03-18 18:26:33 +0000657
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000658 return 2;
659 }
660 else if (skipfirstline) {
661 int ch;
662 /* Push back first newline so line numbers
663 remain the same */
664 while ((ch = getc(fp)) != EOF) {
665 if (ch == '\n') {
666 (void)ungetc(ch, fp);
667 break;
668 }
669 }
670 }
671 {
672 /* XXX: does this work on Win/Win64? (see posix_fstat) */
673 struct stat sb;
674 if (fstat(fileno(fp), &sb) == 0 &&
675 S_ISDIR(sb.st_mode)) {
676 fprintf(stderr, "%ls: '%ls' is a directory, cannot continue\n", argv[0], filename);
677 fclose(fp);
678 return 1;
679 }
680 }
681 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000682
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000683 if (sts == -1)
684 sts = run_file(fp, filename, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000685 }
Barry Warsawd86dcd32003-06-29 17:07:06 +0000686
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000687 /* Check this environment variable at the end, to give programs the
688 * opportunity to set it from Python.
689 */
690 if (!Py_InspectFlag &&
691 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
692 {
693 Py_InspectFlag = 1;
694 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000695
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000696 if (Py_InspectFlag && stdin_is_interactive &&
697 (filename != NULL || command != NULL || module != NULL)) {
698 Py_InspectFlag = 0;
699 /* XXX */
700 sts = PyRun_AnyFileFlags(stdin, "<stdin>", &cf) != 0;
701 }
702
703 Py_Finalize();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000704
705#ifdef __INSURE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000706 /* Insure++ is a memory analysis tool that aids in discovering
707 * memory leaks and other memory problems. On Python exit, the
708 * interned string dictionaries are flagged as being in use at exit
709 * (which it is). Under normal circumstances, this is fine because
710 * the memory will be automatically reclaimed by the system. Under
711 * memory debugging, it's a huge source of useless noise, so we
712 * trade off slower shutdown for less distraction in the memory
713 * reports. -baw
714 */
715 _Py_ReleaseInternedStrings();
716 _Py_ReleaseInternedUnicodeStrings();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000717#endif /* __INSURE__ */
718
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000719 return sts;
Guido van Rossum667d7041995-08-04 04:20:48 +0000720}
721
Skip Montanaro786ea6b2004-03-01 15:44:05 +0000722/* this is gonna seem *real weird*, but if you put some other code between
723 Py_Main() and Py_GetArgcArgv() you will need to adjust the test in the
724 while statement in Misc/gdbinit:ppystack */
Guido van Rossum667d7041995-08-04 04:20:48 +0000725
Guido van Rossum667d7041995-08-04 04:20:48 +0000726/* Make the *original* argc/argv available to other modules.
727 This is rare, but it is needed by the secureware extension. */
728
729void
Martin v. Löwis790465f2008-04-05 20:41:37 +0000730Py_GetArgcArgv(int *argc, wchar_t ***argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000731{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000732 *argc = orig_argc;
733 *argv = orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000734}
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000735
Ronald Oussorend61deca2010-04-18 14:46:12 +0000736
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000737/* Encode a (wide) character string to the locale encoding with the
738 surrogateescape error handler (characters in range U+DC80..U+DCFF are
739 converted to bytes 0x80..0xFF).
740
741 This function is the reverse of _Py_char2wchar().
742
743 Return a pointer to a newly allocated byte string (use PyMem_Free() to free
744 the memory), or NULL on error (conversion error or memory error). */
745char*
746_Py_wchar2char(const wchar_t *text)
747{
748 const size_t len = wcslen(text);
749 char *result = NULL, *bytes = NULL;
750 size_t i, size, converted;
751 wchar_t c, buf[2];
752
753 /* The function works in two steps:
754 1. compute the length of the output buffer in bytes (size)
755 2. outputs the bytes */
756 size = 0;
757 buf[1] = 0;
758 while (1) {
759 for (i=0; i < len; i++) {
760 c = text[i];
761 if (c >= 0xdc80 && c <= 0xdcff) {
762 /* UTF-8b surrogate */
763 if (bytes != NULL) {
764 *bytes++ = c - 0xdc00;
765 size--;
766 }
767 else
768 size++;
769 continue;
770 }
771 else {
772 buf[0] = c;
773 if (bytes != NULL)
774 converted = wcstombs(bytes, buf, size);
775 else
776 converted = wcstombs(NULL, buf, 0);
777 if (converted == (size_t)-1) {
778 if (result != NULL)
779 PyMem_Free(result);
780 return NULL;
781 }
782 if (bytes != NULL) {
783 bytes += converted;
784 size -= converted;
785 }
786 else
787 size += converted;
788 }
789 }
790 if (result != NULL) {
791 *bytes = 0;
792 break;
793 }
794
795 size += 1; /* nul byte at the end */
796 result = PyMem_Malloc(size);
797 if (result == NULL)
798 return NULL;
799 bytes = result;
800 }
801 return result;
802}
803
804
805/* Decode a byte string from the locale encoding with the
806 surrogateescape error handler (undecodable bytes are decoded as characters
807 in range U+DC80..U+DCFF). If a byte sequence can be decoded as a surrogate
808 character, escape the bytes using the surrogateescape error handler instead
809 of decoding them.
810
811 Use _Py_wchar2char() to encode the character string back to a byte string.
812
813 Return a pointer to a newly allocated (wide) character string (use
814 PyMem_Free() to free the memory), or NULL on error (conversion error or
815 memory error). */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000816wchar_t*
817_Py_char2wchar(char* arg)
818{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000819 wchar_t *res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000820#ifdef HAVE_BROKEN_MBSTOWCS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000821 /* Some platforms have a broken implementation of
822 * mbstowcs which does not count the characters that
823 * would result from conversion. Use an upper bound.
824 */
825 size_t argsize = strlen(arg);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000826#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000827 size_t argsize = mbstowcs(NULL, arg, 0);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000828#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000829 size_t count;
830 unsigned char *in;
831 wchar_t *out;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000832#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000833 mbstate_t mbs;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000834#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000835 if (argsize != (size_t)-1) {
836 res = (wchar_t *)PyMem_Malloc((argsize+1)*sizeof(wchar_t));
837 if (!res)
838 goto oom;
839 count = mbstowcs(res, arg, argsize+1);
840 if (count != (size_t)-1) {
841 wchar_t *tmp;
842 /* Only use the result if it contains no
843 surrogate characters. */
844 for (tmp = res; *tmp != 0 &&
845 (*tmp < 0xd800 || *tmp > 0xdfff); tmp++)
846 ;
847 if (*tmp == 0)
848 return res;
849 }
850 PyMem_Free(res);
851 }
852 /* Conversion failed. Fall back to escaping with surrogateescape. */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000853#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000854 /* Try conversion with mbrtwoc (C99), and escape non-decodable bytes. */
855
856 /* Overallocate; as multi-byte characters are in the argument, the
857 actual output could use less memory. */
858 argsize = strlen(arg) + 1;
859 res = (wchar_t*)PyMem_Malloc(argsize*sizeof(wchar_t));
860 if (!res) goto oom;
861 in = (unsigned char*)arg;
862 out = res;
863 memset(&mbs, 0, sizeof mbs);
864 while (argsize) {
865 size_t converted = mbrtowc(out, (char*)in, argsize, &mbs);
866 if (converted == 0)
867 /* Reached end of string; null char stored. */
868 break;
869 if (converted == (size_t)-2) {
870 /* Incomplete character. This should never happen,
871 since we provide everything that we have -
872 unless there is a bug in the C library, or I
873 misunderstood how mbrtowc works. */
874 fprintf(stderr, "unexpected mbrtowc result -2\n");
875 return NULL;
876 }
877 if (converted == (size_t)-1) {
878 /* Conversion error. Escape as UTF-8b, and start over
879 in the initial shift state. */
880 *out++ = 0xdc00 + *in++;
881 argsize--;
882 memset(&mbs, 0, sizeof mbs);
883 continue;
884 }
885 if (*out >= 0xd800 && *out <= 0xdfff) {
886 /* Surrogate character. Escape the original
887 byte sequence with surrogateescape. */
888 argsize -= converted;
889 while (converted--)
890 *out++ = 0xdc00 + *in++;
891 continue;
892 }
893 /* successfully converted some bytes */
894 in += converted;
895 argsize -= converted;
896 out++;
897 }
Ronald Oussorend61deca2010-04-18 14:46:12 +0000898#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000899 /* Cannot use C locale for escaping; manually escape as if charset
900 is ASCII (i.e. escape all bytes > 128. This will still roundtrip
901 correctly in the locale's charset, which must be an ASCII superset. */
902 res = PyMem_Malloc((strlen(arg)+1)*sizeof(wchar_t));
903 if (!res) goto oom;
904 in = (unsigned char*)arg;
905 out = res;
906 while(*in)
907 if(*in < 128)
908 *out++ = *in++;
909 else
910 *out++ = 0xdc00 + *in++;
911 *out = 0;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000912#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000913 return res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000914oom:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000915 fprintf(stderr, "out of memory\n");
916 return NULL;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000917}
918
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000919#ifdef __cplusplus
920}
921#endif