blob: 5e9f82a2873228c4a626acfac106626c9defd930 [file] [log] [blame]
Guido van Rossum667d7041995-08-04 04:20:48 +00001/* Python interpreter main program */
2
3#include "Python.h"
Guido van Rossuma075ce11997-12-05 21:56:45 +00004#include "osdefs.h"
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +00005#include "import.h"
Guido van Rossum667d7041995-08-04 04:20:48 +00006
Antoine Pitrou5651eaa2008-09-06 20:46:58 +00007#include <locale.h>
8
Martin v. Löwis79acb9e2002-12-06 12:48:53 +00009#ifdef __VMS
Martin v. Löwis7a924e62003-03-05 14:15:21 +000010#include <unixlib.h>
Martin v. Löwis79acb9e2002-12-06 12:48:53 +000011#endif
12
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +000013#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Martin v. Löwis945362c2007-08-30 14:57:25 +000014#include <windows.h>
Thomas Wouters477c8d52006-05-27 19:21:47 +000015#ifdef HAVE_FCNTL_H
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000016#include <fcntl.h>
Martin v. Löwis790465f2008-04-05 20:41:37 +000017#define PATH_MAX MAXPATHLEN
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000018#endif
Thomas Wouters477c8d52006-05-27 19:21:47 +000019#endif
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000020
Martin v. Löwis945362c2007-08-30 14:57:25 +000021#ifdef _MSC_VER
22#include <crtdbg.h>
23#endif
24
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000025#if (defined(PYOS_OS2) && !defined(PYCC_GCC)) || defined(MS_WINDOWS)
Guido van Rossuma075ce11997-12-05 21:56:45 +000026#define PYTHONHOMEHELP "<prefix>\\lib"
27#else
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000028#if defined(PYOS_OS2) && defined(PYCC_GCC)
29#define PYTHONHOMEHELP "<prefix>/Lib"
30#else
Marc-André Lemburgda4dbc32001-06-12 16:13:51 +000031#define PYTHONHOMEHELP "<prefix>/pythonX.X"
Guido van Rossuma075ce11997-12-05 21:56:45 +000032#endif
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000033#endif
Guido van Rossuma075ce11997-12-05 21:56:45 +000034
Thomas Wouters2cffc7d2000-11-03 08:18:37 +000035#include "pygetopt.h"
36
Guido van Rossuma22865e2000-09-05 04:41:18 +000037#define COPYRIGHT \
Guido van Rossum36002d72001-07-18 16:59:46 +000038 "Type \"help\", \"copyright\", \"credits\" or \"license\" " \
39 "for more information."
Guido van Rossuma22865e2000-09-05 04:41:18 +000040
Thomas Wouters49fd7fa2006-04-21 10:40:58 +000041#ifdef __cplusplus
42extern "C" {
43#endif
44
Guido van Rossumac56b031996-07-21 02:33:38 +000045/* For Py_GetArgcArgv(); set by main() */
Martin v. Löwis790465f2008-04-05 20:41:37 +000046static wchar_t **orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +000047static int orig_argc;
48
Guido van Rossumbceccf52001-04-10 22:07:43 +000049/* command line options */
Christian Heimes8dc226f2008-05-06 23:45:46 +000050#define BASE_OPTS L"bBc:dEhiJm:OsStuvVW:xX?"
Guido van Rossumbceccf52001-04-10 22:07:43 +000051
Guido van Rossumbceccf52001-04-10 22:07:43 +000052#define PROGRAM_OPTS BASE_OPTS
Guido van Rossum3ed4c152001-03-02 06:18:03 +000053
Guido van Rossum667d7041995-08-04 04:20:48 +000054/* Short usage message (with %s for argv0) */
55static char *usage_line =
Martin v. Löwis790465f2008-04-05 20:41:37 +000056"usage: %ls [option] ... [-c cmd | -m mod | file | -] [arg] ...\n";
Guido van Rossum667d7041995-08-04 04:20:48 +000057
58/* Long usage message, split into parts < 512 bytes */
Guido van Rossum393661d2001-08-31 17:40:15 +000059static char *usage_1 = "\
Guido van Rossum667d7041995-08-04 04:20:48 +000060Options and arguments (and corresponding environment variables):\n\
Christian Heimes2ab34442008-09-03 20:31:07 +000061-b : issue warnings about str(bytes_instance), str(bytearray_instance)\n\
62 and comparing bytes/bytearray with str. (-bb: issue errors)\n\
Christian Heimes790c8232008-01-07 21:14:23 +000063-B : don't write .py[co] files on import; also PYTHONDONTWRITEBYTECODE=x\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000064-c cmd : program passed in as string (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000065-d : debug output from parser; also PYTHONDEBUG=x\n\
Christian Heimes790c8232008-01-07 21:14:23 +000066-E : ignore PYTHON* environment variables (such as PYTHONPATH)\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000067-h : print this help message and exit (also --help)\n\
Guido van Rossum61c345f2001-09-04 03:26:15 +000068";
69static char *usage_2 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000070-i : inspect interactively after running script; forces a prompt even\n\
71 if stdin does not appear to be a terminal; also PYTHONINSPECT=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000072-m mod : run library module as a script (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000073-O : optimize generated bytecode slightly; also PYTHONOPTIMIZE=x\n\
Guido van Rossum6b86a421999-01-28 15:07:47 +000074-OO : remove doc-strings in addition to the -O optimizations\n\
Christian Heimes8dc226f2008-05-06 23:45:46 +000075-s : don't add user site directory to sys.path; also PYTHONNOUSERSITE\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000076-S : don't imply 'import site' on initialization\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000077";
78static char *usage_3 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000079-u : unbuffered binary stdout and stderr; also PYTHONUNBUFFERED=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000080 see man page for details on internal buffering relating to '-u'\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000081-v : verbose (trace import statements); also PYTHONVERBOSE=x\n\
82 can be supplied multiple times to increase verbosity\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000083-V : print the Python version number and exit (also --version)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000084-W arg : warning control; arg is action:message:category:module:lineno\n\
Philip Jenvey0805ca32010-04-07 04:04:10 +000085 also PYTHONWARNINGS=arg\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000086-x : skip first line of source, allowing use of non-Unix forms of #!cmd\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000087";
Guido van Rossum393661d2001-08-31 17:40:15 +000088static char *usage_4 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000089file : program read from script file\n\
90- : program read from stdin (default; interactive mode if a tty)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000091arg ...: arguments passed to program in sys.argv[1:]\n\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000092Other environment variables:\n\
93PYTHONSTARTUP: file executed on interactive startup (no default)\n\
Guido van Rossuma075ce11997-12-05 21:56:45 +000094PYTHONPATH : '%c'-separated list of directories prefixed to the\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000095 default module search path. The result is sys.path.\n\
Christian Heimes790c8232008-01-07 21:14:23 +000096";
Victor Stinner9802b392010-08-19 11:36:43 +000097static char *usage_5 =
98"PYTHONHOME : alternate <prefix> directory (or <prefix>%c<exec_prefix>).\n"
99" The default module search path uses %s.\n"
100"PYTHONCASEOK : ignore case in 'import' statements (Windows).\n"
101"PYTHONIOENCODING: Encoding[:errors] used for stdin/stdout/stderr.\n"
102#if !(defined(MS_WINDOWS) && defined(HAVE_USABLE_WCHAR_T)) && !defined(__APPLE__)
103"PYTHONFSENCODING: Encoding used for the filesystem.\n"
104#endif
105;
Guido van Rossum667d7041995-08-04 04:20:48 +0000106
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000107FILE *
108_Py_wfopen(const wchar_t *path, const wchar_t *mode)
Martin v. Löwis790465f2008-04-05 20:41:37 +0000109{
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000110#ifndef MS_WINDOWS
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000111 FILE *f;
112 char *cpath;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000113 char cmode[10];
114 size_t r;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000115 r = wcstombs(cmode, mode, 10);
116 if (r == (size_t)-1 || r >= 10) {
117 errno = EINVAL;
118 return NULL;
119 }
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000120 cpath = _Py_wchar2char(path);
121 if (cpath == NULL)
122 return NULL;
123 f = fopen(cpath, cmode);
124 PyMem_Free(cpath);
125 return f;
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000126#else
127 return _wfopen(path, mode);
Martin v. Löwis790465f2008-04-05 20:41:37 +0000128#endif
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000129}
Martin v. Löwis790465f2008-04-05 20:41:37 +0000130
Guido van Rossum667d7041995-08-04 04:20:48 +0000131
Martin v. Löwis852ba7e2003-03-30 17:09:58 +0000132static int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000133usage(int exitcode, wchar_t* program)
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000134{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000135 FILE *f = exitcode ? stderr : stdout;
Guido van Rossum393661d2001-08-31 17:40:15 +0000136
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000137 fprintf(f, usage_line, program);
138 if (exitcode)
139 fprintf(f, "Try `python -h' for more information.\n");
140 else {
141 fputs(usage_1, f);
142 fputs(usage_2, f);
143 fputs(usage_3, f);
144 fprintf(f, usage_4, DELIM);
145 fprintf(f, usage_5, DELIM, PYTHONHOMEHELP);
146 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000147#if defined(__VMS)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000148 if (exitcode == 0) {
149 /* suppress 'error' message */
150 return 1;
151 }
152 else {
153 /* STS$M_INHIB_MSG + SS$_ABORT */
154 return 0x1000002c;
155 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000156#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000157 return exitcode;
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000158#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000159 /*NOTREACHED*/
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000160}
161
Martin v. Löwis6caea372003-11-18 19:46:25 +0000162static void RunStartupFile(PyCompilerFlags *cf)
163{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000164 char *startup = Py_GETENV("PYTHONSTARTUP");
165 if (startup != NULL && startup[0] != '\0') {
166 FILE *fp = fopen(startup, "r");
167 if (fp != NULL) {
168 (void) PyRun_SimpleFileExFlags(fp, startup, 0, cf);
169 PyErr_Clear();
170 fclose(fp);
171 } else {
172 int save_errno;
173
174 save_errno = errno;
175 PySys_WriteStderr("Could not open PYTHONSTARTUP\n");
176 errno = save_errno;
177 PyErr_SetFromErrnoWithFilename(PyExc_IOError,
178 startup);
179 PyErr_Print();
180 PyErr_Clear();
181 }
182 }
Martin v. Löwis6caea372003-11-18 19:46:25 +0000183}
184
Thomas Woutersa9773292006-04-21 09:43:23 +0000185
Antoine Pitrou5651eaa2008-09-06 20:46:58 +0000186static int RunModule(wchar_t *modname, int set_argv0)
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000187{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000188 PyObject *module, *runpy, *runmodule, *runargs, *result;
189 runpy = PyImport_ImportModule("runpy");
190 if (runpy == NULL) {
191 fprintf(stderr, "Could not import runpy module\n");
192 return -1;
193 }
194 runmodule = PyObject_GetAttrString(runpy, "_run_module_as_main");
195 if (runmodule == NULL) {
196 fprintf(stderr, "Could not access runpy._run_module_as_main\n");
197 Py_DECREF(runpy);
198 return -1;
199 }
200 module = PyUnicode_FromWideChar(modname, wcslen(modname));
201 if (module == NULL) {
202 fprintf(stderr, "Could not convert module name to unicode\n");
203 Py_DECREF(runpy);
204 Py_DECREF(runmodule);
205 return -1;
206 }
207 runargs = Py_BuildValue("(Oi)", module, set_argv0);
208 if (runargs == NULL) {
209 fprintf(stderr,
210 "Could not create arguments for runpy._run_module_as_main\n");
211 Py_DECREF(runpy);
212 Py_DECREF(runmodule);
213 Py_DECREF(module);
214 return -1;
215 }
216 result = PyObject_Call(runmodule, runargs, NULL);
217 if (result == NULL) {
218 PyErr_Print();
219 }
220 Py_DECREF(runpy);
221 Py_DECREF(runmodule);
222 Py_DECREF(module);
223 Py_DECREF(runargs);
224 if (result == NULL) {
225 return -1;
226 }
227 Py_DECREF(result);
228 return 0;
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000229}
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000230
Victor Stinner4726e402010-10-06 23:24:57 +0000231static int
232RunMainFromImporter(wchar_t *filename)
Christian Heimes9cd17752007-11-18 19:35:23 +0000233{
Victor Stinner4726e402010-10-06 23:24:57 +0000234 PyObject *argv0 = NULL, *importer, *sys_path;
235 int sts;
Christian Heimes9cd17752007-11-18 19:35:23 +0000236
Victor Stinner4726e402010-10-06 23:24:57 +0000237 argv0 = PyUnicode_FromWideChar(filename, wcslen(filename));
238 if (argv0 == NULL)
239 goto error;
240
241 importer = PyImport_GetImporter(argv0);
242 if (importer == NULL)
243 goto error;
244
245 if (importer->ob_type == &PyNullImporter_Type) {
246 Py_DECREF(argv0);
247 Py_DECREF(importer);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000248 return -1;
249 }
Victor Stinner4726e402010-10-06 23:24:57 +0000250 Py_DECREF(importer);
251
252 /* argv0 is usable as an import source, so put it in sys.path[0]
253 and import __main__ */
254 sys_path = PySys_GetObject("path");
255 if (sys_path == NULL)
256 goto error;
257 if (PyList_SetItem(sys_path, 0, argv0)) {
258 argv0 = NULL;
259 goto error;
260 }
261 Py_INCREF(argv0);
262
263 sts = RunModule(L"__main__", 0);
264 return sts != 0;
265
266error:
267 Py_XDECREF(argv0);
268 PyErr_Print();
269 return 1;
Christian Heimes9cd17752007-11-18 19:35:23 +0000270}
271
Victor Stinnera62207c2010-08-07 10:57:17 +0000272static int
273run_command(wchar_t *command, PyCompilerFlags *cf)
274{
275 PyObject *unicode, *bytes;
276 int ret;
277
278 unicode = PyUnicode_FromWideChar(command, -1);
279 if (unicode == NULL)
280 goto error;
281 bytes = PyUnicode_AsUTF8String(unicode);
282 Py_DECREF(unicode);
283 if (bytes == NULL)
284 goto error;
285 ret = PyRun_SimpleStringFlags(PyBytes_AsString(bytes), cf);
286 Py_DECREF(bytes);
287 return ret != 0;
288
289error:
Victor Stinner398356b2010-08-18 22:23:22 +0000290 PySys_WriteStderr("Unable to decode the command from the command line:\n");
Victor Stinnera62207c2010-08-07 10:57:17 +0000291 PyErr_Print();
292 return 1;
293}
294
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000295static int
296run_file(FILE *fp, const wchar_t *filename, PyCompilerFlags *p_cf)
297{
298 PyObject *unicode, *bytes = NULL;
299 char *filename_str;
300 int run;
301
302 /* call pending calls like signal handlers (SIGINT) */
303 if (Py_MakePendingCalls() == -1) {
304 PyErr_Print();
305 return 1;
306 }
307
308 if (filename) {
309 unicode = PyUnicode_FromWideChar(filename, wcslen(filename));
310 if (unicode != NULL) {
311 bytes = PyUnicode_AsUTF8String(unicode);
312 Py_DECREF(unicode);
313 }
314 if (bytes != NULL)
315 filename_str = PyBytes_AsString(bytes);
316 else {
317 PyErr_Clear();
318 filename_str = "<decoding error>";
319 }
320 }
321 else
322 filename_str = "<stdin>";
323
324 run = PyRun_AnyFileExFlags(fp, filename_str, filename != NULL, p_cf);
325 Py_XDECREF(bytes);
326 return run != 0;
327}
328
Christian Heimes9cd17752007-11-18 19:35:23 +0000329
Guido van Rossum667d7041995-08-04 04:20:48 +0000330/* Main program */
331
Mark Hammondfe51c6d2002-08-02 02:27:13 +0000332int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000333Py_Main(int argc, wchar_t **argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000334{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000335 int c;
336 int sts;
337 wchar_t *command = NULL;
338 wchar_t *filename = NULL;
339 wchar_t *module = NULL;
340 FILE *fp = stdin;
341 char *p;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000342#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000343 wchar_t *wp;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000344#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000345 int skipfirstline = 0;
346 int stdin_is_interactive = 0;
347 int help = 0;
348 int version = 0;
349 int saw_unbuffered_flag = 0;
350 PyCompilerFlags cf;
Guido van Rossum667d7041995-08-04 04:20:48 +0000351
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000352 cf.cf_flags = 0;
Guido van Rossum393661d2001-08-31 17:40:15 +0000353
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000354 orig_argc = argc; /* For Py_GetArgcArgv() */
355 orig_argv = argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000356
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000357 PySys_ResetWarnOptions();
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000358
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000359 while ((c = _PyOS_GetOpt(argc, argv, PROGRAM_OPTS)) != EOF) {
360 if (c == 'c') {
361 size_t len;
362 /* -c is the last option; following arguments
363 that look like options are left for the
364 command to interpret. */
Amaury Forgeot d'Arc9a5499b2008-11-11 23:04:59 +0000365
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000366 len = wcslen(_PyOS_optarg) + 1 + 1;
367 command = (wchar_t *)malloc(sizeof(wchar_t) * len);
368 if (command == NULL)
369 Py_FatalError(
370 "not enough memory to copy -c argument");
371 wcscpy(command, _PyOS_optarg);
372 command[len - 2] = '\n';
373 command[len - 1] = 0;
374 break;
375 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000376
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000377 if (c == 'm') {
378 /* -m is the last option; following arguments
379 that look like options are left for the
380 module to interpret. */
381 module = _PyOS_optarg;
382 break;
383 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000384
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000385 switch (c) {
386 case 'b':
387 Py_BytesWarningFlag++;
388 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000389
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000390 case 'd':
391 Py_DebugFlag++;
392 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000393
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000394 case 'i':
395 Py_InspectFlag++;
396 Py_InteractiveFlag++;
397 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000398
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000399 /* case 'J': reserved for Jython */
Christian Heimes33fe8092008-04-13 13:53:33 +0000400
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000401 case 'O':
402 Py_OptimizeFlag++;
403 break;
Guido van Rossum7614da61997-03-03 19:14:45 +0000404
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000405 case 'B':
406 Py_DontWriteBytecodeFlag++;
407 break;
Christian Heimes790c8232008-01-07 21:14:23 +0000408
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000409 case 's':
410 Py_NoUserSiteDirectory++;
411 break;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000412
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000413 case 'S':
414 Py_NoSiteFlag++;
415 break;
Guido van Rossum7922bd71997-08-29 22:34:47 +0000416
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000417 case 'E':
418 Py_IgnoreEnvironmentFlag++;
419 break;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000420
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000421 case 't':
422 /* ignored for backwards compatibility */
423 break;
Guido van Rossumbba92ca1998-04-10 19:39:15 +0000424
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000425 case 'u':
426 Py_UnbufferedStdioFlag = 1;
427 saw_unbuffered_flag = 1;
428 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000429
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000430 case 'v':
431 Py_VerboseFlag++;
432 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000433
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000434 case 'x':
435 skipfirstline = 1;
436 break;
Guido van Rossuma075ce11997-12-05 21:56:45 +0000437
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000438 /* case 'X': reserved for implementation-specific arguments */
Christian Heimes33fe8092008-04-13 13:53:33 +0000439
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000440 case 'h':
441 case '?':
442 help++;
443 break;
Guido van Rossum45aecf42006-03-15 04:58:47 +0000444
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000445 case 'V':
446 version++;
447 break;
Guido van Rossumc15a9a12000-05-01 17:54:33 +0000448
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000449 case 'W':
450 PySys_AddWarnOption(_PyOS_optarg);
451 break;
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000452
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000453 /* This space reserved for other options */
Guido van Rossum667d7041995-08-04 04:20:48 +0000454
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000455 default:
456 return usage(2, argv[0]);
457 /*NOTREACHED*/
Guido van Rossum667d7041995-08-04 04:20:48 +0000458
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000459 }
460 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000461
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000462 if (help)
463 return usage(0, argv[0]);
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000464
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000465 if (version) {
466 fprintf(stderr, "Python %s\n", PY_VERSION);
467 return 0;
468 }
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000469
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000470 if (!Py_InspectFlag &&
471 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
472 Py_InspectFlag = 1;
473 if (!saw_unbuffered_flag &&
474 (p = Py_GETENV("PYTHONUNBUFFERED")) && *p != '\0')
475 Py_UnbufferedStdioFlag = 1;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000476
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000477 if (!Py_NoUserSiteDirectory &&
478 (p = Py_GETENV("PYTHONNOUSERSITE")) && *p != '\0')
479 Py_NoUserSiteDirectory = 1;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000480
Philip Jenveye53de3d2010-04-14 03:01:39 +0000481#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000482 if (!Py_IgnoreEnvironmentFlag && (wp = _wgetenv(L"PYTHONWARNINGS")) &&
483 *wp != L'\0') {
484 wchar_t *buf, *warning;
Philip Jenvey0805ca32010-04-07 04:04:10 +0000485
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000486 buf = (wchar_t *)malloc((wcslen(wp) + 1) * sizeof(wchar_t));
487 if (buf == NULL)
488 Py_FatalError(
489 "not enough memory to copy PYTHONWARNINGS");
490 wcscpy(buf, wp);
491 for (warning = wcstok(buf, L",");
492 warning != NULL;
493 warning = wcstok(NULL, L",")) {
494 PySys_AddWarnOption(warning);
495 }
496 free(buf);
497 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000498#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000499 if ((p = Py_GETENV("PYTHONWARNINGS")) && *p != '\0') {
500 char *buf, *oldloc;
Victor Stinnerc2d76fd2010-09-10 23:13:52 +0000501 PyObject *unicode;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000502
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000503 /* settle for strtok here as there's no one standard
504 C89 wcstok */
505 buf = (char *)malloc(strlen(p) + 1);
506 if (buf == NULL)
507 Py_FatalError(
508 "not enough memory to copy PYTHONWARNINGS");
509 strcpy(buf, p);
510 oldloc = strdup(setlocale(LC_ALL, NULL));
511 setlocale(LC_ALL, "");
512 for (p = strtok(buf, ","); p != NULL; p = strtok(NULL, ",")) {
Victor Stinner5c848a82010-09-12 08:00:41 +0000513#ifdef __APPLE__
514 /* Use utf-8 on Mac OS X */
515 unicode = PyUnicode_FromString(p);
516#else
517 wchar_t *wchar = _Py_char2wchar(p);
Victor Stinnerc2d76fd2010-09-10 23:13:52 +0000518 if (wchar == NULL)
519 continue;
520 unicode = PyUnicode_FromWideChar(wchar, wcslen(wchar));
521 PyMem_Free(wchar);
Victor Stinner5c848a82010-09-12 08:00:41 +0000522#endif
Victor Stinnerc2d76fd2010-09-10 23:13:52 +0000523 if (unicode == NULL)
524 continue;
525 PySys_AddWarnOptionUnicode(unicode);
526 Py_DECREF(unicode);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000527 }
528 setlocale(LC_ALL, oldloc);
529 free(oldloc);
530 free(buf);
531 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000532#endif
Philip Jenvey0805ca32010-04-07 04:04:10 +0000533
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000534 if (command == NULL && module == NULL && _PyOS_optind < argc &&
535 wcscmp(argv[_PyOS_optind], L"-") != 0)
536 {
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000537#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000538 filename = decc$translate_vms(argv[_PyOS_optind]);
539 if (filename == (char *)0 || filename == (char *)-1)
540 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000541
542#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000543 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000544#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000545 }
Guido van Rossum775af911997-02-14 19:50:32 +0000546
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000547 stdin_is_interactive = Py_FdIsInteractive(stdin, (char *)0);
Guido van Rossum775af911997-02-14 19:50:32 +0000548
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000549 if (Py_UnbufferedStdioFlag) {
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +0000550#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000551 _setmode(fileno(stdin), O_BINARY);
552 _setmode(fileno(stdout), O_BINARY);
Guido van Rossumf22d7e21997-01-11 19:28:55 +0000553#endif
Guido van Rossum22ffac11998-03-06 15:30:39 +0000554#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000555 setvbuf(stdin, (char *)NULL, _IONBF, BUFSIZ);
556 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
557 setvbuf(stderr, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000558#else /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000559 setbuf(stdin, (char *)NULL);
560 setbuf(stdout, (char *)NULL);
561 setbuf(stderr, (char *)NULL);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000562#endif /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000563 }
564 else if (Py_InteractiveFlag) {
Guido van Rossumb31c7dc1997-04-11 22:19:12 +0000565#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000566 /* Doesn't have to have line-buffered -- use unbuffered */
567 /* Any set[v]buf(stdin, ...) screws up Tkinter :-( */
568 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000569#else /* !MS_WINDOWS */
570#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000571 setvbuf(stdin, (char *)NULL, _IOLBF, BUFSIZ);
572 setvbuf(stdout, (char *)NULL, _IOLBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000573#endif /* HAVE_SETVBUF */
574#endif /* !MS_WINDOWS */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000575 /* Leave stderr alone - it should be unbuffered anyway. */
576 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000577#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000578 else {
579 setvbuf (stdout, (char *)NULL, _IOLBF, BUFSIZ);
580 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000581#endif /* __VMS */
Guido van Rossum667d7041995-08-04 04:20:48 +0000582
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000583#ifdef __APPLE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000584 /* On MacOS X, when the Python interpreter is embedded in an
585 application bundle, it gets executed by a bootstrapping script
586 that does os.execve() with an argv[0] that's different from the
587 actual Python executable. This is needed to keep the Finder happy,
588 or rather, to work around Apple's overly strict requirements of
589 the process name. However, we still need a usable sys.executable,
590 so the actual executable path is passed in an environment variable.
591 See Lib/plat-mac/bundlebuiler.py for details about the bootstrap
592 script. */
593 if ((p = Py_GETENV("PYTHONEXECUTABLE")) && *p != '\0') {
594 wchar_t* buffer;
595 size_t len = strlen(p);
596 size_t r;
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000597
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000598 buffer = malloc(len * sizeof(wchar_t));
599 if (buffer == NULL) {
600 Py_FatalError(
601 "not enough memory to copy PYTHONEXECUTABLE");
602 }
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000603
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000604 r = mbstowcs(buffer, p, len);
605 Py_SetProgramName(buffer);
606 /* buffer is now handed off - do not free */
607 } else {
608 Py_SetProgramName(argv[0]);
609 }
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000610#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000611 Py_SetProgramName(argv[0]);
Jack Jansenfbd861b2003-03-05 16:00:15 +0000612#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000613 Py_Initialize();
Guido van Rossumed52aac1997-07-19 19:20:32 +0000614
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000615 if (Py_VerboseFlag ||
616 (command == NULL && filename == NULL && module == NULL && stdin_is_interactive)) {
617 fprintf(stderr, "Python %s on %s\n",
618 Py_GetVersion(), Py_GetPlatform());
619 if (!Py_NoSiteFlag)
620 fprintf(stderr, "%s\n", COPYRIGHT);
621 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000622
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000623 if (command != NULL) {
624 /* Backup _PyOS_optind and force sys.argv[0] = '-c' */
625 _PyOS_optind--;
626 argv[_PyOS_optind] = L"-c";
627 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000628
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000629 if (module != NULL) {
Nick Coghland26c18a2010-08-17 13:06:11 +0000630 /* Backup _PyOS_optind and force sys.argv[0] = '-m'*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000631 _PyOS_optind--;
Nick Coghland26c18a2010-08-17 13:06:11 +0000632 argv[_PyOS_optind] = L"-m";
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000633 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000634
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000635 PySys_SetArgv(argc-_PyOS_optind, argv+_PyOS_optind);
Guido van Rossum667d7041995-08-04 04:20:48 +0000636
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000637 if ((Py_InspectFlag || (command == NULL && filename == NULL && module == NULL)) &&
638 isatty(fileno(stdin))) {
639 PyObject *v;
640 v = PyImport_ImportModule("readline");
641 if (v == NULL)
642 PyErr_Clear();
643 else
644 Py_DECREF(v);
645 }
Guido van Rossum3d26cc91997-09-16 16:11:28 +0000646
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000647 if (command) {
Victor Stinnera62207c2010-08-07 10:57:17 +0000648 sts = run_command(command, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000649 free(command);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000650 } else if (module) {
651 sts = RunModule(module, 1);
652 }
653 else {
Christian Heimes9cd17752007-11-18 19:35:23 +0000654
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000655 if (filename == NULL && stdin_is_interactive) {
656 Py_InspectFlag = 0; /* do exit on SystemExit */
657 RunStartupFile(&cf);
658 }
659 /* XXX */
Christian Heimes9cd17752007-11-18 19:35:23 +0000660
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000661 sts = -1; /* keep track of whether we've already run __main__ */
Christian Heimes9cd17752007-11-18 19:35:23 +0000662
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000663 if (filename != NULL) {
664 sts = RunMainFromImporter(filename);
665 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000666
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000667 if (sts==-1 && filename!=NULL) {
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000668 if ((fp = _Py_wfopen(filename, L"r")) == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000669 char cfilename[PATH_MAX];
670 size_t r = wcstombs(cfilename, filename, PATH_MAX);
671 if (r == PATH_MAX)
672 /* cfilename is not null-terminated;
673 * forcefully null-terminating it
674 * might break the shift state */
675 strcpy(cfilename, "<file name too long>");
676 if (r == ((size_t)-1))
677 strcpy(cfilename, "<unprintable file name>");
678 fprintf(stderr, "%ls: can't open file '%s': [Errno %d] %s\n",
679 argv[0], cfilename, errno, strerror(errno));
Christian Heimesada8c3b2008-03-18 18:26:33 +0000680
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000681 return 2;
682 }
683 else if (skipfirstline) {
684 int ch;
685 /* Push back first newline so line numbers
686 remain the same */
687 while ((ch = getc(fp)) != EOF) {
688 if (ch == '\n') {
689 (void)ungetc(ch, fp);
690 break;
691 }
692 }
693 }
694 {
695 /* XXX: does this work on Win/Win64? (see posix_fstat) */
696 struct stat sb;
697 if (fstat(fileno(fp), &sb) == 0 &&
698 S_ISDIR(sb.st_mode)) {
699 fprintf(stderr, "%ls: '%ls' is a directory, cannot continue\n", argv[0], filename);
700 fclose(fp);
701 return 1;
702 }
703 }
704 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000705
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000706 if (sts == -1)
707 sts = run_file(fp, filename, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000708 }
Barry Warsawd86dcd32003-06-29 17:07:06 +0000709
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000710 /* Check this environment variable at the end, to give programs the
711 * opportunity to set it from Python.
712 */
713 if (!Py_InspectFlag &&
714 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
715 {
716 Py_InspectFlag = 1;
717 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000718
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000719 if (Py_InspectFlag && stdin_is_interactive &&
720 (filename != NULL || command != NULL || module != NULL)) {
721 Py_InspectFlag = 0;
722 /* XXX */
723 sts = PyRun_AnyFileFlags(stdin, "<stdin>", &cf) != 0;
724 }
725
726 Py_Finalize();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000727
728#ifdef __INSURE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000729 /* Insure++ is a memory analysis tool that aids in discovering
730 * memory leaks and other memory problems. On Python exit, the
731 * interned string dictionaries are flagged as being in use at exit
732 * (which it is). Under normal circumstances, this is fine because
733 * the memory will be automatically reclaimed by the system. Under
734 * memory debugging, it's a huge source of useless noise, so we
735 * trade off slower shutdown for less distraction in the memory
736 * reports. -baw
737 */
738 _Py_ReleaseInternedStrings();
739 _Py_ReleaseInternedUnicodeStrings();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000740#endif /* __INSURE__ */
741
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000742 return sts;
Guido van Rossum667d7041995-08-04 04:20:48 +0000743}
744
Skip Montanaro786ea6b2004-03-01 15:44:05 +0000745/* this is gonna seem *real weird*, but if you put some other code between
746 Py_Main() and Py_GetArgcArgv() you will need to adjust the test in the
747 while statement in Misc/gdbinit:ppystack */
Guido van Rossum667d7041995-08-04 04:20:48 +0000748
Guido van Rossum667d7041995-08-04 04:20:48 +0000749/* Make the *original* argc/argv available to other modules.
750 This is rare, but it is needed by the secureware extension. */
751
752void
Martin v. Löwis790465f2008-04-05 20:41:37 +0000753Py_GetArgcArgv(int *argc, wchar_t ***argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000754{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000755 *argc = orig_argc;
756 *argv = orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000757}
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000758
Ronald Oussorend61deca2010-04-18 14:46:12 +0000759
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000760/* Encode a (wide) character string to the locale encoding with the
761 surrogateescape error handler (characters in range U+DC80..U+DCFF are
762 converted to bytes 0x80..0xFF).
763
764 This function is the reverse of _Py_char2wchar().
765
766 Return a pointer to a newly allocated byte string (use PyMem_Free() to free
767 the memory), or NULL on error (conversion error or memory error). */
768char*
769_Py_wchar2char(const wchar_t *text)
770{
771 const size_t len = wcslen(text);
772 char *result = NULL, *bytes = NULL;
773 size_t i, size, converted;
774 wchar_t c, buf[2];
775
776 /* The function works in two steps:
777 1. compute the length of the output buffer in bytes (size)
778 2. outputs the bytes */
779 size = 0;
780 buf[1] = 0;
781 while (1) {
782 for (i=0; i < len; i++) {
783 c = text[i];
784 if (c >= 0xdc80 && c <= 0xdcff) {
785 /* UTF-8b surrogate */
786 if (bytes != NULL) {
787 *bytes++ = c - 0xdc00;
788 size--;
789 }
790 else
791 size++;
792 continue;
793 }
794 else {
795 buf[0] = c;
796 if (bytes != NULL)
797 converted = wcstombs(bytes, buf, size);
798 else
799 converted = wcstombs(NULL, buf, 0);
800 if (converted == (size_t)-1) {
801 if (result != NULL)
802 PyMem_Free(result);
803 return NULL;
804 }
805 if (bytes != NULL) {
806 bytes += converted;
807 size -= converted;
808 }
809 else
810 size += converted;
811 }
812 }
813 if (result != NULL) {
814 *bytes = 0;
815 break;
816 }
817
818 size += 1; /* nul byte at the end */
819 result = PyMem_Malloc(size);
820 if (result == NULL)
821 return NULL;
822 bytes = result;
823 }
824 return result;
825}
826
827
828/* Decode a byte string from the locale encoding with the
829 surrogateescape error handler (undecodable bytes are decoded as characters
830 in range U+DC80..U+DCFF). If a byte sequence can be decoded as a surrogate
831 character, escape the bytes using the surrogateescape error handler instead
832 of decoding them.
833
834 Use _Py_wchar2char() to encode the character string back to a byte string.
835
836 Return a pointer to a newly allocated (wide) character string (use
837 PyMem_Free() to free the memory), or NULL on error (conversion error or
838 memory error). */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000839wchar_t*
840_Py_char2wchar(char* arg)
841{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000842 wchar_t *res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000843#ifdef HAVE_BROKEN_MBSTOWCS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000844 /* Some platforms have a broken implementation of
845 * mbstowcs which does not count the characters that
846 * would result from conversion. Use an upper bound.
847 */
848 size_t argsize = strlen(arg);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000849#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000850 size_t argsize = mbstowcs(NULL, arg, 0);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000851#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000852 size_t count;
853 unsigned char *in;
854 wchar_t *out;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000855#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000856 mbstate_t mbs;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000857#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000858 if (argsize != (size_t)-1) {
859 res = (wchar_t *)PyMem_Malloc((argsize+1)*sizeof(wchar_t));
860 if (!res)
861 goto oom;
862 count = mbstowcs(res, arg, argsize+1);
863 if (count != (size_t)-1) {
864 wchar_t *tmp;
865 /* Only use the result if it contains no
866 surrogate characters. */
867 for (tmp = res; *tmp != 0 &&
868 (*tmp < 0xd800 || *tmp > 0xdfff); tmp++)
869 ;
870 if (*tmp == 0)
871 return res;
872 }
873 PyMem_Free(res);
874 }
875 /* Conversion failed. Fall back to escaping with surrogateescape. */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000876#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000877 /* Try conversion with mbrtwoc (C99), and escape non-decodable bytes. */
878
879 /* Overallocate; as multi-byte characters are in the argument, the
880 actual output could use less memory. */
881 argsize = strlen(arg) + 1;
882 res = (wchar_t*)PyMem_Malloc(argsize*sizeof(wchar_t));
883 if (!res) goto oom;
884 in = (unsigned char*)arg;
885 out = res;
886 memset(&mbs, 0, sizeof mbs);
887 while (argsize) {
888 size_t converted = mbrtowc(out, (char*)in, argsize, &mbs);
889 if (converted == 0)
890 /* Reached end of string; null char stored. */
891 break;
892 if (converted == (size_t)-2) {
893 /* Incomplete character. This should never happen,
894 since we provide everything that we have -
895 unless there is a bug in the C library, or I
896 misunderstood how mbrtowc works. */
897 fprintf(stderr, "unexpected mbrtowc result -2\n");
898 return NULL;
899 }
900 if (converted == (size_t)-1) {
901 /* Conversion error. Escape as UTF-8b, and start over
902 in the initial shift state. */
903 *out++ = 0xdc00 + *in++;
904 argsize--;
905 memset(&mbs, 0, sizeof mbs);
906 continue;
907 }
908 if (*out >= 0xd800 && *out <= 0xdfff) {
909 /* Surrogate character. Escape the original
910 byte sequence with surrogateescape. */
911 argsize -= converted;
912 while (converted--)
913 *out++ = 0xdc00 + *in++;
914 continue;
915 }
916 /* successfully converted some bytes */
917 in += converted;
918 argsize -= converted;
919 out++;
920 }
Ronald Oussorend61deca2010-04-18 14:46:12 +0000921#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000922 /* Cannot use C locale for escaping; manually escape as if charset
923 is ASCII (i.e. escape all bytes > 128. This will still roundtrip
924 correctly in the locale's charset, which must be an ASCII superset. */
925 res = PyMem_Malloc((strlen(arg)+1)*sizeof(wchar_t));
926 if (!res) goto oom;
927 in = (unsigned char*)arg;
928 out = res;
929 while(*in)
930 if(*in < 128)
931 *out++ = *in++;
932 else
933 *out++ = 0xdc00 + *in++;
934 *out = 0;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000935#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000936 return res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000937oom:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000938 fprintf(stderr, "out of memory\n");
939 return NULL;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000940}
941
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000942#ifdef __cplusplus
943}
944#endif