blob: a5c89059d36c4da144061f21da301eee055728ec [file] [log] [blame]
Guido van Rossum667d7041995-08-04 04:20:48 +00001/* Python interpreter main program */
2
3#include "Python.h"
Guido van Rossuma075ce11997-12-05 21:56:45 +00004#include "osdefs.h"
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +00005#include "import.h"
Guido van Rossum667d7041995-08-04 04:20:48 +00006
Antoine Pitrou5651eaa2008-09-06 20:46:58 +00007#include <locale.h>
8
Martin v. Löwis79acb9e2002-12-06 12:48:53 +00009#ifdef __VMS
Martin v. Löwis7a924e62003-03-05 14:15:21 +000010#include <unixlib.h>
Martin v. Löwis79acb9e2002-12-06 12:48:53 +000011#endif
12
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +000013#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Martin v. Löwis945362c2007-08-30 14:57:25 +000014#include <windows.h>
Thomas Wouters477c8d52006-05-27 19:21:47 +000015#ifdef HAVE_FCNTL_H
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000016#include <fcntl.h>
Martin v. Löwis790465f2008-04-05 20:41:37 +000017#define PATH_MAX MAXPATHLEN
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000018#endif
Thomas Wouters477c8d52006-05-27 19:21:47 +000019#endif
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000020
Martin v. Löwis945362c2007-08-30 14:57:25 +000021#ifdef _MSC_VER
22#include <crtdbg.h>
23#endif
24
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000025#if (defined(PYOS_OS2) && !defined(PYCC_GCC)) || defined(MS_WINDOWS)
Guido van Rossuma075ce11997-12-05 21:56:45 +000026#define PYTHONHOMEHELP "<prefix>\\lib"
27#else
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000028#if defined(PYOS_OS2) && defined(PYCC_GCC)
29#define PYTHONHOMEHELP "<prefix>/Lib"
30#else
Marc-André Lemburgda4dbc32001-06-12 16:13:51 +000031#define PYTHONHOMEHELP "<prefix>/pythonX.X"
Guido van Rossuma075ce11997-12-05 21:56:45 +000032#endif
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000033#endif
Guido van Rossuma075ce11997-12-05 21:56:45 +000034
Thomas Wouters2cffc7d2000-11-03 08:18:37 +000035#include "pygetopt.h"
36
Guido van Rossuma22865e2000-09-05 04:41:18 +000037#define COPYRIGHT \
Guido van Rossum36002d72001-07-18 16:59:46 +000038 "Type \"help\", \"copyright\", \"credits\" or \"license\" " \
39 "for more information."
Guido van Rossuma22865e2000-09-05 04:41:18 +000040
Thomas Wouters49fd7fa2006-04-21 10:40:58 +000041#ifdef __cplusplus
42extern "C" {
43#endif
44
Guido van Rossumac56b031996-07-21 02:33:38 +000045/* For Py_GetArgcArgv(); set by main() */
Martin v. Löwis790465f2008-04-05 20:41:37 +000046static wchar_t **orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +000047static int orig_argc;
48
Guido van Rossumbceccf52001-04-10 22:07:43 +000049/* command line options */
Christian Heimes8dc226f2008-05-06 23:45:46 +000050#define BASE_OPTS L"bBc:dEhiJm:OsStuvVW:xX?"
Guido van Rossumbceccf52001-04-10 22:07:43 +000051
Guido van Rossumbceccf52001-04-10 22:07:43 +000052#define PROGRAM_OPTS BASE_OPTS
Guido van Rossum3ed4c152001-03-02 06:18:03 +000053
Guido van Rossum667d7041995-08-04 04:20:48 +000054/* Short usage message (with %s for argv0) */
55static char *usage_line =
Martin v. Löwis790465f2008-04-05 20:41:37 +000056"usage: %ls [option] ... [-c cmd | -m mod | file | -] [arg] ...\n";
Guido van Rossum667d7041995-08-04 04:20:48 +000057
58/* Long usage message, split into parts < 512 bytes */
Guido van Rossum393661d2001-08-31 17:40:15 +000059static char *usage_1 = "\
Guido van Rossum667d7041995-08-04 04:20:48 +000060Options and arguments (and corresponding environment variables):\n\
Christian Heimes2ab34442008-09-03 20:31:07 +000061-b : issue warnings about str(bytes_instance), str(bytearray_instance)\n\
62 and comparing bytes/bytearray with str. (-bb: issue errors)\n\
Christian Heimes790c8232008-01-07 21:14:23 +000063-B : don't write .py[co] files on import; also PYTHONDONTWRITEBYTECODE=x\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000064-c cmd : program passed in as string (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000065-d : debug output from parser; also PYTHONDEBUG=x\n\
Christian Heimes790c8232008-01-07 21:14:23 +000066-E : ignore PYTHON* environment variables (such as PYTHONPATH)\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000067-h : print this help message and exit (also --help)\n\
Guido van Rossum61c345f2001-09-04 03:26:15 +000068";
69static char *usage_2 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000070-i : inspect interactively after running script; forces a prompt even\n\
71 if stdin does not appear to be a terminal; also PYTHONINSPECT=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000072-m mod : run library module as a script (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000073-O : optimize generated bytecode slightly; also PYTHONOPTIMIZE=x\n\
Guido van Rossum6b86a421999-01-28 15:07:47 +000074-OO : remove doc-strings in addition to the -O optimizations\n\
Christian Heimes8dc226f2008-05-06 23:45:46 +000075-s : don't add user site directory to sys.path; also PYTHONNOUSERSITE\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000076-S : don't imply 'import site' on initialization\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000077";
78static char *usage_3 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000079-u : unbuffered binary stdout and stderr; also PYTHONUNBUFFERED=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000080 see man page for details on internal buffering relating to '-u'\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000081-v : verbose (trace import statements); also PYTHONVERBOSE=x\n\
82 can be supplied multiple times to increase verbosity\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000083-V : print the Python version number and exit (also --version)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000084-W arg : warning control; arg is action:message:category:module:lineno\n\
Philip Jenvey0805ca32010-04-07 04:04:10 +000085 also PYTHONWARNINGS=arg\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000086-x : skip first line of source, allowing use of non-Unix forms of #!cmd\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000087";
Guido van Rossum393661d2001-08-31 17:40:15 +000088static char *usage_4 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000089file : program read from script file\n\
90- : program read from stdin (default; interactive mode if a tty)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000091arg ...: arguments passed to program in sys.argv[1:]\n\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000092Other environment variables:\n\
93PYTHONSTARTUP: file executed on interactive startup (no default)\n\
Guido van Rossuma075ce11997-12-05 21:56:45 +000094PYTHONPATH : '%c'-separated list of directories prefixed to the\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000095 default module search path. The result is sys.path.\n\
Christian Heimes790c8232008-01-07 21:14:23 +000096";
97static char *usage_5 = "\
Guido van Rossuma075ce11997-12-05 21:56:45 +000098PYTHONHOME : alternate <prefix> directory (or <prefix>%c<exec_prefix>).\n\
99 The default module search path uses %s.\n\
Tim Peters793de092001-02-22 00:39:47 +0000100PYTHONCASEOK : ignore case in 'import' statements (Windows).\n\
Martin v. Löwis0f599892008-06-02 11:13:03 +0000101PYTHONIOENCODING: Encoding[:errors] used for stdin/stdout/stderr.\n\
Victor Stinner94908bb2010-08-18 21:23:25 +0000102PYTHONFSENCODING: Encoding used for the filesystem.\n\
Guido van Rossum667d7041995-08-04 04:20:48 +0000103";
104
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000105FILE *
106_Py_wfopen(const wchar_t *path, const wchar_t *mode)
Martin v. Löwis790465f2008-04-05 20:41:37 +0000107{
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000108#ifndef MS_WINDOWS
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000109 FILE *f;
110 char *cpath;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000111 char cmode[10];
112 size_t r;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000113 r = wcstombs(cmode, mode, 10);
114 if (r == (size_t)-1 || r >= 10) {
115 errno = EINVAL;
116 return NULL;
117 }
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000118 cpath = _Py_wchar2char(path);
119 if (cpath == NULL)
120 return NULL;
121 f = fopen(cpath, cmode);
122 PyMem_Free(cpath);
123 return f;
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000124#else
125 return _wfopen(path, mode);
Martin v. Löwis790465f2008-04-05 20:41:37 +0000126#endif
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000127}
Martin v. Löwis790465f2008-04-05 20:41:37 +0000128
Guido van Rossum667d7041995-08-04 04:20:48 +0000129
Martin v. Löwis852ba7e2003-03-30 17:09:58 +0000130static int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000131usage(int exitcode, wchar_t* program)
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000132{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000133 FILE *f = exitcode ? stderr : stdout;
Guido van Rossum393661d2001-08-31 17:40:15 +0000134
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000135 fprintf(f, usage_line, program);
136 if (exitcode)
137 fprintf(f, "Try `python -h' for more information.\n");
138 else {
139 fputs(usage_1, f);
140 fputs(usage_2, f);
141 fputs(usage_3, f);
142 fprintf(f, usage_4, DELIM);
143 fprintf(f, usage_5, DELIM, PYTHONHOMEHELP);
144 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000145#if defined(__VMS)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000146 if (exitcode == 0) {
147 /* suppress 'error' message */
148 return 1;
149 }
150 else {
151 /* STS$M_INHIB_MSG + SS$_ABORT */
152 return 0x1000002c;
153 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000154#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000155 return exitcode;
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000156#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000157 /*NOTREACHED*/
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000158}
159
Martin v. Löwis6caea372003-11-18 19:46:25 +0000160static void RunStartupFile(PyCompilerFlags *cf)
161{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000162 char *startup = Py_GETENV("PYTHONSTARTUP");
163 if (startup != NULL && startup[0] != '\0') {
164 FILE *fp = fopen(startup, "r");
165 if (fp != NULL) {
166 (void) PyRun_SimpleFileExFlags(fp, startup, 0, cf);
167 PyErr_Clear();
168 fclose(fp);
169 } else {
170 int save_errno;
171
172 save_errno = errno;
173 PySys_WriteStderr("Could not open PYTHONSTARTUP\n");
174 errno = save_errno;
175 PyErr_SetFromErrnoWithFilename(PyExc_IOError,
176 startup);
177 PyErr_Print();
178 PyErr_Clear();
179 }
180 }
Martin v. Löwis6caea372003-11-18 19:46:25 +0000181}
182
Thomas Woutersa9773292006-04-21 09:43:23 +0000183
Antoine Pitrou5651eaa2008-09-06 20:46:58 +0000184static int RunModule(wchar_t *modname, int set_argv0)
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000185{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000186 PyObject *module, *runpy, *runmodule, *runargs, *result;
187 runpy = PyImport_ImportModule("runpy");
188 if (runpy == NULL) {
189 fprintf(stderr, "Could not import runpy module\n");
190 return -1;
191 }
192 runmodule = PyObject_GetAttrString(runpy, "_run_module_as_main");
193 if (runmodule == NULL) {
194 fprintf(stderr, "Could not access runpy._run_module_as_main\n");
195 Py_DECREF(runpy);
196 return -1;
197 }
198 module = PyUnicode_FromWideChar(modname, wcslen(modname));
199 if (module == NULL) {
200 fprintf(stderr, "Could not convert module name to unicode\n");
201 Py_DECREF(runpy);
202 Py_DECREF(runmodule);
203 return -1;
204 }
205 runargs = Py_BuildValue("(Oi)", module, set_argv0);
206 if (runargs == NULL) {
207 fprintf(stderr,
208 "Could not create arguments for runpy._run_module_as_main\n");
209 Py_DECREF(runpy);
210 Py_DECREF(runmodule);
211 Py_DECREF(module);
212 return -1;
213 }
214 result = PyObject_Call(runmodule, runargs, NULL);
215 if (result == NULL) {
216 PyErr_Print();
217 }
218 Py_DECREF(runpy);
219 Py_DECREF(runmodule);
220 Py_DECREF(module);
221 Py_DECREF(runargs);
222 if (result == NULL) {
223 return -1;
224 }
225 Py_DECREF(result);
226 return 0;
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000227}
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000228
Martin v. Löwis790465f2008-04-05 20:41:37 +0000229static int RunMainFromImporter(wchar_t *filename)
Christian Heimes9cd17752007-11-18 19:35:23 +0000230{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000231 PyObject *argv0 = NULL, *importer = NULL;
Christian Heimes9cd17752007-11-18 19:35:23 +0000232
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000233 if ((argv0 = PyUnicode_FromWideChar(filename,wcslen(filename))) &&
234 (importer = PyImport_GetImporter(argv0)) &&
235 (importer->ob_type != &PyNullImporter_Type))
236 {
237 /* argv0 is usable as an import source, so
238 put it in sys.path[0] and import __main__ */
239 PyObject *sys_path = NULL;
240 if ((sys_path = PySys_GetObject("path")) &&
241 !PyList_SetItem(sys_path, 0, argv0))
242 {
243 Py_INCREF(argv0);
244 Py_DECREF(importer);
245 sys_path = NULL;
246 return RunModule(L"__main__", 0) != 0;
Guido van Rossum74c29c72007-11-19 18:36:41 +0000247 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000248 }
249 Py_XDECREF(argv0);
250 Py_XDECREF(importer);
251 if (PyErr_Occurred()) {
252 PyErr_Print();
253 return 1;
254 }
255 else {
256 return -1;
257 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000258}
259
Victor Stinnera62207c2010-08-07 10:57:17 +0000260static int
261run_command(wchar_t *command, PyCompilerFlags *cf)
262{
263 PyObject *unicode, *bytes;
264 int ret;
265
266 unicode = PyUnicode_FromWideChar(command, -1);
267 if (unicode == NULL)
268 goto error;
269 bytes = PyUnicode_AsUTF8String(unicode);
270 Py_DECREF(unicode);
271 if (bytes == NULL)
272 goto error;
273 ret = PyRun_SimpleStringFlags(PyBytes_AsString(bytes), cf);
274 Py_DECREF(bytes);
275 return ret != 0;
276
277error:
Victor Stinner398356b2010-08-18 22:23:22 +0000278 PySys_WriteStderr("Unable to decode the command from the command line:\n");
Victor Stinnera62207c2010-08-07 10:57:17 +0000279 PyErr_Print();
280 return 1;
281}
282
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000283static int
284run_file(FILE *fp, const wchar_t *filename, PyCompilerFlags *p_cf)
285{
286 PyObject *unicode, *bytes = NULL;
287 char *filename_str;
288 int run;
289
290 /* call pending calls like signal handlers (SIGINT) */
291 if (Py_MakePendingCalls() == -1) {
292 PyErr_Print();
293 return 1;
294 }
295
296 if (filename) {
297 unicode = PyUnicode_FromWideChar(filename, wcslen(filename));
298 if (unicode != NULL) {
299 bytes = PyUnicode_AsUTF8String(unicode);
300 Py_DECREF(unicode);
301 }
302 if (bytes != NULL)
303 filename_str = PyBytes_AsString(bytes);
304 else {
305 PyErr_Clear();
306 filename_str = "<decoding error>";
307 }
308 }
309 else
310 filename_str = "<stdin>";
311
312 run = PyRun_AnyFileExFlags(fp, filename_str, filename != NULL, p_cf);
313 Py_XDECREF(bytes);
314 return run != 0;
315}
316
Christian Heimes9cd17752007-11-18 19:35:23 +0000317
Guido van Rossum667d7041995-08-04 04:20:48 +0000318/* Main program */
319
Mark Hammondfe51c6d2002-08-02 02:27:13 +0000320int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000321Py_Main(int argc, wchar_t **argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000322{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000323 int c;
324 int sts;
325 wchar_t *command = NULL;
326 wchar_t *filename = NULL;
327 wchar_t *module = NULL;
328 FILE *fp = stdin;
329 char *p;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000330#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000331 wchar_t *wp;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000332#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000333 int skipfirstline = 0;
334 int stdin_is_interactive = 0;
335 int help = 0;
336 int version = 0;
337 int saw_unbuffered_flag = 0;
338 PyCompilerFlags cf;
Guido van Rossum667d7041995-08-04 04:20:48 +0000339
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000340 cf.cf_flags = 0;
Guido van Rossum393661d2001-08-31 17:40:15 +0000341
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000342 orig_argc = argc; /* For Py_GetArgcArgv() */
343 orig_argv = argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000344
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000345 PySys_ResetWarnOptions();
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000346
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000347 while ((c = _PyOS_GetOpt(argc, argv, PROGRAM_OPTS)) != EOF) {
348 if (c == 'c') {
349 size_t len;
350 /* -c is the last option; following arguments
351 that look like options are left for the
352 command to interpret. */
Amaury Forgeot d'Arc9a5499b2008-11-11 23:04:59 +0000353
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000354 len = wcslen(_PyOS_optarg) + 1 + 1;
355 command = (wchar_t *)malloc(sizeof(wchar_t) * len);
356 if (command == NULL)
357 Py_FatalError(
358 "not enough memory to copy -c argument");
359 wcscpy(command, _PyOS_optarg);
360 command[len - 2] = '\n';
361 command[len - 1] = 0;
362 break;
363 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000364
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000365 if (c == 'm') {
366 /* -m is the last option; following arguments
367 that look like options are left for the
368 module to interpret. */
369 module = _PyOS_optarg;
370 break;
371 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000372
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000373 switch (c) {
374 case 'b':
375 Py_BytesWarningFlag++;
376 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000377
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000378 case 'd':
379 Py_DebugFlag++;
380 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000381
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000382 case 'i':
383 Py_InspectFlag++;
384 Py_InteractiveFlag++;
385 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000386
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000387 /* case 'J': reserved for Jython */
Christian Heimes33fe8092008-04-13 13:53:33 +0000388
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000389 case 'O':
390 Py_OptimizeFlag++;
391 break;
Guido van Rossum7614da61997-03-03 19:14:45 +0000392
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000393 case 'B':
394 Py_DontWriteBytecodeFlag++;
395 break;
Christian Heimes790c8232008-01-07 21:14:23 +0000396
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000397 case 's':
398 Py_NoUserSiteDirectory++;
399 break;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000400
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000401 case 'S':
402 Py_NoSiteFlag++;
403 break;
Guido van Rossum7922bd71997-08-29 22:34:47 +0000404
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000405 case 'E':
406 Py_IgnoreEnvironmentFlag++;
407 break;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000408
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000409 case 't':
410 /* ignored for backwards compatibility */
411 break;
Guido van Rossumbba92ca1998-04-10 19:39:15 +0000412
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000413 case 'u':
414 Py_UnbufferedStdioFlag = 1;
415 saw_unbuffered_flag = 1;
416 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000417
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000418 case 'v':
419 Py_VerboseFlag++;
420 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000421
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000422 case 'x':
423 skipfirstline = 1;
424 break;
Guido van Rossuma075ce11997-12-05 21:56:45 +0000425
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000426 /* case 'X': reserved for implementation-specific arguments */
Christian Heimes33fe8092008-04-13 13:53:33 +0000427
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000428 case 'h':
429 case '?':
430 help++;
431 break;
Guido van Rossum45aecf42006-03-15 04:58:47 +0000432
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000433 case 'V':
434 version++;
435 break;
Guido van Rossumc15a9a12000-05-01 17:54:33 +0000436
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000437 case 'W':
438 PySys_AddWarnOption(_PyOS_optarg);
439 break;
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000440
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000441 /* This space reserved for other options */
Guido van Rossum667d7041995-08-04 04:20:48 +0000442
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000443 default:
444 return usage(2, argv[0]);
445 /*NOTREACHED*/
Guido van Rossum667d7041995-08-04 04:20:48 +0000446
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000447 }
448 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000449
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000450 if (help)
451 return usage(0, argv[0]);
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000452
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000453 if (version) {
454 fprintf(stderr, "Python %s\n", PY_VERSION);
455 return 0;
456 }
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000457
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000458 if (!Py_InspectFlag &&
459 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
460 Py_InspectFlag = 1;
461 if (!saw_unbuffered_flag &&
462 (p = Py_GETENV("PYTHONUNBUFFERED")) && *p != '\0')
463 Py_UnbufferedStdioFlag = 1;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000464
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000465 if (!Py_NoUserSiteDirectory &&
466 (p = Py_GETENV("PYTHONNOUSERSITE")) && *p != '\0')
467 Py_NoUserSiteDirectory = 1;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000468
Philip Jenveye53de3d2010-04-14 03:01:39 +0000469#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000470 if (!Py_IgnoreEnvironmentFlag && (wp = _wgetenv(L"PYTHONWARNINGS")) &&
471 *wp != L'\0') {
472 wchar_t *buf, *warning;
Philip Jenvey0805ca32010-04-07 04:04:10 +0000473
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000474 buf = (wchar_t *)malloc((wcslen(wp) + 1) * sizeof(wchar_t));
475 if (buf == NULL)
476 Py_FatalError(
477 "not enough memory to copy PYTHONWARNINGS");
478 wcscpy(buf, wp);
479 for (warning = wcstok(buf, L",");
480 warning != NULL;
481 warning = wcstok(NULL, L",")) {
482 PySys_AddWarnOption(warning);
483 }
484 free(buf);
485 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000486#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000487 if ((p = Py_GETENV("PYTHONWARNINGS")) && *p != '\0') {
488 char *buf, *oldloc;
Victor Stinner9ca9c252010-05-19 16:53:30 +0000489 PyObject *warning;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000490
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000491 /* settle for strtok here as there's no one standard
492 C89 wcstok */
493 buf = (char *)malloc(strlen(p) + 1);
494 if (buf == NULL)
495 Py_FatalError(
496 "not enough memory to copy PYTHONWARNINGS");
497 strcpy(buf, p);
498 oldloc = strdup(setlocale(LC_ALL, NULL));
499 setlocale(LC_ALL, "");
500 for (p = strtok(buf, ","); p != NULL; p = strtok(NULL, ",")) {
Victor Stinner9ca9c252010-05-19 16:53:30 +0000501 warning = PyUnicode_DecodeFSDefault(p);
502 if (warning != NULL) {
503 PySys_AddWarnOptionUnicode(warning);
504 Py_DECREF(warning);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000505 }
506 }
507 setlocale(LC_ALL, oldloc);
508 free(oldloc);
509 free(buf);
510 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000511#endif
Philip Jenvey0805ca32010-04-07 04:04:10 +0000512
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000513 if (command == NULL && module == NULL && _PyOS_optind < argc &&
514 wcscmp(argv[_PyOS_optind], L"-") != 0)
515 {
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000516#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000517 filename = decc$translate_vms(argv[_PyOS_optind]);
518 if (filename == (char *)0 || filename == (char *)-1)
519 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000520
521#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000522 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000523#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000524 }
Guido van Rossum775af911997-02-14 19:50:32 +0000525
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000526 stdin_is_interactive = Py_FdIsInteractive(stdin, (char *)0);
Guido van Rossum775af911997-02-14 19:50:32 +0000527
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000528 if (Py_UnbufferedStdioFlag) {
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +0000529#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000530 _setmode(fileno(stdin), O_BINARY);
531 _setmode(fileno(stdout), O_BINARY);
Guido van Rossumf22d7e21997-01-11 19:28:55 +0000532#endif
Guido van Rossum22ffac11998-03-06 15:30:39 +0000533#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000534 setvbuf(stdin, (char *)NULL, _IONBF, BUFSIZ);
535 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
536 setvbuf(stderr, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000537#else /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000538 setbuf(stdin, (char *)NULL);
539 setbuf(stdout, (char *)NULL);
540 setbuf(stderr, (char *)NULL);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000541#endif /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000542 }
543 else if (Py_InteractiveFlag) {
Guido van Rossumb31c7dc1997-04-11 22:19:12 +0000544#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000545 /* Doesn't have to have line-buffered -- use unbuffered */
546 /* Any set[v]buf(stdin, ...) screws up Tkinter :-( */
547 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000548#else /* !MS_WINDOWS */
549#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000550 setvbuf(stdin, (char *)NULL, _IOLBF, BUFSIZ);
551 setvbuf(stdout, (char *)NULL, _IOLBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000552#endif /* HAVE_SETVBUF */
553#endif /* !MS_WINDOWS */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000554 /* Leave stderr alone - it should be unbuffered anyway. */
555 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000556#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000557 else {
558 setvbuf (stdout, (char *)NULL, _IOLBF, BUFSIZ);
559 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000560#endif /* __VMS */
Guido van Rossum667d7041995-08-04 04:20:48 +0000561
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000562#ifdef __APPLE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000563 /* On MacOS X, when the Python interpreter is embedded in an
564 application bundle, it gets executed by a bootstrapping script
565 that does os.execve() with an argv[0] that's different from the
566 actual Python executable. This is needed to keep the Finder happy,
567 or rather, to work around Apple's overly strict requirements of
568 the process name. However, we still need a usable sys.executable,
569 so the actual executable path is passed in an environment variable.
570 See Lib/plat-mac/bundlebuiler.py for details about the bootstrap
571 script. */
572 if ((p = Py_GETENV("PYTHONEXECUTABLE")) && *p != '\0') {
573 wchar_t* buffer;
574 size_t len = strlen(p);
575 size_t r;
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000576
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000577 buffer = malloc(len * sizeof(wchar_t));
578 if (buffer == NULL) {
579 Py_FatalError(
580 "not enough memory to copy PYTHONEXECUTABLE");
581 }
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000582
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000583 r = mbstowcs(buffer, p, len);
584 Py_SetProgramName(buffer);
585 /* buffer is now handed off - do not free */
586 } else {
587 Py_SetProgramName(argv[0]);
588 }
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000589#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000590 Py_SetProgramName(argv[0]);
Jack Jansenfbd861b2003-03-05 16:00:15 +0000591#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000592 Py_Initialize();
Guido van Rossumed52aac1997-07-19 19:20:32 +0000593
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000594 if (Py_VerboseFlag ||
595 (command == NULL && filename == NULL && module == NULL && stdin_is_interactive)) {
596 fprintf(stderr, "Python %s on %s\n",
597 Py_GetVersion(), Py_GetPlatform());
598 if (!Py_NoSiteFlag)
599 fprintf(stderr, "%s\n", COPYRIGHT);
600 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000601
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000602 if (command != NULL) {
603 /* Backup _PyOS_optind and force sys.argv[0] = '-c' */
604 _PyOS_optind--;
605 argv[_PyOS_optind] = L"-c";
606 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000607
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000608 if (module != NULL) {
Nick Coghland26c18a2010-08-17 13:06:11 +0000609 /* Backup _PyOS_optind and force sys.argv[0] = '-m'*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000610 _PyOS_optind--;
Nick Coghland26c18a2010-08-17 13:06:11 +0000611 argv[_PyOS_optind] = L"-m";
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000612 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000613
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000614 PySys_SetArgv(argc-_PyOS_optind, argv+_PyOS_optind);
Guido van Rossum667d7041995-08-04 04:20:48 +0000615
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000616 if ((Py_InspectFlag || (command == NULL && filename == NULL && module == NULL)) &&
617 isatty(fileno(stdin))) {
618 PyObject *v;
619 v = PyImport_ImportModule("readline");
620 if (v == NULL)
621 PyErr_Clear();
622 else
623 Py_DECREF(v);
624 }
Guido van Rossum3d26cc91997-09-16 16:11:28 +0000625
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000626 if (command) {
Victor Stinnera62207c2010-08-07 10:57:17 +0000627 sts = run_command(command, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000628 free(command);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000629 } else if (module) {
630 sts = RunModule(module, 1);
631 }
632 else {
Christian Heimes9cd17752007-11-18 19:35:23 +0000633
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000634 if (filename == NULL && stdin_is_interactive) {
635 Py_InspectFlag = 0; /* do exit on SystemExit */
636 RunStartupFile(&cf);
637 }
638 /* XXX */
Christian Heimes9cd17752007-11-18 19:35:23 +0000639
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000640 sts = -1; /* keep track of whether we've already run __main__ */
Christian Heimes9cd17752007-11-18 19:35:23 +0000641
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000642 if (filename != NULL) {
643 sts = RunMainFromImporter(filename);
644 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000645
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000646 if (sts==-1 && filename!=NULL) {
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000647 if ((fp = _Py_wfopen(filename, L"r")) == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000648 char cfilename[PATH_MAX];
649 size_t r = wcstombs(cfilename, filename, PATH_MAX);
650 if (r == PATH_MAX)
651 /* cfilename is not null-terminated;
652 * forcefully null-terminating it
653 * might break the shift state */
654 strcpy(cfilename, "<file name too long>");
655 if (r == ((size_t)-1))
656 strcpy(cfilename, "<unprintable file name>");
657 fprintf(stderr, "%ls: can't open file '%s': [Errno %d] %s\n",
658 argv[0], cfilename, errno, strerror(errno));
Christian Heimesada8c3b2008-03-18 18:26:33 +0000659
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000660 return 2;
661 }
662 else if (skipfirstline) {
663 int ch;
664 /* Push back first newline so line numbers
665 remain the same */
666 while ((ch = getc(fp)) != EOF) {
667 if (ch == '\n') {
668 (void)ungetc(ch, fp);
669 break;
670 }
671 }
672 }
673 {
674 /* XXX: does this work on Win/Win64? (see posix_fstat) */
675 struct stat sb;
676 if (fstat(fileno(fp), &sb) == 0 &&
677 S_ISDIR(sb.st_mode)) {
678 fprintf(stderr, "%ls: '%ls' is a directory, cannot continue\n", argv[0], filename);
679 fclose(fp);
680 return 1;
681 }
682 }
683 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000684
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000685 if (sts == -1)
686 sts = run_file(fp, filename, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000687 }
Barry Warsawd86dcd32003-06-29 17:07:06 +0000688
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000689 /* Check this environment variable at the end, to give programs the
690 * opportunity to set it from Python.
691 */
692 if (!Py_InspectFlag &&
693 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
694 {
695 Py_InspectFlag = 1;
696 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000697
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000698 if (Py_InspectFlag && stdin_is_interactive &&
699 (filename != NULL || command != NULL || module != NULL)) {
700 Py_InspectFlag = 0;
701 /* XXX */
702 sts = PyRun_AnyFileFlags(stdin, "<stdin>", &cf) != 0;
703 }
704
705 Py_Finalize();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000706
707#ifdef __INSURE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000708 /* Insure++ is a memory analysis tool that aids in discovering
709 * memory leaks and other memory problems. On Python exit, the
710 * interned string dictionaries are flagged as being in use at exit
711 * (which it is). Under normal circumstances, this is fine because
712 * the memory will be automatically reclaimed by the system. Under
713 * memory debugging, it's a huge source of useless noise, so we
714 * trade off slower shutdown for less distraction in the memory
715 * reports. -baw
716 */
717 _Py_ReleaseInternedStrings();
718 _Py_ReleaseInternedUnicodeStrings();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000719#endif /* __INSURE__ */
720
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000721 return sts;
Guido van Rossum667d7041995-08-04 04:20:48 +0000722}
723
Skip Montanaro786ea6b2004-03-01 15:44:05 +0000724/* this is gonna seem *real weird*, but if you put some other code between
725 Py_Main() and Py_GetArgcArgv() you will need to adjust the test in the
726 while statement in Misc/gdbinit:ppystack */
Guido van Rossum667d7041995-08-04 04:20:48 +0000727
Guido van Rossum667d7041995-08-04 04:20:48 +0000728/* Make the *original* argc/argv available to other modules.
729 This is rare, but it is needed by the secureware extension. */
730
731void
Martin v. Löwis790465f2008-04-05 20:41:37 +0000732Py_GetArgcArgv(int *argc, wchar_t ***argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000733{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000734 *argc = orig_argc;
735 *argv = orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000736}
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000737
Ronald Oussorend61deca2010-04-18 14:46:12 +0000738
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000739/* Encode a (wide) character string to the locale encoding with the
740 surrogateescape error handler (characters in range U+DC80..U+DCFF are
741 converted to bytes 0x80..0xFF).
742
743 This function is the reverse of _Py_char2wchar().
744
745 Return a pointer to a newly allocated byte string (use PyMem_Free() to free
746 the memory), or NULL on error (conversion error or memory error). */
747char*
748_Py_wchar2char(const wchar_t *text)
749{
750 const size_t len = wcslen(text);
751 char *result = NULL, *bytes = NULL;
752 size_t i, size, converted;
753 wchar_t c, buf[2];
754
755 /* The function works in two steps:
756 1. compute the length of the output buffer in bytes (size)
757 2. outputs the bytes */
758 size = 0;
759 buf[1] = 0;
760 while (1) {
761 for (i=0; i < len; i++) {
762 c = text[i];
763 if (c >= 0xdc80 && c <= 0xdcff) {
764 /* UTF-8b surrogate */
765 if (bytes != NULL) {
766 *bytes++ = c - 0xdc00;
767 size--;
768 }
769 else
770 size++;
771 continue;
772 }
773 else {
774 buf[0] = c;
775 if (bytes != NULL)
776 converted = wcstombs(bytes, buf, size);
777 else
778 converted = wcstombs(NULL, buf, 0);
779 if (converted == (size_t)-1) {
780 if (result != NULL)
781 PyMem_Free(result);
782 return NULL;
783 }
784 if (bytes != NULL) {
785 bytes += converted;
786 size -= converted;
787 }
788 else
789 size += converted;
790 }
791 }
792 if (result != NULL) {
793 *bytes = 0;
794 break;
795 }
796
797 size += 1; /* nul byte at the end */
798 result = PyMem_Malloc(size);
799 if (result == NULL)
800 return NULL;
801 bytes = result;
802 }
803 return result;
804}
805
806
807/* Decode a byte string from the locale encoding with the
808 surrogateescape error handler (undecodable bytes are decoded as characters
809 in range U+DC80..U+DCFF). If a byte sequence can be decoded as a surrogate
810 character, escape the bytes using the surrogateescape error handler instead
811 of decoding them.
812
813 Use _Py_wchar2char() to encode the character string back to a byte string.
814
815 Return a pointer to a newly allocated (wide) character string (use
816 PyMem_Free() to free the memory), or NULL on error (conversion error or
817 memory error). */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000818wchar_t*
819_Py_char2wchar(char* arg)
820{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000821 wchar_t *res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000822#ifdef HAVE_BROKEN_MBSTOWCS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000823 /* Some platforms have a broken implementation of
824 * mbstowcs which does not count the characters that
825 * would result from conversion. Use an upper bound.
826 */
827 size_t argsize = strlen(arg);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000828#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000829 size_t argsize = mbstowcs(NULL, arg, 0);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000830#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000831 size_t count;
832 unsigned char *in;
833 wchar_t *out;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000834#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000835 mbstate_t mbs;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000836#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000837 if (argsize != (size_t)-1) {
838 res = (wchar_t *)PyMem_Malloc((argsize+1)*sizeof(wchar_t));
839 if (!res)
840 goto oom;
841 count = mbstowcs(res, arg, argsize+1);
842 if (count != (size_t)-1) {
843 wchar_t *tmp;
844 /* Only use the result if it contains no
845 surrogate characters. */
846 for (tmp = res; *tmp != 0 &&
847 (*tmp < 0xd800 || *tmp > 0xdfff); tmp++)
848 ;
849 if (*tmp == 0)
850 return res;
851 }
852 PyMem_Free(res);
853 }
854 /* Conversion failed. Fall back to escaping with surrogateescape. */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000855#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000856 /* Try conversion with mbrtwoc (C99), and escape non-decodable bytes. */
857
858 /* Overallocate; as multi-byte characters are in the argument, the
859 actual output could use less memory. */
860 argsize = strlen(arg) + 1;
861 res = (wchar_t*)PyMem_Malloc(argsize*sizeof(wchar_t));
862 if (!res) goto oom;
863 in = (unsigned char*)arg;
864 out = res;
865 memset(&mbs, 0, sizeof mbs);
866 while (argsize) {
867 size_t converted = mbrtowc(out, (char*)in, argsize, &mbs);
868 if (converted == 0)
869 /* Reached end of string; null char stored. */
870 break;
871 if (converted == (size_t)-2) {
872 /* Incomplete character. This should never happen,
873 since we provide everything that we have -
874 unless there is a bug in the C library, or I
875 misunderstood how mbrtowc works. */
876 fprintf(stderr, "unexpected mbrtowc result -2\n");
877 return NULL;
878 }
879 if (converted == (size_t)-1) {
880 /* Conversion error. Escape as UTF-8b, and start over
881 in the initial shift state. */
882 *out++ = 0xdc00 + *in++;
883 argsize--;
884 memset(&mbs, 0, sizeof mbs);
885 continue;
886 }
887 if (*out >= 0xd800 && *out <= 0xdfff) {
888 /* Surrogate character. Escape the original
889 byte sequence with surrogateescape. */
890 argsize -= converted;
891 while (converted--)
892 *out++ = 0xdc00 + *in++;
893 continue;
894 }
895 /* successfully converted some bytes */
896 in += converted;
897 argsize -= converted;
898 out++;
899 }
Ronald Oussorend61deca2010-04-18 14:46:12 +0000900#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000901 /* Cannot use C locale for escaping; manually escape as if charset
902 is ASCII (i.e. escape all bytes > 128. This will still roundtrip
903 correctly in the locale's charset, which must be an ASCII superset. */
904 res = PyMem_Malloc((strlen(arg)+1)*sizeof(wchar_t));
905 if (!res) goto oom;
906 in = (unsigned char*)arg;
907 out = res;
908 while(*in)
909 if(*in < 128)
910 *out++ = *in++;
911 else
912 *out++ = 0xdc00 + *in++;
913 *out = 0;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000914#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000915 return res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000916oom:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000917 fprintf(stderr, "out of memory\n");
918 return NULL;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000919}
920
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000921#ifdef __cplusplus
922}
923#endif