blob: d129aba074c62574c5b45244588dce6f863f9c73 [file] [log] [blame]
Guido van Rossum667d7041995-08-04 04:20:48 +00001/* Python interpreter main program */
2
3#include "Python.h"
Guido van Rossuma075ce11997-12-05 21:56:45 +00004#include "osdefs.h"
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +00005#include "import.h"
Guido van Rossum667d7041995-08-04 04:20:48 +00006
Antoine Pitrou5651eaa2008-09-06 20:46:58 +00007#include <locale.h>
8
Martin v. Löwis79acb9e2002-12-06 12:48:53 +00009#ifdef __VMS
Martin v. Löwis7a924e62003-03-05 14:15:21 +000010#include <unixlib.h>
Martin v. Löwis79acb9e2002-12-06 12:48:53 +000011#endif
12
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +000013#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Martin v. Löwis945362c2007-08-30 14:57:25 +000014#include <windows.h>
Thomas Wouters477c8d52006-05-27 19:21:47 +000015#ifdef HAVE_FCNTL_H
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000016#include <fcntl.h>
Martin v. Löwis790465f2008-04-05 20:41:37 +000017#define PATH_MAX MAXPATHLEN
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000018#endif
Thomas Wouters477c8d52006-05-27 19:21:47 +000019#endif
Guido van Rossum3e7ae7a1997-01-17 22:05:38 +000020
Martin v. Löwis945362c2007-08-30 14:57:25 +000021#ifdef _MSC_VER
22#include <crtdbg.h>
23#endif
24
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000025#if (defined(PYOS_OS2) && !defined(PYCC_GCC)) || defined(MS_WINDOWS)
Guido van Rossuma075ce11997-12-05 21:56:45 +000026#define PYTHONHOMEHELP "<prefix>\\lib"
27#else
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000028#if defined(PYOS_OS2) && defined(PYCC_GCC)
29#define PYTHONHOMEHELP "<prefix>/Lib"
30#else
Marc-André Lemburgda4dbc32001-06-12 16:13:51 +000031#define PYTHONHOMEHELP "<prefix>/pythonX.X"
Guido van Rossuma075ce11997-12-05 21:56:45 +000032#endif
Andrew MacIntyre7bf68332002-03-03 02:59:16 +000033#endif
Guido van Rossuma075ce11997-12-05 21:56:45 +000034
Thomas Wouters2cffc7d2000-11-03 08:18:37 +000035#include "pygetopt.h"
36
Guido van Rossuma22865e2000-09-05 04:41:18 +000037#define COPYRIGHT \
Guido van Rossum36002d72001-07-18 16:59:46 +000038 "Type \"help\", \"copyright\", \"credits\" or \"license\" " \
39 "for more information."
Guido van Rossuma22865e2000-09-05 04:41:18 +000040
Thomas Wouters49fd7fa2006-04-21 10:40:58 +000041#ifdef __cplusplus
42extern "C" {
43#endif
44
Guido van Rossumac56b031996-07-21 02:33:38 +000045/* For Py_GetArgcArgv(); set by main() */
Martin v. Löwis790465f2008-04-05 20:41:37 +000046static wchar_t **orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +000047static int orig_argc;
48
Guido van Rossumbceccf52001-04-10 22:07:43 +000049/* command line options */
Christian Heimes8dc226f2008-05-06 23:45:46 +000050#define BASE_OPTS L"bBc:dEhiJm:OsStuvVW:xX?"
Guido van Rossumbceccf52001-04-10 22:07:43 +000051
Guido van Rossumbceccf52001-04-10 22:07:43 +000052#define PROGRAM_OPTS BASE_OPTS
Guido van Rossum3ed4c152001-03-02 06:18:03 +000053
Guido van Rossum667d7041995-08-04 04:20:48 +000054/* Short usage message (with %s for argv0) */
55static char *usage_line =
Martin v. Löwis790465f2008-04-05 20:41:37 +000056"usage: %ls [option] ... [-c cmd | -m mod | file | -] [arg] ...\n";
Guido van Rossum667d7041995-08-04 04:20:48 +000057
58/* Long usage message, split into parts < 512 bytes */
Guido van Rossum393661d2001-08-31 17:40:15 +000059static char *usage_1 = "\
Guido van Rossum667d7041995-08-04 04:20:48 +000060Options and arguments (and corresponding environment variables):\n\
Christian Heimes2ab34442008-09-03 20:31:07 +000061-b : issue warnings about str(bytes_instance), str(bytearray_instance)\n\
62 and comparing bytes/bytearray with str. (-bb: issue errors)\n\
Christian Heimes790c8232008-01-07 21:14:23 +000063-B : don't write .py[co] files on import; also PYTHONDONTWRITEBYTECODE=x\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000064-c cmd : program passed in as string (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000065-d : debug output from parser; also PYTHONDEBUG=x\n\
Christian Heimes790c8232008-01-07 21:14:23 +000066-E : ignore PYTHON* environment variables (such as PYTHONPATH)\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000067-h : print this help message and exit (also --help)\n\
Guido van Rossum61c345f2001-09-04 03:26:15 +000068";
69static char *usage_2 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000070-i : inspect interactively after running script; forces a prompt even\n\
71 if stdin does not appear to be a terminal; also PYTHONINSPECT=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000072-m mod : run library module as a script (terminates option list)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000073-O : optimize generated bytecode slightly; also PYTHONOPTIMIZE=x\n\
Guido van Rossum6b86a421999-01-28 15:07:47 +000074-OO : remove doc-strings in addition to the -O optimizations\n\
Christian Heimes8dc226f2008-05-06 23:45:46 +000075-s : don't add user site directory to sys.path; also PYTHONNOUSERSITE\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000076-S : don't imply 'import site' on initialization\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000077";
78static char *usage_3 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000079-u : unbuffered binary stdout and stderr; also PYTHONUNBUFFERED=x\n\
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +000080 see man page for details on internal buffering relating to '-u'\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000081-v : verbose (trace import statements); also PYTHONVERBOSE=x\n\
82 can be supplied multiple times to increase verbosity\n\
Thomas Wouters0e3f5912006-08-11 14:57:12 +000083-V : print the Python version number and exit (also --version)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000084-W arg : warning control; arg is action:message:category:module:lineno\n\
Philip Jenvey0805ca32010-04-07 04:04:10 +000085 also PYTHONWARNINGS=arg\n\
Guido van Rossum393661d2001-08-31 17:40:15 +000086-x : skip first line of source, allowing use of non-Unix forms of #!cmd\n\
Guido van Rossum7922bd71997-08-29 22:34:47 +000087";
Guido van Rossum393661d2001-08-31 17:40:15 +000088static char *usage_4 = "\
Guido van Rossum98297ee2007-11-06 21:34:58 +000089file : program read from script file\n\
90- : program read from stdin (default; interactive mode if a tty)\n\
Thomas Wouters89f507f2006-12-13 04:49:30 +000091arg ...: arguments passed to program in sys.argv[1:]\n\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000092Other environment variables:\n\
93PYTHONSTARTUP: file executed on interactive startup (no default)\n\
Guido van Rossuma075ce11997-12-05 21:56:45 +000094PYTHONPATH : '%c'-separated list of directories prefixed to the\n\
Guido van Rossum667d7041995-08-04 04:20:48 +000095 default module search path. The result is sys.path.\n\
Christian Heimes790c8232008-01-07 21:14:23 +000096";
97static char *usage_5 = "\
Guido van Rossuma075ce11997-12-05 21:56:45 +000098PYTHONHOME : alternate <prefix> directory (or <prefix>%c<exec_prefix>).\n\
99 The default module search path uses %s.\n\
Tim Peters793de092001-02-22 00:39:47 +0000100PYTHONCASEOK : ignore case in 'import' statements (Windows).\n\
Martin v. Löwis0f599892008-06-02 11:13:03 +0000101PYTHONIOENCODING: Encoding[:errors] used for stdin/stdout/stderr.\n\
Victor Stinner94908bb2010-08-18 21:23:25 +0000102PYTHONFSENCODING: Encoding used for the filesystem.\n\
Guido van Rossum667d7041995-08-04 04:20:48 +0000103";
104
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000105FILE *
106_Py_wfopen(const wchar_t *path, const wchar_t *mode)
Martin v. Löwis790465f2008-04-05 20:41:37 +0000107{
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000108#ifndef MS_WINDOWS
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000109 FILE *f;
110 char *cpath;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000111 char cmode[10];
112 size_t r;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000113 r = wcstombs(cmode, mode, 10);
114 if (r == (size_t)-1 || r >= 10) {
115 errno = EINVAL;
116 return NULL;
117 }
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000118 cpath = _Py_wchar2char(path);
119 if (cpath == NULL)
120 return NULL;
121 f = fopen(cpath, cmode);
122 PyMem_Free(cpath);
123 return f;
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000124#else
125 return _wfopen(path, mode);
Martin v. Löwis790465f2008-04-05 20:41:37 +0000126#endif
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000127}
Martin v. Löwis790465f2008-04-05 20:41:37 +0000128
Guido van Rossum667d7041995-08-04 04:20:48 +0000129
Martin v. Löwis852ba7e2003-03-30 17:09:58 +0000130static int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000131usage(int exitcode, wchar_t* program)
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000132{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000133 FILE *f = exitcode ? stderr : stdout;
Guido van Rossum393661d2001-08-31 17:40:15 +0000134
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000135 fprintf(f, usage_line, program);
136 if (exitcode)
137 fprintf(f, "Try `python -h' for more information.\n");
138 else {
139 fputs(usage_1, f);
140 fputs(usage_2, f);
141 fputs(usage_3, f);
142 fprintf(f, usage_4, DELIM);
143 fprintf(f, usage_5, DELIM, PYTHONHOMEHELP);
144 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000145#if defined(__VMS)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000146 if (exitcode == 0) {
147 /* suppress 'error' message */
148 return 1;
149 }
150 else {
151 /* STS$M_INHIB_MSG + SS$_ABORT */
152 return 0x1000002c;
153 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000154#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000155 return exitcode;
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000156#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000157 /*NOTREACHED*/
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000158}
159
Martin v. Löwis6caea372003-11-18 19:46:25 +0000160static void RunStartupFile(PyCompilerFlags *cf)
161{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000162 char *startup = Py_GETENV("PYTHONSTARTUP");
163 if (startup != NULL && startup[0] != '\0') {
164 FILE *fp = fopen(startup, "r");
165 if (fp != NULL) {
166 (void) PyRun_SimpleFileExFlags(fp, startup, 0, cf);
167 PyErr_Clear();
168 fclose(fp);
169 } else {
170 int save_errno;
171
172 save_errno = errno;
173 PySys_WriteStderr("Could not open PYTHONSTARTUP\n");
174 errno = save_errno;
175 PyErr_SetFromErrnoWithFilename(PyExc_IOError,
176 startup);
177 PyErr_Print();
178 PyErr_Clear();
179 }
180 }
Martin v. Löwis6caea372003-11-18 19:46:25 +0000181}
182
Thomas Woutersa9773292006-04-21 09:43:23 +0000183
Antoine Pitrou5651eaa2008-09-06 20:46:58 +0000184static int RunModule(wchar_t *modname, int set_argv0)
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000185{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000186 PyObject *module, *runpy, *runmodule, *runargs, *result;
187 runpy = PyImport_ImportModule("runpy");
188 if (runpy == NULL) {
189 fprintf(stderr, "Could not import runpy module\n");
190 return -1;
191 }
192 runmodule = PyObject_GetAttrString(runpy, "_run_module_as_main");
193 if (runmodule == NULL) {
194 fprintf(stderr, "Could not access runpy._run_module_as_main\n");
195 Py_DECREF(runpy);
196 return -1;
197 }
198 module = PyUnicode_FromWideChar(modname, wcslen(modname));
199 if (module == NULL) {
200 fprintf(stderr, "Could not convert module name to unicode\n");
201 Py_DECREF(runpy);
202 Py_DECREF(runmodule);
203 return -1;
204 }
205 runargs = Py_BuildValue("(Oi)", module, set_argv0);
206 if (runargs == NULL) {
207 fprintf(stderr,
208 "Could not create arguments for runpy._run_module_as_main\n");
209 Py_DECREF(runpy);
210 Py_DECREF(runmodule);
211 Py_DECREF(module);
212 return -1;
213 }
214 result = PyObject_Call(runmodule, runargs, NULL);
215 if (result == NULL) {
216 PyErr_Print();
217 }
218 Py_DECREF(runpy);
219 Py_DECREF(runmodule);
220 Py_DECREF(module);
221 Py_DECREF(runargs);
222 if (result == NULL) {
223 return -1;
224 }
225 Py_DECREF(result);
226 return 0;
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000227}
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000228
Martin v. Löwis790465f2008-04-05 20:41:37 +0000229static int RunMainFromImporter(wchar_t *filename)
Christian Heimes9cd17752007-11-18 19:35:23 +0000230{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000231 PyObject *argv0 = NULL, *importer = NULL;
Christian Heimes9cd17752007-11-18 19:35:23 +0000232
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000233 if ((argv0 = PyUnicode_FromWideChar(filename,wcslen(filename))) &&
234 (importer = PyImport_GetImporter(argv0)) &&
235 (importer->ob_type != &PyNullImporter_Type))
236 {
237 /* argv0 is usable as an import source, so
238 put it in sys.path[0] and import __main__ */
239 PyObject *sys_path = NULL;
240 if ((sys_path = PySys_GetObject("path")) &&
241 !PyList_SetItem(sys_path, 0, argv0))
242 {
243 Py_INCREF(argv0);
244 Py_DECREF(importer);
245 sys_path = NULL;
246 return RunModule(L"__main__", 0) != 0;
Guido van Rossum74c29c72007-11-19 18:36:41 +0000247 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000248 }
249 Py_XDECREF(argv0);
250 Py_XDECREF(importer);
251 if (PyErr_Occurred()) {
252 PyErr_Print();
253 return 1;
254 }
255 else {
256 return -1;
257 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000258}
259
Victor Stinnera62207c2010-08-07 10:57:17 +0000260static int
261run_command(wchar_t *command, PyCompilerFlags *cf)
262{
263 PyObject *unicode, *bytes;
264 int ret;
265
266 unicode = PyUnicode_FromWideChar(command, -1);
267 if (unicode == NULL)
268 goto error;
269 bytes = PyUnicode_AsUTF8String(unicode);
270 Py_DECREF(unicode);
271 if (bytes == NULL)
272 goto error;
273 ret = PyRun_SimpleStringFlags(PyBytes_AsString(bytes), cf);
274 Py_DECREF(bytes);
275 return ret != 0;
276
277error:
278 PyErr_Print();
279 return 1;
280}
281
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000282static int
283run_file(FILE *fp, const wchar_t *filename, PyCompilerFlags *p_cf)
284{
285 PyObject *unicode, *bytes = NULL;
286 char *filename_str;
287 int run;
288
289 /* call pending calls like signal handlers (SIGINT) */
290 if (Py_MakePendingCalls() == -1) {
291 PyErr_Print();
292 return 1;
293 }
294
295 if (filename) {
296 unicode = PyUnicode_FromWideChar(filename, wcslen(filename));
297 if (unicode != NULL) {
298 bytes = PyUnicode_AsUTF8String(unicode);
299 Py_DECREF(unicode);
300 }
301 if (bytes != NULL)
302 filename_str = PyBytes_AsString(bytes);
303 else {
304 PyErr_Clear();
305 filename_str = "<decoding error>";
306 }
307 }
308 else
309 filename_str = "<stdin>";
310
311 run = PyRun_AnyFileExFlags(fp, filename_str, filename != NULL, p_cf);
312 Py_XDECREF(bytes);
313 return run != 0;
314}
315
Christian Heimes9cd17752007-11-18 19:35:23 +0000316
Guido van Rossum667d7041995-08-04 04:20:48 +0000317/* Main program */
318
Mark Hammondfe51c6d2002-08-02 02:27:13 +0000319int
Martin v. Löwis790465f2008-04-05 20:41:37 +0000320Py_Main(int argc, wchar_t **argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000321{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000322 int c;
323 int sts;
324 wchar_t *command = NULL;
325 wchar_t *filename = NULL;
326 wchar_t *module = NULL;
327 FILE *fp = stdin;
328 char *p;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000329#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000330 wchar_t *wp;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000331#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000332 int skipfirstline = 0;
333 int stdin_is_interactive = 0;
334 int help = 0;
335 int version = 0;
336 int saw_unbuffered_flag = 0;
337 PyCompilerFlags cf;
Guido van Rossum667d7041995-08-04 04:20:48 +0000338
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000339 cf.cf_flags = 0;
Guido van Rossum393661d2001-08-31 17:40:15 +0000340
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000341 orig_argc = argc; /* For Py_GetArgcArgv() */
342 orig_argv = argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000343
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000344 PySys_ResetWarnOptions();
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000345
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000346 while ((c = _PyOS_GetOpt(argc, argv, PROGRAM_OPTS)) != EOF) {
347 if (c == 'c') {
348 size_t len;
349 /* -c is the last option; following arguments
350 that look like options are left for the
351 command to interpret. */
Amaury Forgeot d'Arc9a5499b2008-11-11 23:04:59 +0000352
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000353 len = wcslen(_PyOS_optarg) + 1 + 1;
354 command = (wchar_t *)malloc(sizeof(wchar_t) * len);
355 if (command == NULL)
356 Py_FatalError(
357 "not enough memory to copy -c argument");
358 wcscpy(command, _PyOS_optarg);
359 command[len - 2] = '\n';
360 command[len - 1] = 0;
361 break;
362 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000363
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000364 if (c == 'm') {
365 /* -m is the last option; following arguments
366 that look like options are left for the
367 module to interpret. */
368 module = _PyOS_optarg;
369 break;
370 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000371
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000372 switch (c) {
373 case 'b':
374 Py_BytesWarningFlag++;
375 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000376
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000377 case 'd':
378 Py_DebugFlag++;
379 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000380
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000381 case 'i':
382 Py_InspectFlag++;
383 Py_InteractiveFlag++;
384 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000385
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000386 /* case 'J': reserved for Jython */
Christian Heimes33fe8092008-04-13 13:53:33 +0000387
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000388 case 'O':
389 Py_OptimizeFlag++;
390 break;
Guido van Rossum7614da61997-03-03 19:14:45 +0000391
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000392 case 'B':
393 Py_DontWriteBytecodeFlag++;
394 break;
Christian Heimes790c8232008-01-07 21:14:23 +0000395
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000396 case 's':
397 Py_NoUserSiteDirectory++;
398 break;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000399
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000400 case 'S':
401 Py_NoSiteFlag++;
402 break;
Guido van Rossum7922bd71997-08-29 22:34:47 +0000403
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000404 case 'E':
405 Py_IgnoreEnvironmentFlag++;
406 break;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000407
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000408 case 't':
409 /* ignored for backwards compatibility */
410 break;
Guido van Rossumbba92ca1998-04-10 19:39:15 +0000411
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000412 case 'u':
413 Py_UnbufferedStdioFlag = 1;
414 saw_unbuffered_flag = 1;
415 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000416
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000417 case 'v':
418 Py_VerboseFlag++;
419 break;
Guido van Rossum667d7041995-08-04 04:20:48 +0000420
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000421 case 'x':
422 skipfirstline = 1;
423 break;
Guido van Rossuma075ce11997-12-05 21:56:45 +0000424
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000425 /* case 'X': reserved for implementation-specific arguments */
Christian Heimes33fe8092008-04-13 13:53:33 +0000426
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000427 case 'h':
428 case '?':
429 help++;
430 break;
Guido van Rossum45aecf42006-03-15 04:58:47 +0000431
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000432 case 'V':
433 version++;
434 break;
Guido van Rossumc15a9a12000-05-01 17:54:33 +0000435
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000436 case 'W':
437 PySys_AddWarnOption(_PyOS_optarg);
438 break;
Guido van Rossum47f5fdc2000-12-15 22:00:54 +0000439
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000440 /* This space reserved for other options */
Guido van Rossum667d7041995-08-04 04:20:48 +0000441
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000442 default:
443 return usage(2, argv[0]);
444 /*NOTREACHED*/
Guido van Rossum667d7041995-08-04 04:20:48 +0000445
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000446 }
447 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000448
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000449 if (help)
450 return usage(0, argv[0]);
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000451
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000452 if (version) {
453 fprintf(stderr, "Python %s\n", PY_VERSION);
454 return 0;
455 }
Barry Warsaw3b2aedb2000-09-15 18:40:42 +0000456
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000457 if (!Py_InspectFlag &&
458 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
459 Py_InspectFlag = 1;
460 if (!saw_unbuffered_flag &&
461 (p = Py_GETENV("PYTHONUNBUFFERED")) && *p != '\0')
462 Py_UnbufferedStdioFlag = 1;
Neil Schemenauer7d4bb9f2001-07-23 16:30:27 +0000463
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000464 if (!Py_NoUserSiteDirectory &&
465 (p = Py_GETENV("PYTHONNOUSERSITE")) && *p != '\0')
466 Py_NoUserSiteDirectory = 1;
Christian Heimes8dc226f2008-05-06 23:45:46 +0000467
Philip Jenveye53de3d2010-04-14 03:01:39 +0000468#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000469 if (!Py_IgnoreEnvironmentFlag && (wp = _wgetenv(L"PYTHONWARNINGS")) &&
470 *wp != L'\0') {
471 wchar_t *buf, *warning;
Philip Jenvey0805ca32010-04-07 04:04:10 +0000472
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000473 buf = (wchar_t *)malloc((wcslen(wp) + 1) * sizeof(wchar_t));
474 if (buf == NULL)
475 Py_FatalError(
476 "not enough memory to copy PYTHONWARNINGS");
477 wcscpy(buf, wp);
478 for (warning = wcstok(buf, L",");
479 warning != NULL;
480 warning = wcstok(NULL, L",")) {
481 PySys_AddWarnOption(warning);
482 }
483 free(buf);
484 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000485#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000486 if ((p = Py_GETENV("PYTHONWARNINGS")) && *p != '\0') {
487 char *buf, *oldloc;
Victor Stinner9ca9c252010-05-19 16:53:30 +0000488 PyObject *warning;
Philip Jenveye53de3d2010-04-14 03:01:39 +0000489
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000490 /* settle for strtok here as there's no one standard
491 C89 wcstok */
492 buf = (char *)malloc(strlen(p) + 1);
493 if (buf == NULL)
494 Py_FatalError(
495 "not enough memory to copy PYTHONWARNINGS");
496 strcpy(buf, p);
497 oldloc = strdup(setlocale(LC_ALL, NULL));
498 setlocale(LC_ALL, "");
499 for (p = strtok(buf, ","); p != NULL; p = strtok(NULL, ",")) {
Victor Stinner9ca9c252010-05-19 16:53:30 +0000500 warning = PyUnicode_DecodeFSDefault(p);
501 if (warning != NULL) {
502 PySys_AddWarnOptionUnicode(warning);
503 Py_DECREF(warning);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000504 }
505 }
506 setlocale(LC_ALL, oldloc);
507 free(oldloc);
508 free(buf);
509 }
Philip Jenveye53de3d2010-04-14 03:01:39 +0000510#endif
Philip Jenvey0805ca32010-04-07 04:04:10 +0000511
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000512 if (command == NULL && module == NULL && _PyOS_optind < argc &&
513 wcscmp(argv[_PyOS_optind], L"-") != 0)
514 {
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000515#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000516 filename = decc$translate_vms(argv[_PyOS_optind]);
517 if (filename == (char *)0 || filename == (char *)-1)
518 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000519
520#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000521 filename = argv[_PyOS_optind];
Martin v. Löwis7a924e62003-03-05 14:15:21 +0000522#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000523 }
Guido van Rossum775af911997-02-14 19:50:32 +0000524
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000525 stdin_is_interactive = Py_FdIsInteractive(stdin, (char *)0);
Guido van Rossum775af911997-02-14 19:50:32 +0000526
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000527 if (Py_UnbufferedStdioFlag) {
Sjoerd Mullender9cf424b2002-08-09 13:35:18 +0000528#if defined(MS_WINDOWS) || defined(__CYGWIN__)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000529 _setmode(fileno(stdin), O_BINARY);
530 _setmode(fileno(stdout), O_BINARY);
Guido van Rossumf22d7e21997-01-11 19:28:55 +0000531#endif
Guido van Rossum22ffac11998-03-06 15:30:39 +0000532#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000533 setvbuf(stdin, (char *)NULL, _IONBF, BUFSIZ);
534 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
535 setvbuf(stderr, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000536#else /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000537 setbuf(stdin, (char *)NULL);
538 setbuf(stdout, (char *)NULL);
539 setbuf(stderr, (char *)NULL);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000540#endif /* !HAVE_SETVBUF */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000541 }
542 else if (Py_InteractiveFlag) {
Guido van Rossumb31c7dc1997-04-11 22:19:12 +0000543#ifdef MS_WINDOWS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000544 /* Doesn't have to have line-buffered -- use unbuffered */
545 /* Any set[v]buf(stdin, ...) screws up Tkinter :-( */
546 setvbuf(stdout, (char *)NULL, _IONBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000547#else /* !MS_WINDOWS */
548#ifdef HAVE_SETVBUF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000549 setvbuf(stdin, (char *)NULL, _IOLBF, BUFSIZ);
550 setvbuf(stdout, (char *)NULL, _IOLBF, BUFSIZ);
Guido van Rossum22ffac11998-03-06 15:30:39 +0000551#endif /* HAVE_SETVBUF */
552#endif /* !MS_WINDOWS */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000553 /* Leave stderr alone - it should be unbuffered anyway. */
554 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000555#ifdef __VMS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000556 else {
557 setvbuf (stdout, (char *)NULL, _IOLBF, BUFSIZ);
558 }
Martin v. Löwis79acb9e2002-12-06 12:48:53 +0000559#endif /* __VMS */
Guido van Rossum667d7041995-08-04 04:20:48 +0000560
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000561#ifdef __APPLE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000562 /* On MacOS X, when the Python interpreter is embedded in an
563 application bundle, it gets executed by a bootstrapping script
564 that does os.execve() with an argv[0] that's different from the
565 actual Python executable. This is needed to keep the Finder happy,
566 or rather, to work around Apple's overly strict requirements of
567 the process name. However, we still need a usable sys.executable,
568 so the actual executable path is passed in an environment variable.
569 See Lib/plat-mac/bundlebuiler.py for details about the bootstrap
570 script. */
571 if ((p = Py_GETENV("PYTHONEXECUTABLE")) && *p != '\0') {
572 wchar_t* buffer;
573 size_t len = strlen(p);
574 size_t r;
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000575
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000576 buffer = malloc(len * sizeof(wchar_t));
577 if (buffer == NULL) {
578 Py_FatalError(
579 "not enough memory to copy PYTHONEXECUTABLE");
580 }
Ronald Oussoren3e264e12009-02-12 15:55:38 +0000581
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000582 r = mbstowcs(buffer, p, len);
583 Py_SetProgramName(buffer);
584 /* buffer is now handed off - do not free */
585 } else {
586 Py_SetProgramName(argv[0]);
587 }
Just van Rossum2ac79ef2003-03-05 15:46:54 +0000588#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000589 Py_SetProgramName(argv[0]);
Jack Jansenfbd861b2003-03-05 16:00:15 +0000590#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000591 Py_Initialize();
Guido van Rossumed52aac1997-07-19 19:20:32 +0000592
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000593 if (Py_VerboseFlag ||
594 (command == NULL && filename == NULL && module == NULL && stdin_is_interactive)) {
595 fprintf(stderr, "Python %s on %s\n",
596 Py_GetVersion(), Py_GetPlatform());
597 if (!Py_NoSiteFlag)
598 fprintf(stderr, "%s\n", COPYRIGHT);
599 }
Guido van Rossum393661d2001-08-31 17:40:15 +0000600
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000601 if (command != NULL) {
602 /* Backup _PyOS_optind and force sys.argv[0] = '-c' */
603 _PyOS_optind--;
604 argv[_PyOS_optind] = L"-c";
605 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000606
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000607 if (module != NULL) {
Nick Coghland26c18a2010-08-17 13:06:11 +0000608 /* Backup _PyOS_optind and force sys.argv[0] = '-m'*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000609 _PyOS_optind--;
Nick Coghland26c18a2010-08-17 13:06:11 +0000610 argv[_PyOS_optind] = L"-m";
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000611 }
Raymond Hettingerdb29e0f2004-10-07 06:46:25 +0000612
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000613 PySys_SetArgv(argc-_PyOS_optind, argv+_PyOS_optind);
Guido van Rossum667d7041995-08-04 04:20:48 +0000614
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000615 if ((Py_InspectFlag || (command == NULL && filename == NULL && module == NULL)) &&
616 isatty(fileno(stdin))) {
617 PyObject *v;
618 v = PyImport_ImportModule("readline");
619 if (v == NULL)
620 PyErr_Clear();
621 else
622 Py_DECREF(v);
623 }
Guido van Rossum3d26cc91997-09-16 16:11:28 +0000624
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000625 if (command) {
Victor Stinnera62207c2010-08-07 10:57:17 +0000626 sts = run_command(command, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000627 free(command);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000628 } else if (module) {
629 sts = RunModule(module, 1);
630 }
631 else {
Christian Heimes9cd17752007-11-18 19:35:23 +0000632
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000633 if (filename == NULL && stdin_is_interactive) {
634 Py_InspectFlag = 0; /* do exit on SystemExit */
635 RunStartupFile(&cf);
636 }
637 /* XXX */
Christian Heimes9cd17752007-11-18 19:35:23 +0000638
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000639 sts = -1; /* keep track of whether we've already run __main__ */
Christian Heimes9cd17752007-11-18 19:35:23 +0000640
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000641 if (filename != NULL) {
642 sts = RunMainFromImporter(filename);
643 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000644
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000645 if (sts==-1 && filename!=NULL) {
Antoine Pitroue9b428f2010-08-13 22:25:01 +0000646 if ((fp = _Py_wfopen(filename, L"r")) == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000647 char cfilename[PATH_MAX];
648 size_t r = wcstombs(cfilename, filename, PATH_MAX);
649 if (r == PATH_MAX)
650 /* cfilename is not null-terminated;
651 * forcefully null-terminating it
652 * might break the shift state */
653 strcpy(cfilename, "<file name too long>");
654 if (r == ((size_t)-1))
655 strcpy(cfilename, "<unprintable file name>");
656 fprintf(stderr, "%ls: can't open file '%s': [Errno %d] %s\n",
657 argv[0], cfilename, errno, strerror(errno));
Christian Heimesada8c3b2008-03-18 18:26:33 +0000658
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000659 return 2;
660 }
661 else if (skipfirstline) {
662 int ch;
663 /* Push back first newline so line numbers
664 remain the same */
665 while ((ch = getc(fp)) != EOF) {
666 if (ch == '\n') {
667 (void)ungetc(ch, fp);
668 break;
669 }
670 }
671 }
672 {
673 /* XXX: does this work on Win/Win64? (see posix_fstat) */
674 struct stat sb;
675 if (fstat(fileno(fp), &sb) == 0 &&
676 S_ISDIR(sb.st_mode)) {
677 fprintf(stderr, "%ls: '%ls' is a directory, cannot continue\n", argv[0], filename);
678 fclose(fp);
679 return 1;
680 }
681 }
682 }
Christian Heimes9cd17752007-11-18 19:35:23 +0000683
Victor Stinner0a3ddad2010-08-07 16:34:25 +0000684 if (sts == -1)
685 sts = run_file(fp, filename, &cf);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000686 }
Barry Warsawd86dcd32003-06-29 17:07:06 +0000687
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000688 /* Check this environment variable at the end, to give programs the
689 * opportunity to set it from Python.
690 */
691 if (!Py_InspectFlag &&
692 (p = Py_GETENV("PYTHONINSPECT")) && *p != '\0')
693 {
694 Py_InspectFlag = 1;
695 }
Guido van Rossum667d7041995-08-04 04:20:48 +0000696
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000697 if (Py_InspectFlag && stdin_is_interactive &&
698 (filename != NULL || command != NULL || module != NULL)) {
699 Py_InspectFlag = 0;
700 /* XXX */
701 sts = PyRun_AnyFileFlags(stdin, "<stdin>", &cf) != 0;
702 }
703
704 Py_Finalize();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000705
706#ifdef __INSURE__
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000707 /* Insure++ is a memory analysis tool that aids in discovering
708 * memory leaks and other memory problems. On Python exit, the
709 * interned string dictionaries are flagged as being in use at exit
710 * (which it is). Under normal circumstances, this is fine because
711 * the memory will be automatically reclaimed by the system. Under
712 * memory debugging, it's a huge source of useless noise, so we
713 * trade off slower shutdown for less distraction in the memory
714 * reports. -baw
715 */
716 _Py_ReleaseInternedStrings();
717 _Py_ReleaseInternedUnicodeStrings();
Barry Warsaw3e13b1e2001-02-23 16:46:39 +0000718#endif /* __INSURE__ */
719
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000720 return sts;
Guido van Rossum667d7041995-08-04 04:20:48 +0000721}
722
Skip Montanaro786ea6b2004-03-01 15:44:05 +0000723/* this is gonna seem *real weird*, but if you put some other code between
724 Py_Main() and Py_GetArgcArgv() you will need to adjust the test in the
725 while statement in Misc/gdbinit:ppystack */
Guido van Rossum667d7041995-08-04 04:20:48 +0000726
Guido van Rossum667d7041995-08-04 04:20:48 +0000727/* Make the *original* argc/argv available to other modules.
728 This is rare, but it is needed by the secureware extension. */
729
730void
Martin v. Löwis790465f2008-04-05 20:41:37 +0000731Py_GetArgcArgv(int *argc, wchar_t ***argv)
Guido van Rossum667d7041995-08-04 04:20:48 +0000732{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000733 *argc = orig_argc;
734 *argv = orig_argv;
Guido van Rossum667d7041995-08-04 04:20:48 +0000735}
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000736
Ronald Oussorend61deca2010-04-18 14:46:12 +0000737
Victor Stinnerf2e08b32010-08-13 23:29:08 +0000738/* Encode a (wide) character string to the locale encoding with the
739 surrogateescape error handler (characters in range U+DC80..U+DCFF are
740 converted to bytes 0x80..0xFF).
741
742 This function is the reverse of _Py_char2wchar().
743
744 Return a pointer to a newly allocated byte string (use PyMem_Free() to free
745 the memory), or NULL on error (conversion error or memory error). */
746char*
747_Py_wchar2char(const wchar_t *text)
748{
749 const size_t len = wcslen(text);
750 char *result = NULL, *bytes = NULL;
751 size_t i, size, converted;
752 wchar_t c, buf[2];
753
754 /* The function works in two steps:
755 1. compute the length of the output buffer in bytes (size)
756 2. outputs the bytes */
757 size = 0;
758 buf[1] = 0;
759 while (1) {
760 for (i=0; i < len; i++) {
761 c = text[i];
762 if (c >= 0xdc80 && c <= 0xdcff) {
763 /* UTF-8b surrogate */
764 if (bytes != NULL) {
765 *bytes++ = c - 0xdc00;
766 size--;
767 }
768 else
769 size++;
770 continue;
771 }
772 else {
773 buf[0] = c;
774 if (bytes != NULL)
775 converted = wcstombs(bytes, buf, size);
776 else
777 converted = wcstombs(NULL, buf, 0);
778 if (converted == (size_t)-1) {
779 if (result != NULL)
780 PyMem_Free(result);
781 return NULL;
782 }
783 if (bytes != NULL) {
784 bytes += converted;
785 size -= converted;
786 }
787 else
788 size += converted;
789 }
790 }
791 if (result != NULL) {
792 *bytes = 0;
793 break;
794 }
795
796 size += 1; /* nul byte at the end */
797 result = PyMem_Malloc(size);
798 if (result == NULL)
799 return NULL;
800 bytes = result;
801 }
802 return result;
803}
804
805
806/* Decode a byte string from the locale encoding with the
807 surrogateescape error handler (undecodable bytes are decoded as characters
808 in range U+DC80..U+DCFF). If a byte sequence can be decoded as a surrogate
809 character, escape the bytes using the surrogateescape error handler instead
810 of decoding them.
811
812 Use _Py_wchar2char() to encode the character string back to a byte string.
813
814 Return a pointer to a newly allocated (wide) character string (use
815 PyMem_Free() to free the memory), or NULL on error (conversion error or
816 memory error). */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000817wchar_t*
818_Py_char2wchar(char* arg)
819{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000820 wchar_t *res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000821#ifdef HAVE_BROKEN_MBSTOWCS
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000822 /* Some platforms have a broken implementation of
823 * mbstowcs which does not count the characters that
824 * would result from conversion. Use an upper bound.
825 */
826 size_t argsize = strlen(arg);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000827#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000828 size_t argsize = mbstowcs(NULL, arg, 0);
Ronald Oussorend61deca2010-04-18 14:46:12 +0000829#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000830 size_t count;
831 unsigned char *in;
832 wchar_t *out;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000833#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000834 mbstate_t mbs;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000835#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000836 if (argsize != (size_t)-1) {
837 res = (wchar_t *)PyMem_Malloc((argsize+1)*sizeof(wchar_t));
838 if (!res)
839 goto oom;
840 count = mbstowcs(res, arg, argsize+1);
841 if (count != (size_t)-1) {
842 wchar_t *tmp;
843 /* Only use the result if it contains no
844 surrogate characters. */
845 for (tmp = res; *tmp != 0 &&
846 (*tmp < 0xd800 || *tmp > 0xdfff); tmp++)
847 ;
848 if (*tmp == 0)
849 return res;
850 }
851 PyMem_Free(res);
852 }
853 /* Conversion failed. Fall back to escaping with surrogateescape. */
Ronald Oussorend61deca2010-04-18 14:46:12 +0000854#ifdef HAVE_MBRTOWC
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000855 /* Try conversion with mbrtwoc (C99), and escape non-decodable bytes. */
856
857 /* Overallocate; as multi-byte characters are in the argument, the
858 actual output could use less memory. */
859 argsize = strlen(arg) + 1;
860 res = (wchar_t*)PyMem_Malloc(argsize*sizeof(wchar_t));
861 if (!res) goto oom;
862 in = (unsigned char*)arg;
863 out = res;
864 memset(&mbs, 0, sizeof mbs);
865 while (argsize) {
866 size_t converted = mbrtowc(out, (char*)in, argsize, &mbs);
867 if (converted == 0)
868 /* Reached end of string; null char stored. */
869 break;
870 if (converted == (size_t)-2) {
871 /* Incomplete character. This should never happen,
872 since we provide everything that we have -
873 unless there is a bug in the C library, or I
874 misunderstood how mbrtowc works. */
875 fprintf(stderr, "unexpected mbrtowc result -2\n");
876 return NULL;
877 }
878 if (converted == (size_t)-1) {
879 /* Conversion error. Escape as UTF-8b, and start over
880 in the initial shift state. */
881 *out++ = 0xdc00 + *in++;
882 argsize--;
883 memset(&mbs, 0, sizeof mbs);
884 continue;
885 }
886 if (*out >= 0xd800 && *out <= 0xdfff) {
887 /* Surrogate character. Escape the original
888 byte sequence with surrogateescape. */
889 argsize -= converted;
890 while (converted--)
891 *out++ = 0xdc00 + *in++;
892 continue;
893 }
894 /* successfully converted some bytes */
895 in += converted;
896 argsize -= converted;
897 out++;
898 }
Ronald Oussorend61deca2010-04-18 14:46:12 +0000899#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000900 /* Cannot use C locale for escaping; manually escape as if charset
901 is ASCII (i.e. escape all bytes > 128. This will still roundtrip
902 correctly in the locale's charset, which must be an ASCII superset. */
903 res = PyMem_Malloc((strlen(arg)+1)*sizeof(wchar_t));
904 if (!res) goto oom;
905 in = (unsigned char*)arg;
906 out = res;
907 while(*in)
908 if(*in < 128)
909 *out++ = *in++;
910 else
911 *out++ = 0xdc00 + *in++;
912 *out = 0;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000913#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000914 return res;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000915oom:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000916 fprintf(stderr, "out of memory\n");
917 return NULL;
Ronald Oussorend61deca2010-04-18 14:46:12 +0000918}
919
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000920#ifdef __cplusplus
921}
922#endif