blob: 8bf0892637c182264df3feb5a66fd95496edf267 [file] [log] [blame]
Fred Drake6659c301998-03-03 22:02:19 +00001\documentclass{manual}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002
Guido van Rossum9faf4c51997-10-07 14:38:54 +00003\title{Python/C API Reference Manual}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00004
5\input{boilerplate}
6
Marc-André Lemburga544ea22001-01-17 18:04:31 +00007\makeindex % tell \index to actually write the .idx file
Guido van Rossum9231c8f1997-05-15 21:43:21 +00008
9
10\begin{document}
11
Guido van Rossum9231c8f1997-05-15 21:43:21 +000012\maketitle
13
Fred Drake9f86b661998-07-28 21:55:19 +000014\ifhtml
15\chapter*{Front Matter\label{front}}
16\fi
17
Guido van Rossum9231c8f1997-05-15 21:43:21 +000018\input{copyright}
19
20\begin{abstract}
21
22\noindent
Fred Drake659ebfa2000-04-03 15:42:13 +000023This manual documents the API used by C and \Cpp{} programmers who
Fred Drakee058b4f1998-02-16 06:15:35 +000024want to write extension modules or embed Python. It is a companion to
Fred Drakebe486461999-11-09 17:03:03 +000025\citetitle[../ext/ext.html]{Extending and Embedding the Python
26Interpreter}, which describes the general principles of extension
27writing but does not document the API functions in detail.
Guido van Rossum9231c8f1997-05-15 21:43:21 +000028
Guido van Rossum5b8a5231997-12-30 04:38:44 +000029\strong{Warning:} The current version of this document is incomplete.
30I hope that it is nevertheless useful. I will continue to work on it,
31and release new versions from time to time, independent from Python
32source code releases.
33
Guido van Rossum9231c8f1997-05-15 21:43:21 +000034\end{abstract}
35
Fred Drake4d4f9e71998-01-13 22:25:02 +000036\tableofcontents
Guido van Rossum9231c8f1997-05-15 21:43:21 +000037
Guido van Rossum5060b3b1997-08-17 18:02:23 +000038% XXX Consider moving all this back to ext.tex and giving api.tex
39% XXX a *really* short intro only.
Guido van Rossum9231c8f1997-05-15 21:43:21 +000040
Fred Drakeefd146c1999-02-15 15:30:45 +000041\chapter{Introduction \label{intro}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +000042
Fred Drake659ebfa2000-04-03 15:42:13 +000043The Application Programmer's Interface to Python gives C and
44\Cpp{} programmers access to the Python interpreter at a variety of
45levels. The API is equally usable from \Cpp{}, but for brevity it is
46generally referred to as the Python/C API. There are two
47fundamentally different reasons for using the Python/C API. The first
48reason is to write \emph{extension modules} for specific purposes;
49these are C modules that extend the Python interpreter. This is
50probably the most common use. The second reason is to use Python as a
51component in a larger application; this technique is generally
52referred to as \dfn{embedding} Python in an application.
Guido van Rossum59a61351997-08-14 20:34:33 +000053
Guido van Rossum4a944d71997-08-14 20:35:38 +000054Writing an extension module is a relatively well-understood process,
55where a ``cookbook'' approach works well. There are several tools
56that automate the process to some extent. While people have embedded
57Python in other applications since its early existence, the process of
58embedding Python is less straightforward that writing an extension.
Guido van Rossum59a61351997-08-14 20:34:33 +000059
Guido van Rossum4a944d71997-08-14 20:35:38 +000060Many API functions are useful independent of whether you're embedding
61or extending Python; moreover, most applications that embed Python
62will need to provide a custom extension as well, so it's probably a
63good idea to become familiar with writing an extension before
Guido van Rossum59a61351997-08-14 20:34:33 +000064attempting to embed Python in a real application.
65
Fred Drakeefd146c1999-02-15 15:30:45 +000066
67\section{Include Files \label{includes}}
Guido van Rossum580aa8d1997-11-25 15:34:51 +000068
69All function, type and macro definitions needed to use the Python/C
70API are included in your code by the following line:
71
Fred Drakee058b4f1998-02-16 06:15:35 +000072\begin{verbatim}
73#include "Python.h"
74\end{verbatim}
Guido van Rossum580aa8d1997-11-25 15:34:51 +000075
Fred Drakee058b4f1998-02-16 06:15:35 +000076This implies inclusion of the following standard headers:
Fred Drake0b71cea2000-09-26 05:51:50 +000077\code{<stdio.h>}, \code{<string.h>}, \code{<errno.h>},
78\code{<limits.h>}, and \code{<stdlib.h>} (if available).
Guido van Rossum580aa8d1997-11-25 15:34:51 +000079
80All user visible names defined by Python.h (except those defined by
Fred Drakee058b4f1998-02-16 06:15:35 +000081the included standard headers) have one of the prefixes \samp{Py} or
Fred Drake659ebfa2000-04-03 15:42:13 +000082\samp{_Py}. Names beginning with \samp{_Py} are for internal use by
83the Python implementation and should not be used by extension writers.
84Structure member names do not have a reserved prefix.
Guido van Rossum580aa8d1997-11-25 15:34:51 +000085
Fred Drakee058b4f1998-02-16 06:15:35 +000086\strong{Important:} user code should never define names that begin
87with \samp{Py} or \samp{_Py}. This confuses the reader, and
88jeopardizes the portability of the user code to future Python
89versions, which may define additional names beginning with one of
90these prefixes.
Guido van Rossum580aa8d1997-11-25 15:34:51 +000091
Fred Drake659ebfa2000-04-03 15:42:13 +000092The header files are typically installed with Python. On \UNIX, these
93are located in the directories
94\file{\envvar{prefix}/include/python\var{version}/} and
95\file{\envvar{exec_prefix}/include/python\var{version}/}, where
96\envvar{prefix} and \envvar{exec_prefix} are defined by the
97corresponding parameters to Python's \program{configure} script and
98\var{version} is \code{sys.version[:3]}. On Windows, the headers are
99installed in \file{\envvar{prefix}/include}, where \envvar{prefix} is
100the installation directory specified to the installer.
101
102To include the headers, place both directories (if different) on your
103compiler's search path for includes. Do \emph{not} place the parent
104directories on the search path and then use
Fred Draked5d04352000-09-14 20:24:17 +0000105\samp{\#include <python\shortversion/Python.h>}; this will break on
Fred Drake659ebfa2000-04-03 15:42:13 +0000106multi-platform builds since the platform independent headers under
107\envvar{prefix} include the platform specific headers from
108\envvar{exec_prefix}.
109
Fred Drakeefd146c1999-02-15 15:30:45 +0000110
111\section{Objects, Types and Reference Counts \label{objects}}
Guido van Rossum59a61351997-08-14 20:34:33 +0000112
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000113Most Python/C API functions have one or more arguments as well as a
Fred Drake659ebfa2000-04-03 15:42:13 +0000114return value of type \ctype{PyObject*}. This type is a pointer
Fred Drakee058b4f1998-02-16 06:15:35 +0000115to an opaque data type representing an arbitrary Python
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000116object. Since all Python object types are treated the same way by the
117Python language in most situations (e.g., assignments, scope rules,
118and argument passing), it is only fitting that they should be
Fred Drake659ebfa2000-04-03 15:42:13 +0000119represented by a single C type. Almost all Python objects live on the
120heap: you never declare an automatic or static variable of type
121\ctype{PyObject}, only pointer variables of type \ctype{PyObject*} can
122be declared. The sole exception are the type objects\obindex{type};
123since these must never be deallocated, they are typically static
124\ctype{PyTypeObject} objects.
Guido van Rossum59a61351997-08-14 20:34:33 +0000125
Fred Drakee058b4f1998-02-16 06:15:35 +0000126All Python objects (even Python integers) have a \dfn{type} and a
127\dfn{reference count}. An object's type determines what kind of object
Guido van Rossum4a944d71997-08-14 20:35:38 +0000128it is (e.g., an integer, a list, or a user-defined function; there are
Fred Drakebe486461999-11-09 17:03:03 +0000129many more as explained in the \citetitle[../ref/ref.html]{Python
130Reference Manual}). For each of the well-known types there is a macro
131to check whether an object is of that type; for instance,
Fred Drake659ebfa2000-04-03 15:42:13 +0000132\samp{PyList_Check(\var{a})} is true if (and only if) the object
133pointed to by \var{a} is a Python list.
Guido van Rossum59a61351997-08-14 20:34:33 +0000134
Fred Drakeefd146c1999-02-15 15:30:45 +0000135
136\subsection{Reference Counts \label{refcounts}}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000137
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000138The reference count is important because today's computers have a
Fred Drake003d8da1998-04-13 00:53:42 +0000139finite (and often severely limited) memory size; it counts how many
Guido van Rossum4a944d71997-08-14 20:35:38 +0000140different places there are that have a reference to an object. Such a
Fred Drake659ebfa2000-04-03 15:42:13 +0000141place could be another object, or a global (or static) C variable, or
142a local variable in some C function. When an object's reference count
Guido van Rossum4a944d71997-08-14 20:35:38 +0000143becomes zero, the object is deallocated. If it contains references to
144other objects, their reference count is decremented. Those other
145objects may be deallocated in turn, if this decrement makes their
146reference count become zero, and so on. (There's an obvious problem
147with objects that reference each other here; for now, the solution is
Fred Drake659ebfa2000-04-03 15:42:13 +0000148``don't do that.'')
Guido van Rossum59a61351997-08-14 20:34:33 +0000149
Guido van Rossum4a944d71997-08-14 20:35:38 +0000150Reference counts are always manipulated explicitly. The normal way is
Fred Drake659ebfa2000-04-03 15:42:13 +0000151to use the macro \cfunction{Py_INCREF()}\ttindex{Py_INCREF()} to
152increment an object's reference count by one, and
153\cfunction{Py_DECREF()}\ttindex{Py_DECREF()} to decrement it by
154one. The \cfunction{Py_DECREF()} macro is considerably more complex
155than the incref one, since it must check whether the reference count
156becomes zero and then cause the object's deallocator to be called.
157The deallocator is a function pointer contained in the object's type
158structure. The type-specific deallocator takes care of decrementing
159the reference counts for other objects contained in the object if this
160is a compound object type, such as a list, as well as performing any
161additional finalization that's needed. There's no chance that the
162reference count can overflow; at least as many bits are used to hold
163the reference count as there are distinct memory locations in virtual
164memory (assuming \code{sizeof(long) >= sizeof(char*)}). Thus, the
165reference count increment is a simple operation.
Guido van Rossum59a61351997-08-14 20:34:33 +0000166
Guido van Rossum4a944d71997-08-14 20:35:38 +0000167It is not necessary to increment an object's reference count for every
168local variable that contains a pointer to an object. In theory, the
Fred Drakee058b4f1998-02-16 06:15:35 +0000169object's reference count goes up by one when the variable is made to
Guido van Rossum4a944d71997-08-14 20:35:38 +0000170point to it and it goes down by one when the variable goes out of
171scope. However, these two cancel each other out, so at the end the
172reference count hasn't changed. The only real reason to use the
173reference count is to prevent the object from being deallocated as
174long as our variable is pointing to it. If we know that there is at
175least one other reference to the object that lives at least as long as
176our variable, there is no need to increment the reference count
177temporarily. An important situation where this arises is in objects
Fred Drake659ebfa2000-04-03 15:42:13 +0000178that are passed as arguments to C functions in an extension module
Guido van Rossum4a944d71997-08-14 20:35:38 +0000179that are called from Python; the call mechanism guarantees to hold a
Guido van Rossum59a61351997-08-14 20:34:33 +0000180reference to every argument for the duration of the call.
181
Fred Drakee058b4f1998-02-16 06:15:35 +0000182However, a common pitfall is to extract an object from a list and
183hold on to it for a while without incrementing its reference count.
184Some other operation might conceivably remove the object from the
185list, decrementing its reference count and possible deallocating it.
186The real danger is that innocent-looking operations may invoke
187arbitrary Python code which could do this; there is a code path which
188allows control to flow back to the user from a \cfunction{Py_DECREF()},
189so almost any operation is potentially dangerous.
Guido van Rossum59a61351997-08-14 20:34:33 +0000190
Guido van Rossum4a944d71997-08-14 20:35:38 +0000191A safe approach is to always use the generic operations (functions
Fred Drake659ebfa2000-04-03 15:42:13 +0000192whose name begins with \samp{PyObject_}, \samp{PyNumber_},
193\samp{PySequence_} or \samp{PyMapping_}). These operations always
194increment the reference count of the object they return. This leaves
195the caller with the responsibility to call
196\cfunction{Py_DECREF()} when they are done with the result; this soon
197becomes second nature.
Guido van Rossum59a61351997-08-14 20:34:33 +0000198
Fred Drakeefd146c1999-02-15 15:30:45 +0000199
200\subsubsection{Reference Count Details \label{refcountDetails}}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000201
202The reference count behavior of functions in the Python/C API is best
Fred Drake659ebfa2000-04-03 15:42:13 +0000203explained in terms of \emph{ownership of references}. Note that we
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000204talk of owning references, never of owning objects; objects are always
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000205shared! When a function owns a reference, it has to dispose of it
Fred Drakee058b4f1998-02-16 06:15:35 +0000206properly --- either by passing ownership on (usually to its caller) or
207by calling \cfunction{Py_DECREF()} or \cfunction{Py_XDECREF()}. When
208a function passes ownership of a reference on to its caller, the
209caller is said to receive a \emph{new} reference. When no ownership
210is transferred, the caller is said to \emph{borrow} the reference.
211Nothing needs to be done for a borrowed reference.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000212
Fred Drakea8455ab2000-06-16 19:58:42 +0000213Conversely, when a calling function passes it a reference to an
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000214object, there are two possibilities: the function \emph{steals} a
215reference to the object, or it does not. Few functions steal
Fred Drakee058b4f1998-02-16 06:15:35 +0000216references; the two notable exceptions are
Fred Drake659ebfa2000-04-03 15:42:13 +0000217\cfunction{PyList_SetItem()}\ttindex{PyList_SetItem()} and
218\cfunction{PyTuple_SetItem()}\ttindex{PyTuple_SetItem()}, which
Fred Drakee058b4f1998-02-16 06:15:35 +0000219steal a reference to the item (but not to the tuple or list into which
Fred Drake003d8da1998-04-13 00:53:42 +0000220the item is put!). These functions were designed to steal a reference
Fred Drakee058b4f1998-02-16 06:15:35 +0000221because of a common idiom for populating a tuple or list with newly
222created objects; for example, the code to create the tuple \code{(1,
2232, "three")} could look like this (forgetting about error handling for
Fred Drake659ebfa2000-04-03 15:42:13 +0000224the moment; a better way to code this is shown below):
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000225
226\begin{verbatim}
227PyObject *t;
Fred Drakec6fa34e1998-04-02 06:47:24 +0000228
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000229t = PyTuple_New(3);
230PyTuple_SetItem(t, 0, PyInt_FromLong(1L));
231PyTuple_SetItem(t, 1, PyInt_FromLong(2L));
232PyTuple_SetItem(t, 2, PyString_FromString("three"));
233\end{verbatim}
234
Fred Drakee058b4f1998-02-16 06:15:35 +0000235Incidentally, \cfunction{PyTuple_SetItem()} is the \emph{only} way to
236set tuple items; \cfunction{PySequence_SetItem()} and
237\cfunction{PyObject_SetItem()} refuse to do this since tuples are an
238immutable data type. You should only use
239\cfunction{PyTuple_SetItem()} for tuples that you are creating
Guido van Rossum5b8a5231997-12-30 04:38:44 +0000240yourself.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000241
242Equivalent code for populating a list can be written using
Fred Drakee058b4f1998-02-16 06:15:35 +0000243\cfunction{PyList_New()} and \cfunction{PyList_SetItem()}. Such code
244can also use \cfunction{PySequence_SetItem()}; this illustrates the
245difference between the two (the extra \cfunction{Py_DECREF()} calls):
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000246
247\begin{verbatim}
248PyObject *l, *x;
Fred Drakec6fa34e1998-04-02 06:47:24 +0000249
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000250l = PyList_New(3);
251x = PyInt_FromLong(1L);
Guido van Rossum5b8a5231997-12-30 04:38:44 +0000252PySequence_SetItem(l, 0, x); Py_DECREF(x);
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000253x = PyInt_FromLong(2L);
Guido van Rossum5b8a5231997-12-30 04:38:44 +0000254PySequence_SetItem(l, 1, x); Py_DECREF(x);
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000255x = PyString_FromString("three");
Guido van Rossum5b8a5231997-12-30 04:38:44 +0000256PySequence_SetItem(l, 2, x); Py_DECREF(x);
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000257\end{verbatim}
258
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000259You might find it strange that the ``recommended'' approach takes more
260code. However, in practice, you will rarely use these ways of
261creating and populating a tuple or list. There's a generic function,
Fred Drakee058b4f1998-02-16 06:15:35 +0000262\cfunction{Py_BuildValue()}, that can create most common objects from
Fred Drake659ebfa2000-04-03 15:42:13 +0000263C values, directed by a \dfn{format string}. For example, the
Fred Drakee058b4f1998-02-16 06:15:35 +0000264above two blocks of code could be replaced by the following (which
265also takes care of the error checking):
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000266
267\begin{verbatim}
268PyObject *t, *l;
Fred Drakec6fa34e1998-04-02 06:47:24 +0000269
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000270t = Py_BuildValue("(iis)", 1, 2, "three");
271l = Py_BuildValue("[iis]", 1, 2, "three");
272\end{verbatim}
273
Fred Drakee058b4f1998-02-16 06:15:35 +0000274It is much more common to use \cfunction{PyObject_SetItem()} and
275friends with items whose references you are only borrowing, like
276arguments that were passed in to the function you are writing. In
277that case, their behaviour regarding reference counts is much saner,
278since you don't have to increment a reference count so you can give a
279reference away (``have it be stolen''). For example, this function
280sets all items of a list (actually, any mutable sequence) to a given
281item:
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000282
283\begin{verbatim}
284int set_all(PyObject *target, PyObject *item)
285{
286 int i, n;
Fred Drakec6fa34e1998-04-02 06:47:24 +0000287
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000288 n = PyObject_Length(target);
289 if (n < 0)
290 return -1;
291 for (i = 0; i < n; i++) {
292 if (PyObject_SetItem(target, i, item) < 0)
293 return -1;
294 }
295 return 0;
296}
297\end{verbatim}
Fred Drake659ebfa2000-04-03 15:42:13 +0000298\ttindex{set_all()}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000299
300The situation is slightly different for function return values.
301While passing a reference to most functions does not change your
302ownership responsibilities for that reference, many functions that
303return a referece to an object give you ownership of the reference.
304The reason is simple: in many cases, the returned object is created
305on the fly, and the reference you get is the only reference to the
Fred Drakee058b4f1998-02-16 06:15:35 +0000306object. Therefore, the generic functions that return object
307references, like \cfunction{PyObject_GetItem()} and
308\cfunction{PySequence_GetItem()}, always return a new reference (i.e.,
309the caller becomes the owner of the reference).
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000310
311It is important to realize that whether you own a reference returned
Fred Drakee058b4f1998-02-16 06:15:35 +0000312by a function depends on which function you call only --- \emph{the
313plumage} (i.e., the type of the type of the object passed as an
314argument to the function) \emph{doesn't enter into it!} Thus, if you
315extract an item from a list using \cfunction{PyList_GetItem()}, you
316don't own the reference --- but if you obtain the same item from the
317same list using \cfunction{PySequence_GetItem()} (which happens to
318take exactly the same arguments), you do own a reference to the
319returned object.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000320
Fred Drakee058b4f1998-02-16 06:15:35 +0000321Here is an example of how you could write a function that computes the
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000322sum of the items in a list of integers; once using
Fred Drake659ebfa2000-04-03 15:42:13 +0000323\cfunction{PyList_GetItem()}\ttindex{PyList_GetItem()}, and once using
324\cfunction{PySequence_GetItem()}\ttindex{PySequence_GetItem()}.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000325
326\begin{verbatim}
327long sum_list(PyObject *list)
328{
329 int i, n;
330 long total = 0;
331 PyObject *item;
Fred Drakec6fa34e1998-04-02 06:47:24 +0000332
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000333 n = PyList_Size(list);
334 if (n < 0)
335 return -1; /* Not a list */
336 for (i = 0; i < n; i++) {
337 item = PyList_GetItem(list, i); /* Can't fail */
338 if (!PyInt_Check(item)) continue; /* Skip non-integers */
339 total += PyInt_AsLong(item);
340 }
341 return total;
342}
343\end{verbatim}
Fred Drake659ebfa2000-04-03 15:42:13 +0000344\ttindex{sum_list()}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000345
346\begin{verbatim}
347long sum_sequence(PyObject *sequence)
348{
349 int i, n;
350 long total = 0;
351 PyObject *item;
Fred Drake659ebfa2000-04-03 15:42:13 +0000352 n = PySequence_Length(sequence);
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000353 if (n < 0)
354 return -1; /* Has no length */
355 for (i = 0; i < n; i++) {
Fred Drake659ebfa2000-04-03 15:42:13 +0000356 item = PySequence_GetItem(sequence, i);
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000357 if (item == NULL)
358 return -1; /* Not a sequence, or other failure */
359 if (PyInt_Check(item))
360 total += PyInt_AsLong(item);
Guido van Rossum5b8a5231997-12-30 04:38:44 +0000361 Py_DECREF(item); /* Discard reference ownership */
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000362 }
363 return total;
364}
365\end{verbatim}
Fred Drake659ebfa2000-04-03 15:42:13 +0000366\ttindex{sum_sequence()}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000367
Fred Drakeefd146c1999-02-15 15:30:45 +0000368
369\subsection{Types \label{types}}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000370
371There are few other data types that play a significant role in
Fred Drake659ebfa2000-04-03 15:42:13 +0000372the Python/C API; most are simple C types such as \ctype{int},
373\ctype{long}, \ctype{double} and \ctype{char*}. A few structure types
Guido van Rossum4a944d71997-08-14 20:35:38 +0000374are used to describe static tables used to list the functions exported
Fred Drake659ebfa2000-04-03 15:42:13 +0000375by a module or the data attributes of a new object type, and another
376is used to describe the value of a complex number. These will
Guido van Rossum59a61351997-08-14 20:34:33 +0000377be discussed together with the functions that use them.
378
Fred Drakeefd146c1999-02-15 15:30:45 +0000379
380\section{Exceptions \label{exceptions}}
Guido van Rossum59a61351997-08-14 20:34:33 +0000381
Guido van Rossum4a944d71997-08-14 20:35:38 +0000382The Python programmer only needs to deal with exceptions if specific
383error handling is required; unhandled exceptions are automatically
Fred Drake659ebfa2000-04-03 15:42:13 +0000384propagated to the caller, then to the caller's caller, and so on, until
Guido van Rossum4a944d71997-08-14 20:35:38 +0000385they reach the top-level interpreter, where they are reported to the
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000386user accompanied by a stack traceback.
Guido van Rossum59a61351997-08-14 20:34:33 +0000387
Fred Drake659ebfa2000-04-03 15:42:13 +0000388For C programmers, however, error checking always has to be explicit.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000389All functions in the Python/C API can raise exceptions, unless an
390explicit claim is made otherwise in a function's documentation. In
391general, when a function encounters an error, it sets an exception,
392discards any object references that it owns, and returns an
Fred Drakee058b4f1998-02-16 06:15:35 +0000393error indicator --- usually \NULL{} or \code{-1}. A few functions
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000394return a Boolean true/false result, with false indicating an error.
395Very few functions return no explicit error indicator or have an
396ambiguous return value, and require explicit testing for errors with
Fred Drake659ebfa2000-04-03 15:42:13 +0000397\cfunction{PyErr_Occurred()}\ttindex{PyErr_Occurred()}.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000398
399Exception state is maintained in per-thread storage (this is
400equivalent to using global storage in an unthreaded application). A
Fred Drakec6fa34e1998-04-02 06:47:24 +0000401thread can be in one of two states: an exception has occurred, or not.
Fred Drakee058b4f1998-02-16 06:15:35 +0000402The function \cfunction{PyErr_Occurred()} can be used to check for
403this: it returns a borrowed reference to the exception type object
404when an exception has occurred, and \NULL{} otherwise. There are a
405number of functions to set the exception state:
Fred Drake659ebfa2000-04-03 15:42:13 +0000406\cfunction{PyErr_SetString()}\ttindex{PyErr_SetString()} is the most
407common (though not the most general) function to set the exception
408state, and \cfunction{PyErr_Clear()}\ttindex{PyErr_Clear()} clears the
409exception state.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000410
411The full exception state consists of three objects (all of which can
Fred Drakee058b4f1998-02-16 06:15:35 +0000412be \NULL{}): the exception type, the corresponding exception
Fred Drake659ebfa2000-04-03 15:42:13 +0000413value, and the traceback. These have the same meanings as the Python
414\withsubitem{(in module sys)}{
415 \ttindex{exc_type}\ttindex{exc_value}\ttindex{exc_traceback}}
416objects \code{sys.exc_type}, \code{sys.exc_value}, and
417\code{sys.exc_traceback}; however, they are not the same: the Python
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000418objects represent the last exception being handled by a Python
Fred Drake659ebfa2000-04-03 15:42:13 +0000419\keyword{try} \ldots\ \keyword{except} statement, while the C level
Fred Drakee058b4f1998-02-16 06:15:35 +0000420exception state only exists while an exception is being passed on
Fred Drake659ebfa2000-04-03 15:42:13 +0000421between C functions until it reaches the Python bytecode interpreter's
422main loop, which takes care of transferring it to \code{sys.exc_type}
423and friends.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000424
Fred Drakec6fa34e1998-04-02 06:47:24 +0000425Note that starting with Python 1.5, the preferred, thread-safe way to
Fred Drake659ebfa2000-04-03 15:42:13 +0000426access the exception state from Python code is to call the function
427\withsubitem{(in module sys)}{\ttindex{exc_info()}}
Fred Drakee058b4f1998-02-16 06:15:35 +0000428\function{sys.exc_info()}, which returns the per-thread exception state
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000429for Python code. Also, the semantics of both ways to access the
430exception state have changed so that a function which catches an
431exception will save and restore its thread's exception state so as to
432preserve the exception state of its caller. This prevents common bugs
433in exception handling code caused by an innocent-looking function
434overwriting the exception being handled; it also reduces the often
435unwanted lifetime extension for objects that are referenced by the
Fred Drakec6fa34e1998-04-02 06:47:24 +0000436stack frames in the traceback.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000437
438As a general principle, a function that calls another function to
439perform some task should check whether the called function raised an
440exception, and if so, pass the exception state on to its caller. It
Fred Drake659ebfa2000-04-03 15:42:13 +0000441should discard any object references that it owns, and return an
Fred Drakee058b4f1998-02-16 06:15:35 +0000442error indicator, but it should \emph{not} set another exception ---
443that would overwrite the exception that was just raised, and lose
444important information about the exact cause of the error.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000445
Fred Drake659ebfa2000-04-03 15:42:13 +0000446A simple example of detecting exceptions and passing them on is shown
447in the \cfunction{sum_sequence()}\ttindex{sum_sequence()} example
448above. It so happens that that example doesn't need to clean up any
449owned references when it detects an error. The following example
450function shows some error cleanup. First, to remind you why you like
451Python, we show the equivalent Python code:
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000452
453\begin{verbatim}
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000454def incr_item(dict, key):
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000455 try:
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000456 item = dict[key]
457 except KeyError:
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000458 item = 0
Fred Drake6b3f3f22000-11-29 15:48:22 +0000459 dict[key] = item + 1
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000460\end{verbatim}
Fred Drake659ebfa2000-04-03 15:42:13 +0000461\ttindex{incr_item()}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000462
Fred Drake659ebfa2000-04-03 15:42:13 +0000463Here is the corresponding C code, in all its glory:
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000464
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000465\begin{verbatim}
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000466int incr_item(PyObject *dict, PyObject *key)
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000467{
468 /* Objects all initialized to NULL for Py_XDECREF */
469 PyObject *item = NULL, *const_one = NULL, *incremented_item = NULL;
Guido van Rossum5b8a5231997-12-30 04:38:44 +0000470 int rv = -1; /* Return value initialized to -1 (failure) */
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000471
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000472 item = PyObject_GetItem(dict, key);
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000473 if (item == NULL) {
Fred Drakec6fa34e1998-04-02 06:47:24 +0000474 /* Handle KeyError only: */
Fred Drake6b3f3f22000-11-29 15:48:22 +0000475 if (!PyErr_ExceptionMatches(PyExc_KeyError))
476 goto error;
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000477
478 /* Clear the error and use zero: */
479 PyErr_Clear();
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000480 item = PyInt_FromLong(0L);
Fred Drake6b3f3f22000-11-29 15:48:22 +0000481 if (item == NULL)
482 goto error;
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000483 }
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000484 const_one = PyInt_FromLong(1L);
Fred Drake6b3f3f22000-11-29 15:48:22 +0000485 if (const_one == NULL)
486 goto error;
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000487
488 incremented_item = PyNumber_Add(item, const_one);
Fred Drake6b3f3f22000-11-29 15:48:22 +0000489 if (incremented_item == NULL)
490 goto error;
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000491
Fred Drake6b3f3f22000-11-29 15:48:22 +0000492 if (PyObject_SetItem(dict, key, incremented_item) < 0)
493 goto error;
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000494 rv = 0; /* Success */
495 /* Continue with cleanup code */
496
497 error:
498 /* Cleanup code, shared by success and failure path */
499
500 /* Use Py_XDECREF() to ignore NULL references */
501 Py_XDECREF(item);
502 Py_XDECREF(const_one);
503 Py_XDECREF(incremented_item);
504
505 return rv; /* -1 for error, 0 for success */
506}
507\end{verbatim}
Fred Drake659ebfa2000-04-03 15:42:13 +0000508\ttindex{incr_item()}
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000509
Fred Drakef8830d11998-04-23 14:06:01 +0000510This example represents an endorsed use of the \keyword{goto} statement
Fred Drake659ebfa2000-04-03 15:42:13 +0000511in C! It illustrates the use of
512\cfunction{PyErr_ExceptionMatches()}\ttindex{PyErr_ExceptionMatches()} and
513\cfunction{PyErr_Clear()}\ttindex{PyErr_Clear()} to
514handle specific exceptions, and the use of
515\cfunction{Py_XDECREF()}\ttindex{Py_XDECREF()} to
516dispose of owned references that may be \NULL{} (note the
517\character{X} in the name; \cfunction{Py_DECREF()} would crash when
518confronted with a \NULL{} reference). It is important that the
519variables used to hold owned references are initialized to \NULL{} for
520this to work; likewise, the proposed return value is initialized to
521\code{-1} (failure) and only set to success after the final call made
522is successful.
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000523
Guido van Rossum59a61351997-08-14 20:34:33 +0000524
Fred Drakeefd146c1999-02-15 15:30:45 +0000525\section{Embedding Python \label{embedding}}
Guido van Rossum59a61351997-08-14 20:34:33 +0000526
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000527The one important task that only embedders (as opposed to extension
528writers) of the Python interpreter have to worry about is the
529initialization, and possibly the finalization, of the Python
530interpreter. Most functionality of the interpreter can only be used
531after the interpreter has been initialized.
Guido van Rossum59a61351997-08-14 20:34:33 +0000532
Fred Drake659ebfa2000-04-03 15:42:13 +0000533The basic initialization function is
534\cfunction{Py_Initialize()}\ttindex{Py_Initialize()}.
Fred Drakee058b4f1998-02-16 06:15:35 +0000535This initializes the table of loaded modules, and creates the
Fred Drake4de05a91998-02-16 14:25:26 +0000536fundamental modules \module{__builtin__}\refbimodindex{__builtin__},
537\module{__main__}\refbimodindex{__main__} and
538\module{sys}\refbimodindex{sys}. It also initializes the module
Fred Drakec6fa34e1998-04-02 06:47:24 +0000539search path (\code{sys.path}).%
540\indexiii{module}{search}{path}
Fred Drake659ebfa2000-04-03 15:42:13 +0000541\withsubitem{(in module sys)}{\ttindex{path}}
Guido van Rossum59a61351997-08-14 20:34:33 +0000542
Fred Drakee058b4f1998-02-16 06:15:35 +0000543\cfunction{Py_Initialize()} does not set the ``script argument list''
Guido van Rossum4a944d71997-08-14 20:35:38 +0000544(\code{sys.argv}). If this variable is needed by Python code that
545will be executed later, it must be set explicitly with a call to
Fred Drake659ebfa2000-04-03 15:42:13 +0000546\code{PySys_SetArgv(\var{argc},
547\var{argv})}\ttindex{PySys_SetArgv()} subsequent to the call to
548\cfunction{Py_Initialize()}.
Guido van Rossum59a61351997-08-14 20:34:33 +0000549
Fred Drakeb0a78731998-01-13 18:51:10 +0000550On most systems (in particular, on \UNIX{} and Windows, although the
Fred Drake659ebfa2000-04-03 15:42:13 +0000551details are slightly different),
552\cfunction{Py_Initialize()} calculates the module search path based
553upon its best guess for the location of the standard Python
554interpreter executable, assuming that the Python library is found in a
555fixed location relative to the Python interpreter executable. In
556particular, it looks for a directory named
Fred Draked5d04352000-09-14 20:24:17 +0000557\file{lib/python\shortversion} relative to the parent directory where
558the executable named \file{python} is found on the shell command
559search path (the environment variable \envvar{PATH}).
Guido van Rossum42cefd01997-10-05 15:27:29 +0000560
561For instance, if the Python executable is found in
Fred Drakee058b4f1998-02-16 06:15:35 +0000562\file{/usr/local/bin/python}, it will assume that the libraries are in
Fred Draked5d04352000-09-14 20:24:17 +0000563\file{/usr/local/lib/python\shortversion}. (In fact, this particular path
Fred Drakee058b4f1998-02-16 06:15:35 +0000564is also the ``fallback'' location, used when no executable file named
Fred Drakec6fa34e1998-04-02 06:47:24 +0000565\file{python} is found along \envvar{PATH}.) The user can override
566this behavior by setting the environment variable \envvar{PYTHONHOME},
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000567or insert additional directories in front of the standard path by
Fred Drakec6fa34e1998-04-02 06:47:24 +0000568setting \envvar{PYTHONPATH}.
Guido van Rossum59a61351997-08-14 20:34:33 +0000569
Guido van Rossum4a944d71997-08-14 20:35:38 +0000570The embedding application can steer the search by calling
Fred Drake659ebfa2000-04-03 15:42:13 +0000571\code{Py_SetProgramName(\var{file})}\ttindex{Py_SetProgramName()} \emph{before} calling
Fred Drakec6fa34e1998-04-02 06:47:24 +0000572\cfunction{Py_Initialize()}. Note that \envvar{PYTHONHOME} still
573overrides this and \envvar{PYTHONPATH} is still inserted in front of
Fred Drakee058b4f1998-02-16 06:15:35 +0000574the standard path. An application that requires total control has to
Fred Drake659ebfa2000-04-03 15:42:13 +0000575provide its own implementation of
576\cfunction{Py_GetPath()}\ttindex{Py_GetPath()},
577\cfunction{Py_GetPrefix()}\ttindex{Py_GetPrefix()},
578\cfunction{Py_GetExecPrefix()}\ttindex{Py_GetExecPrefix()}, and
579\cfunction{Py_GetProgramFullPath()}\ttindex{Py_GetProgramFullPath()} (all
580defined in \file{Modules/getpath.c}).
Guido van Rossum59a61351997-08-14 20:34:33 +0000581
Guido van Rossum4a944d71997-08-14 20:35:38 +0000582Sometimes, it is desirable to ``uninitialize'' Python. For instance,
583the application may want to start over (make another call to
Fred Drakee058b4f1998-02-16 06:15:35 +0000584\cfunction{Py_Initialize()}) or the application is simply done with its
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000585use of Python and wants to free all memory allocated by Python. This
Fred Drakee058b4f1998-02-16 06:15:35 +0000586can be accomplished by calling \cfunction{Py_Finalize()}. The function
Fred Drake659ebfa2000-04-03 15:42:13 +0000587\cfunction{Py_IsInitialized()}\ttindex{Py_IsInitialized()} returns
588true if Python is currently in the initialized state. More
589information about these functions is given in a later chapter.
Guido van Rossum59a61351997-08-14 20:34:33 +0000590
Guido van Rossum4a944d71997-08-14 20:35:38 +0000591
Fred Drakeefd146c1999-02-15 15:30:45 +0000592\chapter{The Very High Level Layer \label{veryhigh}}
Guido van Rossum4a944d71997-08-14 20:35:38 +0000593
Fred Drakee5bf8b21998-02-12 21:22:28 +0000594The functions in this chapter will let you execute Python source code
595given in a file or a buffer, but they will not let you interact in a
596more detailed way with the interpreter.
Guido van Rossum4a944d71997-08-14 20:35:38 +0000597
Fred Drake659ebfa2000-04-03 15:42:13 +0000598Several of these functions accept a start symbol from the grammar as a
599parameter. The available start symbols are \constant{Py_eval_input},
600\constant{Py_file_input}, and \constant{Py_single_input}. These are
601described following the functions which accept them as parameters.
602
Fred Drake510d08b2000-08-14 02:50:21 +0000603Note also that several of these functions take \ctype{FILE*}
604parameters. On particular issue which needs to be handled carefully
605is that the \ctype{FILE} structure for different C libraries can be
606different and incompatible. Under Windows (at least), it is possible
607for dynamically linked extensions to actually use different libraries,
608so care should be taken that \ctype{FILE*} parameters are only passed
609to these functions if it is certain that they were created by the same
610library that the Python runtime is using.
611
Fred Drakec6fa34e1998-04-02 06:47:24 +0000612\begin{cfuncdesc}{int}{PyRun_AnyFile}{FILE *fp, char *filename}
Fred Drake0041a941999-04-29 04:20:46 +0000613 If \var{fp} refers to a file associated with an interactive device
614 (console or terminal input or \UNIX{} pseudo-terminal), return the
615 value of \cfunction{PyRun_InteractiveLoop()}, otherwise return the
616 result of \cfunction{PyRun_SimpleFile()}. If \var{filename} is
Fred Drakea8d73412000-08-11 20:39:29 +0000617 \NULL{}, this function uses \code{"???"} as the filename.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000618\end{cfuncdesc}
619
Fred Drakec6fa34e1998-04-02 06:47:24 +0000620\begin{cfuncdesc}{int}{PyRun_SimpleString}{char *command}
Fred Drake0041a941999-04-29 04:20:46 +0000621 Executes the Python source code from \var{command} in the
622 \module{__main__} module. If \module{__main__} does not already
623 exist, it is created. Returns \code{0} on success or \code{-1} if
624 an exception was raised. If there was an error, there is no way to
625 get the exception information.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000626\end{cfuncdesc}
627
Fred Drakec6fa34e1998-04-02 06:47:24 +0000628\begin{cfuncdesc}{int}{PyRun_SimpleFile}{FILE *fp, char *filename}
Fred Drake0041a941999-04-29 04:20:46 +0000629 Similar to \cfunction{PyRun_SimpleString()}, but the Python source
630 code is read from \var{fp} instead of an in-memory string.
631 \var{filename} should be the name of the file.
Fred Drakee5bf8b21998-02-12 21:22:28 +0000632\end{cfuncdesc}
633
Fred Drakec6fa34e1998-04-02 06:47:24 +0000634\begin{cfuncdesc}{int}{PyRun_InteractiveOne}{FILE *fp, char *filename}
Fred Drakea8d73412000-08-11 20:39:29 +0000635 Read and execute a single statement from a file associated with an
636 interactive device. If \var{filename} is \NULL, \code{"???"} is
637 used instead. The user will be prompted using \code{sys.ps1} and
638 \code{sys.ps2}. Returns \code{0} when the input was executed
639 successfully, \code{-1} if there was an exception, or an error code
640 from the \file{errcode.h} include file distributed as part of Python
641 in case of a parse error. (Note that \file{errcode.h} is not
642 included by \file{Python.h}, so must be included specifically if
643 needed.)
Fred Drakee5bf8b21998-02-12 21:22:28 +0000644\end{cfuncdesc}
645
Fred Drakec6fa34e1998-04-02 06:47:24 +0000646\begin{cfuncdesc}{int}{PyRun_InteractiveLoop}{FILE *fp, char *filename}
Fred Drakea8d73412000-08-11 20:39:29 +0000647 Read and execute statements from a file associated with an
648 interactive device until \EOF{} is reached. If \var{filename} is
649 \NULL, \code{"???"} is used instead. The user will be prompted
650 using \code{sys.ps1} and \code{sys.ps2}. Returns \code{0} at \EOF.
Fred Drakee5bf8b21998-02-12 21:22:28 +0000651\end{cfuncdesc}
652
Fred Drakec6fa34e1998-04-02 06:47:24 +0000653\begin{cfuncdesc}{struct _node*}{PyParser_SimpleParseString}{char *str,
654 int start}
Fred Drake0041a941999-04-29 04:20:46 +0000655 Parse Python source code from \var{str} using the start token
656 \var{start}. The result can be used to create a code object which
657 can be evaluated efficiently. This is useful if a code fragment
658 must be evaluated many times.
Fred Drakee5bf8b21998-02-12 21:22:28 +0000659\end{cfuncdesc}
660
Fred Drakec6fa34e1998-04-02 06:47:24 +0000661\begin{cfuncdesc}{struct _node*}{PyParser_SimpleParseFile}{FILE *fp,
662 char *filename, int start}
Fred Drake0041a941999-04-29 04:20:46 +0000663 Similar to \cfunction{PyParser_SimpleParseString()}, but the Python
664 source code is read from \var{fp} instead of an in-memory string.
665 \var{filename} should be the name of the file.
Fred Drakee5bf8b21998-02-12 21:22:28 +0000666\end{cfuncdesc}
667
Fred Drakec6fa34e1998-04-02 06:47:24 +0000668\begin{cfuncdesc}{PyObject*}{PyRun_String}{char *str, int start,
669 PyObject *globals,
670 PyObject *locals}
Fred Drake0041a941999-04-29 04:20:46 +0000671 Execute Python source code from \var{str} in the context specified
672 by the dictionaries \var{globals} and \var{locals}. The parameter
673 \var{start} specifies the start token that should be used to parse
674 the source code.
675
676 Returns the result of executing the code as a Python object, or
677 \NULL{} if an exception was raised.
Fred Drakee5bf8b21998-02-12 21:22:28 +0000678\end{cfuncdesc}
679
Fred Drakec6fa34e1998-04-02 06:47:24 +0000680\begin{cfuncdesc}{PyObject*}{PyRun_File}{FILE *fp, char *filename,
681 int start, PyObject *globals,
682 PyObject *locals}
Fred Drake0041a941999-04-29 04:20:46 +0000683 Similar to \cfunction{PyRun_String()}, but the Python source code is
Fred Drake659ebfa2000-04-03 15:42:13 +0000684 read from \var{fp} instead of an in-memory string.
685 \var{filename} should be the name of the file.
Fred Drakee5bf8b21998-02-12 21:22:28 +0000686\end{cfuncdesc}
687
Fred Drakec6fa34e1998-04-02 06:47:24 +0000688\begin{cfuncdesc}{PyObject*}{Py_CompileString}{char *str, char *filename,
689 int start}
Fred Drake0041a941999-04-29 04:20:46 +0000690 Parse and compile the Python source code in \var{str}, returning the
691 resulting code object. The start token is given by \var{start};
Fred Drakec924b8d1999-08-23 18:57:25 +0000692 this can be used to constrain the code which can be compiled and should
693 be \constant{Py_eval_input}, \constant{Py_file_input}, or
694 \constant{Py_single_input}. The filename specified by
695 \var{filename} is used to construct the code object and may appear
696 in tracebacks or \exception{SyntaxError} exception messages. This
697 returns \NULL{} if the code cannot be parsed or compiled.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000698\end{cfuncdesc}
699
Fred Drakec924b8d1999-08-23 18:57:25 +0000700\begin{cvardesc}{int}{Py_eval_input}
701 The start symbol from the Python grammar for isolated expressions;
Fred Drake659ebfa2000-04-03 15:42:13 +0000702 for use with \cfunction{Py_CompileString()}\ttindex{Py_CompileString()}.
Fred Drakec924b8d1999-08-23 18:57:25 +0000703\end{cvardesc}
704
705\begin{cvardesc}{int}{Py_file_input}
706 The start symbol from the Python grammar for sequences of statements
707 as read from a file or other source; for use with
Fred Drake659ebfa2000-04-03 15:42:13 +0000708 \cfunction{Py_CompileString()}\ttindex{Py_CompileString()}. This is
709 the symbol to use when compiling arbitrarily long Python source code.
Fred Drakec924b8d1999-08-23 18:57:25 +0000710\end{cvardesc}
711
712\begin{cvardesc}{int}{Py_single_input}
713 The start symbol from the Python grammar for a single statement; for
Fred Drake659ebfa2000-04-03 15:42:13 +0000714 use with \cfunction{Py_CompileString()}\ttindex{Py_CompileString()}.
715 This is the symbol used for the interactive interpreter loop.
Fred Drakec924b8d1999-08-23 18:57:25 +0000716\end{cvardesc}
717
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000718
Fred Drakeefd146c1999-02-15 15:30:45 +0000719\chapter{Reference Counting \label{countingRefs}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000720
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000721The macros in this section are used for managing reference counts
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000722of Python objects.
723
724\begin{cfuncdesc}{void}{Py_INCREF}{PyObject *o}
Fred Drakec6fa34e1998-04-02 06:47:24 +0000725Increment the reference count for object \var{o}. The object must
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000726not be \NULL{}; if you aren't sure that it isn't \NULL{}, use
Fred Drakee058b4f1998-02-16 06:15:35 +0000727\cfunction{Py_XINCREF()}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000728\end{cfuncdesc}
729
730\begin{cfuncdesc}{void}{Py_XINCREF}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +0000731Increment the reference count for object \var{o}. The object may be
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000732\NULL{}, in which case the macro has no effect.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000733\end{cfuncdesc}
734
735\begin{cfuncdesc}{void}{Py_DECREF}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +0000736Decrement the reference count for object \var{o}. The object must
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000737not be \NULL{}; if you aren't sure that it isn't \NULL{}, use
Fred Drakee058b4f1998-02-16 06:15:35 +0000738\cfunction{Py_XDECREF()}. If the reference count reaches zero, the
739object's type's deallocation function (which must not be \NULL{}) is
740invoked.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000741
742\strong{Warning:} The deallocation function can cause arbitrary Python
Fred Drake659ebfa2000-04-03 15:42:13 +0000743code to be invoked (e.g. when a class instance with a
744\method{__del__()} method is deallocated). While exceptions in such
745code are not propagated, the executed code has free access to all
746Python global variables. This means that any object that is reachable
747from a global variable should be in a consistent state before
748\cfunction{Py_DECREF()} is invoked. For example, code to delete an
749object from a list should copy a reference to the deleted object in a
750temporary variable, update the list data structure, and then call
751\cfunction{Py_DECREF()} for the temporary variable.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000752\end{cfuncdesc}
753
754\begin{cfuncdesc}{void}{Py_XDECREF}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +0000755Decrement the reference count for object \var{o}. The object may be
756\NULL{}, in which case the macro has no effect; otherwise the effect
757is the same as for \cfunction{Py_DECREF()}, and the same warning
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000758applies.
759\end{cfuncdesc}
760
Fred Drake659ebfa2000-04-03 15:42:13 +0000761The following functions or macros are only for use within the
762interpreter core: \cfunction{_Py_Dealloc()},
763\cfunction{_Py_ForgetReference()}, \cfunction{_Py_NewReference()}, as
764well as the global variable \cdata{_Py_RefTotal}.
Guido van Rossum580aa8d1997-11-25 15:34:51 +0000765
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000766
Fred Drakeefd146c1999-02-15 15:30:45 +0000767\chapter{Exception Handling \label{exceptionHandling}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000768
Fred Drake659ebfa2000-04-03 15:42:13 +0000769The functions described in this chapter will let you handle and raise Python
Guido van Rossumae110af1997-05-22 20:11:52 +0000770exceptions. It is important to understand some of the basics of
Fred Drake659ebfa2000-04-03 15:42:13 +0000771Python exception handling. It works somewhat like the
772\UNIX{} \cdata{errno} variable: there is a global indicator (per
773thread) of the last error that occurred. Most functions don't clear
774this on success, but will set it to indicate the cause of the error on
775failure. Most functions also return an error indicator, usually
776\NULL{} if they are supposed to return a pointer, or \code{-1} if they
777return an integer (exception: the \cfunction{PyArg_Parse*()} functions
778return \code{1} for success and \code{0} for failure). When a
779function must fail because some function it called failed, it
780generally doesn't set the error indicator; the function it called
781already set it.
Guido van Rossumae110af1997-05-22 20:11:52 +0000782
783The error indicator consists of three Python objects corresponding to
Fred Drake659ebfa2000-04-03 15:42:13 +0000784\withsubitem{(in module sys)}{
785 \ttindex{exc_type}\ttindex{exc_value}\ttindex{exc_traceback}}
Guido van Rossumae110af1997-05-22 20:11:52 +0000786the Python variables \code{sys.exc_type}, \code{sys.exc_value} and
787\code{sys.exc_traceback}. API functions exist to interact with the
788error indicator in various ways. There is a separate error indicator
789for each thread.
790
791% XXX Order of these should be more thoughtful.
792% Either alphabetical or some kind of structure.
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000793
794\begin{cfuncdesc}{void}{PyErr_Print}{}
Guido van Rossumae110af1997-05-22 20:11:52 +0000795Print a standard traceback to \code{sys.stderr} and clear the error
796indicator. Call this function only when the error indicator is set.
797(Otherwise it will cause a fatal error!)
Guido van Rossum9231c8f1997-05-15 21:43:21 +0000798\end{cfuncdesc}
799
Fred Drakec6fa34e1998-04-02 06:47:24 +0000800\begin{cfuncdesc}{PyObject*}{PyErr_Occurred}{}
Guido van Rossumae110af1997-05-22 20:11:52 +0000801Test whether the error indicator is set. If set, return the exception
Fred Drakee058b4f1998-02-16 06:15:35 +0000802\emph{type} (the first argument to the last call to one of the
Fred Drakef8830d11998-04-23 14:06:01 +0000803\cfunction{PyErr_Set*()} functions or to \cfunction{PyErr_Restore()}). If
Fred Drakee058b4f1998-02-16 06:15:35 +0000804not set, return \NULL{}. You do not own a reference to the return
805value, so you do not need to \cfunction{Py_DECREF()} it.
Fred Drake659ebfa2000-04-03 15:42:13 +0000806\strong{Note:} Do not compare the return value to a specific
Fred Drakee058b4f1998-02-16 06:15:35 +0000807exception; use \cfunction{PyErr_ExceptionMatches()} instead, shown
Fred Drake659ebfa2000-04-03 15:42:13 +0000808below. (The comparison could easily fail since the exception may be
809an instance instead of a class, in the case of a class exception, or
810it may the a subclass of the expected exception.)
Guido van Rossum42cefd01997-10-05 15:27:29 +0000811\end{cfuncdesc}
812
813\begin{cfuncdesc}{int}{PyErr_ExceptionMatches}{PyObject *exc}
Guido van Rossum42cefd01997-10-05 15:27:29 +0000814Equivalent to
Fred Drakee058b4f1998-02-16 06:15:35 +0000815\samp{PyErr_GivenExceptionMatches(PyErr_Occurred(), \var{exc})}.
Fred Drake659ebfa2000-04-03 15:42:13 +0000816This should only be called when an exception is actually set; a memory
817access violation will occur if no exception has been raised.
Guido van Rossum42cefd01997-10-05 15:27:29 +0000818\end{cfuncdesc}
819
820\begin{cfuncdesc}{int}{PyErr_GivenExceptionMatches}{PyObject *given, PyObject *exc}
Guido van Rossum42cefd01997-10-05 15:27:29 +0000821Return true if the \var{given} exception matches the exception in
822\var{exc}. If \var{exc} is a class object, this also returns true
Fred Drake659ebfa2000-04-03 15:42:13 +0000823when \var{given} is an instance of a subclass. If \var{exc} is a tuple, all
Guido van Rossum42cefd01997-10-05 15:27:29 +0000824exceptions in the tuple (and recursively in subtuples) are searched
Fred Drake659ebfa2000-04-03 15:42:13 +0000825for a match. If \var{given} is \NULL, a memory access violation will
826occur.
Guido van Rossum42cefd01997-10-05 15:27:29 +0000827\end{cfuncdesc}
828
829\begin{cfuncdesc}{void}{PyErr_NormalizeException}{PyObject**exc, PyObject**val, PyObject**tb}
Guido van Rossum42cefd01997-10-05 15:27:29 +0000830Under certain circumstances, the values returned by
Fred Drakee058b4f1998-02-16 06:15:35 +0000831\cfunction{PyErr_Fetch()} below can be ``unnormalized'', meaning that
832\code{*\var{exc}} is a class object but \code{*\var{val}} is not an
833instance of the same class. This function can be used to instantiate
834the class in that case. If the values are already normalized, nothing
Fred Drake659ebfa2000-04-03 15:42:13 +0000835happens. The delayed normalization is implemented to improve
836performance.
Guido van Rossumae110af1997-05-22 20:11:52 +0000837\end{cfuncdesc}
838
839\begin{cfuncdesc}{void}{PyErr_Clear}{}
840Clear the error indicator. If the error indicator is not set, there
841is no effect.
842\end{cfuncdesc}
843
Fred Drake659ebfa2000-04-03 15:42:13 +0000844\begin{cfuncdesc}{void}{PyErr_Fetch}{PyObject **ptype, PyObject **pvalue,
845 PyObject **ptraceback}
Guido van Rossumae110af1997-05-22 20:11:52 +0000846Retrieve the error indicator into three variables whose addresses are
847passed. If the error indicator is not set, set all three variables to
848\NULL{}. If it is set, it will be cleared and you own a reference to
Fred Drake659ebfa2000-04-03 15:42:13 +0000849each object retrieved. The value and traceback object may be
850\NULL{} even when the type object is not. \strong{Note:} This
851function is normally only used by code that needs to handle exceptions
852or by code that needs to save and restore the error indicator
853temporarily.
Guido van Rossumae110af1997-05-22 20:11:52 +0000854\end{cfuncdesc}
855
Fred Drake17e63432000-08-31 05:50:40 +0000856\begin{cfuncdesc}{void}{PyErr_Restore}{PyObject *type, PyObject *value,
857 PyObject *traceback}
Guido van Rossumae110af1997-05-22 20:11:52 +0000858Set the error indicator from the three objects. If the error
859indicator is already set, it is cleared first. If the objects are
860\NULL{}, the error indicator is cleared. Do not pass a \NULL{} type
861and non-\NULL{} value or traceback. The exception type should be a
862string or class; if it is a class, the value should be an instance of
863that class. Do not pass an invalid exception type or value.
864(Violating these rules will cause subtle problems later.) This call
Fred Drake17e63432000-08-31 05:50:40 +0000865takes away a reference to each object, i.e.\ you must own a reference
Guido van Rossumae110af1997-05-22 20:11:52 +0000866to each object before the call and after the call you no longer own
867these references. (If you don't understand this, don't use this
Fred Drake659ebfa2000-04-03 15:42:13 +0000868function. I warned you.) \strong{Note:} This function is normally
Guido van Rossumae110af1997-05-22 20:11:52 +0000869only used by code that needs to save and restore the error indicator
870temporarily.
871\end{cfuncdesc}
872
873\begin{cfuncdesc}{void}{PyErr_SetString}{PyObject *type, char *message}
874This is the most common way to set the error indicator. The first
875argument specifies the exception type; it is normally one of the
Fred Drakef8830d11998-04-23 14:06:01 +0000876standard exceptions, e.g. \cdata{PyExc_RuntimeError}. You need not
Guido van Rossumae110af1997-05-22 20:11:52 +0000877increment its reference count. The second argument is an error
878message; it is converted to a string object.
879\end{cfuncdesc}
880
881\begin{cfuncdesc}{void}{PyErr_SetObject}{PyObject *type, PyObject *value}
Fred Drakee058b4f1998-02-16 06:15:35 +0000882This function is similar to \cfunction{PyErr_SetString()} but lets you
Guido van Rossumae110af1997-05-22 20:11:52 +0000883specify an arbitrary Python object for the ``value'' of the exception.
884You need not increment its reference count.
885\end{cfuncdesc}
886
Fred Drake73577702000-04-10 18:50:14 +0000887\begin{cfuncdesc}{PyObject*}{PyErr_Format}{PyObject *exception,
Moshe Zadka57a59322000-09-01 09:47:20 +0000888 const char *format, \moreargs}
Fred Drake89fb0352000-10-14 05:49:30 +0000889This function sets the error indicator. \var{exception} should be a
890Python exception (string or class, not an instance).
Fred Drake5566c1c2001-01-19 22:48:33 +0000891\var{format} should be a string, containing format codes, similar to
Moshe Zadka57a59322000-09-01 09:47:20 +0000892\cfunction{printf}. The \code{width.precision} before a format code
893is parsed, but the width part is ignored.
894
895\begin{tableii}{c|l}{character}{Character}{Meaning}
896 \lineii{c}{Character, as an \ctype{int} parameter}
897 \lineii{d}{Number in decimal, as an \ctype{int} parameter}
898 \lineii{x}{Number in hexadecimal, as an \ctype{int} parameter}
899 \lineii{x}{A string, as a \ctype{char *} parameter}
900\end{tableii}
901
902An unrecognized format character causes all the rest of
903the format string to be copied as-is to the result string,
904and any extra arguments discarded.
905
906A new reference is returned, which is owned by the caller.
Jeremy Hylton98605b52000-04-10 18:40:57 +0000907\end{cfuncdesc}
908
Guido van Rossumae110af1997-05-22 20:11:52 +0000909\begin{cfuncdesc}{void}{PyErr_SetNone}{PyObject *type}
Fred Drakee058b4f1998-02-16 06:15:35 +0000910This is a shorthand for \samp{PyErr_SetObject(\var{type}, Py_None)}.
Guido van Rossumae110af1997-05-22 20:11:52 +0000911\end{cfuncdesc}
912
913\begin{cfuncdesc}{int}{PyErr_BadArgument}{}
Fred Drakee058b4f1998-02-16 06:15:35 +0000914This is a shorthand for \samp{PyErr_SetString(PyExc_TypeError,
Guido van Rossumae110af1997-05-22 20:11:52 +0000915\var{message})}, where \var{message} indicates that a built-in operation
916was invoked with an illegal argument. It is mostly for internal use.
917\end{cfuncdesc}
918
Fred Drakec6fa34e1998-04-02 06:47:24 +0000919\begin{cfuncdesc}{PyObject*}{PyErr_NoMemory}{}
Fred Drakee058b4f1998-02-16 06:15:35 +0000920This is a shorthand for \samp{PyErr_SetNone(PyExc_MemoryError)}; it
Guido van Rossumae110af1997-05-22 20:11:52 +0000921returns \NULL{} so an object allocation function can write
Fred Drakee058b4f1998-02-16 06:15:35 +0000922\samp{return PyErr_NoMemory();} when it runs out of memory.
Guido van Rossumae110af1997-05-22 20:11:52 +0000923\end{cfuncdesc}
924
Fred Drakec6fa34e1998-04-02 06:47:24 +0000925\begin{cfuncdesc}{PyObject*}{PyErr_SetFromErrno}{PyObject *type}
Fred Drake659ebfa2000-04-03 15:42:13 +0000926This is a convenience function to raise an exception when a C library
927function has returned an error and set the C variable \cdata{errno}.
Guido van Rossumae110af1997-05-22 20:11:52 +0000928It constructs a tuple object whose first item is the integer
Fred Drakef8830d11998-04-23 14:06:01 +0000929\cdata{errno} value and whose second item is the corresponding error
Fred Drake659ebfa2000-04-03 15:42:13 +0000930message (gotten from \cfunction{strerror()}\ttindex{strerror()}), and
931then calls
Fred Drakee058b4f1998-02-16 06:15:35 +0000932\samp{PyErr_SetObject(\var{type}, \var{object})}. On \UNIX{}, when
Fred Drakef8830d11998-04-23 14:06:01 +0000933the \cdata{errno} value is \constant{EINTR}, indicating an interrupted
Fred Drakee058b4f1998-02-16 06:15:35 +0000934system call, this calls \cfunction{PyErr_CheckSignals()}, and if that set
Guido van Rossumae110af1997-05-22 20:11:52 +0000935the error indicator, leaves it set to that. The function always
936returns \NULL{}, so a wrapper function around a system call can write
Fred Drakee058b4f1998-02-16 06:15:35 +0000937\samp{return PyErr_SetFromErrno();} when the system call returns an
938error.
Guido van Rossumae110af1997-05-22 20:11:52 +0000939\end{cfuncdesc}
940
941\begin{cfuncdesc}{void}{PyErr_BadInternalCall}{}
Fred Drakee058b4f1998-02-16 06:15:35 +0000942This is a shorthand for \samp{PyErr_SetString(PyExc_TypeError,
Guido van Rossumae110af1997-05-22 20:11:52 +0000943\var{message})}, where \var{message} indicates that an internal
Guido van Rossum5060b3b1997-08-17 18:02:23 +0000944operation (e.g. a Python/C API function) was invoked with an illegal
Guido van Rossumae110af1997-05-22 20:11:52 +0000945argument. It is mostly for internal use.
946\end{cfuncdesc}
947
Guido van Rossum3dbb4062000-12-19 03:53:01 +0000948\begin{cfuncdesc}{int}{PyErr_Warn}{PyObject *category, char *message}
949Issue a warning message. The \var{category} argument is a warning
Fred Drake5566c1c2001-01-19 22:48:33 +0000950category (see below) or \NULL; the \var{message} argument is a message
Guido van Rossum3dbb4062000-12-19 03:53:01 +0000951string.
952
953This function normally prints a warning message to \var{sys.stderr};
954however, it is also possible that the user has specified that warnings
955are to be turned into errors, and in that case this will raise an
956exception. It is also possible that the function raises an exception
957because of a problem with the warning machinery (the implementation
958imports the \module{warnings} module to do the heavy lifting). The
959return value is \code{0} if no exception is raised, or \code{-1} if
960an exception is raised. (It is not possible to determine whether a
961warning message is actually printed, nor what the reason is for the
962exception; this is intentional.) If an exception is raised, the
Fred Drake5566c1c2001-01-19 22:48:33 +0000963caller should do its normal exception handling
964(e.g. \cfunction{Py_DECREF()} owned references and return an error
965value).
Guido van Rossum3dbb4062000-12-19 03:53:01 +0000966
967Warning categories must be subclasses of \cdata{Warning}; the default
968warning category is \cdata{RuntimeWarning}. The standard Python
969warning categories are available as global variables whose names are
970\samp{PyExc_} followed by the Python exception name. These have the
971type \ctype{PyObject*}; they are all class objects. Their names are
972\cdata{PyExc_Warning}, \cdata{PyExc_UserWarning},
973\cdata{PyExc_DeprecationWarning}, \cdata{PyExc_SyntaxWarning}, and
974\cdata{PyExc_RuntimeWarning}. \cdata{PyExc_Warning} is a subclass of
975\cdata{PyExc_Exception}; the other warning categories are subclasses
976of \cdata{PyExc_Warning}.
977
978For information about warning control, see the documentation for the
Fred Drake316ef7c2001-01-04 05:56:34 +0000979\module{warnings} module and the \programopt{-W} option in the command
980line documentation. There is no C API for warning control.
Guido van Rossum3dbb4062000-12-19 03:53:01 +0000981\end{cfuncdesc}
982
Guido van Rossum1874c8f2001-02-28 23:46:44 +0000983\begin{cfuncdesc}{int}{PyErr_WarnExplicit}{PyObject *category, char *message,
984char *filename, int lineno, char *module, PyObject *registry}
985Issue a warning message with explicit control over all warning
986attributes. This is a straightforward wrapper around the Python
987function \function{warnings.warn_explicit()}, see there for more
988information. The \var{module} and \var{registry} arguments may be
989set to \code{NULL} to get the default effect described there.
990\end{cfuncdesc}
991
Guido van Rossumae110af1997-05-22 20:11:52 +0000992\begin{cfuncdesc}{int}{PyErr_CheckSignals}{}
993This function interacts with Python's signal handling. It checks
994whether a signal has been sent to the processes and if so, invokes the
Fred Drake4de05a91998-02-16 14:25:26 +0000995corresponding signal handler. If the
996\module{signal}\refbimodindex{signal} module is supported, this can
997invoke a signal handler written in Python. In all cases, the default
Fred Drake659ebfa2000-04-03 15:42:13 +0000998effect for \constant{SIGINT}\ttindex{SIGINT} is to raise the
999\withsubitem{(built-in exception)}{\ttindex{KeyboardInterrupt}}
1000\exception{KeyboardInterrupt} exception. If an exception is raised the
Fred Drakee058b4f1998-02-16 06:15:35 +00001001error indicator is set and the function returns \code{1}; otherwise
1002the function returns \code{0}. The error indicator may or may not be
1003cleared if it was previously set.
Guido van Rossumae110af1997-05-22 20:11:52 +00001004\end{cfuncdesc}
1005
1006\begin{cfuncdesc}{void}{PyErr_SetInterrupt}{}
Fred Drake659ebfa2000-04-03 15:42:13 +00001007This function is obsolete. It simulates the effect of a
1008\constant{SIGINT}\ttindex{SIGINT} signal arriving --- the next time
Fred Drakee058b4f1998-02-16 06:15:35 +00001009\cfunction{PyErr_CheckSignals()} is called,
Fred Drake659ebfa2000-04-03 15:42:13 +00001010\withsubitem{(built-in exception)}{\ttindex{KeyboardInterrupt}}
1011\exception{KeyboardInterrupt} will be raised.
1012It may be called without holding the interpreter lock.
Guido van Rossumae110af1997-05-22 20:11:52 +00001013\end{cfuncdesc}
1014
Fred Drakec6fa34e1998-04-02 06:47:24 +00001015\begin{cfuncdesc}{PyObject*}{PyErr_NewException}{char *name,
1016 PyObject *base,
1017 PyObject *dict}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001018This utility function creates and returns a new exception object. The
Fred Drake659ebfa2000-04-03 15:42:13 +00001019\var{name} argument must be the name of the new exception, a C string
1020of the form \code{module.class}. The \var{base} and
Fred Draked04038d2000-06-29 20:15:14 +00001021\var{dict} arguments are normally \NULL{}. This creates a
Fred Drake659ebfa2000-04-03 15:42:13 +00001022class object derived from the root for all exceptions, the built-in
1023name \exception{Exception} (accessible in C as
Fred Draked04038d2000-06-29 20:15:14 +00001024\cdata{PyExc_Exception}). The \member{__module__} attribute of the
1025new class is set to the first part (up to the last dot) of the
1026\var{name} argument, and the class name is set to the last part (after
1027the last dot). The \var{base} argument can be used to specify an
1028alternate base class. The \var{dict} argument can be used to specify
1029a dictionary of class variables and methods.
Guido van Rossum42cefd01997-10-05 15:27:29 +00001030\end{cfuncdesc}
1031
Jeremy Hyltonb709df32000-09-01 02:47:25 +00001032\begin{cfuncdesc}{void}{PyErr_WriteUnraisable}{PyObject *obj}
1033This utility function prints a warning message to \var{sys.stderr}
1034when an exception has been set but it is impossible for the
1035interpreter to actually raise the exception. It is used, for example,
1036when an exception occurs in an \member{__del__} method.
1037
1038The function is called with a single argument \var{obj} that
1039identifies where the context in which the unraisable exception
1040occurred. The repr of \var{obj} will be printed in the warning
1041message.
1042\end{cfuncdesc}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001043
Fred Drakeefd146c1999-02-15 15:30:45 +00001044\section{Standard Exceptions \label{standardExceptions}}
Guido van Rossumae110af1997-05-22 20:11:52 +00001045
1046All standard Python exceptions are available as global variables whose
Fred Drake659ebfa2000-04-03 15:42:13 +00001047names are \samp{PyExc_} followed by the Python exception name. These
1048have the type \ctype{PyObject*}; they are all class objects. For
1049completeness, here are all the variables:
1050
1051\begin{tableiii}{l|l|c}{cdata}{C Name}{Python Name}{Notes}
1052 \lineiii{PyExc_Exception}{\exception{Exception}}{(1)}
1053 \lineiii{PyExc_StandardError}{\exception{StandardError}}{(1)}
1054 \lineiii{PyExc_ArithmeticError}{\exception{ArithmeticError}}{(1)}
1055 \lineiii{PyExc_LookupError}{\exception{LookupError}}{(1)}
1056 \lineiii{PyExc_AssertionError}{\exception{AssertionError}}{}
1057 \lineiii{PyExc_AttributeError}{\exception{AttributeError}}{}
1058 \lineiii{PyExc_EOFError}{\exception{EOFError}}{}
1059 \lineiii{PyExc_EnvironmentError}{\exception{EnvironmentError}}{(1)}
1060 \lineiii{PyExc_FloatingPointError}{\exception{FloatingPointError}}{}
1061 \lineiii{PyExc_IOError}{\exception{IOError}}{}
1062 \lineiii{PyExc_ImportError}{\exception{ImportError}}{}
1063 \lineiii{PyExc_IndexError}{\exception{IndexError}}{}
1064 \lineiii{PyExc_KeyError}{\exception{KeyError}}{}
1065 \lineiii{PyExc_KeyboardInterrupt}{\exception{KeyboardInterrupt}}{}
1066 \lineiii{PyExc_MemoryError}{\exception{MemoryError}}{}
1067 \lineiii{PyExc_NameError}{\exception{NameError}}{}
1068 \lineiii{PyExc_NotImplementedError}{\exception{NotImplementedError}}{}
1069 \lineiii{PyExc_OSError}{\exception{OSError}}{}
1070 \lineiii{PyExc_OverflowError}{\exception{OverflowError}}{}
1071 \lineiii{PyExc_RuntimeError}{\exception{RuntimeError}}{}
1072 \lineiii{PyExc_SyntaxError}{\exception{SyntaxError}}{}
1073 \lineiii{PyExc_SystemError}{\exception{SystemError}}{}
1074 \lineiii{PyExc_SystemExit}{\exception{SystemExit}}{}
1075 \lineiii{PyExc_TypeError}{\exception{TypeError}}{}
1076 \lineiii{PyExc_ValueError}{\exception{ValueError}}{}
Fred Drakea8d73412000-08-11 20:39:29 +00001077 \lineiii{PyExc_WindowsError}{\exception{WindowsError}}{(2)}
Fred Drake659ebfa2000-04-03 15:42:13 +00001078 \lineiii{PyExc_ZeroDivisionError}{\exception{ZeroDivisionError}}{}
1079\end{tableiii}
1080
1081\noindent
Fred Drakea8d73412000-08-11 20:39:29 +00001082Notes:
Fred Drake659ebfa2000-04-03 15:42:13 +00001083\begin{description}
1084\item[(1)]
Fred Draked04038d2000-06-29 20:15:14 +00001085 This is a base class for other standard exceptions.
Fred Drakea8d73412000-08-11 20:39:29 +00001086
1087\item[(2)]
1088 Only defined on Windows; protect code that uses this by testing that
1089 the preprocessor macro \code{MS_WINDOWS} is defined.
Fred Drake659ebfa2000-04-03 15:42:13 +00001090\end{description}
1091
1092
1093\section{Deprecation of String Exceptions}
1094
Fred Draked04038d2000-06-29 20:15:14 +00001095All exceptions built into Python or provided in the standard library
1096are derived from \exception{Exception}.
Fred Drake659ebfa2000-04-03 15:42:13 +00001097\withsubitem{(built-in exception)}{\ttindex{Exception}}
Fred Drake659ebfa2000-04-03 15:42:13 +00001098
Fred Draked04038d2000-06-29 20:15:14 +00001099String exceptions are still supported in the interpreter to allow
Fred Drake659ebfa2000-04-03 15:42:13 +00001100existing code to run unmodified, but this will also change in a future
1101release.
Guido van Rossumae110af1997-05-22 20:11:52 +00001102
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001103
Fred Drakeefd146c1999-02-15 15:30:45 +00001104\chapter{Utilities \label{utilities}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001105
1106The functions in this chapter perform various utility tasks, such as
Fred Drake659ebfa2000-04-03 15:42:13 +00001107parsing function arguments and constructing Python values from C
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001108values.
1109
Fred Drakeefd146c1999-02-15 15:30:45 +00001110\section{OS Utilities \label{os}}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001111
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001112\begin{cfuncdesc}{int}{Py_FdIsInteractive}{FILE *fp, char *filename}
Fred Drakee058b4f1998-02-16 06:15:35 +00001113Return true (nonzero) if the standard I/O file \var{fp} with name
1114\var{filename} is deemed interactive. This is the case for files for
1115which \samp{isatty(fileno(\var{fp}))} is true. If the global flag
Fred Drakef8830d11998-04-23 14:06:01 +00001116\cdata{Py_InteractiveFlag} is true, this function also returns true if
Fred Drake5566c1c2001-01-19 22:48:33 +00001117the \var{filename} pointer is \NULL{} or if the name is equal to one of
Fred Drakea8455ab2000-06-16 19:58:42 +00001118the strings \code{'<stdin>'} or \code{'???'}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001119\end{cfuncdesc}
1120
1121\begin{cfuncdesc}{long}{PyOS_GetLastModificationTime}{char *filename}
Fred Drakee058b4f1998-02-16 06:15:35 +00001122Return the time of last modification of the file \var{filename}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001123The result is encoded in the same way as the timestamp returned by
Fred Drake659ebfa2000-04-03 15:42:13 +00001124the standard C library function \cfunction{time()}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001125\end{cfuncdesc}
1126
Fred Drakecabbc3b2000-06-28 15:53:13 +00001127\begin{cfuncdesc}{void}{PyOS_AfterFork}{}
1128Function to update some internal state after a process fork; this
1129should be called in the new process if the Python interpreter will
1130continue to be used. If a new executable is loaded into the new
1131process, this function does not need to be called.
1132\end{cfuncdesc}
1133
Fred Drake17e63432000-08-31 05:50:40 +00001134\begin{cfuncdesc}{int}{PyOS_CheckStack}{}
1135Return true when the interpreter runs out of stack space. This is a
1136reliable check, but is only available when \code{USE_STACKCHECK} is
1137defined (currently on Windows using the Microsoft Visual C++ compiler
1138and on the Macintosh). \code{USE_CHECKSTACK} will be defined
1139automatically; you should never change the definition in your own
1140code.
1141\end{cfuncdesc}
1142
Guido van Rossumc96ec6e2000-09-16 16:30:48 +00001143\begin{cfuncdesc}{PyOS_sighandler_t}{PyOS_getsig}{int i}
1144Return the current signal handler for signal \var{i}.
1145This is a thin wrapper around either \cfunction{sigaction} or
1146\cfunction{signal}. Do not call those functions directly!
1147\ctype{PyOS_sighandler_t} is a typedef alias for \ctype{void (*)(int)}.
1148\end{cfuncdesc}
1149
1150\begin{cfuncdesc}{PyOS_sighandler_t}{PyOS_setsig}{int i, PyOS_sighandler_t h}
1151Set the signal handler for signal \var{i} to be \var{h};
1152return the old signal handler.
1153This is a thin wrapper around either \cfunction{sigaction} or
1154\cfunction{signal}. Do not call those functions directly!
1155\ctype{PyOS_sighandler_t} is a typedef alias for \ctype{void (*)(int)}.
1156\end{cfuncdesc}
1157
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001158
Fred Drakeefd146c1999-02-15 15:30:45 +00001159\section{Process Control \label{processControl}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00001160
1161\begin{cfuncdesc}{void}{Py_FatalError}{char *message}
1162Print a fatal error message and kill the process. No cleanup is
1163performed. This function should only be invoked when a condition is
1164detected that would make it dangerous to continue using the Python
1165interpreter; e.g., when the object administration appears to be
Fred Drake659ebfa2000-04-03 15:42:13 +00001166corrupted. On \UNIX{}, the standard C library function
1167\cfunction{abort()}\ttindex{abort()} is called which will attempt to
1168produce a \file{core} file.
Fred Drakee5bf8b21998-02-12 21:22:28 +00001169\end{cfuncdesc}
1170
1171\begin{cfuncdesc}{void}{Py_Exit}{int status}
Fred Drake659ebfa2000-04-03 15:42:13 +00001172Exit the current process. This calls
1173\cfunction{Py_Finalize()}\ttindex{Py_Finalize()} and
1174then calls the standard C library function
1175\code{exit(\var{status})}\ttindex{exit()}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00001176\end{cfuncdesc}
1177
1178\begin{cfuncdesc}{int}{Py_AtExit}{void (*func) ()}
Fred Drake659ebfa2000-04-03 15:42:13 +00001179Register a cleanup function to be called by
1180\cfunction{Py_Finalize()}\ttindex{Py_Finalize()}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00001181The cleanup function will be called with no arguments and should
Fred Drake659ebfa2000-04-03 15:42:13 +00001182return no value. At most 32 \index{cleanup functions}cleanup
1183functions can be registered.
Fred Drakee5bf8b21998-02-12 21:22:28 +00001184When the registration is successful, \cfunction{Py_AtExit()} returns
1185\code{0}; on failure, it returns \code{-1}. The cleanup function
1186registered last is called first. Each cleanup function will be called
1187at most once. Since Python's internal finallization will have
1188completed before the cleanup function, no Python APIs should be called
1189by \var{func}.
1190\end{cfuncdesc}
1191
1192
Fred Drakeefd146c1999-02-15 15:30:45 +00001193\section{Importing Modules \label{importing}}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001194
Fred Drakec6fa34e1998-04-02 06:47:24 +00001195\begin{cfuncdesc}{PyObject*}{PyImport_ImportModule}{char *name}
Fred Drake659ebfa2000-04-03 15:42:13 +00001196This is a simplified interface to
1197\cfunction{PyImport_ImportModuleEx()} below, leaving the
1198\var{globals} and \var{locals} arguments set to \NULL{}. When the
1199\var{name} argument contains a dot (i.e., when it specifies a
1200submodule of a package), the \var{fromlist} argument is set to the
1201list \code{['*']} so that the return value is the named module rather
1202than the top-level package containing it as would otherwise be the
1203case. (Unfortunately, this has an additional side effect when
1204\var{name} in fact specifies a subpackage instead of a submodule: the
1205submodules specified in the package's \code{__all__} variable are
1206\index{package variable!\code{__all__}}
1207\withsubitem{(package variable)}{\ttindex{__all__}}loaded.) Return a
1208new reference to the imported module, or
1209\NULL{} with an exception set on failure (the module may still be
1210created in this case --- examine \code{sys.modules} to find out).
1211\withsubitem{(in module sys)}{\ttindex{modules}}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001212\end{cfuncdesc}
1213
Fred Drakec6fa34e1998-04-02 06:47:24 +00001214\begin{cfuncdesc}{PyObject*}{PyImport_ImportModuleEx}{char *name, PyObject *globals, PyObject *locals, PyObject *fromlist}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001215Import a module. This is best described by referring to the built-in
Fred Drake53fb7721998-02-16 06:23:20 +00001216Python function \function{__import__()}\bifuncindex{__import__}, as
1217the standard \function{__import__()} function calls this function
1218directly.
Guido van Rossum42cefd01997-10-05 15:27:29 +00001219
Guido van Rossum42cefd01997-10-05 15:27:29 +00001220The return value is a new reference to the imported module or
Guido van Rossum580aa8d1997-11-25 15:34:51 +00001221top-level package, or \NULL{} with an exception set on failure
Guido van Rossumc44d3d61997-10-06 05:10:47 +00001222(the module may still be created in this case). Like for
Fred Drakee058b4f1998-02-16 06:15:35 +00001223\function{__import__()}, the return value when a submodule of a
1224package was requested is normally the top-level package, unless a
1225non-empty \var{fromlist} was given.
Guido van Rossum42cefd01997-10-05 15:27:29 +00001226\end{cfuncdesc}
1227
Fred Drakec6fa34e1998-04-02 06:47:24 +00001228\begin{cfuncdesc}{PyObject*}{PyImport_Import}{PyObject *name}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001229This is a higher-level interface that calls the current ``import hook
Fred Drakee058b4f1998-02-16 06:15:35 +00001230function''. It invokes the \function{__import__()} function from the
Guido van Rossum42cefd01997-10-05 15:27:29 +00001231\code{__builtins__} of the current globals. This means that the
1232import is done using whatever import hooks are installed in the
Fred Drake4de05a91998-02-16 14:25:26 +00001233current environment, e.g. by \module{rexec}\refstmodindex{rexec} or
1234\module{ihooks}\refstmodindex{ihooks}.
Guido van Rossum42cefd01997-10-05 15:27:29 +00001235\end{cfuncdesc}
1236
Fred Drakec6fa34e1998-04-02 06:47:24 +00001237\begin{cfuncdesc}{PyObject*}{PyImport_ReloadModule}{PyObject *m}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001238Reload a module. This is best described by referring to the built-in
Fred Drake53fb7721998-02-16 06:23:20 +00001239Python function \function{reload()}\bifuncindex{reload}, as the standard
Fred Drakee058b4f1998-02-16 06:15:35 +00001240\function{reload()} function calls this function directly. Return a
1241new reference to the reloaded module, or \NULL{} with an exception set
1242on failure (the module still exists in this case).
Guido van Rossum42cefd01997-10-05 15:27:29 +00001243\end{cfuncdesc}
1244
Fred Drakec6fa34e1998-04-02 06:47:24 +00001245\begin{cfuncdesc}{PyObject*}{PyImport_AddModule}{char *name}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001246Return the module object corresponding to a module name. The
1247\var{name} argument may be of the form \code{package.module}). First
1248check the modules dictionary if there's one there, and if not, create
Fred Drake659ebfa2000-04-03 15:42:13 +00001249a new one and insert in in the modules dictionary.
Guido van Rossuma096a2e1998-11-02 17:02:42 +00001250Warning: this function does not load or import the module; if the
1251module wasn't already loaded, you will get an empty module object.
1252Use \cfunction{PyImport_ImportModule()} or one of its variants to
1253import a module.
Fred Drake659ebfa2000-04-03 15:42:13 +00001254Return \NULL{} with an exception set on failure.
Guido van Rossum42cefd01997-10-05 15:27:29 +00001255\end{cfuncdesc}
1256
Fred Drakec6fa34e1998-04-02 06:47:24 +00001257\begin{cfuncdesc}{PyObject*}{PyImport_ExecCodeModule}{char *name, PyObject *co}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001258Given a module name (possibly of the form \code{package.module}) and a
1259code object read from a Python bytecode file or obtained from the
Fred Drake53fb7721998-02-16 06:23:20 +00001260built-in function \function{compile()}\bifuncindex{compile}, load the
1261module. Return a new reference to the module object, or \NULL{} with
1262an exception set if an error occurred (the module may still be created
1263in this case). (This function would reload the module if it was
1264already imported.)
Guido van Rossum42cefd01997-10-05 15:27:29 +00001265\end{cfuncdesc}
1266
1267\begin{cfuncdesc}{long}{PyImport_GetMagicNumber}{}
Fred Drake659ebfa2000-04-03 15:42:13 +00001268Return the magic number for Python bytecode files (a.k.a.
1269\file{.pyc} and \file{.pyo} files). The magic number should be
1270present in the first four bytes of the bytecode file, in little-endian
1271byte order.
Guido van Rossum42cefd01997-10-05 15:27:29 +00001272\end{cfuncdesc}
1273
Fred Drakec6fa34e1998-04-02 06:47:24 +00001274\begin{cfuncdesc}{PyObject*}{PyImport_GetModuleDict}{}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001275Return the dictionary used for the module administration
1276(a.k.a. \code{sys.modules}). Note that this is a per-interpreter
1277variable.
1278\end{cfuncdesc}
1279
1280\begin{cfuncdesc}{void}{_PyImport_Init}{}
1281Initialize the import mechanism. For internal use only.
1282\end{cfuncdesc}
1283
1284\begin{cfuncdesc}{void}{PyImport_Cleanup}{}
1285Empty the module table. For internal use only.
1286\end{cfuncdesc}
1287
1288\begin{cfuncdesc}{void}{_PyImport_Fini}{}
1289Finalize the import mechanism. For internal use only.
1290\end{cfuncdesc}
1291
Fred Drakec6fa34e1998-04-02 06:47:24 +00001292\begin{cfuncdesc}{PyObject*}{_PyImport_FindExtension}{char *, char *}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001293For internal use only.
Guido van Rossum5b8a5231997-12-30 04:38:44 +00001294\end{cfuncdesc}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001295
Fred Drakec6fa34e1998-04-02 06:47:24 +00001296\begin{cfuncdesc}{PyObject*}{_PyImport_FixupExtension}{char *, char *}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001297For internal use only.
Guido van Rossum5b8a5231997-12-30 04:38:44 +00001298\end{cfuncdesc}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001299
Fred Drake1d158692000-06-18 05:21:21 +00001300\begin{cfuncdesc}{int}{PyImport_ImportFrozenModule}{char *name}
1301Load a frozen module named \var{name}. Return \code{1} for success,
1302\code{0} if the module is not found, and \code{-1} with an exception
1303set if the initialization failed. To access the imported module on a
1304successful load, use \cfunction{PyImport_ImportModule()}.
Fred Drakee058b4f1998-02-16 06:15:35 +00001305(Note the misnomer --- this function would reload the module if it was
Guido van Rossum42cefd01997-10-05 15:27:29 +00001306already imported.)
1307\end{cfuncdesc}
1308
Fred Drake659ebfa2000-04-03 15:42:13 +00001309\begin{ctypedesc}[_frozen]{struct _frozen}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001310This is the structure type definition for frozen module descriptors,
Fred Drakec6fa34e1998-04-02 06:47:24 +00001311as generated by the \program{freeze}\index{freeze utility} utility
1312(see \file{Tools/freeze/} in the Python source distribution). Its
Fred Drakee0d9a832000-09-01 05:30:00 +00001313definition, found in \file{Include/import.h}, is:
Fred Drakec6fa34e1998-04-02 06:47:24 +00001314
Guido van Rossum9faf4c51997-10-07 14:38:54 +00001315\begin{verbatim}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001316struct _frozen {
Fred Drake36fbe761997-10-13 18:18:33 +00001317 char *name;
1318 unsigned char *code;
1319 int size;
Guido van Rossum42cefd01997-10-05 15:27:29 +00001320};
Guido van Rossum9faf4c51997-10-07 14:38:54 +00001321\end{verbatim}
Guido van Rossum42cefd01997-10-05 15:27:29 +00001322\end{ctypedesc}
1323
Fred Drakec6fa34e1998-04-02 06:47:24 +00001324\begin{cvardesc}{struct _frozen*}{PyImport_FrozenModules}
Fred Drakef8830d11998-04-23 14:06:01 +00001325This pointer is initialized to point to an array of \ctype{struct
Fred Drake659ebfa2000-04-03 15:42:13 +00001326_frozen} records, terminated by one whose members are all
1327\NULL{} or zero. When a frozen module is imported, it is searched in
1328this table. Third-party code could play tricks with this to provide a
Guido van Rossum42cefd01997-10-05 15:27:29 +00001329dynamically created collection of frozen modules.
1330\end{cvardesc}
1331
Fred Drakee0d9a832000-09-01 05:30:00 +00001332\begin{cfuncdesc}{int}{PyImport_AppendInittab}{char *name,
1333 void (*initfunc)(void)}
1334Add a single module to the existing table of built-in modules. This
1335is a convenience wrapper around \cfunction{PyImport_ExtendInittab()},
1336returning \code{-1} if the table could not be extended. The new
1337module can be imported by the name \var{name}, and uses the function
1338\var{initfunc} as the initialization function called on the first
1339attempted import. This should be called before
1340\cfunction{Py_Initialize()}.
1341\end{cfuncdesc}
1342
1343\begin{ctypedesc}[_inittab]{struct _inittab}
1344Structure describing a single entry in the list of built-in modules.
1345Each of these structures gives the name and initialization function
1346for a module built into the interpreter. Programs which embed Python
1347may use an array of these structures in conjunction with
1348\cfunction{PyImport_ExtendInittab()} to provide additional built-in
1349modules. The structure is defined in \file{Include/import.h} as:
1350
1351\begin{verbatim}
1352struct _inittab {
1353 char *name;
1354 void (*initfunc)(void);
1355};
1356\end{verbatim}
1357\end{ctypedesc}
1358
1359\begin{cfuncdesc}{int}{PyImport_ExtendInittab}{struct _inittab *newtab}
1360Add a collection of modules to the table of built-in modules. The
1361\var{newtab} array must end with a sentinel entry which contains
1362\NULL{} for the \member{name} field; failure to provide the sentinel
1363value can result in a memory fault. Returns \code{0} on success or
1364\code{-1} if insufficient memory could be allocated to extend the
1365internal table. In the event of failure, no modules are added to the
1366internal table. This should be called before
1367\cfunction{Py_Initialize()}.
1368\end{cfuncdesc}
1369
Guido van Rossum42cefd01997-10-05 15:27:29 +00001370
Fred Drakeefd146c1999-02-15 15:30:45 +00001371\chapter{Abstract Objects Layer \label{abstract}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001372
1373The functions in this chapter interact with Python objects regardless
1374of their type, or with wide classes of object types (e.g. all
1375numerical types, or all sequence types). When used on object types
Fred Drake659ebfa2000-04-03 15:42:13 +00001376for which they do not apply, they will raise a Python exception.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001377
Fred Drakeefd146c1999-02-15 15:30:45 +00001378\section{Object Protocol \label{object}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001379
1380\begin{cfuncdesc}{int}{PyObject_Print}{PyObject *o, FILE *fp, int flags}
Fred Drake659ebfa2000-04-03 15:42:13 +00001381Print an object \var{o}, on file \var{fp}. Returns \code{-1} on error.
1382The flags argument is used to enable certain printing options. The
1383only option currently supported is \constant{Py_PRINT_RAW}; if given,
1384the \function{str()} of the object is written instead of the
1385\function{repr()}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001386\end{cfuncdesc}
1387
1388\begin{cfuncdesc}{int}{PyObject_HasAttrString}{PyObject *o, char *attr_name}
Fred Drakee058b4f1998-02-16 06:15:35 +00001389Returns \code{1} if \var{o} has the attribute \var{attr_name}, and
1390\code{0} otherwise. This is equivalent to the Python expression
1391\samp{hasattr(\var{o}, \var{attr_name})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001392This function always succeeds.
1393\end{cfuncdesc}
1394
Fred Drake659ebfa2000-04-03 15:42:13 +00001395\begin{cfuncdesc}{PyObject*}{PyObject_GetAttrString}{PyObject *o,
1396 char *attr_name}
Fred Drakee058b4f1998-02-16 06:15:35 +00001397Retrieve an attribute named \var{attr_name} from object \var{o}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001398Returns the attribute value on success, or \NULL{} on failure.
Fred Drakee058b4f1998-02-16 06:15:35 +00001399This is the equivalent of the Python expression
1400\samp{\var{o}.\var{attr_name}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001401\end{cfuncdesc}
1402
1403
1404\begin{cfuncdesc}{int}{PyObject_HasAttr}{PyObject *o, PyObject *attr_name}
Fred Drakee058b4f1998-02-16 06:15:35 +00001405Returns \code{1} if \var{o} has the attribute \var{attr_name}, and
1406\code{0} otherwise. This is equivalent to the Python expression
1407\samp{hasattr(\var{o}, \var{attr_name})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001408This function always succeeds.
1409\end{cfuncdesc}
1410
1411
Fred Drake659ebfa2000-04-03 15:42:13 +00001412\begin{cfuncdesc}{PyObject*}{PyObject_GetAttr}{PyObject *o,
1413 PyObject *attr_name}
Fred Drakee058b4f1998-02-16 06:15:35 +00001414Retrieve an attribute named \var{attr_name} from object \var{o}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001415Returns the attribute value on success, or \NULL{} on failure.
Fred Drakee058b4f1998-02-16 06:15:35 +00001416This is the equivalent of the Python expression
1417\samp{\var{o}.\var{attr_name}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001418\end{cfuncdesc}
1419
1420
1421\begin{cfuncdesc}{int}{PyObject_SetAttrString}{PyObject *o, char *attr_name, PyObject *v}
Fred Drakee058b4f1998-02-16 06:15:35 +00001422Set the value of the attribute named \var{attr_name}, for object
1423\var{o}, to the value \var{v}. Returns \code{-1} on failure. This is
1424the equivalent of the Python statement \samp{\var{o}.\var{attr_name} =
1425\var{v}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001426\end{cfuncdesc}
1427
1428
1429\begin{cfuncdesc}{int}{PyObject_SetAttr}{PyObject *o, PyObject *attr_name, PyObject *v}
Fred Drakee058b4f1998-02-16 06:15:35 +00001430Set the value of the attribute named \var{attr_name}, for
1431object \var{o},
1432to the value \var{v}. Returns \code{-1} on failure. This is
1433the equivalent of the Python statement \samp{\var{o}.\var{attr_name} =
1434\var{v}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001435\end{cfuncdesc}
1436
1437
1438\begin{cfuncdesc}{int}{PyObject_DelAttrString}{PyObject *o, char *attr_name}
Fred Drakee058b4f1998-02-16 06:15:35 +00001439Delete attribute named \var{attr_name}, for object \var{o}. Returns
1440\code{-1} on failure. This is the equivalent of the Python
1441statement: \samp{del \var{o}.\var{attr_name}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001442\end{cfuncdesc}
1443
1444
1445\begin{cfuncdesc}{int}{PyObject_DelAttr}{PyObject *o, PyObject *attr_name}
Fred Drakee058b4f1998-02-16 06:15:35 +00001446Delete attribute named \var{attr_name}, for object \var{o}. Returns
1447\code{-1} on failure. This is the equivalent of the Python
1448statement \samp{del \var{o}.\var{attr_name}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001449\end{cfuncdesc}
1450
1451
1452\begin{cfuncdesc}{int}{PyObject_Cmp}{PyObject *o1, PyObject *o2, int *result}
Fred Drakee058b4f1998-02-16 06:15:35 +00001453Compare the values of \var{o1} and \var{o2} using a routine provided
1454by \var{o1}, if one exists, otherwise with a routine provided by
1455\var{o2}. The result of the comparison is returned in \var{result}.
1456Returns \code{-1} on failure. This is the equivalent of the Python
Fred Drake659ebfa2000-04-03 15:42:13 +00001457statement\bifuncindex{cmp} \samp{\var{result} = cmp(\var{o1}, \var{o2})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001458\end{cfuncdesc}
1459
1460
1461\begin{cfuncdesc}{int}{PyObject_Compare}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001462Compare the values of \var{o1} and \var{o2} using a routine provided
1463by \var{o1}, if one exists, otherwise with a routine provided by
1464\var{o2}. Returns the result of the comparison on success. On error,
1465the value returned is undefined; use \cfunction{PyErr_Occurred()} to
Fred Drake659ebfa2000-04-03 15:42:13 +00001466detect an error. This is equivalent to the Python
1467expression\bifuncindex{cmp} \samp{cmp(\var{o1}, \var{o2})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001468\end{cfuncdesc}
1469
1470
1471\begin{cfuncdesc}{PyObject*}{PyObject_Repr}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001472Compute a string representation of object \var{o}. Returns the
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001473string representation on success, \NULL{} on failure. This is
Fred Drakee058b4f1998-02-16 06:15:35 +00001474the equivalent of the Python expression \samp{repr(\var{o})}.
1475Called by the \function{repr()}\bifuncindex{repr} built-in function
1476and by reverse quotes.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001477\end{cfuncdesc}
1478
1479
1480\begin{cfuncdesc}{PyObject*}{PyObject_Str}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001481Compute a string representation of object \var{o}. Returns the
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001482string representation on success, \NULL{} on failure. This is
Fred Drakee058b4f1998-02-16 06:15:35 +00001483the equivalent of the Python expression \samp{str(\var{o})}.
1484Called by the \function{str()}\bifuncindex{str} built-in function and
1485by the \keyword{print} statement.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001486\end{cfuncdesc}
1487
1488
Marc-André Lemburgad7c98e2001-01-17 17:09:53 +00001489\begin{cfuncdesc}{PyObject*}{PyObject_Unicode}{PyObject *o}
1490Compute a Unicode string representation of object \var{o}. Returns the
1491Unicode string representation on success, \NULL{} on failure. This is
1492the equivalent of the Python expression \samp{unistr(\var{o})}.
1493Called by the \function{unistr()}\bifuncindex{unistr} built-in function.
1494\end{cfuncdesc}
1495
1496
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001497\begin{cfuncdesc}{int}{PyCallable_Check}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001498Determine if the object \var{o} is callable. Return \code{1} if the
Fred Drakee058b4f1998-02-16 06:15:35 +00001499object is callable and \code{0} otherwise.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001500This function always succeeds.
1501\end{cfuncdesc}
1502
1503
Fred Drake659ebfa2000-04-03 15:42:13 +00001504\begin{cfuncdesc}{PyObject*}{PyObject_CallObject}{PyObject *callable_object,
1505 PyObject *args}
Fred Drakee058b4f1998-02-16 06:15:35 +00001506Call a callable Python object \var{callable_object}, with
1507arguments given by the tuple \var{args}. If no arguments are
Fred Drake659ebfa2000-04-03 15:42:13 +00001508needed, then \var{args} may be \NULL{}. Returns the result of the
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001509call on success, or \NULL{} on failure. This is the equivalent
Fred Drake5566c1c2001-01-19 22:48:33 +00001510of the Python expression \samp{apply(\var{callable_object}, \var{args})}.
Fred Drake659ebfa2000-04-03 15:42:13 +00001511\bifuncindex{apply}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001512\end{cfuncdesc}
1513
Fred Drake5566c1c2001-01-19 22:48:33 +00001514\begin{cfuncdesc}{PyObject*}{PyObject_CallFunction}{PyObject *callable_object,
1515 char *format, ...}
Fred Drakee058b4f1998-02-16 06:15:35 +00001516Call a callable Python object \var{callable_object}, with a
Fred Drake659ebfa2000-04-03 15:42:13 +00001517variable number of C arguments. The C arguments are described
Fred Drakee058b4f1998-02-16 06:15:35 +00001518using a \cfunction{Py_BuildValue()} style format string. The format may
1519be \NULL{}, indicating that no arguments are provided. Returns the
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001520result of the call on success, or \NULL{} on failure. This is
Fred Drake5566c1c2001-01-19 22:48:33 +00001521the equivalent of the Python expression \samp{apply(\var{callable_object},
Fred Drake659ebfa2000-04-03 15:42:13 +00001522\var{args})}.\bifuncindex{apply}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001523\end{cfuncdesc}
1524
1525
Fred Drake5566c1c2001-01-19 22:48:33 +00001526\begin{cfuncdesc}{PyObject*}{PyObject_CallMethod}{PyObject *o,
1527 char *method, char *format, ...}
Fred Drakee058b4f1998-02-16 06:15:35 +00001528Call the method named \var{m} of object \var{o} with a variable number
Fred Drake659ebfa2000-04-03 15:42:13 +00001529of C arguments. The C arguments are described by a
Fred Drakee058b4f1998-02-16 06:15:35 +00001530\cfunction{Py_BuildValue()} format string. The format may be \NULL{},
1531indicating that no arguments are provided. Returns the result of the
1532call on success, or \NULL{} on failure. This is the equivalent of the
1533Python expression \samp{\var{o}.\var{method}(\var{args})}.
Fred Drake659ebfa2000-04-03 15:42:13 +00001534Note that special method names, such as \method{__add__()},
1535\method{__getitem__()}, and so on are not supported. The specific
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001536abstract-object routines for these must be used.
1537\end{cfuncdesc}
1538
1539
1540\begin{cfuncdesc}{int}{PyObject_Hash}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001541Compute and return the hash value of an object \var{o}. On
1542failure, return \code{-1}. This is the equivalent of the Python
Fred Drake659ebfa2000-04-03 15:42:13 +00001543expression \samp{hash(\var{o})}.\bifuncindex{hash}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001544\end{cfuncdesc}
1545
1546
1547\begin{cfuncdesc}{int}{PyObject_IsTrue}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001548Returns \code{1} if the object \var{o} is considered to be true, and
1549\code{0} otherwise. This is equivalent to the Python expression
1550\samp{not not \var{o}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001551This function always succeeds.
1552\end{cfuncdesc}
1553
1554
1555\begin{cfuncdesc}{PyObject*}{PyObject_Type}{PyObject *o}
1556On success, returns a type object corresponding to the object
Fred Drakee058b4f1998-02-16 06:15:35 +00001557type of object \var{o}. On failure, returns \NULL{}. This is
1558equivalent to the Python expression \samp{type(\var{o})}.
Fred Drake53fb7721998-02-16 06:23:20 +00001559\bifuncindex{type}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001560\end{cfuncdesc}
1561
1562\begin{cfuncdesc}{int}{PyObject_Length}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001563Return the length of object \var{o}. If the object \var{o} provides
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001564both sequence and mapping protocols, the sequence length is
Fred Drake659ebfa2000-04-03 15:42:13 +00001565returned. On error, \code{-1} is returned. This is the equivalent
1566to the Python expression \samp{len(\var{o})}.\bifuncindex{len}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001567\end{cfuncdesc}
1568
1569
1570\begin{cfuncdesc}{PyObject*}{PyObject_GetItem}{PyObject *o, PyObject *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00001571Return element of \var{o} corresponding to the object \var{key} or
1572\NULL{} on failure. This is the equivalent of the Python expression
1573\samp{\var{o}[\var{key}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001574\end{cfuncdesc}
1575
1576
1577\begin{cfuncdesc}{int}{PyObject_SetItem}{PyObject *o, PyObject *key, PyObject *v}
Fred Drakee058b4f1998-02-16 06:15:35 +00001578Map the object \var{key} to the value \var{v}.
1579Returns \code{-1} on failure. This is the equivalent
1580of the Python statement \samp{\var{o}[\var{key}] = \var{v}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001581\end{cfuncdesc}
1582
1583
Guido van Rossumd1dbf631999-01-22 20:10:49 +00001584\begin{cfuncdesc}{int}{PyObject_DelItem}{PyObject *o, PyObject *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00001585Delete the mapping for \var{key} from \var{o}. Returns \code{-1} on
1586failure. This is the equivalent of the Python statement \samp{del
1587\var{o}[\var{key}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001588\end{cfuncdesc}
1589
Andrew M. Kuchling8c46b302000-07-13 23:58:16 +00001590\begin{cfuncdesc}{int}{PyObject_AsFileDescriptor}{PyObject *o}
1591Derives a file-descriptor from a Python object. If the object
1592is an integer or long integer, its value is returned. If not, the
1593object's \method{fileno()} method is called if it exists; the method
1594must return an integer or long integer, which is returned as the file
1595descriptor value. Returns \code{-1} on failure.
1596\end{cfuncdesc}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001597
Fred Drakeefd146c1999-02-15 15:30:45 +00001598\section{Number Protocol \label{number}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001599
1600\begin{cfuncdesc}{int}{PyNumber_Check}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001601Returns \code{1} if the object \var{o} provides numeric protocols, and
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001602false otherwise.
1603This function always succeeds.
1604\end{cfuncdesc}
1605
1606
1607\begin{cfuncdesc}{PyObject*}{PyNumber_Add}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001608Returns the result of adding \var{o1} and \var{o2}, or \NULL{} on
1609failure. This is the equivalent of the Python expression
1610\samp{\var{o1} + \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001611\end{cfuncdesc}
1612
1613
1614\begin{cfuncdesc}{PyObject*}{PyNumber_Subtract}{PyObject *o1, PyObject *o2}
Fred Drake659ebfa2000-04-03 15:42:13 +00001615Returns the result of subtracting \var{o2} from \var{o1}, or
1616\NULL{} on failure. This is the equivalent of the Python expression
Fred Drakee058b4f1998-02-16 06:15:35 +00001617\samp{\var{o1} - \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001618\end{cfuncdesc}
1619
1620
1621\begin{cfuncdesc}{PyObject*}{PyNumber_Multiply}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001622Returns the result of multiplying \var{o1} and \var{o2}, or \NULL{} on
1623failure. This is the equivalent of the Python expression
1624\samp{\var{o1} * \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001625\end{cfuncdesc}
1626
1627
1628\begin{cfuncdesc}{PyObject*}{PyNumber_Divide}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001629Returns the result of dividing \var{o1} by \var{o2}, or \NULL{} on
1630failure.
1631This is the equivalent of the Python expression \samp{\var{o1} /
1632\var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001633\end{cfuncdesc}
1634
1635
1636\begin{cfuncdesc}{PyObject*}{PyNumber_Remainder}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001637Returns the remainder of dividing \var{o1} by \var{o2}, or \NULL{} on
1638failure. This is the equivalent of the Python expression
Fred Drake659ebfa2000-04-03 15:42:13 +00001639\samp{\var{o1} \%\ \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001640\end{cfuncdesc}
1641
1642
1643\begin{cfuncdesc}{PyObject*}{PyNumber_Divmod}{PyObject *o1, PyObject *o2}
Fred Drake53fb7721998-02-16 06:23:20 +00001644See the built-in function \function{divmod()}\bifuncindex{divmod}.
1645Returns \NULL{} on failure. This is the equivalent of the Python
1646expression \samp{divmod(\var{o1}, \var{o2})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001647\end{cfuncdesc}
1648
1649
1650\begin{cfuncdesc}{PyObject*}{PyNumber_Power}{PyObject *o1, PyObject *o2, PyObject *o3}
Fred Drake53fb7721998-02-16 06:23:20 +00001651See the built-in function \function{pow()}\bifuncindex{pow}. Returns
1652\NULL{} on failure. This is the equivalent of the Python expression
Fred Drakee058b4f1998-02-16 06:15:35 +00001653\samp{pow(\var{o1}, \var{o2}, \var{o3})}, where \var{o3} is optional.
Fred Drake659ebfa2000-04-03 15:42:13 +00001654If \var{o3} is to be ignored, pass \cdata{Py_None} in its place
1655(passing \NULL{} for \var{o3} would cause an illegal memory access).
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001656\end{cfuncdesc}
1657
1658
1659\begin{cfuncdesc}{PyObject*}{PyNumber_Negative}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001660Returns the negation of \var{o} on success, or \NULL{} on failure.
1661This is the equivalent of the Python expression \samp{-\var{o}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001662\end{cfuncdesc}
1663
1664
1665\begin{cfuncdesc}{PyObject*}{PyNumber_Positive}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001666Returns \var{o} on success, or \NULL{} on failure.
1667This is the equivalent of the Python expression \samp{+\var{o}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001668\end{cfuncdesc}
1669
1670
1671\begin{cfuncdesc}{PyObject*}{PyNumber_Absolute}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001672Returns the absolute value of \var{o}, or \NULL{} on failure. This is
1673the equivalent of the Python expression \samp{abs(\var{o})}.
Fred Drake659ebfa2000-04-03 15:42:13 +00001674\bifuncindex{abs}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001675\end{cfuncdesc}
1676
1677
1678\begin{cfuncdesc}{PyObject*}{PyNumber_Invert}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001679Returns the bitwise negation of \var{o} on success, or \NULL{} on
1680failure. This is the equivalent of the Python expression
1681\samp{\~\var{o}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001682\end{cfuncdesc}
1683
1684
1685\begin{cfuncdesc}{PyObject*}{PyNumber_Lshift}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001686Returns the result of left shifting \var{o1} by \var{o2} on success,
1687or \NULL{} on failure. This is the equivalent of the Python
1688expression \samp{\var{o1} << \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001689\end{cfuncdesc}
1690
1691
1692\begin{cfuncdesc}{PyObject*}{PyNumber_Rshift}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001693Returns the result of right shifting \var{o1} by \var{o2} on success,
1694or \NULL{} on failure. This is the equivalent of the Python
1695expression \samp{\var{o1} >> \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001696\end{cfuncdesc}
1697
1698
1699\begin{cfuncdesc}{PyObject*}{PyNumber_And}{PyObject *o1, PyObject *o2}
Fred Drake7740a012000-09-12 20:27:05 +00001700Returns the ``bitwise and'' of \var{o2} and \var{o2} on success and
1701\NULL{} on failure. This is the equivalent of the Python expression
Fred Drake5566c1c2001-01-19 22:48:33 +00001702\samp{\var{o1} \&\ \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001703\end{cfuncdesc}
1704
1705
1706\begin{cfuncdesc}{PyObject*}{PyNumber_Xor}{PyObject *o1, PyObject *o2}
Fred Drake7740a012000-09-12 20:27:05 +00001707Returns the ``bitwise exclusive or'' of \var{o1} by \var{o2} on success,
Fred Drakee058b4f1998-02-16 06:15:35 +00001708or \NULL{} on failure. This is the equivalent of the Python
1709expression \samp{\var{o1} \^{ }\var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001710\end{cfuncdesc}
1711
1712\begin{cfuncdesc}{PyObject*}{PyNumber_Or}{PyObject *o1, PyObject *o2}
Fred Drake7740a012000-09-12 20:27:05 +00001713Returns the ``bitwise or'' of \var{o1} and \var{o2} on success, or
1714\NULL{} on failure. This is the equivalent of the Python expression
1715\samp{\var{o1} | \var{o2}}.
1716\end{cfuncdesc}
1717
1718
1719\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceAdd}{PyObject *o1, PyObject *o2}
1720Returns the result of adding \var{o1} and \var{o2}, or \NULL{} on failure.
1721The operation is done \emph{in-place} when \var{o1} supports it. This is the
1722equivalent of the Python expression \samp{\var{o1} += \var{o2}}.
1723\end{cfuncdesc}
1724
1725
1726\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceSubtract}{PyObject *o1, PyObject *o2}
1727Returns the result of subtracting \var{o2} from \var{o1}, or
1728\NULL{} on failure. The operation is done \emph{in-place} when \var{o1}
1729supports it. This is the equivalent of the Python expression \samp{\var{o1}
1730-= \var{o2}}.
1731\end{cfuncdesc}
1732
1733
1734\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceMultiply}{PyObject *o1, PyObject *o2}
1735Returns the result of multiplying \var{o1} and \var{o2}, or \NULL{} on
1736failure. The operation is done \emph{in-place} when \var{o1} supports it.
1737This is the equivalent of the Python expression \samp{\var{o1} *= \var{o2}}.
1738\end{cfuncdesc}
1739
1740
1741\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceDivide}{PyObject *o1, PyObject *o2}
1742Returns the result of dividing \var{o1} by \var{o2}, or \NULL{} on failure.
1743The operation is done \emph{in-place} when \var{o1} supports it. This is the
1744equivalent of the Python expression \samp{\var{o1} /= \var{o2}}.
1745\end{cfuncdesc}
1746
1747
1748\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceRemainder}{PyObject *o1, PyObject *o2}
1749Returns the remainder of dividing \var{o1} by \var{o2}, or \NULL{} on
1750failure. The operation is done \emph{in-place} when \var{o1} supports it.
1751This is the equivalent of the Python expression \samp{\var{o1} \%= \var{o2}}.
1752\end{cfuncdesc}
1753
1754
1755\begin{cfuncdesc}{PyObject*}{PyNumber_InPlacePower}{PyObject *o1, PyObject *o2, PyObject *o3}
1756See the built-in function \function{pow()}\bifuncindex{pow}. Returns
1757\NULL{} on failure. The operation is done \emph{in-place} when \var{o1}
1758supports it. This is the equivalent of the Python expression \samp{\var{o1}
1759**= \var{o2}} when o3 is \cdata{Py_None}, or an in-place variant of
Fred Drake5566c1c2001-01-19 22:48:33 +00001760\samp{pow(\var{o1}, \var{o2}, \var{o3})} otherwise. If \var{o3} is to be
Fred Drake7740a012000-09-12 20:27:05 +00001761ignored, pass \cdata{Py_None} in its place (passing \NULL{} for \var{o3}
1762would cause an illegal memory access).
1763\end{cfuncdesc}
1764
1765\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceLshift}{PyObject *o1, PyObject *o2}
1766Returns the result of left shifting \var{o1} by \var{o2} on success, or
1767\NULL{} on failure. The operation is done \emph{in-place} when \var{o1}
1768supports it. This is the equivalent of the Python expression \samp{\var{o1}
1769<<= \var{o2}}.
1770\end{cfuncdesc}
1771
1772
1773\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceRshift}{PyObject *o1, PyObject *o2}
1774Returns the result of right shifting \var{o1} by \var{o2} on success, or
1775\NULL{} on failure. The operation is done \emph{in-place} when \var{o1}
1776supports it. This is the equivalent of the Python expression \samp{\var{o1}
1777>>= \var{o2}}.
1778\end{cfuncdesc}
1779
1780
1781\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceAnd}{PyObject *o1, PyObject *o2}
Fred Drake5566c1c2001-01-19 22:48:33 +00001782Returns the ``bitwise and'' of \var{o1} and \var{o2} on success
1783and \NULL{} on failure. The operation is done \emph{in-place} when
1784\var{o1} supports it. This is the equivalent of the Python expression
1785\samp{\var{o1} \&= \var{o2}}.
Fred Drake7740a012000-09-12 20:27:05 +00001786\end{cfuncdesc}
1787
1788
1789\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceXor}{PyObject *o1, PyObject *o2}
1790Returns the ``bitwise exclusive or'' of \var{o1} by \var{o2} on success, or
1791\NULL{} on failure. The operation is done \emph{in-place} when \var{o1}
1792supports it. This is the equivalent of the Python expression \samp{\var{o1}
1793\^= \var{o2}}.
1794\end{cfuncdesc}
1795
1796\begin{cfuncdesc}{PyObject*}{PyNumber_InPlaceOr}{PyObject *o1, PyObject *o2}
1797Returns the ``bitwise or'' of \var{o1} and \var{o2} on success, or \NULL{}
1798on failure. The operation is done \emph{in-place} when \var{o1} supports
1799it. This is the equivalent of the Python expression \samp{\var{o1} |=
1800\var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001801\end{cfuncdesc}
1802
Fred Drakec0e6c5b2000-09-22 18:17:49 +00001803\begin{cfuncdesc}{int}{PyNumber_Coerce}{PyObject **p1, PyObject **p2}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001804This function takes the addresses of two variables of type
Fred Drake659ebfa2000-04-03 15:42:13 +00001805\ctype{PyObject*}. If the objects pointed to by \code{*\var{p1}} and
1806\code{*\var{p2}} have the same type, increment their reference count
1807and return \code{0} (success). If the objects can be converted to a
1808common numeric type, replace \code{*p1} and \code{*p2} by their
1809converted value (with 'new' reference counts), and return \code{0}.
1810If no conversion is possible, or if some other error occurs, return
1811\code{-1} (failure) and don't increment the reference counts. The
1812call \code{PyNumber_Coerce(\&o1, \&o2)} is equivalent to the Python
1813statement \samp{\var{o1}, \var{o2} = coerce(\var{o1}, \var{o2})}.
1814\bifuncindex{coerce}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001815\end{cfuncdesc}
1816
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001817\begin{cfuncdesc}{PyObject*}{PyNumber_Int}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001818Returns the \var{o} converted to an integer object on success, or
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001819\NULL{} on failure. This is the equivalent of the Python
Fred Drake659ebfa2000-04-03 15:42:13 +00001820expression \samp{int(\var{o})}.\bifuncindex{int}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001821\end{cfuncdesc}
1822
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001823\begin{cfuncdesc}{PyObject*}{PyNumber_Long}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001824Returns the \var{o} converted to a long integer object on success,
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001825or \NULL{} on failure. This is the equivalent of the Python
Fred Drake659ebfa2000-04-03 15:42:13 +00001826expression \samp{long(\var{o})}.\bifuncindex{long}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001827\end{cfuncdesc}
1828
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001829\begin{cfuncdesc}{PyObject*}{PyNumber_Float}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001830Returns the \var{o} converted to a float object on success, or
1831\NULL{} on failure. This is the equivalent of the Python expression
1832\samp{float(\var{o})}.\bifuncindex{float}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001833\end{cfuncdesc}
1834
1835
Fred Drakeefd146c1999-02-15 15:30:45 +00001836\section{Sequence Protocol \label{sequence}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001837
1838\begin{cfuncdesc}{int}{PySequence_Check}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001839Return \code{1} if the object provides sequence protocol, and
1840\code{0} otherwise. This function always succeeds.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001841\end{cfuncdesc}
1842
Fred Drake659ebfa2000-04-03 15:42:13 +00001843\begin{cfuncdesc}{int}{PySequence_Length}{PyObject *o}
1844Returns the number of objects in sequence \var{o} on success, and
1845\code{-1} on failure. For objects that do not provide sequence
1846protocol, this is equivalent to the Python expression
1847\samp{len(\var{o})}.\bifuncindex{len}
1848\end{cfuncdesc}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001849
1850\begin{cfuncdesc}{PyObject*}{PySequence_Concat}{PyObject *o1, PyObject *o2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001851Return the concatenation of \var{o1} and \var{o2} on success, and \NULL{} on
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001852failure. This is the equivalent of the Python
Fred Drakee058b4f1998-02-16 06:15:35 +00001853expression \samp{\var{o1} + \var{o2}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001854\end{cfuncdesc}
1855
1856
1857\begin{cfuncdesc}{PyObject*}{PySequence_Repeat}{PyObject *o, int count}
Fred Drake659ebfa2000-04-03 15:42:13 +00001858Return the result of repeating sequence object
1859\var{o} \var{count} times, or \NULL{} on failure. This is the
1860equivalent of the Python expression \samp{\var{o} * \var{count}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001861\end{cfuncdesc}
1862
Fred Drake7740a012000-09-12 20:27:05 +00001863\begin{cfuncdesc}{PyObject*}{PySequence_InPlaceConcat}{PyObject *o1, PyObject *o2}
1864Return the concatenation of \var{o1} and \var{o2} on success, and \NULL{} on
1865failure. The operation is done \emph{in-place} when \var{o1} supports it.
1866This is the equivalent of the Python expression \samp{\var{o1} += \var{o2}}.
1867\end{cfuncdesc}
1868
1869
1870\begin{cfuncdesc}{PyObject*}{PySequence_InPlaceRepeat}{PyObject *o, int count}
1871Return the result of repeating sequence object \var{o} \var{count} times, or
1872\NULL{} on failure. The operation is done \emph{in-place} when \var{o}
1873supports it. This is the equivalent of the Python expression \samp{\var{o}
1874*= \var{count}}.
1875\end{cfuncdesc}
1876
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001877
1878\begin{cfuncdesc}{PyObject*}{PySequence_GetItem}{PyObject *o, int i}
Fred Drakee058b4f1998-02-16 06:15:35 +00001879Return the \var{i}th element of \var{o}, or \NULL{} on failure. This
1880is the equivalent of the Python expression \samp{\var{o}[\var{i}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001881\end{cfuncdesc}
1882
1883
1884\begin{cfuncdesc}{PyObject*}{PySequence_GetSlice}{PyObject *o, int i1, int i2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001885Return the slice of sequence object \var{o} between \var{i1} and
1886\var{i2}, or \NULL{} on failure. This is the equivalent of the Python
1887expression \samp{\var{o}[\var{i1}:\var{i2}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001888\end{cfuncdesc}
1889
1890
1891\begin{cfuncdesc}{int}{PySequence_SetItem}{PyObject *o, int i, PyObject *v}
Fred Drakee058b4f1998-02-16 06:15:35 +00001892Assign object \var{v} to the \var{i}th element of \var{o}.
1893Returns \code{-1} on failure. This is the equivalent of the Python
1894statement \samp{\var{o}[\var{i}] = \var{v}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001895\end{cfuncdesc}
1896
1897\begin{cfuncdesc}{int}{PySequence_DelItem}{PyObject *o, int i}
Fred Drake5566c1c2001-01-19 22:48:33 +00001898Delete the \var{i}th element of object \var{o}. Returns
Fred Drakee058b4f1998-02-16 06:15:35 +00001899\code{-1} on failure. This is the equivalent of the Python
1900statement \samp{del \var{o}[\var{i}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001901\end{cfuncdesc}
1902
Fred Drake659ebfa2000-04-03 15:42:13 +00001903\begin{cfuncdesc}{int}{PySequence_SetSlice}{PyObject *o, int i1,
1904 int i2, PyObject *v}
Fred Drakee058b4f1998-02-16 06:15:35 +00001905Assign the sequence object \var{v} to the slice in sequence
1906object \var{o} from \var{i1} to \var{i2}. This is the equivalent of
1907the Python statement \samp{\var{o}[\var{i1}:\var{i2}] = \var{v}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001908\end{cfuncdesc}
1909
1910\begin{cfuncdesc}{int}{PySequence_DelSlice}{PyObject *o, int i1, int i2}
Fred Drakee058b4f1998-02-16 06:15:35 +00001911Delete the slice in sequence object \var{o} from \var{i1} to \var{i2}.
1912Returns \code{-1} on failure. This is the equivalent of the Python
1913statement \samp{del \var{o}[\var{i1}:\var{i2}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001914\end{cfuncdesc}
1915
1916\begin{cfuncdesc}{PyObject*}{PySequence_Tuple}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00001917Returns the \var{o} as a tuple on success, and \NULL{} on failure.
Fred Drake659ebfa2000-04-03 15:42:13 +00001918This is equivalent to the Python expression \samp{tuple(\var{o})}.
1919\bifuncindex{tuple}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001920\end{cfuncdesc}
1921
1922\begin{cfuncdesc}{int}{PySequence_Count}{PyObject *o, PyObject *value}
Fred Drakee058b4f1998-02-16 06:15:35 +00001923Return the number of occurrences of \var{value} in \var{o}, that is,
1924return the number of keys for which \code{\var{o}[\var{key}] ==
1925\var{value}}. On failure, return \code{-1}. This is equivalent to
1926the Python expression \samp{\var{o}.count(\var{value})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001927\end{cfuncdesc}
1928
Fred Drake659ebfa2000-04-03 15:42:13 +00001929\begin{cfuncdesc}{int}{PySequence_Contains}{PyObject *o, PyObject *value}
Fred Drakee058b4f1998-02-16 06:15:35 +00001930Determine if \var{o} contains \var{value}. If an item in \var{o} is
1931equal to \var{value}, return \code{1}, otherwise return \code{0}. On
1932error, return \code{-1}. This is equivalent to the Python expression
1933\samp{\var{value} in \var{o}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001934\end{cfuncdesc}
1935
1936\begin{cfuncdesc}{int}{PySequence_Index}{PyObject *o, PyObject *value}
Fred Drakee058b4f1998-02-16 06:15:35 +00001937Return the first index \var{i} for which \code{\var{o}[\var{i}] ==
1938\var{value}}. On error, return \code{-1}. This is equivalent to
1939the Python expression \samp{\var{o}.index(\var{value})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001940\end{cfuncdesc}
1941
Fred Drakea8455ab2000-06-16 19:58:42 +00001942\begin{cfuncdesc}{PyObject*}{PySequence_List}{PyObject *o}
1943Return a list object with the same contents as the arbitrary sequence
1944\var{o}. The returned list is guaranteed to be new.
1945\end{cfuncdesc}
1946
1947\begin{cfuncdesc}{PyObject*}{PySequence_Tuple}{PyObject *o}
1948Return a tuple object with the same contents as the arbitrary sequence
1949\var{o}. If \var{o} is a tuple, a new reference will be returned,
1950otherwise a tuple will be constructed with the appropriate contents.
1951\end{cfuncdesc}
1952
Fred Drakef39ed671998-02-26 22:01:23 +00001953
Fred Drake81cccb72000-09-12 15:22:05 +00001954\begin{cfuncdesc}{PyObject*}{PySequence_Fast}{PyObject *o, const char *m}
1955Returns the sequence \var{o} as a tuple, unless it is already a
1956tuple or list, in which case \var{o} is returned. Use
1957\cfunction{PySequence_Fast_GET_ITEM()} to access the members of the
1958result. Returns \NULL{} on failure. If the object is not a sequence,
1959raises \exception{TypeError} with \var{m} as the message text.
1960\end{cfuncdesc}
1961
1962\begin{cfuncdesc}{PyObject*}{PySequence_Fast_GET_ITEM}{PyObject *o, int i}
1963Return the \var{i}th element of \var{o}, assuming that \var{o} was
1964returned by \cfunction{PySequence_Fast()}, and that \var{i} is within
1965bounds. The caller is expected to get the length of the sequence by
1966calling \cfunction{PyObject_Size()} on \var{o}, since lists and tuples
1967are guaranteed to always return their true length.
1968\end{cfuncdesc}
1969
1970
Fred Drakeefd146c1999-02-15 15:30:45 +00001971\section{Mapping Protocol \label{mapping}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001972
1973\begin{cfuncdesc}{int}{PyMapping_Check}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001974Return \code{1} if the object provides mapping protocol, and
1975\code{0} otherwise. This function always succeeds.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001976\end{cfuncdesc}
1977
1978
1979\begin{cfuncdesc}{int}{PyMapping_Length}{PyObject *o}
Fred Drake659ebfa2000-04-03 15:42:13 +00001980Returns the number of keys in object \var{o} on success, and
1981\code{-1} on failure. For objects that do not provide mapping
1982protocol, this is equivalent to the Python expression
1983\samp{len(\var{o})}.\bifuncindex{len}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001984\end{cfuncdesc}
1985
1986
1987\begin{cfuncdesc}{int}{PyMapping_DelItemString}{PyObject *o, char *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00001988Remove the mapping for object \var{key} from the object \var{o}.
1989Return \code{-1} on failure. This is equivalent to
1990the Python statement \samp{del \var{o}[\var{key}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001991\end{cfuncdesc}
1992
1993
1994\begin{cfuncdesc}{int}{PyMapping_DelItem}{PyObject *o, PyObject *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00001995Remove the mapping for object \var{key} from the object \var{o}.
1996Return \code{-1} on failure. This is equivalent to
1997the Python statement \samp{del \var{o}[\var{key}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00001998\end{cfuncdesc}
1999
2000
2001\begin{cfuncdesc}{int}{PyMapping_HasKeyString}{PyObject *o, char *key}
Fred Drake659ebfa2000-04-03 15:42:13 +00002002On success, return \code{1} if the mapping object has the key
2003\var{key} and \code{0} otherwise. This is equivalent to the Python
2004expression \samp{\var{o}.has_key(\var{key})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002005This function always succeeds.
2006\end{cfuncdesc}
2007
2008
2009\begin{cfuncdesc}{int}{PyMapping_HasKey}{PyObject *o, PyObject *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00002010Return \code{1} if the mapping object has the key \var{key} and
2011\code{0} otherwise. This is equivalent to the Python expression
2012\samp{\var{o}.has_key(\var{key})}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002013This function always succeeds.
2014\end{cfuncdesc}
2015
2016
2017\begin{cfuncdesc}{PyObject*}{PyMapping_Keys}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00002018On success, return a list of the keys in object \var{o}. On
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002019failure, return \NULL{}. This is equivalent to the Python
Fred Drakee058b4f1998-02-16 06:15:35 +00002020expression \samp{\var{o}.keys()}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002021\end{cfuncdesc}
2022
2023
2024\begin{cfuncdesc}{PyObject*}{PyMapping_Values}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00002025On success, return a list of the values in object \var{o}. On
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002026failure, return \NULL{}. This is equivalent to the Python
Fred Drakee058b4f1998-02-16 06:15:35 +00002027expression \samp{\var{o}.values()}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002028\end{cfuncdesc}
2029
2030
2031\begin{cfuncdesc}{PyObject*}{PyMapping_Items}{PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00002032On success, return a list of the items in object \var{o}, where
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002033each item is a tuple containing a key-value pair. On
2034failure, return \NULL{}. This is equivalent to the Python
Fred Drakee058b4f1998-02-16 06:15:35 +00002035expression \samp{\var{o}.items()}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002036\end{cfuncdesc}
2037
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002038
2039\begin{cfuncdesc}{PyObject*}{PyMapping_GetItemString}{PyObject *o, char *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00002040Return element of \var{o} corresponding to the object \var{key} or
2041\NULL{} on failure. This is the equivalent of the Python expression
2042\samp{\var{o}[\var{key}]}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002043\end{cfuncdesc}
2044
Guido van Rossum0a0f11b1998-10-16 17:43:53 +00002045\begin{cfuncdesc}{int}{PyMapping_SetItemString}{PyObject *o, char *key, PyObject *v}
Fred Drakee058b4f1998-02-16 06:15:35 +00002046Map the object \var{key} to the value \var{v} in object \var{o}.
2047Returns \code{-1} on failure. This is the equivalent of the Python
2048statement \samp{\var{o}[\var{key}] = \var{v}}.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002049\end{cfuncdesc}
2050
2051
Fred Drakeefd146c1999-02-15 15:30:45 +00002052\chapter{Concrete Objects Layer \label{concrete}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002053
2054The functions in this chapter are specific to certain Python object
2055types. Passing them an object of the wrong type is not a good idea;
2056if you receive an object from a Python program and you are not sure
2057that it has the right type, you must perform a type check first;
Fred Drake5566c1c2001-01-19 22:48:33 +00002058for example, to check that an object is a dictionary, use
Fred Drakee5bf8b21998-02-12 21:22:28 +00002059\cfunction{PyDict_Check()}. The chapter is structured like the
2060``family tree'' of Python object types.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002061
Fred Drake89024422000-10-23 16:00:54 +00002062\strong{Warning:}
2063While the functions described in this chapter carefully check the type
2064of the objects which are passed in, many of them do not check for
2065\NULL{} being passed instead of a valid object. Allowing \NULL{} to
2066be passed in can cause memory access violations and immediate
2067termination of the interpreter.
2068
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002069
Fred Drakeefd146c1999-02-15 15:30:45 +00002070\section{Fundamental Objects \label{fundamental}}
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002071
Fred Drakee5bf8b21998-02-12 21:22:28 +00002072This section describes Python type objects and the singleton object
2073\code{None}.
2074
2075
Fred Drakeefd146c1999-02-15 15:30:45 +00002076\subsection{Type Objects \label{typeObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002077
Fred Drake659ebfa2000-04-03 15:42:13 +00002078\obindex{type}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002079\begin{ctypedesc}{PyTypeObject}
Fred Drake659ebfa2000-04-03 15:42:13 +00002080The C structure of the objects used to describe built-in types.
Fred Drakee5bf8b21998-02-12 21:22:28 +00002081\end{ctypedesc}
2082
Fred Drake659ebfa2000-04-03 15:42:13 +00002083\begin{cvardesc}{PyObject*}{PyType_Type}
Fred Drakeefd146c1999-02-15 15:30:45 +00002084This is the type object for type objects; it is the same object as
2085\code{types.TypeType} in the Python layer.
Fred Drake659ebfa2000-04-03 15:42:13 +00002086\withsubitem{(in module types)}{\ttindex{TypeType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002087\end{cvardesc}
2088
Fred Drake659ebfa2000-04-03 15:42:13 +00002089\begin{cfuncdesc}{int}{PyType_Check}{PyObject *o}
2090Returns true is the object \var{o} is a type object.
2091\end{cfuncdesc}
2092
2093\begin{cfuncdesc}{int}{PyType_HasFeature}{PyObject *o, int feature}
2094Returns true if the type object \var{o} sets the feature
Fred Drakef0e08ef2001-02-03 01:11:26 +00002095\var{feature}. Type features are denoted by single bit flags.
Fred Drake659ebfa2000-04-03 15:42:13 +00002096\end{cfuncdesc}
2097
Fred Drakee5bf8b21998-02-12 21:22:28 +00002098
Fred Drakeefd146c1999-02-15 15:30:45 +00002099\subsection{The None Object \label{noneObject}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002100
Fred Drake659ebfa2000-04-03 15:42:13 +00002101\obindex{None@\texttt{None}}
2102Note that the \ctype{PyTypeObject} for \code{None} is not directly
2103exposed in the Python/C API. Since \code{None} is a singleton,
2104testing for object identity (using \samp{==} in C) is sufficient.
2105There is no \cfunction{PyNone_Check()} function for the same reason.
2106
2107\begin{cvardesc}{PyObject*}{Py_None}
Guido van Rossum44475131998-04-21 15:30:01 +00002108The Python \code{None} object, denoting lack of value. This object has
2109no methods.
Fred Drakee5bf8b21998-02-12 21:22:28 +00002110\end{cvardesc}
2111
2112
Fred Drakeefd146c1999-02-15 15:30:45 +00002113\section{Sequence Objects \label{sequenceObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002114
Fred Drake659ebfa2000-04-03 15:42:13 +00002115\obindex{sequence}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002116Generic operations on sequence objects were discussed in the previous
2117chapter; this section deals with the specific kinds of sequence
2118objects that are intrinsic to the Python language.
2119
2120
Fred Drakeefd146c1999-02-15 15:30:45 +00002121\subsection{String Objects \label{stringObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002122
Fred Drake89024422000-10-23 16:00:54 +00002123These functions raise \exception{TypeError} when expecting a string
2124parameter and are called with a non-string parameter.
2125
Fred Drake659ebfa2000-04-03 15:42:13 +00002126\obindex{string}
Fred Drakee5bf8b21998-02-12 21:22:28 +00002127\begin{ctypedesc}{PyStringObject}
Fred Drakef8830d11998-04-23 14:06:01 +00002128This subtype of \ctype{PyObject} represents a Python string object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00002129\end{ctypedesc}
2130
2131\begin{cvardesc}{PyTypeObject}{PyString_Type}
Fred Drake659ebfa2000-04-03 15:42:13 +00002132This instance of \ctype{PyTypeObject} represents the Python string
2133type; it is the same object as \code{types.TypeType} in the Python
2134layer.\withsubitem{(in module types)}{\ttindex{StringType}}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00002135\end{cvardesc}
2136
2137\begin{cfuncdesc}{int}{PyString_Check}{PyObject *o}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00002138Returns true if the object \var{o} is a string object.
Guido van Rossum9231c8f1997-05-15 21:43:21 +00002139\end{cfuncdesc}
2140
Fred Drakec6fa34e1998-04-02 06:47:24 +00002141\begin{cfuncdesc}{PyObject*}{PyString_FromString}{const char *v}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00002142Returns a new string object with the value \var{v} on success, and
2143\NULL{} on failure.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002144\end{cfuncdesc}
2145
Fred Drake659ebfa2000-04-03 15:42:13 +00002146\begin{cfuncdesc}{PyObject*}{PyString_FromStringAndSize}{const char *v,
2147 int len}
2148Returns a new string object with the value \var{v} and length
2149\var{len} on success, and \NULL{} on failure. If \var{v} is \NULL{},
2150the contents of the string are uninitialized.
2151\end{cfuncdesc}
2152
Fred Drakec6fa34e1998-04-02 06:47:24 +00002153\begin{cfuncdesc}{int}{PyString_Size}{PyObject *string}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00002154Returns the length of the string in string object \var{string}.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002155\end{cfuncdesc}
2156
Fred Drake659ebfa2000-04-03 15:42:13 +00002157\begin{cfuncdesc}{int}{PyString_GET_SIZE}{PyObject *string}
Fred Drake5d644212000-10-07 12:31:50 +00002158Macro form of \cfunction{PyString_Size()} but without error
Fred Drake659ebfa2000-04-03 15:42:13 +00002159checking.
2160\end{cfuncdesc}
2161
Fred Drakec6fa34e1998-04-02 06:47:24 +00002162\begin{cfuncdesc}{char*}{PyString_AsString}{PyObject *string}
Fred Drake659ebfa2000-04-03 15:42:13 +00002163Returns a null-terminated representation of the contents of
2164\var{string}. The pointer refers to the internal buffer of
Fred Drake89024422000-10-23 16:00:54 +00002165\var{string}, not a copy. The data must not be modified in any way,
2166unless the string was just created using
2167\code{PyString_FromStringAndSize(NULL, \var{size})}.
2168It must not be deallocated.
Fred Drake659ebfa2000-04-03 15:42:13 +00002169\end{cfuncdesc}
2170
2171\begin{cfuncdesc}{char*}{PyString_AS_STRING}{PyObject *string}
2172Macro form of \cfunction{PyString_AsString()} but without error
2173checking.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002174\end{cfuncdesc}
2175
Marc-André Lemburgd1ba4432000-09-19 21:04:18 +00002176\begin{cfuncdesc}{int}{PyString_AsStringAndSize}{PyObject *obj,
2177 char **buffer,
2178 int *length}
2179Returns a null-terminated representation of the contents of the object
2180\var{obj} through the output variables \var{buffer} and \var{length}.
2181
2182The function accepts both string and Unicode objects as input. For
2183Unicode objects it returns the default encoded version of the object.
2184If \var{length} is set to \NULL{}, the resulting buffer may not contain
2185null characters; if it does, the function returns -1 and a
2186TypeError is raised.
2187
2188The buffer refers to an internal string buffer of \var{obj}, not a
Fred Drake89024422000-10-23 16:00:54 +00002189copy. The data must not be modified in any way, unless the string was
2190just created using \code{PyString_FromStringAndSize(NULL,
2191\var{size})}. It must not be deallocated.
Marc-André Lemburgd1ba4432000-09-19 21:04:18 +00002192\end{cfuncdesc}
2193
Fred Drakec6fa34e1998-04-02 06:47:24 +00002194\begin{cfuncdesc}{void}{PyString_Concat}{PyObject **string,
2195 PyObject *newpart}
Fred Drake66b989c1999-02-15 20:15:39 +00002196Creates a new string object in \var{*string} containing the
Fred Drakeddc6c272000-03-31 18:22:38 +00002197contents of \var{newpart} appended to \var{string}; the caller will
2198own the new reference. The reference to the old value of \var{string}
2199will be stolen. If the new string
Fred Drake66b989c1999-02-15 20:15:39 +00002200cannot be created, the old reference to \var{string} will still be
2201discarded and the value of \var{*string} will be set to
2202\NULL{}; the appropriate exception will be set.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002203\end{cfuncdesc}
2204
2205\begin{cfuncdesc}{void}{PyString_ConcatAndDel}{PyObject **string,
2206 PyObject *newpart}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00002207Creates a new string object in \var{*string} containing the contents
Guido van Rossum44475131998-04-21 15:30:01 +00002208of \var{newpart} appended to \var{string}. This version decrements
2209the reference count of \var{newpart}.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002210\end{cfuncdesc}
2211
2212\begin{cfuncdesc}{int}{_PyString_Resize}{PyObject **string, int newsize}
Guido van Rossum44475131998-04-21 15:30:01 +00002213A way to resize a string object even though it is ``immutable''.
2214Only use this to build up a brand new string object; don't use this if
2215the string may already be known in other parts of the code.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002216\end{cfuncdesc}
2217
2218\begin{cfuncdesc}{PyObject*}{PyString_Format}{PyObject *format,
2219 PyObject *args}
Guido van Rossum44475131998-04-21 15:30:01 +00002220Returns a new string object from \var{format} and \var{args}. Analogous
Fred Drake659ebfa2000-04-03 15:42:13 +00002221to \code{\var{format} \%\ \var{args}}. The \var{args} argument must be
Guido van Rossum44475131998-04-21 15:30:01 +00002222a tuple.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002223\end{cfuncdesc}
2224
2225\begin{cfuncdesc}{void}{PyString_InternInPlace}{PyObject **string}
Guido van Rossum44475131998-04-21 15:30:01 +00002226Intern the argument \var{*string} in place. The argument must be the
2227address of a pointer variable pointing to a Python string object.
2228If there is an existing interned string that is the same as
2229\var{*string}, it sets \var{*string} to it (decrementing the reference
2230count of the old string object and incrementing the reference count of
2231the interned string object), otherwise it leaves \var{*string} alone
2232and interns it (incrementing its reference count). (Clarification:
2233even though there is a lot of talk about reference counts, think of
Fred Drakef8830d11998-04-23 14:06:01 +00002234this function as reference-count-neutral; you own the object after
2235the call if and only if you owned it before the call.)
Fred Drakec6fa34e1998-04-02 06:47:24 +00002236\end{cfuncdesc}
2237
2238\begin{cfuncdesc}{PyObject*}{PyString_InternFromString}{const char *v}
Fred Drakef8830d11998-04-23 14:06:01 +00002239A combination of \cfunction{PyString_FromString()} and
2240\cfunction{PyString_InternInPlace()}, returning either a new string object
Guido van Rossum44475131998-04-21 15:30:01 +00002241that has been interned, or a new (``owned'') reference to an earlier
2242interned string object with the same value.
Fred Drakec6fa34e1998-04-02 06:47:24 +00002243\end{cfuncdesc}
2244
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002245\begin{cfuncdesc}{PyObject*}{PyString_Decode}{const char *s,
2246 int size,
2247 const char *encoding,
2248 const char *errors}
2249Create a string object by decoding \var{size} bytes of the encoded
2250buffer \var{s}. \var{encoding} and \var{errors} have the same meaning
2251as the parameters of the same name in the unicode() builtin
2252function. The codec to be used is looked up using the Python codec
2253registry. Returns \NULL{} in case an exception was raised by the
2254codec.
2255\end{cfuncdesc}
2256
2257\begin{cfuncdesc}{PyObject*}{PyString_Encode}{const Py_UNICODE *s,
2258 int size,
2259 const char *encoding,
2260 const char *errors}
2261Encodes the \ctype{Py_UNICODE} buffer of the given size and returns a
2262Python string object. \var{encoding} and \var{errors} have the same
2263meaning as the parameters of the same name in the string .encode()
2264method. The codec to be used is looked up using the Python codec
2265registry. Returns \NULL{} in case an exception was raised by the
2266codec.
2267\end{cfuncdesc}
2268
2269\begin{cfuncdesc}{PyObject*}{PyString_AsEncodedString}{PyObject *unicode,
2270 const char *encoding,
2271 const char *errors}
2272Encodes a string object and returns the result as Python string
2273object. \var{encoding} and \var{errors} have the same meaning as the
2274parameters of the same name in the string .encode() method. The codec
2275to be used is looked up using the Python codec registry. Returns
2276\NULL{} in case an exception was raised by the codec.
2277\end{cfuncdesc}
2278
Fred Drakee5bf8b21998-02-12 21:22:28 +00002279
Fred Drakea4cd2612000-04-06 14:10:29 +00002280\subsection{Unicode Objects \label{unicodeObjects}}
2281\sectionauthor{Marc-Andre Lemburg}{mal@lemburg.com}
2282
2283%--- Unicode Type -------------------------------------------------------
2284
2285These are the basic Unicode object types used for the Unicode
2286implementation in Python:
2287
2288\begin{ctypedesc}{Py_UNICODE}
2289This type represents a 16-bit unsigned storage type which is used by
2290Python internally as basis for holding Unicode ordinals. On platforms
2291where \ctype{wchar_t} is available and also has 16-bits,
2292\ctype{Py_UNICODE} is a typedef alias for \ctype{wchar_t} to enhance
2293native platform compatibility. On all other platforms,
2294\ctype{Py_UNICODE} is a typedef alias for \ctype{unsigned short}.
2295\end{ctypedesc}
2296
2297\begin{ctypedesc}{PyUnicodeObject}
2298This subtype of \ctype{PyObject} represents a Python Unicode object.
2299\end{ctypedesc}
2300
2301\begin{cvardesc}{PyTypeObject}{PyUnicode_Type}
2302This instance of \ctype{PyTypeObject} represents the Python Unicode type.
2303\end{cvardesc}
2304
2305%--- These are really C macros... is there a macrodesc TeX macro ?
2306
2307The following APIs are really C macros and can be used to do fast
2308checks and to access internal read-only data of Unicode objects:
2309
2310\begin{cfuncdesc}{int}{PyUnicode_Check}{PyObject *o}
2311Returns true if the object \var{o} is a Unicode object.
2312\end{cfuncdesc}
2313
2314\begin{cfuncdesc}{int}{PyUnicode_GET_SIZE}{PyObject *o}
2315Returns the size of the object. o has to be a
2316PyUnicodeObject (not checked).
2317\end{cfuncdesc}
2318
2319\begin{cfuncdesc}{int}{PyUnicode_GET_DATA_SIZE}{PyObject *o}
2320Returns the size of the object's internal buffer in bytes. o has to be
2321a PyUnicodeObject (not checked).
2322\end{cfuncdesc}
2323
Fred Drake992fe5a2000-06-16 21:04:15 +00002324\begin{cfuncdesc}{Py_UNICODE*}{PyUnicode_AS_UNICODE}{PyObject *o}
Fred Drakea4cd2612000-04-06 14:10:29 +00002325Returns a pointer to the internal Py_UNICODE buffer of the object. o
2326has to be a PyUnicodeObject (not checked).
2327\end{cfuncdesc}
2328
Fred Drake992fe5a2000-06-16 21:04:15 +00002329\begin{cfuncdesc}{const char*}{PyUnicode_AS_DATA}{PyObject *o}
Fred Drakea4cd2612000-04-06 14:10:29 +00002330Returns a (const char *) pointer to the internal buffer of the object.
2331o has to be a PyUnicodeObject (not checked).
2332\end{cfuncdesc}
2333
2334% --- Unicode character properties ---------------------------------------
2335
2336Unicode provides many different character properties. The most often
2337needed ones are available through these macros which are mapped to C
2338functions depending on the Python configuration.
2339
2340\begin{cfuncdesc}{int}{Py_UNICODE_ISSPACE}{Py_UNICODE ch}
2341Returns 1/0 depending on whether \var{ch} is a whitespace character.
2342\end{cfuncdesc}
2343
2344\begin{cfuncdesc}{int}{Py_UNICODE_ISLOWER}{Py_UNICODE ch}
2345Returns 1/0 depending on whether \var{ch} is a lowercase character.
2346\end{cfuncdesc}
2347
2348\begin{cfuncdesc}{int}{Py_UNICODE_ISUPPER}{Py_UNICODE ch}
Fred Drakeae96aab2000-07-03 13:38:10 +00002349Returns 1/0 depending on whether \var{ch} is an uppercase character.
Fred Drakea4cd2612000-04-06 14:10:29 +00002350\end{cfuncdesc}
2351
2352\begin{cfuncdesc}{int}{Py_UNICODE_ISTITLE}{Py_UNICODE ch}
2353Returns 1/0 depending on whether \var{ch} is a titlecase character.
2354\end{cfuncdesc}
2355
2356\begin{cfuncdesc}{int}{Py_UNICODE_ISLINEBREAK}{Py_UNICODE ch}
2357Returns 1/0 depending on whether \var{ch} is a linebreak character.
2358\end{cfuncdesc}
2359
2360\begin{cfuncdesc}{int}{Py_UNICODE_ISDECIMAL}{Py_UNICODE ch}
2361Returns 1/0 depending on whether \var{ch} is a decimal character.
2362\end{cfuncdesc}
2363
2364\begin{cfuncdesc}{int}{Py_UNICODE_ISDIGIT}{Py_UNICODE ch}
2365Returns 1/0 depending on whether \var{ch} is a digit character.
2366\end{cfuncdesc}
2367
2368\begin{cfuncdesc}{int}{Py_UNICODE_ISNUMERIC}{Py_UNICODE ch}
2369Returns 1/0 depending on whether \var{ch} is a numeric character.
2370\end{cfuncdesc}
2371
Fred Drakeae96aab2000-07-03 13:38:10 +00002372\begin{cfuncdesc}{int}{Py_UNICODE_ISALPHA}{Py_UNICODE ch}
2373Returns 1/0 depending on whether \var{ch} is an alphabetic character.
2374\end{cfuncdesc}
2375
2376\begin{cfuncdesc}{int}{Py_UNICODE_ISALNUM}{Py_UNICODE ch}
2377Returns 1/0 depending on whether \var{ch} is an alphanumeric character.
2378\end{cfuncdesc}
2379
Fred Drakea4cd2612000-04-06 14:10:29 +00002380These APIs can be used for fast direct character conversions:
2381
2382\begin{cfuncdesc}{Py_UNICODE}{Py_UNICODE_TOLOWER}{Py_UNICODE ch}
2383Returns the character \var{ch} converted to lower case.
2384\end{cfuncdesc}
2385
2386\begin{cfuncdesc}{Py_UNICODE}{Py_UNICODE_TOUPPER}{Py_UNICODE ch}
2387Returns the character \var{ch} converted to upper case.
2388\end{cfuncdesc}
2389
2390\begin{cfuncdesc}{Py_UNICODE}{Py_UNICODE_TOTITLE}{Py_UNICODE ch}
2391Returns the character \var{ch} converted to title case.
2392\end{cfuncdesc}
2393
2394\begin{cfuncdesc}{int}{Py_UNICODE_TODECIMAL}{Py_UNICODE ch}
2395Returns the character \var{ch} converted to a decimal positive integer.
2396Returns -1 in case this is not possible. Does not raise exceptions.
2397\end{cfuncdesc}
2398
2399\begin{cfuncdesc}{int}{Py_UNICODE_TODIGIT}{Py_UNICODE ch}
2400Returns the character \var{ch} converted to a single digit integer.
2401Returns -1 in case this is not possible. Does not raise exceptions.
2402\end{cfuncdesc}
2403
2404\begin{cfuncdesc}{double}{Py_UNICODE_TONUMERIC}{Py_UNICODE ch}
2405Returns the character \var{ch} converted to a (positive) double.
2406Returns -1.0 in case this is not possible. Does not raise exceptions.
2407\end{cfuncdesc}
2408
2409% --- Plain Py_UNICODE ---------------------------------------------------
2410
2411To create Unicode objects and access their basic sequence properties,
2412use these APIs:
2413
2414\begin{cfuncdesc}{PyObject*}{PyUnicode_FromUnicode}{const Py_UNICODE *u,
2415 int size}
2416
2417Create a Unicode Object from the Py_UNICODE buffer \var{u} of the
2418given size. \var{u} may be \NULL{} which causes the contents to be
2419undefined. It is the user's responsibility to fill in the needed data.
2420The buffer is copied into the new object.
2421\end{cfuncdesc}
2422
Fred Drake1d158692000-06-18 05:21:21 +00002423\begin{cfuncdesc}{Py_UNICODE*}{PyUnicode_AsUnicode}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002424Return a read-only pointer to the Unicode object's internal
2425\ctype{Py_UNICODE} buffer.
2426\end{cfuncdesc}
2427
2428\begin{cfuncdesc}{int}{PyUnicode_GetSize}{PyObject *unicode}
2429Return the length of the Unicode object.
2430\end{cfuncdesc}
2431
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002432\begin{cfuncdesc}{PyObject*}{PyUnicode_FromEncodedObject}{PyObject *obj,
2433 const char *encoding,
2434 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002435
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002436Coerce an encoded object obj to an Unicode object and return a
2437reference with incremented refcount.
Fred Drakea4cd2612000-04-06 14:10:29 +00002438
2439Coercion is done in the following way:
2440\begin{enumerate}
2441\item Unicode objects are passed back as-is with incremented
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002442 refcount. Note: these cannot be decoded; passing a non-NULL
2443 value for encoding will result in a TypeError.
Fred Drakea4cd2612000-04-06 14:10:29 +00002444
2445\item String and other char buffer compatible objects are decoded
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002446 according to the given encoding and using the error handling
2447 defined by errors. Both can be NULL to have the interface use
2448 the default values (see the next section for details).
Fred Drakea4cd2612000-04-06 14:10:29 +00002449
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002450\item All other objects cause an exception.
Fred Drakea4cd2612000-04-06 14:10:29 +00002451\end{enumerate}
2452The API returns NULL in case of an error. The caller is responsible
2453for decref'ing the returned objects.
2454\end{cfuncdesc}
2455
Marc-André Lemburg5a20b212000-07-07 15:47:06 +00002456\begin{cfuncdesc}{PyObject*}{PyUnicode_FromObject}{PyObject *obj}
2457
2458Shortcut for PyUnicode_FromEncodedObject(obj, NULL, ``strict'')
2459which is used throughout the interpreter whenever coercion to
2460Unicode is needed.
2461\end{cfuncdesc}
2462
Fred Drakea4cd2612000-04-06 14:10:29 +00002463% --- wchar_t support for platforms which support it ---------------------
2464
2465If the platform supports \ctype{wchar_t} and provides a header file
2466wchar.h, Python can interface directly to this type using the
2467following functions. Support is optimized if Python's own
2468\ctype{Py_UNICODE} type is identical to the system's \ctype{wchar_t}.
2469
2470\begin{cfuncdesc}{PyObject*}{PyUnicode_FromWideChar}{const wchar_t *w,
2471 int size}
2472Create a Unicode Object from the \ctype{whcar_t} buffer \var{w} of the
2473given size. Returns \NULL{} on failure.
2474\end{cfuncdesc}
2475
2476\begin{cfuncdesc}{int}{PyUnicode_AsWideChar}{PyUnicodeObject *unicode,
2477 wchar_t *w,
2478 int size}
Fred Drakea4cd2612000-04-06 14:10:29 +00002479Copies the Unicode Object contents into the \ctype{whcar_t} buffer
2480\var{w}. At most \var{size} \ctype{whcar_t} characters are copied.
2481Returns the number of \ctype{whcar_t} characters copied or -1 in case
2482of an error.
2483\end{cfuncdesc}
2484
2485
2486\subsubsection{Builtin Codecs \label{builtinCodecs}}
2487
2488Python provides a set of builtin codecs which are written in C
2489for speed. All of these codecs are directly usable via the
2490following functions.
2491
2492Many of the following APIs take two arguments encoding and
2493errors. These parameters encoding and errors have the same semantics
2494as the ones of the builtin unicode() Unicode object constructor.
2495
2496Setting encoding to NULL causes the default encoding to be used which
2497is UTF-8.
2498
2499Error handling is set by errors which may also be set to NULL meaning
2500to use the default handling defined for the codec. Default error
2501handling for all builtin codecs is ``strict'' (ValueErrors are raised).
2502
2503The codecs all use a similar interface. Only deviation from the
2504following generic ones are documented for simplicity.
2505
2506% --- Generic Codecs -----------------------------------------------------
2507
2508These are the generic codec APIs:
2509
2510\begin{cfuncdesc}{PyObject*}{PyUnicode_Decode}{const char *s,
2511 int size,
2512 const char *encoding,
2513 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002514Create a Unicode object by decoding \var{size} bytes of the encoded
2515string \var{s}. \var{encoding} and \var{errors} have the same meaning
2516as the parameters of the same name in the unicode() builtin
2517function. The codec to be used is looked up using the Python codec
2518registry. Returns \NULL{} in case an exception was raised by the
2519codec.
2520\end{cfuncdesc}
2521
2522\begin{cfuncdesc}{PyObject*}{PyUnicode_Encode}{const Py_UNICODE *s,
2523 int size,
2524 const char *encoding,
2525 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002526Encodes the \ctype{Py_UNICODE} buffer of the given size and returns a
2527Python string object. \var{encoding} and \var{errors} have the same
2528meaning as the parameters of the same name in the Unicode .encode()
2529method. The codec to be used is looked up using the Python codec
2530registry. Returns \NULL{} in case an exception was raised by the
2531codec.
2532\end{cfuncdesc}
2533
2534\begin{cfuncdesc}{PyObject*}{PyUnicode_AsEncodedString}{PyObject *unicode,
2535 const char *encoding,
2536 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002537Encodes a Unicode object and returns the result as Python string
2538object. \var{encoding} and \var{errors} have the same meaning as the
2539parameters of the same name in the Unicode .encode() method. The codec
2540to be used is looked up using the Python codec registry. Returns
2541\NULL{} in case an exception was raised by the codec.
2542\end{cfuncdesc}
2543
2544% --- UTF-8 Codecs -------------------------------------------------------
2545
2546These are the UTF-8 codec APIs:
2547
2548\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeUTF8}{const char *s,
2549 int size,
2550 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002551Creates a Unicode object by decoding \var{size} bytes of the UTF-8
2552encoded string \var{s}. Returns \NULL{} in case an exception was
2553raised by the codec.
2554\end{cfuncdesc}
2555
2556\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeUTF8}{const Py_UNICODE *s,
2557 int size,
2558 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002559Encodes the \ctype{Py_UNICODE} buffer of the given size using UTF-8
2560and returns a Python string object. Returns \NULL{} in case an
2561exception was raised by the codec.
2562\end{cfuncdesc}
2563
2564\begin{cfuncdesc}{PyObject*}{PyUnicode_AsUTF8String}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002565Encodes a Unicode objects using UTF-8 and returns the result as Python
2566string object. Error handling is ``strict''. Returns
2567\NULL{} in case an exception was raised by the codec.
2568\end{cfuncdesc}
2569
2570% --- UTF-16 Codecs ------------------------------------------------------ */
2571
2572These are the UTF-16 codec APIs:
2573
2574\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeUTF16}{const char *s,
2575 int size,
2576 const char *errors,
2577 int *byteorder}
Fred Drakea4cd2612000-04-06 14:10:29 +00002578Decodes \var{length} bytes from a UTF-16 encoded buffer string and
2579returns the corresponding Unicode object.
2580
2581\var{errors} (if non-NULL) defines the error handling. It defaults
2582to ``strict''.
2583
2584If \var{byteorder} is non-\NULL{}, the decoder starts decoding using
2585the given byte order:
2586
2587\begin{verbatim}
2588 *byteorder == -1: little endian
2589 *byteorder == 0: native order
2590 *byteorder == 1: big endian
2591\end{verbatim}
2592
2593and then switches according to all byte order marks (BOM) it finds in
2594the input data. BOM marks are not copied into the resulting Unicode
2595string. After completion, \var{*byteorder} is set to the current byte
2596order at the end of input data.
2597
2598If \var{byteorder} is \NULL{}, the codec starts in native order mode.
2599
2600Returns \NULL{} in case an exception was raised by the codec.
2601\end{cfuncdesc}
2602
2603\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeUTF16}{const Py_UNICODE *s,
2604 int size,
2605 const char *errors,
2606 int byteorder}
Fred Drakea4cd2612000-04-06 14:10:29 +00002607Returns a Python string object holding the UTF-16 encoded value of the
2608Unicode data in \var{s}.
2609
Fred Drakea8455ab2000-06-16 19:58:42 +00002610If \var{byteorder} is not \code{0}, output is written according to the
Fred Drakea4cd2612000-04-06 14:10:29 +00002611following byte order:
2612
2613\begin{verbatim}
2614 byteorder == -1: little endian
2615 byteorder == 0: native byte order (writes a BOM mark)
2616 byteorder == 1: big endian
2617\end{verbatim}
2618
Fred Drakea8455ab2000-06-16 19:58:42 +00002619If byteorder is \code{0}, the output string will always start with the
Fred Drakea4cd2612000-04-06 14:10:29 +00002620Unicode BOM mark (U+FEFF). In the other two modes, no BOM mark is
2621prepended.
2622
2623Note that \ctype{Py_UNICODE} data is being interpreted as UTF-16
2624reduced to UCS-2. This trick makes it possible to add full UTF-16
2625capabilities at a later point without comprimising the APIs.
2626
2627Returns \NULL{} in case an exception was raised by the codec.
2628\end{cfuncdesc}
2629
2630\begin{cfuncdesc}{PyObject*}{PyUnicode_AsUTF16String}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002631Returns a Python string using the UTF-16 encoding in native byte
2632order. The string always starts with a BOM mark. Error handling is
2633``strict''. Returns \NULL{} in case an exception was raised by the
2634codec.
2635\end{cfuncdesc}
2636
2637% --- Unicode-Escape Codecs ----------------------------------------------
2638
2639These are the ``Unicode Esacpe'' codec APIs:
2640
2641\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeUnicodeEscape}{const char *s,
2642 int size,
2643 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002644Creates a Unicode object by decoding \var{size} bytes of the Unicode-Esacpe
2645encoded string \var{s}. Returns \NULL{} in case an exception was
2646raised by the codec.
2647\end{cfuncdesc}
2648
2649\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeUnicodeEscape}{const Py_UNICODE *s,
2650 int size,
2651 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002652Encodes the \ctype{Py_UNICODE} buffer of the given size using Unicode-Escape
2653and returns a Python string object. Returns \NULL{} in case an
2654exception was raised by the codec.
2655\end{cfuncdesc}
2656
2657\begin{cfuncdesc}{PyObject*}{PyUnicode_AsUnicodeEscapeString}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002658Encodes a Unicode objects using Unicode-Escape and returns the result
2659as Python string object. Error handling is ``strict''. Returns
2660\NULL{} in case an exception was raised by the codec.
2661\end{cfuncdesc}
2662
2663% --- Raw-Unicode-Escape Codecs ------------------------------------------
2664
2665These are the ``Raw Unicode Esacpe'' codec APIs:
2666
2667\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeRawUnicodeEscape}{const char *s,
2668 int size,
2669 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002670Creates a Unicode object by decoding \var{size} bytes of the Raw-Unicode-Esacpe
2671encoded string \var{s}. Returns \NULL{} in case an exception was
2672raised by the codec.
2673\end{cfuncdesc}
2674
2675\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeRawUnicodeEscape}{const Py_UNICODE *s,
2676 int size,
2677 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002678Encodes the \ctype{Py_UNICODE} buffer of the given size using Raw-Unicode-Escape
2679and returns a Python string object. Returns \NULL{} in case an
2680exception was raised by the codec.
2681\end{cfuncdesc}
2682
2683\begin{cfuncdesc}{PyObject*}{PyUnicode_AsRawUnicodeEscapeString}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002684Encodes a Unicode objects using Raw-Unicode-Escape and returns the result
2685as Python string object. Error handling is ``strict''. Returns
2686\NULL{} in case an exception was raised by the codec.
2687\end{cfuncdesc}
2688
2689% --- Latin-1 Codecs -----------------------------------------------------
2690
2691These are the Latin-1 codec APIs:
2692
2693Latin-1 corresponds to the first 256 Unicode ordinals and only these
2694are accepted by the codecs during encoding.
2695
2696\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeLatin1}{const char *s,
Fred Drake1d158692000-06-18 05:21:21 +00002697 int size,
2698 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002699Creates a Unicode object by decoding \var{size} bytes of the Latin-1
2700encoded string \var{s}. Returns \NULL{} in case an exception was
2701raised by the codec.
2702\end{cfuncdesc}
2703
2704\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeLatin1}{const Py_UNICODE *s,
Fred Drake1d158692000-06-18 05:21:21 +00002705 int size,
2706 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002707Encodes the \ctype{Py_UNICODE} buffer of the given size using Latin-1
2708and returns a Python string object. Returns \NULL{} in case an
2709exception was raised by the codec.
2710\end{cfuncdesc}
2711
2712\begin{cfuncdesc}{PyObject*}{PyUnicode_AsLatin1String}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002713Encodes a Unicode objects using Latin-1 and returns the result as
2714Python string object. Error handling is ``strict''. Returns
2715\NULL{} in case an exception was raised by the codec.
2716\end{cfuncdesc}
2717
2718% --- ASCII Codecs -------------------------------------------------------
2719
Fred Drake1d158692000-06-18 05:21:21 +00002720These are the \ASCII{} codec APIs. Only 7-bit \ASCII{} data is
2721accepted. All other codes generate errors.
Fred Drakea4cd2612000-04-06 14:10:29 +00002722
2723\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeASCII}{const char *s,
Fred Drake1d158692000-06-18 05:21:21 +00002724 int size,
2725 const char *errors}
2726Creates a Unicode object by decoding \var{size} bytes of the
2727\ASCII{} encoded string \var{s}. Returns \NULL{} in case an exception
2728was raised by the codec.
Fred Drakea4cd2612000-04-06 14:10:29 +00002729\end{cfuncdesc}
2730
2731\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeASCII}{const Py_UNICODE *s,
Fred Drake1d158692000-06-18 05:21:21 +00002732 int size,
2733 const char *errors}
2734Encodes the \ctype{Py_UNICODE} buffer of the given size using
2735\ASCII{} and returns a Python string object. Returns \NULL{} in case
2736an exception was raised by the codec.
Fred Drakea4cd2612000-04-06 14:10:29 +00002737\end{cfuncdesc}
2738
2739\begin{cfuncdesc}{PyObject*}{PyUnicode_AsASCIIString}{PyObject *unicode}
Fred Drake1d158692000-06-18 05:21:21 +00002740Encodes a Unicode objects using \ASCII{} and returns the result as Python
Fred Drakea4cd2612000-04-06 14:10:29 +00002741string object. Error handling is ``strict''. Returns
2742\NULL{} in case an exception was raised by the codec.
2743\end{cfuncdesc}
2744
2745% --- Character Map Codecs -----------------------------------------------
2746
2747These are the mapping codec APIs:
2748
2749This codec is special in that it can be used to implement many
2750different codecs (and this is in fact what was done to obtain most of
2751the standard codecs included in the \module{encodings} package). The
2752codec uses mapping to encode and decode characters.
2753
2754Decoding mappings must map single string characters to single Unicode
2755characters, integers (which are then interpreted as Unicode ordinals)
2756or None (meaning "undefined mapping" and causing an error).
2757
2758Encoding mappings must map single Unicode characters to single string
2759characters, integers (which are then interpreted as Latin-1 ordinals)
2760or None (meaning "undefined mapping" and causing an error).
2761
2762The mapping objects provided must only support the __getitem__ mapping
2763interface.
2764
2765If a character lookup fails with a LookupError, the character is
2766copied as-is meaning that its ordinal value will be interpreted as
2767Unicode or Latin-1 ordinal resp. Because of this, mappings only need
2768to contain those mappings which map characters to different code
2769points.
2770
2771\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeCharmap}{const char *s,
2772 int size,
2773 PyObject *mapping,
2774 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002775Creates a Unicode object by decoding \var{size} bytes of the encoded
2776string \var{s} using the given \var{mapping} object. Returns \NULL{}
2777in case an exception was raised by the codec.
2778\end{cfuncdesc}
2779
2780\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeCharmap}{const Py_UNICODE *s,
2781 int size,
2782 PyObject *mapping,
2783 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002784Encodes the \ctype{Py_UNICODE} buffer of the given size using the
2785given \var{mapping} object and returns a Python string object.
2786Returns \NULL{} in case an exception was raised by the codec.
2787\end{cfuncdesc}
2788
2789\begin{cfuncdesc}{PyObject*}{PyUnicode_AsCharmapString}{PyObject *unicode,
2790 PyObject *mapping}
Fred Drakea4cd2612000-04-06 14:10:29 +00002791Encodes a Unicode objects using the given \var{mapping} object and
2792returns the result as Python string object. Error handling is
2793``strict''. Returns \NULL{} in case an exception was raised by the
2794codec.
2795\end{cfuncdesc}
2796
2797The following codec API is special in that maps Unicode to Unicode.
2798
2799\begin{cfuncdesc}{PyObject*}{PyUnicode_TranslateCharmap}{const Py_UNICODE *s,
2800 int size,
2801 PyObject *table,
2802 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002803Translates a \ctype{Py_UNICODE} buffer of the given length by applying
2804a character mapping \var{table} to it and returns the resulting
Fred Drake1d158692000-06-18 05:21:21 +00002805Unicode object. Returns \NULL{} when an exception was raised by the
2806codec.
Fred Drakea4cd2612000-04-06 14:10:29 +00002807
2808The \var{mapping} table must map Unicode ordinal integers to Unicode
2809ordinal integers or None (causing deletion of the character).
2810
2811Mapping tables must only provide the __getitem__ interface,
2812e.g. dictionaries or sequences. Unmapped character ordinals (ones
2813which cause a LookupError) are left untouched and are copied as-is.
Fred Drakea4cd2612000-04-06 14:10:29 +00002814\end{cfuncdesc}
2815
2816% --- MBCS codecs for Windows --------------------------------------------
2817
Fred Drake1d158692000-06-18 05:21:21 +00002818These are the MBCS codec APIs. They are currently only available on
Fred Drakea4cd2612000-04-06 14:10:29 +00002819Windows and use the Win32 MBCS converters to implement the
Fred Drake1d158692000-06-18 05:21:21 +00002820conversions. Note that MBCS (or DBCS) is a class of encodings, not
2821just one. The target encoding is defined by the user settings on the
2822machine running the codec.
Fred Drakea4cd2612000-04-06 14:10:29 +00002823
2824\begin{cfuncdesc}{PyObject*}{PyUnicode_DecodeMBCS}{const char *s,
2825 int size,
2826 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002827Creates a Unicode object by decoding \var{size} bytes of the MBCS
Fred Drake1d158692000-06-18 05:21:21 +00002828encoded string \var{s}. Returns \NULL{} in case an exception was
Fred Drakea4cd2612000-04-06 14:10:29 +00002829raised by the codec.
2830\end{cfuncdesc}
2831
2832\begin{cfuncdesc}{PyObject*}{PyUnicode_EncodeMBCS}{const Py_UNICODE *s,
2833 int size,
2834 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002835Encodes the \ctype{Py_UNICODE} buffer of the given size using MBCS
2836and returns a Python string object. Returns \NULL{} in case an
2837exception was raised by the codec.
2838\end{cfuncdesc}
2839
2840\begin{cfuncdesc}{PyObject*}{PyUnicode_AsMBCSString}{PyObject *unicode}
Fred Drakea4cd2612000-04-06 14:10:29 +00002841Encodes a Unicode objects using MBCS and returns the result as Python
Fred Drake1d158692000-06-18 05:21:21 +00002842string object. Error handling is ``strict''. Returns \NULL{} in case
2843an exception was raised by the codec.
Fred Drakea4cd2612000-04-06 14:10:29 +00002844\end{cfuncdesc}
2845
2846% --- Methods & Slots ----------------------------------------------------
2847
2848\subsubsection{Methods and Slot Functions \label{unicodeMethodsAndSlots}}
2849
2850The following APIs are capable of handling Unicode objects and strings
2851on input (we refer to them as strings in the descriptions) and return
2852Unicode objects or integers as apporpriate.
2853
2854They all return \NULL{} or -1 in case an exception occurrs.
2855
2856\begin{cfuncdesc}{PyObject*}{PyUnicode_Concat}{PyObject *left,
2857 PyObject *right}
Fred Drakea4cd2612000-04-06 14:10:29 +00002858Concat two strings giving a new Unicode string.
2859\end{cfuncdesc}
2860
2861\begin{cfuncdesc}{PyObject*}{PyUnicode_Split}{PyObject *s,
2862 PyObject *sep,
2863 int maxsplit}
Fred Drakea4cd2612000-04-06 14:10:29 +00002864Split a string giving a list of Unicode strings.
2865
2866If sep is NULL, splitting will be done at all whitespace
2867substrings. Otherwise, splits occur at the given separator.
2868
2869At most maxsplit splits will be done. If negative, no limit is set.
2870
2871Separators are not included in the resulting list.
2872\end{cfuncdesc}
2873
2874\begin{cfuncdesc}{PyObject*}{PyUnicode_Splitlines}{PyObject *s,
2875 int maxsplit}
Fred Drake1d158692000-06-18 05:21:21 +00002876Split a Unicode string at line breaks, returning a list of Unicode
2877strings. CRLF is considered to be one line break. The Line break
2878characters are not included in the resulting strings.
Fred Drakea4cd2612000-04-06 14:10:29 +00002879\end{cfuncdesc}
2880
2881\begin{cfuncdesc}{PyObject*}{PyUnicode_Translate}{PyObject *str,
2882 PyObject *table,
2883 const char *errors}
Fred Drakea4cd2612000-04-06 14:10:29 +00002884Translate a string by applying a character mapping table to it and
2885return the resulting Unicode object.
2886
2887The mapping table must map Unicode ordinal integers to Unicode ordinal
2888integers or None (causing deletion of the character).
2889
2890Mapping tables must only provide the __getitem__ interface,
2891e.g. dictionaries or sequences. Unmapped character ordinals (ones
2892which cause a LookupError) are left untouched and are copied as-is.
2893
2894\var{errors} has the usual meaning for codecs. It may be \NULL{}
2895which indicates to use the default error handling.
Fred Drakea4cd2612000-04-06 14:10:29 +00002896\end{cfuncdesc}
2897
2898\begin{cfuncdesc}{PyObject*}{PyUnicode_Join}{PyObject *separator,
2899 PyObject *seq}
Fred Drakea4cd2612000-04-06 14:10:29 +00002900Join a sequence of strings using the given separator and return
2901the resulting Unicode string.
2902\end{cfuncdesc}
2903
2904\begin{cfuncdesc}{PyObject*}{PyUnicode_Tailmatch}{PyObject *str,
2905 PyObject *substr,
2906 int start,
2907 int end,
2908 int direction}
Fred Drakea4cd2612000-04-06 14:10:29 +00002909Return 1 if \var{substr} matches \var{str}[\var{start}:\var{end}] at
2910the given tail end (\var{direction} == -1 means to do a prefix match,
2911\var{direction} == 1 a suffix match), 0 otherwise.
2912\end{cfuncdesc}
2913
2914\begin{cfuncdesc}{PyObject*}{PyUnicode_Find}{PyObject *str,
2915 PyObject *substr,
2916 int start,
2917 int end,
2918 int direction}
Fred Drakea4cd2612000-04-06 14:10:29 +00002919Return the first position of \var{substr} in
2920\var{str}[\var{start}:\var{end}] using the given \var{direction}
2921(\var{direction} == 1 means to do a forward search,
2922\var{direction} == -1 a backward search), 0 otherwise.
2923\end{cfuncdesc}
2924
2925\begin{cfuncdesc}{PyObject*}{PyUnicode_Count}{PyObject *str,
2926 PyObject *substr,
2927 int start,
2928 int end}
Fred Drakea4cd2612000-04-06 14:10:29 +00002929Count the number of occurrences of \var{substr} in
2930\var{str}[\var{start}:\var{end}]
2931\end{cfuncdesc}
2932
2933\begin{cfuncdesc}{PyObject*}{PyUnicode_Replace}{PyObject *str,
2934 PyObject *substr,
2935 PyObject *replstr,
2936 int maxcount}
Fred Drakea4cd2612000-04-06 14:10:29 +00002937Replace at most \var{maxcount} occurrences of \var{substr} in
2938\var{str} with \var{replstr} and return the resulting Unicode object.
2939\var{maxcount} == -1 means: replace all occurrences.
2940\end{cfuncdesc}
2941
Fred Drake1d158692000-06-18 05:21:21 +00002942\begin{cfuncdesc}{int}{PyUnicode_Compare}{PyObject *left, PyObject *right}
Fred Drakea4cd2612000-04-06 14:10:29 +00002943Compare two strings and return -1, 0, 1 for less than, equal,
2944greater than resp.
2945\end{cfuncdesc}
2946
2947\begin{cfuncdesc}{PyObject*}{PyUnicode_Format}{PyObject *format,
2948 PyObject *args}
Fred Drake1d158692000-06-18 05:21:21 +00002949Returns a new string object from \var{format} and \var{args}; this is
2950analogous to \code{\var{format} \%\ \var{args}}. The
2951\var{args} argument must be a tuple.
Fred Drakea4cd2612000-04-06 14:10:29 +00002952\end{cfuncdesc}
2953
2954\begin{cfuncdesc}{int}{PyUnicode_Contains}{PyObject *container,
2955 PyObject *element}
Fred Drakea4cd2612000-04-06 14:10:29 +00002956Checks whether \var{element} is contained in \var{container} and
Fred Drake1d158692000-06-18 05:21:21 +00002957returns true or false accordingly.
Fred Drakea4cd2612000-04-06 14:10:29 +00002958
Fred Drake1d158692000-06-18 05:21:21 +00002959\var{element} has to coerce to a one element Unicode string. \code{-1} is
Fred Drakea4cd2612000-04-06 14:10:29 +00002960returned in case of an error.
2961\end{cfuncdesc}
2962
2963
Fred Drake58c5a2a1999-08-04 13:13:24 +00002964\subsection{Buffer Objects \label{bufferObjects}}
Fred Drake659ebfa2000-04-03 15:42:13 +00002965\sectionauthor{Greg Stein}{gstein@lyra.org}
Fred Drake58c5a2a1999-08-04 13:13:24 +00002966
Fred Drake659ebfa2000-04-03 15:42:13 +00002967\obindex{buffer}
2968Python objects implemented in C can export a group of functions called
2969the ``buffer\index{buffer interface} interface.'' These functions can
2970be used by an object to expose its data in a raw, byte-oriented
2971format. Clients of the object can use the buffer interface to access
2972the object data directly, without needing to copy it first.
2973
2974Two examples of objects that support
2975the buffer interface are strings and arrays. The string object exposes
2976the character contents in the buffer interface's byte-oriented
2977form. An array can also expose its contents, but it should be noted
2978that array elements may be multi-byte values.
2979
2980An example user of the buffer interface is the file object's
2981\method{write()} method. Any object that can export a series of bytes
2982through the buffer interface can be written to a file. There are a
2983number of format codes to \cfunction{PyArgs_ParseTuple()} that operate
2984against an object's buffer interface, returning data from the target
2985object.
2986
2987More information on the buffer interface is provided in the section
2988``Buffer Object Structures'' (section \ref{buffer-structs}), under
2989the description for \ctype{PyBufferProcs}\ttindex{PyBufferProcs}.
2990
2991A ``buffer object'' is defined in the \file{bufferobject.h} header
2992(included by \file{Python.h}). These objects look very similar to
2993string objects at the Python programming level: they support slicing,
2994indexing, concatenation, and some other standard string
2995operations. However, their data can come from one of two sources: from
2996a block of memory, or from another object which exports the buffer
2997interface.
2998
2999Buffer objects are useful as a way to expose the data from another
3000object's buffer interface to the Python programmer. They can also be
3001used as a zero-copy slicing mechanism. Using their ability to
3002reference a block of memory, it is possible to expose any data to the
3003Python programmer quite easily. The memory could be a large, constant
3004array in a C extension, it could be a raw block of memory for
3005manipulation before passing to an operating system library, or it
3006could be used to pass around structured data in its native, in-memory
3007format.
3008
3009\begin{ctypedesc}{PyBufferObject}
3010This subtype of \ctype{PyObject} represents a buffer object.
3011\end{ctypedesc}
Fred Drake58c5a2a1999-08-04 13:13:24 +00003012
3013\begin{cvardesc}{PyTypeObject}{PyBuffer_Type}
3014The instance of \ctype{PyTypeObject} which represents the Python
Fred Drake659ebfa2000-04-03 15:42:13 +00003015buffer type; it is the same object as \code{types.BufferType} in the
3016Python layer.\withsubitem{(in module types)}{\ttindex{BufferType}}.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003017\end{cvardesc}
3018
3019\begin{cvardesc}{int}{Py_END_OF_BUFFER}
Fred Drake659ebfa2000-04-03 15:42:13 +00003020This constant may be passed as the \var{size} parameter to
3021\cfunction{PyBuffer_FromObject()} or
3022\cfunction{PyBuffer_FromReadWriteObject()}. It indicates that the new
3023\ctype{PyBufferObject} should refer to \var{base} object from the
3024specified \var{offset} to the end of its exported buffer. Using this
3025enables the caller to avoid querying the \var{base} object for its
3026length.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003027\end{cvardesc}
3028
3029\begin{cfuncdesc}{int}{PyBuffer_Check}{PyObject *p}
3030Return true if the argument has type \cdata{PyBuffer_Type}.
3031\end{cfuncdesc}
3032
3033\begin{cfuncdesc}{PyObject*}{PyBuffer_FromObject}{PyObject *base,
3034 int offset, int size}
Fred Drake659ebfa2000-04-03 15:42:13 +00003035Return a new read-only buffer object. This raises
3036\exception{TypeError} if \var{base} doesn't support the read-only
3037buffer protocol or doesn't provide exactly one buffer segment, or it
3038raises \exception{ValueError} if \var{offset} is less than zero. The
3039buffer will hold a reference to the \var{base} object, and the
3040buffer's contents will refer to the \var{base} object's buffer
3041interface, starting as position \var{offset} and extending for
3042\var{size} bytes. If \var{size} is \constant{Py_END_OF_BUFFER}, then
3043the new buffer's contents extend to the length of the
3044\var{base} object's exported buffer data.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003045\end{cfuncdesc}
3046
3047\begin{cfuncdesc}{PyObject*}{PyBuffer_FromReadWriteObject}{PyObject *base,
3048 int offset,
3049 int size}
3050Return a new writable buffer object. Parameters and exceptions are
3051similar to those for \cfunction{PyBuffer_FromObject()}.
Fred Drake659ebfa2000-04-03 15:42:13 +00003052If the \var{base} object does not export the writeable buffer
3053protocol, then \exception{TypeError} is raised.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003054\end{cfuncdesc}
3055
3056\begin{cfuncdesc}{PyObject*}{PyBuffer_FromMemory}{void *ptr, int size}
Fred Drake659ebfa2000-04-03 15:42:13 +00003057Return a new read-only buffer object that reads from a specified
3058location in memory, with a specified size.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003059The caller is responsible for ensuring that the memory buffer, passed
3060in as \var{ptr}, is not deallocated while the returned buffer object
3061exists. Raises \exception{ValueError} if \var{size} is less than
Fred Drake659ebfa2000-04-03 15:42:13 +00003062zero. Note that \constant{Py_END_OF_BUFFER} may \emph{not} be passed
3063for the \var{size} parameter; \exception{ValueError} will be raised in
3064that case.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003065\end{cfuncdesc}
3066
3067\begin{cfuncdesc}{PyObject*}{PyBuffer_FromReadWriteMemory}{void *ptr, int size}
Fred Drake659ebfa2000-04-03 15:42:13 +00003068Similar to \cfunction{PyBuffer_FromMemory()}, but the returned buffer
3069is writable.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003070\end{cfuncdesc}
3071
3072\begin{cfuncdesc}{PyObject*}{PyBuffer_New}{int size}
3073Returns a new writable buffer object that maintains its own memory
Fred Drake659ebfa2000-04-03 15:42:13 +00003074buffer of \var{size} bytes. \exception{ValueError} is returned if
3075\var{size} is not zero or positive.
Fred Drake58c5a2a1999-08-04 13:13:24 +00003076\end{cfuncdesc}
3077
Guido van Rossum44475131998-04-21 15:30:01 +00003078
Fred Drakeefd146c1999-02-15 15:30:45 +00003079\subsection{Tuple Objects \label{tupleObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003080
Fred Drake659ebfa2000-04-03 15:42:13 +00003081\obindex{tuple}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003082\begin{ctypedesc}{PyTupleObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003083This subtype of \ctype{PyObject} represents a Python tuple object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003084\end{ctypedesc}
3085
3086\begin{cvardesc}{PyTypeObject}{PyTuple_Type}
Fred Drake659ebfa2000-04-03 15:42:13 +00003087This instance of \ctype{PyTypeObject} represents the Python tuple
3088type; it is the same object as \code{types.TupleType} in the Python
3089layer.\withsubitem{(in module types)}{\ttindex{TupleType}}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003090\end{cvardesc}
3091
3092\begin{cfuncdesc}{int}{PyTuple_Check}{PyObject *p}
3093Return true if the argument is a tuple object.
3094\end{cfuncdesc}
3095
Fred Drake659ebfa2000-04-03 15:42:13 +00003096\begin{cfuncdesc}{PyObject*}{PyTuple_New}{int len}
3097Return a new tuple object of size \var{len}, or \NULL{} on failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003098\end{cfuncdesc}
3099
Fred Drakea05460c2001-02-12 17:38:18 +00003100\begin{cfuncdesc}{int}{PyTuple_Size}{PyObject *p}
Fred Drakee058b4f1998-02-16 06:15:35 +00003101Takes a pointer to a tuple object, and returns the size
Fred Drakee5bf8b21998-02-12 21:22:28 +00003102of that tuple.
3103\end{cfuncdesc}
3104
Fred Drakea05460c2001-02-12 17:38:18 +00003105\begin{cfuncdesc}{PyObject*}{PyTuple_GetItem}{PyObject *p, int pos}
Fred Drakee058b4f1998-02-16 06:15:35 +00003106Returns the object at position \var{pos} in the tuple pointed
3107to by \var{p}. If \var{pos} is out of bounds, returns \NULL{} and
Fred Drake659ebfa2000-04-03 15:42:13 +00003108sets an \exception{IndexError} exception.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003109\end{cfuncdesc}
3110
Fred Drakea05460c2001-02-12 17:38:18 +00003111\begin{cfuncdesc}{PyObject*}{PyTuple_GET_ITEM}{PyObject *p, int pos}
Fred Drakee058b4f1998-02-16 06:15:35 +00003112Does the same, but does no checking of its arguments.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003113\end{cfuncdesc}
3114
Fred Drakea05460c2001-02-12 17:38:18 +00003115\begin{cfuncdesc}{PyObject*}{PyTuple_GetSlice}{PyObject *p,
3116 int low, int high}
Fred Drakee058b4f1998-02-16 06:15:35 +00003117Takes a slice of the tuple pointed to by \var{p} from
3118\var{low} to \var{high} and returns it as a new tuple.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003119\end{cfuncdesc}
3120
Fred Drake659ebfa2000-04-03 15:42:13 +00003121\begin{cfuncdesc}{int}{PyTuple_SetItem}{PyObject *p,
3122 int pos, PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00003123Inserts a reference to object \var{o} at position \var{pos} of
3124the tuple pointed to by \var{p}. It returns \code{0} on success.
Fred Drake659ebfa2000-04-03 15:42:13 +00003125\strong{Note:} This function ``steals'' a reference to \var{o}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003126\end{cfuncdesc}
3127
Fred Drake659ebfa2000-04-03 15:42:13 +00003128\begin{cfuncdesc}{void}{PyTuple_SET_ITEM}{PyObject *p,
3129 int pos, PyObject *o}
Fred Drakee058b4f1998-02-16 06:15:35 +00003130Does the same, but does no error checking, and
Fred Drakee5bf8b21998-02-12 21:22:28 +00003131should \emph{only} be used to fill in brand new tuples.
Fred Drake659ebfa2000-04-03 15:42:13 +00003132\strong{Note:} This function ``steals'' a reference to \var{o}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003133\end{cfuncdesc}
3134
Fred Drakea05460c2001-02-12 17:38:18 +00003135\begin{cfuncdesc}{int}{_PyTuple_Resize}{PyObject **p,
Fred Drake659ebfa2000-04-03 15:42:13 +00003136 int newsize, int last_is_sticky}
3137Can be used to resize a tuple. \var{newsize} will be the new length
3138of the tuple. Because tuples are \emph{supposed} to be immutable,
3139this should only be used if there is only one reference to the object.
3140Do \emph{not} use this if the tuple may already be known to some other
Neil Schemenauer410cb6b2000-10-05 19:38:24 +00003141part of the code. The tuple will always grow or shrink at the end. The
3142\var{last_is_sticky} flag is not used and should always be false. Think
3143of this as destroying the old tuple and creating a new one, only more
3144efficiently. Returns \code{0} on success and \code{-1} on failure (in
3145which case a \exception{MemoryError} or \exception{SystemError} will be
3146raised).
Fred Drakee5bf8b21998-02-12 21:22:28 +00003147\end{cfuncdesc}
3148
3149
Fred Drakeefd146c1999-02-15 15:30:45 +00003150\subsection{List Objects \label{listObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003151
Fred Drake659ebfa2000-04-03 15:42:13 +00003152\obindex{list}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003153\begin{ctypedesc}{PyListObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003154This subtype of \ctype{PyObject} represents a Python list object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003155\end{ctypedesc}
3156
3157\begin{cvardesc}{PyTypeObject}{PyList_Type}
Fred Drake659ebfa2000-04-03 15:42:13 +00003158This instance of \ctype{PyTypeObject} represents the Python list
3159type. This is the same object as \code{types.ListType}.
3160\withsubitem{(in module types)}{\ttindex{ListType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003161\end{cvardesc}
3162
3163\begin{cfuncdesc}{int}{PyList_Check}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003164Returns true if its argument is a \ctype{PyListObject}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003165\end{cfuncdesc}
3166
Fred Drake659ebfa2000-04-03 15:42:13 +00003167\begin{cfuncdesc}{PyObject*}{PyList_New}{int len}
3168Returns a new list of length \var{len} on success, or \NULL{} on
Guido van Rossum3c4378b1998-04-14 20:21:10 +00003169failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003170\end{cfuncdesc}
3171
Fred Drakec6fa34e1998-04-02 06:47:24 +00003172\begin{cfuncdesc}{int}{PyList_Size}{PyObject *list}
Fred Drake659ebfa2000-04-03 15:42:13 +00003173Returns the length of the list object in \var{list}; this is
3174equivalent to \samp{len(\var{list})} on a list object.
3175\bifuncindex{len}
3176\end{cfuncdesc}
3177
3178\begin{cfuncdesc}{int}{PyList_GET_SIZE}{PyObject *list}
Fred Drake5d644212000-10-07 12:31:50 +00003179Macro form of \cfunction{PyList_Size()} without error checking.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003180\end{cfuncdesc}
3181
Fred Drakec6fa34e1998-04-02 06:47:24 +00003182\begin{cfuncdesc}{PyObject*}{PyList_GetItem}{PyObject *list, int index}
Guido van Rossum44475131998-04-21 15:30:01 +00003183Returns the object at position \var{pos} in the list pointed
3184to by \var{p}. If \var{pos} is out of bounds, returns \NULL{} and
Fred Drake659ebfa2000-04-03 15:42:13 +00003185sets an \exception{IndexError} exception.
3186\end{cfuncdesc}
3187
3188\begin{cfuncdesc}{PyObject*}{PyList_GET_ITEM}{PyObject *list, int i}
3189Macro form of \cfunction{PyList_GetItem()} without error checking.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003190\end{cfuncdesc}
3191
Fred Drakec6fa34e1998-04-02 06:47:24 +00003192\begin{cfuncdesc}{int}{PyList_SetItem}{PyObject *list, int index,
3193 PyObject *item}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00003194Sets the item at index \var{index} in list to \var{item}.
Fred Drake659ebfa2000-04-03 15:42:13 +00003195\strong{Note:} This function ``steals'' a reference to \var{item}.
3196\end{cfuncdesc}
3197
3198\begin{cfuncdesc}{PyObject*}{PyList_SET_ITEM}{PyObject *list, int i,
3199 PyObject *o}
3200Macro form of \cfunction{PyList_SetItem()} without error checking.
3201\strong{Note:} This function ``steals'' a reference to \var{item}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003202\end{cfuncdesc}
3203
Fred Drakec6fa34e1998-04-02 06:47:24 +00003204\begin{cfuncdesc}{int}{PyList_Insert}{PyObject *list, int index,
Guido van Rossum44475131998-04-21 15:30:01 +00003205 PyObject *item}
3206Inserts the item \var{item} into list \var{list} in front of index
Fred Drake659ebfa2000-04-03 15:42:13 +00003207\var{index}. Returns \code{0} if successful; returns \code{-1} and
3208raises an exception if unsuccessful. Analogous to
3209\code{\var{list}.insert(\var{index}, \var{item})}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003210\end{cfuncdesc}
3211
Fred Drakec6fa34e1998-04-02 06:47:24 +00003212\begin{cfuncdesc}{int}{PyList_Append}{PyObject *list, PyObject *item}
Guido van Rossum44475131998-04-21 15:30:01 +00003213Appends the object \var{item} at the end of list \var{list}. Returns
Fred Drake659ebfa2000-04-03 15:42:13 +00003214\code{0} if successful; returns \code{-1} and sets an exception if
3215unsuccessful. Analogous to \code{\var{list}.append(\var{item})}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003216\end{cfuncdesc}
3217
Fred Drakec6fa34e1998-04-02 06:47:24 +00003218\begin{cfuncdesc}{PyObject*}{PyList_GetSlice}{PyObject *list,
3219 int low, int high}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00003220Returns a list of the objects in \var{list} containing the objects
Guido van Rossum44475131998-04-21 15:30:01 +00003221\emph{between} \var{low} and \var{high}. Returns NULL and sets an
3222exception if unsuccessful.
Fred Drake659ebfa2000-04-03 15:42:13 +00003223Analogous to \code{\var{list}[\var{low}:\var{high}]}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003224\end{cfuncdesc}
3225
Fred Drakec6fa34e1998-04-02 06:47:24 +00003226\begin{cfuncdesc}{int}{PyList_SetSlice}{PyObject *list,
3227 int low, int high,
3228 PyObject *itemlist}
Fred Drake659ebfa2000-04-03 15:42:13 +00003229Sets the slice of \var{list} between \var{low} and \var{high} to the
3230contents of \var{itemlist}. Analogous to
3231\code{\var{list}[\var{low}:\var{high}] = \var{itemlist}}. Returns
3232\code{0} on success, \code{-1} on failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003233\end{cfuncdesc}
3234
Fred Drakec6fa34e1998-04-02 06:47:24 +00003235\begin{cfuncdesc}{int}{PyList_Sort}{PyObject *list}
Fred Drake659ebfa2000-04-03 15:42:13 +00003236Sorts the items of \var{list} in place. Returns \code{0} on success,
3237\code{-1} on failure. This is equivalent to
3238\samp{\var{list}.sort()}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003239\end{cfuncdesc}
3240
Fred Drakec6fa34e1998-04-02 06:47:24 +00003241\begin{cfuncdesc}{int}{PyList_Reverse}{PyObject *list}
Fred Drake659ebfa2000-04-03 15:42:13 +00003242Reverses the items of \var{list} in place. Returns \code{0} on
3243success, \code{-1} on failure. This is the equivalent of
3244\samp{\var{list}.reverse()}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003245\end{cfuncdesc}
3246
Fred Drakec6fa34e1998-04-02 06:47:24 +00003247\begin{cfuncdesc}{PyObject*}{PyList_AsTuple}{PyObject *list}
Fred Drake659ebfa2000-04-03 15:42:13 +00003248Returns a new tuple object containing the contents of \var{list};
3249equivalent to \samp{tuple(\var{list})}.\bifuncindex{tuple}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003250\end{cfuncdesc}
3251
3252
Fred Drakeefd146c1999-02-15 15:30:45 +00003253\section{Mapping Objects \label{mapObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003254
Fred Drake659ebfa2000-04-03 15:42:13 +00003255\obindex{mapping}
3256
3257
Fred Drakeefd146c1999-02-15 15:30:45 +00003258\subsection{Dictionary Objects \label{dictObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003259
Fred Drake659ebfa2000-04-03 15:42:13 +00003260\obindex{dictionary}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003261\begin{ctypedesc}{PyDictObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003262This subtype of \ctype{PyObject} represents a Python dictionary object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003263\end{ctypedesc}
3264
3265\begin{cvardesc}{PyTypeObject}{PyDict_Type}
Fred Drake659ebfa2000-04-03 15:42:13 +00003266This instance of \ctype{PyTypeObject} represents the Python dictionary
3267type. This is exposed to Python programs as \code{types.DictType} and
3268\code{types.DictionaryType}.
3269\withsubitem{(in module types)}{\ttindex{DictType}\ttindex{DictionaryType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003270\end{cvardesc}
3271
3272\begin{cfuncdesc}{int}{PyDict_Check}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003273Returns true if its argument is a \ctype{PyDictObject}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003274\end{cfuncdesc}
3275
Fred Drakec6fa34e1998-04-02 06:47:24 +00003276\begin{cfuncdesc}{PyObject*}{PyDict_New}{}
Fred Drake659ebfa2000-04-03 15:42:13 +00003277Returns a new empty dictionary, or \NULL{} on failure.
3278\end{cfuncdesc}
3279
3280\begin{cfuncdesc}{void}{PyDict_Clear}{PyObject *p}
3281Empties an existing dictionary of all key-value pairs.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003282\end{cfuncdesc}
3283
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00003284\begin{cfuncdesc}{PyObject*}{PyDict_Copy}{PyObject *p}
Fred Drake659ebfa2000-04-03 15:42:13 +00003285Returns a new dictionary that contains the same key-value pairs as p.
3286Empties an existing dictionary of all key-value pairs.
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00003287\end{cfuncdesc}
3288
Fred Drake659ebfa2000-04-03 15:42:13 +00003289\begin{cfuncdesc}{int}{PyDict_SetItem}{PyObject *p, PyObject *key,
3290 PyObject *val}
3291Inserts \var{value} into the dictionary with a key of \var{key}.
3292\var{key} must be hashable; if it isn't, \exception{TypeError} will be
3293raised.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003294\end{cfuncdesc}
3295
Fred Drake83e01bf2001-03-16 15:41:29 +00003296\begin{cfuncdesc}{int}{PyDict_SetItemString}{PyObject *p,
Fred Drakee5bf8b21998-02-12 21:22:28 +00003297 char *key,
3298 PyObject *val}
Fred Drakee058b4f1998-02-16 06:15:35 +00003299Inserts \var{value} into the dictionary using \var{key}
Fred Drake1d158692000-06-18 05:21:21 +00003300as a key. \var{key} should be a \ctype{char*}. The key object is
Fred Drakee058b4f1998-02-16 06:15:35 +00003301created using \code{PyString_FromString(\var{key})}.
Fred Drake659ebfa2000-04-03 15:42:13 +00003302\ttindex{PyString_FromString()}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003303\end{cfuncdesc}
3304
Fred Drake659ebfa2000-04-03 15:42:13 +00003305\begin{cfuncdesc}{int}{PyDict_DelItem}{PyObject *p, PyObject *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00003306Removes the entry in dictionary \var{p} with key \var{key}.
Fred Drake659ebfa2000-04-03 15:42:13 +00003307\var{key} must be hashable; if it isn't, \exception{TypeError} is
3308raised.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003309\end{cfuncdesc}
3310
Fred Drake659ebfa2000-04-03 15:42:13 +00003311\begin{cfuncdesc}{int}{PyDict_DelItemString}{PyObject *p, char *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00003312Removes the entry in dictionary \var{p} which has a key
Fred Drake659ebfa2000-04-03 15:42:13 +00003313specified by the string \var{key}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003314\end{cfuncdesc}
3315
Fred Drake659ebfa2000-04-03 15:42:13 +00003316\begin{cfuncdesc}{PyObject*}{PyDict_GetItem}{PyObject *p, PyObject *key}
Fred Drakee058b4f1998-02-16 06:15:35 +00003317Returns the object from dictionary \var{p} which has a key
Guido van Rossum44475131998-04-21 15:30:01 +00003318\var{key}. Returns \NULL{} if the key \var{key} is not present, but
Fred Drake659ebfa2000-04-03 15:42:13 +00003319\emph{without} setting an exception.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003320\end{cfuncdesc}
3321
Fred Drake659ebfa2000-04-03 15:42:13 +00003322\begin{cfuncdesc}{PyObject*}{PyDict_GetItemString}{PyObject *p, char *key}
Fred Drakef8830d11998-04-23 14:06:01 +00003323This is the same as \cfunction{PyDict_GetItem()}, but \var{key} is
Fred Drake659ebfa2000-04-03 15:42:13 +00003324specified as a \ctype{char*}, rather than a \ctype{PyObject*}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003325\end{cfuncdesc}
3326
Fred Drake659ebfa2000-04-03 15:42:13 +00003327\begin{cfuncdesc}{PyObject*}{PyDict_Items}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003328Returns a \ctype{PyListObject} containing all the items
Guido van Rossum44475131998-04-21 15:30:01 +00003329from the dictionary, as in the dictinoary method \method{items()} (see
Fred Drakebe486461999-11-09 17:03:03 +00003330the \citetitle[../lib/lib.html]{Python Library Reference}).
Fred Drakee5bf8b21998-02-12 21:22:28 +00003331\end{cfuncdesc}
3332
Fred Drake659ebfa2000-04-03 15:42:13 +00003333\begin{cfuncdesc}{PyObject*}{PyDict_Keys}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003334Returns a \ctype{PyListObject} containing all the keys
Guido van Rossum44475131998-04-21 15:30:01 +00003335from the dictionary, as in the dictionary method \method{keys()} (see the
Fred Drakebe486461999-11-09 17:03:03 +00003336\citetitle[../lib/lib.html]{Python Library Reference}).
Fred Drakee5bf8b21998-02-12 21:22:28 +00003337\end{cfuncdesc}
3338
Fred Drake659ebfa2000-04-03 15:42:13 +00003339\begin{cfuncdesc}{PyObject*}{PyDict_Values}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003340Returns a \ctype{PyListObject} containing all the values
Guido van Rossum44475131998-04-21 15:30:01 +00003341from the dictionary \var{p}, as in the dictionary method
Fred Drakebe486461999-11-09 17:03:03 +00003342\method{values()} (see the \citetitle[../lib/lib.html]{Python Library
3343Reference}).
Fred Drakee5bf8b21998-02-12 21:22:28 +00003344\end{cfuncdesc}
3345
Fred Drake659ebfa2000-04-03 15:42:13 +00003346\begin{cfuncdesc}{int}{PyDict_Size}{PyObject *p}
3347Returns the number of items in the dictionary. This is equivalent to
3348\samp{len(\var{p})} on a dictionary.\bifuncindex{len}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003349\end{cfuncdesc}
3350
Fred Drake83e01bf2001-03-16 15:41:29 +00003351\begin{cfuncdesc}{int}{PyDict_Next}{PyObject *p, int *ppos,
Fred Drake7d45d342000-08-11 17:07:32 +00003352 PyObject **pkey, PyObject **pvalue}
Fred Drake83e01bf2001-03-16 15:41:29 +00003353Iterate over all key-value pairs in the dictionary \var{p}. The
3354\ctype{int} referred to by \var{ppos} must be initialized to \code{0}
3355prior to the first call to this function to start the iteration; the
3356function returns true for each pair in the dictionary, and false once
3357all pairs have been reported. The parameters \var{pkey} and
3358\var{pvalue} should either point to \ctype{PyObject*} variables that
3359will be filled in with each key and value, respectively, or may be
3360\NULL. The dictionary \var{p} must not be mutated during iteration.
3361For example:
Fred Drakee5bf8b21998-02-12 21:22:28 +00003362
Fred Drake83e01bf2001-03-16 15:41:29 +00003363\begin{verbatim}
3364PyObject *key, *value;
3365int pos = 0;
3366
3367while (PyDict_Next(self->dict, &pos, &key, &value)) {
3368 /* do something interesting with the values... */
3369 ...
3370}
3371\end{verbatim}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003372\end{cfuncdesc}
3373
3374
Fred Drakeefd146c1999-02-15 15:30:45 +00003375\section{Numeric Objects \label{numericObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003376
Fred Drake659ebfa2000-04-03 15:42:13 +00003377\obindex{numeric}
3378
3379
Fred Drakeefd146c1999-02-15 15:30:45 +00003380\subsection{Plain Integer Objects \label{intObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003381
Fred Drake659ebfa2000-04-03 15:42:13 +00003382\obindex{integer}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003383\begin{ctypedesc}{PyIntObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003384This subtype of \ctype{PyObject} represents a Python integer object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003385\end{ctypedesc}
3386
3387\begin{cvardesc}{PyTypeObject}{PyInt_Type}
Fred Drakef8830d11998-04-23 14:06:01 +00003388This instance of \ctype{PyTypeObject} represents the Python plain
Fred Drake659ebfa2000-04-03 15:42:13 +00003389integer type. This is the same object as \code{types.IntType}.
3390\withsubitem{(in modules types)}{\ttindex{IntType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003391\end{cvardesc}
3392
Fred Drake659ebfa2000-04-03 15:42:13 +00003393\begin{cfuncdesc}{int}{PyInt_Check}{PyObject* o}
3394Returns true if \var{o} is of type \cdata{PyInt_Type}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003395\end{cfuncdesc}
3396
Fred Drakec6fa34e1998-04-02 06:47:24 +00003397\begin{cfuncdesc}{PyObject*}{PyInt_FromLong}{long ival}
Fred Drakee058b4f1998-02-16 06:15:35 +00003398Creates a new integer object with a value of \var{ival}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003399
3400The current implementation keeps an array of integer objects for all
Fred Drakee058b4f1998-02-16 06:15:35 +00003401integers between \code{-1} and \code{100}, when you create an int in
3402that range you actually just get back a reference to the existing
3403object. So it should be possible to change the value of \code{1}. I
Fred Drake7e9d3141998-04-03 05:02:28 +00003404suspect the behaviour of Python in this case is undefined. :-)
Fred Drakee5bf8b21998-02-12 21:22:28 +00003405\end{cfuncdesc}
3406
Fred Drakee5bf8b21998-02-12 21:22:28 +00003407\begin{cfuncdesc}{long}{PyInt_AsLong}{PyObject *io}
Fred Drakef8830d11998-04-23 14:06:01 +00003408Will first attempt to cast the object to a \ctype{PyIntObject}, if
Fred Drakee058b4f1998-02-16 06:15:35 +00003409it is not already one, and then return its value.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003410\end{cfuncdesc}
3411
Fred Drake659ebfa2000-04-03 15:42:13 +00003412\begin{cfuncdesc}{long}{PyInt_AS_LONG}{PyObject *io}
3413Returns the value of the object \var{io}. No error checking is
3414performed.
3415\end{cfuncdesc}
3416
Fred Drakee5bf8b21998-02-12 21:22:28 +00003417\begin{cfuncdesc}{long}{PyInt_GetMax}{}
Fred Drake659ebfa2000-04-03 15:42:13 +00003418Returns the system's idea of the largest integer it can handle
3419(\constant{LONG_MAX}\ttindex{LONG_MAX}, as defined in the system
3420header files).
Fred Drakee5bf8b21998-02-12 21:22:28 +00003421\end{cfuncdesc}
3422
3423
Fred Drakeefd146c1999-02-15 15:30:45 +00003424\subsection{Long Integer Objects \label{longObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003425
Fred Drake659ebfa2000-04-03 15:42:13 +00003426\obindex{long integer}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003427\begin{ctypedesc}{PyLongObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003428This subtype of \ctype{PyObject} represents a Python long integer
Fred Drakee058b4f1998-02-16 06:15:35 +00003429object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003430\end{ctypedesc}
3431
3432\begin{cvardesc}{PyTypeObject}{PyLong_Type}
Fred Drakef8830d11998-04-23 14:06:01 +00003433This instance of \ctype{PyTypeObject} represents the Python long
Fred Drake659ebfa2000-04-03 15:42:13 +00003434integer type. This is the same object as \code{types.LongType}.
3435\withsubitem{(in modules types)}{\ttindex{LongType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003436\end{cvardesc}
3437
3438\begin{cfuncdesc}{int}{PyLong_Check}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003439Returns true if its argument is a \ctype{PyLongObject}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003440\end{cfuncdesc}
3441
Fred Drakec6fa34e1998-04-02 06:47:24 +00003442\begin{cfuncdesc}{PyObject*}{PyLong_FromLong}{long v}
Fred Drake659ebfa2000-04-03 15:42:13 +00003443Returns a new \ctype{PyLongObject} object from \var{v}, or \NULL{} on
3444failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003445\end{cfuncdesc}
3446
Fred Drakec6fa34e1998-04-02 06:47:24 +00003447\begin{cfuncdesc}{PyObject*}{PyLong_FromUnsignedLong}{unsigned long v}
Fred Drake659ebfa2000-04-03 15:42:13 +00003448Returns a new \ctype{PyLongObject} object from a C \ctype{unsigned
3449long}, or \NULL{} on failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003450\end{cfuncdesc}
3451
Fred Drakec6fa34e1998-04-02 06:47:24 +00003452\begin{cfuncdesc}{PyObject*}{PyLong_FromDouble}{double v}
Fred Drake659ebfa2000-04-03 15:42:13 +00003453Returns a new \ctype{PyLongObject} object from the integer part of
3454\var{v}, or \NULL{} on failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003455\end{cfuncdesc}
3456
Fred Drakec6fa34e1998-04-02 06:47:24 +00003457\begin{cfuncdesc}{long}{PyLong_AsLong}{PyObject *pylong}
Fred Drake659ebfa2000-04-03 15:42:13 +00003458Returns a C \ctype{long} representation of the contents of
3459\var{pylong}. If \var{pylong} is greater than
3460\constant{LONG_MAX}\ttindex{LONG_MAX}, an \exception{OverflowError} is
3461raised.\withsubitem{(built-in exception)}{OverflowError}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003462\end{cfuncdesc}
3463
Fred Drakec6fa34e1998-04-02 06:47:24 +00003464\begin{cfuncdesc}{unsigned long}{PyLong_AsUnsignedLong}{PyObject *pylong}
Fred Drake659ebfa2000-04-03 15:42:13 +00003465Returns a C \ctype{unsigned long} representation of the contents of
3466\var{pylong}. If \var{pylong} is greater than
3467\constant{ULONG_MAX}\ttindex{ULONG_MAX}, an \exception{OverflowError}
3468is raised.\withsubitem{(built-in exception)}{OverflowError}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003469\end{cfuncdesc}
3470
Fred Drakec6fa34e1998-04-02 06:47:24 +00003471\begin{cfuncdesc}{double}{PyLong_AsDouble}{PyObject *pylong}
Fred Drake659ebfa2000-04-03 15:42:13 +00003472Returns a C \ctype{double} representation of the contents of \var{pylong}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003473\end{cfuncdesc}
3474
Fred Drakec6fa34e1998-04-02 06:47:24 +00003475\begin{cfuncdesc}{PyObject*}{PyLong_FromString}{char *str, char **pend,
3476 int base}
Fred Drake659ebfa2000-04-03 15:42:13 +00003477Return a new \ctype{PyLongObject} based on the string value in
3478\var{str}, which is interpreted according to the radix in \var{base}.
3479If \var{pend} is non-\NULL, \code{*\var{pend}} will point to the first
3480character in \var{str} which follows the representation of the
3481number. If \var{base} is \code{0}, the radix will be determined base
3482on the leading characters of \var{str}: if \var{str} starts with
3483\code{'0x'} or \code{'0X'}, radix 16 will be used; if \var{str} starts
3484with \code{'0'}, radix 8 will be used; otherwise radix 10 will be
3485used. If \var{base} is not \code{0}, it must be between \code{2} and
3486\code{36}, inclusive. Leading spaces are ignored. If there are no
3487digits, \exception{ValueError} will be raised.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003488\end{cfuncdesc}
3489
3490
Fred Drakeefd146c1999-02-15 15:30:45 +00003491\subsection{Floating Point Objects \label{floatObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003492
Fred Drake659ebfa2000-04-03 15:42:13 +00003493\obindex{floating point}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003494\begin{ctypedesc}{PyFloatObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003495This subtype of \ctype{PyObject} represents a Python floating point
Fred Drakee058b4f1998-02-16 06:15:35 +00003496object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003497\end{ctypedesc}
3498
3499\begin{cvardesc}{PyTypeObject}{PyFloat_Type}
Fred Drakef8830d11998-04-23 14:06:01 +00003500This instance of \ctype{PyTypeObject} represents the Python floating
Fred Drake659ebfa2000-04-03 15:42:13 +00003501point type. This is the same object as \code{types.FloatType}.
3502\withsubitem{(in modules types)}{\ttindex{FloatType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003503\end{cvardesc}
3504
3505\begin{cfuncdesc}{int}{PyFloat_Check}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003506Returns true if its argument is a \ctype{PyFloatObject}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003507\end{cfuncdesc}
3508
Fred Drakec6fa34e1998-04-02 06:47:24 +00003509\begin{cfuncdesc}{PyObject*}{PyFloat_FromDouble}{double v}
Fred Drake659ebfa2000-04-03 15:42:13 +00003510Creates a \ctype{PyFloatObject} object from \var{v}, or \NULL{} on
3511failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003512\end{cfuncdesc}
3513
Fred Drakec6fa34e1998-04-02 06:47:24 +00003514\begin{cfuncdesc}{double}{PyFloat_AsDouble}{PyObject *pyfloat}
Fred Drake659ebfa2000-04-03 15:42:13 +00003515Returns a C \ctype{double} representation of the contents of \var{pyfloat}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003516\end{cfuncdesc}
3517
Fred Drakec6fa34e1998-04-02 06:47:24 +00003518\begin{cfuncdesc}{double}{PyFloat_AS_DOUBLE}{PyObject *pyfloat}
Fred Drake659ebfa2000-04-03 15:42:13 +00003519Returns a C \ctype{double} representation of the contents of
Fred Drakef8830d11998-04-23 14:06:01 +00003520\var{pyfloat}, but without error checking.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003521\end{cfuncdesc}
3522
3523
Fred Drakeefd146c1999-02-15 15:30:45 +00003524\subsection{Complex Number Objects \label{complexObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003525
Fred Drake659ebfa2000-04-03 15:42:13 +00003526\obindex{complex number}
3527Python's complex number objects are implemented as two distinct types
3528when viewed from the C API: one is the Python object exposed to
3529Python programs, and the other is a C structure which represents the
3530actual complex number value. The API provides functions for working
3531with both.
3532
3533\subsubsection{Complex Numbers as C Structures}
3534
3535Note that the functions which accept these structures as parameters
3536and return them as results do so \emph{by value} rather than
3537dereferencing them through pointers. This is consistent throughout
3538the API.
3539
Fred Drakee5bf8b21998-02-12 21:22:28 +00003540\begin{ctypedesc}{Py_complex}
Fred Drake659ebfa2000-04-03 15:42:13 +00003541The C structure which corresponds to the value portion of a Python
Fred Drake4de05a91998-02-16 14:25:26 +00003542complex number object. Most of the functions for dealing with complex
3543number objects use structures of this type as input or output values,
3544as appropriate. It is defined as:
3545
Fred Drakee058b4f1998-02-16 06:15:35 +00003546\begin{verbatim}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003547typedef struct {
3548 double real;
3549 double imag;
Fred Drake4de05a91998-02-16 14:25:26 +00003550} Py_complex;
Fred Drakee058b4f1998-02-16 06:15:35 +00003551\end{verbatim}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003552\end{ctypedesc}
3553
Fred Drake659ebfa2000-04-03 15:42:13 +00003554\begin{cfuncdesc}{Py_complex}{_Py_c_sum}{Py_complex left, Py_complex right}
3555Return the sum of two complex numbers, using the C
3556\ctype{Py_complex} representation.
3557\end{cfuncdesc}
3558
3559\begin{cfuncdesc}{Py_complex}{_Py_c_diff}{Py_complex left, Py_complex right}
3560Return the difference between two complex numbers, using the C
3561\ctype{Py_complex} representation.
3562\end{cfuncdesc}
3563
3564\begin{cfuncdesc}{Py_complex}{_Py_c_neg}{Py_complex complex}
3565Return the negation of the complex number \var{complex}, using the C
3566\ctype{Py_complex} representation.
3567\end{cfuncdesc}
3568
3569\begin{cfuncdesc}{Py_complex}{_Py_c_prod}{Py_complex left, Py_complex right}
3570Return the product of two complex numbers, using the C
3571\ctype{Py_complex} representation.
3572\end{cfuncdesc}
3573
3574\begin{cfuncdesc}{Py_complex}{_Py_c_quot}{Py_complex dividend,
3575 Py_complex divisor}
3576Return the quotient of two complex numbers, using the C
3577\ctype{Py_complex} representation.
3578\end{cfuncdesc}
3579
3580\begin{cfuncdesc}{Py_complex}{_Py_c_pow}{Py_complex num, Py_complex exp}
3581Return the exponentiation of \var{num} by \var{exp}, using the C
3582\ctype{Py_complex} representation.
3583\end{cfuncdesc}
3584
3585
3586\subsubsection{Complex Numbers as Python Objects}
3587
Fred Drakee5bf8b21998-02-12 21:22:28 +00003588\begin{ctypedesc}{PyComplexObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003589This subtype of \ctype{PyObject} represents a Python complex number object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003590\end{ctypedesc}
3591
3592\begin{cvardesc}{PyTypeObject}{PyComplex_Type}
Fred Drakef8830d11998-04-23 14:06:01 +00003593This instance of \ctype{PyTypeObject} represents the Python complex
Fred Drakee5bf8b21998-02-12 21:22:28 +00003594number type.
3595\end{cvardesc}
3596
3597\begin{cfuncdesc}{int}{PyComplex_Check}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003598Returns true if its argument is a \ctype{PyComplexObject}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003599\end{cfuncdesc}
3600
Fred Drakec6fa34e1998-04-02 06:47:24 +00003601\begin{cfuncdesc}{PyObject*}{PyComplex_FromCComplex}{Py_complex v}
Fred Drake659ebfa2000-04-03 15:42:13 +00003602Create a new Python complex number object from a C
3603\ctype{Py_complex} value.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003604\end{cfuncdesc}
3605
Fred Drakec6fa34e1998-04-02 06:47:24 +00003606\begin{cfuncdesc}{PyObject*}{PyComplex_FromDoubles}{double real, double imag}
Fred Drakef8830d11998-04-23 14:06:01 +00003607Returns a new \ctype{PyComplexObject} object from \var{real} and \var{imag}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003608\end{cfuncdesc}
3609
3610\begin{cfuncdesc}{double}{PyComplex_RealAsDouble}{PyObject *op}
Fred Drake659ebfa2000-04-03 15:42:13 +00003611Returns the real part of \var{op} as a C \ctype{double}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003612\end{cfuncdesc}
3613
3614\begin{cfuncdesc}{double}{PyComplex_ImagAsDouble}{PyObject *op}
Fred Drake659ebfa2000-04-03 15:42:13 +00003615Returns the imaginary part of \var{op} as a C \ctype{double}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003616\end{cfuncdesc}
3617
3618\begin{cfuncdesc}{Py_complex}{PyComplex_AsCComplex}{PyObject *op}
Fred Drake659ebfa2000-04-03 15:42:13 +00003619Returns the \ctype{Py_complex} value of the complex number \var{op}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003620\end{cfuncdesc}
3621
3622
3623
Fred Drakeefd146c1999-02-15 15:30:45 +00003624\section{Other Objects \label{otherObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003625
Fred Drakeefd146c1999-02-15 15:30:45 +00003626\subsection{File Objects \label{fileObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003627
Fred Drake659ebfa2000-04-03 15:42:13 +00003628\obindex{file}
3629Python's built-in file objects are implemented entirely on the
3630\ctype{FILE*} support from the C standard library. This is an
3631implementation detail and may change in future releases of Python.
3632
Fred Drakee5bf8b21998-02-12 21:22:28 +00003633\begin{ctypedesc}{PyFileObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003634This subtype of \ctype{PyObject} represents a Python file object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003635\end{ctypedesc}
3636
3637\begin{cvardesc}{PyTypeObject}{PyFile_Type}
Fred Drake659ebfa2000-04-03 15:42:13 +00003638This instance of \ctype{PyTypeObject} represents the Python file
3639type. This is exposed to Python programs as \code{types.FileType}.
3640\withsubitem{(in module types)}{\ttindex{FileType}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003641\end{cvardesc}
3642
3643\begin{cfuncdesc}{int}{PyFile_Check}{PyObject *p}
Fred Drakef8830d11998-04-23 14:06:01 +00003644Returns true if its argument is a \ctype{PyFileObject}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003645\end{cfuncdesc}
3646
Fred Drake659ebfa2000-04-03 15:42:13 +00003647\begin{cfuncdesc}{PyObject*}{PyFile_FromString}{char *filename, char *mode}
3648On success, returns a new file object that is opened on the
3649file given by \var{filename}, with a file mode given by \var{mode},
3650where \var{mode} has the same semantics as the standard C routine
3651\cfunction{fopen()}\ttindex{fopen()}. On failure, returns \NULL.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003652\end{cfuncdesc}
3653
Fred Drakec6fa34e1998-04-02 06:47:24 +00003654\begin{cfuncdesc}{PyObject*}{PyFile_FromFile}{FILE *fp,
Fred Drake659ebfa2000-04-03 15:42:13 +00003655 char *name, char *mode,
3656 int (*close)(FILE*)}
3657Creates a new \ctype{PyFileObject} from the already-open standard C
3658file pointer, \var{fp}. The function \var{close} will be called when
3659the file should be closed. Returns \NULL{} on failure.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003660\end{cfuncdesc}
3661
Fred Drake659ebfa2000-04-03 15:42:13 +00003662\begin{cfuncdesc}{FILE*}{PyFile_AsFile}{PyFileObject *p}
3663Returns the file object associated with \var{p} as a \ctype{FILE*}.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003664\end{cfuncdesc}
3665
Fred Drakec6fa34e1998-04-02 06:47:24 +00003666\begin{cfuncdesc}{PyObject*}{PyFile_GetLine}{PyObject *p, int n}
Fred Drake659ebfa2000-04-03 15:42:13 +00003667Equivalent to \code{\var{p}.readline(\optional{\var{n}})}, this
3668function reads one line from the object \var{p}. \var{p} may be a
3669file object or any object with a \method{readline()} method. If
3670\var{n} is \code{0}, exactly one line is read, regardless of the
3671length of the line. If \var{n} is greater than \code{0}, no more than
3672\var{n} bytes will be read from the file; a partial line can be
3673returned. In both cases, an empty string is returned if the end of
3674the file is reached immediately. If \var{n} is less than \code{0},
3675however, one line is read regardless of length, but
3676\exception{EOFError} is raised if the end of the file is reached
3677immediately.
3678\withsubitem{(built-in exception)}{\ttindex{EOFError}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003679\end{cfuncdesc}
3680
Fred Drakec6fa34e1998-04-02 06:47:24 +00003681\begin{cfuncdesc}{PyObject*}{PyFile_Name}{PyObject *p}
Fred Drake659ebfa2000-04-03 15:42:13 +00003682Returns the name of the file specified by \var{p} as a string object.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003683\end{cfuncdesc}
3684
3685\begin{cfuncdesc}{void}{PyFile_SetBufSize}{PyFileObject *p, int n}
Fred Drake659ebfa2000-04-03 15:42:13 +00003686Available on systems with \cfunction{setvbuf()}\ttindex{setvbuf()}
3687only. This should only be called immediately after file object
3688creation.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003689\end{cfuncdesc}
3690
Fred Drake659ebfa2000-04-03 15:42:13 +00003691\begin{cfuncdesc}{int}{PyFile_SoftSpace}{PyObject *p, int newflag}
3692This function exists for internal use by the interpreter.
3693Sets the \member{softspace} attribute of \var{p} to \var{newflag} and
3694\withsubitem{(file attribute)}{\ttindex{softspace}}returns the
3695previous value. \var{p} does not have to be a file object
3696for this function to work properly; any object is supported (thought
3697its only interesting if the \member{softspace} attribute can be set).
3698This function clears any errors, and will return \code{0} as the
3699previous value if the attribute either does not exist or if there were
3700errors in retrieving it. There is no way to detect errors from this
3701function, but doing so should not be needed.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003702\end{cfuncdesc}
3703
Fred Drakec6fa34e1998-04-02 06:47:24 +00003704\begin{cfuncdesc}{int}{PyFile_WriteObject}{PyObject *obj, PyFileObject *p,
3705 int flags}
Fred Drake659ebfa2000-04-03 15:42:13 +00003706Writes object \var{obj} to file object \var{p}. The only supported
3707flag for \var{flags} is \constant{Py_PRINT_RAW}\ttindex{Py_PRINT_RAW};
3708if given, the \function{str()} of the object is written instead of the
3709\function{repr()}. Returns \code{0} on success or \code{-1} on
3710failure; the appropriate exception will be set.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003711\end{cfuncdesc}
3712
Fred Drakec6fa34e1998-04-02 06:47:24 +00003713\begin{cfuncdesc}{int}{PyFile_WriteString}{char *s, PyFileObject *p,
3714 int flags}
Fred Drake659ebfa2000-04-03 15:42:13 +00003715Writes string \var{s} to file object \var{p}. Returns \code{0} on
3716success or \code{-1} on failure; the appropriate exception will be
3717set.
Fred Drakee5bf8b21998-02-12 21:22:28 +00003718\end{cfuncdesc}
3719
3720
Fred Drake5838d0f2001-01-28 06:39:35 +00003721\subsection{Instance Objects \label{instanceObjects}}
3722
3723\obindex{instance}
3724There are very few functions specific to instance objects.
3725
3726\begin{cvardesc}{PyTypeObject}{PyInstance_Type}
3727 Type object for class instances.
3728\end{cvardesc}
3729
3730\begin{cfuncdesc}{int}{PyInstance_Check}{PyObject *obj}
3731 Returns true if \var{obj} is an instance.
3732\end{cfuncdesc}
3733
3734\begin{cfuncdesc}{PyObject*}{PyInstance_New}{PyObject *class,
3735 PyObject *arg,
3736 PyObject *kw}
3737 Create a new instance of a specific class. The parameters \var{arg}
3738 and \var{kw} are used as the positional and keyword parameters to
3739 the object's constructor.
3740\end{cfuncdesc}
3741
3742\begin{cfuncdesc}{PyObject*}{PyInstance_NewRaw}{PyObject *class,
3743 PyObject *dict}
3744 Create a new instance of a specific class without calling it's
3745 constructor. \var{class} is the class of new object. The
3746 \var{dict} parameter will be used as the object's \member{__dict__};
3747 if \NULL, a new dictionary will be created for the instance.
3748\end{cfuncdesc}
3749
3750
Fred Drakeefd146c1999-02-15 15:30:45 +00003751\subsection{Module Objects \label{moduleObjects}}
3752
3753\obindex{module}
3754There are only a few functions special to module objects.
3755
Fred Drake659ebfa2000-04-03 15:42:13 +00003756\begin{cvardesc}{PyTypeObject}{PyModule_Type}
3757This instance of \ctype{PyTypeObject} represents the Python module
3758type. This is exposed to Python programs as \code{types.ModuleType}.
3759\withsubitem{(in module types)}{\ttindex{ModuleType}}
3760\end{cvardesc}
3761
3762\begin{cfuncdesc}{int}{PyModule_Check}{PyObject *p}
3763Returns true if its argument is a module object.
Fred Drakeefd146c1999-02-15 15:30:45 +00003764\end{cfuncdesc}
3765
Fred Drake659ebfa2000-04-03 15:42:13 +00003766\begin{cfuncdesc}{PyObject*}{PyModule_New}{char *name}
3767Return a new module object with the \member{__name__} attribute set to
3768\var{name}. Only the module's \member{__doc__} and
3769\member{__name__} attributes are filled in; the caller is responsible
3770for providing a \member{__file__} attribute.
3771\withsubitem{(module attribute)}{
3772 \ttindex{__name__}\ttindex{__doc__}\ttindex{__file__}}
3773\end{cfuncdesc}
3774
3775\begin{cfuncdesc}{PyObject*}{PyModule_GetDict}{PyObject *module}
Fred Drakeefd146c1999-02-15 15:30:45 +00003776Return the dictionary object that implements \var{module}'s namespace;
3777this object is the same as the \member{__dict__} attribute of the
3778module object. This function never fails.
Fred Drake659ebfa2000-04-03 15:42:13 +00003779\withsubitem{(module attribute)}{\ttindex{__dict__}}
Fred Drakeefd146c1999-02-15 15:30:45 +00003780\end{cfuncdesc}
3781
Fred Drake659ebfa2000-04-03 15:42:13 +00003782\begin{cfuncdesc}{char*}{PyModule_GetName}{PyObject *module}
Fred Drakeefd146c1999-02-15 15:30:45 +00003783Return \var{module}'s \member{__name__} value. If the module does not
Fred Drake659ebfa2000-04-03 15:42:13 +00003784provide one, or if it is not a string, \exception{SystemError} is
3785raised and \NULL{} is returned.
3786\withsubitem{(module attribute)}{\ttindex{__name__}}
3787\withsubitem{(built-in exception)}{\ttindex{SystemError}}
Fred Drakeefd146c1999-02-15 15:30:45 +00003788\end{cfuncdesc}
3789
Fred Drake659ebfa2000-04-03 15:42:13 +00003790\begin{cfuncdesc}{char*}{PyModule_GetFilename}{PyObject *module}
Fred Drakeefd146c1999-02-15 15:30:45 +00003791Return the name of the file from which \var{module} was loaded using
3792\var{module}'s \member{__file__} attribute. If this is not defined,
Fred Drake659ebfa2000-04-03 15:42:13 +00003793or if it is not a string, raise \exception{SystemError} and return
3794\NULL.
3795\withsubitem{(module attribute)}{\ttindex{__file__}}
3796\withsubitem{(built-in exception)}{\ttindex{SystemError}}
Fred Drakeefd146c1999-02-15 15:30:45 +00003797\end{cfuncdesc}
3798
Fred Drake891150b2000-09-23 03:25:42 +00003799\begin{cfuncdesc}{int}{PyModule_AddObject}{PyObject *module,
3800 char *name, PyObject *value}
3801Add an object to \var{module} as \var{name}. This is a convenience
3802function which can be used from the module's initialization function.
3803This steals a reference to \var{value}. Returns \code{-1} on error,
3804\code{0} on success.
3805\versionadded{2.0}
3806\end{cfuncdesc}
3807
3808\begin{cfuncdesc}{int}{PyModule_AddIntConstant}{PyObject *module,
3809 char *name, int value}
3810Add an integer constant to \var{module} as \var{name}. This convenience
3811function can be used from the module's initialization function.
3812Returns \code{-1} on error, \code{0} on success.
3813\versionadded{2.0}
3814\end{cfuncdesc}
3815
3816\begin{cfuncdesc}{int}{PyModule_AddStringConstant}{PyObject *module,
3817 char *name, char *value}
3818Add a string constant to \var{module} as \var{name}. This convenience
3819function can be used from the module's initialization function. The
3820string \var{value} must be null-terminated. Returns \code{-1} on
3821error, \code{0} on success.
3822\versionadded{2.0}
3823\end{cfuncdesc}
3824
Fred Drakeefd146c1999-02-15 15:30:45 +00003825
3826\subsection{CObjects \label{cObjects}}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003827
Fred Drake659ebfa2000-04-03 15:42:13 +00003828\obindex{CObject}
3829Refer to \emph{Extending and Embedding the Python Interpreter},
3830section 1.12 (``Providing a C API for an Extension Module''), for more
3831information on using these objects.
3832
3833
Guido van Rossum44475131998-04-21 15:30:01 +00003834\begin{ctypedesc}{PyCObject}
Fred Drakef8830d11998-04-23 14:06:01 +00003835This subtype of \ctype{PyObject} represents an opaque value, useful for
Fred Drake659ebfa2000-04-03 15:42:13 +00003836C extension modules who need to pass an opaque value (as a
3837\ctype{void*} pointer) through Python code to other C code. It is
Guido van Rossum44475131998-04-21 15:30:01 +00003838often used to make a C function pointer defined in one module
3839available to other modules, so the regular import mechanism can be
3840used to access C APIs defined in dynamically loaded modules.
3841\end{ctypedesc}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003842
Fred Drake659ebfa2000-04-03 15:42:13 +00003843\begin{cfuncdesc}{int}{PyCObject_Check}{PyObject *p}
3844Returns true if its argument is a \ctype{PyCObject}.
3845\end{cfuncdesc}
3846
3847\begin{cfuncdesc}{PyObject*}{PyCObject_FromVoidPtr}{void* cobj,
Marc-André Lemburga544ea22001-01-17 18:04:31 +00003848 void (*destr)(void *)}
Fred Drake1d158692000-06-18 05:21:21 +00003849Creates a \ctype{PyCObject} from the \code{void *}\var{cobj}. The
Fred Drakedab44681999-05-13 18:41:14 +00003850\var{destr} function will be called when the object is reclaimed, unless
3851it is \NULL.
Guido van Rossum44475131998-04-21 15:30:01 +00003852\end{cfuncdesc}
3853
Fred Drake659ebfa2000-04-03 15:42:13 +00003854\begin{cfuncdesc}{PyObject*}{PyCObject_FromVoidPtrAndDesc}{void* cobj,
Marc-André Lemburga544ea22001-01-17 18:04:31 +00003855 void* desc, void (*destr)(void *, void *) }
Fred Drakef8830d11998-04-23 14:06:01 +00003856Creates a \ctype{PyCObject} from the \ctype{void *}\var{cobj}. The
3857\var{destr} function will be called when the object is reclaimed. The
3858\var{desc} argument can be used to pass extra callback data for the
3859destructor function.
Guido van Rossum44475131998-04-21 15:30:01 +00003860\end{cfuncdesc}
3861
Fred Drake659ebfa2000-04-03 15:42:13 +00003862\begin{cfuncdesc}{void*}{PyCObject_AsVoidPtr}{PyObject* self}
3863Returns the object \ctype{void *} that the
3864\ctype{PyCObject} \var{self} was created with.
Guido van Rossum44475131998-04-21 15:30:01 +00003865\end{cfuncdesc}
3866
Fred Drake659ebfa2000-04-03 15:42:13 +00003867\begin{cfuncdesc}{void*}{PyCObject_GetDesc}{PyObject* self}
3868Returns the description \ctype{void *} that the
3869\ctype{PyCObject} \var{self} was created with.
Guido van Rossum44475131998-04-21 15:30:01 +00003870\end{cfuncdesc}
Fred Drakee5bf8b21998-02-12 21:22:28 +00003871
Fred Drake659ebfa2000-04-03 15:42:13 +00003872
Fred Drakeefd146c1999-02-15 15:30:45 +00003873\chapter{Initialization, Finalization, and Threads
3874 \label{initialization}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00003875
Guido van Rossum4a944d71997-08-14 20:35:38 +00003876\begin{cfuncdesc}{void}{Py_Initialize}{}
3877Initialize the Python interpreter. In an application embedding
3878Python, this should be called before using any other Python/C API
Fred Drake659ebfa2000-04-03 15:42:13 +00003879functions; with the exception of
3880\cfunction{Py_SetProgramName()}\ttindex{Py_SetProgramName()},
3881\cfunction{PyEval_InitThreads()}\ttindex{PyEval_InitThreads()},
3882\cfunction{PyEval_ReleaseLock()}\ttindex{PyEval_ReleaseLock()},
3883and \cfunction{PyEval_AcquireLock()}\ttindex{PyEval_AcquireLock()}.
3884This initializes the table of loaded modules (\code{sys.modules}), and
3885\withsubitem{(in module sys)}{\ttindex{modules}\ttindex{path}}creates the
3886fundamental modules \module{__builtin__}\refbimodindex{__builtin__},
Fred Drake4de05a91998-02-16 14:25:26 +00003887\module{__main__}\refbimodindex{__main__} and
3888\module{sys}\refbimodindex{sys}. It also initializes the module
Fred Drake659ebfa2000-04-03 15:42:13 +00003889search\indexiii{module}{search}{path} path (\code{sys.path}).
3890It does not set \code{sys.argv}; use
3891\cfunction{PySys_SetArgv()}\ttindex{PySys_SetArgv()} for that. This
3892is a no-op when called for a second time (without calling
3893\cfunction{Py_Finalize()}\ttindex{Py_Finalize()} first). There is no
3894return value; it is a fatal error if the initialization fails.
Guido van Rossum42cefd01997-10-05 15:27:29 +00003895\end{cfuncdesc}
3896
3897\begin{cfuncdesc}{int}{Py_IsInitialized}{}
Guido van Rossum42cefd01997-10-05 15:27:29 +00003898Return true (nonzero) when the Python interpreter has been
Fred Drakee058b4f1998-02-16 06:15:35 +00003899initialized, false (zero) if not. After \cfunction{Py_Finalize()} is
3900called, this returns false until \cfunction{Py_Initialize()} is called
Guido van Rossum42cefd01997-10-05 15:27:29 +00003901again.
Guido van Rossum4a944d71997-08-14 20:35:38 +00003902\end{cfuncdesc}
3903
3904\begin{cfuncdesc}{void}{Py_Finalize}{}
Fred Drakee058b4f1998-02-16 06:15:35 +00003905Undo all initializations made by \cfunction{Py_Initialize()} and
3906subsequent use of Python/C API functions, and destroy all
3907sub-interpreters (see \cfunction{Py_NewInterpreter()} below) that were
3908created and not yet destroyed since the last call to
3909\cfunction{Py_Initialize()}. Ideally, this frees all memory allocated
3910by the Python interpreter. This is a no-op when called for a second
3911time (without calling \cfunction{Py_Initialize()} again first). There
3912is no return value; errors during finalization are ignored.
Guido van Rossum4a944d71997-08-14 20:35:38 +00003913
3914This function is provided for a number of reasons. An embedding
3915application might want to restart Python without having to restart the
3916application itself. An application that has loaded the Python
3917interpreter from a dynamically loadable library (or DLL) might want to
3918free all memory allocated by Python before unloading the DLL. During a
3919hunt for memory leaks in an application a developer might want to free
3920all memory allocated by Python before exiting from the application.
3921
Fred Drakee058b4f1998-02-16 06:15:35 +00003922\strong{Bugs and caveats:} The destruction of modules and objects in
Guido van Rossum4a944d71997-08-14 20:35:38 +00003923modules is done in random order; this may cause destructors
Fred Drakee058b4f1998-02-16 06:15:35 +00003924(\method{__del__()} methods) to fail when they depend on other objects
Guido van Rossum4a944d71997-08-14 20:35:38 +00003925(even functions) or modules. Dynamically loaded extension modules
3926loaded by Python are not unloaded. Small amounts of memory allocated
3927by the Python interpreter may not be freed (if you find a leak, please
3928report it). Memory tied up in circular references between objects is
3929not freed. Some memory allocated by extension modules may not be
3930freed. Some extension may not work properly if their initialization
3931routine is called more than once; this can happen if an applcation
Fred Drakee058b4f1998-02-16 06:15:35 +00003932calls \cfunction{Py_Initialize()} and \cfunction{Py_Finalize()} more
3933than once.
Guido van Rossum4a944d71997-08-14 20:35:38 +00003934\end{cfuncdesc}
3935
Fred Drakec6fa34e1998-04-02 06:47:24 +00003936\begin{cfuncdesc}{PyThreadState*}{Py_NewInterpreter}{}
Fred Drake4de05a91998-02-16 14:25:26 +00003937Create a new sub-interpreter. This is an (almost) totally separate
3938environment for the execution of Python code. In particular, the new
3939interpreter has separate, independent versions of all imported
3940modules, including the fundamental modules
3941\module{__builtin__}\refbimodindex{__builtin__},
3942\module{__main__}\refbimodindex{__main__} and
3943\module{sys}\refbimodindex{sys}. The table of loaded modules
3944(\code{sys.modules}) and the module search path (\code{sys.path}) are
3945also separate. The new environment has no \code{sys.argv} variable.
3946It has new standard I/O stream file objects \code{sys.stdin},
3947\code{sys.stdout} and \code{sys.stderr} (however these refer to the
Fred Drake659ebfa2000-04-03 15:42:13 +00003948same underlying \ctype{FILE} structures in the C library).
3949\withsubitem{(in module sys)}{
3950 \ttindex{stdout}\ttindex{stderr}\ttindex{stdin}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00003951
3952The return value points to the first thread state created in the new
3953sub-interpreter. This thread state is made the current thread state.
3954Note that no actual thread is created; see the discussion of thread
3955states below. If creation of the new interpreter is unsuccessful,
Guido van Rossum580aa8d1997-11-25 15:34:51 +00003956\NULL{} is returned; no exception is set since the exception state
Guido van Rossum4a944d71997-08-14 20:35:38 +00003957is stored in the current thread state and there may not be a current
3958thread state. (Like all other Python/C API functions, the global
3959interpreter lock must be held before calling this function and is
3960still held when it returns; however, unlike most other Python/C API
3961functions, there needn't be a current thread state on entry.)
3962
3963Extension modules are shared between (sub-)interpreters as follows:
3964the first time a particular extension is imported, it is initialized
3965normally, and a (shallow) copy of its module's dictionary is
3966squirreled away. When the same extension is imported by another
3967(sub-)interpreter, a new module is initialized and filled with the
Fred Drakee058b4f1998-02-16 06:15:35 +00003968contents of this copy; the extension's \code{init} function is not
3969called. Note that this is different from what happens when an
3970extension is imported after the interpreter has been completely
Fred Drake659ebfa2000-04-03 15:42:13 +00003971re-initialized by calling
3972\cfunction{Py_Finalize()}\ttindex{Py_Finalize()} and
3973\cfunction{Py_Initialize()}\ttindex{Py_Initialize()}; in that case,
3974the extension's \code{init\var{module}} function \emph{is} called
3975again.
Guido van Rossum4a944d71997-08-14 20:35:38 +00003976
Fred Drakee058b4f1998-02-16 06:15:35 +00003977\strong{Bugs and caveats:} Because sub-interpreters (and the main
Guido van Rossum4a944d71997-08-14 20:35:38 +00003978interpreter) are part of the same process, the insulation between them
Fred Drakee058b4f1998-02-16 06:15:35 +00003979isn't perfect --- for example, using low-level file operations like
Fred Drake659ebfa2000-04-03 15:42:13 +00003980\withsubitem{(in module os)}{\ttindex{close()}}
Fred Drakef8830d11998-04-23 14:06:01 +00003981\function{os.close()} they can (accidentally or maliciously) affect each
Guido van Rossum4a944d71997-08-14 20:35:38 +00003982other's open files. Because of the way extensions are shared between
3983(sub-)interpreters, some extensions may not work properly; this is
3984especially likely when the extension makes use of (static) global
3985variables, or when the extension manipulates its module's dictionary
3986after its initialization. It is possible to insert objects created in
3987one sub-interpreter into a namespace of another sub-interpreter; this
3988should be done with great care to avoid sharing user-defined
3989functions, methods, instances or classes between sub-interpreters,
3990since import operations executed by such objects may affect the
3991wrong (sub-)interpreter's dictionary of loaded modules. (XXX This is
3992a hard-to-fix bug that will be addressed in a future release.)
3993\end{cfuncdesc}
3994
3995\begin{cfuncdesc}{void}{Py_EndInterpreter}{PyThreadState *tstate}
3996Destroy the (sub-)interpreter represented by the given thread state.
3997The given thread state must be the current thread state. See the
3998discussion of thread states below. When the call returns, the current
Guido van Rossum580aa8d1997-11-25 15:34:51 +00003999thread state is \NULL{}. All thread states associated with this
Guido van Rossum4a944d71997-08-14 20:35:38 +00004000interpreted are destroyed. (The global interpreter lock must be held
4001before calling this function and is still held when it returns.)
Fred Drake659ebfa2000-04-03 15:42:13 +00004002\cfunction{Py_Finalize()}\ttindex{Py_Finalize()} will destroy all
4003sub-interpreters that haven't been explicitly destroyed at that point.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004004\end{cfuncdesc}
4005
4006\begin{cfuncdesc}{void}{Py_SetProgramName}{char *name}
Fred Drake659ebfa2000-04-03 15:42:13 +00004007This function should be called before
4008\cfunction{Py_Initialize()}\ttindex{Py_Initialize()} is called
Guido van Rossum4a944d71997-08-14 20:35:38 +00004009for the first time, if it is called at all. It tells the interpreter
Fred Drake659ebfa2000-04-03 15:42:13 +00004010the value of the \code{argv[0]} argument to the
4011\cfunction{main()}\ttindex{main()} function of the program. This is
4012used by \cfunction{Py_GetPath()}\ttindex{Py_GetPath()} and some other
Guido van Rossum4a944d71997-08-14 20:35:38 +00004013functions below to find the Python run-time libraries relative to the
Fred Drakea8455ab2000-06-16 19:58:42 +00004014interpreter executable. The default value is \code{'python'}. The
Guido van Rossum4a944d71997-08-14 20:35:38 +00004015argument should point to a zero-terminated character string in static
4016storage whose contents will not change for the duration of the
4017program's execution. No code in the Python interpreter will change
4018the contents of this storage.
4019\end{cfuncdesc}
4020
Fred Drakec6fa34e1998-04-02 06:47:24 +00004021\begin{cfuncdesc}{char*}{Py_GetProgramName}{}
Fred Drake659ebfa2000-04-03 15:42:13 +00004022Return the program name set with
4023\cfunction{Py_SetProgramName()}\ttindex{Py_SetProgramName()}, or the
Guido van Rossum4a944d71997-08-14 20:35:38 +00004024default. The returned string points into static storage; the caller
4025should not modify its value.
4026\end{cfuncdesc}
4027
Fred Drakec6fa34e1998-04-02 06:47:24 +00004028\begin{cfuncdesc}{char*}{Py_GetPrefix}{}
Fred Drakee058b4f1998-02-16 06:15:35 +00004029Return the \emph{prefix} for installed platform-independent files. This
Guido van Rossum4a944d71997-08-14 20:35:38 +00004030is derived through a number of complicated rules from the program name
Fred Drakee058b4f1998-02-16 06:15:35 +00004031set with \cfunction{Py_SetProgramName()} and some environment variables;
Fred Drakea8455ab2000-06-16 19:58:42 +00004032for example, if the program name is \code{'/usr/local/bin/python'},
4033the prefix is \code{'/usr/local'}. The returned string points into
Guido van Rossum4a944d71997-08-14 20:35:38 +00004034static storage; the caller should not modify its value. This
Fred Drakec94d9341998-04-12 02:39:13 +00004035corresponds to the \makevar{prefix} variable in the top-level
Fred Drakea8455ab2000-06-16 19:58:42 +00004036\file{Makefile} and the \longprogramopt{prefix} argument to the
Fred Drakee058b4f1998-02-16 06:15:35 +00004037\program{configure} script at build time. The value is available to
Fred Drakeb0a78731998-01-13 18:51:10 +00004038Python code as \code{sys.prefix}. It is only useful on \UNIX{}. See
Guido van Rossum4a944d71997-08-14 20:35:38 +00004039also the next function.
4040\end{cfuncdesc}
4041
Fred Drakec6fa34e1998-04-02 06:47:24 +00004042\begin{cfuncdesc}{char*}{Py_GetExecPrefix}{}
Fred Drakee058b4f1998-02-16 06:15:35 +00004043Return the \emph{exec-prefix} for installed platform-\emph{de}pendent
Guido van Rossum4a944d71997-08-14 20:35:38 +00004044files. This is derived through a number of complicated rules from the
Fred Drakee058b4f1998-02-16 06:15:35 +00004045program name set with \cfunction{Py_SetProgramName()} and some environment
Guido van Rossum4a944d71997-08-14 20:35:38 +00004046variables; for example, if the program name is
Fred Drakea8455ab2000-06-16 19:58:42 +00004047\code{'/usr/local/bin/python'}, the exec-prefix is
4048\code{'/usr/local'}. The returned string points into static storage;
Guido van Rossum4a944d71997-08-14 20:35:38 +00004049the caller should not modify its value. This corresponds to the
Fred Drakec94d9341998-04-12 02:39:13 +00004050\makevar{exec_prefix} variable in the top-level \file{Makefile} and the
Fred Drakea8455ab2000-06-16 19:58:42 +00004051\longprogramopt{exec-prefix} argument to the
Fred Drake310ee611999-11-09 17:31:42 +00004052\program{configure} script at build time. The value is available to
4053Python code as \code{sys.exec_prefix}. It is only useful on \UNIX{}.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004054
4055Background: The exec-prefix differs from the prefix when platform
4056dependent files (such as executables and shared libraries) are
4057installed in a different directory tree. In a typical installation,
4058platform dependent files may be installed in the
Fred Drakea8455ab2000-06-16 19:58:42 +00004059\file{/usr/local/plat} subtree while platform independent may be
4060installed in \file{/usr/local}.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004061
4062Generally speaking, a platform is a combination of hardware and
4063software families, e.g. Sparc machines running the Solaris 2.x
4064operating system are considered the same platform, but Intel machines
4065running Solaris 2.x are another platform, and Intel machines running
4066Linux are yet another platform. Different major revisions of the same
Fred Drakeb0a78731998-01-13 18:51:10 +00004067operating system generally also form different platforms. Non-\UNIX{}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004068operating systems are a different story; the installation strategies
4069on those systems are so different that the prefix and exec-prefix are
4070meaningless, and set to the empty string. Note that compiled Python
4071bytecode files are platform independent (but not independent from the
4072Python version by which they were compiled!).
4073
Fred Drakee058b4f1998-02-16 06:15:35 +00004074System administrators will know how to configure the \program{mount} or
Fred Drakea8455ab2000-06-16 19:58:42 +00004075\program{automount} programs to share \file{/usr/local} between platforms
4076while having \file{/usr/local/plat} be a different filesystem for each
Guido van Rossum4a944d71997-08-14 20:35:38 +00004077platform.
4078\end{cfuncdesc}
4079
Fred Drakec6fa34e1998-04-02 06:47:24 +00004080\begin{cfuncdesc}{char*}{Py_GetProgramFullPath}{}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004081Return the full program name of the Python executable; this is
4082computed as a side-effect of deriving the default module search path
Fred Drake659ebfa2000-04-03 15:42:13 +00004083from the program name (set by
4084\cfunction{Py_SetProgramName()}\ttindex{Py_SetProgramName()} above).
4085The returned string points into static storage; the caller should not
Guido van Rossum4a944d71997-08-14 20:35:38 +00004086modify its value. The value is available to Python code as
Guido van Rossum42cefd01997-10-05 15:27:29 +00004087\code{sys.executable}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004088\withsubitem{(in module sys)}{\ttindex{executable}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004089\end{cfuncdesc}
4090
Fred Drakec6fa34e1998-04-02 06:47:24 +00004091\begin{cfuncdesc}{char*}{Py_GetPath}{}
Fred Drake4de05a91998-02-16 14:25:26 +00004092\indexiii{module}{search}{path}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004093Return the default module search path; this is computed from the
Fred Drakee058b4f1998-02-16 06:15:35 +00004094program name (set by \cfunction{Py_SetProgramName()} above) and some
Guido van Rossum4a944d71997-08-14 20:35:38 +00004095environment variables. The returned string consists of a series of
4096directory names separated by a platform dependent delimiter character.
Fred Drakef8830d11998-04-23 14:06:01 +00004097The delimiter character is \character{:} on \UNIX{}, \character{;} on
Fred Drake659ebfa2000-04-03 15:42:13 +00004098DOS/Windows, and \character{\e n} (the \ASCII{} newline character) on
Fred Drakee5bc4971998-02-12 23:36:49 +00004099Macintosh. The returned string points into static storage; the caller
Guido van Rossum4a944d71997-08-14 20:35:38 +00004100should not modify its value. The value is available to Python code
Fred Drake659ebfa2000-04-03 15:42:13 +00004101as the list \code{sys.path}\withsubitem{(in module sys)}{\ttindex{path}},
4102which may be modified to change the future search path for loaded
4103modules.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004104
4105% XXX should give the exact rules
4106\end{cfuncdesc}
4107
Fred Drakec6fa34e1998-04-02 06:47:24 +00004108\begin{cfuncdesc}{const char*}{Py_GetVersion}{}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004109Return the version of this Python interpreter. This is a string that
4110looks something like
4111
Guido van Rossum09270b51997-08-15 18:57:32 +00004112\begin{verbatim}
Fred Drakee058b4f1998-02-16 06:15:35 +00004113"1.5 (#67, Dec 31 1997, 22:34:28) [GCC 2.7.2.2]"
Guido van Rossum09270b51997-08-15 18:57:32 +00004114\end{verbatim}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004115
4116The first word (up to the first space character) is the current Python
4117version; the first three characters are the major and minor version
4118separated by a period. The returned string points into static storage;
4119the caller should not modify its value. The value is available to
4120Python code as the list \code{sys.version}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004121\withsubitem{(in module sys)}{\ttindex{version}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004122\end{cfuncdesc}
4123
Fred Drakec6fa34e1998-04-02 06:47:24 +00004124\begin{cfuncdesc}{const char*}{Py_GetPlatform}{}
Fred Drakeb0a78731998-01-13 18:51:10 +00004125Return the platform identifier for the current platform. On \UNIX{},
Guido van Rossum4a944d71997-08-14 20:35:38 +00004126this is formed from the ``official'' name of the operating system,
4127converted to lower case, followed by the major revision number; e.g.,
4128for Solaris 2.x, which is also known as SunOS 5.x, the value is
Fred Drakea8455ab2000-06-16 19:58:42 +00004129\code{'sunos5'}. On Macintosh, it is \code{'mac'}. On Windows, it
4130is \code{'win'}. The returned string points into static storage;
Guido van Rossum4a944d71997-08-14 20:35:38 +00004131the caller should not modify its value. The value is available to
4132Python code as \code{sys.platform}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004133\withsubitem{(in module sys)}{\ttindex{platform}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004134\end{cfuncdesc}
4135
Fred Drakec6fa34e1998-04-02 06:47:24 +00004136\begin{cfuncdesc}{const char*}{Py_GetCopyright}{}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004137Return the official copyright string for the current Python version,
4138for example
4139
Fred Drakea8455ab2000-06-16 19:58:42 +00004140\code{'Copyright 1991-1995 Stichting Mathematisch Centrum, Amsterdam'}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004141
4142The returned string points into static storage; the caller should not
4143modify its value. The value is available to Python code as the list
4144\code{sys.copyright}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004145\withsubitem{(in module sys)}{\ttindex{copyright}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004146\end{cfuncdesc}
4147
Fred Drakec6fa34e1998-04-02 06:47:24 +00004148\begin{cfuncdesc}{const char*}{Py_GetCompiler}{}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004149Return an indication of the compiler used to build the current Python
Fred Drakee058b4f1998-02-16 06:15:35 +00004150version, in square brackets, for example:
Guido van Rossum4a944d71997-08-14 20:35:38 +00004151
Fred Drakee058b4f1998-02-16 06:15:35 +00004152\begin{verbatim}
4153"[GCC 2.7.2.2]"
4154\end{verbatim}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004155
4156The returned string points into static storage; the caller should not
4157modify its value. The value is available to Python code as part of
4158the variable \code{sys.version}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004159\withsubitem{(in module sys)}{\ttindex{version}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004160\end{cfuncdesc}
4161
Fred Drakec6fa34e1998-04-02 06:47:24 +00004162\begin{cfuncdesc}{const char*}{Py_GetBuildInfo}{}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004163Return information about the sequence number and build date and time
4164of the current Python interpreter instance, for example
4165
Guido van Rossum09270b51997-08-15 18:57:32 +00004166\begin{verbatim}
4167"#67, Aug 1 1997, 22:34:28"
4168\end{verbatim}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004169
4170The returned string points into static storage; the caller should not
4171modify its value. The value is available to Python code as part of
4172the variable \code{sys.version}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004173\withsubitem{(in module sys)}{\ttindex{version}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004174\end{cfuncdesc}
4175
4176\begin{cfuncdesc}{int}{PySys_SetArgv}{int argc, char **argv}
Fred Drake659ebfa2000-04-03 15:42:13 +00004177Set \code{sys.argv} based on \var{argc} and \var{argv}. These
4178parameters are similar to those passed to the program's
4179\cfunction{main()}\ttindex{main()} function with the difference that
4180the first entry should refer to the script file to be executed rather
4181than the executable hosting the Python interpreter. If there isn't a
4182script that will be run, the first entry in \var{argv} can be an empty
4183string. If this function fails to initialize \code{sys.argv}, a fatal
4184condition is signalled using
4185\cfunction{Py_FatalError()}\ttindex{Py_FatalError()}.
4186\withsubitem{(in module sys)}{\ttindex{argv}}
4187% XXX impl. doesn't seem consistent in allowing 0/NULL for the params;
4188% check w/ Guido.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004189\end{cfuncdesc}
4190
4191% XXX Other PySys thingies (doesn't really belong in this chapter)
4192
Fred Drakeefd146c1999-02-15 15:30:45 +00004193\section{Thread State and the Global Interpreter Lock
4194 \label{threads}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004195
Fred Drake659ebfa2000-04-03 15:42:13 +00004196\index{global interpreter lock}
4197\index{interpreter lock}
4198\index{lock, interpreter}
4199
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004200The Python interpreter is not fully thread safe. In order to support
4201multi-threaded Python programs, there's a global lock that must be
4202held by the current thread before it can safely access Python objects.
4203Without the lock, even the simplest operations could cause problems in
Fred Drake7baf3d41998-02-20 00:45:52 +00004204a multi-threaded program: for example, when two threads simultaneously
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004205increment the reference count of the same object, the reference count
4206could end up being incremented only once instead of twice.
4207
4208Therefore, the rule exists that only the thread that has acquired the
4209global interpreter lock may operate on Python objects or call Python/C
4210API functions. In order to support multi-threaded Python programs,
Fred Drake659ebfa2000-04-03 15:42:13 +00004211the interpreter regularly releases and reacquires the lock --- by
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004212default, every ten bytecode instructions (this can be changed with
Fred Drake659ebfa2000-04-03 15:42:13 +00004213\withsubitem{(in module sys)}{\ttindex{setcheckinterval()}}
Fred Drakee058b4f1998-02-16 06:15:35 +00004214\function{sys.setcheckinterval()}). The lock is also released and
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004215reacquired around potentially blocking I/O operations like reading or
4216writing a file, so that other threads can run while the thread that
4217requests the I/O is waiting for the I/O operation to complete.
4218
4219The Python interpreter needs to keep some bookkeeping information
Fred Drakee058b4f1998-02-16 06:15:35 +00004220separate per thread --- for this it uses a data structure called
Fred Drake659ebfa2000-04-03 15:42:13 +00004221\ctype{PyThreadState}\ttindex{PyThreadState}. This is new in Python
42221.5; in earlier versions, such state was stored in global variables,
4223and switching threads could cause problems. In particular, exception
4224handling is now thread safe, when the application uses
4225\withsubitem{(in module sys)}{\ttindex{exc_info()}}
4226\function{sys.exc_info()} to access the exception last raised in the
4227current thread.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004228
4229There's one global variable left, however: the pointer to the current
Fred Drake659ebfa2000-04-03 15:42:13 +00004230\ctype{PyThreadState}\ttindex{PyThreadState} structure. While most
4231thread packages have a way to store ``per-thread global data,''
4232Python's internal platform independent thread abstraction doesn't
4233support this yet. Therefore, the current thread state must be
4234manipulated explicitly.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004235
4236This is easy enough in most cases. Most code manipulating the global
4237interpreter lock has the following simple structure:
4238
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004239\begin{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004240Save the thread state in a local variable.
4241Release the interpreter lock.
4242...Do some blocking I/O operation...
4243Reacquire the interpreter lock.
4244Restore the thread state from the local variable.
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004245\end{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004246
4247This is so common that a pair of macros exists to simplify it:
4248
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004249\begin{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004250Py_BEGIN_ALLOW_THREADS
4251...Do some blocking I/O operation...
4252Py_END_ALLOW_THREADS
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004253\end{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004254
Fred Drake659ebfa2000-04-03 15:42:13 +00004255The \code{Py_BEGIN_ALLOW_THREADS}\ttindex{Py_BEGIN_ALLOW_THREADS} macro
4256opens a new block and declares a hidden local variable; the
4257\code{Py_END_ALLOW_THREADS}\ttindex{Py_END_ALLOW_THREADS} macro closes
Fred Drakee058b4f1998-02-16 06:15:35 +00004258the block. Another advantage of using these two macros is that when
4259Python is compiled without thread support, they are defined empty,
4260thus saving the thread state and lock manipulations.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004261
4262When thread support is enabled, the block above expands to the
4263following code:
4264
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004265\begin{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004266 PyThreadState *_save;
Fred Drake659ebfa2000-04-03 15:42:13 +00004267
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004268 _save = PyEval_SaveThread();
4269 ...Do some blocking I/O operation...
4270 PyEval_RestoreThread(_save);
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004271\end{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004272
4273Using even lower level primitives, we can get roughly the same effect
4274as follows:
4275
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004276\begin{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004277 PyThreadState *_save;
Fred Drake659ebfa2000-04-03 15:42:13 +00004278
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004279 _save = PyThreadState_Swap(NULL);
4280 PyEval_ReleaseLock();
4281 ...Do some blocking I/O operation...
4282 PyEval_AcquireLock();
4283 PyThreadState_Swap(_save);
Guido van Rossum9faf4c51997-10-07 14:38:54 +00004284\end{verbatim}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004285
4286There are some subtle differences; in particular,
Fred Drake659ebfa2000-04-03 15:42:13 +00004287\cfunction{PyEval_RestoreThread()}\ttindex{PyEval_RestoreThread()} saves
4288and restores the value of the global variable
4289\cdata{errno}\ttindex{errno}, since the lock manipulation does not
Fred Drakef8830d11998-04-23 14:06:01 +00004290guarantee that \cdata{errno} is left alone. Also, when thread support
Fred Drake659ebfa2000-04-03 15:42:13 +00004291is disabled,
4292\cfunction{PyEval_SaveThread()}\ttindex{PyEval_SaveThread()} and
Fred Drakee058b4f1998-02-16 06:15:35 +00004293\cfunction{PyEval_RestoreThread()} don't manipulate the lock; in this
Fred Drake659ebfa2000-04-03 15:42:13 +00004294case, \cfunction{PyEval_ReleaseLock()}\ttindex{PyEval_ReleaseLock()} and
4295\cfunction{PyEval_AcquireLock()}\ttindex{PyEval_AcquireLock()} are not
4296available. This is done so that dynamically loaded extensions
4297compiled with thread support enabled can be loaded by an interpreter
4298that was compiled with disabled thread support.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004299
4300The global interpreter lock is used to protect the pointer to the
4301current thread state. When releasing the lock and saving the thread
4302state, the current thread state pointer must be retrieved before the
4303lock is released (since another thread could immediately acquire the
4304lock and store its own thread state in the global variable).
Fred Drakeffe58ca2000-09-29 17:31:54 +00004305Conversely, when acquiring the lock and restoring the thread state,
4306the lock must be acquired before storing the thread state pointer.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004307
4308Why am I going on with so much detail about this? Because when
Fred Drake659ebfa2000-04-03 15:42:13 +00004309threads are created from C, they don't have the global interpreter
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004310lock, nor is there a thread state data structure for them. Such
4311threads must bootstrap themselves into existence, by first creating a
4312thread state data structure, then acquiring the lock, and finally
4313storing their thread state pointer, before they can start using the
4314Python/C API. When they are done, they should reset the thread state
4315pointer, release the lock, and finally free their thread state data
4316structure.
4317
4318When creating a thread data structure, you need to provide an
4319interpreter state data structure. The interpreter state data
4320structure hold global data that is shared by all threads in an
4321interpreter, for example the module administration
4322(\code{sys.modules}). Depending on your needs, you can either create
4323a new interpreter state data structure, or share the interpreter state
4324data structure used by the Python main thread (to access the latter,
Fred Drakef8830d11998-04-23 14:06:01 +00004325you must obtain the thread state and access its \member{interp} member;
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004326this must be done by a thread that is created by Python or by the main
4327thread after Python is initialized).
4328
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004329
4330\begin{ctypedesc}{PyInterpreterState}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004331This data structure represents the state shared by a number of
4332cooperating threads. Threads belonging to the same interpreter
4333share their module administration and a few other internal items.
4334There are no public members in this structure.
4335
4336Threads belonging to different interpreters initially share nothing,
4337except process state like available memory, open file descriptors and
4338such. The global interpreter lock is also shared by all threads,
4339regardless of to which interpreter they belong.
4340\end{ctypedesc}
4341
4342\begin{ctypedesc}{PyThreadState}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004343This data structure represents the state of a single thread. The only
Fred Drakef8830d11998-04-23 14:06:01 +00004344public data member is \ctype{PyInterpreterState *}\member{interp},
4345which points to this thread's interpreter state.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004346\end{ctypedesc}
4347
4348\begin{cfuncdesc}{void}{PyEval_InitThreads}{}
4349Initialize and acquire the global interpreter lock. It should be
4350called in the main thread before creating a second thread or engaging
Fred Drakee058b4f1998-02-16 06:15:35 +00004351in any other thread operations such as
Fred Drake659ebfa2000-04-03 15:42:13 +00004352\cfunction{PyEval_ReleaseLock()}\ttindex{PyEval_ReleaseLock()} or
4353\code{PyEval_ReleaseThread(\var{tstate})}\ttindex{PyEval_ReleaseThread()}.
4354It is not needed before calling
4355\cfunction{PyEval_SaveThread()}\ttindex{PyEval_SaveThread()} or
4356\cfunction{PyEval_RestoreThread()}\ttindex{PyEval_RestoreThread()}.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004357
4358This is a no-op when called for a second time. It is safe to call
Fred Drake659ebfa2000-04-03 15:42:13 +00004359this function before calling
4360\cfunction{Py_Initialize()}\ttindex{Py_Initialize()}.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004361
4362When only the main thread exists, no lock operations are needed. This
4363is a common situation (most Python programs do not use threads), and
4364the lock operations slow the interpreter down a bit. Therefore, the
4365lock is not created initially. This situation is equivalent to having
4366acquired the lock: when there is only a single thread, all object
4367accesses are safe. Therefore, when this function initializes the
Fred Drake4de05a91998-02-16 14:25:26 +00004368lock, it also acquires it. Before the Python
4369\module{thread}\refbimodindex{thread} module creates a new thread,
4370knowing that either it has the lock or the lock hasn't been created
4371yet, it calls \cfunction{PyEval_InitThreads()}. When this call
4372returns, it is guaranteed that the lock has been created and that it
4373has acquired it.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004374
4375It is \strong{not} safe to call this function when it is unknown which
4376thread (if any) currently has the global interpreter lock.
4377
4378This function is not available when thread support is disabled at
4379compile time.
4380\end{cfuncdesc}
4381
Guido van Rossum4a944d71997-08-14 20:35:38 +00004382\begin{cfuncdesc}{void}{PyEval_AcquireLock}{}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004383Acquire the global interpreter lock. The lock must have been created
4384earlier. If this thread already has the lock, a deadlock ensues.
4385This function is not available when thread support is disabled at
4386compile time.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004387\end{cfuncdesc}
4388
4389\begin{cfuncdesc}{void}{PyEval_ReleaseLock}{}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004390Release the global interpreter lock. The lock must have been created
4391earlier. This function is not available when thread support is
Fred Drakee058b4f1998-02-16 06:15:35 +00004392disabled at compile time.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004393\end{cfuncdesc}
4394
4395\begin{cfuncdesc}{void}{PyEval_AcquireThread}{PyThreadState *tstate}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004396Acquire the global interpreter lock and then set the current thread
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004397state to \var{tstate}, which should not be \NULL{}. The lock must
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004398have been created earlier. If this thread already has the lock,
4399deadlock ensues. This function is not available when thread support
Fred Drakee058b4f1998-02-16 06:15:35 +00004400is disabled at compile time.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004401\end{cfuncdesc}
4402
4403\begin{cfuncdesc}{void}{PyEval_ReleaseThread}{PyThreadState *tstate}
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004404Reset the current thread state to \NULL{} and release the global
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004405interpreter lock. The lock must have been created earlier and must be
4406held by the current thread. The \var{tstate} argument, which must not
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004407be \NULL{}, is only used to check that it represents the current
Fred Drakee058b4f1998-02-16 06:15:35 +00004408thread state --- if it isn't, a fatal error is reported. This
4409function is not available when thread support is disabled at compile
4410time.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004411\end{cfuncdesc}
4412
Fred Drakec6fa34e1998-04-02 06:47:24 +00004413\begin{cfuncdesc}{PyThreadState*}{PyEval_SaveThread}{}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004414Release the interpreter lock (if it has been created and thread
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004415support is enabled) and reset the thread state to \NULL{},
4416returning the previous thread state (which is not \NULL{}). If
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004417the lock has been created, the current thread must have acquired it.
4418(This function is available even when thread support is disabled at
4419compile time.)
Guido van Rossum4a944d71997-08-14 20:35:38 +00004420\end{cfuncdesc}
4421
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004422\begin{cfuncdesc}{void}{PyEval_RestoreThread}{PyThreadState *tstate}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004423Acquire the interpreter lock (if it has been created and thread
4424support is enabled) and set the thread state to \var{tstate}, which
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004425must not be \NULL{}. If the lock has been created, the current
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004426thread must not have acquired it, otherwise deadlock ensues. (This
4427function is available even when thread support is disabled at compile
4428time.)
Guido van Rossum4a944d71997-08-14 20:35:38 +00004429\end{cfuncdesc}
4430
Fred Drake659ebfa2000-04-03 15:42:13 +00004431The following macros are normally used without a trailing semicolon;
4432look for example usage in the Python source distribution.
4433
4434\begin{csimplemacrodesc}{Py_BEGIN_ALLOW_THREADS}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004435This macro expands to
Fred Drakee058b4f1998-02-16 06:15:35 +00004436\samp{\{ PyThreadState *_save; _save = PyEval_SaveThread();}.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004437Note that it contains an opening brace; it must be matched with a
4438following \code{Py_END_ALLOW_THREADS} macro. See above for further
4439discussion of this macro. It is a no-op when thread support is
4440disabled at compile time.
Fred Drake659ebfa2000-04-03 15:42:13 +00004441\end{csimplemacrodesc}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004442
Fred Drake659ebfa2000-04-03 15:42:13 +00004443\begin{csimplemacrodesc}{Py_END_ALLOW_THREADS}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004444This macro expands to
Fred Drakee058b4f1998-02-16 06:15:35 +00004445\samp{PyEval_RestoreThread(_save); \}}.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004446Note that it contains a closing brace; it must be matched with an
4447earlier \code{Py_BEGIN_ALLOW_THREADS} macro. See above for further
4448discussion of this macro. It is a no-op when thread support is
4449disabled at compile time.
Fred Drake659ebfa2000-04-03 15:42:13 +00004450\end{csimplemacrodesc}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004451
Fred Drake659ebfa2000-04-03 15:42:13 +00004452\begin{csimplemacrodesc}{Py_BEGIN_BLOCK_THREADS}
Fred Drakee058b4f1998-02-16 06:15:35 +00004453This macro expands to \samp{PyEval_RestoreThread(_save);} i.e. it
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004454is equivalent to \code{Py_END_ALLOW_THREADS} without the closing
4455brace. It is a no-op when thread support is disabled at compile
4456time.
Fred Drake659ebfa2000-04-03 15:42:13 +00004457\end{csimplemacrodesc}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004458
Fred Drake659ebfa2000-04-03 15:42:13 +00004459\begin{csimplemacrodesc}{Py_BEGIN_UNBLOCK_THREADS}
Fred Drakee058b4f1998-02-16 06:15:35 +00004460This macro expands to \samp{_save = PyEval_SaveThread();} i.e. it is
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004461equivalent to \code{Py_BEGIN_ALLOW_THREADS} without the opening brace
4462and variable declaration. It is a no-op when thread support is
4463disabled at compile time.
Fred Drake659ebfa2000-04-03 15:42:13 +00004464\end{csimplemacrodesc}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004465
4466All of the following functions are only available when thread support
4467is enabled at compile time, and must be called only when the
Fred Drake9d20ac31998-02-16 15:27:08 +00004468interpreter lock has been created.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004469
Fred Drakec6fa34e1998-04-02 06:47:24 +00004470\begin{cfuncdesc}{PyInterpreterState*}{PyInterpreterState_New}{}
Guido van Rossumed9dcc11998-08-07 18:28:03 +00004471Create a new interpreter state object. The interpreter lock need not
4472be held, but may be held if it is necessary to serialize calls to this
4473function.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004474\end{cfuncdesc}
4475
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004476\begin{cfuncdesc}{void}{PyInterpreterState_Clear}{PyInterpreterState *interp}
4477Reset all information in an interpreter state object. The interpreter
4478lock must be held.
Guido van Rossum4a944d71997-08-14 20:35:38 +00004479\end{cfuncdesc}
4480
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004481\begin{cfuncdesc}{void}{PyInterpreterState_Delete}{PyInterpreterState *interp}
4482Destroy an interpreter state object. The interpreter lock need not be
4483held. The interpreter state must have been reset with a previous
Fred Drakee058b4f1998-02-16 06:15:35 +00004484call to \cfunction{PyInterpreterState_Clear()}.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004485\end{cfuncdesc}
4486
Fred Drakec6fa34e1998-04-02 06:47:24 +00004487\begin{cfuncdesc}{PyThreadState*}{PyThreadState_New}{PyInterpreterState *interp}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004488Create a new thread state object belonging to the given interpreter
Guido van Rossumed9dcc11998-08-07 18:28:03 +00004489object. The interpreter lock need not be held, but may be held if it
4490is necessary to serialize calls to this function.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004491\end{cfuncdesc}
4492
4493\begin{cfuncdesc}{void}{PyThreadState_Clear}{PyThreadState *tstate}
4494Reset all information in a thread state object. The interpreter lock
4495must be held.
4496\end{cfuncdesc}
4497
4498\begin{cfuncdesc}{void}{PyThreadState_Delete}{PyThreadState *tstate}
4499Destroy a thread state object. The interpreter lock need not be
4500held. The thread state must have been reset with a previous
Fred Drakee058b4f1998-02-16 06:15:35 +00004501call to \cfunction{PyThreadState_Clear()}.
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004502\end{cfuncdesc}
4503
Fred Drakec6fa34e1998-04-02 06:47:24 +00004504\begin{cfuncdesc}{PyThreadState*}{PyThreadState_Get}{}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004505Return the current thread state. The interpreter lock must be held.
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004506When the current thread state is \NULL{}, this issues a fatal
Guido van Rossum5b8a5231997-12-30 04:38:44 +00004507error (so that the caller needn't check for \NULL{}).
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004508\end{cfuncdesc}
4509
Fred Drakec6fa34e1998-04-02 06:47:24 +00004510\begin{cfuncdesc}{PyThreadState*}{PyThreadState_Swap}{PyThreadState *tstate}
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004511Swap the current thread state with the thread state given by the
Guido van Rossum580aa8d1997-11-25 15:34:51 +00004512argument \var{tstate}, which may be \NULL{}. The interpreter lock
Guido van Rossumc44d3d61997-10-06 05:10:47 +00004513must be held.
4514\end{cfuncdesc}
4515
4516
Fred Drake659ebfa2000-04-03 15:42:13 +00004517\chapter{Memory Management \label{memory}}
4518\sectionauthor{Vladimir Marangozov}{Vladimir.Marangozov@inrialpes.fr}
4519
4520
4521\section{Overview \label{memoryOverview}}
4522
4523Memory management in Python involves a private heap containing all
4524Python objects and data structures. The management of this private
4525heap is ensured internally by the \emph{Python memory manager}. The
4526Python memory manager has different components which deal with various
4527dynamic storage management aspects, like sharing, segmentation,
4528preallocation or caching.
4529
4530At the lowest level, a raw memory allocator ensures that there is
4531enough room in the private heap for storing all Python-related data
4532by interacting with the memory manager of the operating system. On top
4533of the raw memory allocator, several object-specific allocators
4534operate on the same heap and implement distinct memory management
4535policies adapted to the peculiarities of every object type. For
4536example, integer objects are managed differently within the heap than
4537strings, tuples or dictionaries because integers imply different
4538storage requirements and speed/space tradeoffs. The Python memory
4539manager thus delegates some of the work to the object-specific
4540allocators, but ensures that the latter operate within the bounds of
4541the private heap.
4542
4543It is important to understand that the management of the Python heap
4544is performed by the interpreter itself and that the user has no
4545control on it, even if she regularly manipulates object pointers to
4546memory blocks inside that heap. The allocation of heap space for
4547Python objects and other internal buffers is performed on demand by
4548the Python memory manager through the Python/C API functions listed in
4549this document.
4550
4551To avoid memory corruption, extension writers should never try to
4552operate on Python objects with the functions exported by the C
4553library: \cfunction{malloc()}\ttindex{malloc()},
4554\cfunction{calloc()}\ttindex{calloc()},
4555\cfunction{realloc()}\ttindex{realloc()} and
4556\cfunction{free()}\ttindex{free()}. This will result in
4557mixed calls between the C allocator and the Python memory manager
4558with fatal consequences, because they implement different algorithms
4559and operate on different heaps. However, one may safely allocate and
4560release memory blocks with the C library allocator for individual
4561purposes, as shown in the following example:
4562
4563\begin{verbatim}
4564 PyObject *res;
4565 char *buf = (char *) malloc(BUFSIZ); /* for I/O */
4566
4567 if (buf == NULL)
4568 return PyErr_NoMemory();
4569 ...Do some I/O operation involving buf...
4570 res = PyString_FromString(buf);
4571 free(buf); /* malloc'ed */
4572 return res;
4573\end{verbatim}
4574
4575In this example, the memory request for the I/O buffer is handled by
4576the C library allocator. The Python memory manager is involved only
4577in the allocation of the string object returned as a result.
4578
4579In most situations, however, it is recommended to allocate memory from
4580the Python heap specifically because the latter is under control of
4581the Python memory manager. For example, this is required when the
4582interpreter is extended with new object types written in C. Another
4583reason for using the Python heap is the desire to \emph{inform} the
4584Python memory manager about the memory needs of the extension module.
4585Even when the requested memory is used exclusively for internal,
4586highly-specific purposes, delegating all memory requests to the Python
4587memory manager causes the interpreter to have a more accurate image of
4588its memory footprint as a whole. Consequently, under certain
4589circumstances, the Python memory manager may or may not trigger
4590appropriate actions, like garbage collection, memory compaction or
4591other preventive procedures. Note that by using the C library
4592allocator as shown in the previous example, the allocated memory for
4593the I/O buffer escapes completely the Python memory manager.
4594
4595
4596\section{Memory Interface \label{memoryInterface}}
4597
4598The following function sets, modeled after the ANSI C standard, are
4599available for allocating and releasing memory from the Python heap:
4600
4601
Fred Drake7d45d342000-08-11 17:07:32 +00004602\begin{cfuncdesc}{void*}{PyMem_Malloc}{size_t n}
4603Allocates \var{n} bytes and returns a pointer of type \ctype{void*} to
Fred Drake659ebfa2000-04-03 15:42:13 +00004604the allocated memory, or \NULL{} if the request fails. Requesting zero
4605bytes returns a non-\NULL{} pointer.
4606\end{cfuncdesc}
4607
Fred Drake7d45d342000-08-11 17:07:32 +00004608\begin{cfuncdesc}{void*}{PyMem_Realloc}{void *p, size_t n}
Fred Drake659ebfa2000-04-03 15:42:13 +00004609Resizes the memory block pointed to by \var{p} to \var{n} bytes. The
4610contents will be unchanged to the minimum of the old and the new
4611sizes. If \var{p} is \NULL{}, the call is equivalent to
4612\cfunction{PyMem_Malloc(\var{n})}; if \var{n} is equal to zero, the memory block
4613is resized but is not freed, and the returned pointer is non-\NULL{}.
4614Unless \var{p} is \NULL{}, it must have been returned by a previous
4615call to \cfunction{PyMem_Malloc()} or \cfunction{PyMem_Realloc()}.
4616\end{cfuncdesc}
4617
Fred Drake7d45d342000-08-11 17:07:32 +00004618\begin{cfuncdesc}{void}{PyMem_Free}{void *p}
Fred Drake659ebfa2000-04-03 15:42:13 +00004619Frees the memory block pointed to by \var{p}, which must have been
4620returned by a previous call to \cfunction{PyMem_Malloc()} or
4621\cfunction{PyMem_Realloc()}. Otherwise, or if
4622\cfunction{PyMem_Free(p)} has been called before, undefined behaviour
4623occurs. If \var{p} is \NULL{}, no operation is performed.
4624\end{cfuncdesc}
4625
Fred Drake659ebfa2000-04-03 15:42:13 +00004626The following type-oriented macros are provided for convenience. Note
4627that \var{TYPE} refers to any C type.
4628
Fred Drakef913e542000-09-12 20:17:17 +00004629\begin{cfuncdesc}{\var{TYPE}*}{PyMem_New}{TYPE, size_t n}
Fred Drake659ebfa2000-04-03 15:42:13 +00004630Same as \cfunction{PyMem_Malloc()}, but allocates \code{(\var{n} *
4631sizeof(\var{TYPE}))} bytes of memory. Returns a pointer cast to
4632\ctype{\var{TYPE}*}.
4633\end{cfuncdesc}
4634
Fred Drakef913e542000-09-12 20:17:17 +00004635\begin{cfuncdesc}{\var{TYPE}*}{PyMem_Resize}{void *p, TYPE, size_t n}
Fred Drake659ebfa2000-04-03 15:42:13 +00004636Same as \cfunction{PyMem_Realloc()}, but the memory block is resized
4637to \code{(\var{n} * sizeof(\var{TYPE}))} bytes. Returns a pointer
4638cast to \ctype{\var{TYPE}*}.
4639\end{cfuncdesc}
4640
Fred Drakef913e542000-09-12 20:17:17 +00004641\begin{cfuncdesc}{void}{PyMem_Del}{void *p}
Fred Drake659ebfa2000-04-03 15:42:13 +00004642Same as \cfunction{PyMem_Free()}.
4643\end{cfuncdesc}
4644
Fred Drakef913e542000-09-12 20:17:17 +00004645In addition, the following macro sets are provided for calling the
4646Python memory allocator directly, without involving the C API functions
4647listed above. However, note that their use does not preserve binary
4648compatibility accross Python versions and is therefore deprecated in
4649extension modules.
4650
4651\cfunction{PyMem_MALLOC()}, \cfunction{PyMem_REALLOC()}, \cfunction{PyMem_FREE()}.
4652
4653\cfunction{PyMem_NEW()}, \cfunction{PyMem_RESIZE()}, \cfunction{PyMem_DEL()}.
4654
Fred Drake659ebfa2000-04-03 15:42:13 +00004655
4656\section{Examples \label{memoryExamples}}
4657
4658Here is the example from section \ref{memoryOverview}, rewritten so
4659that the I/O buffer is allocated from the Python heap by using the
4660first function set:
4661
4662\begin{verbatim}
4663 PyObject *res;
4664 char *buf = (char *) PyMem_Malloc(BUFSIZ); /* for I/O */
4665
4666 if (buf == NULL)
4667 return PyErr_NoMemory();
4668 /* ...Do some I/O operation involving buf... */
4669 res = PyString_FromString(buf);
4670 PyMem_Free(buf); /* allocated with PyMem_Malloc */
4671 return res;
4672\end{verbatim}
4673
Fred Drakef913e542000-09-12 20:17:17 +00004674The same code using the type-oriented function set:
Fred Drake659ebfa2000-04-03 15:42:13 +00004675
4676\begin{verbatim}
4677 PyObject *res;
Fred Drakef913e542000-09-12 20:17:17 +00004678 char *buf = PyMem_New(char, BUFSIZ); /* for I/O */
Fred Drake659ebfa2000-04-03 15:42:13 +00004679
4680 if (buf == NULL)
4681 return PyErr_NoMemory();
4682 /* ...Do some I/O operation involving buf... */
4683 res = PyString_FromString(buf);
Fred Drakef913e542000-09-12 20:17:17 +00004684 PyMem_Del(buf); /* allocated with PyMem_New */
Fred Drake659ebfa2000-04-03 15:42:13 +00004685 return res;
4686\end{verbatim}
4687
Fred Drakef913e542000-09-12 20:17:17 +00004688Note that in the two examples above, the buffer is always
4689manipulated via functions belonging to the same set. Indeed, it
Fred Drake659ebfa2000-04-03 15:42:13 +00004690is required to use the same memory API family for a given
4691memory block, so that the risk of mixing different allocators is
4692reduced to a minimum. The following code sequence contains two errors,
4693one of which is labeled as \emph{fatal} because it mixes two different
4694allocators operating on different heaps.
4695
4696\begin{verbatim}
Fred Drakef913e542000-09-12 20:17:17 +00004697char *buf1 = PyMem_New(char, BUFSIZ);
Fred Drake659ebfa2000-04-03 15:42:13 +00004698char *buf2 = (char *) malloc(BUFSIZ);
4699char *buf3 = (char *) PyMem_Malloc(BUFSIZ);
4700...
Fred Drakef913e542000-09-12 20:17:17 +00004701PyMem_Del(buf3); /* Wrong -- should be PyMem_Free() */
Fred Drake659ebfa2000-04-03 15:42:13 +00004702free(buf2); /* Right -- allocated via malloc() */
Fred Drakef913e542000-09-12 20:17:17 +00004703free(buf1); /* Fatal -- should be PyMem_Del() */
Fred Drake659ebfa2000-04-03 15:42:13 +00004704\end{verbatim}
4705
4706In addition to the functions aimed at handling raw memory blocks from
4707the Python heap, objects in Python are allocated and released with
Fred Drakef913e542000-09-12 20:17:17 +00004708\cfunction{PyObject_New()}, \cfunction{PyObject_NewVar()} and
4709\cfunction{PyObject_Del()}, or with their corresponding macros
4710\cfunction{PyObject_NEW()}, \cfunction{PyObject_NEW_VAR()} and
Fred Drakee06f0f92000-06-30 15:52:39 +00004711\cfunction{PyObject_DEL()}.
Fred Drake659ebfa2000-04-03 15:42:13 +00004712
Fred Drakee06f0f92000-06-30 15:52:39 +00004713These will be explained in the next chapter on defining and
4714implementing new object types in C.
Fred Drake659ebfa2000-04-03 15:42:13 +00004715
4716
Fred Drakeefd146c1999-02-15 15:30:45 +00004717\chapter{Defining New Object Types \label{newTypes}}
Guido van Rossum4a944d71997-08-14 20:35:38 +00004718
Fred Drakec6fa34e1998-04-02 06:47:24 +00004719\begin{cfuncdesc}{PyObject*}{_PyObject_New}{PyTypeObject *type}
Fred Drakee058b4f1998-02-16 06:15:35 +00004720\end{cfuncdesc}
4721
Fred Drakef913e542000-09-12 20:17:17 +00004722\begin{cfuncdesc}{PyVarObject*}{_PyObject_NewVar}{PyTypeObject *type, int size}
Fred Drakee058b4f1998-02-16 06:15:35 +00004723\end{cfuncdesc}
4724
Fred Drakef913e542000-09-12 20:17:17 +00004725\begin{cfuncdesc}{void}{_PyObject_Del}{PyObject *op}
Fred Drakee058b4f1998-02-16 06:15:35 +00004726\end{cfuncdesc}
4727
Fred Drakef913e542000-09-12 20:17:17 +00004728\begin{cfuncdesc}{PyObject*}{PyObject_Init}{PyObject *op,
Marc-André Lemburga544ea22001-01-17 18:04:31 +00004729 PyTypeObject *type}
Fred Drakef913e542000-09-12 20:17:17 +00004730\end{cfuncdesc}
4731
4732\begin{cfuncdesc}{PyVarObject*}{PyObject_InitVar}{PyVarObject *op,
Marc-André Lemburga544ea22001-01-17 18:04:31 +00004733 PyTypeObject *type, int size}
Fred Drakef913e542000-09-12 20:17:17 +00004734\end{cfuncdesc}
4735
4736\begin{cfuncdesc}{\var{TYPE}*}{PyObject_New}{TYPE, PyTypeObject *type}
4737\end{cfuncdesc}
4738
4739\begin{cfuncdesc}{\var{TYPE}*}{PyObject_NewVar}{TYPE, PyTypeObject *type,
4740 int size}
4741\end{cfuncdesc}
4742
4743\begin{cfuncdesc}{void}{PyObject_Del}{PyObject *op}
4744\end{cfuncdesc}
4745
4746\begin{cfuncdesc}{\var{TYPE}*}{PyObject_NEW}{TYPE, PyTypeObject *type}
4747\end{cfuncdesc}
4748
4749\begin{cfuncdesc}{\var{TYPE}*}{PyObject_NEW_VAR}{TYPE, PyTypeObject *type,
4750 int size}
4751\end{cfuncdesc}
4752
4753\begin{cfuncdesc}{void}{PyObject_DEL}{PyObject *op}
Fred Drakee058b4f1998-02-16 06:15:35 +00004754\end{cfuncdesc}
4755
Fred Drakeee814bf2000-11-28 22:34:32 +00004756\begin{cfuncdesc}{PyObject*}{Py_InitModule}{char *name,
4757 PyMethodDef *methods}
4758 Create a new module object based on a name and table of functions,
4759 returning the new module object.
4760\end{cfuncdesc}
4761
4762\begin{cfuncdesc}{PyObject*}{Py_InitModule3}{char *name,
4763 PyMethodDef *methods,
4764 char *doc}
4765 Create a new module object based on a name and table of functions,
4766 returning the new module object. If \var{doc} is non-\NULL, it will
4767 be used to define the docstring for the module.
4768\end{cfuncdesc}
4769
4770\begin{cfuncdesc}{PyObject*}{Py_InitModule4}{char *name,
4771 PyMethodDef *methods,
4772 char *doc, PyObject *self,
4773 int apiver}
4774 Create a new module object based on a name and table of functions,
4775 returning the new module object. If \var{doc} is non-\NULL, it will
4776 be used to define the docstring for the module. If \var{self} is
4777 non-\NULL, it will passed to the functions of the module as their
4778 (otherwise \NULL) first parameter. (This was added as an
4779 experimental feature, and there are no known uses in the current
4780 version of Python.) For \var{apiver}, the only value which should
4781 be passed is defined by the constant \constant{PYTHON_API_VERSION}.
4782
4783 \strong{Note:} Most uses of this function should probably be using
4784 the \cfunction{Py_InitModule3()} instead; only use this if you are
4785 sure you need it.
4786\end{cfuncdesc}
Guido van Rossum3c4378b1998-04-14 20:21:10 +00004787
4788PyArg_ParseTupleAndKeywords, PyArg_ParseTuple, PyArg_Parse
4789
4790Py_BuildValue
Guido van Rossumae110af1997-05-22 20:11:52 +00004791
Fred Drake659ebfa2000-04-03 15:42:13 +00004792DL_IMPORT
4793
Fred Drake659ebfa2000-04-03 15:42:13 +00004794_Py_NoneStruct
4795
4796
4797\section{Common Object Structures \label{common-structs}}
4798
Guido van Rossumae110af1997-05-22 20:11:52 +00004799PyObject, PyVarObject
4800
4801PyObject_HEAD, PyObject_HEAD_INIT, PyObject_VAR_HEAD
4802
4803Typedefs:
4804unaryfunc, binaryfunc, ternaryfunc, inquiry, coercion, intargfunc,
4805intintargfunc, intobjargproc, intintobjargproc, objobjargproc,
Guido van Rossumae110af1997-05-22 20:11:52 +00004806destructor, printfunc, getattrfunc, getattrofunc, setattrfunc,
4807setattrofunc, cmpfunc, reprfunc, hashfunc
4808
Fred Drakea8455ab2000-06-16 19:58:42 +00004809\begin{ctypedesc}{PyCFunction}
4810Type of the functions used to implement most Python callables in C.
4811\end{ctypedesc}
4812
4813\begin{ctypedesc}{PyMethodDef}
4814Structure used to describe a method of an extension type. This
4815structure has four fields:
4816
4817\begin{tableiii}{l|l|l}{member}{Field}{C Type}{Meaning}
4818 \lineiii{ml_name}{char *}{name of the method}
4819 \lineiii{ml_meth}{PyCFunction}{pointer to the C implementation}
4820 \lineiii{ml_flags}{int}{flag bits indicating how the call should be
4821 constructed}
4822 \lineiii{ml_doc}{char *}{points to the contents of the docstring}
4823\end{tableiii}
4824\end{ctypedesc}
4825
4826\begin{cfuncdesc}{PyObject*}{Py_FindMethod}{PyMethodDef[] table,
4827 PyObject *ob, char *name}
4828Return a bound method object for an extension type implemented in C.
4829This function also handles the special attribute \member{__methods__},
4830returning a list of all the method names defined in \var{table}.
4831\end{cfuncdesc}
4832
Fred Drake659ebfa2000-04-03 15:42:13 +00004833
4834\section{Mapping Object Structures \label{mapping-structs}}
4835
4836\begin{ctypedesc}{PyMappingMethods}
4837Structure used to hold pointers to the functions used to implement the
4838mapping protocol for an extension type.
4839\end{ctypedesc}
4840
4841
4842\section{Number Object Structures \label{number-structs}}
4843
4844\begin{ctypedesc}{PyNumberMethods}
4845Structure used to hold pointers to the functions an extension type
4846uses to implement the number protocol.
4847\end{ctypedesc}
4848
4849
4850\section{Sequence Object Structures \label{sequence-structs}}
4851
4852\begin{ctypedesc}{PySequenceMethods}
4853Structure used to hold pointers to the functions which an object uses
4854to implement the sequence protocol.
4855\end{ctypedesc}
4856
4857
4858\section{Buffer Object Structures \label{buffer-structs}}
4859\sectionauthor{Greg J. Stein}{greg@lyra.org}
4860
4861The buffer interface exports a model where an object can expose its
4862internal data as a set of chunks of data, where each chunk is
4863specified as a pointer/length pair. These chunks are called
4864\dfn{segments} and are presumed to be non-contiguous in memory.
4865
4866If an object does not export the buffer interface, then its
4867\member{tp_as_buffer} member in the \ctype{PyTypeObject} structure
4868should be \NULL{}. Otherwise, the \member{tp_as_buffer} will point to
4869a \ctype{PyBufferProcs} structure.
4870
4871\strong{Note:} It is very important that your
Fred Drakec392b572001-03-21 22:15:01 +00004872\ctype{PyTypeObject} structure uses \constant{Py_TPFLAGS_DEFAULT} for
4873the value of the \member{tp_flags} member rather than \code{0}. This
Fred Drake659ebfa2000-04-03 15:42:13 +00004874tells the Python runtime that your \ctype{PyBufferProcs} structure
4875contains the \member{bf_getcharbuffer} slot. Older versions of Python
4876did not have this member, so a new Python interpreter using an old
4877extension needs to be able to test for its presence before using it.
4878
4879\begin{ctypedesc}{PyBufferProcs}
4880Structure used to hold the function pointers which define an
4881implementation of the buffer protocol.
4882
4883The first slot is \member{bf_getreadbuffer}, of type
4884\ctype{getreadbufferproc}. If this slot is \NULL{}, then the object
4885does not support reading from the internal data. This is
4886non-sensical, so implementors should fill this in, but callers should
4887test that the slot contains a non-\NULL{} value.
4888
4889The next slot is \member{bf_getwritebuffer} having type
4890\ctype{getwritebufferproc}. This slot may be \NULL{} if the object
4891does not allow writing into its returned buffers.
4892
4893The third slot is \member{bf_getsegcount}, with type
4894\ctype{getsegcountproc}. This slot must not be \NULL{} and is used to
4895inform the caller how many segments the object contains. Simple
4896objects such as \ctype{PyString_Type} and
4897\ctype{PyBuffer_Type} objects contain a single segment.
4898
4899The last slot is \member{bf_getcharbuffer}, of type
4900\ctype{getcharbufferproc}. This slot will only be present if the
Fred Drakec392b572001-03-21 22:15:01 +00004901\constant{Py_TPFLAGS_HAVE_GETCHARBUFFER} flag is present in the
Fred Drake659ebfa2000-04-03 15:42:13 +00004902\member{tp_flags} field of the object's \ctype{PyTypeObject}. Before using
4903this slot, the caller should test whether it is present by using the
4904\cfunction{PyType_HasFeature()}\ttindex{PyType_HasFeature()} function.
4905If present, it may be \NULL, indicating that the object's contents
4906cannot be used as \emph{8-bit characters}.
4907The slot function may also raise an error if the object's contents
4908cannot be interpreted as 8-bit characters. For example, if the object
4909is an array which is configured to hold floating point values, an
4910exception may be raised if a caller attempts to use
4911\member{bf_getcharbuffer} to fetch a sequence of 8-bit characters.
4912This notion of exporting the internal buffers as ``text'' is used to
4913distinguish between objects that are binary in nature, and those which
4914have character-based content.
4915
4916\strong{Note:} The current policy seems to state that these characters
4917may be multi-byte characters. This implies that a buffer size of
4918\var{N} does not mean there are \var{N} characters present.
4919\end{ctypedesc}
4920
4921\begin{datadesc}{Py_TPFLAGS_HAVE_GETCHARBUFFER}
4922Flag bit set in the type structure to indicate that the
4923\member{bf_getcharbuffer} slot is known. This being set does not
4924indicate that the object supports the buffer interface or that the
4925\member{bf_getcharbuffer} slot is non-\NULL.
4926\end{datadesc}
4927
4928\begin{ctypedesc}[getreadbufferproc]{int (*getreadbufferproc)
4929 (PyObject *self, int segment, void **ptrptr)}
4930Return a pointer to a readable segment of the buffer. This function
4931is allowed to raise an exception, in which case it must return
4932\code{-1}. The \var{segment} which is passed must be zero or
4933positive, and strictly less than the number of segments returned by
4934the \member{bf_getsegcount} slot function. On success, returns
4935\code{0} and sets \code{*\var{ptrptr}} to a pointer to the buffer
4936memory.
4937\end{ctypedesc}
4938
4939\begin{ctypedesc}[getwritebufferproc]{int (*getwritebufferproc)
4940 (PyObject *self, int segment, void **ptrptr)}
Fred Drake58c5a2a1999-08-04 13:13:24 +00004941Return a pointer to a writable memory buffer in \code{*\var{ptrptr}};
4942the memory buffer must correspond to buffer segment \var{segment}.
4943Must return \code{-1} and set an exception on error.
4944\exception{TypeError} should be raised if the object only supports
4945read-only buffers, and \exception{SystemError} should be raised when
4946\var{segment} specifies a segment that doesn't exist.
4947% Why doesn't it raise ValueError for this one?
Fred Drake659ebfa2000-04-03 15:42:13 +00004948% GJS: because you shouldn't be calling it with an invalid
4949% segment. That indicates a blatant programming error in the C
4950% code.
Fred Drake58c5a2a1999-08-04 13:13:24 +00004951\end{ctypedesc}
4952
Fred Drake659ebfa2000-04-03 15:42:13 +00004953\begin{ctypedesc}[getsegcountproc]{int (*getsegcountproc)
4954 (PyObject *self, int *lenp)}
4955Return the number of memory segments which comprise the buffer. If
4956\var{lenp} is not \NULL, the implementation must report the sum of the
4957sizes (in bytes) of all segments in \code{*\var{lenp}}.
4958The function cannot fail.
4959\end{ctypedesc}
Guido van Rossumae110af1997-05-22 20:11:52 +00004960
Fred Drake659ebfa2000-04-03 15:42:13 +00004961\begin{ctypedesc}[getcharbufferproc]{int (*getcharbufferproc)
4962 (PyObject *self, int segment, const char **ptrptr)}
4963\end{ctypedesc}
Guido van Rossumae110af1997-05-22 20:11:52 +00004964
Guido van Rossumae110af1997-05-22 20:11:52 +00004965
Fred Drakec392b572001-03-21 22:15:01 +00004966\section{Supporting Cyclic Garbarge Collection
4967 \label{supporting-cycle-detection}}
4968
4969Python's support for detecting and collecting garbage which involves
4970circular references requires support from object types which are
4971``containers'' for other objects which may also be containers. Types
4972which do not store references to other objects, or which only store
4973references to atomic types (such as numbers or strings), do not need
4974to provide any explicit support for garbage collection.
4975
4976To create a container type, the \member{tp_flags} field of the type
4977object must include the \constant{Py_TPFLAGS_GC} and provide an
Fred Drakee28d8ae2001-03-22 16:30:17 +00004978implementation of the \member{tp_traverse} handler. The computed
4979value of the \member{tp_basicsize} field must include
4980\constant{PyGC_HEAD_SIZE} as well. If instances of the type are
4981mutable, a \member{tp_clear} implementation must also be provided.
Fred Drakec392b572001-03-21 22:15:01 +00004982
4983\begin{datadesc}{Py_TPFLAGS_GC}
4984 Objects with a type with this flag set must conform with the rules
4985 documented here. For convenience these objects will be referred to
4986 as container objects.
4987\end{datadesc}
4988
4989\begin{datadesc}{PyGC_HEAD_SIZE}
4990 Extra memory needed for the garbage collector. Container objects
4991 must include this in the calculation of their tp_basicsize. If the
4992 collector is disabled at compile time then this is \code{0}.
4993\end{datadesc}
4994
Fred Drakee28d8ae2001-03-22 16:30:17 +00004995Constructors for container types must conform to two rules:
4996
4997\begin{enumerate}
4998\item The memory for the object must be allocated using
4999 \cfunction{PyObject_New()} or \cfunction{PyObject_VarNew()}.
5000
5001\item Once all the fields which may contain references to other
5002 containers are initialized, it must call
5003 \cfunction{PyObject_GC_Init()}.
5004\end{enumerate}
5005
Fred Drakec392b572001-03-21 22:15:01 +00005006\begin{cfuncdesc}{void}{PyObject_GC_Init}{PyObject *op}
5007 Adds the object \var{op} to the set of container objects tracked by
5008 the collector. The collector can run at unexpected times so objects
5009 must be valid while being tracked. This should be called once all
5010 the fields followed by the \member{tp_traverse} handler become valid,
5011 usually near the end of the constructor.
5012\end{cfuncdesc}
5013
Fred Drakee28d8ae2001-03-22 16:30:17 +00005014Similarly, the deallocator for the object must conform to a similar
5015pair of rules:
5016
5017\begin{enumerate}
5018\item Before fields which refer to other containers are invalidated,
5019 \cfunction{PyObject_GC_Fini()} must be called.
5020
5021\item The object's memory must be deallocated using
5022 \cfunction{PyObject_Del()}.
5023\end{enumerate}
5024
Fred Drakec392b572001-03-21 22:15:01 +00005025\begin{cfuncdesc}{void}{PyObject_GC_Fini}{PyObject *op}
5026 Remove the object \var{op} from the set of container objects tracked
5027 by the collector. Note that \cfunction{PyObject_GC_Init()} can be
5028 called again on this object to add it back to the set of tracked
5029 objects. The deallocator (\member{tp_dealloc} handler) should call
5030 this for the object before any of the fields used by the
5031 \member{tp_traverse} handler become invalid.
Fred Drake8f6df462001-03-23 17:42:09 +00005032
5033 \strong{Note:} Any container which may be referenced from another
5034 object reachable by the collector must itself be tracked by the
5035 collector, so it is generally not safe to call this function
5036 anywhere but in the object's deallocator.
Fred Drakec392b572001-03-21 22:15:01 +00005037\end{cfuncdesc}
5038
5039The \member{tp_traverse} handler accepts a function parameter of this
5040type:
5041
5042\begin{ctypedesc}[visitproc]{int (*visitproc)(PyObject *object, void *arg)}
5043 Type of the visitor function passed to the \member{tp_traverse}
5044 handler. The function should be called with an object to traverse
5045 as \var{object} and the third parameter to the \member{tp_traverse}
5046 handler as \var{arg}.
5047\end{ctypedesc}
5048
5049The \member{tp_traverse} handler must have the following type:
5050
5051\begin{ctypedesc}[traverseproc]{int (*traverseproc)(PyObject *self,
5052 visitproc visit, void *arg)}
5053 Traversal function for a container object. Implementations must
5054 call the \var{visit} function for each object directly contained by
5055 \var{self}, with the parameters to \var{visit} being the contained
5056 object and the \var{arg} value passed to the handler. If
5057 \var{visit} returns a non-zero value then an error has occurred and
5058 that value should be returned immediately.
5059\end{ctypedesc}
5060
5061The \member{tp_clear} handler must be of the \ctype{inquiry} type, or
5062\NULL{} if the object is immutable.
5063
5064\begin{ctypedesc}[inquiry]{int (*inquiry)(PyObject *self)}
5065 Drop references that may have created reference cycles. Immutable
5066 objects do not have to define this method since they can never
5067 directly create reference cycles. Note that the object must still
5068 be valid after calling this method (i.e., don't just call
5069 \cfunction{Py_DECREF()} on a reference). The collector will call
5070 this method if it detects that this object is involved in a
5071 reference cycle.
5072\end{ctypedesc}
5073
5074
Fred Drakee28d8ae2001-03-22 16:30:17 +00005075\subsection{Example Cycle Collector Support
5076 \label{example-cycle-support}}
5077
5078This example shows only enough of the implementation of an extension
5079type to show how the garbage collector support needs to be added. It
5080shows the definition of the object structure, the
5081\member{tp_traverse}, \member{tp_clear} and \member{tp_dealloc}
5082implementations, the type structure, and a constructor --- the module
5083initialization needed to export the constructor to Python is not shown
5084as there are no special considerations there for the collector. To
5085make this interesting, assume that the module exposes ways for the
5086\member{container} field of the object to be modified. Note that
5087since no checks are made on the type of the object used to initialize
5088\member{container}, we have to assume that it may be a container.
5089
5090\begin{verbatim}
5091#include "Python.h"
5092
5093typedef struct {
5094 PyObject_HEAD
5095 PyObject *container;
5096} MyObject;
5097
5098static int
5099my_traverse(MyObject *self, visitproc visit, void *arg)
5100{
5101 if (self->container != NULL)
5102 return visit(self->container, arg);
5103 else
5104 return 0;
5105}
5106
5107static int
5108my_clear(MyObject *self)
5109{
5110 Py_XDECREF(self->container);
5111 self->container = NULL;
5112
5113 return 0;
5114}
5115
5116static void
5117my_dealloc(MyObject *self)
5118{
5119 PyObject_GC_Fini((PyObject *) self);
5120 Py_XDECREF(self->container);
5121 PyObject_Del(self);
5122}
5123\end{verbatim}
5124
5125\begin{verbatim}
5126statichere PyTypeObject
5127MyObject_Type = {
5128 PyObject_HEAD_INIT(NULL)
5129 0,
5130 "MyObject",
5131 sizeof(MyObject) + PyGC_HEAD_SIZE,
5132 0,
5133 (destructor)my_dealloc, /* tp_dealloc */
5134 0, /* tp_print */
5135 0, /* tp_getattr */
5136 0, /* tp_setattr */
5137 0, /* tp_compare */
5138 0, /* tp_repr */
5139 0, /* tp_as_number */
5140 0, /* tp_as_sequence */
5141 0, /* tp_as_mapping */
5142 0, /* tp_hash */
5143 0, /* tp_call */
5144 0, /* tp_str */
5145 0, /* tp_getattro */
5146 0, /* tp_setattro */
5147 0, /* tp_as_buffer */
5148 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_GC,
5149 0, /* tp_doc */
5150 (traverseproc)my_traverse, /* tp_traverse */
5151 (inquiry)my_clear, /* tp_clear */
5152 0, /* tp_richcompare */
5153 0, /* tp_weaklistoffset */
5154};
5155
5156/* This constructor should be made accessible from Python. */
5157static PyObject *
5158new_object(PyObject *unused, PyObject *args)
5159{
5160 PyObject *container = NULL;
5161 MyObject *result = NULL;
5162
5163 if (PyArg_ParseTuple(args, "|O:new_object", &container)) {
5164 result = PyObject_New(MyObject, &MyObject_Type);
5165 if (result != NULL) {
5166 result->container = container;
5167 PyObject_GC_Init();
5168 }
5169 }
5170 return (PyObject *) result;
5171}
5172\end{verbatim}
5173
5174
Fred Drake659ebfa2000-04-03 15:42:13 +00005175% \chapter{Debugging \label{debugging}}
5176%
5177% XXX Explain Py_DEBUG, Py_TRACE_REFS, Py_REF_DEBUG.
Guido van Rossum5b8a5231997-12-30 04:38:44 +00005178
5179
Fred Drakeed773ef2000-09-21 21:35:22 +00005180\appendix
5181\chapter{Reporting Bugs}
5182\input{reportingbugs}
5183
Marc-André Lemburga544ea22001-01-17 18:04:31 +00005184\input{api.ind} % Index -- must be last
Guido van Rossum9231c8f1997-05-15 21:43:21 +00005185
5186\end{document}