Blame - Include/unicodeobject.h - platform/external/python/cpython2

blob: 2c11bfd452407ef01d45fc6bda94d6f28c3cd8f3 [file] [log] [blame]

Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1	#ifndef Py_UNICODEOBJECT_H
				2	#define Py_UNICODEOBJECT_H
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	3
Neal Norwitz	cfb41c4	2008-01-27 07:41:33 +0000	[diff] [blame]	4	#include <stdarg.h>
				5
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	6	/*
				7
				8	Unicode implementation based on original code by Fredrik Lundh,
				9	modified by Marc-Andre Lemburg (mal@lemburg.com) according to the
				10	Unicode Integration Proposal (see file Misc/unicode.txt).
				11
Guido van Rossum	16b1ad9	2000-08-03 16:24:25 +0000	[diff] [blame]	12	Copyright (c) Corporation for National Research Initiatives.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	13
				14
				15	Original header:
				16	--------------------------------------------------------------------
				17
				18	* Yet another Unicode string type for Python. This type supports the
				19	* 16-bit Basic Multilingual Plane (BMP) only.
				20	*
				21	* Written by Fredrik Lundh, January 1999.
				22	*
				23	* Copyright (c) 1999 by Secret Labs AB.
				24	* Copyright (c) 1999 by Fredrik Lundh.
				25	*
				26	* fredrik@pythonware.com
				27	* http://www.pythonware.com
				28	*
				29	* --------------------------------------------------------------------
				30	* This Unicode String Type is
				31	*
				32	* Copyright (c) 1999 by Secret Labs AB
				33	* Copyright (c) 1999 by Fredrik Lundh
				34	*
				35	* By obtaining, using, and/or copying this software and/or its
				36	* associated documentation, you agree that you have read, understood,
				37	* and will comply with the following terms and conditions:
				38	*
				39	* Permission to use, copy, modify, and distribute this software and its
				40	* associated documentation for any purpose and without fee is hereby
				41	* granted, provided that the above copyright notice appears in all
				42	* copies, and that both that copyright notice and this permission notice
				43	* appear in supporting documentation, and that the name of Secret Labs
				44	* AB or the author not be used in advertising or publicity pertaining to
				45	* distribution of the software without specific, written prior
				46	* permission.
				47	*
				48	* SECRET LABS AB AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD TO
				49	* THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND
				50	* FITNESS. IN NO EVENT SHALL SECRET LABS AB OR THE AUTHOR BE LIABLE FOR
				51	* ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
				52	* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
				53	* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
				54	* OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
				55	* -------------------------------------------------------------------- */
				56
Marc-André Lemburg	5e6007c	2001-09-19 11:21:03 +0000	[diff] [blame]	57	#include <ctype.h>
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	58
				59	/* === Internal API ======================================================= */
				60
				61	/* --- Internal Unicode Format -------------------------------------------- */
				62
Martin v. Löwis	339d0f7	2001-08-17 18:39:25 +0000	[diff] [blame]	63	#ifndef Py_USING_UNICODE
				64
				65	#define PyUnicode_Check(op) 0
Tim Peters	78e0fc7	2001-09-11 03:07:38 +0000	[diff] [blame]	66	#define PyUnicode_CheckExact(op) 0
Martin v. Löwis	339d0f7	2001-08-17 18:39:25 +0000	[diff] [blame]	67
				68	#else
				69
Fredrik Lundh	9b14ab3	2001-06-26 22:59:49 +0000	[diff] [blame]	70	/* FIXME: MvL's new implementation assumes that Py_UNICODE_SIZE is
				71	properly set, but the default rules below don't set it. I'll
				72	sort this out some other day -- fredrik@pythonware.com */
				73
				74	#ifndef Py_UNICODE_SIZE
				75	#error Must define Py_UNICODE_SIZE
				76	#endif
				77
Fredrik Lundh	8f45585	2001-06-27 18:59:43 +0000	[diff] [blame]	78	/* Setting Py_UNICODE_WIDE enables UCS-4 storage. Otherwise, Unicode
				79	strings are stored as UCS-2 (with limited support for UTF-16) */
				80
				81	#if Py_UNICODE_SIZE >= 4
				82	#define Py_UNICODE_WIDE
Martin v. Löwis	0ba70cc	2001-06-26 22:22:37 +0000	[diff] [blame]	83	#endif
Fredrik Lundh	1294ad0	2001-06-26 17:17:07 +0000	[diff] [blame]	84
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	85	/* Set these flags if the platform has "wchar.h", "wctype.h" and the
				86	wchar_t type is a 16-bit unsigned type */
				87	/* #define HAVE_WCHAR_H */
				88	/* #define HAVE_USABLE_WCHAR_T */
				89
				90	/* Defaults for various platforms */
Martin v. Löwis	0ba70cc	2001-06-26 22:22:37 +0000	[diff] [blame]	91	#ifndef PY_UNICODE_TYPE
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	92
Fredrik Lundh	1294ad0	2001-06-26 17:17:07 +0000	[diff] [blame]	93	/* Windows has a usable wchar_t type (unless we're using UCS-4) */
Fredrik Lundh	8f45585	2001-06-27 18:59:43 +0000	[diff] [blame]	94	# if defined(MS_WIN32) && Py_UNICODE_SIZE == 2
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	95	# define HAVE_USABLE_WCHAR_T
Martin v. Löwis	0ba70cc	2001-06-26 22:22:37 +0000	[diff] [blame]	96	# define PY_UNICODE_TYPE wchar_t
				97	# endif
				98
Fredrik Lundh	8f45585	2001-06-27 18:59:43 +0000	[diff] [blame]	99	# if defined(Py_UNICODE_WIDE)
Martin v. Löwis	0ba70cc	2001-06-26 22:22:37 +0000	[diff] [blame]	100	# define PY_UNICODE_TYPE Py_UCS4
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	101	# endif
				102
				103	#endif
				104
				105	/* If the compiler provides a wchar_t type we try to support it
				106	through the interface functions PyUnicode_FromWideChar() and
				107	PyUnicode_AsWideChar(). */
				108
				109	#ifdef HAVE_USABLE_WCHAR_T
Marc-André Lemburg	1a731c6	2000-08-11 11:43:10 +0000	[diff] [blame]	110	# ifndef HAVE_WCHAR_H
				111	# define HAVE_WCHAR_H
				112	# endif
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	113	#endif
				114
				115	#ifdef HAVE_WCHAR_H
Guido van Rossum	24bdb04	2000-03-28 20:29:59 +0000	[diff] [blame]	116	/* Work around a cosmetic bug in BSDI 4.x wchar.h; thanks to Thomas Wouters */
				117	# ifdef _HAVE_BSDI
				118	# include <time.h>
				119	# endif
Marc-André Lemburg	5e6007c	2001-09-19 11:21:03 +0000	[diff] [blame]	120	# include <wchar.h>
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	121	#endif
				122
Martin v. Löwis	0ba70cc	2001-06-26 22:22:37 +0000	[diff] [blame]	123	/*
				124	* Use this typedef when you need to represent a UTF-16 surrogate pair
				125	* as a single unsigned integer.
				126	*/
				127	#if SIZEOF_INT >= 4
				128	typedef unsigned int Py_UCS4;
				129	#elif SIZEOF_LONG >= 4
				130	typedef unsigned long Py_UCS4;
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	131	#endif
				132
Martin v. Löwis	0ba70cc	2001-06-26 22:22:37 +0000	[diff] [blame]	133	typedef PY_UNICODE_TYPE Py_UNICODE;
Marc-André Lemburg	4327910	2000-07-07 09:01:41 +0000	[diff] [blame]	134
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	135	/* --- UCS-2/UCS-4 Name Mangling ------------------------------------------ */
				136
				137	/* Unicode API names are mangled to assure that UCS-2 and UCS-4 builds
				138	produce different external names and thus cause import errors in
				139	case Python interpreters and extensions with mixed compiled in
				140	Unicode width assumptions are combined. */
				141
				142	#ifndef Py_UNICODE_WIDE
				143
				144	# define PyUnicode_AsASCIIString PyUnicodeUCS2_AsASCIIString
				145	# define PyUnicode_AsCharmapString PyUnicodeUCS2_AsCharmapString
Marc-André Lemburg	d2d4598	2004-07-08 17:57:32 +0000	[diff] [blame]	146	# define PyUnicode_AsEncodedObject PyUnicodeUCS2_AsEncodedObject
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	147	# define PyUnicode_AsEncodedString PyUnicodeUCS2_AsEncodedString
				148	# define PyUnicode_AsLatin1String PyUnicodeUCS2_AsLatin1String
				149	# define PyUnicode_AsRawUnicodeEscapeString PyUnicodeUCS2_AsRawUnicodeEscapeString
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	150	# define PyUnicode_AsUTF32String PyUnicodeUCS2_AsUTF32String
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	151	# define PyUnicode_AsUTF16String PyUnicodeUCS2_AsUTF16String
				152	# define PyUnicode_AsUTF8String PyUnicodeUCS2_AsUTF8String
				153	# define PyUnicode_AsUnicode PyUnicodeUCS2_AsUnicode
				154	# define PyUnicode_AsUnicodeEscapeString PyUnicodeUCS2_AsUnicodeEscapeString
				155	# define PyUnicode_AsWideChar PyUnicodeUCS2_AsWideChar
				156	# define PyUnicode_Compare PyUnicodeUCS2_Compare
				157	# define PyUnicode_Concat PyUnicodeUCS2_Concat
				158	# define PyUnicode_Contains PyUnicodeUCS2_Contains
				159	# define PyUnicode_Count PyUnicodeUCS2_Count
				160	# define PyUnicode_Decode PyUnicodeUCS2_Decode
				161	# define PyUnicode_DecodeASCII PyUnicodeUCS2_DecodeASCII
				162	# define PyUnicode_DecodeCharmap PyUnicodeUCS2_DecodeCharmap
				163	# define PyUnicode_DecodeLatin1 PyUnicodeUCS2_DecodeLatin1
				164	# define PyUnicode_DecodeRawUnicodeEscape PyUnicodeUCS2_DecodeRawUnicodeEscape
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	165	# define PyUnicode_DecodeUTF32 PyUnicodeUCS2_DecodeUTF32
				166	# define PyUnicode_DecodeUTF32Stateful PyUnicodeUCS2_DecodeUTF32Stateful
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	167	# define PyUnicode_DecodeUTF16 PyUnicodeUCS2_DecodeUTF16
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	168	# define PyUnicode_DecodeUTF16Stateful PyUnicodeUCS2_DecodeUTF16Stateful
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	169	# define PyUnicode_DecodeUTF8 PyUnicodeUCS2_DecodeUTF8
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	170	# define PyUnicode_DecodeUTF8Stateful PyUnicodeUCS2_DecodeUTF8Stateful
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	171	# define PyUnicode_DecodeUnicodeEscape PyUnicodeUCS2_DecodeUnicodeEscape
				172	# define PyUnicode_Encode PyUnicodeUCS2_Encode
				173	# define PyUnicode_EncodeASCII PyUnicodeUCS2_EncodeASCII
				174	# define PyUnicode_EncodeCharmap PyUnicodeUCS2_EncodeCharmap
				175	# define PyUnicode_EncodeDecimal PyUnicodeUCS2_EncodeDecimal
				176	# define PyUnicode_EncodeLatin1 PyUnicodeUCS2_EncodeLatin1
				177	# define PyUnicode_EncodeRawUnicodeEscape PyUnicodeUCS2_EncodeRawUnicodeEscape
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	178	# define PyUnicode_EncodeUTF32 PyUnicodeUCS2_EncodeUTF32
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	179	# define PyUnicode_EncodeUTF16 PyUnicodeUCS2_EncodeUTF16
				180	# define PyUnicode_EncodeUTF8 PyUnicodeUCS2_EncodeUTF8
				181	# define PyUnicode_EncodeUnicodeEscape PyUnicodeUCS2_EncodeUnicodeEscape
				182	# define PyUnicode_Find PyUnicodeUCS2_Find
				183	# define PyUnicode_Format PyUnicodeUCS2_Format
				184	# define PyUnicode_FromEncodedObject PyUnicodeUCS2_FromEncodedObject
				185	# define PyUnicode_FromObject PyUnicodeUCS2_FromObject
Marc-André Lemburg	9c329de	2002-08-12 08:19:10 +0000	[diff] [blame]	186	# define PyUnicode_FromOrdinal PyUnicodeUCS2_FromOrdinal
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	187	# define PyUnicode_FromUnicode PyUnicodeUCS2_FromUnicode
Christian Heimes	7f39c9f	2008-01-25 12:18:43 +0000	[diff] [blame]	188	# define PyUnicode_FromString PyUnicodeUCS2_FromString
				189	# define PyUnicode_FromStringAndSize PyUnicodeUCS2_FromStringAndSize
				190	# define PyUnicode_FromFormatV PyUnicodeUCS2_FromFormatV
				191	# define PyUnicode_FromFormat PyUnicodeUCS2_FromFormat
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	192	# define PyUnicode_FromWideChar PyUnicodeUCS2_FromWideChar
				193	# define PyUnicode_GetDefaultEncoding PyUnicodeUCS2_GetDefaultEncoding
				194	# define PyUnicode_GetMax PyUnicodeUCS2_GetMax
				195	# define PyUnicode_GetSize PyUnicodeUCS2_GetSize
				196	# define PyUnicode_Join PyUnicodeUCS2_Join
Fredrik Lundh	06a69dd	2006-05-26 08:54:28 +0000	[diff] [blame]	197	# define PyUnicode_Partition PyUnicodeUCS2_Partition
Fredrik Lundh	b3167cb	2006-05-26 18:15:38 +0000	[diff] [blame]	198	# define PyUnicode_RPartition PyUnicodeUCS2_RPartition
				199	# define PyUnicode_RSplit PyUnicodeUCS2_RSplit
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	200	# define PyUnicode_Replace PyUnicodeUCS2_Replace
				201	# define PyUnicode_Resize PyUnicodeUCS2_Resize
Marc-André Lemburg	040f76b	2006-08-14 10:55:19 +0000	[diff] [blame]	202	# define PyUnicode_RichCompare PyUnicodeUCS2_RichCompare
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	203	# define PyUnicode_SetDefaultEncoding PyUnicodeUCS2_SetDefaultEncoding
				204	# define PyUnicode_Split PyUnicodeUCS2_Split
				205	# define PyUnicode_Splitlines PyUnicodeUCS2_Splitlines
				206	# define PyUnicode_Tailmatch PyUnicodeUCS2_Tailmatch
				207	# define PyUnicode_Translate PyUnicodeUCS2_Translate
				208	# define PyUnicode_TranslateCharmap PyUnicodeUCS2_TranslateCharmap
				209	# define _PyUnicode_AsDefaultEncodedString _PyUnicodeUCS2_AsDefaultEncodedString
				210	# define _PyUnicode_Fini _PyUnicodeUCS2_Fini
				211	# define _PyUnicode_Init _PyUnicodeUCS2_Init
				212	# define _PyUnicode_IsAlpha _PyUnicodeUCS2_IsAlpha
				213	# define _PyUnicode_IsDecimalDigit _PyUnicodeUCS2_IsDecimalDigit
				214	# define _PyUnicode_IsDigit _PyUnicodeUCS2_IsDigit
				215	# define _PyUnicode_IsLinebreak _PyUnicodeUCS2_IsLinebreak
				216	# define _PyUnicode_IsLowercase _PyUnicodeUCS2_IsLowercase
				217	# define _PyUnicode_IsNumeric _PyUnicodeUCS2_IsNumeric
				218	# define _PyUnicode_IsTitlecase _PyUnicodeUCS2_IsTitlecase
				219	# define _PyUnicode_IsUppercase _PyUnicodeUCS2_IsUppercase
				220	# define _PyUnicode_IsWhitespace _PyUnicodeUCS2_IsWhitespace
				221	# define _PyUnicode_ToDecimalDigit _PyUnicodeUCS2_ToDecimalDigit
				222	# define _PyUnicode_ToDigit _PyUnicodeUCS2_ToDigit
				223	# define _PyUnicode_ToLowercase _PyUnicodeUCS2_ToLowercase
				224	# define _PyUnicode_ToNumeric _PyUnicodeUCS2_ToNumeric
				225	# define _PyUnicode_ToTitlecase _PyUnicodeUCS2_ToTitlecase
				226	# define _PyUnicode_ToUppercase _PyUnicodeUCS2_ToUppercase
				227
				228	#else
				229
				230	# define PyUnicode_AsASCIIString PyUnicodeUCS4_AsASCIIString
				231	# define PyUnicode_AsCharmapString PyUnicodeUCS4_AsCharmapString
Marc-André Lemburg	d2d4598	2004-07-08 17:57:32 +0000	[diff] [blame]	232	# define PyUnicode_AsEncodedObject PyUnicodeUCS4_AsEncodedObject
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	233	# define PyUnicode_AsEncodedString PyUnicodeUCS4_AsEncodedString
				234	# define PyUnicode_AsLatin1String PyUnicodeUCS4_AsLatin1String
				235	# define PyUnicode_AsRawUnicodeEscapeString PyUnicodeUCS4_AsRawUnicodeEscapeString
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	236	# define PyUnicode_AsUTF32String PyUnicodeUCS4_AsUTF32String
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	237	# define PyUnicode_AsUTF16String PyUnicodeUCS4_AsUTF16String
				238	# define PyUnicode_AsUTF8String PyUnicodeUCS4_AsUTF8String
				239	# define PyUnicode_AsUnicode PyUnicodeUCS4_AsUnicode
				240	# define PyUnicode_AsUnicodeEscapeString PyUnicodeUCS4_AsUnicodeEscapeString
				241	# define PyUnicode_AsWideChar PyUnicodeUCS4_AsWideChar
				242	# define PyUnicode_Compare PyUnicodeUCS4_Compare
				243	# define PyUnicode_Concat PyUnicodeUCS4_Concat
				244	# define PyUnicode_Contains PyUnicodeUCS4_Contains
				245	# define PyUnicode_Count PyUnicodeUCS4_Count
				246	# define PyUnicode_Decode PyUnicodeUCS4_Decode
				247	# define PyUnicode_DecodeASCII PyUnicodeUCS4_DecodeASCII
				248	# define PyUnicode_DecodeCharmap PyUnicodeUCS4_DecodeCharmap
				249	# define PyUnicode_DecodeLatin1 PyUnicodeUCS4_DecodeLatin1
				250	# define PyUnicode_DecodeRawUnicodeEscape PyUnicodeUCS4_DecodeRawUnicodeEscape
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	251	# define PyUnicode_DecodeUTF32 PyUnicodeUCS4_DecodeUTF32
				252	# define PyUnicode_DecodeUTF32Stateful PyUnicodeUCS4_DecodeUTF32Stateful
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	253	# define PyUnicode_DecodeUTF16 PyUnicodeUCS4_DecodeUTF16
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	254	# define PyUnicode_DecodeUTF16Stateful PyUnicodeUCS4_DecodeUTF16Stateful
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	255	# define PyUnicode_DecodeUTF8 PyUnicodeUCS4_DecodeUTF8
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	256	# define PyUnicode_DecodeUTF8Stateful PyUnicodeUCS4_DecodeUTF8Stateful
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	257	# define PyUnicode_DecodeUnicodeEscape PyUnicodeUCS4_DecodeUnicodeEscape
				258	# define PyUnicode_Encode PyUnicodeUCS4_Encode
				259	# define PyUnicode_EncodeASCII PyUnicodeUCS4_EncodeASCII
				260	# define PyUnicode_EncodeCharmap PyUnicodeUCS4_EncodeCharmap
				261	# define PyUnicode_EncodeDecimal PyUnicodeUCS4_EncodeDecimal
				262	# define PyUnicode_EncodeLatin1 PyUnicodeUCS4_EncodeLatin1
				263	# define PyUnicode_EncodeRawUnicodeEscape PyUnicodeUCS4_EncodeRawUnicodeEscape
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	264	# define PyUnicode_EncodeUTF32 PyUnicodeUCS4_EncodeUTF32
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	265	# define PyUnicode_EncodeUTF16 PyUnicodeUCS4_EncodeUTF16
				266	# define PyUnicode_EncodeUTF8 PyUnicodeUCS4_EncodeUTF8
				267	# define PyUnicode_EncodeUnicodeEscape PyUnicodeUCS4_EncodeUnicodeEscape
				268	# define PyUnicode_Find PyUnicodeUCS4_Find
				269	# define PyUnicode_Format PyUnicodeUCS4_Format
				270	# define PyUnicode_FromEncodedObject PyUnicodeUCS4_FromEncodedObject
				271	# define PyUnicode_FromObject PyUnicodeUCS4_FromObject
Marc-André Lemburg	9c329de	2002-08-12 08:19:10 +0000	[diff] [blame]	272	# define PyUnicode_FromOrdinal PyUnicodeUCS4_FromOrdinal
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	273	# define PyUnicode_FromUnicode PyUnicodeUCS4_FromUnicode
Christian Heimes	7f39c9f	2008-01-25 12:18:43 +0000	[diff] [blame]	274	# define PyUnicode_FromString PyUnicodeUCS4_FromString
				275	# define PyUnicode_FromStringAndSize PyUnicodeUCS4_FromStringAndSize
				276	# define PyUnicode_FromFormatV PyUnicodeUCS4_FromFormatV
				277	# define PyUnicode_FromFormat PyUnicodeUCS4_FromFormat
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	278	# define PyUnicode_FromWideChar PyUnicodeUCS4_FromWideChar
				279	# define PyUnicode_GetDefaultEncoding PyUnicodeUCS4_GetDefaultEncoding
				280	# define PyUnicode_GetMax PyUnicodeUCS4_GetMax
				281	# define PyUnicode_GetSize PyUnicodeUCS4_GetSize
				282	# define PyUnicode_Join PyUnicodeUCS4_Join
Fredrik Lundh	06a69dd	2006-05-26 08:54:28 +0000	[diff] [blame]	283	# define PyUnicode_Partition PyUnicodeUCS4_Partition
Fredrik Lundh	b3167cb	2006-05-26 18:15:38 +0000	[diff] [blame]	284	# define PyUnicode_RPartition PyUnicodeUCS4_RPartition
				285	# define PyUnicode_RSplit PyUnicodeUCS4_RSplit
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	286	# define PyUnicode_Replace PyUnicodeUCS4_Replace
				287	# define PyUnicode_Resize PyUnicodeUCS4_Resize
Marc-André Lemburg	040f76b	2006-08-14 10:55:19 +0000	[diff] [blame]	288	# define PyUnicode_RichCompare PyUnicodeUCS4_RichCompare
Marc-André Lemburg	b5ac6f6	2001-07-31 14:30:16 +0000	[diff] [blame]	289	# define PyUnicode_SetDefaultEncoding PyUnicodeUCS4_SetDefaultEncoding
				290	# define PyUnicode_Split PyUnicodeUCS4_Split
				291	# define PyUnicode_Splitlines PyUnicodeUCS4_Splitlines
				292	# define PyUnicode_Tailmatch PyUnicodeUCS4_Tailmatch
				293	# define PyUnicode_Translate PyUnicodeUCS4_Translate
				294	# define PyUnicode_TranslateCharmap PyUnicodeUCS4_TranslateCharmap
				295	# define _PyUnicode_AsDefaultEncodedString _PyUnicodeUCS4_AsDefaultEncodedString
				296	# define _PyUnicode_Fini _PyUnicodeUCS4_Fini
				297	# define _PyUnicode_Init _PyUnicodeUCS4_Init
				298	# define _PyUnicode_IsAlpha _PyUnicodeUCS4_IsAlpha
				299	# define _PyUnicode_IsDecimalDigit _PyUnicodeUCS4_IsDecimalDigit
				300	# define _PyUnicode_IsDigit _PyUnicodeUCS4_IsDigit
				301	# define _PyUnicode_IsLinebreak _PyUnicodeUCS4_IsLinebreak
				302	# define _PyUnicode_IsLowercase _PyUnicodeUCS4_IsLowercase
				303	# define _PyUnicode_IsNumeric _PyUnicodeUCS4_IsNumeric
				304	# define _PyUnicode_IsTitlecase _PyUnicodeUCS4_IsTitlecase
				305	# define _PyUnicode_IsUppercase _PyUnicodeUCS4_IsUppercase
				306	# define _PyUnicode_IsWhitespace _PyUnicodeUCS4_IsWhitespace
				307	# define _PyUnicode_ToDecimalDigit _PyUnicodeUCS4_ToDecimalDigit
				308	# define _PyUnicode_ToDigit _PyUnicodeUCS4_ToDigit
				309	# define _PyUnicode_ToLowercase _PyUnicodeUCS4_ToLowercase
				310	# define _PyUnicode_ToNumeric _PyUnicodeUCS4_ToNumeric
				311	# define _PyUnicode_ToTitlecase _PyUnicodeUCS4_ToTitlecase
				312	# define _PyUnicode_ToUppercase _PyUnicodeUCS4_ToUppercase
				313
				314
				315	#endif
				316
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	317	/* --- Internal Unicode Operations ---------------------------------------- */
				318
				319	/* If you want Python to use the compiler's wctype.h functions instead
Barry Warsaw	51ac580	2000-03-20 16:36:48 +0000	[diff] [blame]	320	of the ones supplied with Python, define WANT_WCTYPE_FUNCTIONS or
Raymond Hettinger	57341c3	2004-10-31 05:46:59 +0000	[diff] [blame]	321	configure Python using --with-wctype-functions. This reduces the
Barry Warsaw	51ac580	2000-03-20 16:36:48 +0000	[diff] [blame]	322	interpreter's code size. */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	323
				324	#if defined(HAVE_USABLE_WCHAR_T) && defined(WANT_WCTYPE_FUNCTIONS)
				325
Marc-André Lemburg	5e6007c	2001-09-19 11:21:03 +0000	[diff] [blame]	326	#include <wctype.h>
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	327
				328	#define Py_UNICODE_ISSPACE(ch) iswspace(ch)
				329
				330	#define Py_UNICODE_ISLOWER(ch) iswlower(ch)
				331	#define Py_UNICODE_ISUPPER(ch) iswupper(ch)
				332	#define Py_UNICODE_ISTITLE(ch) _PyUnicode_IsTitlecase(ch)
				333	#define Py_UNICODE_ISLINEBREAK(ch) _PyUnicode_IsLinebreak(ch)
				334
				335	#define Py_UNICODE_TOLOWER(ch) towlower(ch)
				336	#define Py_UNICODE_TOUPPER(ch) towupper(ch)
				337	#define Py_UNICODE_TOTITLE(ch) _PyUnicode_ToTitlecase(ch)
				338
				339	#define Py_UNICODE_ISDECIMAL(ch) _PyUnicode_IsDecimalDigit(ch)
				340	#define Py_UNICODE_ISDIGIT(ch) _PyUnicode_IsDigit(ch)
				341	#define Py_UNICODE_ISNUMERIC(ch) _PyUnicode_IsNumeric(ch)
				342
				343	#define Py_UNICODE_TODECIMAL(ch) _PyUnicode_ToDecimalDigit(ch)
				344	#define Py_UNICODE_TODIGIT(ch) _PyUnicode_ToDigit(ch)
				345	#define Py_UNICODE_TONUMERIC(ch) _PyUnicode_ToNumeric(ch)
				346
Marc-André Lemburg	f03e741	2000-07-05 09:45:59 +0000	[diff] [blame]	347	#define Py_UNICODE_ISALPHA(ch) iswalpha(ch)
				348
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	349	#else
				350
				351	#define Py_UNICODE_ISSPACE(ch) _PyUnicode_IsWhitespace(ch)
				352
				353	#define Py_UNICODE_ISLOWER(ch) _PyUnicode_IsLowercase(ch)
				354	#define Py_UNICODE_ISUPPER(ch) _PyUnicode_IsUppercase(ch)
				355	#define Py_UNICODE_ISTITLE(ch) _PyUnicode_IsTitlecase(ch)
				356	#define Py_UNICODE_ISLINEBREAK(ch) _PyUnicode_IsLinebreak(ch)
				357
				358	#define Py_UNICODE_TOLOWER(ch) _PyUnicode_ToLowercase(ch)
				359	#define Py_UNICODE_TOUPPER(ch) _PyUnicode_ToUppercase(ch)
				360	#define Py_UNICODE_TOTITLE(ch) _PyUnicode_ToTitlecase(ch)
				361
				362	#define Py_UNICODE_ISDECIMAL(ch) _PyUnicode_IsDecimalDigit(ch)
				363	#define Py_UNICODE_ISDIGIT(ch) _PyUnicode_IsDigit(ch)
				364	#define Py_UNICODE_ISNUMERIC(ch) _PyUnicode_IsNumeric(ch)
				365
				366	#define Py_UNICODE_TODECIMAL(ch) _PyUnicode_ToDecimalDigit(ch)
				367	#define Py_UNICODE_TODIGIT(ch) _PyUnicode_ToDigit(ch)
				368	#define Py_UNICODE_TONUMERIC(ch) _PyUnicode_ToNumeric(ch)
				369
Marc-André Lemburg	f03e741	2000-07-05 09:45:59 +0000	[diff] [blame]	370	#define Py_UNICODE_ISALPHA(ch) _PyUnicode_IsAlpha(ch)
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	371
Marc-André Lemburg	f03e741	2000-07-05 09:45:59 +0000	[diff] [blame]	372	#endif
Marc-André Lemburg	a9c103b	2000-07-03 10:52:13 +0000	[diff] [blame]	373
				374	#define Py_UNICODE_ISALNUM(ch) \
				375	(Py_UNICODE_ISALPHA(ch) || \
				376	Py_UNICODE_ISDECIMAL(ch) || \
				377	Py_UNICODE_ISDIGIT(ch) || \
				378	Py_UNICODE_ISNUMERIC(ch))
				379
Fredrik Lundh	80f8e80	2006-05-28 12:06:46 +0000	[diff] [blame]	380	#define Py_UNICODE_COPY(target, source, length) \
				381	Py_MEMCPY((target), (source), (length)*sizeof(Py_UNICODE))
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	382
				383	#define Py_UNICODE_FILL(target, value, length) do\
Fredrik Lundh	8a8e05a	2006-05-22 17:12:58 +0000	[diff] [blame]	384	{Py_ssize_t i_; Py_UNICODE *t_ = (target); Py_UNICODE v_ = (value);\
				385	for (i_ = 0; i_ < (length); i_++) t_[i_] = v_;\
Fredrik Lundh	f1d60a5	2006-05-22 16:29:30 +0000	[diff] [blame]	386	} while (0)
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	387
Fredrik Lundh	3d885e0	2006-05-23 10:10:57 +0000	[diff] [blame]	388	/* check if substring matches at given offset. the offset must be
				389	valid, and the substring must not be empty */
				390	#define Py_UNICODE_MATCH(string, offset, substring) \
				391	((*((string)->str + (offset)) == *((substring)->str)) && \
				392	((*((string)->str + (offset) + (substring)->length-1) == *((substring)->str + (substring)->length-1))) && \
				393	!memcmp((string)->str + (offset), (substring)->str, (substring)->length*sizeof(Py_UNICODE)))
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	394
Barry Warsaw	51ac580	2000-03-20 16:36:48 +0000	[diff] [blame]	395	#ifdef __cplusplus
				396	extern "C" {
				397	#endif
				398
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	399	/* --- Unicode Type ------------------------------------------------------- */
				400
				401	typedef struct {
				402	PyObject_HEAD
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	403	Py_ssize_t length; /* Length of raw Unicode data in buffer */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	404	Py_UNICODE *str; /* Raw Unicode buffer */
				405	long hash; /* Hash value; -1 if not set */
Marc-André Lemburg	bff879c	2000-08-03 18:46:08 +0000	[diff] [blame]	406	PyObject *defenc; /* (Default) Encoded version as Python
				407	string, or NULL; this is used for
				408	implementing the buffer protocol */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	409	} PyUnicodeObject;
				410
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	411	PyAPI_DATA(PyTypeObject) PyUnicode_Type;
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	412
Neal Norwitz	ee3a1b5	2007-02-25 19:44:48 +0000	[diff] [blame]	413	#define PyUnicode_Check(op) \
Christian Heimes	e93237d	2007-12-19 02:37:44 +0000	[diff] [blame]	414	PyType_FastSubclass(Py_TYPE(op), Py_TPFLAGS_UNICODE_SUBCLASS)
				415	#define PyUnicode_CheckExact(op) (Py_TYPE(op) == &PyUnicode_Type)
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	416
				417	/* Fast access macros */
				418	#define PyUnicode_GET_SIZE(op) \
				419	(((PyUnicodeObject *)(op))->length)
				420	#define PyUnicode_GET_DATA_SIZE(op) \
				421	(((PyUnicodeObject *)(op))->length * sizeof(Py_UNICODE))
				422	#define PyUnicode_AS_UNICODE(op) \
				423	(((PyUnicodeObject *)(op))->str)
				424	#define PyUnicode_AS_DATA(op) \
				425	((const char *)((PyUnicodeObject *)(op))->str)
				426
				427	/* --- Constants ---------------------------------------------------------- */
				428
				429	/* This Unicode character will be used as replacement character during
				430	decoding if the errors argument is set to "replace". Note: the
				431	Unicode character U+FFFD is the official REPLACEMENT CHARACTER in
				432	Unicode 3.0. */
				433
				434	#define Py_UNICODE_REPLACEMENT_CHARACTER ((Py_UNICODE) 0xFFFD)
				435
				436	/* === Public API ========================================================= */
				437
				438	/* --- Plain Py_UNICODE --------------------------------------------------- */
				439
				440	/* Create a Unicode Object from the Py_UNICODE buffer u of the given
Marc-André Lemburg	8155e0e	2001-04-23 14:44:21 +0000	[diff] [blame]	441	size.
				442
				443	u may be NULL which causes the contents to be undefined. It is the
				444	user's responsibility to fill in the needed data afterwards. Note
				445	that modifying the Unicode object contents after construction is
				446	only allowed if u was set to NULL.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	447
				448	The buffer is copied into the new object. */
				449
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	450	PyAPI_FUNC(PyObject*) PyUnicode_FromUnicode(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	451	const Py_UNICODE *u, /* Unicode buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	452	Py_ssize_t size /* size of buffer */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	453	);
				454
Christian Heimes	7f39c9f	2008-01-25 12:18:43 +0000	[diff] [blame]	455	/* Similar to PyUnicode_FromUnicode(), but u points to Latin-1 encoded bytes */
				456	PyAPI_FUNC(PyObject*) PyUnicode_FromStringAndSize(
				457	const char *u, /* char buffer */
				458	Py_ssize_t size /* size of buffer */
				459	);
				460
				461	/* Similar to PyUnicode_FromUnicode(), but u points to null-terminated
				462	Latin-1 encoded bytes */
				463	PyAPI_FUNC(PyObject*) PyUnicode_FromString(
				464	const char *u /* string */
				465	);
				466
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	467	/* Return a read-only pointer to the Unicode object's internal
				468	Py_UNICODE buffer. */
				469
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	470	PyAPI_FUNC(Py_UNICODE *) PyUnicode_AsUnicode(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	471	PyObject *unicode /* Unicode object */
				472	);
				473
				474	/* Get the length of the Unicode object. */
				475
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	476	PyAPI_FUNC(Py_ssize_t) PyUnicode_GetSize(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	477	PyObject *unicode /* Unicode object */
				478	);
				479
Martin v. Löwis	ce9b5a5	2001-06-27 06:28:56 +0000	[diff] [blame]	480	/* Get the maximum ordinal for a Unicode character. */
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	481	PyAPI_FUNC(Py_UNICODE) PyUnicode_GetMax(void);
Martin v. Löwis	ce9b5a5	2001-06-27 06:28:56 +0000	[diff] [blame]	482
Guido van Rossum	52c2359	2000-04-10 13:41:41 +0000	[diff] [blame]	483	/* Resize an already allocated Unicode object to the new size length.
				484
				485	*unicode is modified to point to the new (resized) object and 0
				486	returned on success.
				487
				488	This API may only be called by the function which also called the
				489	Unicode constructor. The refcount on the object must be 1. Otherwise,
				490	an error is returned.
				491
				492	Error handling is implemented as follows: an exception is set, -1
				493	is returned and *unicode left untouched.
				494
				495	*/
				496
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	497	PyAPI_FUNC(int) PyUnicode_Resize(
Guido van Rossum	52c2359	2000-04-10 13:41:41 +0000	[diff] [blame]	498	PyObject **unicode, /* Pointer to the Unicode object */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	499	Py_ssize_t length /* New length */
Guido van Rossum	52c2359	2000-04-10 13:41:41 +0000	[diff] [blame]	500	);
				501
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	502	/* Coerce obj to a Unicode object and return a reference with
				503	incremented refcount.
				504
				505	Coercion is done in the following way:
				506
Guido van Rossum	b8c65bc	2001-10-19 02:01:31 +0000	[diff] [blame]	507	1. String and other char buffer compatible objects are decoded
Fred Drake	cb093fe	2000-05-09 19:51:53 +0000	[diff] [blame]	508	under the assumptions that they contain data using the current
				509	default encoding. Decoding is done in "strict" mode.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	510
Guido van Rossum	b8c65bc	2001-10-19 02:01:31 +0000	[diff] [blame]	511	2. All other objects (including Unicode objects) raise an
				512	exception.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	513
				514	The API returns NULL in case of an error. The caller is responsible
				515	for decref'ing the returned objects.
				516
				517	*/
				518
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	519	PyAPI_FUNC(PyObject*) PyUnicode_FromEncodedObject(
Marc-André Lemburg	5a5c81a	2000-07-07 13:46:42 +0000	[diff] [blame]	520	register PyObject *obj, /* Object */
				521	const char *encoding, /* encoding */
				522	const char *errors /* error handling */
				523	);
				524
Guido van Rossum	b8c65bc	2001-10-19 02:01:31 +0000	[diff] [blame]	525	/* Coerce obj to a Unicode object and return a reference with
Marc-André Lemburg	5a5c81a	2000-07-07 13:46:42 +0000	[diff] [blame]	526	incremented refcount.
Guido van Rossum	b8c65bc	2001-10-19 02:01:31 +0000	[diff] [blame]	527
				528	Unicode objects are passed back as-is (subclasses are converted to
				529	true Unicode objects), all other objects are delegated to
				530	PyUnicode_FromEncodedObject(obj, NULL, "strict") which results in
				531	using the default encoding as basis for decoding the object.
Marc-André Lemburg	5a5c81a	2000-07-07 13:46:42 +0000	[diff] [blame]	532
				533	The API returns NULL in case of an error. The caller is responsible
				534	for decref'ing the returned objects.
				535
				536	*/
				537
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	538	PyAPI_FUNC(PyObject*) PyUnicode_FromObject(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	539	register PyObject *obj /* Object */
				540	);
				541
Christian Heimes	7f39c9f	2008-01-25 12:18:43 +0000	[diff] [blame]	542	PyAPI_FUNC(PyObject *) PyUnicode_FromFormatV(const char*, va_list);
				543	PyAPI_FUNC(PyObject *) PyUnicode_FromFormat(const char*, ...);
				544
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	545	/* --- wchar_t support for platforms which support it --------------------- */
				546
				547	#ifdef HAVE_WCHAR_H
				548
				549	/* Create a Unicode Object from the wchar_t buffer w of the given
				550	size.
				551
				552	The buffer is copied into the new object. */
				553
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	554	PyAPI_FUNC(PyObject*) PyUnicode_FromWideChar(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	555	register const wchar_t *w, /* wchar_t buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	556	Py_ssize_t size /* size of buffer */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	557	);
				558
Marc-André Lemburg	a9cadcd	2004-11-22 13:02:31 +0000	[diff] [blame]	559	/* Copies the Unicode Object contents into the wchar_t buffer w. At
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	560	most size wchar_t characters are copied.
				561
Marc-André Lemburg	a9cadcd	2004-11-22 13:02:31 +0000	[diff] [blame]	562	Note that the resulting wchar_t string may or may not be
				563	0-terminated. It is the responsibility of the caller to make sure
				564	that the wchar_t string is 0-terminated in case this is required by
				565	the application.
				566
				567	Returns the number of wchar_t characters copied (excluding a
				568	possibly trailing 0-termination character) or -1 in case of an
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	569	error. */
				570
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	571	PyAPI_FUNC(Py_ssize_t) PyUnicode_AsWideChar(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	572	PyUnicodeObject *unicode, /* Unicode object */
				573	register wchar_t *w, /* wchar_t buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	574	Py_ssize_t size /* size of buffer */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	575	);
				576
				577	#endif
				578
Marc-André Lemburg	cc8764c	2002-08-11 12:23:04 +0000	[diff] [blame]	579	/* --- Unicode ordinals --------------------------------------------------- */
				580
				581	/* Create a Unicode Object from the given Unicode code point ordinal.
				582
				583	The ordinal must be in range(0x10000) on narrow Python builds
				584	(UCS2), and range(0x110000) on wide builds (UCS4). A ValueError is
				585	raised in case it is not.
				586
				587	*/
				588
Marc-André Lemburg	9c329de	2002-08-12 08:19:10 +0000	[diff] [blame]	589	PyAPI_FUNC(PyObject*) PyUnicode_FromOrdinal(int ordinal);
Marc-André Lemburg	cc8764c	2002-08-11 12:23:04 +0000	[diff] [blame]	590
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	591	/* === Builtin Codecs =====================================================
				592
				593	Many of these APIs take two arguments encoding and errors. These
				594	parameters encoding and errors have the same semantics as the ones
				595	of the builtin unicode() API.
				596
Fred Drake	cb093fe	2000-05-09 19:51:53 +0000	[diff] [blame]	597	Setting encoding to NULL causes the default encoding to be used.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	598
				599	Error handling is set by errors which may also be set to NULL
				600	meaning to use the default handling defined for the codec. Default
				601	error handling for all builtin codecs is "strict" (ValueErrors are
				602	raised).
				603
				604	The codecs all use a similar interface. Only deviations from the
				605	generic ones are documented.
				606
				607	*/
				608
Fred Drake	cb093fe	2000-05-09 19:51:53 +0000	[diff] [blame]	609	/* --- Manage the default encoding ---------------------------------------- */
				610
Jeremy Hylton	3ce4538	2001-07-30 22:34:24 +0000	[diff] [blame]	611	/* Return a Python string holding the default encoded value of the
				612	Unicode object.
				613
				614	The resulting string is cached in the Unicode object for subsequent
				615	usage by this function. The cached version is needed to implement
				616	the character buffer interface and will live (at least) as long as
				617	the Unicode object itself.
				618
				619	The refcount of the string is not incremented.
				620
				621	*** Exported for internal use by the interpreter only !!! ***
				622
				623	*/
				624
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	625	PyAPI_FUNC(PyObject *) _PyUnicode_AsDefaultEncodedString(
Jeremy Hylton	3ce4538	2001-07-30 22:34:24 +0000	[diff] [blame]	626	PyObject *, const char *);
				627
Fred Drake	cb093fe	2000-05-09 19:51:53 +0000	[diff] [blame]	628	/* Returns the currently active default encoding.
				629
				630	The default encoding is currently implemented as run-time settable
				631	process global. This may change in future versions of the
				632	interpreter to become a parameter which is managed on a per-thread
				633	basis.
				634
				635	*/
				636
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	637	PyAPI_FUNC(const char*) PyUnicode_GetDefaultEncoding(void);
Fred Drake	cb093fe	2000-05-09 19:51:53 +0000	[diff] [blame]	638
				639	/* Sets the currently active default encoding.
				640
				641	Returns 0 on success, -1 in case of an error.
				642
				643	*/
				644
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	645	PyAPI_FUNC(int) PyUnicode_SetDefaultEncoding(
Fred Drake	cb093fe	2000-05-09 19:51:53 +0000	[diff] [blame]	646	const char *encoding /* Encoding name in standard form */
				647	);
				648
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	649	/* --- Generic Codecs ----------------------------------------------------- */
				650
				651	/* Create a Unicode object by decoding the encoded string s of the
				652	given size. */
				653
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	654	PyAPI_FUNC(PyObject*) PyUnicode_Decode(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	655	const char *s, /* encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	656	Py_ssize_t size, /* size of buffer */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	657	const char *encoding, /* encoding */
				658	const char *errors /* error handling */
				659	);
				660
				661	/* Encodes a Py_UNICODE buffer of the given size and returns a
				662	Python string object. */
				663
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	664	PyAPI_FUNC(PyObject*) PyUnicode_Encode(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	665	const Py_UNICODE *s, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	666	Py_ssize_t size, /* number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	667	const char *encoding, /* encoding */
				668	const char *errors /* error handling */
				669	);
				670
Marc-André Lemburg	d2d4598	2004-07-08 17:57:32 +0000	[diff] [blame]	671	/* Encodes a Unicode object and returns the result as Python
				672	object. */
				673
				674	PyAPI_FUNC(PyObject*) PyUnicode_AsEncodedObject(
				675	PyObject *unicode, /* Unicode object */
				676	const char *encoding, /* encoding */
				677	const char *errors /* error handling */
				678	);
				679
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	680	/* Encodes a Unicode object and returns the result as Python string
				681	object. */
				682
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	683	PyAPI_FUNC(PyObject*) PyUnicode_AsEncodedString(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	684	PyObject *unicode, /* Unicode object */
				685	const char *encoding, /* encoding */
				686	const char *errors /* error handling */
				687	);
				688
Martin v. Löwis	3f76779	2006-06-04 19:36:28 +0000	[diff] [blame]	689	PyAPI_FUNC(PyObject*) PyUnicode_BuildEncodingMap(
				690	PyObject* string /* 256 character map */
				691	);
				692
				693
Marc-André Lemburg	c60e6f7	2001-09-20 10:35:46 +0000	[diff] [blame]	694	/* --- UTF-7 Codecs ------------------------------------------------------- */
				695
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	696	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF7(
Marc-André Lemburg	c60e6f7	2001-09-20 10:35:46 +0000	[diff] [blame]	697	const char *string, /* UTF-7 encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	698	Py_ssize_t length, /* size of string */
Marc-André Lemburg	c60e6f7	2001-09-20 10:35:46 +0000	[diff] [blame]	699	const char *errors /* error handling */
				700	);
				701
Amaury Forgeot d'Arc	5087980	2007-11-20 23:31:27 +0000	[diff] [blame]	702	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF7Stateful(
				703	const char *string, /* UTF-7 encoded string */
				704	Py_ssize_t length, /* size of string */
				705	const char *errors, /* error handling */
				706	Py_ssize_t *consumed /* bytes consumed */
				707	);
				708
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	709	PyAPI_FUNC(PyObject*) PyUnicode_EncodeUTF7(
Marc-André Lemburg	c60e6f7	2001-09-20 10:35:46 +0000	[diff] [blame]	710	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	711	Py_ssize_t length, /* number of Py_UNICODE chars to encode */
Marc-André Lemburg	c60e6f7	2001-09-20 10:35:46 +0000	[diff] [blame]	712	int encodeSetO, /* force the encoder to encode characters in
				713	Set O, as described in RFC2152 */
				714	int encodeWhiteSpace, /* force the encoder to encode space, tab,
				715	carriage return and linefeed characters */
				716	const char *errors /* error handling */
				717	);
				718
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	719	/* --- UTF-8 Codecs ------------------------------------------------------- */
				720
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	721	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF8(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	722	const char *string, /* UTF-8 encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	723	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	724	const char *errors /* error handling */
				725	);
				726
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	727	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF8Stateful(
				728	const char *string, /* UTF-8 encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	729	Py_ssize_t length, /* size of string */
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	730	const char *errors, /* error handling */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	731	Py_ssize_t *consumed /* bytes consumed */
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	732	);
				733
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	734	PyAPI_FUNC(PyObject*) PyUnicode_AsUTF8String(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	735	PyObject *unicode /* Unicode object */
				736	);
				737
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	738	PyAPI_FUNC(PyObject*) PyUnicode_EncodeUTF8(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	739	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	740	Py_ssize_t length, /* number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	741	const char *errors /* error handling */
				742	);
				743
Walter Dörwald	6e39080	2007-08-17 16:41:28 +0000	[diff] [blame]	744	/* --- UTF-32 Codecs ------------------------------------------------------ */
				745
				746	/* Decodes length bytes from a UTF-32 encoded buffer string and returns
				747	the corresponding Unicode object.
				748
				749	errors (if non-NULL) defines the error handling. It defaults
				750	to "strict".
				751
				752	If byteorder is non-NULL, the decoder starts decoding using the
				753	given byte order:
				754
				755	*byteorder == -1: little endian
				756	*byteorder == 0: native order
				757	*byteorder == 1: big endian
				758
				759	In native mode, the first four bytes of the stream are checked for a
				760	BOM mark. If found, the BOM mark is analysed, the byte order
				761	adjusted and the BOM skipped. In the other modes, no BOM mark
				762	interpretation is done. After completion, *byteorder is set to the
				763	current byte order at the end of input data.
				764
				765	If byteorder is NULL, the codec starts in native order mode.
				766
				767	*/
				768
				769	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF32(
				770	const char *string, /* UTF-32 encoded string */
				771	Py_ssize_t length, /* size of string */
				772	const char *errors, /* error handling */
				773	int *byteorder /* pointer to byteorder to use
				774	0=native;-1=LE,1=BE; updated on
				775	exit */
				776	);
				777
				778	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF32Stateful(
				779	const char *string, /* UTF-32 encoded string */
				780	Py_ssize_t length, /* size of string */
				781	const char *errors, /* error handling */
				782	int *byteorder, /* pointer to byteorder to use
				783	0=native;-1=LE,1=BE; updated on
				784	exit */
				785	Py_ssize_t *consumed /* bytes consumed */
				786	);
				787
				788	/* Returns a Python string using the UTF-32 encoding in native byte
				789	order. The string always starts with a BOM mark. */
				790
				791	PyAPI_FUNC(PyObject*) PyUnicode_AsUTF32String(
				792	PyObject *unicode /* Unicode object */
				793	);
				794
				795	/* Returns a Python string object holding the UTF-32 encoded value of
				796	the Unicode data.
				797
				798	If byteorder is not 0, output is written according to the following
				799	byte order:
				800
				801	byteorder == -1: little endian
				802	byteorder == 0: native byte order (writes a BOM mark)
				803	byteorder == 1: big endian
				804
				805	If byteorder is 0, the output string will always start with the
				806	Unicode BOM mark (U+FEFF). In the other two modes, no BOM mark is
				807	prepended.
				808
				809	*/
				810
				811	PyAPI_FUNC(PyObject*) PyUnicode_EncodeUTF32(
				812	const Py_UNICODE *data, /* Unicode char buffer */
				813	Py_ssize_t length, /* number of Py_UNICODE chars to encode */
				814	const char *errors, /* error handling */
				815	int byteorder /* byteorder to use 0=BOM+native;-1=LE,1=BE */
				816	);
				817
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	818	/* --- UTF-16 Codecs ------------------------------------------------------ */
				819
Guido van Rossum	9e896b3	2000-04-05 20:11:21 +0000	[diff] [blame]	820	/* Decodes length bytes from a UTF-16 encoded buffer string and returns
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	821	the corresponding Unicode object.
				822
				823	errors (if non-NULL) defines the error handling. It defaults
				824	to "strict".
				825
				826	If byteorder is non-NULL, the decoder starts decoding using the
				827	given byte order:
				828
				829	*byteorder == -1: little endian
				830	*byteorder == 0: native order
				831	*byteorder == 1: big endian
				832
Marc-André Lemburg	489b56e	2001-05-21 20:30:15 +0000	[diff] [blame]	833	In native mode, the first two bytes of the stream are checked for a
				834	BOM mark. If found, the BOM mark is analysed, the byte order
				835	adjusted and the BOM skipped. In the other modes, no BOM mark
				836	interpretation is done. After completion, *byteorder is set to the
				837	current byte order at the end of input data.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	838
				839	If byteorder is NULL, the codec starts in native order mode.
				840
				841	*/
				842
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	843	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF16(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	844	const char *string, /* UTF-16 encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	845	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	846	const char *errors, /* error handling */
				847	int *byteorder /* pointer to byteorder to use
				848	0=native;-1=LE,1=BE; updated on
				849	exit */
				850	);
				851
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	852	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUTF16Stateful(
				853	const char *string, /* UTF-16 encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	854	Py_ssize_t length, /* size of string */
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	855	const char *errors, /* error handling */
				856	int *byteorder, /* pointer to byteorder to use
				857	0=native;-1=LE,1=BE; updated on
				858	exit */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	859	Py_ssize_t *consumed /* bytes consumed */
Walter Dörwald	6965203	2004-09-07 20:24:22 +0000	[diff] [blame]	860	);
				861
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	862	/* Returns a Python string using the UTF-16 encoding in native byte
				863	order. The string always starts with a BOM mark. */
				864
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	865	PyAPI_FUNC(PyObject*) PyUnicode_AsUTF16String(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	866	PyObject *unicode /* Unicode object */
				867	);
				868
				869	/* Returns a Python string object holding the UTF-16 encoded value of
Guido van Rossum	9e896b3	2000-04-05 20:11:21 +0000	[diff] [blame]	870	the Unicode data.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	871
				872	If byteorder is not 0, output is written according to the following
				873	byte order:
				874
				875	byteorder == -1: little endian
				876	byteorder == 0: native byte order (writes a BOM mark)
				877	byteorder == 1: big endian
				878
				879	If byteorder is 0, the output string will always start with the
				880	Unicode BOM mark (U+FEFF). In the other two modes, no BOM mark is
				881	prepended.
				882
				883	Note that Py_UNICODE data is being interpreted as UTF-16 reduced to
				884	UCS-2. This trick makes it possible to add full UTF-16 capabilities
Thomas Wouters	7e47402	2000-07-16 12:04:32 +0000	[diff] [blame]	885	at a later point without compromising the APIs.
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	886
				887	*/
				888
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	889	PyAPI_FUNC(PyObject*) PyUnicode_EncodeUTF16(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	890	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	891	Py_ssize_t length, /* number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	892	const char *errors, /* error handling */
				893	int byteorder /* byteorder to use 0=BOM+native;-1=LE,1=BE */
				894	);
				895
				896	/* --- Unicode-Escape Codecs ---------------------------------------------- */
				897
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	898	PyAPI_FUNC(PyObject*) PyUnicode_DecodeUnicodeEscape(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	899	const char *string, /* Unicode-Escape encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	900	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	901	const char *errors /* error handling */
				902	);
				903
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	904	PyAPI_FUNC(PyObject*) PyUnicode_AsUnicodeEscapeString(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	905	PyObject *unicode /* Unicode object */
				906	);
				907
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	908	PyAPI_FUNC(PyObject*) PyUnicode_EncodeUnicodeEscape(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	909	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	910	Py_ssize_t length /* Number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	911	);
				912
				913	/* --- Raw-Unicode-Escape Codecs ------------------------------------------ */
				914
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	915	PyAPI_FUNC(PyObject*) PyUnicode_DecodeRawUnicodeEscape(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	916	const char *string, /* Raw-Unicode-Escape encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	917	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	918	const char *errors /* error handling */
				919	);
				920
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	921	PyAPI_FUNC(PyObject*) PyUnicode_AsRawUnicodeEscapeString(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	922	PyObject *unicode /* Unicode object */
				923	);
				924
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	925	PyAPI_FUNC(PyObject*) PyUnicode_EncodeRawUnicodeEscape(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	926	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	927	Py_ssize_t length /* Number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	928	);
				929
Walter Dörwald	a47d1c0	2005-08-30 10:23:14 +0000	[diff] [blame]	930	/* --- Unicode Internal Codec ---------------------------------------------
				931
				932	Only for internal use in _codecsmodule.c */
				933
				934	PyObject *_PyUnicode_DecodeUnicodeInternal(
				935	const char *string,
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	936	Py_ssize_t length,
Walter Dörwald	a47d1c0	2005-08-30 10:23:14 +0000	[diff] [blame]	937	const char *errors
				938	);
				939
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	940	/* --- Latin-1 Codecs -----------------------------------------------------
				941
				942	Note: Latin-1 corresponds to the first 256 Unicode ordinals.
				943
				944	*/
				945
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	946	PyAPI_FUNC(PyObject*) PyUnicode_DecodeLatin1(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	947	const char *string, /* Latin-1 encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	948	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	949	const char *errors /* error handling */
				950	);
				951
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	952	PyAPI_FUNC(PyObject*) PyUnicode_AsLatin1String(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	953	PyObject *unicode /* Unicode object */
				954	);
				955
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	956	PyAPI_FUNC(PyObject*) PyUnicode_EncodeLatin1(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	957	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	958	Py_ssize_t length, /* Number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	959	const char *errors /* error handling */
				960	);
				961
				962	/* --- ASCII Codecs -------------------------------------------------------
				963
				964	Only 7-bit ASCII data is accepted. All other codes generate errors.
				965
				966	*/
				967
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	968	PyAPI_FUNC(PyObject*) PyUnicode_DecodeASCII(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	969	const char *string, /* ASCII encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	970	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	971	const char *errors /* error handling */
				972	);
				973
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	974	PyAPI_FUNC(PyObject*) PyUnicode_AsASCIIString(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	975	PyObject *unicode /* Unicode object */
				976	);
				977
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	978	PyAPI_FUNC(PyObject*) PyUnicode_EncodeASCII(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	979	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	980	Py_ssize_t length, /* Number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	981	const char *errors /* error handling */
				982	);
				983
				984	/* --- Character Map Codecs -----------------------------------------------
				985
				986	This codec uses mappings to encode and decode characters.
				987
				988	Decoding mappings must map single string characters to single
				989	Unicode characters, integers (which are then interpreted as Unicode
				990	ordinals) or None (meaning "undefined mapping" and causing an
				991	error).
				992
				993	Encoding mappings must map single Unicode characters to single
				994	string characters, integers (which are then interpreted as Latin-1
				995	ordinals) or None (meaning "undefined mapping" and causing an
				996	error).
				997
				998	If a character lookup fails with a LookupError, the character is
				999	copied as-is meaning that its ordinal value will be interpreted as
				1000	Unicode or Latin-1 ordinal resp. Because of this mappings only need
				1001	to contain those mappings which map characters to different code
				1002	points.
				1003
				1004	*/
				1005
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1006	PyAPI_FUNC(PyObject*) PyUnicode_DecodeCharmap(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1007	const char *string, /* Encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1008	Py_ssize_t length, /* size of string */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1009	PyObject *mapping, /* character mapping
				1010	(char ordinal -> unicode ordinal) */
				1011	const char *errors /* error handling */
				1012	);
				1013
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1014	PyAPI_FUNC(PyObject*) PyUnicode_AsCharmapString(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1015	PyObject *unicode, /* Unicode object */
				1016	PyObject *mapping /* character mapping
				1017	(unicode ordinal -> char ordinal) */
				1018	);
				1019
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1020	PyAPI_FUNC(PyObject*) PyUnicode_EncodeCharmap(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1021	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1022	Py_ssize_t length, /* Number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1023	PyObject *mapping, /* character mapping
				1024	(unicode ordinal -> char ordinal) */
				1025	const char *errors /* error handling */
				1026	);
				1027
				1028	/* Translate a Py_UNICODE buffer of the given length by applying a
				1029	character mapping table to it and return the resulting Unicode
				1030	object.
				1031
				1032	The mapping table must map Unicode ordinal integers to Unicode
				1033	ordinal integers or None (causing deletion of the character).
				1034
				1035	Mapping tables may be dictionaries or sequences. Unmapped character
				1036	ordinals (ones which cause a LookupError) are left untouched and
				1037	are copied as-is.
				1038
				1039	*/
				1040
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1041	PyAPI_FUNC(PyObject *) PyUnicode_TranslateCharmap(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1042	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1043	Py_ssize_t length, /* Number of Py_UNICODE chars to encode */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1044	PyObject *table, /* Translate table */
				1045	const char *errors /* error handling */
				1046	);
				1047
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1048	#ifdef MS_WIN32
Guido van Rossum	24bdb04	2000-03-28 20:29:59 +0000	[diff] [blame]	1049
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1050	/* --- MBCS codecs for Windows -------------------------------------------- */
Guido van Rossum	24bdb04	2000-03-28 20:29:59 +0000	[diff] [blame]	1051
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1052	PyAPI_FUNC(PyObject*) PyUnicode_DecodeMBCS(
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1053	const char *string, /* MBCS encoded string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1054	Py_ssize_t length, /* size of string */
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1055	const char *errors /* error handling */
				1056	);
				1057
Martin v. Löwis	d825143	2006-06-14 05:21:04 +0000	[diff] [blame]	1058	PyAPI_FUNC(PyObject*) PyUnicode_DecodeMBCSStateful(
				1059	const char *string, /* MBCS encoded string */
				1060	Py_ssize_t length, /* size of string */
				1061	const char *errors, /* error handling */
				1062	Py_ssize_t *consumed /* bytes consumed */
				1063	);
				1064
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1065	PyAPI_FUNC(PyObject*) PyUnicode_AsMBCSString(
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1066	PyObject *unicode /* Unicode object */
				1067	);
				1068
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1069	PyAPI_FUNC(PyObject*) PyUnicode_EncodeMBCS(
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1070	const Py_UNICODE *data, /* Unicode char buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1071	Py_ssize_t length, /* Number of Py_UNICODE chars to encode */
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1072	const char *errors /* error handling */
				1073	);
				1074
Guido van Rossum	efec115	2000-03-28 02:01:15 +0000	[diff] [blame]	1075	#endif /* MS_WIN32 */
Guido van Rossum	24bdb04	2000-03-28 20:29:59 +0000	[diff] [blame]	1076
Guido van Rossum	9e896b3	2000-04-05 20:11:21 +0000	[diff] [blame]	1077	/* --- Decimal Encoder ---------------------------------------------------- */
				1078
				1079	/* Takes a Unicode string holding a decimal value and writes it into
				1080	an output buffer using standard ASCII digit codes.
				1081
				1082	The output buffer has to provide at least length+1 bytes of storage
				1083	area. The output string is 0-terminated.
				1084
				1085	The encoder converts whitespace to ' ', decimal characters to their
				1086	corresponding ASCII digit and all other Latin-1 characters except
				1087	\0 as-is. Characters outside this range (Unicode ordinals 1-256)
				1088	are treated as errors. This includes embedded NULL bytes.
				1089
				1090	Error handling is defined by the errors argument:
				1091
				1092	NULL or "strict": raise a ValueError
				1093	"ignore": ignore the wrong characters (these are not copied to the
				1094	output buffer)
				1095	"replace": replaces illegal characters with '?'
				1096
				1097	Returns 0 on success, -1 on failure.
				1098
				1099	*/
				1100
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1101	PyAPI_FUNC(int) PyUnicode_EncodeDecimal(
Guido van Rossum	9e896b3	2000-04-05 20:11:21 +0000	[diff] [blame]	1102	Py_UNICODE *s, /* Unicode buffer */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1103	Py_ssize_t length, /* Number of Py_UNICODE chars to encode */
Guido van Rossum	9e896b3	2000-04-05 20:11:21 +0000	[diff] [blame]	1104	char *output, /* Output buffer; must have size >= length+1 */
				1105	const char *errors /* error handling */
				1106	);
				1107
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1108	/* --- Methods & Slots ----------------------------------------------------
				1109
				1110	These are capable of handling Unicode objects and strings on input
				1111	(we refer to them as strings in the descriptions) and return
				1112	Unicode objects or integers as appropriate. */
				1113
				1114	/* Concat two strings giving a new Unicode string. */
				1115
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1116	PyAPI_FUNC(PyObject*) PyUnicode_Concat(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1117	PyObject *left, /* Left string */
				1118	PyObject *right /* Right string */
				1119	);
				1120
				1121	/* Split a string giving a list of Unicode strings.
				1122
				1123	If sep is NULL, splitting will be done at all whitespace
				1124	substrings. Otherwise, splits occur at the given separator.
				1125
				1126	At most maxsplit splits will be done. If negative, no limit is set.
				1127
				1128	Separators are not included in the resulting list.
				1129
				1130	*/
				1131
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1132	PyAPI_FUNC(PyObject*) PyUnicode_Split(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1133	PyObject *s, /* String to split */
				1134	PyObject *sep, /* String separator */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1135	Py_ssize_t maxsplit /* Maxsplit count */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1136	);
				1137
				1138	/* Ditto, but split at line breaks.
				1139
				1140	CRLF is considered to be one line break. Line breaks are not
				1141	included in the resulting list. */
				1142
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1143	PyAPI_FUNC(PyObject*) PyUnicode_Splitlines(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1144	PyObject *s, /* String to split */
Guido van Rossum	004d64f	2000-04-11 15:39:46 +0000	[diff] [blame]	1145	int keepends /* If true, line end markers are included */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1146	);
				1147
Fredrik Lundh	06a69dd	2006-05-26 08:54:28 +0000	[diff] [blame]	1148	/* Partition a string using a given separator. */
				1149
				1150	PyAPI_FUNC(PyObject*) PyUnicode_Partition(
				1151	PyObject *s, /* String to partition */
				1152	PyObject *sep /* String separator */
				1153	);
				1154
Fredrik Lundh	b3167cb	2006-05-26 18:15:38 +0000	[diff] [blame]	1155	/* Partition a string using a given separator, searching from the end of the
				1156	string. */
				1157
				1158	PyAPI_FUNC(PyObject*) PyUnicode_RPartition(
				1159	PyObject *s, /* String to partition */
				1160	PyObject *sep /* String separator */
				1161	);
				1162
Hye-Shik Chang	3ae811b	2003-12-15 18:49:53 +0000	[diff] [blame]	1163	/* Split a string giving a list of Unicode strings.
				1164
				1165	If sep is NULL, splitting will be done at all whitespace
				1166	substrings. Otherwise, splits occur at the given separator.
				1167
				1168	At most maxsplit splits will be done. But unlike PyUnicode_Split
				1169	PyUnicode_RSplit splits from the end of the string. If negative,
				1170	no limit is set.
				1171
				1172	Separators are not included in the resulting list.
				1173
				1174	*/
				1175
				1176	PyAPI_FUNC(PyObject*) PyUnicode_RSplit(
				1177	PyObject *s, /* String to split */
				1178	PyObject *sep, /* String separator */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1179	Py_ssize_t maxsplit /* Maxsplit count */
Hye-Shik Chang	3ae811b	2003-12-15 18:49:53 +0000	[diff] [blame]	1180	);
				1181
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1182	/* Translate a string by applying a character mapping table to it and
				1183	return the resulting Unicode object.
				1184
				1185	The mapping table must map Unicode ordinal integers to Unicode
				1186	ordinal integers or None (causing deletion of the character).
				1187
				1188	Mapping tables may be dictionaries or sequences. Unmapped character
				1189	ordinals (ones which cause a LookupError) are left untouched and
				1190	are copied as-is.
				1191
				1192	*/
				1193
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1194	PyAPI_FUNC(PyObject *) PyUnicode_Translate(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1195	PyObject *str, /* String */
				1196	PyObject *table, /* Translate table */
				1197	const char *errors /* error handling */
				1198	);
				1199
				1200	/* Join a sequence of strings using the given separator and return
				1201	the resulting Unicode string. */
				1202
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1203	PyAPI_FUNC(PyObject*) PyUnicode_Join(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1204	PyObject *separator, /* Separator string */
				1205	PyObject *seq /* Sequence object */
				1206	);
				1207
				1208	/* Return 1 if substr matches str[start:end] at the given tail end, 0
				1209	otherwise. */
				1210
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1211	PyAPI_FUNC(Py_ssize_t) PyUnicode_Tailmatch(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1212	PyObject *str, /* String */
				1213	PyObject *substr, /* Prefix or Suffix string */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1214	Py_ssize_t start, /* Start index */
				1215	Py_ssize_t end, /* Stop index */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1216	int direction /* Tail end: -1 prefix, +1 suffix */
				1217	);
				1218
				1219	/* Return the first position of substr in str[start:end] using the
Marc-André Lemburg	4da6fd6	2002-05-29 11:33:13 +0000	[diff] [blame]	1220	given search direction or -1 if not found. -2 is returned in case
				1221	an error occurred and an exception is set. */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1222
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1223	PyAPI_FUNC(Py_ssize_t) PyUnicode_Find(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1224	PyObject *str, /* String */
				1225	PyObject *substr, /* Substring to find */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1226	Py_ssize_t start, /* Start index */
				1227	Py_ssize_t end, /* Stop index */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1228	int direction /* Find direction: +1 forward, -1 backward */
				1229	);
				1230
Barry Warsaw	51ac580	2000-03-20 16:36:48 +0000	[diff] [blame]	1231	/* Count the number of occurrences of substr in str[start:end]. */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1232
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1233	PyAPI_FUNC(Py_ssize_t) PyUnicode_Count(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1234	PyObject *str, /* String */
				1235	PyObject *substr, /* Substring to count */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1236	Py_ssize_t start, /* Start index */
				1237	Py_ssize_t end /* Stop index */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1238	);
				1239
Barry Warsaw	51ac580	2000-03-20 16:36:48 +0000	[diff] [blame]	1240	/* Replace at most maxcount occurrences of substr in str with replstr
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1241	and return the resulting Unicode object. */
				1242
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1243	PyAPI_FUNC(PyObject *) PyUnicode_Replace(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1244	PyObject *str, /* String */
				1245	PyObject *substr, /* Substring to find */
				1246	PyObject *replstr, /* Substring to replace */
Martin v. Löwis	18e1655	2006-02-15 17:27:45 +0000	[diff] [blame]	1247	Py_ssize_t maxcount /* Max. number of replacements to apply;
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1248	-1 = all */
				1249	);
				1250
				1251	/* Compare two strings and return -1, 0, 1 for less than, equal,
				1252	greater than resp. */
				1253
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1254	PyAPI_FUNC(int) PyUnicode_Compare(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1255	PyObject *left, /* Left string */
				1256	PyObject *right /* Right string */
				1257	);
				1258
Marc-André Lemburg	040f76b	2006-08-14 10:55:19 +0000	[diff] [blame]	1259	/* Rich compare two strings and return one of the following:
				1260
				1261	- NULL in case an exception was raised
				1262	- Py_True or Py_False for successful comparisons
				1263	- Py_NotImplemented in case the type combination is unknown
				1264
				1265	Note that Py_EQ and Py_NE comparisons can cause a UnicodeWarning in
				1266	case the conversion of the arguments to Unicode fails with a
				1267	UnicodeDecodeError.
				1268
				1269	Possible values for op:
				1270
				1271	Py_GT, Py_GE, Py_EQ, Py_NE, Py_LT, Py_LE
				1272
				1273	*/
				1274
				1275	PyAPI_FUNC(PyObject *) PyUnicode_RichCompare(
				1276	PyObject *left, /* Left string */
				1277	PyObject *right, /* Right string */
				1278	int op /* Operation: Py_EQ, Py_NE, Py_GT, etc. */
				1279	);
				1280
Thomas Wouters	7e47402	2000-07-16 12:04:32 +0000	[diff] [blame]	1281	/* Apply an argument tuple or dictionary to a format string and return
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1282	the resulting Unicode string. */
				1283
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1284	PyAPI_FUNC(PyObject *) PyUnicode_Format(
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1285	PyObject *format, /* Format string */
				1286	PyObject *args /* Argument tuple or dictionary */
				1287	);
				1288
Guido van Rossum	d0d366b	2000-03-13 23:22:24 +0000	[diff] [blame]	1289	/* Checks whether element is contained in container and return 1/0
				1290	accordingly.
				1291
				1292	element has to coerce to a one-element Unicode string. -1 is
				1293	returned in case of an error. */
				1294
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1295	PyAPI_FUNC(int) PyUnicode_Contains(
Guido van Rossum	d0d366b	2000-03-13 23:22:24 +0000	[diff] [blame]	1296	PyObject *container, /* Container string */
				1297	PyObject *element /* Element string */
				1298	);
				1299
Walter Dörwald	de02bcb	2002-04-22 17:42:37 +0000	[diff] [blame]	1300	/* Externally visible for str.strip(unicode) */
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1301	PyAPI_FUNC(PyObject *) _PyUnicode_XStrip(
Walter Dörwald	de02bcb	2002-04-22 17:42:37 +0000	[diff] [blame]	1302	PyUnicodeObject *self,
				1303	int striptype,
				1304	PyObject *sepobj
				1305	);
				1306
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1307	/* === Characters Type APIs =============================================== */
				1308
				1309	/* These should not be used directly. Use the Py_UNICODE_IS* and
				1310	Py_UNICODE_TO* macros instead.
				1311
				1312	These APIs are implemented in Objects/unicodectype.c.
				1313
				1314	*/
				1315
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1316	PyAPI_FUNC(int) _PyUnicode_IsLowercase(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1317	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1318	);
				1319
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1320	PyAPI_FUNC(int) _PyUnicode_IsUppercase(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1321	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1322	);
				1323
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1324	PyAPI_FUNC(int) _PyUnicode_IsTitlecase(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1325	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1326	);
				1327
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1328	PyAPI_FUNC(int) _PyUnicode_IsWhitespace(
Tim Peters	2576c97	2005-10-29 02:33:18 +0000	[diff] [blame]	1329	const Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1330	);
				1331
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1332	PyAPI_FUNC(int) _PyUnicode_IsLinebreak(
Tim Peters	2576c97	2005-10-29 02:33:18 +0000	[diff] [blame]	1333	const Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1334	);
				1335
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1336	PyAPI_FUNC(Py_UNICODE) _PyUnicode_ToLowercase(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1337	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1338	);
				1339
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1340	PyAPI_FUNC(Py_UNICODE) _PyUnicode_ToUppercase(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1341	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1342	);
				1343
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1344	PyAPI_FUNC(Py_UNICODE) _PyUnicode_ToTitlecase(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1345	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1346	);
				1347
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1348	PyAPI_FUNC(int) _PyUnicode_ToDecimalDigit(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1349	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1350	);
				1351
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1352	PyAPI_FUNC(int) _PyUnicode_ToDigit(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1353	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1354	);
				1355
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1356	PyAPI_FUNC(double) _PyUnicode_ToNumeric(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1357	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1358	);
				1359
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1360	PyAPI_FUNC(int) _PyUnicode_IsDecimalDigit(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1361	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1362	);
				1363
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1364	PyAPI_FUNC(int) _PyUnicode_IsDigit(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1365	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1366	);
				1367
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1368	PyAPI_FUNC(int) _PyUnicode_IsNumeric(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1369	Py_UNICODE ch /* Unicode character */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1370	);
				1371
Mark Hammond	91a681d	2002-08-12 07:21:58 +0000	[diff] [blame]	1372	PyAPI_FUNC(int) _PyUnicode_IsAlpha(
Fredrik Lundh	72b0685	2001-06-27 22:08:26 +0000	[diff] [blame]	1373	Py_UNICODE ch /* Unicode character */
Marc-André Lemburg	f03e741	2000-07-05 09:45:59 +0000	[diff] [blame]	1374	);
				1375
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1376	#ifdef __cplusplus
				1377	}
				1378	#endif
Martin v. Löwis	339d0f7	2001-08-17 18:39:25 +0000	[diff] [blame]	1379	#endif /* Py_USING_UNICODE */
Guido van Rossum	d822518	2000-03-10 22:33:05 +0000	[diff] [blame]	1380	#endif /* !Py_UNICODEOBJECT_H */