Blame - magick/token.c - platform/external/ImageMagick

blob: 2f443d548f151b8ac4f592f00e4d025eda8d0245 [file] [log] [blame]

cristy	3ed852e	2009-09-05 21:47:34 +0000	[diff] [blame]	1	/*
				2	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				3	% %
				4	% %
				5	% %
				6	% TTTTT OOO K K EEEEE N N %
				7	% T O O K K E NN N %
				8	% T O O KKK EEE N N N %
				9	% T O O K K E N NN %
				10	% T OOO K K EEEEE N N %
				11	% %
				12	% %
				13	% MagickCore Token Methods %
				14	% %
				15	% Software Design %
				16	% John Cristy %
				17	% January 1993 %
				18	% %
				19	% %
cristy	16af1cb	2009-12-11 21:38:29 +0000	[diff] [blame]	20	% Copyright 1999-2010 ImageMagick Studio LLC, a non-profit organization %
cristy	3ed852e	2009-09-05 21:47:34 +0000	[diff] [blame]	21	% dedicated to making software imaging solutions freely available. %
				22	% %
				23	% You may not use this file except in compliance with the License. You may %
				24	% obtain a copy of the License at %
				25	% %
				26	% http://www.imagemagick.org/script/license.php %
				27	% %
				28	% Unless required by applicable law or agreed to in writing, software %
				29	% distributed under the License is distributed on an "AS IS" BASIS, %
				30	% WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. %
				31	% See the License for the specific language governing permissions and %
				32	% limitations under the License. %
				33	% %
				34	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				35	%
				36	%
				37	%
				38	*/
				39
				40	/*
				41	Include declarations.
				42	*/
				43	#include "magick/studio.h"
				44	#include "magick/exception.h"
				45	#include "magick/exception-private.h"
				46	#include "magick/image.h"
				47	#include "magick/memory_.h"
				48	#include "magick/string_.h"
				49	#include "magick/token.h"
				50	#include "magick/token-private.h"
				51	#include "magick/utility.h"
				52
				53	/*
				54	Typedef declarations.
				55	*/
				56	struct _TokenInfo
				57	{
				58	int
				59	state;
				60
				61	MagickStatusType
				62	flag;
				63
				64	long
				65	offset;
				66
				67	char
				68	quote;
				69
				70	unsigned long
				71	signature;
				72	};
				73
				74	/*
				75	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				76	% %
				77	% %
				78	% %
				79	% A c q u i r e T o k e n I n f o %
				80	% %
				81	% %
				82	% %
				83	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				84	%
				85	% AcquireTokenInfo() allocates the TokenInfo structure.
				86	%
				87	% The format of the AcquireTokenInfo method is:
				88	%
				89	% TokenInfo *AcquireTokenInfo()
				90	%
				91	*/
				92	MagickExport TokenInfo *AcquireTokenInfo(void)
				93	{
				94	TokenInfo
				95	*token_info;
				96
				97	token_info=(TokenInfo ) AcquireMagickMemory(sizeof(token_info));
				98	if (token_info == (TokenInfo *) NULL)
				99	ThrowFatalException(ResourceLimitFatalError,"MemoryAllocationFailed");
				100	token_info->signature=MagickSignature;
				101	return(token_info);
				102	}
				103
				104	/*
				105	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				106	% %
				107	% %
				108	% %
				109	% D e s t r o y T o k e n I n f o %
				110	% %
				111	% %
				112	% %
				113	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				114	%
				115	% DestroyTokenInfo() deallocates memory associated with a TokenInfo
				116	% structure.
				117	%
				118	% The format of the DestroyTokenInfo method is:
				119	%
				120	% TokenInfo *DestroyTokenInfo(TokenInfo *token_info)
				121	%
				122	% A description of each parameter follows:
				123	%
				124	% o token_info: Specifies a pointer to a TokenInfo structure.
				125	%
				126	*/
				127	MagickExport TokenInfo DestroyTokenInfo(TokenInfo token_info)
				128	{
				129	(void) LogMagickEvent(TraceEvent,GetMagickModule(),"...");
				130	assert(token_info != (TokenInfo *) NULL);
				131	assert(token_info->signature == MagickSignature);
				132	token_info->signature=(~MagickSignature);
				133	token_info=(TokenInfo *) RelinquishMagickMemory(token_info);
				134	return(token_info);
				135	}
				136
				137	/*
				138	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				139	% %
				140	% %
				141	% %
				142	+ G e t M a g i c k T o k e n %
				143	% %
				144	% %
				145	% %
				146	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				147	%
				148	% GetMagickToken() gets a token from the token stream. A token is defined as a
				149	% sequence of characters delimited by whitespace (e.g. clip-path), a sequence
				150	% delimited with quotes (e.g. "Quote me"), or a sequence enclosed in
				151	% parenthesis (e.g. rgb(0,0,0)).
				152	%
				153	% The format of the GetMagickToken method is:
				154	%
				155	% void GetMagickToken(const char *start,const char **end,char *token)
				156	%
				157	% A description of each parameter follows:
				158	%
				159	% o start: the start of the token sequence.
				160	%
				161	% o end: point to the end of the token sequence.
				162	%
				163	% o token: copy the token to this buffer.
				164	%
				165	*/
				166	MagickExport void GetMagickToken(const char start,const char end,char token)
				167	{
				168	double
				169	value;
				170
				171	register const char
				172	*p;
				173
				174	register long
				175	i;
				176
				177	i=0;
				178	for (p=start; *p != '\0'; )
				179	{
				180	while ((isspace((int) ((unsigned char) p)) != 0) && (p != '\0'))
				181	p++;
				182	if (*p == '\0')
				183	break;
				184	switch (*p)
				185	{
				186	case '"':
				187	case '\'':
				188	case '`':
				189	case '{':
				190	{
				191	register char
				192	escape;
				193
				194	switch (*p)
				195	{
				196	case '"': escape='"'; break;
				197	case '\'': escape='\''; break;
				198	case '`': escape='\''; break;
				199	case '{': escape='}'; break;
				200	default: escape=(*p); break;
				201	}
				202	for (p++; *p != '\0'; p++)
				203	{
				204	if ((p == '\\') && (((p+1) == escape) \|\| (*(p+1) == '\\')))
				205	p++;
				206	else
				207	if (*p == escape)
				208	{
				209	p++;
				210	break;
				211	}
				212	token[i++]=(*p);
				213	}
				214	break;
				215	}
				216	case '/':
				217	{
				218	token[i++]=(*p++);
				219	if ((p == '>') \|\| (p == '/'))
				220	token[i++]=(*p++);
				221	break;
				222	}
				223	default:
				224	{
				225	char
				226	*q;
				227
				228	value=strtod(p,&q);
				229	if ((p != q) && (*p != ','))
				230	{
				231	for ( ; (p < q) && (*p != ','); p++)
				232	token[i++]=(*p);
				233	if (*p == '%')
				234	token[i++]=(*p++);
				235	break;
				236	}
				237	if ((isalpha((int) ((unsigned char) *p)) == 0) &&
				238	(p != DirectorySeparator) && (p != '#') && (p != '<'))
				239	{
				240	token[i++]=(*p++);
				241	break;
				242	}
				243	for ( ; *p != '\0'; p++)
				244	{
				245	if (((isspace((int) ((unsigned char) p)) != 0) \|\| (p == '=') \|\|
				246	(p == ',') \|\| (p == ':')) && (*(p-1) != '\\'))
				247	break;
				248	if ((i > 0) && (*p == '<'))
				249	break;
				250	token[i++]=(*p);
				251	if (*p == '>')
				252	break;
				253	if (*p == '(')
				254	for (p++; *p != '\0'; p++)
				255	{
				256	token[i++]=(*p);
				257	if ((p == ')') && ((p-1) != '\\'))
				258	break;
				259	}
				260	}
				261	break;
				262	}
				263	}
				264	break;
				265	}
				266	token[i]='\0';
				267	if (LocaleNCompare(token,"url(",4) == 0)
				268	{
				269	ssize_t
				270	offset;
				271
				272	offset=4;
				273	if (token[offset] == '#')
				274	offset++;
				275	i=(long) strlen(token);
				276	(void) CopyMagickString(token,token+offset,MaxTextExtent);
				277	token[i-offset-1]='\0';
				278	}
				279	while (isspace((int) ((unsigned char) *p)) != 0)
				280	p++;
				281	if (end != (const char **) NULL)
				282	end=(const char ) p;
				283	}
				284
				285	/*
				286	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				287	% %
				288	% %
				289	% %
				290	% G l o b E x p r e s s i o n %
				291	% %
				292	% %
				293	% %
				294	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				295	%
				296	% GlobExpression() returns MagickTrue if the expression matches the pattern.
				297	%
				298	% The format of the GlobExpression function is:
				299	%
				300	% MagickBooleanType GlobExpression(const char *expression,
				301	% const char *pattern,const MagickBooleanType case_insensitive)
				302	%
				303	% A description of each parameter follows:
				304	%
				305	% o expression: Specifies a pointer to a text string containing a file name.
				306	%
				307	% o pattern: Specifies a pointer to a text string containing a pattern.
				308	%
				309	% o case_insensitive: set to MagickTrue to ignore the case when matching
				310	% an expression.
				311	%
				312	*/
				313	MagickExport MagickBooleanType GlobExpression(const char *expression,
				314	const char *pattern,const MagickBooleanType case_insensitive)
				315	{
				316	MagickBooleanType
				317	done,
				318	match;
				319
				320	register const char
				321	*p;
				322
				323	/*
				324	Return on empty pattern or '*'.
				325	*/
				326	if (pattern == (char *) NULL)
				327	return(MagickTrue);
				328	if (GetUTFCode(pattern) == 0)
				329	return(MagickTrue);
				330	if (LocaleCompare(pattern,"*") == 0)
				331	return(MagickTrue);
				332	p=pattern+strlen(pattern)-1;
				333	if ((GetUTFCode(p) == ']') && (strchr(pattern,'[') != (char *) NULL))
				334	{
				335	ExceptionInfo
				336	*exception;
				337
				338	ImageInfo
				339	*image_info;
				340
				341	/*
				342	Determine if pattern is a scene, i.e. img0001.pcd[2].
				343	*/
				344	image_info=AcquireImageInfo();
				345	(void) CopyMagickString(image_info->filename,pattern,MaxTextExtent);
				346	exception=AcquireExceptionInfo();
				347	(void) SetImageInfo(image_info,MagickTrue,exception);
				348	exception=DestroyExceptionInfo(exception);
				349	if (LocaleCompare(image_info->filename,pattern) != 0)
				350	{
				351	image_info=DestroyImageInfo(image_info);
				352	return(MagickFalse);
				353	}
				354	image_info=DestroyImageInfo(image_info);
				355	}
				356	/*
				357	Evaluate glob expression.
				358	*/
				359	done=MagickFalse;
				360	while ((GetUTFCode(pattern) != 0) && (done == MagickFalse))
				361	{
				362	if (GetUTFCode(expression) == 0)
				363	if ((GetUTFCode(pattern) != '{') && (GetUTFCode(pattern) != '*'))
				364	break;
				365	switch (GetUTFCode(pattern))
				366	{
				367	case '\\':
				368	{
				369	pattern+=GetUTFOctets(pattern);
				370	if (GetUTFCode(pattern) != 0)
				371	pattern+=GetUTFOctets(pattern);
				372	break;
				373	}
				374	case '*':
				375	{
				376	MagickBooleanType
				377	status;
				378
				379	status=MagickFalse;
				380	pattern+=GetUTFOctets(pattern);
				381	while ((GetUTFCode(expression) != 0) && (status == MagickFalse))
				382	{
				383	status=GlobExpression(expression,pattern,case_insensitive);
				384	expression+=GetUTFOctets(expression);
				385	}
				386	if (status != MagickFalse)
				387	{
				388	while (GetUTFCode(expression) != 0)
				389	expression+=GetUTFOctets(expression);
				390	while (GetUTFCode(pattern) != 0)
				391	pattern+=GetUTFOctets(pattern);
				392	}
				393	break;
				394	}
				395	case '[':
				396	{
				397	unsigned long
				398	c;
				399
				400	pattern+=GetUTFOctets(pattern);
				401	for ( ; ; )
				402	{
				403	if ((GetUTFCode(pattern) == 0) \|\| (GetUTFCode(pattern) == ']'))
				404	{
				405	done=MagickTrue;
				406	break;
				407	}
				408	if (GetUTFCode(pattern) == '\\')
				409	{
				410	pattern+=GetUTFOctets(pattern);
				411	if (GetUTFCode(pattern) == 0)
				412	{
				413	done=MagickTrue;
				414	break;
				415	}
				416	}
				417	if (GetUTFCode(pattern+GetUTFOctets(pattern)) == '-')
				418	{
				419	c=GetUTFCode(pattern);
				420	pattern+=GetUTFOctets(pattern);
				421	pattern+=GetUTFOctets(pattern);
				422	if (GetUTFCode(pattern) == ']')
				423	{
				424	done=MagickTrue;
				425	break;
				426	}
				427	if (GetUTFCode(pattern) == '\\')
				428	{
				429	pattern+=GetUTFOctets(pattern);
				430	if (GetUTFCode(pattern) == 0)
				431	{
				432	done=MagickTrue;
				433	break;
				434	}
				435	}
				436	if ((GetUTFCode(expression) < c) \|\|
				437	(GetUTFCode(expression) > GetUTFCode(pattern)))
				438	{
				439	pattern+=GetUTFOctets(pattern);
				440	continue;
				441	}
				442	}
				443	else
				444	if (GetUTFCode(pattern) != GetUTFCode(expression))
				445	{
				446	pattern+=GetUTFOctets(pattern);
				447	continue;
				448	}
				449	pattern+=GetUTFOctets(pattern);
				450	while ((GetUTFCode(pattern) != ']') && (GetUTFCode(pattern) != 0))
				451	{
				452	if ((GetUTFCode(pattern) == '\\') &&
				453	(GetUTFCode(pattern+GetUTFOctets(pattern)) > 0))
				454	pattern+=GetUTFOctets(pattern);
				455	pattern+=GetUTFOctets(pattern);
				456	}
				457	if (GetUTFCode(pattern) != 0)
				458	{
				459	pattern+=GetUTFOctets(pattern);
				460	expression+=GetUTFOctets(expression);
				461	}
				462	break;
				463	}
				464	break;
				465	}
				466	case '?':
				467	{
				468	pattern+=GetUTFOctets(pattern);
				469	expression+=GetUTFOctets(expression);
				470	break;
				471	}
				472	case '{':
				473	{
				474	register const char
				475	*p;
				476
				477	pattern+=GetUTFOctets(pattern);
				478	while ((GetUTFCode(pattern) != '}') && (GetUTFCode(pattern) != 0))
				479	{
				480	p=expression;
				481	match=MagickTrue;
				482	while ((GetUTFCode(p) != 0) && (GetUTFCode(pattern) != 0) &&
				483	(GetUTFCode(pattern) != ',') && (GetUTFCode(pattern) != '}') &&
				484	(match != MagickFalse))
				485	{
				486	if (GetUTFCode(pattern) == '\\')
				487	pattern+=GetUTFOctets(pattern);
				488	match=(GetUTFCode(pattern) == GetUTFCode(p)) ? MagickTrue :
				489	MagickFalse;
				490	p+=GetUTFOctets(p);
				491	pattern+=GetUTFOctets(pattern);
				492	}
				493	if (GetUTFCode(pattern) == 0)
				494	{
				495	match=MagickFalse;
				496	done=MagickTrue;
				497	break;
				498	}
				499	else
				500	if (match != MagickFalse)
				501	{
				502	expression=p;
				503	while ((GetUTFCode(pattern) != '}') &&
				504	(GetUTFCode(pattern) != 0))
				505	{
				506	pattern+=GetUTFOctets(pattern);
				507	if (GetUTFCode(pattern) == '\\')
				508	{
				509	pattern+=GetUTFOctets(pattern);
				510	if (GetUTFCode(pattern) == '}')
				511	pattern+=GetUTFOctets(pattern);
				512	}
				513	}
				514	}
				515	else
				516	{
				517	while ((GetUTFCode(pattern) != '}') &&
				518	(GetUTFCode(pattern) != ',') &&
				519	(GetUTFCode(pattern) != 0))
				520	{
				521	pattern+=GetUTFOctets(pattern);
				522	if (GetUTFCode(pattern) == '\\')
				523	{
				524	pattern+=GetUTFOctets(pattern);
				525	if ((GetUTFCode(pattern) == '}') \|\|
				526	(GetUTFCode(pattern) == ','))
				527	pattern+=GetUTFOctets(pattern);
				528	}
				529	}
				530	}
				531	if (GetUTFCode(pattern) != 0)
				532	pattern+=GetUTFOctets(pattern);
				533	}
				534	break;
				535	}
				536	default:
				537	{
				538	if (case_insensitive != MagickFalse)
				539	{
				540	if (tolower((int) GetUTFCode(expression)) !=
				541	tolower((int) GetUTFCode(pattern)))
				542	{
				543	done=MagickTrue;
				544	break;
				545	}
				546	}
				547	else
				548	if (GetUTFCode(expression) != GetUTFCode(pattern))
				549	{
				550	done=MagickTrue;
				551	break;
				552	}
				553	expression+=GetUTFOctets(expression);
				554	pattern+=GetUTFOctets(pattern);
				555	}
				556	}
				557	}
				558	while (GetUTFCode(pattern) == '*')
				559	pattern+=GetUTFOctets(pattern);
				560	match=(GetUTFCode(expression) == 0) && (GetUTFCode(pattern) == 0) ?
				561	MagickTrue : MagickFalse;
				562	return(match);
				563	}
				564
				565	/*
				566	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				567	% %
				568	% %
				569	% %
				570	+ I s G l o b %
				571	% %
				572	% %
				573	% %
				574	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				575	%
				576	% IsGlob() returns MagickTrue if the path specification contains a globbing
				577	% pattern.
				578	%
				579	% The format of the IsGlob method is:
				580	%
				581	% MagickBooleanType IsGlob(const char *path)
				582	%
				583	% A description of each parameter follows:
				584	%
				585	% o path: the path.
				586	%
				587	*/
				588	MagickExport MagickBooleanType IsGlob(const char *path)
				589	{
				590	MagickBooleanType
				591	status;
				592
				593	if (IsPathAccessible(path) != MagickFalse)
				594	return(MagickFalse);
				595	status=(strchr(path,'') != (char ) NULL) \|\|
				596	(strchr(path,'?') != (char *) NULL) \|\|
				597	(strchr(path,'{') != (char *) NULL) \|\|
				598	(strchr(path,'}') != (char *) NULL) \|\|
				599	(strchr(path,'[') != (char *) NULL) \|\|
				600	(strchr(path,']') != (char *) NULL) ? MagickTrue : MagickFalse;
				601	return(status);
				602	}
				603
				604	/*
				605	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				606	% %
				607	% %
				608	% %
				609	% T o k e n i z e r %
				610	% %
				611	% %
				612	% %
				613	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
				614	%
				615	% Tokenizer() is a generalized, finite state token parser. It extracts tokens
				616	% one at a time from a string of characters. The characters used for white
				617	% space, for break characters, and for quotes can be specified. Also,
				618	% characters in the string can be preceded by a specifiable escape character
				619	% which removes any special meaning the character may have.
				620	%
				621	% Here is some terminology:
				622	%
				623	% o token: A single unit of information in the form of a group of
				624	% characters.
				625	%
				626	% o white space: Space that gets ignored (except within quotes or when
				627	% escaped), like blanks and tabs. In addition, white space terminates a
				628	% non-quoted token.
				629	%
				630	% o break set: One or more characters that separates non-quoted tokens.
				631	% Commas are a common break character. The usage of break characters to
				632	% signal the end of a token is the same as that of white space, except
				633	% multiple break characters with nothing or only white space between
				634	% generate a null token for each two break characters together.
				635	%
				636	% For example, if blank is set to be the white space and comma is set to
				637	% be the break character, the line
				638	%
				639	% A, B, C , , DEF
				640	%
				641	% ... consists of 5 tokens:
				642	%
				643	% 1) "A"
				644	% 2) "B"
				645	% 3) "C"
				646	% 4) "" (the null string)
				647	% 5) "DEF"
				648	%
				649	% o Quote character: A character that, when surrounding a group of other
				650	% characters, causes the group of characters to be treated as a single
				651	% token, no matter how many white spaces or break characters exist in
				652	% the group. Also, a token always terminates after the closing quote.
				653	% For example, if ' is the quote character, blank is white space, and
				654	% comma is the break character, the following string
				655	%
				656	% A, ' B, CD'EF GHI
				657	%
				658	% ... consists of 4 tokens:
				659	%
				660	% 1) "A"
				661	% 2) " B, CD" (note the blanks & comma)
				662	% 3) "EF"
				663	% 4) "GHI"
				664	%
				665	% The quote characters themselves do not appear in the resultant
				666	% tokens. The double quotes are delimiters i use here for
				667	% documentation purposes only.
				668	%
				669	% o Escape character: A character which itself is ignored but which
				670	% causes the next character to be used as is. ^ and \ are often used
				671	% as escape characters. An escape in the last position of the string
				672	% gets treated as a "normal" (i.e., non-quote, non-white, non-break,
				673	% and non-escape) character. For example, assume white space, break
				674	% character, and quote are the same as in the above examples, and
				675	% further, assume that ^ is the escape character. Then, in the string
				676	%
				677	% ABC, ' DEF ^' GH' I ^ J K^ L ^
				678	%
				679	% ... there are 7 tokens:
				680	%
				681	% 1) "ABC"
				682	% 2) " DEF ' GH"
				683	% 3) "I"
				684	% 4) " " (a lone blank)
				685	% 5) "J"
				686	% 6) "K L"
				687	% 7) "^" (passed as is at end of line)
				688	%
				689	% The format of the Tokenizer method is:
				690	%
				691	% int Tokenizer(TokenInfo *token_info,const unsigned flag,char *token,
				692	% const size_t max_token_length,const char *line,const char *white,
				693	% const char *break_set,const char *quote,const char escape,
				694	% char *breaker,int *next,char *quoted)
				695	%
				696	% A description of each parameter follows:
				697	%
				698	% o flag: right now, only the low order 3 bits are used.
				699	%
				700	% 1 => convert non-quoted tokens to upper case
				701	% 2 => convert non-quoted tokens to lower case
				702	% 0 => do not convert non-quoted tokens
				703	%
				704	% o token: a character string containing the returned next token
				705	%
				706	% o max_token_length: the maximum size of "token". Characters beyond
				707	% "max_token_length" are truncated.
				708	%
				709	% o line: the string to be parsed.
				710	%
				711	% o white: a string of the valid white spaces. example:
				712	%
				713	% char whitesp[]={" \t"};
				714	%
				715	% blank and tab will be valid white space.
				716	%
				717	% o break: a string of the valid break characters. example:
				718	%
				719	% char breakch[]={";,"};
				720	%
				721	% semicolon and comma will be valid break characters.
				722	%
				723	% o quote: a string of the valid quote characters. An example would be
				724	%
				725	% char quote[]={"'\""};
				726	%
				727	% (this causes single and double quotes to be valid) Note that a
				728	% token starting with one of these characters needs the same quote
				729	% character to terminate it.
				730	%
				731	% for example:
				732	%
				733	% "ABC '
				734	%
				735	% is unterminated, but
				736	%
				737	% "DEF" and 'GHI'
				738	%
				739	% are properly terminated. Note that different quote characters
				740	% can appear on the same line; only for a given token do the quote
				741	% characters have to be the same.
				742	%
				743	% o escape: the escape character (NOT a string ... only one
				744	% allowed). Use zero if none is desired.
				745	%
				746	% o breaker: the break character used to terminate the current
				747	% token. If the token was quoted, this will be the quote used. If
				748	% the token is the last one on the line, this will be zero.
				749	%
				750	% o next: this variable points to the first character of the
				751	% next token. it gets reset by "tokenizer" as it steps through the
				752	% string. Set it to 0 upon initialization, and leave it alone
				753	% after that. You can change it if you want to jump around in the
				754	% string or re-parse from the beginning, but be careful.
				755	%
				756	% o quoted: set to MagickTrue if the token was quoted and MagickFalse
				757	% if not. You may need this information (for example: in C, a
				758	% string with quotes around it is a character string, while one
				759	% without is an identifier).
				760	%
				761	% o result: 0 if we haven't reached EOS (end of string), and 1
				762	% if we have.
				763	%
				764	*/
				765
				/*
				  Tokenizer() scanner states.
				*/
				enum
				{
				  IN_WHITE = 0,  /* before a token: nothing stored yet */
				  IN_TOKEN = 1,  /* inside an unquoted token */
				  IN_QUOTE = 2,  /* inside a quoted token */
				  IN_OZONE = 3   /* token finished; skipping up to the next delimiter */
				};
				770
				/*
				  Return the index of the first occurrence of character `c` in `string`, or
				  -1 when it does not occur.  The terminating NUL is never matched.  A NULL
				  `string` is treated as an empty set so an omitted character set cannot
				  crash the tokenizer.
				*/
				static long sindex(int c,const char *string)
				{
				  register const char
				    *p;

				  if (string == (const char *) NULL)
				    return(-1);
				  for (p=string; *p != '\0'; p++)
				    if (c == (int) (*p))
				      return((long) (p-string));
				  return(-1);
				}
				781
				782	static void StoreToken(TokenInfo token_info,char string,
				783	size_t max_token_length,int c)
				784	{
				785	register long
				786	i;
				787
				788	if ((token_info->offset < 0) \|\|
				789	((size_t) token_info->offset >= (max_token_length-1)))
				790	return;
				791	i=token_info->offset++;
				792	string[i]=(char) c;
				793	if (token_info->state == IN_QUOTE)
				794	return;
				795	switch (token_info->flag & 0x03)
				796	{
				797	case 1:
				798	{
				799	string[i]=(char) toupper(c);
				800	break;
				801	}
				802	case 2:
				803	{
				804	string[i]=(char) tolower(c);
				805	break;
				806	}
				807	default:
				808	break;
				809	}
				810	}
				811
				812	MagickExport int Tokenizer(TokenInfo *token_info,const unsigned flag,
				813	char token,const size_t max_token_length,const char line,const char *white,
				814	const char break_set,const char quote,const char escape,char *breaker,
				815	int next,char quoted)
				816	{
				817	int
				818	c;
				819
				820	register long
				821	i;
				822
				823	*breaker='\0';
				824	*quoted='\0';
				825	if (line[*next] == '\0')
				826	return(1);
				827	token_info->state=IN_WHITE;
				828	token_info->quote=(char) MagickFalse;
				829	token_info->flag=flag;
				830	for (token_info->offset=0; (int) line[next] != 0; (next)++)
				831	{
				832	c=(int) line[*next];
				833	i=sindex(c,break_set);
				834	if (i >= 0)
				835	{
				836	switch (token_info->state)
				837	{
				838	case IN_WHITE:
				839	case IN_TOKEN:
				840	case IN_OZONE:
				841	{
				842	(*next)++;
				843	*breaker=break_set[i];
				844	token[token_info->offset]='\0';
				845	return(0);
				846	}
				847	case IN_QUOTE:
				848	{
				849	StoreToken(token_info,token,max_token_length,c);
				850	break;
				851	}
				852	}
				853	continue;
				854	}
				855	i=sindex(c,quote);
				856	if (i >= 0)
				857	{
				858	switch (token_info->state)
				859	{
				860	case IN_WHITE:
				861	{
				862	token_info->state=IN_QUOTE;
				863	token_info->quote=quote[i];
				864	*quoted=(char) MagickTrue;
				865	break;
				866	}
				867	case IN_QUOTE:
				868	{
				869	if (quote[i] != token_info->quote)
				870	StoreToken(token_info,token,max_token_length,c);
				871	else
				872	{
				873	token_info->state=IN_OZONE;
				874	token_info->quote='\0';
				875	}
				876	break;
				877	}
				878	case IN_TOKEN:
				879	case IN_OZONE:
				880	{
				881	*breaker=(char) c;
				882	token[token_info->offset]='\0';
				883	return(0);
				884	}
				885	}
				886	continue;
				887	}
				888	i=sindex(c,white);
				889	if (i >= 0)
				890	{
				891	switch (token_info->state)
				892	{
				893	case IN_WHITE:
				894	case IN_OZONE:
				895	break;
				896	case IN_TOKEN:
				897	{
				898	token_info->state=IN_OZONE;
				899	break;
				900	}
				901	case IN_QUOTE:
				902	{
				903	StoreToken(token_info,token,max_token_length,c);
				904	break;
				905	}
				906	}
				907	continue;
				908	}
				909	if (c == (int) escape)
				910	{
				911	if (line[(*next)+1] == '\0')
				912	{
				913	*breaker='\0';
				914	StoreToken(token_info,token,max_token_length,c);
				915	(*next)++;
				916	token[token_info->offset]='\0';
				917	return(0);
				918	}
				919	switch (token_info->state)
				920	{
				921	case IN_WHITE:
				922	{
				923	(*next)--;
				924	token_info->state=IN_TOKEN;
				925	break;
				926	}
				927	case IN_TOKEN:
				928	case IN_QUOTE:
				929	{
				930	(*next)++;
				931	c=(int) line[*next];
				932	StoreToken(token_info,token,max_token_length,c);
				933	break;
				934	}
				935	case IN_OZONE:
				936	{
				937	token[token_info->offset]='\0';
				938	return(0);
				939	}
				940	}
				941	continue;
				942	}
				943	switch (token_info->state)
				944	{
				945	case IN_WHITE:
				946	token_info->state=IN_TOKEN;
				947	case IN_TOKEN:
				948	case IN_QUOTE:
				949	{
				950	StoreToken(token_info,token,max_token_length,c);
				951	break;
				952	}
				953	case IN_OZONE:
				954	{
				955	token[token_info->offset]='\0';
				956	return(0);
				957	}
				958	}
				959	}
				960	token[token_info->offset]='\0';
				961	return(0);
				962	}