tools/wrc/parser.l - wine - Git at Google

 /* -*-C-*-
  *
  * Copyright 1998-2000	Bertho A. Stultiens (BS)
  *
  * This library is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * This library is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with this library; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
  *
  * History:
  * 21-May-2000 BS	- Fixed the ident requirement of resource names
  *			  which can be keywords.
  * 30-Apr-2000 BS	- Reintegration into the wine-tree
  * 11-Jan-2000 BS	- Very drastic cleanup because we don't have a
  *			  preprocessor in here anymore.
  * 02-Jan-2000 BS	- Removed the preprocessor code
  * 23-Dec-1999 BS	- Removed the copyright for Martin von Loewis.
  *			  There is really nothing left of his code in
  *			  this parser.
  * 20-Jun-1998 BS	- Changed the filename conversion. Filenames are
  *			  case-sensitive under *nix, but not under dos.
  *			  Default behaviour is to convert to lower case.
  *			- All backslashes are converted to forward and
  *			  both single and double slash is recognized as
  *			  MS/Borland does.
  *			- Fixed a bug in 'yywf' case that prevented
  *			  double quoted names to be scanned properly.
  *
  * 19-May-1998 BS	- Started to build a preprocessor.
  *			- Changed keyword processing completely to
  *			  table-lookups.
  *
  * 20-Apr-1998 BS	- Added ';' comment stripping
  *
  * 17-Apr-1998 BS	- Made the win32 keywords optional when compiling in
  *			  16bit mode
  *
  * 15-Apr-1998 BS	- Changed string handling to include escapes
  *			- Added unicode string handling (no codepage
  *			  translation though).
  *			- 'Borrowed' the main idea of string scanning from
  *			  the flex manual pages.
  *			- Added conditional handling of scanning depending
  *			  on the state of the parser. This was mainly required
  *			  to distinguish a file to load or raw data that
  *			  follows. MS's definition of filenames is rather
  *			  complex... It can be unquoted or double quoted. If
  *			  double quoted, then the '\\' char is not automatically
  *			  escaped according to Borland's rc compiler, but it
  *			  accepts both "\\path\\file.rc" and "\path\file.rc".
  *			  This makes life very hard! I go for the escaped
  *			  version, as this seems to be the documented way...
  *			- Single quoted strings are now parsed and converted
  *			  here.
  *			- Added comment stripping. The implementation is
  *			  'borrowed' from the flex manpages.
  *			- Rebuild string processing so that it may contain
  *			  escaped '\0'.
  */

 /* Exclusive string handling */
 %x tkstr
 /* Exclusive unicode string handling */
 %x tklstr
 /* Exclusive rcdata single quoted data handling */
 %x tkrcd
 /* Exclusive comment eating... */
 %x comment
 /* Set when stripping c-junk */
 %x pp_cstrip
 /* Set when scanning #line style directives */
 %x pp_line
 /* Set when scanning #pragma */
 %x pp_pragma
 %x pp_code_page

 %option stack
 %option noinput nounput noyy_top_state noyywrap
 %option 8bit never-interactive
 %option prefix="parser_"

 /* Some shortcut definitions */
 ws	[ \f\t\r]

 %{

 /*#define LEX_DEBUG*/

 #include "config.h"

 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <ctype.h>
 #include <assert.h>
 #include <errno.h>
 #include <limits.h>

 #ifdef HAVE_UNISTD_H
 #include <unistd.h>
 #else
 #define YY_NO_UNISTD_H
 #endif

 #include "wrc.h"
 #include "utils.h"
 #include "parser.h"
 #include "newstruc.h"

 #include "parser.tab.h"

 /* Always update the current character position within a line */
 #define YY_USER_ACTION	char_number+=yyleng; wanted_id = want_id; want_id = 0;

 #define YY_USER_INIT current_codepage = -1;

 static void addcchar(char c);
 static void addwchar(WCHAR s);
 static string_t *get_buffered_cstring(void);
 static string_t *get_buffered_wstring(void);
 static string_t *make_string(char *s);

 static char *cbuffer;		/* Buffers for string collection */
 static int cbufidx;
 static int cbufalloc = 0;
 static WCHAR *wbuffer;
 static int wbufidx;
 static int wbufalloc = 0;

 static int current_codepage = -1;  /* use language default */

 /*
  * This one is a bit tricky.
  * We set 'want_id' in the parser to get the first
  * identifier we get across in the scanner, but we
  * also want it to be reset at nearly any token we
  * see. Exceptions are:
  * - newlines
  * - comments
  * - whitespace
  *
  * The scanner will automatically reset 'want_id'
  * after *each* scanner reduction and puts its value
  * into the var below. In this way we can see the
  * state after the YY_RULE_SETUP (i.e. the user action;
  * see above) and don't have to worry too much when
  * it needs to be reset.
  */
 static int wanted_id = 0;
 static int save_wanted_id;	/* To save across comment reductions */

 /*
  * One row of the keyword lookup table that iskeyword() searches.
  */
 struct keyword {
 	const char	*keyword;	/* Keyword text; the sort/search key used by kw_cmp_func() */
 	int		token;		/* Token value the scanner returns for this keyword */
 	int		isextension;	/* Non-zero: iskeyword() only reports it when 'extensions' is set */
 	int		needcase;	/* Non-zero: kw_cmp_func() additionally requires an exact strcmp() match */
 	int		alwayskw;	/* Non-zero: returned as a keyword even when an identifier is wanted */
 };

 /*
  * Table of all resource-script keywords known to the scanner.
  * Columns: keyword text, token, isextension, needcase, alwayskw.
  *
  * The table is deliberately not const: iskeyword() sorts it in place
  * with qsort() on first use (see DO_SORT) so that it can be searched
  * with bsearch().
  */
 static struct keyword keywords[] = {
 	{ "ACCELERATORS",	tACCELERATORS,		0, 0, 0},
 	{ "ALT",		tALT,			0, 0, 0},
 	{ "ASCII",		tASCII,			0, 0, 0},
 	{ "AUTO3STATE",		tAUTO3STATE,		1, 0, 0},
 	{ "AUTOCHECKBOX",	tAUTOCHECKBOX,		1, 0, 0},
 	{ "AUTORADIOBUTTON",	tAUTORADIOBUTTON,	1, 0, 0},
 	{ "BEGIN",		tBEGIN,			0, 0, 0},
 	{ "BITMAP",		tBITMAP,		0, 0, 0},
 	{ "BLOCK",		tBLOCK,			0, 0, 0},
 	{ "BUTTON",		tBUTTON,		1, 0, 0},
 	{ "CAPTION",		tCAPTION,		0, 0, 0},
 	{ "CHARACTERISTICS",	tCHARACTERISTICS,	1, 0, 0},
 	{ "CHECKBOX",		tCHECKBOX,		0, 0, 0},
 	{ "CHECKED",		tCHECKED,		0, 0, 0},
 	{ "CLASS",		tCLASS,			0, 0, 0},
 	{ "COMBOBOX",		tCOMBOBOX,		0, 0, 0},
 	{ "CONTROL",		tCONTROL,		0, 0, 0},
 	{ "CTEXT",		tCTEXT,			0, 0, 0},
 	{ "CURSOR",		tCURSOR,		0, 0, 0},
 	{ "DEFPUSHBUTTON",	tDEFPUSHBUTTON,		0, 0, 0},
 	{ "DIALOG",		tDIALOG,		0, 0, 0},
 	{ "DIALOGEX",		tDIALOGEX,		1, 0, 0},
 	{ "DISCARDABLE",	tDISCARDABLE,		0, 0, 0},
 	{ "DLGINIT",		tDLGINIT,		0, 0, 0},
 	{ "EDITTEXT",		tEDITTEXT,		0, 0, 0},
 	{ "END",		tEND,			0, 0, 0},
 	{ "EXSTYLE",		tEXSTYLE,		0, 0, 0},
 	{ "FILEFLAGS",		tFILEFLAGS,		0, 0, 0},
 	{ "FILEFLAGSMASK",	tFILEFLAGSMASK,		0, 0, 0},
 	{ "FILEOS",		tFILEOS,		0, 0, 0},
 	{ "FILESUBTYPE",	tFILESUBTYPE,		0, 0, 0},
 	{ "FILETYPE",		tFILETYPE,		0, 0, 0},
 	{ "FILEVERSION",	tFILEVERSION,		0, 0, 0},
 	{ "FIXED",		tFIXED,			0, 0, 0},
 	{ "FONT",		tFONT,			0, 0, 0},
 	{ "FONTDIR",		tFONTDIR,		0, 0, 0},	/* This is a Borland BRC extension */
 	{ "GRAYED",		tGRAYED,		0, 0, 0},
 	{ "GROUPBOX",		tGROUPBOX,		0, 0, 0},
 	{ "HELP",		tHELP,			0, 0, 0},
 	{ "HTML",		tHTML,			0, 0, 0},
 	{ "ICON",		tICON,			0, 0, 0},
 	{ "IMPURE",		tIMPURE,		0, 0, 0},
 	{ "INACTIVE",		tINACTIVE,		0, 0, 0},
 	{ "LANGUAGE",		tLANGUAGE,		1, 0, 1},
 	{ "LISTBOX",		tLISTBOX,		0, 0, 0},
 	{ "LOADONCALL",		tLOADONCALL,		0, 0, 0},
 	{ "LTEXT",		tLTEXT,			0, 0, 0},
 	{ "MENU",		tMENU,			0, 0, 0},
 	{ "MENUBARBREAK",	tMENUBARBREAK,		0, 0, 0},
 	{ "MENUBREAK",		tMENUBREAK,		0, 0, 0},
 	{ "MENUEX",		tMENUEX,		1, 0, 0},
 	{ "MENUITEM",		tMENUITEM,		0, 0, 0},
 	{ "MESSAGETABLE",	tMESSAGETABLE,		1, 0, 0},
 	{ "MOVEABLE",		tMOVEABLE,		0, 0, 0},
 	{ "NOINVERT",		tNOINVERT,		0, 0, 0},
 	{ "NOT",		tNOT,			0, 0, 0},
 	{ "POPUP",		tPOPUP,			0, 0, 0},
 	{ "PRELOAD",		tPRELOAD,		0, 0, 0},
 	{ "PRODUCTVERSION",	tPRODUCTVERSION,	0, 0, 0},
 	{ "PURE",		tPURE,			0, 0, 0},
 	{ "PUSHBUTTON",		tPUSHBUTTON,		0, 0, 0},
 	{ "RADIOBUTTON",	tRADIOBUTTON,		0, 0, 0},
 	{ "RCDATA",		tRCDATA,		0, 0, 0},
 	{ "RTEXT",		tRTEXT,			0, 0, 0},
 	{ "SCROLLBAR",		tSCROLLBAR,		0, 0, 0},
 	{ "SEPARATOR",		tSEPARATOR,		0, 0, 0},
 	{ "SHIFT",		tSHIFT,			0, 0, 0},
 	{ "STATE3",		tSTATE3,		1, 0, 0},
 	{ "STRING",		tSTRING,		0, 0, 0},
 	{ "STRINGTABLE",	tSTRINGTABLE,		0, 0, 1},
 	{ "STYLE",		tSTYLE,			0, 0, 0},
 	{ "TOOLBAR",		tTOOLBAR,		1, 0, 0},
 	{ "VALUE",		tVALUE,			0, 0, 0},
 	{ "VERSION",		tVERSION,		1, 0, 0},
 	{ "VERSIONINFO",	tVERSIONINFO,		0, 0, 0},
 	{ "VIRTKEY",		tVIRTKEY,		0, 0, 0}
 };

 #define NKEYWORDS	(sizeof(keywords)/sizeof(keywords[0]))
 #define KWP(p)		((const struct keyword *)(p))
 static int kw_cmp_func(const void *s1, const void *s2)
 {
 	int ret;
 	ret = compare_striA(KWP(s1)->keyword, KWP(s2)->keyword);
 	if(!ret && (KWP(s1)->needcase || KWP(s2)->needcase))
 		return strcmp(KWP(s1)->keyword, KWP(s2)->keyword);
 	else
 		return ret;
 }

 #define KW_BSEARCH
 #define DO_SORT
 static struct keyword *iskeyword(char *kw)
 {
 	struct keyword *kwp;
 	struct keyword key;
 	key.keyword = kw;
 	key.needcase = 0;
 #ifdef DO_SORT
 	{
 		/* Make sure that it is sorted for bsearsh */
 		static int sorted = 0;
 		if(!sorted)
 		{
 			qsort(keywords, NKEYWORDS, sizeof(keywords[0]), kw_cmp_func);
 			sorted = 1;
 		}
 	}
 #endif
 #ifdef KW_BSEARCH
 	kwp = bsearch(&key, keywords, NKEYWORDS, sizeof(keywords[0]), kw_cmp_func);
 #else
 	{
 		int i;
 		for(i = 0; i < NKEYWORDS; i++)
 		{
 			if(!kw_cmp_func(&key, &keywords[i]))
 				break;
 		}
 		if(i < NKEYWORDS)
 			kwp = &keywords[i];
 		else
 			kwp = NULL;
 	}
 #endif

 	if(kwp == NULL || (kwp->isextension && !extensions))
 		return NULL;
 	else
 		return kwp;
 }

 /* converts an integer in string form to an unsigned long and prints an error
  * on overflow */
 static unsigned long xstrtoul(const char *nptr, char **endptr, int base)
 {
     unsigned long value;
     int overflowed;

     /* strtoul() only reports overflow through errno, so clear it first */
     errno = 0;
     value = strtoul(nptr, endptr, base);
     overflowed = (errno == ERANGE) && (value == ULONG_MAX);
     if (overflowed)
         parser_error("integer constant %s is too large", nptr);
     return value;
 }

 %}

 /*
  **************************************************************************
  * The flexer starts here
  **************************************************************************
  */
 %%
 	/*
 	 * Catch the GCC-style line statements here and parse them.
 	 * This has the advantage that you can #include at any
 	 * stage in the resource file.
 	 * The preprocessor generates line directives in the format:
 	 * # <linenum> "filename" <codes>
 	 *
 	 * Codes can be a sequence of:
 	 * - 1 start of new file
 	 * - 2 returning to previous
 	 * - 3 system header
 	 * - 4 interpret as C-code
 	 *
 	 * 4 is not used and 1 mutually excludes 2
 	 * Anyhow, we are not really interested in these at all
 	 * because we only want to know the linenumber and
 	 * filename.
 	 */
 <INITIAL,pp_cstrip>^{ws}*\#{ws}*pragma{ws}+	yy_push_state(pp_pragma);
 <INITIAL,pp_cstrip>^{ws}*\#{ws}*	yy_push_state(pp_line);
 <pp_line>[^\n]*	{
 		/*
 		 * yytext holds the remainder of a '# <linenum> "filename" <codes>'
 		 * line (everything after the '#' up to, but excluding, the newline).
 		 * Extract the line number and the filename; the codes are ignored.
 		 */
 		int lineno, len;
 		char *cptr;
 		char *fname;
 		yy_pop_state();	/* leave pp_line; BEGIN() below picks the final state */
 		lineno = (int)strtol(yytext, &cptr, 10);
 		/* A result of 0 covers both a literal 0 and text that is not a number */
 		if(!lineno)
 			parser_error("Malformed '#...' line-directive; invalid linenumber");
 		/* NOTE(review): the checks below dereference their pointer afterwards, so
 		 * they rely on parser_error() not returning - confirm */
 		fname = strchr(cptr, '"');
 		if(!fname)
 			parser_error("Malformed '#...' line-directive; missing filename");
 		fname++;	/* skip the opening quote */
 		cptr = strchr(fname, '"');
 		if(!cptr)
 			parser_error("Malformed '#...' line-directive; missing terminating \"");
 		*cptr = '\0';	/* cut yytext at the closing quote so fname is terminated */
 		line_number = lineno - 1;	/* We didn't read the newline */
 		/* NOTE(review): the previous input_name is not freed here; presumably it
 		 * may still be referenced elsewhere - verify before changing */
 		input_name = xstrdup(fname);
                 /* ignore contents of C include files: names ending in ".h"
                  * (compared case-insensitively) switch to the pp_cstrip state */
                 len = strlen(input_name);
                 if (len > 1 && !strcasecmp( input_name + len - 2, ".h" ))
                     BEGIN(pp_cstrip);
                 else
                     BEGIN(INITIAL);
 	}

 <pp_pragma>code_page[^\n]*	yyless(9); yy_pop_state(); yy_push_state(pp_code_page);
 <pp_pragma>[^\n]*		yy_pop_state(); if (pedantic) parser_warning("Unrecognized #pragma directive '%s'\n",yytext);

 <pp_code_page>\({ws}*default{ws}*\)[^\n]*	current_codepage = -1; yy_pop_state();
 <pp_code_page>\({ws}*utf8{ws}*\)[^\n]*		current_codepage = CP_UTF8; yy_pop_state();
 <pp_code_page>\({ws}*[0-9]+{ws}*\)[^\n]* {
         /* '#pragma code_page(<number>)': select a numeric codepage */
         char *p = yytext;
         yy_pop_state();
         /* Skip '(' and whitespace; the pattern guarantees a digit follows */
         while (*p < '0' || *p > '9') p++;
         current_codepage = strtol( p, NULL, 10 );
         /* CP_UTF8 is accepted without a table lookup */
         if (current_codepage != CP_UTF8 && !wine_cp_get_table( current_codepage ))
         {
             parser_error("Codepage %d not supported", current_codepage);
             /* NOTE(review): only reached if parser_error() returns; a codepage
              * of 0 is then rejected by get_buffered_cstring() for ANSI strings */
             current_codepage = 0;
         }
     }
 <pp_code_page>[^\n]*	yy_pop_state(); parser_error("Malformed #pragma code_page directive");

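 	/*
 	 * Skip the contents of C include files: while in the
 	 * pp_cstrip state every character is discarded and
 	 * only newlines are counted.
 	 * NOTE: nothing is stripped "until a ';'" here and
 	 * braces {} for structures, classes and enums are
 	 * not tracked.
 	 */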
 <pp_cstrip>\n			line_number++; char_number = 1;
 <pp_cstrip>.			; /* ignore */

 \{			return tBEGIN;
 \}			return tEND;

 [0-9]+[lL]?		{ parser_lval.num = xstrtoul(yytext,  0, 10);
                           return (yytext[yyleng-1] == 'L' || yytext[yyleng-1] == 'l') ? tLNUMBER : tNUMBER; }
 0[xX][0-9A-Fa-f]+[lL]?	{ parser_lval.num = xstrtoul(yytext,  0, 16);
                           return (yytext[yyleng-1] == 'L' || yytext[yyleng-1] == 'l') ? tLNUMBER : tNUMBER; }
 0[oO][0-7]+[lL]?	{ parser_lval.num = xstrtoul(yytext+2, 0, 8);
                           return (yytext[yyleng-1] == 'L' || yytext[yyleng-1] == 'l') ? tLNUMBER : tNUMBER; }

 [A-Za-z_0-9./\\]+	{
 				/*
 				 * Keyword or identifier. A keyword token is returned only
 				 * when the parser did not ask for an identifier (wanted_id)
 				 * or when the keyword is flagged 'alwayskw'; everything
 				 * else is handed over as tIDENT with a copy of the text.
 				 */
 				struct keyword *kwp = iskeyword(yytext);

 				if(kwp && (!wanted_id || kwp->alwayskw))
 					return kwp->token;

 				parser_lval.str = make_string(yytext);
 				return tIDENT;
 			}

 	/*
 	 * Wide string scanning
 	 */
 L\"			{
 				yy_push_state(tklstr);
 				wbufidx = 0;
 				if(!win32)
 					parser_warning("16bit resource contains unicode strings\n");
 			}
 <tklstr>\"{ws}+	|
 <tklstr>\"		{
 				yy_pop_state();
 				parser_lval.str = get_buffered_wstring();
 				return tSTRING;
 			}
 <tklstr>\\[0-7]{1,6}	{ /* octal escape sequence */
 				unsigned int result;
 				result = strtoul(yytext+1, 0, 8);
 				if ( result > 0xffff )
 					parser_error("Character constant out of range");
 				addwchar((WCHAR)result);
 			}
 <tklstr>\\x[0-9a-fA-F]{4} {  /* hex escape sequence */
 				unsigned int result;
 				result = strtoul(yytext+2, 0, 16);
 				addwchar((WCHAR)result);
 			}
 <tklstr>\\x[0-9a-fA-F]{1,3} {  parser_error("Invalid hex escape sequence '%s'", yytext); }

 <tklstr>\\[0-9]+	parser_error("Bad escape sequence");
 <tklstr>\\\n{ws}*	line_number++; char_number = 1; /* backslash at EOL continues string after leading whitespace on next line */
 <tklstr>\\a		addwchar('\a');
 <tklstr>\\b		addwchar('\b');
 <tklstr>\\f		addwchar('\f');
 <tklstr>\\n		addwchar('\n');
 <tklstr>\\r		addwchar('\r');
 <tklstr>\\t		addwchar('\t');
 <tklstr>\\v		addwchar('\v');
 <tklstr>\\.		{
 			    if (yytext[1] & 0x80)
                                 parser_error("Invalid char %u in wide string", (unsigned char)yytext[1]);
 			    addwchar(yytext[1]);
 			}
 <tklstr>\\\r\n		addwchar(yytext[2]); line_number++; char_number = 1;
 <tklstr>\"\"		addwchar('\"');		/* "bla""bla"  -> "bla\"bla" */
 <tklstr>\\\"\"		addwchar('\"');		/* "bla\""bla" -> "bla\"bla" */
 <tklstr>\"{ws}+\"	;			/* "bla" "bla" -> "blabla" */
 <tklstr>[^\\\n\"]+	{
 				char *yptr = yytext;
 				while(*yptr)	/* FIXME: codepage translation */
                                 {
                                     if (*yptr & 0x80)
                                         parser_error("Invalid char %u in wide string", (unsigned char)*yptr);
                                     addwchar(*yptr++ & 0xff);
                                 }
 			}
 <tklstr>\n		parser_error("Unterminated string");

 	/*
 	 * Normal string scanning
 	 */
 \"			yy_push_state(tkstr); cbufidx = 0;
 <tkstr>\"{ws}+	|
 <tkstr>\"		{
 				yy_pop_state();
 				parser_lval.str = get_buffered_cstring();
 				return tSTRING;
 			}
 <tkstr>\\[0-7]{1,3}	{ /* octal escape sequence */
 				int result;
 				result = strtol(yytext+1, 0, 8);
 				if ( result > 0xff )
 					parser_error("Character constant out of range");
 				addcchar((char)result);
 			}
 <tkstr>\\x[0-9a-fA-F]{2} {  /* hex escape sequence */
 				int result;
 				result = strtol(yytext+2, 0, 16);
 				addcchar((char)result);
 			}
 <tkstr>\\x[0-9a-fA-F]	{  parser_error("Invalid hex escape sequence '%s'", yytext); }

 <tkstr>\\[0-9]+		parser_error("Bad escape sequence");
 <tkstr>\\\n{ws}*	line_number++; char_number = 1; /* backslash at EOL continues string after leading whitespace on next line */
 <tkstr>\\a		addcchar('\a');
 <tkstr>\\b		addcchar('\b');
 <tkstr>\\f		addcchar('\f');
 <tkstr>\\n		addcchar('\n');
 <tkstr>\\r		addcchar('\r');
 <tkstr>\\t		addcchar('\t');
 <tkstr>\\v		addcchar('\v');
 <tkstr>\\.		addcchar(yytext[1]);
 <tkstr>\\\r\n		addcchar(yytext[2]); line_number++; char_number = 1;
 <tkstr>[^\\\n\"]+	{
 				char *yptr = yytext;
 				while(*yptr)
 					addcchar(*yptr++);
 			}
 <tkstr>\"\"		addcchar('\"');		/* "bla""bla"   -> "bla\"bla" */
 <tkstr>\\\"\"		addcchar('\"');		/* "bla\""bla"  -> "bla\"bla" */
 <tkstr>\"{ws}+\"	;			/* "bla" "bla"  -> "blabla" */
 <tkstr>\n		parser_error("Unterminated string");

 	/*
 	 * Raw data scanning
 	 */
 \'			yy_push_state(tkrcd); cbufidx = 0;
 <tkrcd>\'		{
 				/* Closing quote: hand the collected bytes to the parser as raw data */
 				yy_pop_state();
 				parser_lval.raw = new_raw_data();
 				parser_lval.raw->size = cbufidx;
 				parser_lval.raw->data = xmalloc(parser_lval.raw->size);
 				/*
 				 * cbuffer is still NULL when no byte has ever been collected
 				 * (e.g. '' before any other string). memcpy() must not be
 				 * given a null pointer, not even for a zero-length copy.
 				 */
 				if(cbufidx)
 					memcpy(parser_lval.raw->data, cbuffer, parser_lval.raw->size);
 				return tRAWDATA;
 			}
 <tkrcd>[0-9a-fA-F]{2}	{
 				int result;
 				result = strtol(yytext, 0, 16);
 				addcchar((char)result);
 			}
 <tkrcd>{ws}+		;	/* Ignore space */
 <tkrcd>\n		line_number++; char_number = 1;
 <tkrcd>.		parser_error("Malformed data-line");

 	/*
 	 * Comment stripping
 	 * Should never occur after preprocessing
 	 */
 <INITIAL,pp_cstrip>"/*"	{
 				yy_push_state(comment);
 				save_wanted_id = wanted_id;
 				if(!no_preprocess)
 					parser_warning("Found comments after preprocessing, please report\n");
 			}
 <comment>[^*\n]*	;
 <comment>"*"+[^*/\n]*	;
 <comment>\n		line_number++; char_number = 1;
 <comment>"*"+"/"	yy_pop_state(); want_id = save_wanted_id;

 ;[^\n]*			want_id = wanted_id; /* not really comment, but left-over c-junk */
 "//"[^\n]*		want_id = wanted_id; if(!no_preprocess) parser_warning("Found comments after preprocessing, please report\n");

 \n			{
 				want_id = wanted_id;
 				line_number++;
 				char_number = 1;
 				if(want_nl)
 				{
 					want_nl = 0;
 					return tNL;
 				}
 			}
 {ws}+			want_id = wanted_id;	/* Eat whitespace */

 <INITIAL>[ -~]		return yytext[0];

 <*>.|\n			{
 				/* Catch all rule to find any unmatched text */
 				/*
 				 * Work on an unsigned copy of the character: a plain 'char'
 				 * with the high bit set would be sign-extended when passed
 				 * to "%02x" and print as 0xffffffXX.
 				 */
 				unsigned char ch = (unsigned char)*yytext;

 				if(ch == '\n')
 				{
 					line_number++;
 					char_number = 1;
 				}
 				parser_error("Unmatched text '%c' (0x%02x) YY_START=%d",
                                              isprint(ch) ? ch : '.', ch, YY_START);
 			}

 %%

 /* These dup functions copy the enclosed '\0' from
  * the resource string.
  */
 /*
  * Append one character to the narrow string collection buffer,
  * enlarging the buffer by 1024 characters whenever it is full.
  */
 static void addcchar(char c)
 {
 	if(cbufidx < cbufalloc)
 	{
 		/* Room left: just store the character */
 		cbuffer[cbufidx++] = c;
 		return;
 	}

 	cbufalloc += 1024;
 	cbuffer = xrealloc(cbuffer, cbufalloc * sizeof(cbuffer[0]));
 	if(cbufalloc > 65536)
 		parser_warning("Reallocating string buffer larger than 64kB\n");
 	cbuffer[cbufidx++] = c;
 }

 /*
  * Append one wide character to the wide string collection buffer,
  * enlarging the buffer by 1024 elements whenever it is full.
  */
 static void addwchar(WCHAR s)
 {
 	if(wbufidx < wbufalloc)
 	{
 		/* Room left: just store the character */
 		wbuffer[wbufidx++] = s;
 		return;
 	}

 	wbufalloc += 1024;
 	wbuffer = xrealloc(wbuffer, wbufalloc * sizeof(wbuffer[0]));
 	if(wbufalloc > 65536)
 		parser_warning("Reallocating wide string buffer larger than 64kB\n");
 	wbuffer[wbufidx++] = s;
 }

 /*
  * Turn the characters collected in cbuffer (cbufidx of them, embedded
  * '\0' included) into a newly allocated string_t.
  *
  * The string is returned as str_char when no explicit codepage is in
  * effect (current_codepage is -1 or 0) or when not compiling for win32.
  * Otherwise it is converted to str_unicode with convert_string() using
  * current_codepage, the narrow copy is freed and the converted string
  * is returned.
  */
 static string_t *get_buffered_cstring(void)
 {
     string_t *str = new_string();

     str->size = cbufidx;
     str->type = str_char;
     str->str.cstr = xmalloc(cbufidx+1);
     /* cbuffer is still NULL if no character has ever been collected (e.g.
      * the very first string is ""); memcpy() must not be given a null
      * pointer, not even for a zero-length copy */
     if (cbufidx)
         memcpy(str->str.cstr, cbuffer, cbufidx);
     str->str.cstr[cbufidx] = '\0';

     if (!current_codepage || current_codepage == -1 || !win32)  /* store as ANSI string */
     {
         /* codepage 0 is what the code_page pragma rule leaves behind after
          * reporting an unsupported codepage */
         if (!current_codepage) parser_error("Codepage set to Unicode only, cannot use ASCII string here");
         return str;
     }
     else  /* convert to Unicode before storing */
     {
         string_t *str_w = convert_string( str, str_unicode, current_codepage );
         if (!check_unicode_conversion( str, str_w, current_codepage ))
             parser_error("String %s does not convert identically to Unicode and back in codepage %d. "
                     "Try using a Unicode string instead", str->str.cstr, current_codepage );
         if (check_valid_utf8( str, current_codepage ))
             parser_warning( "string \"%s\" seems to be UTF-8 but codepage %u is in use.\n",
                             str->str.cstr, current_codepage );
         free_string( str );
         return str_w;
     }
 }

 /*
  * Turn the wide characters collected in wbuffer (wbufidx of them,
  * embedded zeros included) into a newly allocated, zero-terminated
  * str_unicode string_t.
  */
 static string_t *get_buffered_wstring(void)
 {
 	string_t *str = new_string();
 	str->size = wbufidx;
 	str->type = str_unicode;
 	str->str.wstr = xmalloc((wbufidx+1)*sizeof(WCHAR));
 	/* wbuffer is still NULL if no wide character has ever been collected
 	 * (e.g. the very first wide string is L""); memcpy() must not be given
 	 * a null pointer, not even for a zero-length copy */
 	if(wbufidx)
 		memcpy(str->str.wstr, wbuffer, wbufidx*sizeof(WCHAR));
 	str->str.wstr[wbufidx] = 0;
 	return str;
 }

 /*
  * Wrap a copy of the zero-terminated string 's' in a newly allocated
  * str_char string_t. The recorded size excludes the terminator.
  */
 static string_t *make_string(char *s)
 {
 	string_t *result = new_string();

 	result->type = str_char;
 	result->size = strlen(s);
 	result->str.cstr = xmalloc(result->size + 1);
 	/* size + 1 so that the terminating '\0' is copied as well */
 	memcpy(result->str.cstr, s, result->size + 1);
 	return result;
 }
	/* --C--
	*
	* Copyright 1998-2000 Bertho A. Stultiens (BS)
	*
	* This library is free software; you can redistribute it and/or
	* modify it under the terms of the GNU Lesser General Public
	* License as published by the Free Software Foundation; either
	* version 2.1 of the License, or (at your option) any later version.
	*
	* This library is distributed in the hope that it will be useful,
	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	* Lesser General Public License for more details.
	*
	* You should have received a copy of the GNU Lesser General Public
	* License along with this library; if not, write to the Free Software
	* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
	*
	* History:
	* 21-May-2000 BS - Fixed the ident requirement of resource names
	* which can be keywords.
	* 30-Apr-2000 BS - Reintegration into the wine-tree
	* 11-Jan-2000 BS - Very drastic cleanup because we don't have a
	* preprocessor in here anymore.
	* 02-Jan-2000 BS - Removed the preprocessor code
	* 23-Dec-1999 BS - Removed the copyright for Martin von Loewis.
	* There is really nothing left of his code in
	* this parser.
	* 20-Jun-1998 BS - Changed the filename conversion. Filenames are
	* case-sensitive inder *nix, but not under dos.
	* default behaviour is to convert to lower case.
	* - All backslashes are converted to forward and
	* both single and double slash is recognized as
	* MS/Borland does.
	* - Fixed a bug in 'yywf' case that prevented
	* double quoted names to be scanned properly.
	*
	* 19-May-1998 BS - Started to build a preprocessor.
	* - Changed keyword processing completely to
	* table-lookups.
	*
	* 20-Apr-1998 BS - Added ';' comment stripping
	*
	* 17-Apr-1998 BS - Made the win32 keywords optional when compiling in
	* 16bit mode
	*
	* 15-Apr-1998 BS - Changed string handling to include escapes
	* - Added unicode string handling (no codepage
	* translation though).
	* - 'Borrowed' the main idea of string scanning from
	* the flex manual pages.
	* - Added conditional handling of scanning depending
	* on the state of the parser. This was mainly required
	* to distinguish a file to load or raw data that
	* follows. MS's definition of filenames is rather
	* complex... It can be unquoted or double quoted. If
	* double quoted, then the '\\' char is not automatically
	* escaped according to Borland's rc compiler, but it
	* accepts both "\\path\\file.rc" and "\path\file.rc".
	* This makes life very hard! I go for the escaped
	* version, as this seems to be the documented way...
	* - Single quoted strings are now parsed and converted
	* here.
	* - Added comment stripping. The implementation is
	* 'borrowed' from the flex manpages.
	* - Rebuild string processing so that it may contain
	* escaped '\0'.
	*/

	/* Exclusive string handling */
	%x tkstr
	/* Exclusive unicode string handling */
	%x tklstr
	/* Exclusive rcdata single quoted data handling */
	%x tkrcd
	/* Exclusive comment eating... */
	%x comment
	/* Set when stripping c-junk */
	%x pp_cstrip
	/* Set when scanning #line style directives */
	%x pp_line
	/* Set when scanning #pragma */
	%x pp_pragma
	%x pp_code_page

	%option stack
	%option noinput nounput noyy_top_state noyywrap
	%option 8bit never-interactive
	%option prefix="parser_"

	/* Some shortcut definitions */
	ws [ \f\t\r]

	%{

	/#define LEX_DEBUG/

	#include "config.h"

	#include <stdio.h>
	#include <stdlib.h>
	#include <string.h>
	#include <ctype.h>
	#include <assert.h>
	#include <errno.h>
	#include <limits.h>

	#ifdef HAVE_UNISTD_H
	#include <unistd.h>
	#else
	#define YY_NO_UNISTD_H
	#endif

	#include "wrc.h"
	#include "utils.h"
	#include "parser.h"
	#include "newstruc.h"

	#include "parser.tab.h"

	/* Always update the current character position within a line */
	#define YY_USER_ACTION char_number+=yyleng; wanted_id = want_id; want_id = 0;

	#define YY_USER_INIT current_codepage = -1;

	static void addcchar(char c);
	static void addwchar(WCHAR s);
	static string_t *get_buffered_cstring(void);
	static string_t *get_buffered_wstring(void);
	static string_t make_string(char s);

	static char cbuffer; / Buffers for string collection */
	static int cbufidx;
	static int cbufalloc = 0;
	static WCHAR *wbuffer;
	static int wbufidx;
	static int wbufalloc = 0;

	static int current_codepage = -1; /* use language default */

	/*
	* This one is a bit tricky.
	* We set 'want_id' in the parser to get the first
	* identifier we get across in the scanner, but we
	* also want it to be reset at nearly any token we
	* see. Exceptions are:
	* - newlines
	* - comments
	* - whitespace
	*
	* The scanner will automatically reset 'want_id'
	* after each scanner reduction and puts is value
	* into the var below. In this way we can see the
	* state after the YY_RULE_SETUP (i.e. the user action;
	* see above) and don't have to worry too much when
	* it needs to be reset.
	*/
	static int wanted_id = 0;
	static int save_wanted_id; /* To save across comment reductions */

	struct keyword {
	const char *keyword;
	int token;
	int isextension;
	int needcase;
	int alwayskw;
	};

	static struct keyword keywords[] = {
	{ "ACCELERATORS", tACCELERATORS, 0, 0, 0},
	{ "ALT", tALT, 0, 0, 0},
	{ "ASCII", tASCII, 0, 0, 0},
	{ "AUTO3STATE", tAUTO3STATE, 1, 0, 0},
	{ "AUTOCHECKBOX", tAUTOCHECKBOX, 1, 0, 0},
	{ "AUTORADIOBUTTON", tAUTORADIOBUTTON, 1, 0, 0},
	{ "BEGIN", tBEGIN, 0, 0, 0},
	{ "BITMAP", tBITMAP, 0, 0, 0},
	{ "BLOCK", tBLOCK, 0, 0, 0},
	{ "BUTTON", tBUTTON, 1, 0, 0},
	{ "CAPTION", tCAPTION, 0, 0, 0},
	{ "CHARACTERISTICS", tCHARACTERISTICS, 1, 0, 0},
	{ "CHECKBOX", tCHECKBOX, 0, 0, 0},
	{ "CHECKED", tCHECKED, 0, 0, 0},
	{ "CLASS", tCLASS, 0, 0, 0},
	{ "COMBOBOX", tCOMBOBOX, 0, 0, 0},
	{ "CONTROL", tCONTROL, 0, 0, 0},
	{ "CTEXT", tCTEXT, 0, 0, 0},
	{ "CURSOR", tCURSOR, 0, 0, 0},
	{ "DEFPUSHBUTTON", tDEFPUSHBUTTON, 0, 0, 0},
	{ "DIALOG", tDIALOG, 0, 0, 0},
	{ "DIALOGEX", tDIALOGEX, 1, 0, 0},
	{ "DISCARDABLE", tDISCARDABLE, 0, 0, 0},
	{ "DLGINIT", tDLGINIT, 0, 0, 0},
	{ "EDITTEXT", tEDITTEXT, 0, 0, 0},
	{ "END", tEND, 0, 0, 0},
	{ "EXSTYLE", tEXSTYLE, 0, 0, 0},
	{ "FILEFLAGS", tFILEFLAGS, 0, 0, 0},
	{ "FILEFLAGSMASK", tFILEFLAGSMASK, 0, 0, 0},
	{ "FILEOS", tFILEOS, 0, 0, 0},
	{ "FILESUBTYPE", tFILESUBTYPE, 0, 0, 0},
	{ "FILETYPE", tFILETYPE, 0, 0, 0},
	{ "FILEVERSION", tFILEVERSION, 0, 0, 0},
	{ "FIXED", tFIXED, 0, 0, 0},
	{ "FONT", tFONT, 0, 0, 0},
	{ "FONTDIR", tFONTDIR, 0, 0, 0}, /* This is a Borland BRC extension */
	{ "GRAYED", tGRAYED, 0, 0, 0},
	{ "GROUPBOX", tGROUPBOX, 0, 0, 0},
	{ "HELP", tHELP, 0, 0, 0},
	{ "HTML", tHTML, 0, 0, 0},
	{ "ICON", tICON, 0, 0, 0},
	{ "IMPURE", tIMPURE, 0, 0, 0},
	{ "INACTIVE", tINACTIVE, 0, 0, 0},
	{ "LANGUAGE", tLANGUAGE, 1, 0, 1},
	{ "LISTBOX", tLISTBOX, 0, 0, 0},
	{ "LOADONCALL", tLOADONCALL, 0, 0, 0},
	{ "LTEXT", tLTEXT, 0, 0, 0},
	{ "MENU", tMENU, 0, 0, 0},
	{ "MENUBARBREAK", tMENUBARBREAK, 0, 0, 0},
	{ "MENUBREAK", tMENUBREAK, 0, 0, 0},
	{ "MENUEX", tMENUEX, 1, 0, 0},
	{ "MENUITEM", tMENUITEM, 0, 0, 0},
	{ "MESSAGETABLE", tMESSAGETABLE, 1, 0, 0},
	{ "MOVEABLE", tMOVEABLE, 0, 0, 0},
	{ "NOINVERT", tNOINVERT, 0, 0, 0},
	{ "NOT", tNOT, 0, 0, 0},
	{ "POPUP", tPOPUP, 0, 0, 0},
	{ "PRELOAD", tPRELOAD, 0, 0, 0},
	{ "PRODUCTVERSION", tPRODUCTVERSION, 0, 0, 0},
	{ "PURE", tPURE, 0, 0, 0},
	{ "PUSHBUTTON", tPUSHBUTTON, 0, 0, 0},
	{ "RADIOBUTTON", tRADIOBUTTON, 0, 0, 0},
	{ "RCDATA", tRCDATA, 0, 0, 0},
	{ "RTEXT", tRTEXT, 0, 0, 0},
	{ "SCROLLBAR", tSCROLLBAR, 0, 0, 0},
	{ "SEPARATOR", tSEPARATOR, 0, 0, 0},
	{ "SHIFT", tSHIFT, 0, 0, 0},
	{ "STATE3", tSTATE3, 1, 0, 0},
	{ "STRING", tSTRING, 0, 0, 0},
	{ "STRINGTABLE", tSTRINGTABLE, 0, 0, 1},
	{ "STYLE", tSTYLE, 0, 0, 0},
	{ "TOOLBAR", tTOOLBAR, 1, 0, 0},
	{ "VALUE", tVALUE, 0, 0, 0},
	{ "VERSION", tVERSION, 1, 0, 0},
	{ "VERSIONINFO", tVERSIONINFO, 0, 0, 0},
	{ "VIRTKEY", tVIRTKEY, 0, 0, 0}
	};

	#define NKEYWORDS (sizeof(keywords)/sizeof(keywords[0]))
	#define KWP(p) ((const struct keyword *)(p))
	static int kw_cmp_func(const void s1, const void s2)
	{
	int ret;
	ret = compare_striA(KWP(s1)->keyword, KWP(s2)->keyword);
	if(!ret && (KWP(s1)->needcase \|\| KWP(s2)->needcase))
	return strcmp(KWP(s1)->keyword, KWP(s2)->keyword);
	else
	return ret;
	}

	#define KW_BSEARCH
	#define DO_SORT
	static struct keyword iskeyword(char kw)
	{
	struct keyword *kwp;
	struct keyword key;
	key.keyword = kw;
	key.needcase = 0;
	#ifdef DO_SORT
	{
	/* Make sure that it is sorted for bsearsh */
	static int sorted = 0;
	if(!sorted)
	{
	qsort(keywords, NKEYWORDS, sizeof(keywords[0]), kw_cmp_func);
	sorted = 1;
	}
	}
	#endif
	#ifdef KW_BSEARCH
	kwp = bsearch(&key, keywords, NKEYWORDS, sizeof(keywords[0]), kw_cmp_func);
	#else
	{
	int i;
	for(i = 0; i < NKEYWORDS; i++)
	{
	if(!kw_cmp_func(&key, &keywords[i]))
	break;
	}
	if(i < NKEYWORDS)
	kwp = &keywords[i];
	else
	kwp = NULL;
	}
	#endif

	if(kwp == NULL \|\| (kwp->isextension && !extensions))
	return NULL;
	else
	return kwp;
	}

	/* converts an integer in string form to an unsigned long and prints an error
	* on overflow */
	static unsigned long xstrtoul(const char nptr, char *endptr, int base)
	{
	unsigned long l;

	errno = 0;
	l = strtoul(nptr, endptr, base);
	if (l == ULONG_MAX && errno == ERANGE)
	parser_error("integer constant %s is too large", nptr);
	return l;
	}

	%}

	/*
	**************************************************************************
	* The flexer starts here
	**************************************************************************
	*/
	%%
	/*
	* Catch the GCC-style line statements here and parse them.
	* This has the advantage that you can #include at any
	* stage in the resource file.
	* The preprocessor generates line directives in the format:
	* # <linenum> "filename" <codes>
	*
	* Codes can be a sequence of:
	* - 1 start of new file
	* - 2 returning to previous
	* - 3 system header
	* - 4 interpret as C-code
	*
	* 4 is not used and 1 mutually excludes 2
	* Anyhow, we are not really interested in these at all
	* because we only want to know the linenumber and
	* filename.
	*/
	<INITIAL,pp_cstrip>^{ws}*\#{ws}*pragma{ws}+	yy_push_state(pp_pragma);	/* "#pragma": the rest of the line is scanned in pp_pragma */
	<INITIAL,pp_cstrip>^{ws}*\#{ws}*	yy_push_state(pp_line);	/* any other '#' line: the rest is scanned in pp_line */
	<pp_line>[^\n]*	{
			/*
			 * yytext holds the remainder of the directive:
			 *   <linenum> "filename" <codes>
			 * Only the line number and the filename are used.
			 * NOTE(review): the NULL checks below are followed by uses of
			 * the checked pointer, so this presumably relies on
			 * parser_error() not returning - confirm.
			 */
			int lineno, len;
			char *cptr;
			char *fname;
			yy_pop_state();
			lineno = (int)strtol(yytext, &cptr, 10);
			if(!lineno)
				parser_error("Malformed '#...' line-directive; invalid linenumber");
			fname = strchr(cptr, '"');
			if(!fname)
				parser_error("Malformed '#...' line-directive; missing filename");
			fname++;	/* step over the opening quote */
			cptr = strchr(fname, '"');
			if(!cptr)
				parser_error("Malformed '#...' line-directive; missing terminating \"");
			*cptr = '\0';	/* cut the name at the closing quote */
			line_number = lineno - 1;	/* We didn't read the newline */
			input_name = xstrdup(fname);
			/* ignore contents of C include files */
			len = strlen(input_name);
			if (len > 1 && !strcasecmp( input_name + len - 2, ".h" ))
				BEGIN(pp_cstrip);
			else
				BEGIN(INITIAL);
		}

	<pp_pragma>code_page[^\n]*	yyless(9); yy_pop_state(); yy_push_state(pp_code_page);	/* keep only "code_page" (9 chars); the rest is rescanned in pp_code_page */
	<pp_pragma>[^\n]*	yy_pop_state(); if (pedantic) parser_warning("Unrecognized #pragma directive '%s'\n",yytext);

	<pp_code_page>\({ws}*default{ws}*\)[^\n]*	current_codepage = -1; yy_pop_state();
	<pp_code_page>\({ws}*utf8{ws}*\)[^\n]*	current_codepage = CP_UTF8; yy_pop_state();
	<pp_code_page>\({ws}*[0-9]+{ws}*\)[^\n]*	{
			char *p = yytext;
			yy_pop_state();
			/* Skip '(' and any whitespace; the pattern guarantees a digit follows */
			while (*p < '0' || *p > '9') p++;
			current_codepage = strtol( p, NULL, 10 );
			if (current_codepage != CP_UTF8 && !wine_cp_get_table( current_codepage ))
			{
				parser_error("Codepage %d not supported", current_codepage);
				current_codepage = 0;
			}
		}
	<pp_code_page>[^\n]*	yy_pop_state(); parser_error("Malformed #pragma code_page directive");

	/*
	* While the scanner is in the pp_cstrip state every character is
	* discarded; newlines still advance line_number and reset
	* char_number.
	* NOTE(review): this comment used to say "Strip everything until a
	* ';' taking into account braces {} for structures, classes and
	* enums", but the two rules below neither look for ';' nor track
	* braces.
	*/
	<pp_cstrip>\n line_number++; char_number = 1;
	<pp_cstrip>. ; /* ignore */

	\{ return tBEGIN; /* a literal '{' is returned as the tBEGIN token */
	\} return tEND; /* a literal '}' is returned as the tEND token */

	[0-9]+[lL]?	{
			/* Decimal constant; a trailing 'l'/'L' selects tLNUMBER instead of tNUMBER */
			parser_lval.num = xstrtoul(yytext, 0, 10);
			return (yytext[yyleng-1] == 'L' || yytext[yyleng-1] == 'l') ? tLNUMBER : tNUMBER;
		}
	0[xX][0-9A-Fa-f]+[lL]?	{
			/* Hexadecimal constant; the whole text including "0x" is passed to the base-16 conversion */
			parser_lval.num = xstrtoul(yytext, 0, 16);
			return (yytext[yyleng-1] == 'L' || yytext[yyleng-1] == 'l') ? tLNUMBER : tNUMBER;
		}
	0[oO][0-7]+[lL]?	{
			/* Octal constant; the two-character "0o" prefix is skipped before conversion */
			parser_lval.num = xstrtoul(yytext+2, 0, 8);
			return (yytext[yyleng-1] == 'L' || yytext[yyleng-1] == 'l') ? tLNUMBER : tNUMBER;
		}

	[A-Za-z_0-9./\\]+	{
			struct keyword *kw = iskeyword(yytext);

			/*
			 * The keyword token is returned only for a recognised
			 * keyword that is either flagged alwayskw or seen while no
			 * identifier is wanted.  Everything else is handed back as
			 * an identifier carrying a copy of the matched text.
			 */
			if(kw && (!wanted_id || kw->alwayskw))
				return kw->token;

			parser_lval.str = make_string(yytext);
			return tIDENT;
		}

	/*
	* Wide string scanning
	*/
	L\"	{
			/* L" opens a wide string: scan it in tklstr with an empty wide buffer */
			yy_push_state(tklstr);
			wbufidx = 0;
			if(!win32)
				parser_warning("16bit resource contains unicode strings\n");
		}
	<tklstr>\"{ws}+	|
	<tklstr>\"	{
			/* Closing quote, optionally followed by whitespace: return the buffered text */
			yy_pop_state();
			parser_lval.str = get_buffered_wstring();
			return tSTRING;
		}
	<tklstr>\\[0-7]{1,6}	{ /* octal escape sequence */
			unsigned int result;
			result = strtoul(yytext+1, 0, 8);
			if ( result > 0xffff )
				parser_error("Character constant out of range");
			addwchar((WCHAR)result);
		}
	<tklstr>\\x[0-9a-fA-F]{4}	{ /* hex escape sequence */
			unsigned int result;
			result = strtoul(yytext+2, 0, 16);
			addwchar((WCHAR)result);
		}
	<tklstr>\\x[0-9a-fA-F]{1,3}	{ parser_error("Invalid hex escape sequence '%s'", yytext); }

	<tklstr>\\[0-9]+	parser_error("Bad escape sequence");
	<tklstr>\\\n{ws}*	line_number++; char_number = 1; /* backslash at EOL continues string after leading whitespace on next line */
	<tklstr>\\a	addwchar('\a');
	<tklstr>\\b	addwchar('\b');
	<tklstr>\\f	addwchar('\f');
	<tklstr>\\n	addwchar('\n');
	<tklstr>\\r	addwchar('\r');
	<tklstr>\\t	addwchar('\t');
	<tklstr>\\v	addwchar('\v');
	<tklstr>\\.	{
			/* Any other escaped character is taken literally; bytes with the high bit set are rejected */
			if (yytext[1] & 0x80)
				parser_error("Invalid char %u in wide string", (unsigned char)yytext[1]);
			addwchar(yytext[1]);
		}
	<tklstr>\\\r\n	addwchar(yytext[2]); line_number++; char_number = 1;
	<tklstr>\"\"	addwchar('\"'); /* "bla""bla" -> "bla\"bla" */
	<tklstr>\\\"\"	addwchar('\"'); /* "bla\""bla" -> "bla\"bla" */
	<tklstr>\"{ws}+\"	; /* "bla" "bla" -> "blabla" */
	<tklstr>[^\\\n\"]+	{
			char *yptr = yytext;
			while(*yptr)	/* FIXME: codepage translation */
			{
				if (*yptr & 0x80)
					parser_error("Invalid char %u in wide string", (unsigned char)*yptr);
				addwchar(*yptr++ & 0xff);
			}
		}
	<tklstr>\n	parser_error("Unterminated string");

	/*
	* Normal string scanning
	*/
	\"	yy_push_state(tkstr); cbufidx = 0;	/* '"' opens a normal string: scan it in tkstr with an empty byte buffer */
	<tkstr>\"{ws}+	|
	<tkstr>\"	{
			/* Closing quote, optionally followed by whitespace: return the buffered text */
			yy_pop_state();
			parser_lval.str = get_buffered_cstring();
			return tSTRING;
		}
	<tkstr>\\[0-7]{1,3}	{ /* octal escape sequence */
			int result;
			result = strtol(yytext+1, 0, 8);
			if ( result > 0xff )
				parser_error("Character constant out of range");
			addcchar((char)result);
		}
	<tkstr>\\x[0-9a-fA-F]{2}	{ /* hex escape sequence */
			int result;
			result = strtol(yytext+2, 0, 16);
			addcchar((char)result);
		}
	<tkstr>\\x[0-9a-fA-F]	{ parser_error("Invalid hex escape sequence '%s'", yytext); }

	<tkstr>\\[0-9]+	parser_error("Bad escape sequence");
	<tkstr>\\\n{ws}*	line_number++; char_number = 1; /* backslash at EOL continues string after leading whitespace on next line */
	<tkstr>\\a	addcchar('\a');
	<tkstr>\\b	addcchar('\b');
	<tkstr>\\f	addcchar('\f');
	<tkstr>\\n	addcchar('\n');
	<tkstr>\\r	addcchar('\r');
	<tkstr>\\t	addcchar('\t');
	<tkstr>\\v	addcchar('\v');
	<tkstr>\\.	addcchar(yytext[1]);	/* any other escaped character is taken literally */
	<tkstr>\\\r\n	addcchar(yytext[2]); line_number++; char_number = 1;
	<tkstr>[^\\\n\"]+	{
			/* Plain run of characters: copy it byte for byte */
			char *yptr = yytext;
			while(*yptr)
				addcchar(*yptr++);
		}
	<tkstr>\"\"	addcchar('\"'); /* "bla""bla" -> "bla\"bla" */
	<tkstr>\\\"\"	addcchar('\"'); /* "bla\""bla" -> "bla\"bla" */
	<tkstr>\"{ws}+\"	; /* "bla" "bla" -> "blabla" */
	<tkstr>\n	parser_error("Unterminated string");

	/*
	* Raw data scanning
	*/
	\' yy_push_state(tkrcd); cbufidx = 0; /* a single quote opens raw data; start with an empty byte buffer */
	<tkrcd>\' {
	/* Closing quote: hand back a copy of the cbufidx bytes collected in cbuffer */
	yy_pop_state();
	parser_lval.raw = new_raw_data();
	parser_lval.raw->size = cbufidx;
	parser_lval.raw->data = xmalloc(parser_lval.raw->size);
	memcpy(parser_lval.raw->data, cbuffer, parser_lval.raw->size);
	return tRAWDATA;
	}
	<tkrcd>[0-9a-fA-F]{2} {
	/* Each pair of hex digits contributes one byte */
	int result;
	result = strtol(yytext, 0, 16);
	addcchar((char)result);
	}
	<tkrcd>{ws}+ ; /* Ignore space */
	<tkrcd>\n line_number++; char_number = 1; /* newlines are allowed inside raw data; only the position counters change */
	<tkrcd>. parser_error("Malformed data-line"); /* anything else, including a lone hex digit, is an error */

	/*
	* Comment stripping
	* Should never occur after preprocessing
	*/
	<INITIAL,pp_cstrip>"/*"	{
			/* Enter the comment state, remembering wanted_id so it can be put back into want_id afterwards */
			yy_push_state(comment);
			save_wanted_id = wanted_id;
			if(!no_preprocess)
				parser_warning("Found comments after preprocessing, please report\n");
		}
	<comment>[^*\n]*	;	/* anything that is neither '*' nor a newline */
	<comment>"*"+[^*/\n]*	;	/* a run of '*' that is not followed by '/' */
	<comment>\n	line_number++; char_number = 1;
	<comment>"*"+"/"	yy_pop_state(); want_id = save_wanted_id;

	;[^\n]*	want_id = wanted_id; /* not really comment, but left-over c-junk */
	"//"[^\n]*	want_id = wanted_id; if(!no_preprocess) parser_warning("Found comments after preprocessing, please report\n");

	\n {
	/* End of line: copy wanted_id into want_id and advance the position counters */
	want_id = wanted_id;
	line_number++;
	char_number = 1;
	/* A newline is only reported as a token when want_nl is set; the flag is cleared once used */
	if(want_nl)
	{
	want_nl = 0;
	return tNL;
	}
	}
	{ws}+ want_id = wanted_id; /* Eat whitespace */

	<INITIAL>[ -~] return yytext[0]; /* any other character from ' ' to '~' is returned as its own token value */

	<*>.|\n	{
			/* Catch all rule to find any unmatched text */
			if(*yytext == '\n')
			{
				line_number++;
				char_number = 1;
			}
			/* Report the offending character; non-printable ones are shown as '.'.
			 * The byte is converted to unsigned char so that values above 0x7f
			 * are not sign-extended in the hex output. */
			parser_error("Unmatched text '%c' (0x%02x) YY_START=%d",
				isprint((unsigned char)*yytext) ? *yytext : '.', (unsigned char)*yytext, YY_START);
		}

	%%

	/*
	 * Append one byte to the narrow scan buffer.
	 * When the buffer is full it is enlarged by 1024 elements before the
	 * byte is stored; a warning is issued once the allocation exceeds
	 * 65536 elements.
	 */
	static void addcchar(char c)
	{
		const int buffer_full = (cbufidx >= cbufalloc);

		if(buffer_full)
		{
			cbufalloc += 1024;
			cbuffer = xrealloc(cbuffer, cbufalloc * sizeof(*cbuffer));
			if(cbufalloc > 65536)
				parser_warning("Reallocating string buffer larger than 64kB\n");
		}

		cbuffer[cbufidx] = c;
		cbufidx++;
	}

	/*
	 * Append one wide character to the wide scan buffer.
	 * When the buffer is full it is enlarged by 1024 elements before the
	 * character is stored; a warning is issued once the allocation exceeds
	 * 65536 elements.
	 */
	static void addwchar(WCHAR s)
	{
		const int buffer_full = (wbufidx >= wbufalloc);

		if(buffer_full)
		{
			wbufalloc += 1024;
			wbuffer = xrealloc(wbuffer, wbufalloc * sizeof(*wbuffer));
			if(wbufalloc > 65536)
				parser_warning("Reallocating wide string buffer larger than 64kB\n");
		}

		wbuffer[wbufidx] = s;
		wbufidx++;
	}

	static string_t *get_buffered_cstring(void)
	{
	string_t *str = new_string();

	str->size = cbufidx;
	str->type = str_char;
	str->str.cstr = xmalloc(cbufidx+1);
	memcpy(str->str.cstr, cbuffer, cbufidx);
	str->str.cstr[cbufidx] = '\0';

	if (!current_codepage \|\| current_codepage == -1 \|\| !win32) /* store as ANSI string */
	{
	if (!current_codepage) parser_error("Codepage set to Unicode only, cannot use ASCII string here");
	return str;
	}
	else /* convert to Unicode before storing */
	{
	string_t *str_w = convert_string( str, str_unicode, current_codepage );
	if (!check_unicode_conversion( str, str_w, current_codepage ))
	parser_error("String %s does not convert identically to Unicode and back in codepage %d. "
	"Try using a Unicode string instead", str->str.cstr, current_codepage );
	if (check_valid_utf8( str, current_codepage ))
	parser_warning( "string \"%s\" seems to be UTF-8 but codepage %u is in use.\n",
	str->str.cstr, current_codepage );
	free_string( str );
	return str_w;
	}
	}

	static string_t *get_buffered_wstring(void)
	{
	string_t *str = new_string();
	str->size = wbufidx;
	str->type = str_unicode;
	str->str.wstr = xmalloc((wbufidx+1)*sizeof(WCHAR));
	memcpy(str->str.wstr, wbuffer, wbufidx*sizeof(WCHAR));
	str->str.wstr[wbufidx] = 0;
	return str;
	}

	/*
	 * Create a narrow (str_char) string_t holding a copy of the
	 * NUL-terminated string 's'.  The size field is the length without the
	 * terminator; the terminator itself is copied as well.
	 */
	static string_t *make_string(char *s)
	{
		string_t *str = new_string();
		str->size = strlen(s);
		str->type = str_char;
		str->str.cstr = xmalloc(str->size+1);
		memcpy(str->str.cstr, s, str->size+1);	/* +1 copies the trailing '\0' too */
		return str;
	}