Blame - libcpp/lex.c - toolchain/gcc

blob: 896a3bef2c2c732bf19c3babfeadc9e4debab38a [file] [log] [blame]

Zack Weinberg	45b966d	2000-03-13 22:01:08 +0000	[diff] [blame]	1	/* CPP Library - lexical analysis.
Joseph Myers	a48e3dd	2011-08-18 16:13:49 +0100	[diff] [blame]	2	Copyright (C) 2000, 2001, 2002, 2003, 2004, 2005, 2007, 2008, 2009, 2010,
				3	2011 Free Software Foundation, Inc.
Zack Weinberg	45b966d	2000-03-13 22:01:08 +0000	[diff] [blame]	4	Contributed by Per Bothner, 1994-95.
				5	Based on CCCP program by Paul Rubin, June 1986
				6	Adapted to ANSI C, Richard Stallman, Jan 1987
				7	Broken out to separate file, Zack Weinberg, Mar 2000
				8
				9	This program is free software; you can redistribute it and/or modify it
				10	under the terms of the GNU General Public License as published by the
Jakub Jelinek	748086b	2009-04-09 17:00:19 +0200	[diff] [blame]	11	Free Software Foundation; either version 3, or (at your option) any
Zack Weinberg	45b966d	2000-03-13 22:01:08 +0000	[diff] [blame]	12	later version.
				13
				14	This program is distributed in the hope that it will be useful,
				15	but WITHOUT ANY WARRANTY; without even the implied warranty of
				16	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
				17	GNU General Public License for more details.
				18
				19	You should have received a copy of the GNU General Public License
Jakub Jelinek	748086b	2009-04-09 17:00:19 +0200	[diff] [blame]	20	along with this program; see the file COPYING3. If not see
				21	<http://www.gnu.org/licenses/>. */
Zack Weinberg	45b966d	2000-03-13 22:01:08 +0000	[diff] [blame]	22
				23	#include "config.h"
				24	#include "system.h"
Zack Weinberg	45b966d	2000-03-13 22:01:08 +0000	[diff] [blame]	25	#include "cpplib.h"
Paolo Bonzini	4f4e53dd	2004-05-24 10:50:45 +0000	[diff] [blame]	26	#include "internal.h"
Zack Weinberg	45b966d	2000-03-13 22:01:08 +0000	[diff] [blame]	27
/* Spelling category recorded for each token type in the
   token_spellings table.  Entries produced by the OP macro are always
   SPELL_OPERATOR; entries produced by TK name their category
   explicitly.  The enumerators are numbered consecutively from 0.  */
enum spell_type
{
  SPELL_OPERATOR = 0,
  SPELL_IDENT,
  SPELL_LITERAL,
  SPELL_NONE
};
				35
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	36	struct token_spelling
Zack Weinberg	f9a0e96	2000-07-13 02:32:41 +0000	[diff] [blame]	37	{
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	38	enum spell_type category;
				39	const unsigned char *name;
Zack Weinberg	f9a0e96	2000-07-13 02:32:41 +0000	[diff] [blame]	40	};
				41
Zack Weinberg	8206c79	2001-10-11 21:21:57 +0000	[diff] [blame]	42	static const unsigned char *const digraph_spellings[] =
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	43	{ UC"%:", UC"%:%:", UC"<:", UC":>", UC"<%", UC"%>" };
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	44
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	45	#define OP(e, s) { SPELL_OPERATOR, UC s },
				46	#define TK(e, s) { SPELL_ ## s, UC #e },
Zack Weinberg	8206c79	2001-10-11 21:21:57 +0000	[diff] [blame]	47	static const struct token_spelling token_spellings[N_TTYPES] = { TTYPE_TABLE };
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	48	#undef OP
				49	#undef TK
				50
				51	#define TOKEN_SPELL(token) (token_spellings[(token)->type].category)
				52	#define TOKEN_NAME(token) (token_spellings[(token)->type].name)
Zack Weinberg	f2d5f0c	2000-04-14 23:29:45 +0000	[diff] [blame]	53
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	54	static void add_line_note (cpp_buffer , const uchar , unsigned int);
				55	static int skip_line_comment (cpp_reader *);
				56	static void skip_whitespace (cpp_reader *, cppchar_t);
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	57	static void lex_string (cpp_reader , cpp_token , const uchar *);
				58	static void save_comment (cpp_reader , cpp_token , const uchar *, cppchar_t);
Matthew Gingell	631d0d3	2008-10-05 12:35:36 +0000	[diff] [blame]	59	static void store_comment (cpp_reader , cpp_token );
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	60	static void create_literal (cpp_reader , cpp_token , const uchar *,
				61	unsigned int, enum cpp_ttype);
				62	static bool warn_in_comment (cpp_reader , _cpp_line_note );
				63	static int name_p (cpp_reader , const cpp_string );
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	64	static tokenrun next_tokenrun (tokenrun );
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	65
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	66	static _cpp_buff *new_buff (size_t);
Zack Weinberg	15dad1d	2000-05-18 15:55:46 +0000	[diff] [blame]	67
Neil Booth	9d10c9a	2003-03-06 23:12:30 +0000	[diff] [blame]	68
Zack Weinberg	6d2c204	2000-04-30 17:30:25 +0000	[diff] [blame]	69	/* Utility routine:
Zack Weinberg	6d2c204	2000-04-30 17:30:25 +0000	[diff] [blame]	70
Zack Weinberg	bfb9dc7	2000-07-08 19:00:39 +0000	[diff] [blame]	71	Compares, the token TOKEN to the NUL-terminated string STRING.
				72	TOKEN must be a CPP_NAME. Returns 1 for equal, 0 for unequal. */
Zack Weinberg	6d2c204	2000-04-30 17:30:25 +0000	[diff] [blame]	73	int
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	74	cpp_ideq (const cpp_token token, const char string)
Zack Weinberg	6d2c204	2000-04-30 17:30:25 +0000	[diff] [blame]	75	{
Zack Weinberg	bfb9dc7	2000-07-08 19:00:39 +0000	[diff] [blame]	76	if (token->type != CPP_NAME)
Zack Weinberg	6d2c204	2000-04-30 17:30:25 +0000	[diff] [blame]	77	return 0;
Zack Weinberg	bfb9dc7	2000-07-08 19:00:39 +0000	[diff] [blame]	78
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	79	return !ustrcmp (NODE_NAME (token->val.node.node), (const uchar *) string);
Zack Weinberg	6d2c204	2000-04-30 17:30:25 +0000	[diff] [blame]	80	}
				81
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	82	/* Record a note TYPE at byte POS into the current cleaned logical
				83	line. */
Neil Booth	8706281	2001-10-20 09:00:53 +0000	[diff] [blame]	84	static void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	85	add_line_note (cpp_buffer buffer, const uchar pos, unsigned int type)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	86	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	87	if (buffer->notes_used == buffer->notes_cap)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	88	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	89	buffer->notes_cap = buffer->notes_cap * 2 + 200;
Gabriel Dos Reis	c3f829c	2005-05-28 15:52:48 +0000	[diff] [blame]	90	buffer->notes = XRESIZEVEC (_cpp_line_note, buffer->notes,
				91	buffer->notes_cap);
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	92	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	93
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	94	buffer->notes[buffer->notes_used].pos = pos;
				95	buffer->notes[buffer->notes_used].type = type;
				96	buffer->notes_used++;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	97	}
				98
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	99
				100	/* Fast path to find line special characters using optimized character
				101	scanning algorithms. Anything complicated falls back to the slow
				102	path below. Since this loop is very hot it's worth doing these kinds
				103	of optimizations.
				104
				105	One of the paths through the ifdefs should provide
				106
				107	const uchar *search_line_fast (const uchar *s, const uchar *end);
				108
				109	Between S and END, search for \n, \r, \\, ?. Return a pointer to
				110	the found character.
				111
				112	Note that the last character of the buffer is always a newline,
				113	as forced by _cpp_convert_input. This fact can be used to avoid
				114	explicitly looking for the end of the buffer. */
				115
				116	/* Configure gives us an ifdef test. */
				117	#ifndef WORDS_BIGENDIAN
				118	#define WORDS_BIGENDIAN 0
				119	#endif
				120
				121	/* We'd like the largest integer that fits into a register. There's nothing
				122	in <stdint.h> that gives us that. For most hosts this is unsigned long,
				123	but MS decided on an LLP64 model. Thankfully when building with GCC we
				124	can get the "real" word size. */
				125	#ifdef __GNUC__
				126	typedef unsigned int word_type __attribute__((__mode__(__word__)));
				127	#else
				128	typedef unsigned long word_type;
				129	#endif
				130
				131	/* The code below is only expecting sizes 4 or 8.
				132	Die at compile-time if this expectation is violated. */
				133	typedef char check_word_type_size
				134	[(sizeof(word_type) == 8 \|\| sizeof(word_type) == 4) * 2 - 1];
				135
				136	/* Return X with the first N bytes forced to values that won't match one
				137	of the interesting characters. Note that NUL is not interesting. */
				138
				139	static inline word_type
				140	acc_char_mask_misalign (word_type val, unsigned int n)
				141	{
				142	word_type mask = -1;
				143	if (WORDS_BIGENDIAN)
				144	mask >>= n * 8;
				145	else
				146	mask <<= n * 8;
				147	return val & mask;
				148	}
				149
				150	/* Return X replicated to all byte positions within WORD_TYPE. */
				151
				152	static inline word_type
				153	acc_char_replicate (uchar x)
				154	{
				155	word_type ret;
				156
				157	ret = (x << 24) \| (x << 16) \| (x << 8) \| x;
				158	if (sizeof(word_type) == 8)
				159	ret = (ret << 16 << 16) \| ret;
				160	return ret;
				161	}
				162
				163	/* Return non-zero if some byte of VAL is (probably) C. */
				164
				165	static inline word_type
				166	acc_char_cmp (word_type val, word_type c)
				167	{
				168	#if defined(__GNUC__) && defined(__alpha__)
				169	/* We can get exact results using a compare-bytes instruction.
				170	Get (val == c) via (0 >= (val ^ c)). */
				171	return __builtin_alpha_cmpbge (0, val ^ c);
				172	#else
				173	word_type magic = 0x7efefefeU;
				174	if (sizeof(word_type) == 8)
				175	magic = (magic << 16 << 16) \| 0xfefefefeU;
				176	magic \|= 1;
				177
				178	val ^= c;
				179	return ((val + magic) ^ ~val) & ~magic;
				180	#endif
				181	}
				182
				183	/* Given the result of acc_char_cmp is non-zero, return the index of
				184	the found character. If this was a false positive, return -1. */
				185
				186	static inline int
				187	acc_char_index (word_type cmp ATTRIBUTE_UNUSED,
				188	word_type val ATTRIBUTE_UNUSED)
				189	{
				190	#if defined(__GNUC__) && defined(__alpha__) && !WORDS_BIGENDIAN
				191	/* The cmpbge instruction sets bits of the result corresponding to
				192	matches in the bytes with no false positives. */
				193	return __builtin_ctzl (cmp);
				194	#else
				195	unsigned int i;
				196
				197	/* ??? It would be nice to force unrolling here,
				198	and have all of these constants folded. */
				199	for (i = 0; i < sizeof(word_type); ++i)
				200	{
				201	uchar c;
				202	if (WORDS_BIGENDIAN)
				203	c = (val >> (sizeof(word_type) - i - 1) * 8) & 0xff;
				204	else
				205	c = (val >> i * 8) & 0xff;
				206
				207	if (c == '\n' \|\| c == '\r' \|\| c == '\\' \|\| c == '?')
				208	return i;
				209	}
				210
				211	return -1;
				212	#endif
				213	}
				214
				215	/* A version of the fast scanner using bit fiddling techniques.
				216
				217	For 32-bit words, one would normally perform 16 comparisons and
				218	16 branches. With this algorithm one performs 24 arithmetic
				219	operations and one branch. Whether this is faster with a 32-bit
				220	word size is going to be somewhat system dependent.
				221
				222	For 64-bit words, we eliminate twice the number of comparisons
				223	and branches without increasing the number of arithmetic operations.
				224	It's almost certainly going to be a win with 64-bit word size. */
				225
				226	static const uchar * search_line_acc_char (const uchar , const uchar )
				227	ATTRIBUTE_UNUSED;
				228
				229	static const uchar *
				230	search_line_acc_char (const uchar s, const uchar end ATTRIBUTE_UNUSED)
				231	{
				232	const word_type repl_nl = acc_char_replicate ('\n');
				233	const word_type repl_cr = acc_char_replicate ('\r');
				234	const word_type repl_bs = acc_char_replicate ('\\');
				235	const word_type repl_qm = acc_char_replicate ('?');
				236
				237	unsigned int misalign;
				238	const word_type *p;
				239	word_type val, t;
				240
				241	/* Align the buffer. Mask out any bytes from before the beginning. */
				242	p = (word_type *)((uintptr_t)s & -sizeof(word_type));
				243	val = *p;
				244	misalign = (uintptr_t)s & (sizeof(word_type) - 1);
				245	if (misalign)
				246	val = acc_char_mask_misalign (val, misalign);
				247
				248	/* Main loop. */
				249	while (1)
				250	{
				251	t = acc_char_cmp (val, repl_nl);
				252	t \|= acc_char_cmp (val, repl_cr);
				253	t \|= acc_char_cmp (val, repl_bs);
				254	t \|= acc_char_cmp (val, repl_qm);
				255
				256	if (__builtin_expect (t != 0, 0))
				257	{
				258	int i = acc_char_index (t, val);
				259	if (i >= 0)
				260	return (const uchar *)p + i;
				261	}
				262
				263	val = *++p;
				264	}
				265	}
				266
Rainer Orth	789d73c	2010-08-24 17:23:35 +0000	[diff] [blame]	267	/* Disable on Solaris 2/x86 until the following problems can be properly
				268	autoconfed:
				269
				270	The Solaris 8 assembler cannot assemble SSE2/SSE4.2 insns.
				271	The Solaris 9 assembler cannot assemble SSE4.2 insns.
				272	Before Solaris 9 Update 6, SSE insns cannot be executed.
				273	The Solaris 10+ assembler tags objects with the instruction set
				274	extensions used, so SSE4.2 executables cannot run on machines that
				275	don't support that extension. */
				276
				277	#if (GCC_VERSION >= 4005) && (defined(__i386__) \|\| defined(__x86_64__)) && !(defined(__sun__) && defined(__svr4__))
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	278
				279	/* Replicated character data to be shared between implementations.
				280	Recall that outside of a context with vector support we can't
				281	define compatible vector types, therefore these are all defined
				282	in terms of raw characters. */
				283	static const char repl_chars[4][16] __attribute__((aligned(16))) = {
				284	{ '\n', '\n', '\n', '\n', '\n', '\n', '\n', '\n',
				285	'\n', '\n', '\n', '\n', '\n', '\n', '\n', '\n' },
				286	{ '\r', '\r', '\r', '\r', '\r', '\r', '\r', '\r',
				287	'\r', '\r', '\r', '\r', '\r', '\r', '\r', '\r' },
				288	{ '\\', '\\', '\\', '\\', '\\', '\\', '\\', '\\',
				289	'\\', '\\', '\\', '\\', '\\', '\\', '\\', '\\' },
				290	{ '?', '?', '?', '?', '?', '?', '?', '?',
				291	'?', '?', '?', '?', '?', '?', '?', '?' },
				292	};
				293
				294	/* A version of the fast scanner using MMX vectorized byte compare insns.
				295
				296	This uses the PMOVMSKB instruction which was introduced with "MMX2",
Uros Bizjak	ef230b3	2011-05-22 20:53:32 +0200	[diff] [blame]	297	which was packaged into SSE1; it is also present in the AMD MMX
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	298	extension. Mark the function as using "sse" so that we emit a real
				299	"emms" instruction, rather than the 3dNOW "femms" instruction. */
				300
				301	static const uchar *
				302	#ifndef __SSE__
				303	__attribute__((__target__("sse")))
				304	#endif
				305	search_line_mmx (const uchar s, const uchar end ATTRIBUTE_UNUSED)
				306	{
				307	typedef char v8qi __attribute__ ((__vector_size__ (8)));
				308	typedef int __m64 __attribute__ ((__vector_size__ (8), __may_alias__));
				309
				310	const v8qi repl_nl = (const v8qi )repl_chars[0];
				311	const v8qi repl_cr = (const v8qi )repl_chars[1];
				312	const v8qi repl_bs = (const v8qi )repl_chars[2];
				313	const v8qi repl_qm = (const v8qi )repl_chars[3];
				314
				315	unsigned int misalign, found, mask;
				316	const v8qi *p;
				317	v8qi data, t, c;
				318
				319	/* Align the source pointer. While MMX doesn't generate unaligned data
				320	faults, this allows us to safely scan to the end of the buffer without
				321	reading beyond the end of the last page. */
				322	misalign = (uintptr_t)s & 7;
				323	p = (const v8qi *)((uintptr_t)s & -8);
				324	data = *p;
				325
				326	/* Create a mask for the bytes that are valid within the first
				327	16-byte block. The Idea here is that the AND with the mask
				328	within the loop is "free", since we need some AND or TEST
				329	insn in order to set the flags for the branch anyway. */
				330	mask = -1u << misalign;
				331
				332	/* Main loop processing 8 bytes at a time. */
				333	goto start;
				334	do
				335	{
				336	data = *++p;
				337	mask = -1;
				338
				339	start:
				340	t = __builtin_ia32_pcmpeqb(data, repl_nl);
				341	c = __builtin_ia32_pcmpeqb(data, repl_cr);
				342	t = (v8qi) __builtin_ia32_por ((__m64)t, (__m64)c);
				343	c = __builtin_ia32_pcmpeqb(data, repl_bs);
				344	t = (v8qi) __builtin_ia32_por ((__m64)t, (__m64)c);
				345	c = __builtin_ia32_pcmpeqb(data, repl_qm);
				346	t = (v8qi) __builtin_ia32_por ((__m64)t, (__m64)c);
				347	found = __builtin_ia32_pmovmskb (t);
				348	found &= mask;
				349	}
				350	while (!found);
				351
				352	__builtin_ia32_emms ();
				353
				354	/* FOUND contains 1 in bits for which we matched a relevant
				355	character. Conversion to the byte index is trivial. */
				356	found = __builtin_ctz(found);
				357	return (const uchar *)p + found;
				358	}
				359
				360	/* A version of the fast scanner using SSE2 vectorized byte compare insns. */
				361
				362	static const uchar *
				363	#ifndef __SSE2__
				364	__attribute__((__target__("sse2")))
				365	#endif
				366	search_line_sse2 (const uchar s, const uchar end ATTRIBUTE_UNUSED)
				367	{
				368	typedef char v16qi __attribute__ ((__vector_size__ (16)));
				369
				370	const v16qi repl_nl = (const v16qi )repl_chars[0];
				371	const v16qi repl_cr = (const v16qi )repl_chars[1];
				372	const v16qi repl_bs = (const v16qi )repl_chars[2];
				373	const v16qi repl_qm = (const v16qi )repl_chars[3];
				374
				375	unsigned int misalign, found, mask;
				376	const v16qi *p;
				377	v16qi data, t;
				378
				379	/* Align the source pointer. */
				380	misalign = (uintptr_t)s & 15;
				381	p = (const v16qi *)((uintptr_t)s & -16);
				382	data = *p;
				383
				384	/* Create a mask for the bytes that are valid within the first
				385	16-byte block. The Idea here is that the AND with the mask
				386	within the loop is "free", since we need some AND or TEST
				387	insn in order to set the flags for the branch anyway. */
				388	mask = -1u << misalign;
				389
				390	/* Main loop processing 16 bytes at a time. */
				391	goto start;
				392	do
				393	{
				394	data = *++p;
				395	mask = -1;
				396
				397	start:
				398	t = __builtin_ia32_pcmpeqb128(data, repl_nl);
				399	t \|= __builtin_ia32_pcmpeqb128(data, repl_cr);
				400	t \|= __builtin_ia32_pcmpeqb128(data, repl_bs);
				401	t \|= __builtin_ia32_pcmpeqb128(data, repl_qm);
				402	found = __builtin_ia32_pmovmskb128 (t);
				403	found &= mask;
				404	}
				405	while (!found);
				406
				407	/* FOUND contains 1 in bits for which we matched a relevant
				408	character. Conversion to the byte index is trivial. */
				409	found = __builtin_ctz(found);
				410	return (const uchar *)p + found;
				411	}
				412
#ifdef HAVE_SSE4
/* A version of the fast scanner using SSE 4.2 vectorized string insns.

   Starting at S, return a pointer to the first \n, \r, \\ or ?.  END is
   consulted only to decide whether an unaligned 16-byte read at S is
   safe.  */

static const uchar *
#ifndef __SSE4_2__
__attribute__((__target__("sse4.2")))
#endif
search_line_sse42 (const uchar *s, const uchar *end)
{
  typedef char v16qi __attribute__ ((__vector_size__ (16)));
  /* The four characters searched for; the asm statements below pass 4
     as the length of this set.  */
  static const v16qi search = { '\n', '\r', '?', '\\' };

  uintptr_t si = (uintptr_t)s;
  uintptr_t index;

  /* Check for unaligned input.  */
  if (si & 15)
    {
      if (__builtin_expect (end - s < 16, 0)
          && __builtin_expect ((si & 0xfff) > 0xff0, 0))
        {
          /* There are less than 16 bytes left in the buffer, and less
             than 16 bytes left on the page.  Reading 16 bytes at this
             point might generate a spurious page fault.  Defer to the
             SSE2 implementation, which already handles alignment.  */
          return search_line_sse2 (s, end);
        }

      /* ??? The builtin doesn't understand that the PCMPESTRI read from
         memory need not be aligned.  */
      __asm ("%vpcmpestri $0, (%1), %2"
             : "=c"(index) : "r"(s), "x"(search), "a"(4), "d"(16));
      if (__builtin_expect (index < 16, 0))
        goto found;

      /* Advance the pointer to an aligned address.  We will re-scan a
         few bytes, but we no longer need care for reading past the
         end of a page, since we're guaranteed a match.  */
      s = (const uchar *)((si + 16) & -16);
    }

  /* Main loop, processing 16 bytes at a time.  By doing the whole loop
     in inline assembly, we can make proper use of the flags set.  */
  __asm ( "sub $16, %1\n"
          " .balign 16\n"
          "0: add $16, %1\n"
          " %vpcmpestri $0, (%1), %2\n"
          " jnc 0b"
          : "=&c"(index), "+r"(s)
          : "x"(search), "a"(4), "d"(16));

 found:
  return s + index;
}

#else
/* Work around out-dated assemblers without sse4 support.  */
#define search_line_sse42 search_line_sse2
#endif
				472
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	473	/* Check the CPU capabilities. */
				474
				475	#include "../gcc/config/i386/cpuid.h"
				476
				477	typedef const uchar * (search_line_fast_type) (const uchar , const uchar *);
				478	static search_line_fast_type search_line_fast;
				479
				480	static void __attribute__((constructor))
				481	init_vectorized_lexer (void)
				482	{
				483	unsigned dummy, ecx = 0, edx = 0;
				484	search_line_fast_type impl = search_line_acc_char;
				485	int minimum = 0;
				486
				487	#if defined(__SSE4_2__)
				488	minimum = 3;
				489	#elif defined(__SSE2__)
				490	minimum = 2;
Uros Bizjak	ef230b3	2011-05-22 20:53:32 +0200	[diff] [blame]	491	#elif defined(__SSE__)
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	492	minimum = 1;
				493	#endif
				494
				495	if (minimum == 3)
				496	impl = search_line_sse42;
				497	else if (__get_cpuid (1, &dummy, &dummy, &ecx, &edx) \|\| minimum == 2)
				498	{
				499	if (minimum == 3 \|\| (ecx & bit_SSE4_2))
				500	impl = search_line_sse42;
				501	else if (minimum == 2 \|\| (edx & bit_SSE2))
				502	impl = search_line_sse2;
				503	else if (minimum == 1 \|\| (edx & bit_SSE))
				504	impl = search_line_mmx;
				505	}
				506	else if (__get_cpuid (0x80000001, &dummy, &dummy, &dummy, &edx))
				507	{
Uros Bizjak	5e70c0b	2011-05-22 21:04:54 +0200	[diff] [blame]	508	if (minimum == 1
				509	\|\| (edx & (bit_MMXEXT \| bit_CMOV)) == (bit_MMXEXT \| bit_CMOV))
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	510	impl = search_line_mmx;
				511	}
				512
				513	search_line_fast = impl;
				514	}
				515
Richard Henderson	0195631	2011-03-18 13:20:35 -0700	[diff] [blame]	516	#elif (GCC_VERSION >= 4005) && defined(__ALTIVEC__)
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	517
				518	/* A vection of the fast scanner using AltiVec vectorized byte compares. */
				519	/* ??? Unfortunately, attribute(target("altivec")) is not yet supported,
				520	so we can't compile this function without -maltivec on the command line
				521	(or implied by some other switch). */
				522
				523	static const uchar *
				524	search_line_fast (const uchar s, const uchar end ATTRIBUTE_UNUSED)
				525	{
				526	typedef __attribute__((altivec(vector))) unsigned char vc;
				527
				528	const vc repl_nl = {
				529	'\n', '\n', '\n', '\n', '\n', '\n', '\n', '\n',
				530	'\n', '\n', '\n', '\n', '\n', '\n', '\n', '\n'
				531	};
				532	const vc repl_cr = {
				533	'\r', '\r', '\r', '\r', '\r', '\r', '\r', '\r',
				534	'\r', '\r', '\r', '\r', '\r', '\r', '\r', '\r'
				535	};
				536	const vc repl_bs = {
				537	'\\', '\\', '\\', '\\', '\\', '\\', '\\', '\\',
				538	'\\', '\\', '\\', '\\', '\\', '\\', '\\', '\\'
				539	};
				540	const vc repl_qm = {
				541	'?', '?', '?', '?', '?', '?', '?', '?',
				542	'?', '?', '?', '?', '?', '?', '?', '?',
				543	};
				544	const vc ones = {
				545	-1, -1, -1, -1, -1, -1, -1, -1,
				546	-1, -1, -1, -1, -1, -1, -1, -1,
				547	};
				548	const vc zero = { 0 };
				549
				550	vc data, mask, t;
				551
				552	/* Altivec loads automatically mask addresses with -16. This lets us
				553	issue the first load as early as possible. */
				554	data = __builtin_vec_ld(0, (const vc *)s);
				555
				556	/* Discard bytes before the beginning of the buffer. Do this by
				557	beginning with all ones and shifting in zeros according to the
				558	mis-alignment. The LVSR instruction pulls the exact shift we
				559	want from the address. */
				560	mask = __builtin_vec_lvsr(0, s);
				561	mask = __builtin_vec_perm(zero, ones, mask);
				562	data &= mask;
				563
				564	/* While altivec loads mask addresses, we still need to align S so
				565	that the offset we compute at the end is correct. */
				566	s = (const uchar *)((uintptr_t)s & -16);
				567
				568	/* Main loop processing 16 bytes at a time. */
				569	goto start;
				570	do
				571	{
				572	vc m_nl, m_cr, m_bs, m_qm;
				573
				574	s += 16;
				575	data = __builtin_vec_ld(0, (const vc *)s);
				576
				577	start:
				578	m_nl = (vc) __builtin_vec_cmpeq(data, repl_nl);
				579	m_cr = (vc) __builtin_vec_cmpeq(data, repl_cr);
				580	m_bs = (vc) __builtin_vec_cmpeq(data, repl_bs);
				581	m_qm = (vc) __builtin_vec_cmpeq(data, repl_qm);
				582	t = (m_nl \| m_cr) \| (m_bs \| m_qm);
				583
				584	/* T now contains 0xff in bytes for which we matched one of the relevant
				585	characters. We want to exit the loop if any byte in T is non-zero.
				586	Below is the expansion of vec_any_ne(t, zero). */
				587	}
				588	while (!__builtin_vec_vcmpeq_p(/__CR6_LT_REV/3, t, zero));
				589
				590	{
				591	#define N (sizeof(vc) / sizeof(long))
				592
				593	typedef char check_count[(N == 2 \|\| N == 4) * 2 - 1];
				594	union {
				595	vc v;
				596	unsigned long l[N];
				597	} u;
				598	unsigned long l, i = 0;
				599
				600	u.v = t;
				601
				602	/* Find the first word of T that is non-zero. */
				603	switch (N)
				604	{
				605	case 4:
				606	l = u.l[i++];
				607	if (l != 0)
				608	break;
				609	s += sizeof(unsigned long);
				610	l = u.l[i++];
				611	if (l != 0)
				612	break;
				613	s += sizeof(unsigned long);
				614	case 2:
				615	l = u.l[i++];
				616	if (l != 0)
				617	break;
				618	s += sizeof(unsigned long);
				619	l = u.l[i];
				620	}
				621
				622	/* L now contains 0xff in bytes for which we matched one of the
				623	relevant characters. We can find the byte index by finding
				624	its bit index and dividing by 8. */
				625	l = __builtin_clzl(l) >> 3;
				626	return s + l;
				627
				628	#undef N
				629	}
				630	}
				631
				632	#else
				633
				634	/* We only have one accelerated alternative. Use a direct call so that
				635	we encourage inlining. */
				636
				637	#define search_line_fast search_line_acc_char
				638
				639	#endif
				640
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	641	/* Returns with a logical line that contains no escaped newlines or
				642	trigraphs. This is a time-critical inner loop. */
				643	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	644	_cpp_clean_line (cpp_reader *pfile)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	645	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	646	cpp_buffer *buffer;
				647	const uchar *s;
				648	uchar c, d, p;
Neil Booth	29401c3	2001-08-22 20:37:20 +0000	[diff] [blame]	649
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	650	buffer = pfile->buffer;
				651	buffer->cur_note = buffer->notes_used = 0;
				652	buffer->cur = buffer->line_base = buffer->next_line;
				653	buffer->need_line = false;
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	654	s = buffer->next_line;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	655
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	656	if (!buffer->from_stage3)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	657	{
Ian Lance Taylor	7af45bd	2006-12-29 15:43:55 +0000	[diff] [blame]	658	const uchar *pbackslash = NULL;
				659
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	660	/* Fast path. This is the common case of an un-escaped line with
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	661	no trigraphs. The primary win here is by not writing any
				662	data back to memory until we have to. */
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	663	while (1)
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	664	{
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	665	/* Perform an optimized search for \n, \r, \\, ?. */
				666	s = search_line_fast (s, buffer->rlimit);
				667
				668	c = *s;
				669	if (c == '\\')
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	670	{
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	671	/* Record the location of the backslash and continue. */
				672	pbackslash = s++;
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	673	}
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	674	else if (__builtin_expect (c == '?', 0))
				675	{
				676	if (__builtin_expect (s[1] == '?', false)
Ian Lance Taylor	7af45bd	2006-12-29 15:43:55 +0000	[diff] [blame]	677	&& _cpp_trigraph_map[s[2]])
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	678	{
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	679	/* Have a trigraph. We may or may not have to convert
				680	it. Add a line note regardless, for -Wtrigraphs. */
				681	add_line_note (buffer, s, s[2]);
				682	if (CPP_OPTION (pfile, trigraphs))
				683	{
				684	/* We do, and that means we have to switch to the
				685	slow path. */
				686	d = (uchar *) s;
				687	*d = _cpp_trigraph_map[s[2]];
				688	s += 2;
				689	goto slow_path;
				690	}
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	691	}
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	692	/* Not a trigraph. Continue on fast-path. */
				693	s++;
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	694	}
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	695	else
				696	break;
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	697	}
				698
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	699	/* This must be \r or \n. We're either done, or we'll be forced
				700	to write back to the buffer and continue on the slow path. */
				701	d = (uchar *) s;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	702
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	703	if (__builtin_expect (s == buffer->rlimit, false))
				704	goto done;
				705
				706	/* DOS line ending? */
				707	if (__builtin_expect (c == '\r', false) && s[1] == '\n')
				708	{
				709	s++;
				710	if (s == buffer->rlimit)
				711	goto done;
				712	}
				713
				714	if (__builtin_expect (pbackslash == NULL, true))
				715	goto done;
				716
				717	/* Check for escaped newline. */
				718	p = d;
				719	while (is_nvspace (p[-1]))
				720	p--;
				721	if (p - 1 != pbackslash)
				722	goto done;
				723
				724	/* Have an escaped newline; process it and proceed to
				725	the slow path. */
				726	add_line_note (buffer, p - 1, p != d ? ' ' : '\\');
				727	d = p - 2;
				728	buffer->next_line = p - 1;
				729
				730	slow_path:
				731	while (1)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	732	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	733	c = *++s;
				734	*++d = c;
				735
				736	if (c == '\n' \|\| c == '\r')
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	737	{
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	738	/* Handle DOS line endings. */
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	739	if (c == '\r' && s != buffer->rlimit && s[1] == '\n')
				740	s++;
				741	if (s == buffer->rlimit)
Neil Booth	8706281	2001-10-20 09:00:53 +0000	[diff] [blame]	742	break;
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	743
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	744	/* Escaped? */
				745	p = d;
				746	while (p != buffer->next_line && is_nvspace (p[-1]))
				747	p--;
				748	if (p == buffer->next_line \|\| p[-1] != '\\')
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	749	break;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	750
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	751	add_line_note (buffer, p - 1, p != d ? ' ': '\\');
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	752	d = p - 2;
				753	buffer->next_line = p - 1;
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	754	}
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	755	else if (c == '?' && s[1] == '?' && _cpp_trigraph_map[s[2]])
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	756	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	757	/* Add a note regardless, for the benefit of -Wtrigraphs. */
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	758	add_line_note (buffer, d, s[2]);
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	759	if (CPP_OPTION (pfile, trigraphs))
				760	{
				761	*d = _cpp_trigraph_map[s[2]];
				762	s += 2;
				763	}
Neil Booth	a5c3ccc	2000-10-30 22:29:00 +0000	[diff] [blame]	764	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	765	}
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	766	}
				767	else
				768	{
Richard Henderson	246a2fc	2010-08-21 12:05:40 -0700	[diff] [blame]	769	while (s != '\n' && s != '\r')
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	770	s++;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	771	d = (uchar *) s;
				772
				773	/* Handle DOS line endings. */
				774	if (*s == '\r' && s != buffer->rlimit && s[1] == '\n')
				775	s++;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	776	}
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	777
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	778	done:
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	779	*d = '\n';
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	780	/* A sentinel note that should never be processed. */
				781	add_line_note (buffer, d + 1, '\n');
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	782	buffer->next_line = s + 1;
				783	}
				784
Neil Booth	a8eb604	2003-05-04 20:03:55 +0000	[diff] [blame]	785	/* Return true if the trigraph indicated by NOTE should be warned
				786	about in a comment. */
				787	static bool
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	788	warn_in_comment (cpp_reader pfile, _cpp_line_note note)
Neil Booth	a8eb604	2003-05-04 20:03:55 +0000	[diff] [blame]	789	{
				790	const uchar *p;
				791
				792	/* Within comments we don't warn about trigraphs, unless the
				793	trigraph forms an escaped newline, as that may change
Kazu Hirata	6356f89	2003-06-12 19:01:08 +0000	[diff] [blame]	794	behavior. */
Neil Booth	a8eb604	2003-05-04 20:03:55 +0000	[diff] [blame]	795	if (note->type != '/')
				796	return false;
				797
				798	/* If -trigraphs, then this was an escaped newline iff the next note
				799	is coincident. */
				800	if (CPP_OPTION (pfile, trigraphs))
				801	return note[1].pos == note->pos;
				802
				803	/* Otherwise, see if this forms an escaped newline. */
				804	p = note->pos + 3;
				805	while (is_nvspace (*p))
				806	p++;
				807
				808	/* There might have been escaped newlines between the trigraph and the
				809	newline we found. Hence the position test. */
				810	return (*p == '\n' && p < note[1].pos);
				811	}
				812
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	813	/* Process the notes created by add_line_note as far as the current
				814	location. */
				815	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	816	_cpp_process_line_notes (cpp_reader *pfile, int in_comment)
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	817	{
				818	cpp_buffer *buffer = pfile->buffer;
				819
				820	for (;;)
				821	{
				822	_cpp_line_note *note = &buffer->notes[buffer->cur_note];
				823	unsigned int col;
				824
				825	if (note->pos > buffer->cur)
				826	break;
				827
				828	buffer->cur_note++;
				829	col = CPP_BUF_COLUMN (buffer, note->pos + 1);
				830
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	831	if (note->type == '\\' \|\| note->type == ' ')
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	832	{
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	833	if (note->type == ' ' && !in_comment)
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	834	cpp_error_with_line (pfile, CPP_DL_WARNING, pfile->line_table->highest_line, col,
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	835	"backslash and newline separated by space");
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	836
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	837	if (buffer->next_line > buffer->rlimit)
				838	{
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	839	cpp_error_with_line (pfile, CPP_DL_PEDWARN, pfile->line_table->highest_line, col,
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	840	"backslash-newline at end of file");
				841	/* Prevent "no newline at end of file" warning. */
				842	buffer->next_line = buffer->rlimit;
				843	}
				844
				845	buffer->line_base = note->pos;
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	846	CPP_INCREMENT_LINE (pfile, 0);
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	847	}
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	848	else if (_cpp_trigraph_map[note->type])
				849	{
Neil Booth	a8eb604	2003-05-04 20:03:55 +0000	[diff] [blame]	850	if (CPP_OPTION (pfile, warn_trigraphs)
				851	&& (!in_comment \|\| warn_in_comment (pfile, note)))
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	852	{
				853	if (CPP_OPTION (pfile, trigraphs))
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	854	cpp_warning_with_line (pfile, CPP_W_TRIGRAPHS,
				855	pfile->line_table->highest_line, col,
				856	"trigraph ??%c converted to %c",
				857	note->type,
				858	(int) _cpp_trigraph_map[note->type]);
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	859	else
Geoffrey Keating	905bd7b	2003-07-22 02:21:16 +0000	[diff] [blame]	860	{
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	861	cpp_warning_with_line
				862	(pfile, CPP_W_TRIGRAPHS,
				863	pfile->line_table->highest_line, col,
Geoffrey Keating	905bd7b	2003-07-22 02:21:16 +0000	[diff] [blame]	864	"trigraph ??%c ignored, use -trigraphs to enable",
				865	note->type);
				866	}
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	867	}
				868	}
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	869	else if (note->type == 0)
				870	/* Already processed in lex_raw_string. */;
Neil Booth	41c32c9	2003-04-20 19:02:53 +0000	[diff] [blame]	871	else
				872	abort ();
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	873	}
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	874	}
				875
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	876	/* Skip a C-style block comment. We find the end of the comment by
				877	seeing if an asterisk is before every '/' we encounter. Returns
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	878	nonzero if comment terminated by EOF, zero otherwise.
				879
				880	Buffer->cur points to the initial asterisk of the comment. */
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	881	bool
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	882	_cpp_skip_block_comment (cpp_reader *pfile)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	883	{
				884	cpp_buffer *buffer = pfile->buffer;
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	885	const uchar *cur = buffer->cur;
				886	uchar c;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	887
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	888	cur++;
				889	if (*cur == '/')
				890	cur++;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	891
				892	for (;;)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	893	{
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	894	/* People like decorating comments with '*', so check for '/'
				895	instead for efficiency. */
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	896	c = *cur++;
				897
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	898	if (c == '/')
				899	{
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	900	if (cur[-2] == '*')
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	901	break;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	902
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	903	/* Warn about potential nested comments, but not if the '/'
Joseph Myers	a1f300c	2001-11-23 02:05:19 +0000	[diff] [blame]	904	comes immediately before the true comment delimiter.
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	905	Don't bother to get it right across escaped newlines. */
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	906	if (CPP_OPTION (pfile, warn_comments)
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	907	&& cur[0] == '*' && cur[1] != '/')
				908	{
				909	buffer->cur = cur;
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	910	cpp_warning_with_line (pfile, CPP_W_COMMENTS,
				911	pfile->line_table->highest_line,
				912	CPP_BUF_COL (buffer),
				913	"\"/*\" within comment");
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	914	}
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	915	}
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	916	else if (c == '\n')
				917	{
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	918	unsigned int cols;
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	919	buffer->cur = cur - 1;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	920	_cpp_process_line_notes (pfile, true);
				921	if (buffer->next_line >= buffer->rlimit)
				922	return true;
				923	_cpp_clean_line (pfile);
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	924
				925	cols = buffer->next_line - buffer->line_base;
				926	CPP_INCREMENT_LINE (pfile, cols);
				927
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	928	cur = buffer->cur;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	929	}
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	930	}
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	931
Zack Weinberg	d08dcf8	2003-10-13 18:53:28 +0000	[diff] [blame]	932	buffer->cur = cur;
Neil Booth	a8eb604	2003-05-04 20:03:55 +0000	[diff] [blame]	933	_cpp_process_line_notes (pfile, true);
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	934	return false;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	935	}
				936
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	937	/* Skip a C++ line comment, leaving buffer->cur pointing to the
Kazu Hirata	da7d830	2002-09-22 02:03:17 +0000	[diff] [blame]	938	terminating newline. Handles escaped newlines. Returns nonzero
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	939	if a multiline comment. */
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	940	static int
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	941	skip_line_comment (cpp_reader *pfile)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	942	{
Neil Booth	cbcff6d	2000-09-23 21:41:41 +0000	[diff] [blame]	943	cpp_buffer *buffer = pfile->buffer;
Manuel López-Ibáñez	1bb6466	2008-07-21 09:33:38 +0000	[diff] [blame]	944	source_location orig_line = pfile->line_table->highest_line;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	945
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	946	while (*buffer->cur != '\n')
				947	buffer->cur++;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	948
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	949	_cpp_process_line_notes (pfile, true);
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	950	return orig_line != pfile->line_table->highest_line;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	951	}
				952
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	953	/* Skips whitespace, saving the next non-whitespace character. */
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	954	static void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	955	skip_whitespace (cpp_reader *pfile, cppchar_t c)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	956	{
				957	cpp_buffer *buffer = pfile->buffer;
Neil Booth	f7d151f	2003-04-19 07:41:15 +0000	[diff] [blame]	958	bool saw_NUL = false;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	959
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	960	do
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	961	{
Neil Booth	91fcd15	2000-07-09 09:19:44 +0000	[diff] [blame]	962	/* Horizontal space always OK. */
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	963	if (c == ' ' \|\| c == '\t')
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	964	;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	965	/* Just \f \v or \0 left. */
Neil Booth	91fcd15	2000-07-09 09:19:44 +0000	[diff] [blame]	966	else if (c == '\0')
Neil Booth	f7d151f	2003-04-19 07:41:15 +0000	[diff] [blame]	967	saw_NUL = true;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	968	else if (pfile->state.in_directive && CPP_PEDANTIC (pfile))
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	969	cpp_error_with_line (pfile, CPP_DL_PEDWARN, pfile->line_table->highest_line,
Neil Booth	ebef4e8	2002-04-14 18:42:47 +0000	[diff] [blame]	970	CPP_BUF_COL (buffer),
				971	"%s in preprocessing directive",
				972	c == '\f' ? "form feed" : "vertical tab");
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	973
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	974	c = *buffer->cur++;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	975	}
Kazu Hirata	ec5c56d	2001-08-01 17:57:27 +0000	[diff] [blame]	976	/* We only want non-vertical space, i.e. ' ' \t \f \v \0. */
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	977	while (is_nvspace (c));
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	978
Neil Booth	f7d151f	2003-04-19 07:41:15 +0000	[diff] [blame]	979	if (saw_NUL)
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	980	cpp_error (pfile, CPP_DL_WARNING, "null character(s) ignored");
Neil Booth	f7d151f	2003-04-19 07:41:15 +0000	[diff] [blame]	981
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	982	buffer->cur--;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	983	}
				984
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	985	/* See if the characters of a number token are valid in a name (no
				986	'.', '+' or '-'). */
				987	static int
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	988	name_p (cpp_reader pfile, const cpp_string string)
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	989	{
				990	unsigned int i;
				991
				992	for (i = 0; i < string->len; i++)
				993	if (!is_idchar (string->text[i]))
				994	return 0;
				995
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	996	return 1;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	997	}
				998
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	999	/* After parsing an identifier or other sequence, produce a warning about
				1000	sequences not in NFC/NFKC. */
				1001	static void
				1002	warn_about_normalization (cpp_reader *pfile,
				1003	const cpp_token *token,
				1004	const struct normalize_state *s)
				1005	{
				1006	if (CPP_OPTION (pfile, warn_normalize) < NORMALIZE_STATE_RESULT (s)
				1007	&& !pfile->state.skipping)
				1008	{
				1009	/* Make sure that the token is printed using UCNs, even
				1010	if we'd otherwise happily print UTF-8. */
Gabriel Dos Reis	c3f829c	2005-05-28 15:52:48 +0000	[diff] [blame]	1011	unsigned char *buf = XNEWVEC (unsigned char, cpp_token_len (token));
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1012	size_t sz;
				1013
				1014	sz = cpp_spell_token (pfile, token, buf, false) - buf;
				1015	if (NORMALIZE_STATE_RESULT (s) == normalized_C)
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	1016	cpp_warning_with_line (pfile, CPP_W_NORMALIZE, token->src_loc, 0,
				1017	"`%.*s' is not in NFKC", (int) sz, buf);
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1018	else
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	1019	cpp_warning_with_line (pfile, CPP_W_NORMALIZE, token->src_loc, 0,
				1020	"`%.*s' is not in NFC", (int) sz, buf);
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1021	}
				1022	}
				1023
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1024	/* Returns TRUE if the sequence starting at buffer->cur is invalid in
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1025	an identifier. FIRST is TRUE if this starts an identifier. */
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1026	static bool
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1027	forms_identifier_p (cpp_reader *pfile, int first,
				1028	struct normalize_state *state)
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1029	{
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1030	cpp_buffer *buffer = pfile->buffer;
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1031
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1032	if (*buffer->cur == '$')
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1033	{
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1034	if (!CPP_OPTION (pfile, dollars_in_ident))
				1035	return false;
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1036
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1037	buffer->cur++;
Hans-Peter Nilsson	78b8811	2003-06-12 06:09:15 +0000	[diff] [blame]	1038	if (CPP_OPTION (pfile, warn_dollars) && !pfile->state.skipping)
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1039	{
Hans-Peter Nilsson	78b8811	2003-06-12 06:09:15 +0000	[diff] [blame]	1040	CPP_OPTION (pfile, warn_dollars) = 0;
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	1041	cpp_error (pfile, CPP_DL_PEDWARN, "'$' in identifier or number");
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1042	}
				1043
				1044	return true;
				1045	}
				1046
				1047	/* Is this a syntactically valid UCN? */
Joseph Myers	af15a2f	2005-09-20 21:31:37 +0100	[diff] [blame]	1048	if (CPP_OPTION (pfile, extended_identifiers)
Geoffrey Keating	6baba9b	2005-03-15 09:55:41 +0000	[diff] [blame]	1049	&& *buffer->cur == '\\'
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1050	&& (buffer->cur[1] == 'u' \|\| buffer->cur[1] == 'U'))
				1051	{
				1052	buffer->cur += 2;
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1053	if (_cpp_valid_ucn (pfile, &buffer->cur, buffer->rlimit, 1 + !first,
				1054	state))
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	1055	return true;
				1056	buffer->cur -= 2;
				1057	}
				1058
				1059	return false;
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1060	}
				1061
Kai Tietz	17e7cb8	2009-11-11 18:37:19 +0000	[diff] [blame]	1062	/* Helper function to get the cpp_hashnode of the identifier BASE. */
				1063	static cpp_hashnode *
				1064	lex_identifier_intern (cpp_reader pfile, const uchar base)
				1065	{
				1066	cpp_hashnode *result;
				1067	const uchar *cur;
				1068	unsigned int len;
				1069	unsigned int hash = HT_HASHSTEP (0, *base);
				1070
				1071	cur = base + 1;
				1072	while (ISIDNUM (*cur))
				1073	{
				1074	hash = HT_HASHSTEP (hash, *cur);
				1075	cur++;
				1076	}
				1077	len = cur - base;
				1078	hash = HT_HASHFINISH (hash, len);
				1079	result = CPP_HASHNODE (ht_lookup_with_hash (pfile->hash_table,
				1080	base, len, hash, HT_ALLOC));
				1081
				1082	/* Rarely, identifiers require diagnostics when lexed. */
				1083	if (__builtin_expect ((result->flags & NODE_DIAGNOSTIC)
				1084	&& !pfile->state.skipping, 0))
				1085	{
				1086	/* It is allowed to poison the same identifier twice. */
				1087	if ((result->flags & NODE_POISONED) && !pfile->state.poisoned_ok)
				1088	cpp_error (pfile, CPP_DL_ERROR, "attempt to use poisoned \"%s\"",
				1089	NODE_NAME (result));
				1090
				1091	/* Constraint 6.10.3.5: __VA_ARGS__ should only appear in the
				1092	replacement list of a variadic macro. */
				1093	if (result == pfile->spec_nodes.n__VA_ARGS__
				1094	&& !pfile->state.va_args_ok)
				1095	cpp_error (pfile, CPP_DL_PEDWARN,
				1096	"__VA_ARGS__ can only appear in the expansion"
				1097	" of a C99 variadic macro");
				1098
				1099	/* For -Wc++-compat, warn about use of C++ named operators. */
				1100	if (result->flags & NODE_WARN_OPERATOR)
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	1101	cpp_warning (pfile, CPP_W_CXX_OPERATOR_NAMES,
				1102	"identifier \"%s\" is a special operator name in C++",
				1103	NODE_NAME (result));
Kai Tietz	17e7cb8	2009-11-11 18:37:19 +0000	[diff] [blame]	1104	}
				1105
				1106	return result;
				1107	}
				1108
				1109	/* Get the cpp_hashnode of an identifier specified by NAME in
				1110	the current cpp_reader object. If none is found, NULL is returned. */
				1111	cpp_hashnode *
				1112	_cpp_lex_identifier (cpp_reader pfile, const char name)
				1113	{
				1114	cpp_hashnode *result;
				1115	result = lex_identifier_intern (pfile, (uchar *) name);
				1116	return result;
				1117	}
				1118
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1119	/* Lex an identifier starting at BUFFER->CUR - 1. */
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1120	static cpp_hashnode *
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1121	lex_identifier (cpp_reader pfile, const uchar base, bool starts_ucn,
				1122	struct normalize_state *nst)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1123	{
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	1124	cpp_hashnode *result;
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	1125	const uchar *cur;
Zack Weinberg	c6e8380	2004-06-05 20:58:06 +0000	[diff] [blame]	1126	unsigned int len;
				1127	unsigned int hash = HT_HASHSTEP (0, *base);
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1128
Zack Weinberg	c6e8380	2004-06-05 20:58:06 +0000	[diff] [blame]	1129	cur = pfile->buffer->cur;
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	1130	if (! starts_ucn)
				1131	while (ISIDNUM (*cur))
				1132	{
				1133	hash = HT_HASHSTEP (hash, *cur);
				1134	cur++;
				1135	}
				1136	pfile->buffer->cur = cur;
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1137	if (starts_ucn \|\| forms_identifier_p (pfile, false, nst))
Neil Booth	10cf9bd	2002-03-22 07:23:21 +0000	[diff] [blame]	1138	{
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	1139	/* Slower version for identifiers containing UCNs (or $). */
				1140	do {
				1141	while (ISIDNUM (*pfile->buffer->cur))
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1142	{
				1143	pfile->buffer->cur++;
				1144	NORMALIZE_STATE_UPDATE_IDNUM (nst);
				1145	}
				1146	} while (forms_identifier_p (pfile, false, nst));
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	1147	result = _cpp_interpret_identifier (pfile, base,
				1148	pfile->buffer->cur - base);
Zack Weinberg	2c3fcba	2001-09-10 22:34:03 +0000	[diff] [blame]	1149	}
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	1150	else
				1151	{
				1152	len = cur - base;
				1153	hash = HT_HASHFINISH (hash, len);
Zack Weinberg	2c3fcba	2001-09-10 22:34:03 +0000	[diff] [blame]	1154
Tom Tromey	2bf41bf	2008-02-20 02:16:43 +0000	[diff] [blame]	1155	result = CPP_HASHNODE (ht_lookup_with_hash (pfile->hash_table,
				1156	base, len, hash, HT_ALLOC));
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	1157	}
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1158
				1159	/* Rarely, identifiers require diagnostics when lexed. */
Zack Weinberg	2c3fcba	2001-09-10 22:34:03 +0000	[diff] [blame]	1160	if (__builtin_expect ((result->flags & NODE_DIAGNOSTIC)
				1161	&& !pfile->state.skipping, 0))
				1162	{
				1163	/* It is allowed to poison the same identifier twice. */
				1164	if ((result->flags & NODE_POISONED) && !pfile->state.poisoned_ok)
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	1165	cpp_error (pfile, CPP_DL_ERROR, "attempt to use poisoned \"%s\"",
Zack Weinberg	2c3fcba	2001-09-10 22:34:03 +0000	[diff] [blame]	1166	NODE_NAME (result));
				1167
				1168	/* Constraint 6.10.3.5: __VA_ARGS__ should only appear in the
				1169	replacement list of a variadic macro. */
				1170	if (result == pfile->spec_nodes.n__VA_ARGS__
				1171	&& !pfile->state.va_args_ok)
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	1172	cpp_error (pfile, CPP_DL_PEDWARN,
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1173	"__VA_ARGS__ can only appear in the expansion"
				1174	" of a C99 variadic macro");
Ian Lance Taylor	3d8b2a9	2009-06-12 19:43:25 +0000	[diff] [blame]	1175
				1176	/* For -Wc++-compat, warn about use of C++ named operators. */
				1177	if (result->flags & NODE_WARN_OPERATOR)
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	1178	cpp_warning (pfile, CPP_W_CXX_OPERATOR_NAMES,
				1179	"identifier \"%s\" is a special operator name in C++",
				1180	NODE_NAME (result));
Zack Weinberg	2c3fcba	2001-09-10 22:34:03 +0000	[diff] [blame]	1181	}
				1182
				1183	return result;
				1184	}
				1185
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1186	/* Lex a number to NUMBER starting at BUFFER->CUR - 1. */
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1187	static void
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1188	lex_number (cpp_reader pfile, cpp_string number,
				1189	struct normalize_state *nst)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1190	{
Neil Booth	562a5c2	2002-04-21 18:46:42 +0000	[diff] [blame]	1191	const uchar *cur;
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1192	const uchar *base;
				1193	uchar *dest;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1194
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1195	base = pfile->buffer->cur - 1;
				1196	do
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	1197	{
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1198	cur = pfile->buffer->cur;
Neil Booth	10cf9bd	2002-03-22 07:23:21 +0000	[diff] [blame]	1199
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1200	/* N.B. ISIDNUM does not include $. */
				1201	while (ISIDNUM (cur) \|\| cur == '.' \|\| VALID_SIGN (*cur, cur[-1]))
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1202	{
				1203	cur++;
				1204	NORMALIZE_STATE_UPDATE_IDNUM (nst);
				1205	}
Neil Booth	10cf9bd	2002-03-22 07:23:21 +0000	[diff] [blame]	1206
Neil Booth	10cf9bd	2002-03-22 07:23:21 +0000	[diff] [blame]	1207	pfile->buffer->cur = cur;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	1208	}
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	1209	while (forms_identifier_p (pfile, false, nst));
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1210
				1211	number->len = cur - base;
				1212	dest = _cpp_unaligned_alloc (pfile, number->len + 1);
				1213	memcpy (dest, base, number->len);
				1214	dest[number->len] = '\0';
				1215	number->text = dest;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1216	}
				1217
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1218	/* Create a token of type TYPE with a literal spelling. */
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1219	static void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1220	create_literal (cpp_reader pfile, cpp_token token, const uchar *base,
				1221	unsigned int len, enum cpp_ttype type)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1222	{
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1223	uchar *dest = _cpp_unaligned_alloc (pfile, len + 1);
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1224
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1225	memcpy (dest, base, len);
				1226	dest[len] = '\0';
				1227	token->type = type;
				1228	token->val.str.len = len;
				1229	token->val.str.text = dest;
				1230	}
				1231
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1232	/* Subroutine of lex_raw_string: Append LEN chars from BASE to the buffer
				1233	sequence from FIRST_BUFF_P to LAST_BUFF_P. /
				1234
				1235	static void
				1236	bufring_append (cpp_reader pfile, const uchar base, size_t len,
				1237	_cpp_buff first_buff_p, _cpp_buff last_buff_p)
				1238	{
				1239	_cpp_buff first_buff = first_buff_p;
				1240	_cpp_buff last_buff = last_buff_p;
				1241
				1242	if (first_buff == NULL)
				1243	first_buff = last_buff = _cpp_get_buff (pfile, len);
				1244	else if (len > BUFF_ROOM (last_buff))
				1245	{
				1246	size_t room = BUFF_ROOM (last_buff);
				1247	memcpy (BUFF_FRONT (last_buff), base, room);
				1248	BUFF_FRONT (last_buff) += room;
				1249	base += room;
				1250	len -= room;
				1251	last_buff = _cpp_append_extend_buff (pfile, last_buff, len);
				1252	}
				1253
				1254	memcpy (BUFF_FRONT (last_buff), base, len);
				1255	BUFF_FRONT (last_buff) += len;
				1256
				1257	*first_buff_p = first_buff;
				1258	*last_buff_p = last_buff;
				1259	}
				1260
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1261	/* Lexes a raw string. The stored string contains the spelling, including
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1262	double quotes, delimiter string, '(' and ')', any leading
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1263	'L', 'u', 'U' or 'u8' and 'R' modifier. It returns the type of the
				1264	literal, or CPP_OTHER if it was not properly terminated.
				1265
				1266	The spelling is NUL-terminated, but it is not guaranteed that this
				1267	is the first NUL since embedded NULs are preserved. */
				1268
				1269	static void
				1270	lex_raw_string (cpp_reader pfile, cpp_token token, const uchar *base,
				1271	const uchar *cur)
				1272	{
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1273	const uchar *raw_prefix;
				1274	unsigned int raw_prefix_len = 0;
				1275	enum cpp_ttype type;
				1276	size_t total_len = 0;
				1277	_cpp_buff first_buff = NULL, last_buff = NULL;
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1278	_cpp_line_note *note = &pfile->buffer->notes[pfile->buffer->cur_note];
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1279
				1280	type = (*base == 'L' ? CPP_WSTRING :
				1281	*base == 'U' ? CPP_STRING32 :
				1282	*base == 'u' ? (base[1] == '8' ? CPP_UTF8STRING : CPP_STRING16)
				1283	: CPP_STRING);
				1284
				1285	raw_prefix = cur + 1;
				1286	while (raw_prefix_len < 16)
				1287	{
				1288	switch (raw_prefix[raw_prefix_len])
				1289	{
Jason Merrill	5215062	2010-03-29 11:00:43 -0400	[diff] [blame]	1290	case ' ': case '(': case ')': case '\\': case '\t':
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1291	case '\v': case '\f': case '\n': default:
				1292	break;
				1293	/* Basic source charset except the above chars. */
				1294	case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
				1295	case 'g': case 'h': case 'i': case 'j': case 'k': case 'l':
				1296	case 'm': case 'n': case 'o': case 'p': case 'q': case 'r':
				1297	case 's': case 't': case 'u': case 'v': case 'w': case 'x':
				1298	case 'y': case 'z':
				1299	case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
				1300	case 'G': case 'H': case 'I': case 'J': case 'K': case 'L':
				1301	case 'M': case 'N': case 'O': case 'P': case 'Q': case 'R':
				1302	case 'S': case 'T': case 'U': case 'V': case 'W': case 'X':
				1303	case 'Y': case 'Z':
				1304	case '0': case '1': case '2': case '3': case '4': case '5':
				1305	case '6': case '7': case '8': case '9':
Jason Merrill	5215062	2010-03-29 11:00:43 -0400	[diff] [blame]	1306	case '_': case '{': case '}': case '#': case '[': case ']':
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1307	case '<': case '>': case '%': case ':': case ';': case '.':
				1308	case '?': case '*': case '+': case '-': case '/': case '^':
				1309	case '&': case '\|': case '~': case '!': case '=': case ',':
Jason Merrill	5215062	2010-03-29 11:00:43 -0400	[diff] [blame]	1310	case '"': case '\'':
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1311	raw_prefix_len++;
				1312	continue;
				1313	}
				1314	break;
				1315	}
				1316
Jason Merrill	5215062	2010-03-29 11:00:43 -0400	[diff] [blame]	1317	if (raw_prefix[raw_prefix_len] != '(')
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1318	{
				1319	int col = CPP_BUF_COLUMN (pfile->buffer, raw_prefix + raw_prefix_len)
				1320	+ 1;
				1321	if (raw_prefix_len == 16)
				1322	cpp_error_with_line (pfile, CPP_DL_ERROR, token->src_loc, col,
				1323	"raw string delimiter longer than 16 characters");
				1324	else
				1325	cpp_error_with_line (pfile, CPP_DL_ERROR, token->src_loc, col,
				1326	"invalid character '%c' in raw string delimiter",
				1327	(int) raw_prefix[raw_prefix_len]);
				1328	pfile->buffer->cur = raw_prefix - 1;
				1329	create_literal (pfile, token, base, raw_prefix - 1 - base, CPP_OTHER);
				1330	return;
				1331	}
				1332
				1333	cur = raw_prefix + raw_prefix_len + 1;
				1334	for (;;)
				1335	{
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1336	#define BUF_APPEND(STR,LEN) \
				1337	do { \
				1338	bufring_append (pfile, (const uchar *)(STR), (LEN), \
				1339	&first_buff, &last_buff); \
				1340	total_len += (LEN); \
				1341	} while (0);
				1342
				1343	cppchar_t c;
				1344
				1345	/* If we previously performed any trigraph or line splicing
				1346	transformations, undo them within the body of the raw string. */
				1347	while (note->pos < cur)
				1348	++note;
				1349	for (; note->pos == cur; ++note)
				1350	{
				1351	switch (note->type)
				1352	{
				1353	case '\\':
				1354	case ' ':
				1355	/* Restore backslash followed by newline. */
				1356	BUF_APPEND (base, cur - base);
				1357	base = cur;
				1358	BUF_APPEND ("\\", 1);
				1359	after_backslash:
				1360	if (note->type == ' ')
				1361	{
				1362	/* GNU backslash whitespace newline extension. FIXME
				1363	could be any sequence of non-vertical space. When we
				1364	can properly restore any such sequence, we should mark
				1365	this note as handled so _cpp_process_line_notes
				1366	doesn't warn. */
				1367	BUF_APPEND (" ", 1);
				1368	}
				1369
				1370	BUF_APPEND ("\n", 1);
				1371	break;
				1372
				1373	case 0:
				1374	/* Already handled. */
				1375	break;
				1376
				1377	default:
				1378	if (_cpp_trigraph_map[note->type])
				1379	{
				1380	/* Don't warn about this trigraph in
				1381	_cpp_process_line_notes, since trigraphs show up as
				1382	trigraphs in raw strings. */
Jakub Jelinek	d947ada	2010-04-06 09:02:40 +0200	[diff] [blame]	1383	uchar type = note->type;
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1384	note->type = 0;
				1385
				1386	if (!CPP_OPTION (pfile, trigraphs))
				1387	/* If we didn't convert the trigraph in the first
				1388	place, don't do anything now either. */
				1389	break;
				1390
				1391	BUF_APPEND (base, cur - base);
				1392	base = cur;
				1393	BUF_APPEND ("??", 2);
				1394
				1395	/* ??/ followed by newline gets two line notes, one for
				1396	the trigraph and one for the backslash/newline. */
				1397	if (type == '/' && note[1].pos == cur)
				1398	{
				1399	if (note[1].type != '\\'
				1400	&& note[1].type != ' ')
				1401	abort ();
				1402	BUF_APPEND ("/", 1);
				1403	++note;
				1404	goto after_backslash;
				1405	}
				1406	/* The ) from ??) could be part of the suffix. */
				1407	else if (type == ')'
				1408	&& strncmp ((const char *) cur+1,
				1409	(const char *) raw_prefix,
				1410	raw_prefix_len) == 0
				1411	&& cur[raw_prefix_len+1] == '"')
				1412	{
Jakub Jelinek	6cfae07	2011-04-24 01:32:09 +0200	[diff] [blame]	1413	BUF_APPEND (")", 1);
				1414	base++;
				1415	cur += raw_prefix_len + 2;
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1416	goto break_outer_loop;
				1417	}
				1418	else
				1419	{
				1420	/* Skip the replacement character. */
				1421	base = ++cur;
				1422	BUF_APPEND (&type, 1);
				1423	}
				1424	}
				1425	else
				1426	abort ();
				1427	break;
				1428	}
				1429	}
				1430	c = *cur++;
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1431
Jason Merrill	5215062	2010-03-29 11:00:43 -0400	[diff] [blame]	1432	if (c == ')'
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1433	&& strncmp ((const char ) cur, (const char ) raw_prefix,
				1434	raw_prefix_len) == 0
				1435	&& cur[raw_prefix_len] == '"')
				1436	{
				1437	cur += raw_prefix_len + 1;
				1438	break;
				1439	}
				1440	else if (c == '\n')
				1441	{
				1442	if (pfile->state.in_directive
				1443	\|\| pfile->state.parsing_args
				1444	\|\| pfile->state.in_deferred_pragma)
				1445	{
				1446	cur--;
				1447	type = CPP_OTHER;
				1448	cpp_error_with_line (pfile, CPP_DL_ERROR, token->src_loc, 0,
				1449	"unterminated raw string");
				1450	break;
				1451	}
				1452
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1453	BUF_APPEND (base, cur - base);
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1454
				1455	if (pfile->buffer->cur < pfile->buffer->rlimit)
				1456	CPP_INCREMENT_LINE (pfile, 0);
				1457	pfile->buffer->need_line = true;
				1458
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1459	pfile->buffer->cur = cur-1;
				1460	_cpp_process_line_notes (pfile, false);
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1461	if (!_cpp_get_fresh_line (pfile))
				1462	{
				1463	source_location src_loc = token->src_loc;
				1464	token->type = CPP_EOF;
				1465	/* Tell the compiler the line number of the EOF token. */
				1466	token->src_loc = pfile->line_table->highest_line;
				1467	token->flags = BOL;
				1468	if (first_buff != NULL)
				1469	_cpp_release_buff (pfile, first_buff);
				1470	cpp_error_with_line (pfile, CPP_DL_ERROR, src_loc, 0,
				1471	"unterminated raw string");
				1472	return;
				1473	}
				1474
				1475	cur = base = pfile->buffer->cur;
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1476	note = &pfile->buffer->notes[pfile->buffer->cur_note];
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1477	}
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1478	}
Jason Merrill	00a81b8	2010-03-29 16:07:29 -0400	[diff] [blame]	1479	break_outer_loop:
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1480
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1481	pfile->buffer->cur = cur;
				1482	if (first_buff == NULL)
				1483	create_literal (pfile, token, base, cur - base, type);
				1484	else
				1485	{
				1486	uchar *dest = _cpp_unaligned_alloc (pfile, total_len + (cur - base) + 1);
				1487
				1488	token->type = type;
				1489	token->val.str.len = total_len + (cur - base);
				1490	token->val.str.text = dest;
				1491	last_buff = first_buff;
				1492	while (last_buff != NULL)
				1493	{
				1494	memcpy (dest, last_buff->base,
				1495	BUFF_FRONT (last_buff) - last_buff->base);
				1496	dest += BUFF_FRONT (last_buff) - last_buff->base;
				1497	last_buff = last_buff->next;
				1498	}
				1499	_cpp_release_buff (pfile, first_buff);
				1500	memcpy (dest, base, cur - base);
				1501	dest[cur - base] = '\0';
				1502	}
				1503	}
				1504
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1505	/* Lexes a string, character constant, or angle-bracketed header file
				1506	name. The stored string contains the spelling, including opening
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1507	quote and any leading 'L', 'u', 'U' or 'u8' and optional
				1508	'R' modifier. It returns the type of the literal, or CPP_OTHER
				1509	if it was not properly terminated, or CPP_LESS for an unterminated
				1510	header name which must be relexed as normal tokens.
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1511
				1512	The spelling is NUL-terminated, but it is not guaranteed that this
				1513	is the first NUL since embedded NULs are preserved. */
				1514	static void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1515	lex_string (cpp_reader pfile, cpp_token token, const uchar *base)
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1516	{
				1517	bool saw_NUL = false;
				1518	const uchar *cur;
				1519	cppchar_t terminator;
				1520	enum cpp_ttype type;
				1521
				1522	cur = base;
				1523	terminator = *cur++;
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1524	if (terminator == 'L' \|\| terminator == 'U')
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1525	terminator = *cur++;
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1526	else if (terminator == 'u')
				1527	{
				1528	terminator = *cur++;
				1529	if (terminator == '8')
				1530	terminator = *cur++;
				1531	}
				1532	if (terminator == 'R')
				1533	{
				1534	lex_raw_string (pfile, token, base, cur);
				1535	return;
				1536	}
				1537	if (terminator == '"')
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	1538	type = (*base == 'L' ? CPP_WSTRING :
				1539	*base == 'U' ? CPP_STRING32 :
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	1540	*base == 'u' ? (base[1] == '8' ? CPP_UTF8STRING : CPP_STRING16)
				1541	: CPP_STRING);
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1542	else if (terminator == '\'')
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	1543	type = (*base == 'L' ? CPP_WCHAR :
				1544	*base == 'U' ? CPP_CHAR32 :
				1545	*base == 'u' ? CPP_CHAR16 : CPP_CHAR);
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1546	else
				1547	terminator = '>', type = CPP_HEADER_NAME;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	1548
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1549	for (;;)
				1550	{
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1551	cppchar_t c = *cur++;
Neil Booth	7868b4a	2001-03-04 12:02:02 +0000	[diff] [blame]	1552
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	1553	/* In #include-style directives, terminators are not escapable. */
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1554	if (c == '\\' && !pfile->state.angled_headers && *cur != '\n')
				1555	cur++;
				1556	else if (c == terminator)
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	1557	break;
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1558	else if (c == '\n')
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1559	{
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1560	cur--;
Joseph Myers	4bb09c2	2009-02-21 21:25:39 +0000	[diff] [blame]	1561	/* Unmatched quotes always yield undefined behavior, but
				1562	greedy lexing means that what appears to be an unterminated
				1563	header name may actually be a legitimate sequence of tokens. */
				1564	if (terminator == '>')
				1565	{
				1566	token->type = CPP_LESS;
				1567	return;
				1568	}
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1569	type = CPP_OTHER;
				1570	break;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1571	}
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1572	else if (c == '\0')
				1573	saw_NUL = true;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1574	}
				1575
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1576	if (saw_NUL && !pfile->state.skipping)
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	1577	cpp_error (pfile, CPP_DL_WARNING,
				1578	"null character(s) preserved in literal");
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1579
Joseph Myers	c663e30	2006-09-13 02:04:18 +0100	[diff] [blame]	1580	if (type == CPP_OTHER && CPP_OPTION (pfile, lang) != CLK_ASM)
				1581	cpp_error (pfile, CPP_DL_PEDWARN, "missing terminating %c character",
				1582	(int) terminator);
				1583
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	1584	pfile->buffer->cur = cur;
				1585	create_literal (pfile, token, base, cur - base, type);
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1586	}
				1587
Matthew Gingell	631d0d3	2008-10-05 12:35:36 +0000	[diff] [blame]	1588	/* Return the comment table. The client may not make any assumption
				1589	about the ordering of the table. */
				1590	cpp_comment_table *
				1591	cpp_get_comments (cpp_reader *pfile)
				1592	{
				1593	return &pfile->comments;
				1594	}
				1595
				1596	/* Append a comment to the end of the comment table. */
				1597	static void
				1598	store_comment (cpp_reader pfile, cpp_token token)
				1599	{
				1600	int len;
				1601
				1602	if (pfile->comments.allocated == 0)
				1603	{
				1604	pfile->comments.allocated = 256;
				1605	pfile->comments.entries = (cpp_comment *) xmalloc
				1606	(pfile->comments.allocated * sizeof (cpp_comment));
				1607	}
				1608
				1609	if (pfile->comments.count == pfile->comments.allocated)
				1610	{
				1611	pfile->comments.allocated *= 2;
				1612	pfile->comments.entries = (cpp_comment *) xrealloc
				1613	(pfile->comments.entries,
				1614	pfile->comments.allocated * sizeof (cpp_comment));
				1615	}
				1616
				1617	len = token->val.str.len;
				1618
				1619	/* Copy comment. Note, token may not be NULL terminated. */
				1620	pfile->comments.entries[pfile->comments.count].comment =
				1621	(char ) xmalloc (sizeof (char) (len + 1));
				1622	memcpy (pfile->comments.entries[pfile->comments.count].comment,
				1623	token->val.str.text, len);
				1624	pfile->comments.entries[pfile->comments.count].comment[len] = '\0';
				1625
				1626	/* Set source location. */
				1627	pfile->comments.entries[pfile->comments.count].sloc = token->src_loc;
				1628
				1629	/* Increment the count of entries in the comment table. */
				1630	pfile->comments.count++;
				1631	}
				1632
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	1633	/* The stored comment includes the comment start and any terminator. */
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1634	static void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1635	save_comment (cpp_reader pfile, cpp_token token, const unsigned char *from,
				1636	cppchar_t type)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	1637	{
Neil Booth	5d7ee2f	2000-05-10 09:39:18 +0000	[diff] [blame]	1638	unsigned char *buffer;
Kai Tietz	651a20b	2010-11-16 19:50:17 +0000	[diff] [blame]	1639	unsigned int len, clen, i;
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	1640
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	1641	len = pfile->buffer->cur - from + 1; /* + 1 for the initial '/'. */
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	1642
Neil Booth	3542203	2000-10-29 09:56:00 +0000	[diff] [blame]	1643	/* C++ comments probably (not definitely) have moved past a new
				1644	line, which we don't want to save in the comment. */
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	1645	if (is_vspace (pfile->buffer->cur[-1]))
Neil Booth	3542203	2000-10-29 09:56:00 +0000	[diff] [blame]	1646	len--;
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1647
Kai Tietz	651a20b	2010-11-16 19:50:17 +0000	[diff] [blame]	1648	/* If we are currently in a directive or in argument parsing, then
				1649	we need to store all C++ comments as C comments internally, and
				1650	so we need to allocate a little extra space in that case.
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1651
				1652	Note that the only time we encounter a directive here is
				1653	when we are saving comments in a "#define". */
Kai Tietz	651a20b	2010-11-16 19:50:17 +0000	[diff] [blame]	1654	clen = ((pfile->state.in_directive \|\| pfile->state.parsing_args)
				1655	&& type == '/') ? len + 2 : len;
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1656
				1657	buffer = _cpp_unaligned_alloc (pfile, clen);
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	1658
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1659	token->type = CPP_COMMENT;
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1660	token->val.str.len = clen;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1661	token->val.str.text = buffer;
Neil Booth	d1d9a6b	2000-05-27 23:19:56 +0000	[diff] [blame]	1662
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	1663	buffer[0] = '/';
				1664	memcpy (buffer + 1, from, len - 1);
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1665
Kazu Hirata	1eeeb6a	2002-04-30 20:48:55 +0000	[diff] [blame]	1666	/* Finish conversion to a C comment, if necessary. */
Kai Tietz	651a20b	2010-11-16 19:50:17 +0000	[diff] [blame]	1667	if ((pfile->state.in_directive \|\| pfile->state.parsing_args) && type == '/')
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1668	{
				1669	buffer[1] = '*';
				1670	buffer[clen - 2] = '*';
				1671	buffer[clen - 1] = '/';
Kai Tietz	651a20b	2010-11-16 19:50:17 +0000	[diff] [blame]	1672	/* As there can be in a C++ comments illegal sequences for C comments
				1673	we need to filter them out. */
				1674	for (i = 2; i < (clen - 2); i++)
				1675	if (buffer[i] == '/' && (buffer[i - 1] == '' \|\| buffer[i + 1] == ''))
				1676	buffer[i] = '\|';
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	1677	}
Matthew Gingell	631d0d3	2008-10-05 12:35:36 +0000	[diff] [blame]	1678
				1679	/* Finally store this comment for use by clients of libcpp. */
				1680	store_comment (pfile, token);
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1681	}
				1682
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1683	/* Allocate COUNT tokens for RUN. */
				1684	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1685	_cpp_init_tokenrun (tokenrun *run, unsigned int count)
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1686	{
Bernardo Innocenti	72bb2c3	2004-07-24 20:04:42 +0200	[diff] [blame]	1687	run->base = XNEWVEC (cpp_token, count);
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1688	run->limit = run->base + count;
				1689	run->next = NULL;
				1690	}
				1691
				1692	/* Returns the next tokenrun, or creates one if there is none. */
				1693	static tokenrun *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1694	next_tokenrun (tokenrun *run)
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1695	{
				1696	if (run->next == NULL)
				1697	{
Bernardo Innocenti	72bb2c3	2004-07-24 20:04:42 +0200	[diff] [blame]	1698	run->next = XNEW (tokenrun);
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1699	run->next->prev = run;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1700	_cpp_init_tokenrun (run->next, 250);
				1701	}
				1702
				1703	return run->next;
				1704	}
				1705
Dodji Seketeli	ad2305a	2011-10-22 17:49:18 +0000	[diff] [blame^]	1706	/* Return the number of not yet processed token in a given
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1707	context. */
				1708	int
Dodji Seketeli	ad2305a	2011-10-22 17:49:18 +0000	[diff] [blame^]	1709	_cpp_remaining_tokens_num_in_context (cpp_context *context)
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1710	{
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1711	if (context->tokens_kind == TOKENS_KIND_DIRECT)
Dodji Seketeli	cbbcf65	2011-10-20 08:49:29 +0000	[diff] [blame]	1712	return (LAST (context).token - FIRST (context).token);
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1713	else if (context->tokens_kind == TOKENS_KIND_INDIRECT
				1714	\|\| context->tokens_kind == TOKENS_KIND_EXTENDED)
Dodji Seketeli	cbbcf65	2011-10-20 08:49:29 +0000	[diff] [blame]	1715	return (LAST (context).ptoken - FIRST (context).ptoken);
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1716	else
				1717	abort ();
				1718	}
				1719
Dodji Seketeli	ad2305a	2011-10-22 17:49:18 +0000	[diff] [blame^]	1720	/* Returns the token present at index INDEX in a given context. If
				1721	INDEX is zero, the next token to be processed is returned. */
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1722	static const cpp_token*
Dodji Seketeli	ad2305a	2011-10-22 17:49:18 +0000	[diff] [blame^]	1723	_cpp_token_from_context_at (cpp_context *context, int index)
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1724	{
Tom Tromey	92582b7	2011-10-17 09:59:12 +0000	[diff] [blame]	1725	if (context->tokens_kind == TOKENS_KIND_DIRECT)
				1726	return &(FIRST (context).token[index]);
				1727	else if (context->tokens_kind == TOKENS_KIND_INDIRECT
				1728	\|\| context->tokens_kind == TOKENS_KIND_EXTENDED)
				1729	return FIRST (context).ptoken[index];
				1730	else
				1731	abort ();
				1732	}
				1733
Ben Elliston	5950c3c	2008-07-14 05:09:48 +0000	[diff] [blame]	1734	/* Look ahead in the input stream. */
				1735	const cpp_token *
				1736	cpp_peek_token (cpp_reader *pfile, int index)
				1737	{
				1738	cpp_context *context = pfile->context;
				1739	const cpp_token *peektok;
				1740	int count;
				1741
				1742	/* First, scan through any pending cpp_context objects. */
				1743	while (context->prev)
				1744	{
Dodji Seketeli	ad2305a	2011-10-22 17:49:18 +0000	[diff] [blame^]	1745	ptrdiff_t sz = _cpp_remaining_tokens_num_in_context (context);
Ben Elliston	5950c3c	2008-07-14 05:09:48 +0000	[diff] [blame]	1746
				1747	if (index < (int) sz)
Dodji Seketeli	ad2305a	2011-10-22 17:49:18 +0000	[diff] [blame^]	1748	return _cpp_token_from_context_at (context, index);
Ben Elliston	5950c3c	2008-07-14 05:09:48 +0000	[diff] [blame]	1749	index -= (int) sz;
				1750	context = context->prev;
				1751	}
				1752
				1753	/* We will have to read some new tokens after all (and do so
				1754	without invalidating preceding tokens). */
				1755	count = index;
				1756	pfile->keep_tokens++;
				1757
				1758	do
				1759	{
				1760	peektok = _cpp_lex_token (pfile);
				1761	if (peektok->type == CPP_EOF)
				1762	return peektok;
				1763	}
				1764	while (index--);
				1765
				1766	_cpp_backup_tokens_direct (pfile, count + 1);
				1767	pfile->keep_tokens--;
				1768
				1769	return peektok;
				1770	}
				1771
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	1772	/* Allocate a single token that is invalidated at the same time as the
				1773	rest of the tokens on the line. Has its line and col set to the
				1774	same as the last lexed token, so that diagnostics appear in the
				1775	right place. */
				1776	cpp_token *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1777	_cpp_temp_token (cpp_reader *pfile)
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	1778	{
				1779	cpp_token old, result;
Ben Elliston	5950c3c	2008-07-14 05:09:48 +0000	[diff] [blame]	1780	ptrdiff_t sz = pfile->cur_run->limit - pfile->cur_token;
				1781	ptrdiff_t la = (ptrdiff_t) pfile->lookaheads;
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	1782
				1783	old = pfile->cur_token - 1;
Ben Elliston	5950c3c	2008-07-14 05:09:48 +0000	[diff] [blame]	1784	/* Any pre-existing lookaheads must not be clobbered. */
				1785	if (la)
				1786	{
				1787	if (sz <= la)
				1788	{
				1789	tokenrun *next = next_tokenrun (pfile->cur_run);
				1790
				1791	if (sz < la)
				1792	memmove (next->base + 1, next->base,
				1793	(la - sz) * sizeof (cpp_token));
				1794
				1795	next->base[0] = pfile->cur_run->limit[-1];
				1796	}
				1797
				1798	if (sz > 1)
				1799	memmove (pfile->cur_token + 1, pfile->cur_token,
				1800	MIN (la, sz - 1) * sizeof (cpp_token));
				1801	}
				1802
				1803	if (!sz && pfile->cur_token == pfile->cur_run->limit)
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	1804	{
				1805	pfile->cur_run = next_tokenrun (pfile->cur_run);
				1806	pfile->cur_token = pfile->cur_run->base;
				1807	}
				1808
				1809	result = pfile->cur_token++;
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	1810	result->src_loc = old->src_loc;
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	1811	return result;
				1812	}
				1813
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1814	/* Lex a token into RESULT (external interface). Takes care of issues
				1815	like directive handling, token lookahead, multiple include
Joseph Myers	a1f300c	2001-11-23 02:05:19 +0000	[diff] [blame]	1816	optimization and skipping. */
Neil Booth	345894b	2001-09-16 13:44:29 +0000	[diff] [blame]	1817	const cpp_token *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1818	_cpp_lex_token (cpp_reader *pfile)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1819	{
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1820	cpp_token *result;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1821
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1822	for (;;)
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1823	{
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1824	if (pfile->cur_token == pfile->cur_run->limit)
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1825	{
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1826	pfile->cur_run = next_tokenrun (pfile->cur_run);
				1827	pfile->cur_token = pfile->cur_run->base;
				1828	}
Tom Tromey	ee38036	2007-01-30 15:46:01 +0000	[diff] [blame]	1829	/* We assume that the current token is somewhere in the current
				1830	run. */
				1831	if (pfile->cur_token < pfile->cur_run->base
				1832	\|\| pfile->cur_token >= pfile->cur_run->limit)
				1833	abort ();
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1834
				1835	if (pfile->lookaheads)
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1836	{
				1837	pfile->lookaheads--;
				1838	result = pfile->cur_token++;
				1839	}
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1840	else
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1841	result = _cpp_lex_direct (pfile);
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1842
				1843	if (result->flags & BOL)
				1844	{
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1845	/* Is this a directive. If _cpp_handle_directive returns
				1846	false, it is an assembler #. */
				1847	if (result->type == CPP_HASH
Neil Booth	e808ec9	2002-02-27 07:24:53 +0000	[diff] [blame]	1848	/* 6.10.3 p 11: Directives in a list of macro arguments
				1849	gives undefined behavior. This implementation
				1850	handles the directive as normal. */
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	1851	&& pfile->state.parsing_args != 1)
Zack Weinberg	21b1149	2004-09-09 19:16:56 +0000	[diff] [blame]	1852	{
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	1853	if (_cpp_handle_directive (pfile, result->flags & PREV_WHITE))
Zack Weinberg	21b1149	2004-09-09 19:16:56 +0000	[diff] [blame]	1854	{
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	1855	if (pfile->directive_result.type == CPP_PADDING)
				1856	continue;
Zack Weinberg	21b1149	2004-09-09 19:16:56 +0000	[diff] [blame]	1857	result = &pfile->directive_result;
Zack Weinberg	21b1149	2004-09-09 19:16:56 +0000	[diff] [blame]	1858	}
				1859	}
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	1860	else if (pfile->state.in_deferred_pragma)
				1861	result = &pfile->directive_result;
Zack Weinberg	21b1149	2004-09-09 19:16:56 +0000	[diff] [blame]	1862
Neil Booth	9729389	2001-09-14 22:04:46 +0000	[diff] [blame]	1863	if (pfile->cb.line_change && !pfile->state.skipping)
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1864	pfile->cb.line_change (pfile, result, pfile->state.parsing_args);
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1865	}
				1866
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1867	/* We don't skip tokens in directives. */
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	1868	if (pfile->state.in_directive \|\| pfile->state.in_deferred_pragma)
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1869	break;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1870
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1871	/* Outside a directive, invalidate controlling macros. At file
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1872	EOF, _cpp_lex_direct takes care of popping the buffer, so we never
Kazu Hirata	6356f89	2003-06-12 19:01:08 +0000	[diff] [blame]	1873	get here and MI optimization works. */
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1874	pfile->mi_valid = false;
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	1875
				1876	if (!pfile->state.skipping \|\| result->type == CPP_EOF)
				1877	break;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1878	}
				1879
Neil Booth	345894b	2001-09-16 13:44:29 +0000	[diff] [blame]	1880	return result;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1881	}
				1882
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1883	/* Returns true if a fresh line has been loaded. */
				1884	bool
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1885	_cpp_get_fresh_line (cpp_reader *pfile)
Neil Booth	004cb26	2002-05-17 20:16:48 +0000	[diff] [blame]	1886	{
Per Bothner	22234f5	2004-02-18 14:02:39 -0800	[diff] [blame]	1887	int return_at_eof;
				1888
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1889	/* We can't get a new line until we leave the current directive. */
				1890	if (pfile->state.in_directive)
				1891	return false;
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	1892
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1893	for (;;)
Neil Booth	1a76916	2002-06-11 05:36:17 +0000	[diff] [blame]	1894	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1895	cpp_buffer *buffer = pfile->buffer;
				1896
				1897	if (!buffer->need_line)
				1898	return true;
				1899
				1900	if (buffer->next_line < buffer->rlimit)
				1901	{
				1902	_cpp_clean_line (pfile);
				1903	return true;
				1904	}
				1905
				1906	/* First, get out of parsing arguments state. */
				1907	if (pfile->state.parsing_args)
Neil Booth	1a76916	2002-06-11 05:36:17 +0000	[diff] [blame]	1908	return false;
				1909
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1910	/* End of buffer. Non-empty files should end in a newline. */
				1911	if (buffer->buf != buffer->rlimit
				1912	&& buffer->next_line > buffer->rlimit
				1913	&& !buffer->from_stage3)
Neil Booth	004cb26	2002-05-17 20:16:48 +0000	[diff] [blame]	1914	{
Dave Korn	ed0e74e	2007-05-31 02:06:48 +0000	[diff] [blame]	1915	/* Clip to buffer size. */
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1916	buffer->next_line = buffer->rlimit;
Neil Booth	004cb26	2002-05-17 20:16:48 +0000	[diff] [blame]	1917	}
Per Bothner	22234f5	2004-02-18 14:02:39 -0800	[diff] [blame]	1918
				1919	return_at_eof = buffer->return_at_eof;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1920	_cpp_pop_buffer (pfile);
Per Bothner	22234f5	2004-02-18 14:02:39 -0800	[diff] [blame]	1921	if (pfile->buffer == NULL \|\| return_at_eof)
Per Bothner	a506c55	2003-10-02 07:20:38 +0000	[diff] [blame]	1922	return false;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1923	}
Neil Booth	004cb26	2002-05-17 20:16:48 +0000	[diff] [blame]	1924	}
				1925
/* Set result->type to THEN_TYPE and consume one character if the next
   character in the buffer is CHAR; otherwise set it to ELSE_TYPE and
   consume nothing.  Expands to a single statement.  Relies on
   variables named `buffer' and `result' being in scope at the point
   of use.  */
#define IF_NEXT_IS(CHAR, THEN_TYPE, ELSE_TYPE)          \
  do                                                    \
    {                                                   \
      result->type = (ELSE_TYPE);                       \
      if (*buffer->cur == (CHAR))                       \
        buffer->cur++, result->type = (THEN_TYPE);      \
    }                                                   \
  while (0)
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	1934
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1935	/* Lex a token into pfile->cur_token, which is also incremented, to
				1936	get diagnostics pointing to the correct location.
				1937
				1938	Does not handle issues such as token lookahead, multiple-include
Kazu Hirata	f1ba665	2003-06-28 19:43:01 +0000	[diff] [blame]	1939	optimization, directives, skipping etc. This function is only
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1940	suitable for use by _cpp_lex_token, and in special cases like
				1941	lex_expansion_token which doesn't care for any of these issues.
				1942
				1943	When meeting a newline, returns CPP_EOF if parsing a directive,
				1944	otherwise returns to the start of the token buffer if permissible.
				1945	Returns the location of the lexed token. */
				1946	cpp_token *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	1947	_cpp_lex_direct (cpp_reader *pfile)
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1948	{
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1949	cppchar_t c;
Neil Booth	adb84b4	2000-11-08 23:08:07 +0000	[diff] [blame]	1950	cpp_buffer *buffer;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1951	const unsigned char *comment_start;
Neil Booth	14baae0	2001-09-17 18:26:12 +0000	[diff] [blame]	1952	cpp_token *result = pfile->cur_token++;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1953
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1954	fresh_line:
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1955	result->flags = 0;
Per Bothner	2be570f	2003-08-28 18:07:42 -0700	[diff] [blame]	1956	buffer = pfile->buffer;
Per Bothner	a506c55	2003-10-02 07:20:38 +0000	[diff] [blame]	1957	if (buffer->need_line)
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1958	{
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	1959	if (pfile->state.in_deferred_pragma)
				1960	{
				1961	result->type = CPP_PRAGMA_EOL;
				1962	pfile->state.in_deferred_pragma = false;
				1963	if (!pfile->state.pragma_allow_expansion)
				1964	pfile->state.prevent_expansion--;
				1965	return result;
				1966	}
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1967	if (!_cpp_get_fresh_line (pfile))
				1968	{
				1969	result->type = CPP_EOF;
Neil Booth	9ff7868	2003-04-26 21:03:51 +0000	[diff] [blame]	1970	if (!pfile->state.in_directive)
				1971	{
				1972	/* Tell the compiler the line number of the EOF token. */
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	1973	result->src_loc = pfile->line_table->highest_line;
Neil Booth	9ff7868	2003-04-26 21:03:51 +0000	[diff] [blame]	1974	result->flags = BOL;
				1975	}
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1976	return result;
				1977	}
				1978	if (!pfile->keep_tokens)
				1979	{
				1980	pfile->cur_run = &pfile->base_run;
				1981	result = pfile->base_run.base;
				1982	pfile->cur_token = result + 1;
				1983	}
				1984	result->flags = BOL;
				1985	if (pfile->state.parsing_args == 2)
				1986	result->flags \|= PREV_WHITE;
				1987	}
Per Bothner	a506c55	2003-10-02 07:20:38 +0000	[diff] [blame]	1988	buffer = pfile->buffer;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1989	update_tokens_line:
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	1990	result->src_loc = pfile->line_table->highest_line;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	1991
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	1992	skipped_white:
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1993	if (buffer->cur >= buffer->notes[buffer->cur_note].pos
				1994	&& !pfile->overlaid_buffer)
				1995	{
				1996	_cpp_process_line_notes (pfile, false);
Per Bothner	500bee0	2004-04-22 19:22:27 -0700	[diff] [blame]	1997	result->src_loc = pfile->line_table->highest_line;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	1998	}
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	1999	c = *buffer->cur++;
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	2000
Gabriel Charette	e3dfef4	2011-08-22 20:41:07 +0000	[diff] [blame]	2001	if (pfile->forced_token_location_p)
				2002	result->src_loc = *pfile->forced_token_location_p;
				2003	else
				2004	result->src_loc = linemap_position_for_column (pfile->line_table,
				2005	CPP_BUF_COLUMN (buffer, buffer->cur));
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	2006
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2007	switch (c)
				2008	{
Neil Booth	4d6baaf	2001-11-26 23:44:54 +0000	[diff] [blame]	2009	case ' ': case '\t': case '\f': case '\v': case '\0':
				2010	result->flags \|= PREV_WHITE;
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	2011	skip_whitespace (pfile, c);
				2012	goto skipped_white;
Neil Booth	4d6baaf	2001-11-26 23:44:54 +0000	[diff] [blame]	2013
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	2014	case '\n':
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	2015	if (buffer->cur < buffer->rlimit)
				2016	CPP_INCREMENT_LINE (pfile, 0);
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	2017	buffer->need_line = true;
				2018	goto fresh_line;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2019
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2020	case '0': case '1': case '2': case '3': case '4':
				2021	case '5': case '6': case '7': case '8': case '9':
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2022	{
				2023	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
				2024	result->type = CPP_NUMBER;
				2025	lex_number (pfile, &result->val.str, &nst);
				2026	warn_about_normalization (pfile, result, &nst);
				2027	break;
				2028	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2029
Neil Booth	0abc6a6	2001-11-27 22:31:34 +0000	[diff] [blame]	2030	case 'L':
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	2031	case 'u':
				2032	case 'U':
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	2033	case 'R':
				2034	/* 'L', 'u', 'U', 'u8' or 'R' may introduce wide characters,
				2035	wide strings or raw strings. */
Joseph Myers	a48e3dd	2011-08-18 16:13:49 +0100	[diff] [blame]	2036	if (c == 'L' \|\| CPP_OPTION (pfile, rliterals)
				2037	\|\| (c != 'R' && CPP_OPTION (pfile, uliterals)))
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	2038	{
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	2039	if ((*buffer->cur == '\'' && c != 'R')
				2040	\|\| *buffer->cur == '"'
				2041	\|\| (*buffer->cur == 'R'
				2042	&& c != 'R'
				2043	&& buffer->cur[1] == '"'
Joseph Myers	a48e3dd	2011-08-18 16:13:49 +0100	[diff] [blame]	2044	&& CPP_OPTION (pfile, rliterals))
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	2045	\|\| (*buffer->cur == '8'
				2046	&& c == 'u'
				2047	&& (buffer->cur[1] == '"'
Joseph Myers	a48e3dd	2011-08-18 16:13:49 +0100	[diff] [blame]	2048	\|\| (buffer->cur[1] == 'R' && buffer->cur[2] == '"'
				2049	&& CPP_OPTION (pfile, rliterals)))))
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	2050	{
				2051	lex_string (pfile, result, buffer->cur - 1);
				2052	break;
				2053	}
Neil Booth	bced6ed	2003-04-19 11:59:44 +0000	[diff] [blame]	2054	}
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	2055	/* Fall through. */
Neil Booth	0abc6a6	2001-11-27 22:31:34 +0000	[diff] [blame]	2056
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2057	case '_':
				2058	case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
				2059	case 'g': case 'h': case 'i': case 'j': case 'k': case 'l':
				2060	case 'm': case 'n': case 'o': case 'p': case 'q': case 'r':
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	2061	case 's': case 't': case 'v': case 'w': case 'x':
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2062	case 'y': case 'z':
				2063	case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
Neil Booth	0abc6a6	2001-11-27 22:31:34 +0000	[diff] [blame]	2064	case 'G': case 'H': case 'I': case 'J': case 'K':
Jakub Jelinek	2c6e3f5	2009-10-19 23:41:15 +0200	[diff] [blame]	2065	case 'M': case 'N': case 'O': case 'P': case 'Q':
Kris Van Hees	b6baa67	2008-04-18 13:58:08 +0000	[diff] [blame]	2066	case 'S': case 'T': case 'V': case 'W': case 'X':
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2067	case 'Y': case 'Z':
				2068	result->type = CPP_NAME;
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2069	{
				2070	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2071	result->val.node.node = lex_identifier (pfile, buffer->cur - 1, false,
				2072	&nst);
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2073	warn_about_normalization (pfile, result, &nst);
				2074	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2075
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2076	/* Convert named operators to their proper types. */
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2077	if (result->val.node.node->flags & NODE_OPERATOR)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2078	{
				2079	result->flags \|= NAMED_OP;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2080	result->type = (enum cpp_ttype) result->val.node.node->directive_index;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2081	}
				2082	break;
				2083
				2084	case '\'':
				2085	case '"':
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2086	lex_string (pfile, result, buffer->cur - 1);
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2087	break;
				2088
				2089	case '/':
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2090	/* A potential block or line comment. */
				2091	comment_start = buffer->cur;
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2092	c = *buffer->cur;
				2093
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2094	if (c == '*')
				2095	{
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	2096	if (_cpp_skip_block_comment (pfile))
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	2097	cpp_error (pfile, CPP_DL_ERROR, "unterminated comment");
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2098	}
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2099	else if (c == '/' && (CPP_OPTION (pfile, cplusplus_comments)
Per Bothner	12f9df4	2004-02-11 07:29:30 -0800	[diff] [blame]	2100	\|\| cpp_in_system_header (pfile)))
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2101	{
Neil Booth	bdb05a7	2000-11-26 17:31:13 +0000	[diff] [blame]	2102	/* Warn about comments only if pedantically GNUC89, and not
				2103	in system headers. */
				2104	if (CPP_OPTION (pfile, lang) == CLK_GNUC89 && CPP_PEDANTIC (pfile)
Neil Booth	a94c119	2000-09-25 23:35:10 +0000	[diff] [blame]	2105	&& ! buffer->warned_cplusplus_comments)
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2106	{
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	2107	cpp_error (pfile, CPP_DL_PEDWARN,
Gabriel Dos Reis	5650830	2002-07-21 21:35:17 +0000	[diff] [blame]	2108	"C++ style comments are not allowed in ISO C90");
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	2109	cpp_error (pfile, CPP_DL_PEDWARN,
Neil Booth	ebef4e8	2002-04-14 18:42:47 +0000	[diff] [blame]	2110	"(this will be reported only once per input file)");
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2111	buffer->warned_cplusplus_comments = 1;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2112	}
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2113
Jakub Jelinek	01ef656	2001-04-11 11:43:10 +0200	[diff] [blame]	2114	if (skip_line_comment (pfile) && CPP_OPTION (pfile, warn_comments))
Simon Baldwin	87cf065	2010-04-07 17:18:10 +0000	[diff] [blame]	2115	cpp_warning (pfile, CPP_W_COMMENTS, "multi-line comment");
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2116	}
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2117	else if (c == '=')
				2118	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2119	buffer->cur++;
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2120	result->type = CPP_DIV_EQ;
				2121	break;
				2122	}
				2123	else
				2124	{
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2125	result->type = CPP_DIV;
				2126	break;
				2127	}
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2128
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2129	if (!pfile->state.save_comments)
				2130	{
				2131	result->flags \|= PREV_WHITE;
Neil Booth	5fddcff	2001-09-11 07:00:12 +0000	[diff] [blame]	2132	goto update_tokens_line;
Neil Booth	1c6d33e	2000-09-25 22:39:51 +0000	[diff] [blame]	2133	}
				2134
				2135	/* Save the comment as a token in its own right. */
Jason Thorpe	477cdac	2002-04-07 03:12:23 +0000	[diff] [blame]	2136	save_comment (pfile, result, comment_start, c);
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	2137	break;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2138
				2139	case '<':
				2140	if (pfile->state.angled_headers)
				2141	{
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2142	lex_string (pfile, result, buffer->cur - 1);
Joseph Myers	4bb09c2	2009-02-21 21:25:39 +0000	[diff] [blame]	2143	if (result->type != CPP_LESS)
				2144	break;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2145	}
				2146
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2147	result->type = CPP_LESS;
				2148	if (*buffer->cur == '=')
				2149	buffer->cur++, result->type = CPP_LESS_EQ;
				2150	else if (*buffer->cur == '<')
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2151	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2152	buffer->cur++;
				2153	IF_NEXT_IS ('=', CPP_LSHIFT_EQ, CPP_LSHIFT);
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2154	}
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2155	else if (CPP_OPTION (pfile, digraphs))
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2156	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2157	if (*buffer->cur == ':')
				2158	{
				2159	buffer->cur++;
				2160	result->flags \|= DIGRAPH;
				2161	result->type = CPP_OPEN_SQUARE;
				2162	}
				2163	else if (*buffer->cur == '%')
				2164	{
				2165	buffer->cur++;
				2166	result->flags \|= DIGRAPH;
				2167	result->type = CPP_OPEN_BRACE;
				2168	}
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2169	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2170	break;
				2171
				2172	case '>':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2173	result->type = CPP_GREATER;
				2174	if (*buffer->cur == '=')
				2175	buffer->cur++, result->type = CPP_GREATER_EQ;
				2176	else if (*buffer->cur == '>')
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2177	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2178	buffer->cur++;
				2179	IF_NEXT_IS ('=', CPP_RSHIFT_EQ, CPP_RSHIFT);
				2180	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2181	break;
				2182
Neil Booth	cbcff6d	2000-09-23 21:41:41 +0000	[diff] [blame]	2183	case '%':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2184	result->type = CPP_MOD;
				2185	if (*buffer->cur == '=')
				2186	buffer->cur++, result->type = CPP_MOD_EQ;
				2187	else if (CPP_OPTION (pfile, digraphs))
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2188	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2189	if (*buffer->cur == ':')
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2190	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2191	buffer->cur++;
				2192	result->flags \|= DIGRAPH;
				2193	result->type = CPP_HASH;
				2194	if (*buffer->cur == '%' && buffer->cur[1] == ':')
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2195	buffer->cur += 2, result->type = CPP_PASTE, result->val.token_no = 0;
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2196	}
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2197	else if (*buffer->cur == '>')
				2198	{
				2199	buffer->cur++;
				2200	result->flags \|= DIGRAPH;
				2201	result->type = CPP_CLOSE_BRACE;
				2202	}
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2203	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2204	break;
				2205
Neil Booth	cbcff6d	2000-09-23 21:41:41 +0000	[diff] [blame]	2206	case '.':
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2207	result->type = CPP_DOT;
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2208	if (ISDIGIT (*buffer->cur))
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2209	{
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2210	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2211	result->type = CPP_NUMBER;
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2212	lex_number (pfile, &result->val.str, &nst);
				2213	warn_about_normalization (pfile, result, &nst);
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2214	}
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2215	else if (*buffer->cur == '.' && buffer->cur[1] == '.')
				2216	buffer->cur += 2, result->type = CPP_ELLIPSIS;
				2217	else if (buffer->cur == '' && CPP_OPTION (pfile, cplusplus))
				2218	buffer->cur++, result->type = CPP_DOT_STAR;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2219	break;
				2220
				2221	case '+':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2222	result->type = CPP_PLUS;
				2223	if (*buffer->cur == '+')
				2224	buffer->cur++, result->type = CPP_PLUS_PLUS;
				2225	else if (*buffer->cur == '=')
				2226	buffer->cur++, result->type = CPP_PLUS_EQ;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2227	break;
				2228
				2229	case '-':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2230	result->type = CPP_MINUS;
				2231	if (*buffer->cur == '>')
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2232	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2233	buffer->cur++;
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2234	result->type = CPP_DEREF;
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2235	if (buffer->cur == '' && CPP_OPTION (pfile, cplusplus))
				2236	buffer->cur++, result->type = CPP_DEREF_STAR;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2237	}
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2238	else if (*buffer->cur == '-')
				2239	buffer->cur++, result->type = CPP_MINUS_MINUS;
				2240	else if (*buffer->cur == '=')
				2241	buffer->cur++, result->type = CPP_MINUS_EQ;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2242	break;
				2243
				2244	case '&':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2245	result->type = CPP_AND;
				2246	if (*buffer->cur == '&')
				2247	buffer->cur++, result->type = CPP_AND_AND;
				2248	else if (*buffer->cur == '=')
				2249	buffer->cur++, result->type = CPP_AND_EQ;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2250	break;
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	2251
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2252	case '\|':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2253	result->type = CPP_OR;
				2254	if (*buffer->cur == '\|')
				2255	buffer->cur++, result->type = CPP_OR_OR;
				2256	else if (*buffer->cur == '=')
				2257	buffer->cur++, result->type = CPP_OR_EQ;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2258	break;
				2259
				2260	case ':':
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2261	result->type = CPP_COLON;
				2262	if (*buffer->cur == ':' && CPP_OPTION (pfile, cplusplus))
				2263	buffer->cur++, result->type = CPP_SCOPE;
				2264	else if (*buffer->cur == '>' && CPP_OPTION (pfile, digraphs))
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2265	{
Neil Booth	6f572ac	2003-04-19 16:34:33 +0000	[diff] [blame]	2266	buffer->cur++;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2267	result->flags \|= DIGRAPH;
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2268	result->type = CPP_CLOSE_SQUARE;
				2269	}
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2270	break;
				2271
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2272	case '*': IF_NEXT_IS ('=', CPP_MULT_EQ, CPP_MULT); break;
				2273	case '=': IF_NEXT_IS ('=', CPP_EQ_EQ, CPP_EQ); break;
				2274	case '!': IF_NEXT_IS ('=', CPP_NOT_EQ, CPP_NOT); break;
				2275	case '^': IF_NEXT_IS ('=', CPP_XOR_EQ, CPP_XOR); break;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2276	case '#': IF_NEXT_IS ('#', CPP_PASTE, CPP_HASH); result->val.token_no = 0; break;
Neil Booth	480709c	2001-10-21 14:04:42 +0000	[diff] [blame]	2277
Neil Booth	26aea07	2003-04-19 00:22:51 +0000	[diff] [blame]	2278	case '?': result->type = CPP_QUERY; break;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2279	case '~': result->type = CPP_COMPL; break;
				2280	case ',': result->type = CPP_COMMA; break;
				2281	case '(': result->type = CPP_OPEN_PAREN; break;
				2282	case ')': result->type = CPP_CLOSE_PAREN; break;
				2283	case '[': result->type = CPP_OPEN_SQUARE; break;
				2284	case ']': result->type = CPP_CLOSE_SQUARE; break;
				2285	case '{': result->type = CPP_OPEN_BRACE; break;
				2286	case '}': result->type = CPP_CLOSE_BRACE; break;
				2287	case ';': result->type = CPP_SEMICOLON; break;
				2288
Kazu Hirata	40f0365	2002-09-26 22:25:14 +0000	[diff] [blame]	2289	/* @ is a punctuator in Objective-C. */
Zack Weinberg	cc93758	2001-03-07 01:32:01 +0000	[diff] [blame]	2290	case '@': result->type = CPP_ATSIGN; break;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2291
Neil Booth	0abc6a6	2001-11-27 22:31:34 +0000	[diff] [blame]	2292	case '$':
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2293	case '\\':
				2294	{
				2295	const uchar *base = --buffer->cur;
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2296	struct normalize_state nst = INITIAL_NORMALIZE_STATE;
Neil Booth	0abc6a6	2001-11-27 22:31:34 +0000	[diff] [blame]	2297
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2298	if (forms_identifier_p (pfile, true, &nst))
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2299	{
				2300	result->type = CPP_NAME;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2301	result->val.node.node = lex_identifier (pfile, base, true, &nst);
Geoffrey Keating	50668cf	2005-03-15 00:36:33 +0000	[diff] [blame]	2302	warn_about_normalization (pfile, result, &nst);
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2303	break;
				2304	}
				2305	buffer->cur++;
Neil Booth	1067694	2003-04-22 19:28:00 +0000	[diff] [blame]	2306	}
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2307
Neil Booth	1067694	2003-04-22 19:28:00 +0000	[diff] [blame]	2308	default:
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2309	create_literal (pfile, result, buffer->cur - 1, 1, CPP_OTHER);
				2310	break;
Neil Booth	0d9f234	2000-09-18 18:43:05 +0000	[diff] [blame]	2311	}
Neil Booth	bdcbe49	2001-09-13 20:05:17 +0000	[diff] [blame]	2312
				2313	return result;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	2314	}
				2315
Neil Booth	5932565	2003-04-24 20:03:57 +0000	[diff] [blame]	2316	/* An upper bound on the number of bytes needed to spell TOKEN.
				2317	Does not include preceding whitespace. */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2318	unsigned int
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2319	cpp_token_len (const cpp_token *token)
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	2320	{
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2321	unsigned int len;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	2322
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2323	switch (TOKEN_SPELL (token))
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	2324	{
Joseph Myers	cc95528	2008-11-29 12:21:10 +0000	[diff] [blame]	2325	default: len = 6; break;
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2326	case SPELL_LITERAL: len = token->val.str.len; break;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2327	case SPELL_IDENT: len = NODE_LEN (token->val.node.node) * 10; break;
Zack Weinberg	c5a0473	2000-04-25 19:32:36 +0000	[diff] [blame]	2328	}
Neil Booth	5932565	2003-04-24 20:03:57 +0000	[diff] [blame]	2329
				2330	return len;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2331	}
				2332
/* Parse one UTF-8 sequence starting at NAME and place the
   corresponding \U escape (backslash, 'U', eight lowercase hex
   digits) in BUFFER.  Return the number of bytes read out of NAME.
   (There are always 10 bytes written to BUFFER, and no terminating
   NUL.)  Calls abort () if a continuation byte is ill-formed.  */

static size_t
utf8_to_ucn (unsigned char *buffer, const unsigned char *name)
{
  int j;
  int ucn_len = 0;
  int ucn_len_c;
  unsigned t;
  unsigned long utf32;

  /* Compute the length of the UTF-8 sequence: the number of leading
     one bits in the first byte.  */
  for (t = *name; t & 0x80; t <<= 1)
    ucn_len++;

  /* The payload bits of the lead byte are those below the length
     marker.  */
  utf32 = *name & (0x7F >> ucn_len);
  for (ucn_len_c = 1; ucn_len_c < ucn_len; ucn_len_c++)
    {
      utf32 = (utf32 << 6) | (*++name & 0x3F);

      /* Ill-formed UTF-8.  */
      if ((*name & ~0x3F) != 0x80)
        abort ();
    }

  *buffer++ = '\\';
  *buffer++ = 'U';
  /* Emit eight hex digits, most significant nibble first.  */
  for (j = 7; j >= 0; j--)
    *buffer++ = "0123456789abcdef"[(utf32 >> (4 * j)) & 0xF];
  return ucn_len;
}
				2366
Manuel López-Ibáñez	cfc9353	2009-04-22 15:32:18 +0000	[diff] [blame]	2367	/* Given a token TYPE corresponding to a digraph, return a pointer to
				2368	the spelling of the digraph. */
				2369	static const unsigned char *
				2370	cpp_digraph2name (enum cpp_ttype type)
				2371	{
				2372	return digraph_spellings[(int) type - (int) CPP_FIRST_DIGRAPH];
				2373	}
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2374
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2375	/* Write the spelling of a token TOKEN to BUFFER. The buffer must
Zack Weinberg	cf00a88	2000-07-08 02:33:00 +0000	[diff] [blame]	2376	already contain the enough space to hold the token's spelling.
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2377	Returns a pointer to the character after the last character written.
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2378	FORSTRING is true if this is to be the spelling after translation
				2379	phase 1 (this is different for UCNs).
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2380	FIXME: Would be nice if we didn't need the PFILE argument. */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2381	unsigned char *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2382	cpp_spell_token (cpp_reader pfile, const cpp_token token,
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2383	unsigned char *buffer, bool forstring)
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2384	{
Zack Weinberg	96be699	2000-07-18 23:25:06 +0000	[diff] [blame]	2385	switch (TOKEN_SPELL (token))
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2386	{
Neil Booth	5d7ee2f	2000-05-10 09:39:18 +0000	[diff] [blame]	2387	case SPELL_OPERATOR:
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2388	{
				2389	const unsigned char *spelling;
				2390	unsigned char c;
				2391
				2392	if (token->flags & DIGRAPH)
Manuel López-Ibáñez	cfc9353	2009-04-22 15:32:18 +0000	[diff] [blame]	2393	spelling = cpp_digraph2name (token->type);
Zack Weinberg	92936ec	2000-07-19 20:18:08 +0000	[diff] [blame]	2394	else if (token->flags & NAMED_OP)
				2395	goto spell_ident;
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2396	else
Zack Weinberg	96be699	2000-07-18 23:25:06 +0000	[diff] [blame]	2397	spelling = TOKEN_NAME (token);
Kazu Hirata	df38348	2002-05-22 22:02:16 +0000	[diff] [blame]	2398
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2399	while ((c = *spelling++) != '\0')
				2400	*buffer++ = c;
				2401	}
				2402	break;
				2403
Zack Weinberg	47ad413	2001-10-06 23:11:27 +0000	[diff] [blame]	2404	spell_ident:
Neil Booth	5d7ee2f	2000-05-10 09:39:18 +0000	[diff] [blame]	2405	case SPELL_IDENT:
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2406	if (forstring)
				2407	{
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2408	memcpy (buffer, NODE_NAME (token->val.node.node),
				2409	NODE_LEN (token->val.node.node));
				2410	buffer += NODE_LEN (token->val.node.node);
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2411	}
				2412	else
				2413	{
				2414	size_t i;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2415	const unsigned char * name = NODE_NAME (token->val.node.node);
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2416
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2417	for (i = 0; i < NODE_LEN (token->val.node.node); i++)
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2418	if (name[i] & ~0x7F)
				2419	{
				2420	i += utf8_to_ucn (buffer, name + i) - 1;
				2421	buffer += 10;
				2422	}
				2423	else
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2424	*buffer++ = NODE_NAME (token->val.node.node)[i];
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2425	}
Neil Booth	5d7ee2f	2000-05-10 09:39:18 +0000	[diff] [blame]	2426	break;
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2427
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2428	case SPELL_LITERAL:
Zack Weinberg	47ad413	2001-10-06 23:11:27 +0000	[diff] [blame]	2429	memcpy (buffer, token->val.str.text, token->val.str.len);
				2430	buffer += token->val.str.len;
				2431	break;
				2432
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2433	case SPELL_NONE:
John David Anglin	0527bc4	2003-11-01 22:56:54 +0000	[diff] [blame]	2434	cpp_error (pfile, CPP_DL_ICE,
				2435	"unspellable token %s", TOKEN_NAME (token));
Neil Booth	3fef5b2	2000-05-08 22:22:49 +0000	[diff] [blame]	2436	break;
				2437	}
				2438
				2439	return buffer;
				2440	}
				2441
Neil Booth	5d8ebbd	2002-01-03 21:43:09 +0000	[diff] [blame]	2442	/* Returns TOKEN spelt as a null-terminated string. The string is
				2443	freed when the reader is destroyed. Useful for diagnostics. */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2444	unsigned char *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2445	cpp_token_as_text (cpp_reader pfile, const cpp_token token)
Neil Booth	5932565	2003-04-24 20:03:57 +0000	[diff] [blame]	2446	{
				2447	unsigned int len = cpp_token_len (token) + 1;
Neil Booth	ece54d5	2001-09-28 09:40:22 +0000	[diff] [blame]	2448	unsigned char start = _cpp_unaligned_alloc (pfile, len), end;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2449
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2450	end = cpp_spell_token (pfile, token, start, false);
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2451	end[0] = '\0';
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2452
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2453	return start;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2454	}
				2455
Manuel López-Ibáñez	cfc9353	2009-04-22 15:32:18 +0000	[diff] [blame]	2456	/* Returns a pointer to a string which spells the token defined by
				2457	TYPE and FLAGS. Used by C front ends, which really should move to
				2458	using cpp_token_as_text. */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2459	const char *
Manuel López-Ibáñez	cfc9353	2009-04-22 15:32:18 +0000	[diff] [blame]	2460	cpp_type2name (enum cpp_ttype type, unsigned char flags)
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2461	{
Manuel López-Ibáñez	cfc9353	2009-04-22 15:32:18 +0000	[diff] [blame]	2462	if (flags & DIGRAPH)
				2463	return (const char *) cpp_digraph2name (type);
				2464	else if (flags & NAMED_OP)
				2465	return cpp_named_operator2name (type);
				2466
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2467	return (const char *) token_spellings[type].name;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2468	}
				2469
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	2470	/* Writes the spelling of token to FP, without any preceding space.
				2471	Separated from cpp_spell_token for efficiency - to avoid stdio
				2472	double-buffering. */
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2473	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2474	cpp_output_token (const cpp_token token, FILE fp)
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2475	{
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2476	switch (TOKEN_SPELL (token))
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2477	{
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2478	case SPELL_OPERATOR:
				2479	{
				2480	const unsigned char *spelling;
Zack Weinberg	3b681e9	2001-09-28 07:00:27 +0000	[diff] [blame]	2481	int c;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2482
				2483	if (token->flags & DIGRAPH)
Manuel López-Ibáñez	cfc9353	2009-04-22 15:32:18 +0000	[diff] [blame]	2484	spelling = cpp_digraph2name (token->type);
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2485	else if (token->flags & NAMED_OP)
				2486	goto spell_ident;
				2487	else
				2488	spelling = TOKEN_NAME (token);
				2489
Zack Weinberg	3b681e9	2001-09-28 07:00:27 +0000	[diff] [blame]	2490	c = *spelling;
				2491	do
				2492	putc (c, fp);
				2493	while ((c = *++spelling) != '\0');
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2494	}
				2495	break;
				2496
				2497	spell_ident:
				2498	case SPELL_IDENT:
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2499	{
				2500	size_t i;
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2501	const unsigned char * name = NODE_NAME (token->val.node.node);
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2502
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2503	for (i = 0; i < NODE_LEN (token->val.node.node); i++)
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2504	if (name[i] & ~0x7F)
				2505	{
				2506	unsigned char buffer[10];
				2507	i += utf8_to_ucn (buffer, name + i) - 1;
				2508	fwrite (buffer, 1, 10, fp);
				2509	}
				2510	else
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2511	fputc (NODE_NAME (token->val.node.node)[i], fp);
Geoffrey Keating	47e2049	2005-03-12 10:44:06 +0000	[diff] [blame]	2512	}
				2513	break;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2514
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2515	case SPELL_LITERAL:
Zack Weinberg	47ad413	2001-10-06 23:11:27 +0000	[diff] [blame]	2516	fwrite (token->val.str.text, 1, token->val.str.len, fp);
				2517	break;
				2518
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2519	case SPELL_NONE:
				2520	/* An error, most probably. */
				2521	break;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2522	}
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2523	}
				2524
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2525	/* Compare two tokens. */
				2526	int
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2527	_cpp_equiv_tokens (const cpp_token a, const cpp_token b)
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2528	{
				2529	if (a->type == b->type && a->flags == b->flags)
				2530	switch (TOKEN_SPELL (a))
				2531	{
				2532	default: /* Keep compiler happy. */
				2533	case SPELL_OPERATOR:
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2534	/* token_no is used to track where multiple consecutive ##
Joseph Myers	aa50850	2009-04-19 18:10:56 +0100	[diff] [blame]	2535	tokens were originally located. */
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2536	return (a->type != CPP_PASTE \|\| a->val.token_no == b->val.token_no);
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2537	case SPELL_NONE:
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2538	return (a->type != CPP_MACRO_ARG
				2539	\|\| a->val.macro_arg.arg_no == b->val.macro_arg.arg_no);
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2540	case SPELL_IDENT:
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2541	return a->val.node.node == b->val.node.node;
Neil Booth	6338b35	2003-04-23 22:44:06 +0000	[diff] [blame]	2542	case SPELL_LITERAL:
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2543	return (a->val.str.len == b->val.str.len
				2544	&& !memcmp (a->val.str.text, b->val.str.text,
				2545	a->val.str.len));
				2546	}
				2547
				2548	return 0;
				2549	}
				2550
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2551	/* Returns nonzero if a space should be inserted to avoid an
				2552	accidental token paste for output. For simplicity, it is
				2553	conservative, and occasionally advises a space where one is not
				2554	needed, e.g. "." and ".2". */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2555	int
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2556	cpp_avoid_paste (cpp_reader pfile, const cpp_token token1,
				2557	const cpp_token *token2)
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2558	{
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2559	enum cpp_ttype a = token1->type, b = token2->type;
				2560	cppchar_t c;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2561
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2562	if (token1->flags & NAMED_OP)
				2563	a = CPP_NAME;
				2564	if (token2->flags & NAMED_OP)
				2565	b = CPP_NAME;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2566
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2567	c = EOF;
				2568	if (token2->flags & DIGRAPH)
John David Anglin	37b8524	2001-03-02 01:11:50 +0000	[diff] [blame]	2569	c = digraph_spellings[(int) b - (int) CPP_FIRST_DIGRAPH][0];
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2570	else if (token_spellings[b].category == SPELL_OPERATOR)
				2571	c = token_spellings[b].name[0];
Zack Weinberg	417f3e3	2000-07-11 23:20:53 +0000	[diff] [blame]	2572
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2573	/* Quickly get everything that can paste with an '='. */
John David Anglin	37b8524	2001-03-02 01:11:50 +0000	[diff] [blame]	2574	if ((int) a <= (int) CPP_LAST_EQ && c == '=')
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2575	return 1;
				2576
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2577	switch (a)
				2578	{
Steve Ellcey	b52dbbf	2006-08-14 23:13:54 +0000	[diff] [blame]	2579	case CPP_GREATER: return c == '>';
				2580	case CPP_LESS: return c == '<' \|\| c == '%' \|\| c == ':';
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2581	case CPP_PLUS: return c == '+';
				2582	case CPP_MINUS: return c == '-' \|\| c == '>';
				2583	case CPP_DIV: return c == '/' \|\| c == ''; / Comments. */
				2584	case CPP_MOD: return c == ':' \|\| c == '>';
				2585	case CPP_AND: return c == '&';
				2586	case CPP_OR: return c == '\|';
				2587	case CPP_COLON: return c == ':' \|\| c == '>';
				2588	case CPP_DEREF: return c == '*';
Neil Booth	26ec42e	2001-01-28 11:22:23 +0000	[diff] [blame]	2589	case CPP_DOT: return c == '.' \|\| c == '%' \|\| b == CPP_NUMBER;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2590	case CPP_HASH: return c == '#' \|\| c == '%'; /* Digraph form. */
				2591	case CPP_NAME: return ((b == CPP_NUMBER
				2592	&& name_p (pfile, &token2->val.str))
				2593	\|\| b == CPP_NAME
				2594	\|\| b == CPP_CHAR \|\| b == CPP_STRING); /* L */
				2595	case CPP_NUMBER: return (b == CPP_NUMBER \|\| b == CPP_NAME
				2596	\|\| c == '.' \|\| c == '+' \|\| c == '-');
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2597	/* UCNs */
Neil Booth	1067694	2003-04-22 19:28:00 +0000	[diff] [blame]	2598	case CPP_OTHER: return ((token1->val.str.text[0] == '\\'
				2599	&& b == CPP_NAME)
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2600	\|\| (CPP_OPTION (pfile, objc)
Neil Booth	1067694	2003-04-22 19:28:00 +0000	[diff] [blame]	2601	&& token1->val.str.text[0] == '@'
Neil Booth	1613e52	2003-04-20 07:29:23 +0000	[diff] [blame]	2602	&& (b == CPP_NAME \|\| b == CPP_STRING)));
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2603	default: break;
				2604	}
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2605
				2606	return 0;
				2607	}
				2608
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2609	/* Output all the remaining tokens on the current line, and a newline
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	2610	character, to FP. Leading whitespace is removed. If there are
				2611	macros, special token padding is not performed. */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2612	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2613	cpp_output_line (cpp_reader pfile, FILE fp)
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2614	{
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	2615	const cpp_token *token;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2616
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	2617	token = cpp_get_token (pfile);
				2618	while (token->type != CPP_EOF)
Zack Weinberg	6ead1e9	2000-07-31 23:47:19 +0000	[diff] [blame]	2619	{
Neil Booth	4ed5bcf	2001-09-24 22:53:12 +0000	[diff] [blame]	2620	cpp_output_token (token, fp);
				2621	token = cpp_get_token (pfile);
				2622	if (token->flags & PREV_WHITE)
				2623	putc (' ', fp);
Zack Weinberg	6ead1e9	2000-07-31 23:47:19 +0000	[diff] [blame]	2624	}
				2625
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2626	putc ('\n', fp);
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2627	}
				2628
Tom Tromey	5d6342e	2008-05-21 21:52:57 +0000	[diff] [blame]	2629	/* Return a string representation of all the remaining tokens on the
				2630	current line. The result is allocated using xmalloc and must be
				2631	freed by the caller. */
				2632	unsigned char *
				2633	cpp_output_line_to_string (cpp_reader pfile, const unsigned char dir_name)
				2634	{
				2635	const cpp_token *token;
				2636	unsigned int out = dir_name ? ustrlen (dir_name) : 0;
				2637	unsigned int alloced = 120 + out;
				2638	unsigned char result = (unsigned char ) xmalloc (alloced);
				2639
				2640	/* If DIR_NAME is empty, there are no initial contents. */
				2641	if (dir_name)
				2642	{
				2643	sprintf ((char *) result, "#%s ", dir_name);
				2644	out += 2;
				2645	}
				2646
				2647	token = cpp_get_token (pfile);
				2648	while (token->type != CPP_EOF)
				2649	{
				2650	unsigned char *last;
				2651	/* Include room for a possible space and the terminating nul. */
				2652	unsigned int len = cpp_token_len (token) + 2;
				2653
				2654	if (out + len > alloced)
				2655	{
				2656	alloced *= 2;
				2657	if (out + len > alloced)
				2658	alloced = out + len;
				2659	result = (unsigned char *) xrealloc (result, alloced);
				2660	}
				2661
				2662	last = cpp_spell_token (pfile, token, &result[out], 0);
				2663	out = last - result;
				2664
				2665	token = cpp_get_token (pfile);
				2666	if (token->flags & PREV_WHITE)
				2667	result[out++] = ' ';
				2668	}
				2669
				2670	result[out] = '\0';
				2671	return result;
				2672	}
				2673
/* Memory buffers.  Changing these three constants can have a dramatic
   effect on performance.  The values here are reasonable defaults,
   but might be tuned.  If you adjust them, be sure to test across a
   range of uses of cpplib, including heavy nested function-like macro
   expansion.  Also check the change in peak memory usage (NJAMD is a
   good tool for this).

   MIN_BUFF_SIZE is the smallest buffer new_buff will create.
   BUFF_SIZE_UPPER_BOUND (MIN_SIZE) is the largest free buffer that
   _cpp_get_buff will hand out for a request of MIN_SIZE bytes.
   EXTENDED_BUFF_SIZE (BUFF, MIN_EXTRA) is the size requested when
   extending BUFF: MIN_EXTRA plus twice the room left in BUFF.  Every
   macro argument is parenthesized so that expressions containing
   low-precedence operators expand correctly.  */
#define MIN_BUFF_SIZE 8000
#define BUFF_SIZE_UPPER_BOUND(MIN_SIZE) (MIN_BUFF_SIZE + (MIN_SIZE) * 3 / 2)
#define EXTENDED_BUFF_SIZE(BUFF, MIN_EXTRA) \
        ((MIN_EXTRA) + ((BUFF)->limit - (BUFF)->cur) * 2)

#if MIN_BUFF_SIZE > BUFF_SIZE_UPPER_BOUND (0)
#error BUFF_SIZE_UPPER_BOUND must be at least as large as MIN_BUFF_SIZE!
#endif
				2688
Neil Booth	c9e7a60	2001-09-27 12:59:38 +0000	[diff] [blame]	2689	/* Create a new allocation buffer. Place the control block at the end
				2690	of the buffer, so that buffer overflows will cause immediate chaos. */
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2691	static _cpp_buff *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2692	new_buff (size_t len)
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2693	{
				2694	_cpp_buff *result;
Neil Booth	ece54d5	2001-09-28 09:40:22 +0000	[diff] [blame]	2695	unsigned char *base;
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2696
Neil Booth	1e013d2	2001-09-26 21:44:35 +0000	[diff] [blame]	2697	if (len < MIN_BUFF_SIZE)
				2698	len = MIN_BUFF_SIZE;
Neil Booth	c70f6ed	2002-06-07 06:26:32 +0000	[diff] [blame]	2699	len = CPP_ALIGN (len);
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2700
Gabriel Dos Reis	c3f829c	2005-05-28 15:52:48 +0000	[diff] [blame]	2701	base = XNEWVEC (unsigned char, len + sizeof (_cpp_buff));
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2702	result = (_cpp_buff *) (base + len);
				2703	result->base = base;
				2704	result->cur = base;
				2705	result->limit = base + len;
				2706	result->next = NULL;
				2707	return result;
				2708	}
				2709
				2710	/* Place a chain of unwanted allocation buffers on the free list. */
				2711	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2712	_cpp_release_buff (cpp_reader pfile, _cpp_buff buff)
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2713	{
				2714	_cpp_buff *end = buff;
				2715
				2716	while (end->next)
				2717	end = end->next;
				2718	end->next = pfile->free_buffs;
				2719	pfile->free_buffs = buff;
				2720	}
				2721
				2722	/* Return a free buffer of size at least MIN_SIZE. */
				2723	_cpp_buff *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2724	_cpp_get_buff (cpp_reader *pfile, size_t min_size)
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2725	{
				2726	_cpp_buff result, *p;
				2727
				2728	for (p = &pfile->free_buffs;; p = &(*p)->next)
				2729	{
Neil Booth	6142088	2001-09-28 13:25:38 +0000	[diff] [blame]	2730	size_t size;
Neil Booth	1e013d2	2001-09-26 21:44:35 +0000	[diff] [blame]	2731
				2732	if (*p == NULL)
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2733	return new_buff (min_size);
Neil Booth	1e013d2	2001-09-26 21:44:35 +0000	[diff] [blame]	2734	result = *p;
				2735	size = result->limit - result->base;
				2736	/* Return a buffer that's big enough, but don't waste one that's
				2737	way too big. */
Richard Earnshaw	34f5271	2001-10-17 16:20:04 +0000	[diff] [blame]	2738	if (size >= min_size && size <= BUFF_SIZE_UPPER_BOUND (min_size))
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2739	break;
				2740	}
				2741
				2742	*p = result->next;
				2743	result->next = NULL;
				2744	result->cur = result->base;
				2745	return result;
				2746	}
				2747
Kazu Hirata	4fe9b91	2001-10-09 06:03:16 +0000	[diff] [blame]	2748	/* Creates a new buffer with enough space to hold the uncommitted
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2749	remaining bytes of BUFF, and at least MIN_EXTRA more bytes. Copies
				2750	the excess bytes to the new buffer. Chains the new buffer after
				2751	BUFF, and returns the new buffer. */
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2752	_cpp_buff *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2753	_cpp_append_extend_buff (cpp_reader pfile, _cpp_buff buff, size_t min_extra)
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2754	{
Neil Booth	6142088	2001-09-28 13:25:38 +0000	[diff] [blame]	2755	size_t size = EXTENDED_BUFF_SIZE (buff, min_extra);
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2756	_cpp_buff *new_buff = _cpp_get_buff (pfile, size);
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2757
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2758	buff->next = new_buff;
				2759	memcpy (new_buff->base, buff->cur, BUFF_ROOM (buff));
				2760	return new_buff;
				2761	}
				2762
Kazu Hirata	4fe9b91	2001-10-09 06:03:16 +0000	[diff] [blame]	2763	/* Creates a new buffer with enough space to hold the uncommitted
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2764	remaining bytes of the buffer pointed to by BUFF, and at least
				2765	MIN_EXTRA more bytes. Copies the excess bytes to the new buffer.
				2766	Chains the new buffer before the buffer pointed to by BUFF, and
				2767	updates the pointer to point to the new buffer. */
				2768	void
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2769	_cpp_extend_buff (cpp_reader pfile, _cpp_buff *pbuff, size_t min_extra)
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2770	{
				2771	_cpp_buff new_buff, old_buff = *pbuff;
				2772	size_t size = EXTENDED_BUFF_SIZE (old_buff, min_extra);
				2773
				2774	new_buff = _cpp_get_buff (pfile, size);
				2775	memcpy (new_buff->base, old_buff->cur, BUFF_ROOM (old_buff));
				2776	new_buff->next = old_buff;
				2777	*pbuff = new_buff;
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2778	}
				2779
				2780	/* Free a chain of buffers starting at BUFF. */
				2781	void
Andreas Jaeger	5671bf2	2003-07-07 21:11:59 +0200	[diff] [blame]	2782	_cpp_free_buff (_cpp_buff *buff)
Neil Booth	b8af0ca	2001-09-26 17:52:50 +0000	[diff] [blame]	2783	{
				2784	_cpp_buff *next;
				2785
				2786	for (; buff; buff = next)
				2787	{
				2788	next = buff->next;
				2789	free (buff->base);
				2790	}
				2791	}
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2792
Neil Booth	ece54d5	2001-09-28 09:40:22 +0000	[diff] [blame]	2793	/* Allocate permanent, unaligned storage of length LEN. */
				2794	unsigned char *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2795	_cpp_unaligned_alloc (cpp_reader *pfile, size_t len)
Neil Booth	ece54d5	2001-09-28 09:40:22 +0000	[diff] [blame]	2796	{
				2797	_cpp_buff *buff = pfile->u_buff;
				2798	unsigned char *result = buff->cur;
				2799
				2800	if (len > (size_t) (buff->limit - result))
				2801	{
				2802	buff = _cpp_get_buff (pfile, len);
				2803	buff->next = pfile->u_buff;
				2804	pfile->u_buff = buff;
				2805	result = buff->cur;
				2806	}
				2807
				2808	buff->cur = result + len;
				2809	return result;
				2810	}
				2811
Neil Booth	8706281	2001-10-20 09:00:53 +0000	[diff] [blame]	2812	/* Allocate permanent, unaligned storage of length LEN from a_buff.
				2813	That buffer is used for growing allocations when saving macro
				2814	replacement lists in a #define, and when parsing an answer to an
				2815	assertion in #assert, #unassert or #if (and therefore possibly
				2816	whilst expanding macros). It therefore must not be used by any
				2817	code that they might call: specifically the lexer and the guts of
				2818	the macro expander.
				2819
				2820	All existing other uses clearly fit this restriction: storing
				2821	registered pragmas during initialization. */
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2822	unsigned char *
Zack Weinberg	6cf87ca	2003-06-17 06:17:44 +0000	[diff] [blame]	2823	_cpp_aligned_alloc (cpp_reader *pfile, size_t len)
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2824	{
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2825	_cpp_buff *buff = pfile->a_buff;
				2826	unsigned char *result = buff->cur;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2827
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2828	if (len > (size_t) (buff->limit - result))
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2829	{
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2830	buff = _cpp_get_buff (pfile, len);
				2831	buff->next = pfile->a_buff;
				2832	pfile->a_buff = buff;
				2833	result = buff->cur;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2834	}
				2835
Neil Booth	8c3b269	2001-09-30 10:03:11 +0000	[diff] [blame]	2836	buff->cur = result + len;
Neil Booth	93c80368	2000-10-28 17:59:06 +0000	[diff] [blame]	2837	return result;
Zack Weinberg	041c319	2000-07-04 01:58:21 +0000	[diff] [blame]	2838	}
Geoffrey Keating	d804416	2004-06-09 20:10:13 +0000	[diff] [blame]	2839
				2840	/* Say which field of TOK is in use. */
				2841
				2842	enum cpp_token_fld_kind
				2843	cpp_token_val_index (cpp_token *tok)
				2844	{
				2845	switch (TOKEN_SPELL (tok))
				2846	{
				2847	case SPELL_IDENT:
				2848	return CPP_TOKEN_FLD_NODE;
				2849	case SPELL_LITERAL:
				2850	return CPP_TOKEN_FLD_STR;
Joseph Myers	aa50850	2009-04-19 18:10:56 +0100	[diff] [blame]	2851	case SPELL_OPERATOR:
				2852	if (tok->type == CPP_PASTE)
Joseph Myers	9a0c618	2009-05-10 15:27:32 +0100	[diff] [blame]	2853	return CPP_TOKEN_FLD_TOKEN_NO;
Joseph Myers	aa50850	2009-04-19 18:10:56 +0100	[diff] [blame]	2854	else
				2855	return CPP_TOKEN_FLD_NONE;
Geoffrey Keating	d804416	2004-06-09 20:10:13 +0000	[diff] [blame]	2856	case SPELL_NONE:
				2857	if (tok->type == CPP_MACRO_ARG)
				2858	return CPP_TOKEN_FLD_ARG_NO;
				2859	else if (tok->type == CPP_PADDING)
				2860	return CPP_TOKEN_FLD_SOURCE;
Zack Weinberg	21b1149	2004-09-09 19:16:56 +0000	[diff] [blame]	2861	else if (tok->type == CPP_PRAGMA)
Richard Henderson	bc4071d	2006-01-04 08:33:38 -0800	[diff] [blame]	2862	return CPP_TOKEN_FLD_PRAGMA;
Geoffrey Keating	d804416	2004-06-09 20:10:13 +0000	[diff] [blame]	2863	/* else fall through */
				2864	default:
				2865	return CPP_TOKEN_FLD_NONE;
				2866	}
				2867	}
Gabriel Charette	e3dfef4	2011-08-22 20:41:07 +0000	[diff] [blame]	2868
				2869	/* All tokens lexed in R after calling this function will be forced to have
				2870	their source_location the same as the location referenced by P, until
				2871	cpp_stop_forcing_token_locations is called for R. */
				2872
				2873	void
				2874	cpp_force_token_locations (cpp_reader r, source_location p)
				2875	{
				2876	r->forced_token_location_p = p;
				2877	}
				2878
				2879	/* Go back to assigning locations naturally for lexed tokens. */
				2880
				2881	void
				2882	cpp_stop_forcing_token_locations (cpp_reader *r)
				2883	{
				2884	r->forced_token_location_p = NULL;
				2885	}