parsetok.c 6.11 KB
Newer Older
1

Guido van Rossum's avatar
Guido van Rossum committed
2 3
/* Parser-tokenizer link implementation */

Guido van Rossum's avatar
Guido van Rossum committed
4
#include "pgenheaders.h"
Guido van Rossum's avatar
Guido van Rossum committed
5 6 7 8
#include "tokenizer.h"
#include "node.h"
#include "grammar.h"
#include "parser.h"
Guido van Rossum's avatar
Guido van Rossum committed
9
#include "parsetok.h"
Guido van Rossum's avatar
Guido van Rossum committed
10
#include "errcode.h"
11
#include "graminit.h"
Guido van Rossum's avatar
Guido van Rossum committed
12

13 14
int Py_TabcheckFlag;

Guido van Rossum's avatar
Guido van Rossum committed
15

Guido van Rossum's avatar
Guido van Rossum committed
16
/* Forward */
17
static node *parsetok(struct tok_state *, grammar *, int, perrdetail *, int);
18
static void initerr(perrdetail *err_ret, const char* filename);
Guido van Rossum's avatar
Guido van Rossum committed
19

Guido van Rossum's avatar
Guido van Rossum committed
20
/* Parse input coming from a string.  Return error code, print some errors. */
21
node *
22
PyParser_ParseString(const char *s, grammar *g, int start, perrdetail *err_ret)
23
{
Jeremy Hylton's avatar
Jeremy Hylton committed
24
	return PyParser_ParseStringFlagsFilename(s, NULL, g, start, err_ret, 0);
25 26 27
}

node *
28
PyParser_ParseStringFlags(const char *s, grammar *g, int start,
29
		          perrdetail *err_ret, int flags)
30 31
{
	return PyParser_ParseStringFlagsFilename(s, NULL,
32
						 g, start, err_ret, flags);
33 34 35
}

node *
36
PyParser_ParseStringFlagsFilename(const char *s, const char *filename,
37 38
			  grammar *g, int start,
		          perrdetail *err_ret, int flags)
Guido van Rossum's avatar
Guido van Rossum committed
39
{
40 41
	struct tok_state *tok;

42
	initerr(err_ret, filename);
43

44
	if ((tok = PyTokenizer_FromString(s)) == NULL) {
45
		err_ret->error = PyErr_Occurred() ? E_DECODE : E_NOMEM;
46
		return NULL;
Guido van Rossum's avatar
Guido van Rossum committed
47
	}
48

49
        tok->filename = filename ? filename : "<string>";
50 51 52 53 54 55
	if (Py_TabcheckFlag || Py_VerboseFlag) {
		tok->altwarning = (tok->filename != NULL);
		if (Py_TabcheckFlag >= 2)
			tok->alterror++;
	}

56
	return parsetok(tok, g, start, err_ret, flags);
Guido van Rossum's avatar
Guido van Rossum committed
57 58
}

Guido van Rossum's avatar
Guido van Rossum committed
59
/* Parse input coming from a file.  Return error code, print some errors. */
Guido van Rossum's avatar
Guido van Rossum committed
60

61
node *
62
PyParser_ParseFile(FILE *fp, const char *filename, grammar *g, int start,
Thomas Wouters's avatar
Thomas Wouters committed
63
		   char *ps1, char *ps2, perrdetail *err_ret)
64 65 66 67 68 69
{
	return PyParser_ParseFileFlags(fp, filename, g, start, ps1, ps2,
				       err_ret, 0);
}

node *
70
PyParser_ParseFileFlags(FILE *fp, const char *filename, grammar *g, int start,
71
			char *ps1, char *ps2, perrdetail *err_ret, int flags)
Guido van Rossum's avatar
Guido van Rossum committed
72
{
73 74
	struct tok_state *tok;

75
	initerr(err_ret, filename);
76

77
	if ((tok = PyTokenizer_FromFile(fp, ps1, ps2)) == NULL) {
78 79
		err_ret->error = E_NOMEM;
		return NULL;
Guido van Rossum's avatar
Guido van Rossum committed
80
	}
81
	tok->filename = filename;
82 83 84 85 86
	if (Py_TabcheckFlag || Py_VerboseFlag) {
		tok->altwarning = (filename != NULL);
		if (Py_TabcheckFlag >= 2)
			tok->alterror++;
	}
87

Guido van Rossum's avatar
Guido van Rossum committed
88

89
	return parsetok(tok, g, start, err_ret, flags);
90
}
Guido van Rossum's avatar
Guido van Rossum committed
91 92 93 94

/* Parse input coming from the given tokenizer structure.
   Return error code. */

95 96 97 98 99 100 101 102 103 104 105 106 107
static char with_msg[] =
"%s:%d: Warning: 'with' will become a reserved keyword in Python 2.6\n";

static char as_msg[] =
"%s:%d: Warning: 'as' will become a reserved keyword in Python 2.6\n";

static void
warn(const char *msg, const char *filename, int lineno)
{
	if (filename == NULL)
		filename = "<string>";
	PySys_WriteStderr(msg, filename, lineno);
}
108

109
static node *
110 111
parsetok(struct tok_state *tok, grammar *g, int start, perrdetail *err_ret,
	 int flags)
Guido van Rossum's avatar
Guido van Rossum committed
112 113
{
	parser_state *ps;
114
	node *n;
115
	int started = 0, handling_import = 0, handling_with = 0;
116

117
	if ((ps = PyParser_New(g, start)) == NULL) {
Guido van Rossum's avatar
Guido van Rossum committed
118
		fprintf(stderr, "no mem for new parser\n");
119
		err_ret->error = E_NOMEM;
120
		PyTokenizer_Free(tok);
121
		return NULL;
Guido van Rossum's avatar
Guido van Rossum committed
122
	}
123 124 125
#ifdef PY_PARSER_REQUIRES_FUTURE_KEYWORD
	if (flags & PyPARSE_WITH_IS_KEYWORD)
		ps->p_flags |= CO_FUTURE_WITH_STATEMENT;
126
#endif
127

Guido van Rossum's avatar
Guido van Rossum committed
128 129 130
	for (;;) {
		char *a, *b;
		int type;
131
		size_t len;
Guido van Rossum's avatar
Guido van Rossum committed
132
		char *str;
133
		int col_offset;
134

135
		type = PyTokenizer_Get(tok, &a, &b);
Guido van Rossum's avatar
Guido van Rossum committed
136
		if (type == ERRORTOKEN) {
137
			err_ret->error = tok->done;
Guido van Rossum's avatar
Guido van Rossum committed
138 139
			break;
		}
140 141
		if (type == ENDMARKER && started) {
			type = NEWLINE; /* Add an extra newline */
142
			handling_with = handling_import = 0;
143
			started = 0;
144 145 146 147 148 149 150 151 152
			/* Add the right number of dedent tokens,
			   except if a certain flag is given --
			   codeop.py uses this. */
			if (tok->indent &&
			    !(flags & PyPARSE_DONT_IMPLY_DEDENT))
			{
				tok->pendin = -tok->indent;
				tok->indent = 0;
			}
153 154 155
		}
		else
			started = 1;
156
		len = b - a; /* XXX this may compute NULL - NULL */
Andrew MacIntyre's avatar
Andrew MacIntyre committed
157
		str = (char *) PyObject_MALLOC(len + 1);
Guido van Rossum's avatar
Guido van Rossum committed
158 159
		if (str == NULL) {
			fprintf(stderr, "no mem for next token\n");
160
			err_ret->error = E_NOMEM;
Guido van Rossum's avatar
Guido van Rossum committed
161 162
			break;
		}
163 164
		if (len > 0)
			strncpy(str, a, len);
Guido van Rossum's avatar
Guido van Rossum committed
165
		str[len] = '\0';
166

167 168 169 170 171 172 173 174 175 176 177 178 179
#ifdef PY_PARSER_REQUIRES_FUTURE_KEYWORD
		/* This is only necessary to support the "as" warning, but
		   we don't want to warn about "as" in import statements. */
		if (type == NAME &&
		    len == 6 && str[0] == 'i' && strcmp(str, "import") == 0)
			handling_import = 1;

		/* Warn about with as NAME */
		if (type == NAME &&
		    !(ps->p_flags & CO_FUTURE_WITH_STATEMENT)) {
		    if (len == 4 && str[0] == 'w' && strcmp(str, "with") == 0)
			warn(with_msg, err_ret->filename, tok->lineno);
		    else if (!(handling_import || handling_with) &&
180 181
		             len == 2 && str[0] == 'a' &&
			     strcmp(str, "as") == 0)
182 183 184 185 186 187
			warn(as_msg, err_ret->filename, tok->lineno);
		}
		else if (type == NAME &&
			 (ps->p_flags & CO_FUTURE_WITH_STATEMENT) &&
			 len == 4 && str[0] == 'w' && strcmp(str, "with") == 0)
			handling_with = 1;
188
#endif
189 190 191 192 193
		if (a >= tok->line_start)
			col_offset = a - tok->line_start;
		else
			col_offset = -1;
			
194
		if ((err_ret->error =
195
		     PyParser_AddToken(ps, (int)type, str, tok->lineno, col_offset,
196
				       &(err_ret->expected))) != E_OK) {
197
			if (err_ret->error != E_DONE)
Andrew MacIntyre's avatar
Andrew MacIntyre committed
198
				PyObject_FREE(str);
Guido van Rossum's avatar
Guido van Rossum committed
199
			break;
200
		}
Guido van Rossum's avatar
Guido van Rossum committed
201
	}
202 203 204 205 206 207 208 209

	if (err_ret->error == E_DONE) {
		n = ps->p_tree;
		ps->p_tree = NULL;
	}
	else
		n = NULL;

210
	PyParser_Delete(ps);
211 212 213 214 215 216

	if (n == NULL) {
		if (tok->lineno <= 1 && tok->done == E_EOF)
			err_ret->error = E_EOF;
		err_ret->lineno = tok->lineno;
		if (tok->buf != NULL) {
Martin v. Löwis's avatar
Martin v. Löwis committed
217
			size_t len;
Martin v. Löwis's avatar
Martin v. Löwis committed
218 219
			assert(tok->cur - tok->buf < INT_MAX);
			err_ret->offset = (int)(tok->cur - tok->buf);
Martin v. Löwis's avatar
Martin v. Löwis committed
220
			len = tok->inp - tok->buf;
Andrew MacIntyre's avatar
Andrew MacIntyre committed
221
			err_ret->text = (char *) PyObject_MALLOC(len + 1);
222
			if (err_ret->text != NULL) {
223 224
				if (len > 0)
					strncpy(err_ret->text, tok->buf, len);
225 226 227
				err_ret->text[len] = '\0';
			}
		}
228 229 230 231 232 233 234
	} else if (tok->encoding != NULL) {
		node* r = PyNode_New(encoding_decl);
		r->n_str = tok->encoding;
		r->n_nchildren = 1;
		r->n_child = n;
		tok->encoding = NULL;
		n = r;
235 236
	}

237
	PyTokenizer_Free(tok);
238 239

	return n;
Guido van Rossum's avatar
Guido van Rossum committed
240
}
241 242

static void
Jeremy Hylton's avatar
Jeremy Hylton committed
243
initerr(perrdetail *err_ret, const char *filename)
244 245
{
	err_ret->error = E_OK;
246
	err_ret->filename = filename;
247 248 249 250 251 252
	err_ret->lineno = 0;
	err_ret->offset = 0;
	err_ret->text = NULL;
	err_ret->token = -1;
	err_ret->expected = -1;
}