grammar.c 5.38 KB
Newer Older
1

Guido van Rossum's avatar
Guido van Rossum committed
2 3
/* Grammar implementation */

4
#include "Python.h"
Guido van Rossum's avatar
Guido van Rossum committed
5 6
#include "pgenheaders.h"

Guido van Rossum's avatar
Guido van Rossum committed
7 8 9 10 11
#include <ctype.h>

#include "token.h"
#include "grammar.h"

12
extern int Py_DebugFlag;
Guido van Rossum's avatar
Guido van Rossum committed
13 14

grammar *
Thomas Wouters's avatar
Thomas Wouters committed
15
newgrammar(int start)
Guido van Rossum's avatar
Guido van Rossum committed
16 17 18
{
	grammar *g;
	
19
	g = (grammar *)PyObject_MALLOC(sizeof(grammar));
Guido van Rossum's avatar
Guido van Rossum committed
20
	if (g == NULL)
21
		Py_FatalError("no mem for new grammar");
Guido van Rossum's avatar
Guido van Rossum committed
22 23 24 25 26
	g->g_ndfas = 0;
	g->g_dfa = NULL;
	g->g_start = start;
	g->g_ll.ll_nlabels = 0;
	g->g_ll.ll_label = NULL;
27
	g->g_accel = 0;
Guido van Rossum's avatar
Guido van Rossum committed
28 29 30 31
	return g;
}

dfa *
Thomas Wouters's avatar
Thomas Wouters committed
32
adddfa(grammar *g, int type, char *name)
Guido van Rossum's avatar
Guido van Rossum committed
33 34 35
{
	dfa *d;
	
36 37
	g->g_dfa = (dfa *)PyObject_REALLOC(g->g_dfa, 
                                            sizeof(dfa) * (g->g_ndfas + 1));
Guido van Rossum's avatar
Guido van Rossum committed
38
	if (g->g_dfa == NULL)
39
		Py_FatalError("no mem to resize dfa in adddfa");
Guido van Rossum's avatar
Guido van Rossum committed
40 41
	d = &g->g_dfa[g->g_ndfas++];
	d->d_type = type;
42
	d->d_name = strdup(name);
Guido van Rossum's avatar
Guido van Rossum committed
43 44 45 46 47 48 49 50
	d->d_nstates = 0;
	d->d_state = NULL;
	d->d_initial = -1;
	d->d_first = NULL;
	return d; /* Only use while fresh! */
}

int
Thomas Wouters's avatar
Thomas Wouters committed
51
addstate(dfa *d)
Guido van Rossum's avatar
Guido van Rossum committed
52 53 54
{
	state *s;
	
55 56
	d->d_state = (state *)PyObject_REALLOC(d->d_state,
				      sizeof(state) * (d->d_nstates + 1));
Guido van Rossum's avatar
Guido van Rossum committed
57
	if (d->d_state == NULL)
58
		Py_FatalError("no mem to resize state in addstate");
Guido van Rossum's avatar
Guido van Rossum committed
59 60 61
	s = &d->d_state[d->d_nstates++];
	s->s_narcs = 0;
	s->s_arc = NULL;
62 63 64 65
	s->s_lower = 0;
	s->s_upper = 0;
	s->s_accel = NULL;
	s->s_accept = 0;
Guido van Rossum's avatar
Guido van Rossum committed
66 67 68 69
	return s - d->d_state;
}

void
Thomas Wouters's avatar
Thomas Wouters committed
70
addarc(dfa *d, int from, int to, int lbl)
Guido van Rossum's avatar
Guido van Rossum committed
71 72 73 74 75 76 77 78
{
	state *s;
	arc *a;
	
	assert(0 <= from && from < d->d_nstates);
	assert(0 <= to && to < d->d_nstates);
	
	s = &d->d_state[from];
79
	s->s_arc = (arc *)PyObject_REALLOC(s->s_arc, sizeof(arc) * (s->s_narcs + 1));
Guido van Rossum's avatar
Guido van Rossum committed
80
	if (s->s_arc == NULL)
81
		Py_FatalError("no mem to resize arc list in addarc");
Guido van Rossum's avatar
Guido van Rossum committed
82 83 84 85 86 87
	a = &s->s_arc[s->s_narcs++];
	a->a_lbl = lbl;
	a->a_arrow = to;
}

int
Thomas Wouters's avatar
Thomas Wouters committed
88
addlabel(labellist *ll, int type, char *str)
Guido van Rossum's avatar
Guido van Rossum committed
89 90 91 92 93 94 95 96 97
{
	int i;
	label *lb;
	
	for (i = 0; i < ll->ll_nlabels; i++) {
		if (ll->ll_label[i].lb_type == type &&
			strcmp(ll->ll_label[i].lb_str, str) == 0)
			return i;
	}
98 99
	ll->ll_label = (label *)PyObject_REALLOC(ll->ll_label,
					sizeof(label) * (ll->ll_nlabels + 1));
Guido van Rossum's avatar
Guido van Rossum committed
100
	if (ll->ll_label == NULL)
101
		Py_FatalError("no mem to resize labellist in addlabel");
Guido van Rossum's avatar
Guido van Rossum committed
102 103
	lb = &ll->ll_label[ll->ll_nlabels++];
	lb->lb_type = type;
104 105
	lb->lb_str = strdup(str);
	if (Py_DebugFlag)
Guido van Rossum's avatar
Guido van Rossum committed
106
		printf("Label @ %8p, %d: %s\n", ll, ll->ll_nlabels,
107
		       PyGrammar_LabelRepr(lb));
Guido van Rossum's avatar
Guido van Rossum committed
108 109 110 111 112 113
	return lb - ll->ll_label;
}

/* Same, but rather dies than adds */

int
Thomas Wouters's avatar
Thomas Wouters committed
114
findlabel(labellist *ll, int type, char *str)
Guido van Rossum's avatar
Guido van Rossum committed
115 116 117 118 119 120 121 122 123
{
	int i;
	
	for (i = 0; i < ll->ll_nlabels; i++) {
		if (ll->ll_label[i].lb_type == type /*&&
			strcmp(ll->ll_label[i].lb_str, str) == 0*/)
			return i;
	}
	fprintf(stderr, "Label %d/'%s' not found\n", type, str);
124
	Py_FatalError("grammar.c:findlabel()");
Guido van Rossum's avatar
Guido van Rossum committed
125
	return 0; /* Make gcc -Wall happy */
Guido van Rossum's avatar
Guido van Rossum committed
126 127
}

Guido van Rossum's avatar
Guido van Rossum committed
128
/* Forward */
129
static void translabel(grammar *, label *);
Guido van Rossum's avatar
Guido van Rossum committed
130 131

void
Thomas Wouters's avatar
Thomas Wouters committed
132
translatelabels(grammar *g)
Guido van Rossum's avatar
Guido van Rossum committed
133 134
{
	int i;
135

136
#ifdef Py_DEBUG
Guido van Rossum's avatar
Guido van Rossum committed
137
	printf("Translating labels ...\n");
138
#endif
Guido van Rossum's avatar
Guido van Rossum committed
139 140 141 142 143
	/* Don't translate EMPTY */
	for (i = EMPTY+1; i < g->g_ll.ll_nlabels; i++)
		translabel(g, &g->g_ll.ll_label[i]);
}

Guido van Rossum's avatar
Guido van Rossum committed
144
static void
Thomas Wouters's avatar
Thomas Wouters committed
145
translabel(grammar *g, label *lb)
Guido van Rossum's avatar
Guido van Rossum committed
146 147 148
{
	int i;
	
149 150
	if (Py_DebugFlag)
		printf("Translating label %s ...\n", PyGrammar_LabelRepr(lb));
Guido van Rossum's avatar
Guido van Rossum committed
151 152 153 154
	
	if (lb->lb_type == NAME) {
		for (i = 0; i < g->g_ndfas; i++) {
			if (strcmp(lb->lb_str, g->g_dfa[i].d_name) == 0) {
155 156 157 158 159
				if (Py_DebugFlag)
					printf(
					    "Label %s is non-terminal %d.\n",
					    lb->lb_str,
					    g->g_dfa[i].d_type);
Guido van Rossum's avatar
Guido van Rossum committed
160
				lb->lb_type = g->g_dfa[i].d_type;
161
				free(lb->lb_str);
Guido van Rossum's avatar
Guido van Rossum committed
162 163 164 165 166
				lb->lb_str = NULL;
				return;
			}
		}
		for (i = 0; i < (int)N_TOKENS; i++) {
167 168
			if (strcmp(lb->lb_str, _PyParser_TokenNames[i]) == 0) {
				if (Py_DebugFlag)
Guido van Rossum's avatar
Guido van Rossum committed
169 170 171
					printf("Label %s is terminal %d.\n",
						lb->lb_str, i);
				lb->lb_type = i;
172
				free(lb->lb_str);
Guido van Rossum's avatar
Guido van Rossum committed
173 174 175 176 177 178 179 180 181
				lb->lb_str = NULL;
				return;
			}
		}
		printf("Can't translate NAME label '%s'\n", lb->lb_str);
		return;
	}
	
	if (lb->lb_type == STRING) {
182 183
		if (isalpha(Py_CHARMASK(lb->lb_str[1])) ||
		    lb->lb_str[1] == '_') {
184
			char *p;
185 186 187
			char *src;
			char *dest;
			size_t name_len;
188
			if (Py_DebugFlag)
Guido van Rossum's avatar
Guido van Rossum committed
189 190
				printf("Label %s is a keyword\n", lb->lb_str);
			lb->lb_type = NAME;
191 192
			src = lb->lb_str + 1;
			p = strchr(src, '\'');
Guido van Rossum's avatar
Guido van Rossum committed
193
			if (p)
194 195 196
				name_len = p - src;
			else
				name_len = strlen(src);
197
			dest = (char *)malloc(name_len + 1);
198 199 200 201
			if (!dest) {
				printf("Can't alloc dest '%s'\n", src);
				return;
			}
202 203 204 205
			strncpy(dest, src, name_len);
			dest[name_len] = '\0';
			free(lb->lb_str);
			lb->lb_str = dest;
Guido van Rossum's avatar
Guido van Rossum committed
206
		}
207
		else if (lb->lb_str[2] == lb->lb_str[0]) {
208
			int type = (int) PyToken_OneChar(lb->lb_str[1]);
209 210
			if (type != OP) {
				lb->lb_type = type;
211
				free(lb->lb_str);
212 213 214 215 216 217 218
				lb->lb_str = NULL;
			}
			else
				printf("Unknown OP label %s\n",
					lb->lb_str);
		}
		else if (lb->lb_str[2] && lb->lb_str[3] == lb->lb_str[0]) {
219
			int type = (int) PyToken_TwoChars(lb->lb_str[1],
220 221 222
						   lb->lb_str[2]);
			if (type != OP) {
				lb->lb_type = type;
223
				free(lb->lb_str);
224
				lb->lb_str = NULL;
Guido van Rossum's avatar
Guido van Rossum committed
225 226
			}
			else
227
				printf("Unknown OP label %s\n",
Guido van Rossum's avatar
Guido van Rossum committed
228 229
					lb->lb_str);
		}
230 231 232 233 234 235
		else if (lb->lb_str[2] && lb->lb_str[3] && lb->lb_str[4] == lb->lb_str[0]) {
			int type = (int) PyToken_ThreeChars(lb->lb_str[1],
							    lb->lb_str[2],
							    lb->lb_str[3]);
			if (type != OP) {
				lb->lb_type = type;
236
				free(lb->lb_str);
237 238 239 240 241 242
				lb->lb_str = NULL;
			}
			else
				printf("Unknown OP label %s\n",
					lb->lb_str);
		}
243 244 245
		else
			printf("Can't translate STRING label %s\n",
				lb->lb_str);
Guido van Rossum's avatar
Guido van Rossum committed
246 247
	}
	else
248 249
		printf("Can't translate label '%s'\n",
		       PyGrammar_LabelRepr(lb));
Guido van Rossum's avatar
Guido van Rossum committed
250
}