forked from DoctorWkt/acwj
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdecl.c
529 lines (467 loc) · 15 KB
/
decl.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
#include "defs.h"
#include "data.h"
#include "decl.h"
// Parsing of declarations
// Copyright (c) 2019 Warren Toomey, GPL3
static struct symtable *composite_declaration(int type);
static void enum_declaration(void);
int typedef_declaration(struct symtable **ctype);
int type_of_typedef(char *name, struct symtable **ctype);
// Parse the current token and return a
// primitive type enum value, a pointer
// to any composite type and possibly
// modify the class of the type.
// Also scan in the next token.
int parse_type(struct symtable **ctype, int *class) {
int type, exstatic=1;
// See if the class has been changed to extern (later, static)
while (exstatic) {
switch (Token.token) {
case T_EXTERN: *class= C_EXTERN; scan(&Token); break;
default: exstatic= 0;
}
}
// Now work on the actual type keyword
switch (Token.token) {
case T_VOID:
type = P_VOID;
scan(&Token);
break;
case T_CHAR:
type = P_CHAR;
scan(&Token);
break;
case T_INT:
type = P_INT;
scan(&Token);
break;
case T_LONG:
type = P_LONG;
scan(&Token);
break;
// For the following, if we have a ';' after the
// parsing then there is no type, so return -1
case T_STRUCT:
type = P_STRUCT;
*ctype = composite_declaration(P_STRUCT);
if (Token.token == T_SEMI)
type = -1;
break;
case T_UNION:
type = P_UNION;
*ctype = composite_declaration(P_UNION);
if (Token.token == T_SEMI)
type = -1;
break;
case T_ENUM:
type = P_INT; // Enums are really ints
enum_declaration();
if (Token.token == T_SEMI)
type = -1;
break;
case T_TYPEDEF:
type = typedef_declaration(ctype);
if (Token.token == T_SEMI)
type = -1;
break;
case T_IDENT:
type = type_of_typedef(Text, ctype);
break;
default:
fatald("Illegal type, token", Token.token);
}
// Scan in one or more further '*' tokens
// and determine the correct pointer type
while (1) {
if (Token.token != T_STAR)
break;
type = pointer_to(type);
scan(&Token);
}
// We leave with the next token already scanned
return (type);
}
// variable_declaration: type identifier ';'
// | type identifier '[' INTLIT ']' ';'
// ;
//
// Parse the declaration of a scalar variable or an array
// with a given size.
// The identifier has been scanned & we have the type.
// class is the variable's class
// Return the pointer to variable's entry in the symbol table
struct symtable *var_declaration(int type, struct symtable *ctype, int class) {
struct symtable *sym = NULL;
// See if this has already been declared
switch (class) {
case C_EXTERN:
case C_GLOBAL:
if (findglob(Text) != NULL)
fatals("Duplicate global variable declaration", Text);
case C_LOCAL:
case C_PARAM:
if (findlocl(Text) != NULL)
fatals("Duplicate local variable declaration", Text);
case C_MEMBER:
if (findmember(Text) != NULL)
fatals("Duplicate struct/union member declaration", Text);
}
// Text now has the identifier's name.
// If the next token is a '['
if (Token.token == T_LBRACKET) {
// Skip past the '['
scan(&Token);
// Check we have an array size
if (Token.token == T_INTLIT) {
// Add this as a known array and generate its space in assembly.
// We treat the array as a pointer to its elements' type
switch (class) {
case C_EXTERN:
case C_GLOBAL:
sym =
addglob(Text, pointer_to(type), ctype, S_ARRAY, class, Token.intvalue);
break;
case C_LOCAL:
case C_PARAM:
case C_MEMBER:
fatal
("For now, declaration of non-global arrays is not implemented");
}
}
// Ensure we have a following ']'
scan(&Token);
match(T_RBRACKET, "]");
} else {
// Add this as a known scalar
// and generate its space in assembly
switch (class) {
case C_EXTERN:
case C_GLOBAL:
sym = addglob(Text, type, ctype, S_VARIABLE, class, 1);
break;
case C_LOCAL:
sym = addlocl(Text, type, ctype, S_VARIABLE, 1);
break;
case C_PARAM:
sym = addparm(Text, type, ctype, S_VARIABLE, 1);
break;
case C_MEMBER:
sym = addmemb(Text, type, ctype, S_VARIABLE, 1);
break;
}
}
return (sym);
}
// var_declaration_list: <null>
// | variable_declaration
// | variable_declaration separate_token var_declaration_list ;
//
// When called to parse function parameters, separate_token is ','.
// When called to parse members of a struct/union, separate_token is ';'.
//
// Parse a list of variables.
// Add them as symbols to one of the symbol table lists, and return the
// number of variables. If funcsym is not NULL, there is an existing function
// prototype, so compare each variable's type against this prototype.
static int var_declaration_list(struct symtable *funcsym, int class,
int separate_token, int end_token) {
int type;
int paramcnt = 0;
struct symtable *protoptr = NULL;
struct symtable *ctype;
// If there is a prototype, get the pointer
// to the first prototype parameter
if (funcsym != NULL)
protoptr = funcsym->member;
// Loop until the final end token
while (Token.token != end_token) {
// Get the type and identifier
type = parse_type(&ctype, &class);
ident();
// Check that this type matches the prototype if there is one
if (protoptr != NULL) {
if (type != protoptr->type)
fatald("Type doesn't match prototype for parameter", paramcnt + 1);
protoptr = protoptr->next;
} else {
// Add a new parameter to the right symbol table list, based on the class
var_declaration(type, ctype, class);
}
paramcnt++;
// Must have a separate_token or ')' at this point
if ((Token.token != separate_token) && (Token.token != end_token))
fatald("Unexpected token in parameter list", Token.token);
if (Token.token == separate_token)
scan(&Token);
}
// Check that the number of parameters in this list matches
// any existing prototype
if ((funcsym != NULL) && (paramcnt != funcsym->nelems))
fatals("Parameter count mismatch for function", funcsym->name);
// Return the count of parameters
return (paramcnt);
}
//
// function_declaration: type identifier '(' parameter_list ')' ;
// | type identifier '(' parameter_list ')' compound_statement ;
//
// Parse the declaration of function.
// The identifier has been scanned & we have the type.
struct ASTnode *function_declaration(int type) {
struct ASTnode *tree, *finalstmt;
struct symtable *oldfuncsym, *newfuncsym = NULL;
int endlabel, paramcnt;
// Text has the identifier's name. If this exists and is a
// function, get the id. Otherwise, set oldfuncsym to NULL.
if ((oldfuncsym = findsymbol(Text)) != NULL)
if (oldfuncsym->stype != S_FUNCTION)
oldfuncsym = NULL;
// If this is a new function declaration, get a
// label-id for the end label, and add the function
// to the symbol table,
if (oldfuncsym == NULL) {
endlabel = genlabel();
// Assumtion: functions only return scalar types, so NULL below
newfuncsym = addglob(Text, type, NULL, S_FUNCTION, C_GLOBAL, endlabel);
}
// Scan in the '(', any parameters and the ')'.
// Pass in any existing function prototype pointer
lparen();
paramcnt = var_declaration_list(oldfuncsym, C_PARAM, T_COMMA, T_RPAREN);
rparen();
// If this is a new function declaration, update the
// function symbol entry with the number of parameters.
// Also copy the parameter list into the function's node.
if (newfuncsym) {
newfuncsym->nelems = paramcnt;
newfuncsym->member = Parmhead;
oldfuncsym = newfuncsym;
}
// Clear out the parameter list
Parmhead = Parmtail = NULL;
// Declaration ends in a semicolon, only a prototype.
if (Token.token == T_SEMI) {
scan(&Token);
return (NULL);
}
// This is not just a prototype.
// Set the Functionid global to the function's symbol pointer
Functionid = oldfuncsym;
// Get the AST tree for the compound statement and mark
// that we have parsed no loops yet
Looplevel= 0;
tree = compound_statement();
// If the function type isn't P_VOID ..
if (type != P_VOID) {
// Error if no statements in the function
if (tree == NULL)
fatal("No statements in function with non-void type");
// Check that the last AST operation in the
// compound statement was a return statement
finalstmt = (tree->op == A_GLUE) ? tree->right : tree;
if (finalstmt == NULL || finalstmt->op != A_RETURN)
fatal("No return for function with non-void type");
}
// Return an A_FUNCTION node which has the function's symbol pointer
// and the compound statement sub-tree
return (mkastunary(A_FUNCTION, type, tree, oldfuncsym, endlabel));
}
// Parse composite type declarations: structs or unions.
// Either find an existing struct/union declaration, or build
// a struct/union symbol table entry and return its pointer.
static struct symtable *composite_declaration(int type) {
struct symtable *ctype = NULL;
struct symtable *m;
int offset;
// Skip the struct/union keyword
scan(&Token);
// See if there is a following struct/union name
if (Token.token == T_IDENT) {
// Find any matching composite type
if (type == P_STRUCT)
ctype = findstruct(Text);
else
ctype = findunion(Text);
scan(&Token);
}
// If the next token isn't an LBRACE , this is
// the usage of an existing struct/union type.
// Return the pointer to the type.
if (Token.token != T_LBRACE) {
if (ctype == NULL)
fatals("unknown struct/union type", Text);
return (ctype);
}
// Ensure this struct/union type hasn't been
// previously defined
if (ctype)
fatals("previously defined struct/union", Text);
// Build the composite type and skip the left brace
if (type == P_STRUCT)
ctype = addstruct(Text, P_STRUCT, NULL, 0, 0);
else
ctype = addunion(Text, P_UNION, NULL, 0, 0);
scan(&Token);
// Scan in the list of members and attach
// to the struct type's node
var_declaration_list(NULL, C_MEMBER, T_SEMI, T_RBRACE);
rbrace();
ctype->member = Membhead;
Membhead = Membtail = NULL;
// Set the offset of the initial member
// and find the first free byte after it
m = ctype->member;
m->posn = 0;
offset = typesize(m->type, m->ctype);
// Set the position of each successive member in the composite type
// Unions are easy. For structs, align the member and find the next free byte
for (m = m->next; m != NULL; m = m->next) {
// Set the offset for this member
if (type == P_STRUCT)
m->posn = genalign(m->type, offset, 1);
else
m->posn = 0;
// Get the offset of the next free byte after this member
offset += typesize(m->type, m->ctype);
}
// Set the overall size of the composite type
ctype->size = offset;
return (ctype);
}
// Parse an enum declaration
static void enum_declaration(void) {
struct symtable *etype = NULL;
char *name;
int intval = 0;
// Skip the enum keyword.
scan(&Token);
// If there's a following enum type name, get a
// pointer to any existing enum type node.
if (Token.token == T_IDENT) {
etype = findenumtype(Text);
name = strdup(Text); // As it gets tromped soon
scan(&Token);
}
// If the next token isn't a LBRACE, check
// that we have an enum type name, then return
if (Token.token != T_LBRACE) {
if (etype == NULL)
fatals("undeclared enum type:", name);
return;
}
// We do have an LBRACE. Skip it
scan(&Token);
// If we have an enum type name, ensure that it
// hasn't been declared before.
if (etype != NULL)
fatals("enum type redeclared:", etype->name);
else
// Build an enum type node for this identifier
etype = addenum(name, C_ENUMTYPE, 0);
// Loop to get all the enum values
while (1) {
// Ensure we have an identifier
// Copy it in case there's an int literal coming up
ident();
name = strdup(Text);
// Ensure this enum value hasn't been declared before
etype = findenumval(name);
if (etype != NULL)
fatals("enum value redeclared:", Text);
// If the next token is an '=', skip it and
// get the following int literal
if (Token.token == T_ASSIGN) {
scan(&Token);
if (Token.token != T_INTLIT)
fatal("Expected int literal after '='");
intval = Token.intvalue;
scan(&Token);
}
// Build an enum value node for this identifier.
// Increment the value for the next enum identifier.
etype = addenum(name, C_ENUMVAL, intval++);
// Bail out on a right curly bracket, else get a comma
if (Token.token == T_RBRACE)
break;
comma();
}
scan(&Token); // Skip over the right curly bracket
}
// Parse a typedef declaration and return the type
// and ctype that it represents
int typedef_declaration(struct symtable **ctype) {
int type, class=0;
// Skip the typedef keyword.
scan(&Token);
// Get the actual type following the keyword
type = parse_type(ctype, &class);
if (class != 0)
fatal("Can't have extern in a typedef declaration");
// See if the typedef identifier already exists
if (findtypedef(Text) != NULL)
fatals("redefinition of typedef", Text);
// It doesn't exist so add it to the typedef list
addtypedef(Text, type, *ctype, 0, 0);
scan(&Token);
return (type);
}
// Given a typedef name, return the type it represents
int type_of_typedef(char *name, struct symtable **ctype) {
struct symtable *t;
// Look up the typedef in the list
t = findtypedef(name);
if (t == NULL)
fatals("unknown type", name);
scan(&Token);
*ctype = t->ctype;
return (t->type);
}
// Parse one or more global declarations, either
// variables, functions or structs
void global_declarations(void) {
struct ASTnode *tree;
struct symtable *ctype;
int type, class= C_GLOBAL;
while (1) {
// Stop when we have reached EOF
if (Token.token == T_EOF)
break;
// Get the type
type = parse_type(&ctype, &class);
// We might have just parsed a struct, union or enum
// declaration with no associated variable.
// The next token might be a ';'. Loop back if it is.
// XXX: I'm not happy with this as it allows
// "struct fred;" as an accepted statement
if (type == -1) {
semi();
continue;
}
// We have to read past the identifier
// to see either a '(' for a function declaration
// or a ',' or ';' for a variable declaration.
// Text is filled in by the ident() call.
ident();
if (Token.token == T_LPAREN) {
// Parse the function declaration
tree = function_declaration(type);
// Only a function prototype, no code
if (tree == NULL)
continue;
// A real function, generate the assembly code for it
if (O_dumpAST) {
dumpAST(tree, NOLABEL, 0);
fprintf(stdout, "\n\n");
}
genAST(tree, NOLABEL, NOLABEL, NOLABEL, 0);
// Now free the symbols associated
// with this function
freeloclsyms();
} else {
// Parse the global variable declaration
// and skip past the trailing semicolon
var_declaration(type, ctype, class);
semi();
}
}
}