-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathparse.c
2565 lines (2221 loc) · 69.3 KB
/
parse.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
#include "rvcc.h"
// Scope entry shared by local variables, global variables, typedefs and
// enum constants (they all live in the same name space).
typedef struct VarScope VarScope;
// One named entry in a scope's variable list.
struct VarScope {
VarScope *Next; // next entry in the same scope
char *Name; // name the entry is looked up by
Obj *Var; // variable bound to the name (set by newVar)
Type *Typedef; // aliased type when the name is a typedef
Type *EnumTy; // enum type when the name is an enum constant
int EnumVal; // value of the enum constant
};
// Scope entry for struct tags, union tags and enum tags.
typedef struct TagScope TagScope;
struct TagScope {
TagScope *Next; // next tag entry in the same scope
char *Name; // tag name
Type *Ty; // type the tag refers to
};
// Represents one block scope.
typedef struct Scope Scope;
struct Scope {
Scope *Next; // enclosing (outer) scope
// C has two name spaces per block: one for variables / typedef names and
// one for struct / union / enum tags.
VarScope *Vars; // variable entries declared in this scope
TagScope *Tags; // tag entries declared in this scope
};
// Attributes collected from declaration specifiers (storage class and
// alignment). Filled in by declspec when the caller passes a non-NULL pointer.
typedef struct {
bool IsStatic; // "static" was seen
bool IsTypedef; // "typedef" was seen
bool IsExtern; // "extern" was seen
int Align; // alignment requested through _Alignas
} VarAttr;
// A variable initializer. Initializers form a tree because they can be
// nested, e.g. int x[2][2] = {{1, 2}, {3, 4}}.
typedef struct Initializer Initializer;
struct Initializer {
Initializer *Next; // next initializer
Type *Ty; // type of the object being initialized
Token *Tok; // representative token
bool IsFlexible; // length not known yet; the initializer must be rebuilt
// For a non-aggregate type with an initializer, Expr holds the
// initialization expression.
Node *Expr;
// For an aggregate type (array, struct or union), Children holds one
// initializer per element / member.
Initializer **Children;
};
// Designator used when expanding a local variable's initializer.
typedef struct InitDesig InitDesig;
struct InitDesig {
InitDesig *Next; // next designator
int Idx; // index within an array
Member *Mem; // struct / union member
Obj *Var; // variable being initialized
};
// Every variable created while parsing is accumulated in one of these lists.
Obj *Locals; // local variables
Obj *Globals; // global variables
// Head of the scope list; the head is the innermost scope.
static Scope *Scp = &(Scope){};
// The function currently being parsed.
static Obj *CurrentFn;
// goto statements and labels seen in the current function.
static Node *Gotos;
static Node *Labels;
// Jump target of the current "break".
// NOTE(review): the original comment said "goto"; the variable name suggests
// break -- confirm against the statement parser.
static char *BrkLabel;
// Jump target of the current "continue".
static char *ContLabel;
// Points to the node of the switch statement being parsed,
// or NULL when not inside a switch.
static Node *CurrentSwitch;
// program = (typedef | functionDefinition | globalVariable)*
// functionDefinition = declspec declarator "{" compoundStmt*
// declspec = ("void" | "_Bool" | "char" | "short" | "int" | "long"
// | "typedef" | "static" | "extern"
// | "_Alignas" ("(" typeName | constExpr ")")
// | structDecl | unionDecl | typedefName
// | enumSpecifier)+
// enumSpecifier = ident? "{" enumList? "}"
// | ident ("{" enumList? "}")?
// enumList = ident ("=" constExpr)? ("," ident ("=" constExpr)?)* ","?
// declarator = "*"* ("(" ident ")" | "(" declarator ")" | ident) typeSuffix
// typeSuffix = "(" funcParams | "[" arrayDimensions | ε
// arrayDimensions = constExpr? "]" typeSuffix
// funcParams = ("void" | param ("," param)*)? ")"
// param = declspec declarator
// compoundStmt = (typedef | declaration | stmt)* "}"
// declaration = declspec (declarator ("=" initializer)?
// ("," declarator ("=" initializer)?)*)? ";"
// initializer = stringInitializer | arrayInitializer | structInitializer
// | unionInitializer | assign
// stringInitializer = stringLiteral
// arrayInitializer = arrayInitializer1 | arrayInitializer2
// arrayInitializer1 = "{" initializer ("," initializer)* ","? "}"
// arrayInitializer2 = initializer ("," initializer)* ","?
// structInitializer = structInitializer1 | structInitializer2
// structInitializer1 = "{" initializer ("," initializer)* ","? "}"
// structInitializer2 = initializer ("," initializer)* ","?
// unionInitializer = "{" initializer "}"
// stmt = "return" expr ";"
// | "if" "(" expr ")" stmt ("else" stmt)?
// | "switch" "(" expr ")" stmt
// | "case" constExpr ":" stmt
// | "default" ":" stmt
// | "for" "(" exprStmt expr? ";" expr? ")" stmt
// | "while" "(" expr ")" stmt
// | "goto" ident ";"
// | "break" ";"
// | "continue" ";"
// | ident ":" stmt
// | "{" compoundStmt
// | exprStmt
// exprStmt = expr? ";"
// expr = assign ("," expr)?
// assign = conditional (assignOp assign)?
// conditional = logOr ("?" expr ":" conditional)?
// logOr = logAnd ("||" logAnd)*
// logAnd = bitOr ("&&" bitOr)*
// bitOr = bitXor ("|" bitXor)*
// bitXor = bitAnd ("^" bitAnd)*
// bitAnd = equality ("&" equality)*
// assignOp = "=" | "+=" | "-=" | "*=" | "/=" | "%=" | "&=" | "|=" | "^="
// equality = relational ("==" relational | "!=" relational)*
// relational = shift ("<" shift | "<=" shift | ">" shift | ">=" shift)*
// shift = add ("<<" add | ">>" add)*
// add = mul ("+" mul | "-" mul)*
// mul = cast ("*" cast | "/" cast | "%" cast)*
// cast = "(" typeName ")" cast | unary
// unary = ("+" | "-" | "*" | "&" | "!" | "~") cast
// | ("++" | "--") unary
// | postfix
// structMembers = (declspec declarator ("," declarator)* ";")*
// structDecl = structUnionDecl
// unionDecl = structUnionDecl
// structUnionDecl = ident? ("{" structMembers)?
// postfix = primary ("[" expr "]" | "." ident | "->" ident | "++" | "--")*
// primary = "(" "{" stmt+ "}" ")"
// | "(" expr ")"
// | "sizeof" "(" typeName ")"
// | "sizeof" unary
// | "_Alignof" "(" typeName ")"
// | "_Alignof" unary
// | ident funcArgs?
// | str
// | num
// typeName = declspec abstractDeclarator
// abstractDeclarator = "*"* ("(" abstractDeclarator ")")? typeSuffix
// funcall = ident "(" (assign ("," assign)*)? ")"
// Forward declarations. The parser is recursive-descent, so many of these
// functions call each other before their definitions appear in the file.
// Parsing functions follow one convention: Tok is the first token to read
// and *Rest receives the first token that was not consumed.
static bool isTypename(Token *Tok);
static Type *declspec(Token **Rest, Token *Tok, VarAttr *Attr);
static Type *typename(Token **Rest, Token *Tok);
static Type *enumSpecifier(Token **Rest, Token *Tok);
static Type *typeSuffix(Token **Rest, Token *Tok, Type *Ty);
static Type *declarator(Token **Rest, Token *Tok, Type *Ty);
static Node *declaration(Token **Rest, Token *Tok, Type *BaseTy, VarAttr *Attr);
static void initializer2(Token **Rest, Token *Tok, Initializer *Init);
static Initializer *initializer(Token **Rest, Token *Tok, Type *Ty,
Type **NewTy);
static Node *LVarInitializer(Token **Rest, Token *Tok, Obj *Var);
static void GVarInitializer(Token **Rest, Token *Tok, Obj *Var);
static Node *compoundStmt(Token **Rest, Token *Tok);
static Node *stmt(Token **Rest, Token *Tok);
static Node *exprStmt(Token **Rest, Token *Tok);
static Node *expr(Token **Rest, Token *Tok);
static int64_t eval(Node *Nd);
static int64_t eval2(Node *Nd, char **Label);
static int64_t evalRVal(Node *Nd, char **Label);
static int64_t constExpr(Token **Rest, Token *Tok);
static Node *assign(Token **Rest, Token *Tok);
static Node *conditional(Token **Rest, Token *Tok);
static Node *logOr(Token **Rest, Token *Tok);
static Node *logAnd(Token **Rest, Token *Tok);
static Node *bitOr(Token **Rest, Token *Tok);
static Node *bitXor(Token **Rest, Token *Tok);
static Node *bitAnd(Token **Rest, Token *Tok);
static Node *equality(Token **Rest, Token *Tok);
static Node *relational(Token **Rest, Token *Tok);
static Node *shift(Token **Rest, Token *Tok);
static Node *add(Token **Rest, Token *Tok);
static Node *newAdd(Node *LHS, Node *RHS, Token *Tok);
static Node *newSub(Node *LHS, Node *RHS, Token *Tok);
static Node *mul(Token **Rest, Token *Tok);
static Node *cast(Token **Rest, Token *Tok);
static Type *structDecl(Token **Rest, Token *Tok);
static Type *unionDecl(Token **Rest, Token *Tok);
static Node *unary(Token **Rest, Token *Tok);
static Node *postfix(Token **Rest, Token *Tok);
static Node *primary(Token **Rest, Token *Tok);
static Token *parseTypedef(Token *Tok, Type *BaseTy);
static bool isFunction(Token *Tok);
static Token *function(Token *Tok, Type *BaseTy, VarAttr *Attr);
static Token *globalVariable(Token *Tok, Type *Basety, VarAttr *Attr);
// Open a new block scope and make it the current (innermost) one.
static void enterScope(void) {
  Scope *Inner = calloc(1, sizeof(*Inner));
  // The scope list behaves like a stack: the newest scope becomes the head
  // and links back to the scope that was current until now.
  Inner->Next = Scp;
  Scp = Inner;
}
// Close the current scope: the enclosing scope becomes current again.
static void leaveScope(void) {
  Scp = Scp->Next;
}
// Look up the variable-scope entry whose name matches Tok.
// Scopes are searched from the innermost outwards, so the first hit is the
// most deeply nested declaration. Returns NULL when nothing matches.
static VarScope *findVar(Token *Tok) {
  Scope *Blk = Scp;
  while (Blk) {
    VarScope *Entry = Blk->Vars;
    while (Entry) {
      if (equal(Tok, Entry->Name))
        return Entry;
      Entry = Entry->Next;
    }
    Blk = Blk->Next;
  }
  return NULL;
}
// Look up the type registered under the struct / union / enum tag spelled by
// Tok, searching from the innermost scope outwards. Returns NULL if the tag
// is unknown.
static Type *findTag(Token *Tok) {
  Scope *Blk = Scp;
  while (Blk) {
    TagScope *Entry = Blk->Tags;
    while (Entry) {
      if (equal(Tok, Entry->Name))
        return Entry->Ty;
      Entry = Entry->Next;
    }
    Blk = Blk->Next;
  }
  return NULL;
}
// Allocate a zero-initialized AST node of the given kind, tagged with Tok.
static Node *newNode(NodeKind Kind, Token *Tok) {
  Node *Fresh = calloc(1, sizeof(*Fresh));
  Fresh->Tok = Tok;
  Fresh->Kind = Kind;
  return Fresh;
}
// Create a node with a single operand; the operand is stored in LHS.
static Node *newUnary(NodeKind Kind, Node *Expr, Token *Tok) {
  Node *Parent = newNode(Kind, Tok);
  Parent->LHS = Expr;
  return Parent;
}
// Create a node with two operands.
static Node *newBinary(NodeKind Kind, Node *LHS, Node *RHS, Token *Tok) {
  Node *Parent = newNode(Kind, Tok);
  Parent->RHS = RHS;
  Parent->LHS = LHS;
  return Parent;
}
// Create a numeric literal node holding Val. The node's type is left unset.
static Node *newNum(int64_t Val, Token *Tok) {
  Node *Literal = newNode(ND_NUM, Tok);
  Literal->Val = Val;
  return Literal;
}
// Create a numeric literal node holding Val whose type is fixed to long.
static Node *newLong(int64_t Val, Token *Tok) {
  Node *Literal = newNum(Val, Tok);
  Literal->Ty = TyLong;
  return Literal;
}
// Create a node that refers to the variable Var.
static Node *newVarNode(Obj *Var, Token *Tok) {
  Node *Ref = newNode(ND_VAR, Tok);
  Ref->Var = Var;
  return Ref;
}
// Build a cast node representing (Ty)Expr.
// Expr is typed first; the cast node reuses Expr's token and owns a private
// copy of Ty.
Node *newCast(Node *Expr, Type *Ty) {
  addType(Expr);

  Node *Conv = newNode(ND_CAST, Expr->Tok);
  Conv->LHS = Expr;
  Conv->Ty = copyType(Ty);
  return Conv;
}
// Add an empty entry called Name to the current scope's variable list and
// return it so the caller can fill in what the name denotes.
static VarScope *pushScope(char *Name) {
  VarScope *Entry = calloc(1, sizeof(*Entry));
  Entry->Name = Name;
  // Newest entries go to the front of the list.
  Entry->Next = Scp->Vars;
  Scp->Vars = Entry;
  return Entry;
}
// Build an initializer tree shaped like Ty.
//
// Arrays get one child per element and structs / unions get one child per
// member (indexed by Member::Idx); every other type yields a leaf.
// When IsFlexible is set, an array whose size is still unknown (Size < 0),
// or the last member of a struct / union marked flexible, is only flagged as
// IsFlexible and gets no children -- it is rebuilt once its length is known.
static Initializer *newInitializer(Type *Ty, bool IsFlexible) {
  Initializer *Result = calloc(1, sizeof(*Result));
  // Remember the type this initializer was created for.
  Result->Ty = Ty;

  switch (Ty->Kind) {
  case TY_ARRAY: {
    // Incomplete array that may still be resized: defer construction.
    if (IsFlexible && Ty->Size < 0) {
      Result->IsFlexible = true;
      return Result;
    }

    Result->Children = calloc(Ty->ArrayLen, sizeof(Initializer *));
    int Idx = 0;
    while (Idx < Ty->ArrayLen) {
      Result->Children[Idx] = newInitializer(Ty->Base, false);
      Idx++;
    }
    return Result;
  }
  case TY_STRUCT:
  case TY_UNION: {
    // Count the members to size the child table.
    int Count = 0;
    for (Member *M = Ty->Mems; M; M = M->Next)
      Count++;
    Result->Children = calloc(Count, sizeof(Initializer *));

    // Only the trailing member of a flexible aggregate is built lazily.
    bool FlexTail = IsFlexible && Ty->IsFlexible;
    for (Member *M = Ty->Mems; M; M = M->Next) {
      if (FlexTail && !M->Next) {
        Initializer *Tail = calloc(1, sizeof(*Tail));
        Tail->Ty = M->Ty;
        Tail->IsFlexible = true;
        Result->Children[M->Idx] = Tail;
        continue;
      }
      Result->Children[M->Idx] = newInitializer(M->Ty, false);
    }
    return Result;
  }
  default:
    return Result;
  }
}
// Create a variable object named Name of type Ty and register it in the
// current scope. The variable's alignment defaults to that of its type.
static Obj *newVar(char *Name, Type *Ty) {
  Obj *Created = calloc(1, sizeof(*Created));
  Created->Ty = Ty;
  Created->Name = Name;
  Created->Align = Ty->Align;

  VarScope *Entry = pushScope(Name);
  Entry->Var = Created;
  return Created;
}
// Create a local variable and put it at the head of the Locals list.
static Obj *newLVar(char *Name, Type *Ty) {
  Obj *Local = newVar(Name, Ty);
  Local->Next = Locals;
  Local->IsLocal = true;
  Locals = Local;
  return Local;
}
// Create a global variable, mark it as a definition and put it at the head
// of the Globals list.
static Obj *newGVar(char *Name, Type *Ty) {
  Obj *Global = newVar(Name, Ty);
  Global->IsDefinition = true;
  Global->Next = Globals;
  Globals = Global;
  return Global;
}
// Produce a fresh name of the form ".L..<n>", where <n> starts at 0 and
// increases by one on every call.
static char *newUniqueName(void) {
  static int Counter = 0;
  char *Name = format(".L..%d", Counter);
  Counter++;
  return Name;
}
// Create a global variable of type Ty under a freshly generated unique name.
static Obj *newAnonGVar(Type *Ty) {
  char *Name = newUniqueName();
  return newGVar(Name, Ty);
}
// Create an anonymous global of type Ty whose initial data is Str.
static Obj *newStringLiteral(char *Str, Type *Ty) {
  Obj *Literal = newAnonGVar(Ty);
  Literal->InitData = Str;
  return Literal;
}
// Return a newly allocated copy of the identifier spelled by Tok.
// Reports an error at Tok if it is not an identifier token.
static char *getIdent(Token *Tok) {
  bool IsIdent = Tok->Kind == TK_IDENT;
  if (!IsIdent)
    errorTok(Tok, "expected an identifier");

  char *Copy = strndup(Tok->Loc, Tok->Len);
  return Copy;
}
// If Tok is an identifier that names an entry in scope, return that entry's
// typedef type (NULL when the entry is not a typedef). Returns NULL for
// non-identifiers and unknown names.
static Type *findTypedef(Token *Tok) {
  // Only identifiers can be typedef names.
  if (Tok->Kind != TK_IDENT)
    return NULL;

  VarScope *Entry = findVar(Tok);
  return Entry ? Entry->Typedef : NULL;
}
// Register Ty under the tag name spelled by Tok in the current scope.
// The name is copied out of the token text.
static void pushTagScope(Token *Tok, Type *Ty) {
  TagScope *Entry = calloc(1, sizeof(*Entry));
  Entry->Ty = Ty;
  Entry->Name = strndup(Tok->Loc, Tok->Len);
  // Newest entries go to the front of the tag list.
  Entry->Next = Scp->Tags;
  Scp->Tags = Entry;
}
// declspec = ("void" | "_Bool" | "char" | "short" | "int" | "long"
//            | "typedef" | "static" | "extern"
//            | "_Alignas" ("(" typeName | constExpr ")")
//            | structDecl | unionDecl | typedefName
//            | enumSpecifier)+
//
// Parse a run of declaration specifiers starting at Tok.
//
// Rest: receives the first token that is not part of the specifiers.
// Attr: if non-NULL, receives storage-class flags and the _Alignas value;
//       if NULL, storage-class specifiers and _Alignas are reported as
//       errors.
// Returns the resulting base type; `int` when no type keyword was seen.
static Type *declspec(Token **Rest, Token *Tok, VarAttr *Attr) {
  // Each built-in type keyword owns a two-bit field of the counter, so the
  // same keyword can be counted more than once (LONG + LONG == 1 << 11) and
  // the order of keywords is irrelevant: `long int` and `int long` produce
  // the same sum.
  enum {
    VOID = 1 << 0,
    BOOL = 1 << 2,
    CHAR = 1 << 4,
    SHORT = 1 << 6,
    INT = 1 << 8,
    LONG = 1 << 10,
    OTHER = 1 << 12,
  };

  Type *Ty = TyInt;
  int Counter = 0; // running sum of the type keywords seen so far

  // Consume tokens for as long as they can belong to a type name.
  while (isTypename(Tok)) {
    // Storage-class specifiers.
    if (equal(Tok, "typedef") || equal(Tok, "static") || equal(Tok, "extern")) {
      if (!Attr)
        errorTok(Tok, "storage class specifier is not allowed in this context");

      if (equal(Tok, "typedef"))
        Attr->IsTypedef = true;
      else if (equal(Tok, "extern"))
        Attr->IsExtern = true;
      else
        Attr->IsStatic = true;

      // typedef cannot be combined with static or extern.
      if ((Attr->IsStatic || Attr->IsExtern) && Attr->IsTypedef)
        errorTok(Tok, "typedef may not be used together with static or extern");

      Tok = Tok->Next;
      continue;
    }

    if (equal(Tok, "_Alignas")) {
      // Without an attribute record there is nowhere to store the alignment.
      if (!Attr)
        errorTok(Tok, "_Alignas is not allowed in this context");
      Tok = skip(Tok->Next, "(");

      // The operand is either a type name or a constant expression.
      if (isTypename(Tok))
        Attr->Align = typename(&Tok, Tok)->Align;
      else
        Attr->Align = constExpr(&Tok, Tok);
      Tok = skip(Tok, ")");
      continue;
    }

    // User-defined types: struct, union, enum or a typedef name.
    Type *Ty2 = findTypedef(Tok);
    if (equal(Tok, "struct") || equal(Tok, "union") || equal(Tok, "enum") ||
        Ty2) {
      // Once any type has been seen, this token is not part of the
      // specifiers any more (e.g. a typedef name reused as a declarator).
      if (Counter)
        break;

      if (equal(Tok, "struct")) {
        Ty = structDecl(&Tok, Tok->Next);
      } else if (equal(Tok, "union")) {
        Ty = unionDecl(&Tok, Tok->Next);
      } else if (equal(Tok, "enum")) {
        Ty = enumSpecifier(&Tok, Tok->Next);
      } else {
        // Use the type the typedef name stands for.
        Ty = Ty2;
        Tok = Tok->Next;
      }

      Counter += OTHER;
      continue;
    }

    // Built-in type keywords: add the keyword to the counter. The counter
    // has to map to a valid type after every single step.
    if (equal(Tok, "void"))
      Counter += VOID;
    else if (equal(Tok, "_Bool"))
      Counter += BOOL;
    else if (equal(Tok, "char"))
      Counter += CHAR;
    else if (equal(Tok, "short"))
      Counter += SHORT;
    else if (equal(Tok, "int"))
      Counter += INT;
    else if (equal(Tok, "long"))
      Counter += LONG;
    else
      unreachable();

    // Map the accumulated counter value to a type.
    switch (Counter) {
    case VOID:
      Ty = TyVoid;
      break;
    case BOOL:
      Ty = TyBool;
      break;
    case CHAR:
      Ty = TyChar;
      break;
    case SHORT:
    case SHORT + INT:
      Ty = TyShort;
      break;
    case INT:
      Ty = TyInt;
      break;
    case LONG:
    case LONG + INT:
    case LONG + LONG:
    case LONG + LONG + INT:
      Ty = TyLong;
      break;
    default:
      errorTok(Tok, "invalid type");
    }

    Tok = Tok->Next;
  } // while (isTypename(Tok))

  *Rest = Tok;
  return Ty;
}
// funcParams = ("void" | param ("," param)*)? ")"
// param = declspec declarator
//
// Parse a parameter list; Tok is the token right after "(". Ty is the return
// type. Returns a function type whose Params list holds a copy of every
// parameter type, and sets *Rest to the token after ")".
static Type *funcParams(Token **Rest, Token *Tok, Type *Ty) {
  // "(void)" declares a function that takes no parameters.
  if (equal(Tok, "void") && equal(Tok->Next, ")")) {
    *Rest = Tok->Next->Next;
    return funcType(Ty);
  }

  Type Sentinel = {};
  Type *Tail = &Sentinel;

  for (bool First = true; !equal(Tok, ")"); First = false) {
    // Every parameter except the first is preceded by a comma.
    if (!First)
      Tok = skip(Tok, ",");

    Type *ParamTy = declspec(&Tok, Tok, NULL);
    ParamTy = declarator(&Tok, Tok, ParamTy);

    // A parameter of type "array of T" is adjusted to "pointer to T";
    // the parameter name is carried over to the new type.
    if (ParamTy->Kind == TY_ARRAY) {
      Token *Ident = ParamTy->Name;
      ParamTy = pointerTo(ParamTy->Base);
      ParamTy->Name = Ident;
    }

    // Append a copy of the type to the parameter list.
    Tail->Next = copyType(ParamTy);
    Tail = Tail->Next;
  }

  // Wrap the return type in a function type and attach the parameters.
  Type *Fn = funcType(Ty);
  Fn->Params = Sentinel.Next;
  *Rest = Tok->Next;
  return Fn;
}
// Array dimensions.
// arrayDimensions = constExpr? "]" typeSuffix
//
// Tok is the token right after "[". Returns "array of Ty", where Ty has
// first been extended by any further suffixes. An empty "[]" yields an array
// of length -1, which marks the array as incomplete.
// A negative constant size is rejected: it would otherwise give the array a
// negative Size and be mistaken for an incomplete array.
static Type *arrayDimensions(Token **Rest, Token *Tok, Type *Ty) {
  // "[]": no dimension given.
  if (equal(Tok, "]")) {
    Ty = typeSuffix(Rest, Tok->Next, Ty);
    return arrayOf(Ty, -1);
  }

  // A dimension is present.
  Token *Start = Tok;
  int64_t Sz = constExpr(&Tok, Tok);
  if (Sz < 0)
    errorTok(Start, "array size must not be negative");
  Tok = skip(Tok, "]");
  Ty = typeSuffix(Rest, Tok, Ty);
  return arrayOf(Ty, Sz);
}
// typeSuffix = "(" funcParams | "[" arrayDimensions | ε
//
// Apply an optional function or array suffix to Ty. With no suffix, Ty is
// returned unchanged and no token is consumed.
static Type *typeSuffix(Token **Rest, Token *Tok, Type *Ty) {
  // "(" funcParams
  if (equal(Tok, "("))
    return funcParams(Rest, Tok->Next, Ty);

  // ε
  if (!equal(Tok, "[")) {
    *Rest = Tok;
    return Ty;
  }

  // "[" arrayDimensions
  return arrayDimensions(Rest, Tok->Next, Ty);
}
// declarator = "*"* ("(" ident ")" | "(" declarator ")" | ident) typeSuffix
//
// Parse a declarator on top of the base type Ty and return the complete
// type. The declared identifier is stored in the returned type's Name field.
// *Rest is set to the token following the declarator.
static Type *declarator(Token **Rest, Token *Tok, Type *Ty) {
// "*"*
// Wrap the type in one pointer level per "*".
while (consume(&Tok, Tok, "*")) Ty = pointerTo(Ty);
// "(" declarator ")"
// A parenthesized declarator is handled in two passes, because the suffix
// after ")" has to be applied before the part inside the parentheses.
if (equal(Tok, "(")) {
Token *Start = Tok;
Type Dummy = {};
// First pass: parse the nested declarator against a dummy type, only to
// advance Tok to the closing ")".
declarator(&Tok, Start->Next, &Dummy);
Tok = skip(Tok, ")");
// Parse the suffix that follows the parentheses; this also sets *Rest to
// the token after the whole declarator.
Ty = typeSuffix(Rest, Tok, Ty);
// Second pass: re-parse the nested declarator with the suffixed type as
// its base. Tok is only scratch here; *Rest was already set above.
return declarator(&Tok, Start->Next, Ty);
}
if (Tok->Kind != TK_IDENT) errorTok(Tok, "expected a variable name");
// typeSuffix
Ty = typeSuffix(Rest, Tok->Next, Ty);
// ident
// Name of the variable or function. Note that when there was no "*" and no
// suffix, Ty is still the caller's type object, so the name is written
// into that object.
Ty->Name = Tok;
return Ty;
}
// abstractDeclarator = "*"* ("(" abstractDeclarator ")")? typeSuffix
//
// Parse a declarator without an identifier (as used in type names) on top of
// Ty and return the complete type. *Rest is set to the token after it.
static Type *abstractDeclarator(Token **Rest, Token *Tok, Type *Ty) {
  // "*"*: one pointer level per star.
  for (; equal(Tok, "*"); Tok = Tok->Next)
    Ty = pointerTo(Ty);

  // No parenthesized part: only an optional suffix remains.
  if (!equal(Tok, "("))
    return typeSuffix(Rest, Tok, Ty);

  // "(" abstractDeclarator ")" is handled in two passes.
  Token *Open = Tok;
  Type Scratch = {};
  // First pass: parse against a scratch type just to find the closing ")".
  abstractDeclarator(&Tok, Open->Next, &Scratch);
  Tok = skip(Tok, ")");
  // Apply the suffix after the parentheses; this fixes *Rest.
  Ty = typeSuffix(Rest, Tok, Ty);
  // Second pass: re-parse the parenthesized part with the suffixed type as
  // its base.
  return abstractDeclarator(&Tok, Open->Next, Ty);
}
// typeName = declspec abstractDeclarator
//
// Parse a type name. Storage-class specifiers are not accepted here because
// declspec is called without an attribute record.
static Type *typename(Token **Rest, Token *Tok) {
  Type *Base = declspec(&Tok, Tok, NULL);
  Type *Full = abstractDeclarator(Rest, Tok, Base);
  return Full;
}
// Report whether Tok starts the end of a brace-enclosed list:
// either "}" or "," immediately followed by "}".
static bool isEnd(Token *Tok) {
  if (equal(Tok, "}"))
    return true;
  return equal(Tok, ",") && equal(Tok->Next, "}");
}
// Consume the end of a brace-enclosed list, i.e. "}" or ",}".
// On success *Rest is set to the token after "}" and true is returned;
// otherwise *Rest is left untouched and false is returned.
static bool consumeEnd(Token **Rest, Token *Tok) {
  // "}"
  if (equal(Tok, "}")) {
    *Rest = Tok->Next;
    return true;
  }

  // ",}"
  bool CommaThenBrace = equal(Tok, ",") && equal(Tok->Next, "}");
  if (CommaThenBrace)
    *Rest = Tok->Next->Next;
  return CommaThenBrace;
}
// enumSpecifier = ident? "{" enumList? "}"
//               | ident ("{" enumList? "}")?
// enumList = ident ("=" constExpr)? ("," ident ("=" constExpr)?)* ","?
//
// Parse what follows the "enum" keyword. A tag without a body refers to a
// previously declared enum and returns that type; otherwise a new enum type
// is created, its constants are entered into the current variable scope and,
// if a tag is present, the type is registered under that tag.
static Type *enumSpecifier(Token **Rest, Token *Tok) {
  // ident? -- optional tag.
  Token *Tag = NULL;
  if (Tok->Kind == TK_IDENT) {
    Tag = Tok;
    Tok = Tok->Next;
  }

  // Tag without "{": a reference such as `enum color a = RED;`.
  if (Tag && !equal(Tok, "{")) {
    Type *Known = findTag(Tag);
    if (!Known)
      errorTok(Tag, "unknown enum type");
    if (Known->Kind != TY_ENUM)
      errorTok(Tag, "not an enum tag");
    *Rest = Tok;
    return Known;
  }

  // A body follows, so this declares a new enum type.
  Type *Ty = enumType();

  // "{" enumList? "}"
  Tok = skip(Tok, "{");

  int I = 0;   // number of enumerators read so far
  int Val = 0; // value given to the next enumerator
  while (!consumeEnd(Rest, Tok)) {
    if (I++ > 0)
      Tok = skip(Tok, ",");

    char *Name = getIdent(Tok);
    Tok = Tok->Next;

    // An explicit value restarts the numbering from that value.
    if (equal(Tok, "="))
      Val = constExpr(&Tok, Tok->Next);

    // Enter the enumerator into the variable scope.
    VarScope *S = pushScope(Name);
    S->EnumTy = Ty;
    S->EnumVal = Val++;
  }

  if (Tag)
    pushTagScope(Tag, Ty);
  return Ty;
}
// declaration = declspec (declarator ("=" initializer)?
//               ("," declarator ("=" initializer)?)*)? ";"
//
// Parse the declarators of a local declaration; the specifiers have already
// been parsed into BaseTy / Attr. Every declarator creates a local variable.
// Returns a block node whose body holds one expression statement per
// initialized variable, and sets *Rest to the token after ";".
static Node *declaration(Token **Rest, Token *Tok, Type *BaseTy,
                         VarAttr *Attr) {
  Node Sentinel = {};
  Node *Tail = &Sentinel;

  // Count counts the declarators handled so far.
  for (int Count = 0; !equal(Tok, ";"); Count++) {
    // Every declarator except the first is preceded by a comma.
    if (Count > 0)
      Tok = skip(Tok, ",");

    // The declarator yields the variable's type, which carries its name.
    Type *DeclTy = declarator(&Tok, Tok, BaseTy);
    if (DeclTy->Kind == TY_VOID)
      errorTok(Tok, "variable declared void");

    Obj *Var = newLVar(getIdent(DeclTy->Name), DeclTy);
    // An explicit _Alignas value overrides the type's alignment.
    if (Attr && Attr->Align)
      Var->Align = Attr->Align;

    // Without "=" this is a plain declaration: the variable is already in
    // Locals and no node is needed.
    if (equal(Tok, "=")) {
      Node *Init = LVarInitializer(&Tok, Tok->Next, Var);
      Tail->Next = newUnary(ND_EXPR_STMT, Init, Tok);
      Tail = Tail->Next;
    }

    // Checked after the initializer, because it is the variable's type
    // (Var->Ty) that has to be complete and non-void at this point.
    if (Var->Ty->Size < 0)
      errorTok(DeclTy->Name, "variable has incomplete type");
    if (Var->Ty->Kind == TY_VOID)
      errorTok(DeclTy->Name, "variable declared void");
  }

  // Collect all generated statements in a block.
  Node *Block = newNode(ND_BLOCK, Tok);
  Block->Body = Sentinel.Next;
  *Rest = Tok->Next;
  return Block;
}
// Skip one excess initializer element and return the token after it.
//
// The element is either a single assignment expression, which is parsed and
// discarded, or a brace-enclosed list. A braced list may hold any number of
// comma-separated elements (each skipped recursively) and an optional
// trailing comma, e.g. the `{3, 4}` in `int x[1] = {1, {3, 4}};`.
static Token *skipExcessElement(Token *Tok) {
  if (equal(Tok, "{")) {
    Tok = Tok->Next;
    for (int I = 0; !consumeEnd(&Tok, Tok); I++) {
      if (I > 0)
        Tok = skip(Tok, ",");
      Tok = skipExcessElement(Tok);
    }
    return Tok;
  }

  // Parse the expression and throw the result away.
  assign(&Tok, Tok);
  return Tok;
}
// stringInitializer = stringLiteral
//
// Initialize an array from the string literal token Tok, one element per
// character. If the literal is longer than the array, the surplus
// characters are dropped.
static void stringInitializer(Token **Rest, Token *Tok, Initializer *Init) {
  // A flexible array takes its length from the literal; the literal's array
  // length is used as is.
  if (Init->IsFlexible) {
    Type *Sized = arrayOf(Init->Ty->Base, Tok->Ty->ArrayLen);
    *Init = *newInitializer(Sized, false);
  }

  // Copy no more characters than fit into the array.
  int Limit = MIN(Init->Ty->ArrayLen, Tok->Ty->ArrayLen);
  int Pos = 0;
  while (Pos < Limit) {
    Init->Children[Pos]->Expr = newNum(Tok->Str[Pos], Tok);
    Pos++;
  }

  *Rest = Tok->Next;
}
// Count the elements of the initializer list starting at Tok for an array
// of type Ty. Elements are parsed into a throw-away initializer; the
// caller's token position is not affected because Tok is a local copy.
static int countArrayInitElements(Token *Tok, Type *Ty) {
  Initializer *Scratch = newInitializer(Ty->Base, false);

  int Count = 0;
  while (!consumeEnd(&Tok, Tok)) {
    if (Count > 0)
      Tok = skip(Tok, ",");
    initializer2(&Tok, Tok, Scratch);
    Count++;
  }
  return Count;
}
// arrayInitializer1 = "{" initializer ("," initializer)* ","? "}"
//
// Parse a brace-enclosed array initializer into Init. Elements beyond the
// array length are parsed and discarded.
static void arrayInitializer1(Token **Rest, Token *Tok, Initializer *Init) {
  Tok = skip(Tok, "{");

  // For a flexible array, count the elements first and rebuild the
  // initializer (and its array type) with that length.
  if (Init->IsFlexible) {
    int Count = countArrayInitElements(Tok, Init->Ty);
    *Init = *newInitializer(arrayOf(Init->Ty->Base, Count), false);
  }

  int Idx = 0;
  while (!consumeEnd(Rest, Tok)) {
    if (Idx > 0)
      Tok = skip(Tok, ",");

    if (Idx >= Init->Ty->ArrayLen)
      // More elements than the array holds: skip the surplus.
      Tok = skipExcessElement(Tok);
    else
      initializer2(&Tok, Tok, Init->Children[Idx]);
    Idx++;
  }
}
// arrayInitializer2 = initializer ("," initializer)* ","?
//
// Parse an array initializer that is not wrapped in its own braces. Parsing
// stops once the array is full or the end of the enclosing list is reached;
// the remaining tokens are left for the caller.
static void arrayInitializer2(Token **Rest, Token *Tok, Initializer *Init) {
  // For a flexible array, count the elements first and rebuild the
  // initializer (and its array type) with that length.
  if (Init->IsFlexible) {
    int Count = countArrayInitElements(Tok, Init->Ty);
    *Init = *newInitializer(arrayOf(Init->Ty->Base, Count), false);
  }

  int Idx = 0;
  while (Idx < Init->Ty->ArrayLen && !isEnd(Tok)) {
    if (Idx > 0)
      Tok = skip(Tok, ",");
    initializer2(&Tok, Tok, Init->Children[Idx]);
    Idx++;
  }

  *Rest = Tok;
}
// structInitializer1 = "{" initializer ("," initializer)* ","? "}"
//
// Parse a brace-enclosed struct initializer into Init, assigning elements to
// members in declaration order. Elements beyond the last member are parsed
// and discarded.
static void structInitializer1(Token **Rest, Token *Tok, Initializer *Init) {
  Tok = skip(Tok, "{");

  // Next member to be initialized; NULL once all members are used up.
  Member *Mem = Init->Ty->Mems;
  // An explicit flag tracks the first element. Comparing Mem with the head
  // of the member list does not work for a struct without members, where
  // both are always NULL.
  bool First = true;

  while (!consumeEnd(Rest, Tok)) {
    if (!First)
      Tok = skip(Tok, ",");
    First = false;

    if (Mem) {
      // Initialize the member.
      initializer2(&Tok, Tok, Init->Children[Mem->Idx]);
      Mem = Mem->Next;
    } else {
      // No member left: skip the excess element.
      Tok = skipExcessElement(Tok);
    }
  }
}
// structInitializer2 = initializer ("," initializer)* ","?
//
// Parse a struct initializer that is not wrapped in its own braces. Parsing
// stops once every member has a value or the end of the enclosing list is
// reached; the remaining tokens are left for the caller.
static void structInitializer2(Token **Rest, Token *Tok, Initializer *Init) {
  Member *Mem = Init->Ty->Mems;
  for (int Seen = 0; Mem && !isEnd(Tok); Seen++, Mem = Mem->Next) {
    // Every element except the first is preceded by a comma.
    if (Seen > 0)
      Tok = skip(Tok, ",");
    initializer2(&Tok, Tok, Init->Children[Mem->Idx]);
  }

  *Rest = Tok;
}
// unionInitializer = "{" initializer "}"
//
// Parse a union initializer. Only the first member of a union can be
// initialized. The braces are optional; inside braces a trailing comma is
// accepted.
static void unionInitializer(Token **Rest, Token *Tok, Initializer *Init) {
  Initializer *FirstMember = Init->Children[0];

  // Without braces.
  if (!equal(Tok, "{")) {
    initializer2(Rest, Tok, FirstMember);
    return;
  }

  // With braces.
  initializer2(&Tok, Tok->Next, FirstMember);
  // ","?
  consume(&Tok, Tok, ",");
  *Rest = skip(Tok, "}");
}
// initializer = stringInitializer | arrayInitializer | structInitializer
// | unionInitializer | assign
//
// Parse one initializer for the object described by Init, dispatching on the
// object's type, and store the result in Init (Expr for scalars, Children
// for aggregates). *Rest is set to the token after the initializer.
static void initializer2(Token **Rest, Token *Tok, Initializer *Init) {
// An array initialized from a string literal. This test must come before
// the generic array case below.
if (Init->Ty->Kind == TY_ARRAY && Tok->Kind == TK_STR) {
stringInitializer(Rest, Tok, Init);
return;
}
// Union.
if (Init->Ty->Kind == TY_UNION) {
unionInitializer(Rest, Tok, Init);
return;
}
// Array.
if (Init->Ty->Kind == TY_ARRAY) {
if (equal(Tok, "{"))
// With braces.
arrayInitializer1(Rest, Tok, Init);
else
// Without braces.
arrayInitializer2(Rest, Tok, Init);
return;
}
// Struct.
if (Init->Ty->Kind == TY_STRUCT) {
// With braces.
if (equal(Tok, "{")) {
structInitializer1(Rest, Tok, Init);
return;
}
// Without braces. A struct can be initialized from another struct value,
// so first parse an expression and check whether it has struct type.
Node *Expr = assign(Rest, Tok);
addType(Expr);
if (Expr->Ty->Kind == TY_STRUCT) {
Init->Expr = Expr;
return;
}
// Not a struct value: discard that parse and read the same tokens again
// (from Tok) as a member-by-member list; this overwrites *Rest.
structInitializer2(Rest, Tok, Init);
return;
}
// A scalar wrapped in braces, e.g. int x = {3};
if (equal(Tok, "{")) {
initializer2(&Tok, Tok->Next, Init);
*Rest = skip(Tok, "}");
return;
}
// assign
// Plain scalar: store the initializing expression.
Init->Expr = assign(Rest, Tok);
}
// 复制结构体的类型
static Type *copyStructType(Type *Ty) {
Ty = copyType(Ty);
Member Head = {};
Member *Cur = &Head;
for (Member *Mem = Ty->Mems; Mem; Mem = Mem->Next) {
Member *M = calloc(1, sizeof(Member));
*M = *Mem;