From d3498162b4a37a1ff66412afa3fa07cd5356a769 Mon Sep 17 00:00:00 2001 From: pu9sp4t32 <2931381969@qq.com> Date: Mon, 23 Mar 2026 20:30:40 +0800 Subject: [PATCH 1/6] =?UTF-8?q?=E5=8A=A0=E5=85=A5Lab1=E6=B5=8B=E8=AF=95?= =?UTF-8?q?=E6=89=B9=E5=A4=84=E7=90=86=E8=84=9A=E6=9C=AC?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- test_parse.sh | 78 +++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 78 insertions(+) create mode 100644 test_parse.sh diff --git a/test_parse.sh b/test_parse.sh new file mode 100644 index 0000000..750d9bf --- /dev/null +++ b/test_parse.sh @@ -0,0 +1,78 @@ +#!/bin/bash +# ================================================ +# SysY 编译器 Lab1 批量解析测试脚本 +# 文件名:scripts/test_parse.sh +# 适用环境:Arch Linux(bash 原生支持,无需额外安装) +# 功能: +# - 遍历 test/test_case 下所有 .sy 文件(functional + performance) +# - 执行 --emit-parse-tree 检查是否能成功解析 +# - 输出简洁的 PASS/FAIL 结果 + 统计 +# - 错误文件会自动打印最后 10 行报错信息(方便调试) +# - 所有结果保存到 test/test_result/parse_test.log +# ================================================ + +set -u # 遇到未定义变量直接报错 + +# ================== 配置 ================== +COMPILER="./build/bin/compiler" +TEST_DIR="test/test_case" +LOG_FILE="test/test_result/parse_test.log" +MAX_ERROR_LINES=10 + +# 检查编译器是否存在 +if [[ ! -x "$COMPILER" ]]; then + echo "❌ 错误:找不到编译器 $COMPILER" + echo " 请先执行 Lab1 构建命令:" + echo " cmake -S . -B build -DCMAKE_BUILD_TYPE=Release -DCOMPILER_PARSE_ONLY=ON" + echo " cmake --build build -j \"\$(nproc)\"" + exit 1 +fi + +# 创建日志目录(如果不存在) +mkdir -p "$(dirname "$LOG_FILE")" +> "$LOG_FILE" # 清空日志 + +echo "开始 Lab1 批量语法树测试..." | tee -a "$LOG_FILE" +echo "测试目录:$TEST_DIR" | tee -a "$LOG_FILE" +echo "编译器:$COMPILER" | tee -a "$LOG_FILE" +echo "========================================" | tee -a "$LOG_FILE" + +pass=0 +fail=0 +total=0 + +# 遍历所有 .sy 文件(支持子目录) +while IFS= read -r -d '' sy_file; do + ((total++)) + echo -n "[$total] 测试: $sy_file ... " | tee -a "$LOG_FILE" + + # 执行解析(把输出丢到 /dev/null,防止刷屏) + if "$COMPILER" --emit-parse-tree "$sy_file" > /dev/null 2>&1; then + echo "✅PASS" | tee -a "$LOG_FILE" + ((pass++)) + else + echo "FAIL" | tee -a "$LOG_FILE" + ((fail++)) + + # 打印错误信息到日志(最后几行) + echo " └── 错误详情(最后 $MAX_ERROR_LINES 行):" >> "$LOG_FILE" + "$COMPILER" --emit-parse-tree "$sy_file" 2>&1 | tail -n "$MAX_ERROR_LINES" >> "$LOG_FILE" + echo "" >> "$LOG_FILE" + fi +done < <(find "$TEST_DIR" -name "*.sy" -print0 | sort -z) + +# ================== 总结 ================== +echo "========================================" | tee -a "$LOG_FILE" +echo "测试完成!" | tee -a "$LOG_FILE" +echo "总文件数 : $total" | tee -a "$LOG_FILE" +echo "通过 : $pass" | tee -a "$LOG_FILE" +echo "失败 : $fail" | tee -a "$LOG_FILE" + +if [[ $fail -eq 0 ]]; then + echo "恭喜!Lab1 语法树构建全部通过!可以进入 Lab2 啦~" | tee -a "$LOG_FILE" +else + echo "有 $fail 个文件解析失败,请检查 SysY.g4 或报错日志" | tee -a "$LOG_FILE" + echo " 日志文件:$LOG_FILE" | tee -a "$LOG_FILE" +fi + +echo "========================================" | tee -a "$LOG_FILE" From 8465f2ddd5708a1d30a2d3649195446f492f2661 Mon Sep 17 00:00:00 2001 From: pabgh52us <2826301297@qq.com> Date: Mon, 23 Mar 2026 20:33:42 +0800 Subject: [PATCH 2/6] ADD file via upload --- SysY.g4 | 227 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 227 insertions(+) create mode 100644 SysY.g4 diff --git a/SysY.g4 b/SysY.g4 new file mode 100644 index 0000000..d3633df --- /dev/null +++ b/SysY.g4 @@ -0,0 +1,227 @@ +grammar SysY; + +/*===-------------------------------------------===*/ +/* Lexer rules */ +/*===-------------------------------------------===*/ + +CONST: 'const'; +INT: 'int'; +FLOAT: 'float'; +VOID: 'void'; +IF: 'if'; +ELSE: 'else'; +WHILE: 'while'; +BREAK: 'break'; +CONTINUE: 'continue'; +RETURN: 'return'; + +ASSIGN: '='; +EQ: '=='; +NE: '!='; +LT: '<'; +GT: '>'; +LE: '<='; +GE: '>='; + +ADD: '+'; +SUB: '-'; +MUL: '*'; +DIV: '/'; +MOD: '%'; +NOT: '!'; +LAND: '&&'; +LOR: '||'; + +LPAREN: '('; +RPAREN: ')'; +LBRACE: '{'; +RBRACE: '}'; +LBRACK: '['; +RBRACK: ']'; +COMMA: ','; +SEMICOLON: ';'; + +FLOAT_CONST + : DEC_FLOAT_CONST + | HEX_FLOAT_CONST + ; + +INT_CONST + : HEX_PREFIX HEX_DIGIT+ + | '0' [0-7]+ + | '0' + | [1-9] DIGIT* + ; + +ID: [a-zA-Z_][a-zA-Z_0-9]*; + +WS: [ \t\r\n] -> skip; +LINECOMMENT: '//' ~[\r\n]* -> skip; +BLOCKCOMMENT: '/*' .*? '*/' -> skip; + +fragment DEC_FLOAT_CONST + : DIGIT+ '.' DIGIT* EXP_PART? + | '.' DIGIT+ EXP_PART? + | DIGIT+ EXP_PART + ; + +fragment HEX_FLOAT_CONST + : HEX_PREFIX HEX_DIGIT+ '.' HEX_DIGIT* BIN_EXP_PART + | HEX_PREFIX '.' HEX_DIGIT+ BIN_EXP_PART + | HEX_PREFIX HEX_DIGIT+ BIN_EXP_PART + ; + +fragment EXP_PART: [eE] [+-]? DIGIT+; +fragment BIN_EXP_PART: [pP] [+-]? DIGIT+; +fragment HEX_PREFIX: '0' [xX]; +fragment HEX_DIGIT: [0-9a-fA-F]; +fragment DIGIT: [0-9]; + +/*===-------------------------------------------===*/ +/* Syntax rules */ +/*===-------------------------------------------===*/ + +compUnit + : (decl | funcDef)+ EOF + ; + +decl + : constDecl + | varDecl + ; + +constDecl + : CONST bType constDef (COMMA constDef)* SEMICOLON + ; + +varDecl + : bType varDef (COMMA varDef)* SEMICOLON + ; + +bType + : INT + | FLOAT + ; + +constDef + : ID (LBRACK constExp RBRACK)* ASSIGN constInitVal + ; + +constInitVal + : constExp + | LBRACE (constInitVal (COMMA constInitVal)*)? RBRACE + ; + +varDef + : ID (LBRACK constExp RBRACK)* (ASSIGN initVal)? + ; + +initVal + : exp + | LBRACE (initVal (COMMA initVal)*)? RBRACE + ; + +funcDef + : funcType ID LPAREN funcFParams? RPAREN block + ; + +funcType + : VOID + | INT + | FLOAT + ; + +funcFParams + : funcFParam (COMMA funcFParam)* + ; + +funcFParam + : bType ID (LBRACK RBRACK (LBRACK exp RBRACK)*)? + ; + +block + : LBRACE blockItem* RBRACE + ; + +blockItem + : decl + | stmt + ; + +stmt + : lVal ASSIGN exp SEMICOLON + | exp? SEMICOLON + | block + | IF LPAREN cond RPAREN stmt (ELSE stmt)? + | WHILE LPAREN cond RPAREN stmt + | BREAK SEMICOLON + | CONTINUE SEMICOLON + | RETURN exp? SEMICOLON + ; + +exp + : addExp + ; + +cond + : lOrExp + ; + +lVal + : ID (LBRACK exp RBRACK)* + ; + +primaryExp + : LPAREN exp RPAREN + | lVal + | number + ; + +number + : INT_CONST + | FLOAT_CONST + ; + +unaryExp + : primaryExp + | ID LPAREN funcRParams? RPAREN + | unaryOp unaryExp + ; + +unaryOp + : ADD + | SUB + | NOT + ; + +funcRParams + : exp (COMMA exp)* + ; + +mulExp + : unaryExp ((MUL | DIV | MOD) unaryExp)* + ; + +addExp + : mulExp ((ADD | SUB) mulExp)* + ; + +relExp + : addExp ((LT | GT | LE | GE) addExp)* + ; + +eqExp + : relExp ((EQ | NE) relExp)* + ; + +lAndExp + : eqExp (LAND eqExp)* + ; + +lOrExp + : lAndExp (LOR lAndExp)* + ; + +constExp + : addExp + ; From 3cfd47fb71eb835786e40b8704daa45fbb3fbaac Mon Sep 17 00:00:00 2001 From: pabgh52us <2826301297@qq.com> Date: Mon, 23 Mar 2026 20:34:09 +0800 Subject: [PATCH 3/6] Delete 'SysY.g4' --- SysY.g4 | 227 -------------------------------------------------------- 1 file changed, 227 deletions(-) delete mode 100644 SysY.g4 diff --git a/SysY.g4 b/SysY.g4 deleted file mode 100644 index d3633df..0000000 --- a/SysY.g4 +++ /dev/null @@ -1,227 +0,0 @@ -grammar SysY; - -/*===-------------------------------------------===*/ -/* Lexer rules */ -/*===-------------------------------------------===*/ - -CONST: 'const'; -INT: 'int'; -FLOAT: 'float'; -VOID: 'void'; -IF: 'if'; -ELSE: 'else'; -WHILE: 'while'; -BREAK: 'break'; -CONTINUE: 'continue'; -RETURN: 'return'; - -ASSIGN: '='; -EQ: '=='; -NE: '!='; -LT: '<'; -GT: '>'; -LE: '<='; -GE: '>='; - -ADD: '+'; -SUB: '-'; -MUL: '*'; -DIV: '/'; -MOD: '%'; -NOT: '!'; -LAND: '&&'; -LOR: '||'; - -LPAREN: '('; -RPAREN: ')'; -LBRACE: '{'; -RBRACE: '}'; -LBRACK: '['; -RBRACK: ']'; -COMMA: ','; -SEMICOLON: ';'; - -FLOAT_CONST - : DEC_FLOAT_CONST - | HEX_FLOAT_CONST - ; - -INT_CONST - : HEX_PREFIX HEX_DIGIT+ - | '0' [0-7]+ - | '0' - | [1-9] DIGIT* - ; - -ID: [a-zA-Z_][a-zA-Z_0-9]*; - -WS: [ \t\r\n] -> skip; -LINECOMMENT: '//' ~[\r\n]* -> skip; -BLOCKCOMMENT: '/*' .*? '*/' -> skip; - -fragment DEC_FLOAT_CONST - : DIGIT+ '.' DIGIT* EXP_PART? - | '.' DIGIT+ EXP_PART? - | DIGIT+ EXP_PART - ; - -fragment HEX_FLOAT_CONST - : HEX_PREFIX HEX_DIGIT+ '.' HEX_DIGIT* BIN_EXP_PART - | HEX_PREFIX '.' HEX_DIGIT+ BIN_EXP_PART - | HEX_PREFIX HEX_DIGIT+ BIN_EXP_PART - ; - -fragment EXP_PART: [eE] [+-]? DIGIT+; -fragment BIN_EXP_PART: [pP] [+-]? DIGIT+; -fragment HEX_PREFIX: '0' [xX]; -fragment HEX_DIGIT: [0-9a-fA-F]; -fragment DIGIT: [0-9]; - -/*===-------------------------------------------===*/ -/* Syntax rules */ -/*===-------------------------------------------===*/ - -compUnit - : (decl | funcDef)+ EOF - ; - -decl - : constDecl - | varDecl - ; - -constDecl - : CONST bType constDef (COMMA constDef)* SEMICOLON - ; - -varDecl - : bType varDef (COMMA varDef)* SEMICOLON - ; - -bType - : INT - | FLOAT - ; - -constDef - : ID (LBRACK constExp RBRACK)* ASSIGN constInitVal - ; - -constInitVal - : constExp - | LBRACE (constInitVal (COMMA constInitVal)*)? RBRACE - ; - -varDef - : ID (LBRACK constExp RBRACK)* (ASSIGN initVal)? - ; - -initVal - : exp - | LBRACE (initVal (COMMA initVal)*)? RBRACE - ; - -funcDef - : funcType ID LPAREN funcFParams? RPAREN block - ; - -funcType - : VOID - | INT - | FLOAT - ; - -funcFParams - : funcFParam (COMMA funcFParam)* - ; - -funcFParam - : bType ID (LBRACK RBRACK (LBRACK exp RBRACK)*)? - ; - -block - : LBRACE blockItem* RBRACE - ; - -blockItem - : decl - | stmt - ; - -stmt - : lVal ASSIGN exp SEMICOLON - | exp? SEMICOLON - | block - | IF LPAREN cond RPAREN stmt (ELSE stmt)? - | WHILE LPAREN cond RPAREN stmt - | BREAK SEMICOLON - | CONTINUE SEMICOLON - | RETURN exp? SEMICOLON - ; - -exp - : addExp - ; - -cond - : lOrExp - ; - -lVal - : ID (LBRACK exp RBRACK)* - ; - -primaryExp - : LPAREN exp RPAREN - | lVal - | number - ; - -number - : INT_CONST - | FLOAT_CONST - ; - -unaryExp - : primaryExp - | ID LPAREN funcRParams? RPAREN - | unaryOp unaryExp - ; - -unaryOp - : ADD - | SUB - | NOT - ; - -funcRParams - : exp (COMMA exp)* - ; - -mulExp - : unaryExp ((MUL | DIV | MOD) unaryExp)* - ; - -addExp - : mulExp ((ADD | SUB) mulExp)* - ; - -relExp - : addExp ((LT | GT | LE | GE) addExp)* - ; - -eqExp - : relExp ((EQ | NE) relExp)* - ; - -lAndExp - : eqExp (LAND eqExp)* - ; - -lOrExp - : lAndExp (LOR lAndExp)* - ; - -constExp - : addExp - ; From 6b5e184cf6eb0de9a43670a64514a1f091df5f94 Mon Sep 17 00:00:00 2001 From: pabgh52us <2826301297@qq.com> Date: Mon, 23 Mar 2026 20:34:28 +0800 Subject: [PATCH 4/6] Delete 'src/antlr4/SysY.g4' --- src/antlr4/SysY.g4 | 98 ---------------------------------------------- 1 file changed, 98 deletions(-) delete mode 100644 src/antlr4/SysY.g4 diff --git a/src/antlr4/SysY.g4 b/src/antlr4/SysY.g4 deleted file mode 100644 index 263aeef..0000000 --- a/src/antlr4/SysY.g4 +++ /dev/null @@ -1,98 +0,0 @@ -// SysY 子集语法:支持形如 -// int main() { int a = 1; int b = 2; return a + b; } -// 的最小返回表达式编译。 - -// 后续需要自行添加 - -grammar SysY; - -/*===-------------------------------------------===*/ -/* Lexer rules */ -/*===-------------------------------------------===*/ - -INT: 'int'; -RETURN: 'return'; - -ASSIGN: '='; -ADD: '+'; - -LPAREN: '('; -RPAREN: ')'; -LBRACE: '{'; -RBRACE: '}'; -SEMICOLON: ';'; - -ID: [a-zA-Z_][a-zA-Z_0-9]*; -ILITERAL: [0-9]+; - -WS: [ \t\r\n] -> skip; -LINECOMMENT: '//' ~[\r\n]* -> skip; -BLOCKCOMMENT: '/*' .*? '*/' -> skip; - -/*===-------------------------------------------===*/ -/* Syntax rules */ -/*===-------------------------------------------===*/ - -compUnit - : funcDef EOF - ; - -decl - : btype varDef SEMICOLON - ; - -btype - : INT - ; - -varDef - : lValue (ASSIGN initValue)? - ; - -initValue - : exp - ; - -funcDef - : funcType ID LPAREN RPAREN blockStmt - ; - -funcType - : INT - ; - -blockStmt - : LBRACE blockItem* RBRACE - ; - -blockItem - : decl - | stmt - ; - -stmt - : returnStmt - ; - -returnStmt - : RETURN exp SEMICOLON - ; - -exp - : LPAREN exp RPAREN # parenExp - | var # varExp - | number # numberExp - | exp ADD exp # additiveExp - ; - -var - : ID - ; - -lValue - : ID - ; - -number - : ILITERAL - ; From dbc1d089578cd77ab9a5b921f323e0c2f493e691 Mon Sep 17 00:00:00 2001 From: pabgh52us <2826301297@qq.com> Date: Mon, 23 Mar 2026 20:46:00 +0800 Subject: [PATCH 5/6] Add antlr4 --- src/antlr4 | 1 + 1 file changed, 1 insertion(+) create mode 100644 src/antlr4 diff --git a/src/antlr4 b/src/antlr4 new file mode 100644 index 0000000..66dc905 --- /dev/null +++ b/src/antlr4 @@ -0,0 +1 @@ +undefined \ No newline at end of file From 9e981ce28b0b50a377361e3b232384192570b5c0 Mon Sep 17 00:00:00 2001 From: pabgh52us <2826301297@qq.com> Date: Mon, 23 Mar 2026 20:46:30 +0800 Subject: [PATCH 6/6] Delete 'src/antlr4' --- src/antlr4 | 1 - 1 file changed, 1 deletion(-) delete mode 100644 src/antlr4 diff --git a/src/antlr4 b/src/antlr4 deleted file mode 100644 index 66dc905..0000000 --- a/src/antlr4 +++ /dev/null @@ -1 +0,0 @@ -undefined \ No newline at end of file