i'm trying to make a mini compiler using lex and yacc however each time i try to test my parser i keep getting a syntax error.
Here is my lex file :
%option noyywrap
%{
#include "y.tab.h"
int line = 1;
int spaceCount = 1;
int sourceLineCount = 1;
%}
IDENTIFIER [_a-zA-Z][_a-zA-Z0-9]*
WHITESPACE [ ]
DIGIT [0-9]
TAB \t
NEXTLINE \n
%%
int return INT;
float return FLOAT;
double return DOUBLE;
char return CHAR;
void return VOID;
static return STATIC;
const return CONST;
struct return STRUCT;
union return UNION;
enum return ENUM;
if return IF;
else return ELSE;
switch return SWITCH;
case return CASE;
break return BREAK;
default return DEFAULT;
^"#include ".+ ;
typedef return TYPEDEF;
extern return EXTERN;
for return FOR;
while return WHILE;
do return DO;
"<" return LT;
">" return GT;
"<=" return LE;
">=" return GE;
"==" return EQ;
"!=" return NE;
"." return DOT;
"," return COMMA;
printf return PRINTF;
return return RETURN;
{DIGIT}+ return NUM;
{NEXTLINE} {
line++;
}
{WHITESPACE} {
spaceCount++;
}
. return yytext[0];
%%
And my yacc/bison file :
%{
#include<stdio.h>
extern FILE *fp;
%}
%token INT FLOAT CHAR DOUBLE VOID
%token FOR WHILE DO
%token IF ELSE PRINTF
%token STRUCT ENUM UNION
%token SWITCH CASE BREAK DEFAULT
%token NUM ID
%token INCLUDE
%token DOT COMMA
%token STATIC CONST
%token TYPEDEF EXTERN
%token RETURN
%right '='
%left AND OR
%left '<' '>' LE GE EQ NE LT GT
%%
start: Function
| Declaration
;
/* DECCLARATION */
Declaration: Type Assignment ';'
| Assignment ';'
| FunctionCall ';'
| ArrayUsage ';'
| Type ArrayUsage ';'
| StructStmt ';'
| error
;
/* ASSIGNMENT */
Assignment: ID '=' Assignment
| ID '=' FunctionCall
| ID '=' ArrayUsage
| ArrayUsage '=' Assignment
| ID ',' Assignment
| NUM ',' Assignment
| ID '+' Assignment
| ID '-' Assignment
| ID '*' Assignment
| ID '/' Assignment
| NUM '+' Assignment
| NUM '-' Assignment
| NUM '*' Assignment
| NUM '/' Assignment
| '\'' Assignment '\''
| '(' Assignment ')'
| '-' '(' Assignment ')'
| '-' NUM
| '-' ID
| NUM
| ID
;
/* Function Call*/
FunctionCall : ID'('')'
| ID'('Assignment')'
;
/* Function block */
Function: Type ID '(' ArgListOpt ')' CompoundStmt
;
ArgListOpt: ArgList
|
;
ArgList: ArgList ',' Arg
| Arg
;
Arg: Type ID
;
/* Array Usage */
ArrayUsage : ID'['Assignment']'
;
CompoundStmt: '{' StmtList '}'
;
StmtList: StmtList Stmt
|
;
Stmt: WhileStmt
| Declaration
| ForStmt
| IfStmt
| PrintFunc
| SwitchStmt
| ';'
;
/* Type Identifier block */
Type: INT
| FLOAT
| CHAR
| DOUBLE
| VOID
;
/* Loop Blocks */
WhileStmt: WHILE '(' Expr ')' Stmt
| WHILE '(' Expr ')' CompoundStmt
;
/* For Block */
ForStmt: FOR '(' Expr ';' Expr ';' Expr ')' Stmt
| FOR '(' Expr ';' Expr ';' Expr ')' CompoundStmt
| FOR '(' Expr ')' Stmt
| FOR '(' Expr ')' CompoundStmt
;
/* IfStmt Block */
IfStmt : IF '(' Expr ')'
Stmt
;
/* SwitchStmnt */
SwitchStmt : SWITCH '(' ID ')'
CaseStmt
| SWITCH '(' ID ')'
CompoundStmt
CaseStmt
DefaultStmt
;
/* CaseStmt */
CaseStmt : CASE NUM ':'
Stmt
BREAK ';'
;
/* DefaultStmt */
DefaultStmt : DEFAULT ':'
Stmt
BREAK ';'
/* Struct Statement */
StructStmt : STRUCT ID '{' Type Assignment '}'
;
/* Print Function */
PrintFunc : PRINTF '(' Expr ')' ';'
;
/*Expression Block*/
Expr:
| Expr LE Expr
| Expr GE Expr
| Expr NE Expr
| Expr EQ Expr
| Expr GT Expr
| Expr LT Expr
| Assignment
| ArrayUsage
;
%%
#include"lex.yy.c"
#include<ctype.h>
int count=0;
int main(int argc, char *argv[])
{
yyin = fopen(argv[1], "r");
if(!yyparse())
printf("\nParsing complete\n");
else
printf("\nParsing failed\n");
fclose(yyin);
return 0;
}
yyerror(char *s) {
printf("\n %d: %s avant %s\n\n",line,s, yytext );
}
I tried to test it with multiple test files but it always seems to give me a syntax error, here is a sample of what i tried.
int main()
{
int a;
}
in this case i got an error before "m".
Nowhere in your lexical scanner do you
return ID;
which means that productions in the parser which require an ID
token are never going to match anything. I suppose you just forgot to add the line which recognises identifiers. Note that main
should be an ID
, which is why your parse fails at that point.
There are other problems with your grammar, including the fact that it only recognizes a single function declaration (Function
) or other statement (Declaration
). Along with any other changes you make, you should try to give your non-terminals more meaningful names, so that other people can understand your grammar. (This might help you, too.)