I'm implementing a programming language (katir) with the help of yacc and lex. Lex and yacc files are prepared and lex.yy.c and y.tab.c files are created without any error. But when I call gcc -o katir y.tab.c it gives a big list of error such as and it continues like this:
y.tab.c:557:41: error: expected ‘;’ before ‘goto’
yyloop:
^
y.tab.c:558:8: error: called object is not a function or function pointer
if ((yyn = yydefred[yystate]) != 0) goto yyreduce;
^
y.tab.c:559:5: error: expected ‘;’ before ‘{’ token
if (yychar < 0)
^
y.tab.c:607:8: error: called object is not a function or function pointer
yyinrecovery:
^
y.tab.c:608:5: error: expected ‘;’ before ‘{’ token
if (yyerrflag < 3)
^
y.tab.c:666:8: error: called object is not a function or function pointer
yym = yylen[yyn];
^
y.tab.c:667:9: error: expected ‘;’ before ‘yyval’
if (yym)
^
y.tab.c:669:9: error: expected ‘;’ before ‘memset’
else
^
y.tab.c:677:8: error: called object is not a function or function pointer
yym = yylhs[yyn];
^
y.tab.c:678:5: error: expected ‘;’ before ‘{’ token
if (yystate == 0 && yym == 0)
^
y.tab.c:708:9: error: expected ‘;’ before ‘yystate’
else
^
y.tab.c:714:8: error: called object is not a function or function pointer
#endif
^
y.tab.c:715:5: error: expected ‘;’ before ‘{’ token
if (yystack.s_mark >= yystack.s_last && yygrowstack(&yystack))
^
y.tab.c:727:12: error: called object is not a function or function pointer
yyfreestack(&yystack);
^
y.tab.c:731:12: error: called object is not a function or function pointer
yyfreestack(&yystack);
My lex file is;
%{
#include <stdlib.h>
void yyerror(char *);
%}
begin begin
end end
assignment_op <-
endline \n
difference diff
set_type set
integer_type integer
char_type char
boolean_type boolean
string_type string
float_type float
constant const
equal ==|eq
comment {hashtag}([^\n])*\n
hashtag #
and \&\&|and
or \|\||or
cardinality_op \|
cp_op cp
set_del del
else else
not !|not
lt <|lt
gt >|gt
lte <=|lte
gte >=|gte
lp \(
rp \)
lcb \{
rcb \}
comma ,
endstmnt \;
underscore _
dot \.
digit [0-9]
letter[a-zA-Z]
if if
then then
do do
multiplier \*
divider \/
subtractor \-
adder \+
union uni
intersection inter
subset subs
superset sups
while while
for for
fc fc
return return
input input
output output
true true
false false
space ([ ])
boolean TRUE|FALSE
integer [+-]?({digit})+
float ({integer})*(\.({digit})+|({digit})+\.)({digit})*
char \'[^\\\']\'
string \"([^\\\"]|\\\"|\\\n|\\\\)*\"
identifier {letter}({letter}|{digit}|{underscore})*
text ([^\\\"]|\\\"|\\\n|\\\\)*
whitespace [ \t]
%option yylineno
%%
{end} return end;
{begin} return begin;
{assignment_op} return assignment_op;
{equal} return equality_op;
{hashtag} return hashtag;
{set_type} return set_type;
{and} return and;
{or} return or;
{else} return else;
{lp} return lp;
{rp} return rp;
{lcb} return lb;
{rcb} return rb;
{lt} return lt;
{gt} return gt;
{lte} return lte;
{gte} return gte;
{comma} return comma;
{dot} return dot;
{then} return then;
{cardinality_op} return cardinality_op;
{cp_op} return cp_op;
{set_del} return del;
{float} return float;
{digit} return digit;
{integer} return integer;
{integer_type} return int_type;
{char_type} return char_type;
{boolean_type} return boolean_type;
{string_type} return string_type;
{float_type} return float_type;
{if} return if;
{do} return do;
{while} return while;
{for} return for;
{true} return true;
{false} return false;
{difference} return difference;
{union} return union;
{intersection} return intersection;
{subset} return subset;
{superset} return superset;
{constant} return constant;
{boolean} return boolean;
{char} return char;
{fc} return fc;
{endline} ;
{whitespace};
{return} return return;
{output} return output;
{input} return input;
{string} return string;
{identifier} return identifier;
{comment} return comment;
{endstmnt} return endstmnt;
{underscore} return underscore;
{multiplier} return multiplier;
{divider} return divider;
{subtractor} return subtractor;
{adder} return adder;
{text} return text;
%%
int yywrap(){return 1;}
And yacc file is the following;
%{
#include <stdio.h>
#include <stdlib.h>
%}
%token begin
%token end
%token assignment_op
%token equal
%token hashtag
%token constant
%token and
%token or
%token then
%token not
%token else
%token lp
%token rp
%token lcb
%token rcb
%token comment
%token lt
%token gt
%token lte
%token gte
%token comma
%token dot
%token cardinality_op
%token cp_op
%token set_del
%token float
%token digit
%token integer
%token integer_type
%token char_type
%token boolean_type
%token string_type
%token float_type
%token if
%token do
%token while
%token for
%token true
%token false
%token difference
%token union
%token set_type
%token intersection
%token subset
%token superset
%token constant
%token boolean
%token char
%token fc
%token return
%token output
%token input
%token string
%token identifier
%token comment
%token endstmnt
%token underscore
%token multiplier
%token divider
%token subtractor
%token adder
%token text
%start program
%right assignment_op
%left adder subtractor difference intersection union
%left multiplier divider
%left cp_op
%%
//Start Rule
program:
begin stmnt_l end;
stmnt_l:
stmnt endstmnt
|stmnt endstmnt stmnt_l
;
//Possible statement types
stmnt:
if_stmnt;
nan_if:
loop_stmnt
|expression
|declare
|initialize
|in_out_stmnt
|function
;
loop_stmnt:
while_stmnt
|for_stmnt
|do_while_stmnt
;
if_stmnt: matched | unmatched;
matched: if logical_expression then matched else matched| nan_if;
unmatched: if logical_expression then stmnt
| if logical_expression then matched else unmatched;
while_stmnt: while lp logical_expression rp lcb stmnt_l rcb;
do_while_stmnt: do lcb stmnt_l rcb while logical_expression ;
for_stmnt: for lp initialize endstmnt logical_expression lp stmnt_l rp;
term: var | constant_type | function_call;
constant_type: constant var;
var: identifier;
//Types
type: boolean | string | integer | float; //|set
primitive: boolean_type | string_type | integer_type | float_type | set_type;
set: lcb list rcb | lcb rcb;
list: type | var | type comma list | var comma list;
//----------------------------------Declerations----------------------------------------------
declare:
primitive var;
init_types:
type | function_call | set_exp;
initialize:
declare assignment_op init_types | var assignment_op init_types;
//Connectives
logical_operator: subset | superset | lt | gt | and | or | not | equal;
logical_expression: term logical_operator logical_expression | term logical_operator term | not_expression;
not_expression: not lp logical_expression rp;
del_expression: set_del var;
//Arithmetic
arithmetic_expression: arithmetic_expression adder arithmetic_expression | exp2;
exp2: exp2 subtractor exp2 | exp3;
exp3: exp3 multiplier exp3 | exp4;
exp4: exp4 divider exp4 | exp5;
exp5: integer | float | function_call;
//Set Expressions
set_exp: exp_uni;
exp_uni: exp_uni union exp_uni | exp_intersection;
exp_intersection: exp_intersection intersection exp_intersection| exp_diff;
exp_diff: exp_diff difference exp_diff|exp_cartesian;
exp_cartesian: exp_cartesian cp_op exp_cartesian | set;
expression: arithmetic_expression | logical_expression | cardinality_expression | del_expression;
cardinality_expression: cardinality_op var cardinality_op | cardinality_op set cardinality_op;
//Input/Output
in_out_stmnt: input_stmnt | output_stmnt;
input_stmnt: input lp input_body rp;
input_body: type var;
output_stmnt: output lp output_body rp;
output_body: var;
//Function
function: type var lp arguments rp lcb stmnt_l return_stmnt rcb
| type var lp rp lcb stmnt_l return_stmnt rcb;
arguments: primitive var | primitive var comma arguments;
function_call: fc lp parameters rp | fc lp rp;
parameters: var | var comma parameters |type comma parameters;
return_stmnt: return var;
%%
#include "lex.yy.c"
int yyerror(char *s) {
fprintf(stdout, "line %d: %s\n", yylineno,s);
}
int main(){
return yyparse();
if(yynerrs < 1){
printf("Parsing is successful\n");
}
return 0;
}
And finally all the code I call in linux terminal is the following;
flex katir.l
yacc katir.yacc
gcc -o katir y.tab.c
As you already surmised in a comment, your problem is that your token names clash with C keywords. Defining a token if
in your yacc file will cause the generated C file to contain both a line like if = 258
(where 258 could of course be a different number) inside an enum
declaration and #define if 258
afterwards. if = 258
is a syntax error of course and #define if 258
will cause errors anywhere where if
is used as part of an actual if
statement anywhere in the following code (because something like if(cond)
would become 42(cond)
, which is a type error). The same goes for any other keywords.
The convention is for token names to be written in ALL_CAPS to avoid exactly this problem.