BISON AST生产打印出混乱的价值

时间:2015-07-29 16:20:09

标签: c compiler-construction bison abstract-syntax-tree yacc

我试图制作一个简单的解析器。它既可用于家庭作业,也可用于自己的实验。我已经完成了词法分析器和解析器,我现在尝试输出AST。问题是,当我添加例如两个整数时,结果树会打印出无法识别的符号。有效输入应为+(1,1),有效输出应为(+ 1 1)。而不是这个,我得到了( + �|k �|k )。我尝试了很多东西,但实际上没有任何重大结果。 sprintf函数返回一个空终止符,所以可能这不是问题。以下是解析器代码(.y文件):

%{
#define YYDEBUG 1
%}

%start program

%token  NUMBER
%token  ID
%token  PLUS    MINUS   TIMES
%token  LP  RP  EQUALS  COMMA
%token  END

%token  LET IN  AND

%left   PLUS    MINUS
%left   TIMES
%left   LET IN  AND
%left   EQUALS

%%

program:{printf("Empty Input\n");}  /* empty */
        | program line /* do nothing */

line:   expr END        { printtree($1); printf("\n");}
    ;

expr    : /*Empty*/
    | LET deflist IN expr {}
    | ID        { printf("Found ID\n"); $$ = make_id_leaf($1);}
    | NUMBER    { printf("Found NUMBER\n"); $$ = make_number_leaf($1);}
        | PLUS LP expr COMMA expr RP  {$$ = make_plus_tree($3,$5); printf("Found expr PLUS expr.\n"); }
        | TIMES LP expr COMMA expr RP {$$ = make_times_tree($3,$5); printf("Found expr TIMES expr. Result:%d\n", $$);}
    | MINUS ID
    | MINUS NUMBER     { printf("found MINUS NUMBER\n"); }
        ;

deflist : definition
    | definition AND deflist
    ;

definition : /*Empty*/
       | ID EQUALS expr {printf("Found EQ\n");}
       ;
%%

/*int main (void) {return yyparse ( );}*/

int yyerror (char *s) {fprintf (stderr, "%s\n", s);}

lexer 文件:

%{
#include "parser.h"
%}
DIGIT [0-9]
LETTER [a-zA-Z]
%%

LET {printf("Encountered LET\n"); return(LET);}
IN  {printf("Encountered IN\n"); return(IN);}
AND {printf("Encountered AND\n"); return(AND);}
{DIGIT}+    {yylval = atoi(yytext); return NUMBER;}
{LETTER}*       { if (strlen(yytext) <= 8){
                    yylval = strlen(yytext);
            printf( "<ID, %s> ", yytext );
            return(ID);
                  } else {
                        yytext[8] = '\0';
                        printf("WARNING! Long identifier. Truncating to 8 chars\n");
                        printf( "<ID, %s> ", yytext );
            return(ID);
                  }
                }
[ \t] ;
[\n]     return(END); 
"+"      return(PLUS);
"-"      return(MINUS);
"*"      return(TIMES);
"="  return(EQUALS);
"("      return(LP);
")"      return(RP);
","  return(COMMA);
<<EOF>>  return(0);
%%

int yywrap (void) {return 1;}

main.c ,其中包含 yyparse()函数:

#include <stdio.h>
#include <stdlib.h>
#include "tree.h"
#include "treedefs.h"

int main(int argc, char **argv){
    yyparse();

    return 0;
}

包含函数定义的 treedefs.h 文件(我只包括结构定义,数字叶和加号树):

typedef struct tree{
    char *token;
    TREE *l;
    TREE *r;
    TREE *child;
}TREE;

/* Make number leaves */

TREE *make_number_leaf(int n){

    TREE *leafNum = malloc(sizeof(TREE));

    char *c, ch[8];
    sprintf(ch, "%d", n); /* Effective way to convert int to string */
    c = ch;
    leafNum->token = c;
    leafNum->l = NULL;
        leafNum->r = NULL;
        leafNum->child = NULL;

    printf("NUM Leaf is: %s\n", leafNum->token);

    return (leafNum);
}

/* Addition tree */

TREE *make_plus_tree(TREE *l, TREE *r){

    TREE *plusTree = malloc(sizeof(TREE));

    plusTree->token = "+";
    plusTree->l = l;
    plusTree->r = r;
    plusTree->child = NULL;

    return (plusTree);

}
void printtree(TREE *tree)
{
    if (tree->l || tree->r){
            printf("(");
    }

    printf(" %s ", tree->token);

    if (tree->l){
        printtree(tree->l);
    }
    if (tree->r){
        printtree(tree->r);
    }
    if (tree->l || tree->r){
        printf(")");
    }
}

文件 tree.h 仅包含一些声明,没什么大不了的,而且与问题无关。

为什么数字看起来像这样?我该如何解决?任何帮助将不胜感激。

1 个答案:

答案 0 :(得分:2)

这个问题实际上与野牛或弹性无关。它位于TREE *make_number_leaf(int n){ TREE *leafNum = malloc(sizeof(TREE)); char *c, ch[8]; // ^ local variable sprintf(ch, "%d", n); /* Effective way to convert int to string */ c = ch; leafNum->token = c; // ^ dangling pointer // Remainder omitted } 实施中:

ch

如上面的注释所示,c是一个本地(堆栈分配)变量,其生命周期在函数返回时结束。将其地址分配给变量c不会改变它。因此,只要函数返回,存储在leafNum->token中的malloc的值将成为悬空指针。

因此,当您稍后尝试打印出令牌时,您将打印出随机存储器的内容。

您需要free一个字符缓冲区,并在free TREE时记住leafNum->token。 (但是,在free是字符串文字的情况下,你不能调用make,所以你需要更聪明一点。)