首页
学习
活动
专区
圈层
工具
发布
社区首页 >问答首页 >如何使用结构创建带有树的表达式分析器

如何使用结构创建带有树的表达式分析器
EN

Stack Overflow用户
提问于 2020-09-26 18:53:11
回答 1查看 242关注 0票数 1

我有一个自己弄不明白的问题。我想创建一个表达式分析器,所以首先为这个解析器创建了一棵树,代码如下。

代码语言:javascript
复制
/* Constants passed as the `operation` argument of make_node(). */
enum {
    integer   = 0,
    plus      = 1,
    minus     = 2,
    multi     = 3,
    divis     = 4,
    string    = 5,
    character = 6
};

struct Tree {
    int operation;
    struct Tree *left;
    struct Tree *right;
    char *value;
};

/*
 * Allocate a new tree node and fill in its fields.
 *
 * operation: node kind (one of the enum constants such as integer, plus).
 * left/right: child subtrees, or NULL.
 * value: text for the node; the pointer is stored as-is, not copied.
 *
 * Returns the newly allocated node. If malloc() fails the error is reported
 * on stderr and the program exits, so the result is never NULL.
 */
struct Tree *make_node(int operation, struct Tree *left, struct Tree *right, char *value) {
    struct Tree *n = malloc(sizeof *n);

    if(n == NULL) {
        /* Stop here: continuing would dereference the NULL pointer below. */
        fprintf(stderr, "Unable to malloc \'make_node()\'\n");
        exit(EXIT_FAILURE);
    }

    n -> operation = operation;
    n -> left = left;
    n -> right = right;
    n -> value = value;

    return n;
}

/*
 * Print the tree in post-order: left subtree, then right subtree, then the
 * node itself (its operation code and its value text).
 *
 * n: root of the (sub)tree; NULL prints nothing.
 *
 * Always returns 0.
 */
int print_post_order_data(struct Tree *n) {
    if(n == NULL) {
        return 0;
    }

    print_post_order_data(n -> left);
    print_post_order_data(n -> right);

    /* Operator nodes have a NULL value; passing NULL to %s is undefined behavior. */
    printf("Operation => %d \t Value => %s\n", n -> operation,
           n -> value != NULL ? n -> value : "(null)");

    /* The function is declared int, so every path must return a value. */
    return 0;
}

/*
 * Build a tree for the sample expression by hand and print it in post-order.
 */
int main(void) {
    struct Tree *m;

    // Expression is ( 2 + 3 * 5 - 8 / 3 )
    m = make_node(plus, NULL, NULL, NULL);
    m -> left = make_node(minus, NULL, NULL, NULL);
    m -> right = make_node(integer, NULL, NULL, "2");
    m -> left -> left = make_node(multi, NULL, NULL, NULL);
    m -> left -> right = make_node(divis, NULL, NULL, NULL);
    m -> left -> left -> left = make_node(integer, NULL, NULL, "3");
    m -> left -> left -> right = make_node(integer, NULL, NULL, "5");
    m -> left -> right -> left = make_node(integer, NULL, NULL, "8");
    m -> left -> right -> right = make_node(integer, NULL, NULL, "3");

    /* The root is `m`; no variable named `n` exists in this function. */
    print_post_order_data(m);

    return 0;
}

如您所见,我已经手动为表达式创建了树。表达式为 2 + 3 * 5 - 8 / 3。

假设这个程序已经可以识别出 2 是数字、+ 是加号等等,我该如何编写解析器?也就是说,如何像上面描述的那样创建节点?能给我代码或者伪代码吗?

以下是更多信息

代码语言:javascript
复制
e.g. => 1 + 2 * 3

The tree is,
                +
               / \
              /   \
             *     1
            / \
           /   \
          2     3

1 + 2 * 3 => 1 + ( 2 * 3 )

So manually I can create tree like this.

    // Hand-built tree for 1 + 2 * 3: the root is the '+' node, its left child
    // is the '*' node (with children 2 and 3) and its right child is the literal 1.
    struct Tree *n;
    n = make_node(plus, NULL, NULL, NULL);
    n -> left = make_node(multi, NULL, NULL, NULL);
    n -> right = make_node(integer, NULL, NULL, "1");
    n -> left -> left = make_node(integer, NULL, NULL, "2");
    n -> left -> right = make_node(integer, NULL, NULL, "3");

我试图创建这样一个解析器。

代码语言:javascript
复制
// Pseudocode sketch (not compilable C): parse one multiplicative_expression,
// then keep parsing further ones inside an endless loop. The remaining loop
// body, including how the loop ends, is elided ("....").
addictive_expression() {
    multiplicative_expression()

    while(1) {
        multiplicative_expression()

        ....
    }
}


// Pseudocode sketch (not compilable C): parse one primary_expression, then
// keep parsing further ones while the current token is one of the listed operators.
// NOTE(review): `+` in the loop condition looks out of place for a
// multiplicative level; the fuller version later in this file tests
// O_MLTI, O_DIVS and O_MUDL instead — confirm what was intended.
multiplicative_expression() {
    primary_expression()

    while(+ || * || /) {
        primary_expression()

        ....
    }
}

// Pseudocode sketch (not compilable C): dispatch on the current token.
// Only the `integer` case is shown and its body is elided ("....").
primary_expression() {
    switch(current token) {
        case integer:
             ....
             ....
    }
}

虽然我试着这样做,但我很难弄清楚如何将树连接到它。

编辑1

我想在不使用 Bison 等工具的情况下创建一个解析器。为此所需的词法分析器(lexer)我已经完成了。

编辑2 :

代码语言:javascript
复制
// This is the Source of Struct Tree
// One node of the expression tree filled in by create_new_node().
// NOTE(review): the trailing `Tree` declares a variable of type struct TREE,
// not a typedef name — confirm that this is intended.
struct TREE {
        // Node kind passed to create_new_node().
        int operation;
        // Left child, as passed to create_new_node().
        struct TREE *left;
        // Right child, as passed to create_new_node().
        struct TREE *right;
        // Text attached to the node; create_new_node() stores the pointer it is given.
        char *value;
} Tree;

// Allocate a struct TREE and populate it from the arguments.
// `value` is an array parameter, i.e. a pointer: the node keeps that pointer
// and does not copy the characters. fatal() is called when malloc() fails.
// Returns the new node.
struct TREE *create_new_node(int operation, struct TREE *left, struct TREE *right, char value[MAX_LENG]) {
        struct TREE *node = malloc(sizeof *node);

        if(!node) {
                fatal("Unable to Malloc New Structure TREE in \'create_new_node()\' Function in tree.c File");
        }

        node -> value = value;
        node -> right = right;
        node -> left = left;
        node -> operation = operation;

        return node;
}

// This is the Source of Parser
// Defined further down in this file; declared here so that the call below
// has a prototype in scope.
int addictive_expression(void);

// Parser entry point: fetch the first token, then parse an additive expression.
// Returns whatever addictive_expression() returns.
int expression(void) {
        next_token(); // This Function will get the next Token

        // The function is declared int, so it must return a value.
        return addictive_expression();
}

int addictive_expression(void) {
        int token_type;

        multiplicative_expression();

        token_type = Token.current_token; // Token.current_token is the Current Token
        if(token_type == END_FILE) {
                return 0;
        }

        while(1) {
                next_token();

                multiplicative_expression();
                
                token_type = Token.current_token;
                if(token_type == END_FILE) { // End File is a Enum
                        return 0;
                }
        }

        return 0;
}

// Parse one primary expression, then keep parsing further ones for as long as
// the current token is O_MLTI, O_DIVS or O_MUDL. Always returns 0.
int multiplicative_expression(void) {
        primary_expression();

        for(;;) {
                int current = Token.current_token;

                if(current == END_FILE) {
                        break;
                }
                // O_MLTI, O_DIVS. O_MUDL are the tokens ( Enum )
                if(current != O_MLTI && current != O_DIVS && current != O_MUDL) {
                        break;
                }

                next_token();
                primary_expression();
        }

        return 0;
}

// Consume the current token when it is an INTEGER or one of the operator
// tokens; report a syntax error through error_d() for anything else.
// Always returns 0.
int primary_expression(void) {
        int kind = Token.current_token;

        if(kind == INTEGER ||
           kind == O_PLUS || kind == O_MNUS ||
           kind == O_MLTI || kind == O_DIVS || kind == O_MUDL) {
                next_token();
                return 0;
        }

        error_d("Syntax Error in Primary Expression", Token.current_token); // Custom Error Message
        return 0;
}

/*
    struct Tree *m;

    m = make_node(plus, NULL, NULL, NULL);
    m -> left = make_node(minus, NULL, NULL, NULL);
    m -> right = make_node(integer, NULL, NULL, "2");
    m -> left -> left = make_node(multi, NULL, NULL, NULL);
    m -> left -> right = make_node(divis, NULL, NULL, NULL);
    m -> left -> left -> left = make_node(integer, NULL, NULL, "3");
    m -> left -> left -> right = make_node(integer, NULL, NULL, "5");
    m -> left -> right -> left = make_node(integer, NULL, NULL, "8");
    m -> left -> right -> right = make_node(integer, NULL, NULL, "3");
*/

我很难想出如何将树连接到它,你能给我一个解决方案吗?

EN

回答 1

Stack Overflow用户

回答已采纳

发布于 2020-09-27 17:43:16

语法中的每个非终结符都由一个函数实现,该函数返回它自己解析出的子表达式;在您的示例中,子表达式由 struct Tree * 表示。

这允许在递归调用时构造树。

因此,基本上您的addictive_expression应该是这样的:

代码语言:javascript
复制
/*
 * Parse a chain of multiplicative expressions joined by PLUS or MINUS.
 * Each operator wraps the tree built so far as the left child of a new
 * OPERATOR node. Returns the root of the resulting tree.
 */
static struct Tree *addictive_expression() {
    struct Tree *lhs = multiplicative_expression();

    for (;;) {
        if (token->type != OPERATOR) {
            break;
        }
        if (token->op != PLUS && token->op != MINUS) {
            break;
        }

        Operator which = token->op;
        token = next_token();
        struct Tree *rhs = multiplicative_expression();

        switch (which) {
            case PLUS:
                lhs = create_new_node(OPERATOR, PLUS, lhs, rhs, NULL);
                break;
            case MINUS:
                lhs = create_new_node(OPERATOR, MINUS, lhs, rhs, NULL);
                break;
            default:
                /* Only PLUS and MINUS pass the checks above. */
                break;
        }
    }

    return lhs;
}

它是如何工作的:

它先调用 multiplicative_expression,后者再调用其他函数来获取表达式。在简单的递归下降解析中,每个优先级都有一个单独的函数。由于加号和减号是左结合运算符,所以它们在循环中处理:如果连续出现相同优先级的运算,则在创建新节点时,把前一个节点设置为它的左子表达式。

为了便于理解,我添加了一个包含 PLUS 和 MINUS 两个 case 的 switch 语句,但正如您所看到的,您可以将它简化为:

代码语言:javascript
复制
/*
 * Parse a chain of value expressions joined by MULT or DIV.
 * The operator read from the token is passed straight to create_new_node(),
 * and the tree built so far becomes the left child of the new node.
 * Returns the root of the resulting tree.
 */
static struct Tree *multiplicative_expression() {
    struct Tree *lhs = value_expression();

    for (;;) {
        if (token->type != OPERATOR) {
            break;
        }
        if (token->op != MULT && token->op != DIV) {
            break;
        }

        Operator which = token->op;
        token = next_token();
        struct Tree *rhs = value_expression();
        lhs = create_new_node(OPERATOR, which, lhs, rhs, NULL);
    }

    return lhs;
}

这里只使用操作符来创建一个新节点。

数据结构

注意:类型和运算符是分开的。

代码语言:javascript
复制
/* Kind of a token or tree node. */
typedef enum {
    NONE     = 0,
    END      = 1,
    NUMERIC  = 2,
    OPERATOR = 3
} Type;

/* Operator carried by a token or tree node. */
typedef enum {
    INVALID = 0,
    PLUS    = 1,
    MINUS   = 2,
    MULT    = 3,
    DIV     = 4
} Operator;

/* A token: its kind, its operator, and its text. */
typedef struct {
    /* Kind of token (a Type constant). */
    Type type;
    /* Operator of the token; the parser reads it when type is OPERATOR. */
    Operator op;
    /* Token text; the parser duplicates it for NUMERIC tokens. */
    char *value;
} Token;

然后,树结构是:

代码语言:javascript
复制
/* One node of the expression tree; kind and operator are separate fields. */
struct Tree {
    /* Kind of node (a Type constant). */
    Type type;
    /* Operator of the node (an Operator constant). */
    Operator op;
    /* Left operand subtree; the parser passes NULL for NUMERIC nodes. */
    struct Tree *left;
    /* Right operand subtree; the parser passes NULL for NUMERIC nodes. */
    struct Tree *right;
    /* Text of the node; the parser passes NULL for OPERATOR nodes. */
    char *value;
};

完整示例

因此,一个小而完整的示例,其中的函数名是基于问题中的示例片段,看起来可能是这样的,具有两个优先级级别:

  • */
  • +-

代码语言:javascript
复制
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include "parser.h"
#include "lexer.h"

/* Current token; the parsing functions below reassign it from next_token(). */
static Token *token;

/*
 * Print `msg` followed by a newline on stderr and terminate the program
 * with exit status 1. Does not return.
 *
 * msg: message text; only read, hence const (callers pass string literals).
 */
static void fatal(const char *msg) {
    fprintf(stderr, "%s\n", msg);
    exit(1);
}

/*
 * Allocate a tree node and initialise every field from the arguments.
 * `value` is stored as given (the pointer is kept, the text is not copied).
 * Calls fatal() when malloc() fails. Returns the new node.
 */
static struct Tree *create_new_node(Type type,
                                    Operator operation,
                                    struct Tree *left,
                                    struct Tree *right,
                                    char *value) {
    struct Tree *node = malloc(sizeof *node);

    if (!node) {
        fatal("Unable to Malloc New Structure Tree in \'create_new_node()\' Function in tree.c File");
    }

    *node = (struct Tree){
        .type = type,
        .op = operation,
        .left = left,
        .right = right,
        .value = value,
    };

    return node;
}


static struct Tree *value_expression() {
    if (token->type == NUMERIC) {
        struct Tree *result = create_new_node(NUMERIC, NONE, NULL, NULL, strdup(token->value));
        token = next_token();
        return result;
    }
    fatal("can't determine value for token");
}

/*
 * Parse a chain of value expressions joined by MULT or DIV.
 * Each operator wraps the tree built so far as the left child of a new
 * OPERATOR node. Returns the root of the resulting tree.
 */
static struct Tree *multiplicative_expression() {
    struct Tree *lhs = value_expression();

    for (;;) {
        if (token->type != OPERATOR) {
            break;
        }
        if (token->op != MULT && token->op != DIV) {
            break;
        }

        Operator which = token->op;
        token = next_token();
        struct Tree *rhs = value_expression();
        lhs = create_new_node(OPERATOR, which, lhs, rhs, NULL);
    }

    return lhs;
}

/*
 * Parse a chain of multiplicative expressions joined by PLUS or MINUS.
 * Each operator wraps the tree built so far as the left child of a new
 * OPERATOR node. Returns the root of the resulting tree.
 */
static struct Tree *addictive_expression() {
    struct Tree *lhs = multiplicative_expression();

    for (;;) {
        if (token->type != OPERATOR) {
            break;
        }
        if (token->op != PLUS && token->op != MINUS) {
            break;
        }

        Operator which = token->op;
        token = next_token();
        struct Tree *rhs = multiplicative_expression();
        lhs = create_new_node(OPERATOR, which, lhs, rhs, NULL);
    }

    return lhs;
}

/*
 * Parser entry point: fetch the first token, parse an additive expression,
 * then hand the token that ended the expression to putback_token().
 * Returns the root of the parsed tree.
 */
struct Tree *expression() {
    struct Tree *root;

    token = next_token();
    root = addictive_expression();
    putback_token(token);

    return root;
}

树输出

代码语言:javascript
复制
#include <stdio.h>
#include <stdlib.h>
#include "lexer.h"
#include "parser.h"

void test_parser();

/* Program entry point: run the parser test and report success. */
int main(void) {
    test_parser();
    return 0;
}

/*
 * Print the tree rooted at `expr`, one node per line.
 *
 * Every line starts with `level` copies of "  |  ". A NUMERIC node prints its
 * value. An OPERATOR node prints its symbol, then both children one level
 * deeper, then an empty line. A node of type NONE or END, or an OPERATOR node
 * whose op is INVALID, prints a message on stderr and exits with status 1.
 */
void print_expr(struct Tree *expr, int level) {
    const char *header = NULL;
    int remaining = level;

    while (remaining-- > 0) {
        printf("  |  ");
    }

    if (expr->type == NUMERIC) {
        printf("%s\n", expr->value);
        return;
    }
    if (expr->type == NONE) {
        fprintf(stderr, "unexpected NONE\n");
        exit(1);
    }
    if (expr->type == END) {
        fprintf(stderr, "unexpected END\n");
        exit(1);
    }
    if (expr->type != OPERATOR) {
        return;
    }

    /* All four operators print the same way; only the first line differs. */
    switch (expr->op) {
        case PLUS:
            header = "+\n";
            break;
        case MINUS:
            header = "-\n";
            break;
        case MULT:
            header = "*\n";
            break;
        case DIV:
            header = "/\n";
            break;
        case INVALID:
            fprintf(stderr, "invalid op\n");
            exit(1);
        default:
            return;
    }

    fputs(header, stdout);
    print_expr(expr->left, level + 1);
    print_expr(expr->right, level + 1);
    printf("\n");
}

/*
 * Point the lexer at "../input.txt", parse one expression from it and print
 * the resulting tree starting at indentation level 0.
 */
void test_parser() {
    struct Tree *root;

    setup_lexer("../input.txt");
    root = expression();
    print_expr(root, 0);
}

结果

对于输入的2 + 3 * 5 - 8 / 3,上面的小型测试程序将以下内容输出到调试控制台:

代码语言:javascript
复制
-
  |  +
  |    |  2
  |    |  *
  |    |    |  3
  |    |    |  5


  |  /
  |    |  8
  |    |  3

它看起来像正确的语法树!

票数 1
EN
页面原文内容由Stack Overflow提供。腾讯云小微IT领域专用引擎提供翻译支持
原文链接:

https://stackoverflow.com/questions/64081412

复制
相关文章

相似问题

领券
问题归档专栏文章快讯文章归档关键词归档开发者手册归档开发者手册 Section 归档