/* bu-parser.h (path: root/bu-parser.h, blob 8910b5dceb26ac5fecf6bedfbd5f9e2cda78fbe3) */
#ifndef BU_PARSER_HG
#define BU_PARSER_HG

#include <stdio.h>
#include <string.h>
#include <stdlib.h>
#include "tree.h"

/* PRODUCTION RULES
  <expr> ::= <expr> <binary_op> <expr> | <unary_op> <expr> | "(" <expr> ")" | <var>
  <binary_op> ::= "*" | "+"
  <unary_op> ::= "!"
  <var> ::= r#[a-z]    (a regex character class: one lowercase letter)
 */

/* Status values for an expr_parser (stored in its `st` field).
 * The error state is the only negative value. */
enum parser_state {
  PARSER_ERR    = -1, /* error state */
  PARSER_READY  =  0, /* zero-valued state; presumably "not finished yet" -- confirm in the implementation */
  PARSER_ACCEPT =  1  /* presumably "input accepted" -- confirm in the implementation */
};

/* Token kinds carried by struct chartoken.
 * Numbering starts at 0 and is contiguous. TOKEN_MAX has to remain the last
 * member: enum stackmember_id places its own ids after it. */
enum token_id {
  TOKEN_INVALID = 0,
  TOKEN_BINARY_OPERATOR, /* presumably <binary_op> from the grammar: "*" or "+" */
  TOKEN_UNARY_OPERATOR,  /* presumably <unary_op> from the grammar: "!" */
  TOKEN_VARIABLE,        /* presumably <var> from the grammar */
  TOKEN_OPEN_PAREN,      /* presumably "(" */
  TOKEN_CLOSE_PAREN,     /* presumably ")" */
  TOKEN_EOS,             /* presumably end of the input stream -- confirm against the lexer */
  TOKEN_OOB,             /* NOTE(review): meaning not visible in this header -- confirm against the lexer */
  TOKEN_MAX              /* sentinel, one past the last token id */
};

/* Tags for entries on the parser stack.
 * The low range of values is shared with enum token_id (per the original
 * note, all token ids are meant to be usable here; only the first one is
 * spelled out). Ids specific to the stack start after TOKEN_MAX. */
enum stackmember_id {
  /* token id range, reused as-is */
  STACKMEMBER_INVALID = TOKEN_INVALID,
  /* ... remaining token ids are not repeated ... */
  STACKMEMBER_EXPR = TOKEN_MAX + 1, /* first id beyond the token range */
  STACKMEMBER_MAX                   /* sentinel, one past STACKMEMBER_EXPR */
};

/* A token as returned by a lexer callback: its kind plus one character. */
struct chartoken {
  enum token_id id; /* token kind */
  char c;           /* character associated with the token */
};

/* Lexer callback type: receives an opaque pointer and returns a token by value. */
typedef struct chartoken (*lexer_fn)(void *);

/* One entry of the parser stack: a tag (`id`) plus a payload held in an
 * anonymous union, so the payload is accessed as `.terminal` or `.expr`. */
struct stackmember {
  enum stackmember_id id; // tag for this entry
  union {
    char terminal; // character payload; presumably valid when id is in the token id range -- confirm
    node *expr;    // tree payload; presumably valid when id == STACKMEMBER_EXPR -- confirm (`node` is presumably declared in tree.h)
  };
};

/* Number of entries in the fixed-size parser stack.
 * Named so code that pushes onto the stack can bounds-check against it
 * instead of repeating the literal.
 * (1024 oughta be enough, FIXME if not) */
enum { EXPR_PARSER_STACK_MAX = 1024 };

/* Complete state of one expression parser. */
struct expr_parser {
  lexer_fn lex;   // lexer callback supplying tokens
  void *lex_data; // opaque pointer stored with lex; presumably passed to it on each call -- confirm
  // since tokens are 1-to-1 maps to chars,
  // we're fine making this type assumption
  struct chartoken lahead; // presumably the current lookahead token -- confirm
  enum parser_state st;    // current parser status
  struct stackmember stack[EXPR_PARSER_STACK_MAX];
  // index into stack; NOTE(review): whether this is the top entry or the
  // next free slot is decided by the implementation, not visible here
  size_t stack_idx;
};

/* Build a parser for the lexer callback `src` and its opaque `lex_data`.
 * The parser is returned by value. */
struct expr_parser expr_parser_init(lexer_fn src, void *lex_data);

/* Counterpart to expr_parser_init for a parser that is no longer needed.
 * NOTE(review): what exactly is released is defined in the implementation. */
void expr_parser_finish(struct expr_parser *ep);

/* Run the parser `ep`.
 * NOTE(review): the meaning of the int result is defined in the
 * implementation and is not visible from this header. */
int expr_parser_run(struct expr_parser *ep);

/* Debugging aid: print a representation of `ep` to `stream`. */
void expr_parser_debug_print(FILE *stream, struct expr_parser *ep);

#endif // BU_PARSER_HG