as_parser.c 6.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. #include "as_parser.h"
  2. #include "as_tokenizer.h"
  3. #include "utils.h"
  4. #include <stdio.h>
  5. #include <stdlib.h>
  6. #include <string.h>
  7. // BNF
  8. // ===
  9. //
  10. // <prog> ::= <stmts>
  11. // <stmts> ::= <stmt> newline | <stmt> newline <stmts>
  12. // <stmt> ::= <label> <instr> | <instr> | <label>
  13. // <instr> ::= <op> | <op> arg | <op> tag
  14. // <label> ::= tag ":"
  15. // <op> ::= "add" | "sub" | "mul" | "div" | "mod" | "eq" | ...
  16. struct result parse_prog(struct allocator * alct, struct token_stream * ts) {
  17. struct result result;
  18. struct prog * p = allocate(alct, sizeof(struct prog));
  19. result = parse_stmts(alct, ts);
  20. if (result.errmsg != NULL) return result;
  21. p->stmts = result.value;
  22. return (struct result){.value = p, .errmsg = NULL};
  23. }
  24. struct result parse_stmts(struct allocator * alct, struct token_stream * ts) {
  25. struct token *token;
  26. struct result result;
  27. const char* errmsg;
  28. struct stmts * ss = allocate(alct, sizeof(struct stmts));
  29. ss->stmts = allocate(alct, sizeof(struct stmt *));
  30. ss->stmts[0] = NULL;
  31. int capacity = 0;
  32. int len = 0;
  33. while (1) {
  34. result = peek_token(alct, ts);
  35. if (result.errmsg != NULL) return result;
  36. token = result.value;
  37. if (token->type == TK_ENDOFFILE) {
  38. break;
  39. }
  40. result = parse_stmt(alct, ts);
  41. if (result.errmsg != NULL) {
  42. return result;
  43. }
  44. struct stmt * s = result.value;
  45. if (s == NULL) continue;
  46. if (len == capacity) {
  47. size_t new_capacity = capacity * 2 + 1;
  48. void* new_stmts = allocate(alct, sizeof(struct stmt **) * new_capacity);
  49. memcpy(new_stmts, ss->stmts, sizeof(struct stmt **) * capacity);
  50. ss->stmts = new_stmts;
  51. capacity = new_capacity;
  52. }
  53. // expect newline
  54. result = peek_token(alct, ts);
  55. if (result.errmsg != NULL) return result;
  56. token = result.value;
  57. if (token->type == TK_NEWLINE) {
  58. result = next_token(alct, ts);
  59. if (result.errmsg != NULL) return result;
  60. } else {
  61. errmsg = safe_sprintf(alct, "%d:%d expect newline.\n", token->line, token->col);
  62. return (struct result){.value = NULL, .errmsg = errmsg};
  63. }
  64. ss->stmts[len] = s;
  65. len++;
  66. }
  67. ss->stmts[len] = NULL;
  68. return (struct result){.value = ss, .errmsg = NULL};
  69. }
  70. struct result parse_label(struct allocator * alct, struct token_stream * ts) {
  71. const char *errmsg;
  72. struct result result;
  73. struct token * t;
  74. result = next_token(alct, ts);
  75. if (result.errmsg != NULL) return result;
  76. t = result.value;
  77. if (t->type != TK_TAG) {
  78. errmsg = safe_sprintf(alct, "%d:%d expect label.\n", t->line, t->col);
  79. return (struct result){.value = NULL, .errmsg = errmsg};
  80. }
  81. struct label * l = allocate(alct, sizeof(struct label *));
  82. l->name = t->sval;
  83. result = next_token(alct, ts);
  84. if (result.errmsg != NULL) return result;
  85. t = result.value;
  86. if (t->type != TK_COLON) {
  87. errmsg = safe_sprintf(alct, "%d:%d expect colon.\n", t->line, t->col);
  88. return (struct result){.value = NULL, .errmsg = errmsg};
  89. }
  90. return (struct result){.value = l, .errmsg = NULL};
  91. }
  92. struct result parse_stmt(struct allocator * alct, struct token_stream * ts) {
  93. const char *errmsg;
  94. struct result result;
  95. struct token * t;
  96. result = peek_token(alct, ts);
  97. if (result.errmsg != NULL) return result;
  98. t = result.value;
  99. struct stmt * stmt = allocate(alct, sizeof(struct stmt));
  100. stmt->label = NULL;
  101. stmt->instr = NULL;
  102. if (t->type == TK_TAG) {
  103. result = parse_label(alct, ts);
  104. if (result.errmsg != NULL) return result;
  105. stmt->label = result.value;
  106. result = peek_token(alct, ts);
  107. if (result.errmsg != NULL) return result;
  108. t = result.value;
  109. if (t->type == TK_NEWLINE) {
  110. return (struct result){.value = stmt, .errmsg = NULL};
  111. }
  112. result = peek_token(alct, ts);
  113. if (result.errmsg != NULL) return result;
  114. t = result.value;
  115. }
  116. if (t->type == TK_OP) {
  117. result = parse_instr(alct, ts);
  118. if (result.errmsg != NULL) return result;
  119. stmt->instr = result.value;
  120. result = peek_token(alct, ts);
  121. if (result.errmsg != NULL) return result;
  122. t = result.value;
  123. if (t->type == TK_NEWLINE) {
  124. return (struct result){.value = stmt, .errmsg = NULL};
  125. }
  126. }
  127. if (t->type == TK_NEWLINE) {
  128. return (struct result){.value = NULL, .errmsg = NULL};
  129. }
  130. errmsg = safe_sprintf(alct, "%d:%d expect lable + instruction, lable, or instruction.\n", t->line, t->col);
  131. return (struct result){.value = NULL, .errmsg = errmsg};
  132. }
  133. struct result parse_op(struct allocator * alct, struct token_stream * ts) {
  134. const char *errmsg;
  135. struct result result;
  136. struct token * t;
  137. result = next_token(alct, ts);
  138. if (result.errmsg != NULL) return result;
  139. t = result.value;
  140. enum op op;
  141. if (t->type == TK_OP) {
  142. op = str2op(t->sval);
  143. if (op == OP_END) {
  144. errmsg = safe_sprintf(alct, "%d:%d invalid op.\n", t->line, t->col);
  145. return (struct result){.value = NULL, .errmsg = errmsg};
  146. }
  147. } else {
  148. errmsg = safe_sprintf(alct, "%d:%d expect op.\n", t->line, t->col);
  149. return (struct result){.value = NULL, .errmsg = errmsg};
  150. }
  151. return (struct result){.value = (void*)op, .errmsg = NULL};
  152. }
  153. struct result parse_instr(struct allocator * alct, struct token_stream * ts) {
  154. struct result result;
  155. struct token * t;
  156. result = peek_token(alct, ts);
  157. if (result.errmsg != NULL) return result;
  158. t = result.value;
  159. struct instr * i = allocate(alct, sizeof(struct instr));
  160. i->tag_name = NULL;
  161. i->arg = NULL;
  162. i->op = OP_END;
  163. if (t->type == TK_OP) {
  164. result = parse_op(alct, ts);
  165. i->op = (enum op)(result.value);
  166. result = peek_token(alct, ts);
  167. if (result.errmsg != NULL) return result;
  168. t = result.value;
  169. if (t->type == TK_ARG) {
  170. struct arg * a = allocate(alct, sizeof(struct arg));
  171. a->ival = t->ival;
  172. a->fval = t->fval;
  173. i->arg = a;
  174. next_token(alct, ts);
  175. } else if (t->type == TK_TAG) {
  176. i->tag_name = t->sval;
  177. next_token(alct, ts);
  178. }
  179. }
  180. return (struct result){.value = i, .errmsg = NULL};
  181. }