457 lines
10 KiB
C
457 lines
10 KiB
C
#include "parse.h"
|
|
|
|
#include <blue/core/hash.h>
|
|
#include <ctype.h>
|
|
#include <ivy/asm/assembler.h>
|
|
#include <ivy/asm/bin.h>
|
|
#include <ivy/ident.h>
|
|
#include <ivy/selector.h>
|
|
#include <ivy/asm/instr.h>
|
|
#include <stdlib.h>
|
|
|
|
/*
 * Hash values that get_index_base() compares against b_hash_string() of an
 * identifier. They are used as switch labels there; each match is still
 * confirmed with strcmp() against the keyword named in the macro.
 * NOTE(review): presumably precomputed from "self", "pool", "sp" and "bp" --
 * confirm against b_hash_string() if the hash function ever changes.
 */
#define HASH_SELF 0x2d19e518d40792b7
#define HASH_POOL 0x8c22f10da88b1083
#define HASH_SP   0x08d93e07b5793c56
#define HASH_BP   0x08a64407b54decef

/* Sentinel returned by get_register_index() when a token names no register. */
#define REG_INDEX_INVALID ((unsigned long long)-1)
|
|
|
|
/*
 * The piece of an instruction line that was accepted most recently. The token
 * handlers in this file switch on this value to decide what may come next.
 */
enum instr_component {
	/* nothing pending: start of a line, or the previous line was emitted */
	INSTR_NONE = 0,
	/* an identifier that is part of the mnemonic */
	INSTR_OPCODE,
	/* a '.' following a mnemonic identifier */
	INSTR_OPCODE_DOT,
	/* a complete operand */
	INSTR_OPERAND,
	/* a ',' between two operands */
	INSTR_OPERAND_SEPARATOR,
	/* the '[' opening an indexed operand */
	INSTR_OPERAND_INDEX_LEFT,
	/* the base identifier inside the brackets */
	INSTR_OPERAND_INDEX_BASE,
	/* the ',' between base and offset inside the brackets */
	INSTR_OPERAND_INDEX_SEPARATOR,
	/* the offset inside the brackets */
	INSTR_OPERAND_INDEX_OFFSET,
	/*
	 * accepted by parse_linefeed() and parse_comma(); no handler in this
	 * file assigns it (parse_right_bracket() reports INSTR_OPERAND)
	 */
	INSTR_OPERAND_INDEX_RIGHT,
};
|
|
|
|
/*
 * Base selected by the first identifier of an indexed operand, as recognised
 * by get_index_base().
 */
enum index_base {
	INDEX_NONE = 0, /* identifier is not a known base keyword */
	INDEX_SELF,     /* "self" */
	INDEX_POOL,     /* "pool" */
	INDEX_SP,       /* "sp" */
	INDEX_BP,       /* "bp" */
};
|
|
|
|
/* Discriminator for the union stored in struct arg. */
enum arg_type {
	ARG_NONE = 0,    /* freshly zeroed argument, nothing recorded yet */
	ARG_CONST,       /* integer token (arg_const) */
	ARG_LABEL,       /* identifier that is not a register (arg_label) */
	ARG_REG,         /* register identifier (arg_reg) */
	ARG_INDEX_REG,   /* indexed operand, arg_index_reg member */
	ARG_INDEX_CONST, /* indexed operand with an integer offset */
};
|
|
|
|
struct label {
|
|
b_queue_entry l_entry;
|
|
struct ivy_asm_token *l_name;
|
|
unsigned long long l_offset;
|
|
};
|
|
|
|
struct arg {
|
|
enum arg_type arg_type;
|
|
b_queue_entry arg_entry;
|
|
|
|
union {
|
|
struct ivy_asm_token *arg_const;
|
|
struct ivy_asm_token *arg_label;
|
|
struct {
|
|
struct ivy_asm_token *reg_token;
|
|
unsigned long long reg_index;
|
|
} arg_reg;
|
|
struct {
|
|
enum index_base index_base;
|
|
struct ivy_asm_token *index_base_token;
|
|
|
|
struct ivy_asm_token *index_offset;
|
|
unsigned long long index_offset_reg;
|
|
} arg_index_reg;
|
|
|
|
struct {
|
|
enum index_base index_base;
|
|
struct ivy_asm_token *index_base_token;
|
|
|
|
struct ivy_asm_token *index_offset;
|
|
} arg_index_const;
|
|
};
|
|
};
|
|
|
|
struct block_parser_state {
|
|
struct parser_state s_base;
|
|
unsigned int s_prev_token;
|
|
enum instr_component s_prev_component;
|
|
|
|
b_queue s_labels;
|
|
|
|
b_queue s_mnemonic;
|
|
|
|
b_queue s_args;
|
|
struct arg *s_current_arg;
|
|
};
|
|
|
|
static unsigned long long get_register_index(struct ivy_asm_token *tok)
|
|
{
|
|
if (tok->t_type != IVY_ASM_TOK_IDENT) {
|
|
return REG_INDEX_INVALID;
|
|
}
|
|
|
|
const char *s = tok->t_str;
|
|
if (tolower(s[0]) != 'x') {
|
|
return REG_INDEX_INVALID;
|
|
}
|
|
|
|
char index_str[5] = {0};
|
|
strncpy(index_str + 1, s, sizeof index_str - 1);
|
|
char *ep = NULL;
|
|
unsigned long long index = strtoul(index_str, &ep, 10);
|
|
|
|
if (*ep || index >= 256) {
|
|
return REG_INDEX_INVALID;
|
|
}
|
|
|
|
return index;
|
|
}
|
|
|
|
static enum index_base get_index_base(struct ivy_asm_token *tok)
|
|
{
|
|
if (tok->t_type != IVY_ASM_TOK_IDENT) {
|
|
return INDEX_NONE;
|
|
}
|
|
|
|
const char *s = tok->t_str;
|
|
uint64_t hash = b_hash_string(s);
|
|
|
|
switch (hash) {
|
|
case HASH_SELF:
|
|
if (!strcmp(s, "self")) {
|
|
return INDEX_SELF;
|
|
}
|
|
|
|
return INDEX_NONE;
|
|
case HASH_POOL:
|
|
if (!strcmp(s, "pool")) {
|
|
return INDEX_POOL;
|
|
}
|
|
|
|
return INDEX_NONE;
|
|
case HASH_SP:
|
|
if (!strcmp(s, "sp")) {
|
|
return INDEX_SP;
|
|
}
|
|
|
|
return INDEX_NONE;
|
|
case HASH_BP:
|
|
if (!strcmp(s, "bp")) {
|
|
return INDEX_BP;
|
|
}
|
|
|
|
return INDEX_NONE;
|
|
default:
|
|
return INDEX_NONE;
|
|
}
|
|
}
|
|
|
|
static enum ivy_status write_instruction(struct ivy_asm_parser *p, struct block_parser_state *state)
|
|
{
|
|
struct ivy_instr instr = {0};
|
|
ivy_assembler_put_instr(p->p_assembler, &instr);
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status push_const_arg(
|
|
struct block_parser_state *state, struct ivy_asm_token *tok)
|
|
{
|
|
struct arg *arg = malloc(sizeof *arg);
|
|
if (!arg) {
|
|
return IVY_ERR_NO_MEMORY;
|
|
}
|
|
|
|
memset(arg, 0x0, sizeof *arg);
|
|
|
|
arg->arg_type = ARG_CONST;
|
|
arg->arg_const = tok;
|
|
|
|
b_queue_push_back(&state->s_args, &arg->arg_entry);
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status push_label(
|
|
struct block_parser_state *state, struct ivy_asm_token *tok)
|
|
{
|
|
struct label *label = malloc(sizeof *label);
|
|
if (!label) {
|
|
return IVY_ERR_NO_MEMORY;
|
|
}
|
|
|
|
memset(label, 0x0, sizeof *label);
|
|
|
|
label->l_name = tok;
|
|
/* TODO */
|
|
label->l_offset = 0;
|
|
|
|
b_queue_push_back(&state->s_labels, &label->l_entry);
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status push_label_arg(
|
|
struct block_parser_state *state, struct ivy_asm_token *tok,
|
|
unsigned long long reg_index)
|
|
{
|
|
struct arg *arg = malloc(sizeof *arg);
|
|
if (!arg) {
|
|
return IVY_ERR_NO_MEMORY;
|
|
}
|
|
|
|
memset(arg, 0x0, sizeof *arg);
|
|
|
|
arg->arg_type = ARG_LABEL;
|
|
arg->arg_label = tok;
|
|
|
|
b_queue_push_back(&state->s_args, &arg->arg_entry);
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status push_reg_arg(
|
|
struct block_parser_state *state, struct ivy_asm_token *tok,
|
|
unsigned long long reg_index)
|
|
{
|
|
struct arg *arg = malloc(sizeof *arg);
|
|
if (!arg) {
|
|
return IVY_ERR_NO_MEMORY;
|
|
}
|
|
|
|
memset(arg, 0x0, sizeof *arg);
|
|
|
|
arg->arg_type = ARG_REG;
|
|
arg->arg_reg.reg_token = tok;
|
|
arg->arg_reg.reg_index = reg_index;
|
|
|
|
b_queue_push_back(&state->s_args, &arg->arg_entry);
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status parse_linefeed(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
switch (state->s_prev_component) {
|
|
case INSTR_NONE:
|
|
return IVY_OK;
|
|
case INSTR_OPCODE:
|
|
case INSTR_OPERAND:
|
|
case INSTR_OPERAND_INDEX_RIGHT:
|
|
state->s_prev_component = INSTR_NONE;
|
|
return write_instruction(ctx, state);
|
|
default:
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
}
|
|
|
|
static enum ivy_status parse_int(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
switch (state->s_prev_component) {
|
|
case INSTR_OPCODE:
|
|
case INSTR_OPERAND_SEPARATOR:
|
|
push_const_arg(state, tok);
|
|
state->s_prev_component = INSTR_OPERAND;
|
|
return IVY_OK;
|
|
case INSTR_OPERAND_INDEX_SEPARATOR:
|
|
state->s_current_arg->arg_type = ARG_INDEX_CONST;
|
|
state->s_current_arg->arg_index_const.index_offset = tok;
|
|
state->s_prev_component = INSTR_OPERAND_INDEX_OFFSET;
|
|
return IVY_OK;
|
|
default:
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
}
|
|
|
|
static enum ivy_status parse_ident(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
unsigned long long x = 0;
|
|
|
|
switch (state->s_prev_component) {
|
|
case INSTR_NONE:
|
|
case INSTR_OPCODE_DOT:
|
|
b_queue_push_back(&state->s_mnemonic, &tok->t_entry);
|
|
state->s_prev_component = INSTR_OPCODE;
|
|
return IVY_OK;
|
|
case INSTR_OPCODE:
|
|
case INSTR_OPERAND_SEPARATOR:
|
|
x = get_register_index(tok);
|
|
state->s_prev_component = INSTR_OPERAND;
|
|
|
|
if (x == REG_INDEX_INVALID) {
|
|
return push_label_arg(state, tok, x);
|
|
} else {
|
|
return push_reg_arg(state, tok, x);
|
|
}
|
|
case INSTR_OPERAND_INDEX_LEFT:
|
|
x = get_index_base(tok);
|
|
if (x == INDEX_NONE) {
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
state->s_current_arg->arg_type = ARG_INDEX_REG;
|
|
state->s_current_arg->arg_index_reg.index_base_token = tok;
|
|
state->s_current_arg->arg_index_reg.index_base = x;
|
|
state->s_prev_component = INSTR_OPERAND_INDEX_BASE;
|
|
return IVY_OK;
|
|
default:
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
/* not sure what this is but we aren't expecting it. */
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
static enum ivy_status parse_dot(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
if (state->s_prev_component != INSTR_OPCODE) {
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
state->s_prev_component = INSTR_OPCODE_DOT;
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status parse_label(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
if (state->s_prev_component != INSTR_NONE) {
|
|
/* not sure what this is but we aren't expecting it. */
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
return push_label(state, tok);
|
|
}
|
|
|
|
static enum ivy_status parse_comma(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
switch (state->s_prev_component) {
|
|
case INSTR_OPERAND:
|
|
case INSTR_OPERAND_INDEX_RIGHT:
|
|
state->s_prev_component = INSTR_OPERAND_SEPARATOR;
|
|
return IVY_OK;
|
|
case INSTR_OPERAND_INDEX_BASE:
|
|
state->s_prev_component = INSTR_OPERAND_INDEX_SEPARATOR;
|
|
return IVY_OK;
|
|
default:
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
}
|
|
|
|
static enum ivy_status parse_left_bracket(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
switch (state->s_prev_component) {
|
|
case INSTR_OPCODE:
|
|
case INSTR_OPERAND_SEPARATOR:
|
|
break;
|
|
default:
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
struct arg *arg = malloc(sizeof *arg);
|
|
if (!arg) {
|
|
return IVY_ERR_NO_MEMORY;
|
|
}
|
|
|
|
memset(arg, 0x0, sizeof *arg);
|
|
|
|
state->s_current_arg = arg;
|
|
state->s_prev_component = INSTR_OPERAND_INDEX_LEFT;
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status parse_right_bracket(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
if (state->s_prev_component != INSTR_OPERAND_INDEX_OFFSET) {
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
b_queue_push_back(&state->s_args, &state->s_current_arg->arg_entry);
|
|
state->s_current_arg = NULL;
|
|
state->s_prev_component = INSTR_OPERAND;
|
|
|
|
return IVY_OK;
|
|
}
|
|
|
|
static enum ivy_status parse_end(
|
|
struct ivy_asm_parser *ctx, struct ivy_asm_token *tok)
|
|
{
|
|
struct block_parser_state *state
|
|
= (struct block_parser_state *)asm_parser_get_state(ctx);
|
|
|
|
if (state->s_prev_component != INSTR_NONE) {
|
|
return IVY_ERR_BAD_SYNTAX;
|
|
}
|
|
|
|
asm_parser_pop_state(ctx, NULL);
|
|
|
|
return IVY_OK;
|
|
}
|
|
|
|
static void init_state(struct ivy_asm_parser *ctx, struct parser_state *state)
|
|
{
|
|
ivy_assembler_begin_scope(
|
|
ctx->p_assembler, IVY_ASM_SCOPE_BLOCK, state->s_attrib);
|
|
}
|
|
|
|
static void finish_state(struct ivy_asm_parser *ctx, struct parser_state *state)
|
|
{
|
|
ivy_assembler_end_scope(ctx->p_assembler);
|
|
}
|
|
|
|
struct parser_state_type block_parser_state_type = {
|
|
.n_init_state = init_state,
|
|
.n_finish_state = finish_state,
|
|
.n_state_size = sizeof(struct block_parser_state),
|
|
.n_token_parsers = {
|
|
TOK_PARSER(IDENT, parse_ident),
|
|
TOK_PARSER(LABEL, parse_label),
|
|
TOK_PARSER(INT, parse_int),
|
|
TOK_PARSER(LINEFEED, parse_linefeed),
|
|
},
|
|
.n_symbol_parsers = {
|
|
SYM_PARSER(LEFT_BRACKET, parse_left_bracket),
|
|
SYM_PARSER(RIGHT_BRACKET, parse_right_bracket),
|
|
SYM_PARSER(COMMA, parse_comma),
|
|
SYM_PARSER(DOT, parse_dot),
|
|
},
|
|
.n_keyword_parsers = {
|
|
KW_PARSER(END, parse_end),
|
|
},
|
|
};
|