mpir/yasm/modules/arch/lc3b/lc3bid.re
2008-06-15 21:27:00 +00:00

481 lines
16 KiB
C++

/*
* LC-3b identifier recognition and instruction handling
*
* Copyright (C) 2003-2007 Peter Johnson
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND OTHER CONTRIBUTORS ``AS IS''
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR OTHER CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
#include <util.h>
RCSID("$Id: lc3bid.re 1914 2007-08-20 05:13:35Z peter $");
#include <libyasm.h>
#include "modules/arch/lc3b/lc3barch.h"
/* Opcode modifiers.  Each flag that is set in lc3b_insn_info.modifiers
 * consumes one byte of the per-mnemonic modifier data, taken in LSB->MSB
 * order (MOD_OpHAdd first, then MOD_OpLAdd).  This makes the opcode bytes
 * appear in "reverse" order; that is only for aesthetic reasons in the lexer
 * code below, there is no practical reason for it.
 */
#define MOD_OpHAdd (1UL<<0) /* Parameter adds to upper 8 bits of insn */
#define MOD_OpLAdd (1UL<<1) /* Parameter adds to lower 8 bits of insn */
/* Operand types.  These are more detailed than the "general" types for all
 * architectures, as they include the size, for instance.
 * Bit Breakdown (from LSB to MSB):
 *  - 1 bit = general type (must be an exact match), selected by OPT_MASK:
 *            0 = immediate
 *            1 = register
 *
 * The bits above the general type are actions: what to do with the operand
 * if the instruction matches.  Essentially describes what part of the output
 * bytecode gets the operand.  This may require conversion (e.g. a register
 * going into an immediate field).  Naturally, only one of each of these may
 * be contained in the operands of a single insn_info structure.
 *  - 2 bits = action (bits 1-2, selected by OPA_MASK):
 *            0 = does nothing (operand data is discarded)
 *            1 = DR field
 *            2 = SR field
 *            3 = immediate
 *
 * Immediate operands can have different sizes.  The size code is one of the
 * LC3B_IMM_* constants (not defined in this file) shifted left by 3.
 *  - 3 bits = size (bits 3-5, selected by OPI_MASK):
 *            0 = no immediate
 *            1 = 4-bit immediate
 *            2 = 5-bit immediate
 *            3 = 6-bit index, word (16 bit)-multiple
 *            4 = 6-bit index, byte-multiple
 *            5 = 8-bit immediate, word-multiple
 *            6 = 9-bit signed immediate, word-multiple
 *            7 = 9-bit signed offset from next PC ($+2), word-multiple
 */
#define OPT_Imm 0x0
#define OPT_Reg 0x1
#define OPT_MASK 0x1
#define OPA_None (0<<1)
#define OPA_DR (1<<1)
#define OPA_SR (2<<1)
#define OPA_Imm (3<<1)
#define OPA_MASK (3<<1)
#define OPI_None (LC3B_IMM_NONE<<3)
#define OPI_4 (LC3B_IMM_4<<3)
#define OPI_5 (LC3B_IMM_5<<3)
#define OPI_6W (LC3B_IMM_6_WORD<<3)
#define OPI_6B (LC3B_IMM_6_BYTE<<3)
#define OPI_8 (LC3B_IMM_8<<3)
#define OPI_9 (LC3B_IMM_9<<3)
#define OPI_9PC (LC3B_IMM_9_PC<<3)
#define OPI_MASK (7<<3)
/* One encodable form of an instruction: the base opcode, which modifier bytes
 * get added to it, and what each operand must be and where it is placed.
 * Field order matters: the instruction group tables in this file fill the
 * structure with positional initializers.
 */
typedef struct lc3b_insn_info {
/* Opcode modifiers (MOD_* flags) for variations of the instruction.  Each
 * flag that is set consumes one byte of the instruction's modifier data
 * (lc3b_id_insn.mod_data), low byte first: MOD_OpHAdd, then MOD_OpLAdd.
 */
unsigned int modifiers;
/* The basic 2 byte opcode */
unsigned int opcode;
/* The number of operands this form of the instruction takes */
unsigned char num_operands;
/* The types of each operand (OPT_* | OPA_* | OPI_* bits), see above.
 * Entries beyond num_operands are unused and set to 0 in the tables.
 */
unsigned int operands[3];
} lc3b_insn_info;
/* Contents of an instruction bytecode between parsing and finalization: the
 * generic parsed instruction plus the candidate forms selected from the
 * mnemonic.  lc3b_id_insn_finalize() picks one form and transforms the
 * bytecode.
 */
typedef struct lc3b_id_insn {
yasm_insn insn; /* base structure */
/* instruction parse group - NULL if empty instruction (just prefixes) */
/* NOTE(review): the code visible in this file always stores a real table
 * here (empty_insn for the empty case), never NULL - confirm the comment
 * above against other users.
 */
/*@null@*/ const lc3b_insn_info *group;
/* Modifier data: one byte per MOD_* flag, consumed low byte first */
unsigned long mod_data;
/* Number of elements in the instruction parse group */
unsigned int num_info:8;
} lc3b_id_insn;
/* Bytecode callbacks specific to lc3b_id_insn contents; defined later in this
 * file and forward-declared here so the callback table can reference them.
 */
static void lc3b_id_insn_destroy(void *contents);
static void lc3b_id_insn_print(const void *contents, FILE *f, int indent_level);
static void lc3b_id_insn_finalize(yasm_bytecode *bc, yasm_bytecode *prev_bc);
/* Callback table attached to every bytecode created from a parsed LC-3b
 * instruction.  Only destroy/print/finalize are implemented here; the other
 * entries are libyasm's generic "common" handlers.  The initializer is
 * positional, so the entry order must follow the yasm_bytecode_callback
 * declaration (not visible in this file).
 */
static const yasm_bytecode_callback lc3b_id_insn_callback = {
lc3b_id_insn_destroy,
lc3b_id_insn_print,
lc3b_id_insn_finalize,
yasm_bc_calc_len_common,
yasm_bc_expand_common,
yasm_bc_tobytes_common,
YASM_BC_SPECIAL_INSN
};
/*
* Instruction groupings
*/
static const lc3b_insn_info empty_insn[] = {
{ 0, 0, 0, {0, 0, 0} }
};
static const lc3b_insn_info addand_insn[] = {
{ MOD_OpHAdd, 0x1000, 3,
{OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Reg|OPA_Imm|OPI_5} },
{ MOD_OpHAdd, 0x1020, 3,
{OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_5} }
};
static const lc3b_insn_info br_insn[] = {
{ MOD_OpHAdd, 0x0000, 1, {OPT_Imm|OPA_Imm|OPI_9PC, 0, 0} }
};
static const lc3b_insn_info jmp_insn[] = {
{ 0, 0xC000, 2, {OPT_Reg|OPA_DR, OPT_Imm|OPA_Imm|OPI_9, 0} }
};
static const lc3b_insn_info lea_insn[] = {
{ 0, 0xE000, 2, {OPT_Reg|OPA_DR, OPT_Imm|OPA_Imm|OPI_9PC, 0} }
};
static const lc3b_insn_info ldst_insn[] = {
{ MOD_OpHAdd, 0x0000, 3,
{OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_6W} }
};
static const lc3b_insn_info ldstb_insn[] = {
{ MOD_OpHAdd, 0x0000, 3,
{OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_6B} }
};
static const lc3b_insn_info not_insn[] = {
{ 0, 0x903F, 2, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, 0} }
};
static const lc3b_insn_info nooperand_insn[] = {
{ MOD_OpHAdd, 0x0000, 0, {0, 0, 0} }
};
static const lc3b_insn_info shift_insn[] = {
{ MOD_OpLAdd, 0xD000, 3,
{OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_4} }
};
static const lc3b_insn_info trap_insn[] = {
{ 0, 0xF000, 1, {OPT_Imm|OPA_Imm|OPI_8, 0, 0} }
};
static void
lc3b_id_insn_finalize(yasm_bytecode *bc, yasm_bytecode *prev_bc)
{
lc3b_id_insn *id_insn = (lc3b_id_insn *)bc->contents;
lc3b_insn *insn;
int num_info = id_insn->num_info;
const lc3b_insn_info *info = id_insn->group;
unsigned long mod_data = id_insn->mod_data;
int found = 0;
yasm_insn_operand *op;
int i;
yasm_insn_finalize(&id_insn->insn);
/* Just do a simple linear search through the info array for a match.
* First match wins.
*/
for (; num_info>0 && !found; num_info--, info++) {
int mismatch = 0;
/* Match # of operands */
if (id_insn->insn.num_operands != info->num_operands)
continue;
if (id_insn->insn.num_operands == 0) {
found = 1; /* no operands -> must have a match here. */
break;
}
/* Match each operand type and size */
for(i = 0, op = yasm_insn_ops_first(&id_insn->insn);
op && i<info->num_operands && !mismatch;
op = yasm_insn_op_next(op), i++) {
/* Check operand type */
switch ((int)(info->operands[i] & OPT_MASK)) {
case OPT_Imm:
if (op->type != YASM_INSN__OPERAND_IMM)
mismatch = 1;
break;
case OPT_Reg:
if (op->type != YASM_INSN__OPERAND_REG)
mismatch = 1;
break;
default:
yasm_internal_error(N_("invalid operand type"));
}
if (mismatch)
break;
}
if (!mismatch) {
found = 1;
break;
}
}
if (!found) {
/* Didn't find a matching one */
yasm_error_set(YASM_ERROR_TYPE,
N_("invalid combination of opcode and operands"));
return;
}
/* Copy what we can from info */
insn = yasm_xmalloc(sizeof(lc3b_insn));
yasm_value_initialize(&insn->imm, NULL, 0);
insn->imm_type = LC3B_IMM_NONE;
insn->opcode = info->opcode;
/* Apply modifiers */
if (info->modifiers & MOD_OpHAdd) {
insn->opcode += ((unsigned int)(mod_data & 0xFF))<<8;
mod_data >>= 8;
}
if (info->modifiers & MOD_OpLAdd) {
insn->opcode += (unsigned int)(mod_data & 0xFF);
/*mod_data >>= 8;*/
}
/* Go through operands and assign */
if (id_insn->insn.num_operands > 0) {
for(i = 0, op = yasm_insn_ops_first(&id_insn->insn);
op && i<info->num_operands; op = yasm_insn_op_next(op), i++) {
switch ((int)(info->operands[i] & OPA_MASK)) {
case OPA_None:
/* Throw away the operand contents */
if (op->type == YASM_INSN__OPERAND_IMM)
yasm_expr_destroy(op->data.val);
break;
case OPA_DR:
if (op->type != YASM_INSN__OPERAND_REG)
yasm_internal_error(N_("invalid operand conversion"));
insn->opcode |= ((unsigned int)(op->data.reg & 0x7)) << 9;
break;
case OPA_SR:
if (op->type != YASM_INSN__OPERAND_REG)
yasm_internal_error(N_("invalid operand conversion"));
insn->opcode |= ((unsigned int)(op->data.reg & 0x7)) << 6;
break;
case OPA_Imm:
insn->imm_type = (info->operands[i] & OPI_MASK)>>3;
switch (op->type) {
case YASM_INSN__OPERAND_IMM:
if (insn->imm_type == LC3B_IMM_6_WORD
|| insn->imm_type == LC3B_IMM_8
|| insn->imm_type == LC3B_IMM_9
|| insn->imm_type == LC3B_IMM_9_PC)
op->data.val = yasm_expr_create(YASM_EXPR_SHR,
yasm_expr_expr(op->data.val),
yasm_expr_int(yasm_intnum_create_uint(1)),
op->data.val->line);
if (yasm_value_finalize_expr(&insn->imm,
op->data.val,
prev_bc, 0))
yasm_error_set(YASM_ERROR_TOO_COMPLEX,
N_("immediate expression too complex"));
break;
case YASM_INSN__OPERAND_REG:
if (yasm_value_finalize_expr(&insn->imm,
yasm_expr_create_ident(yasm_expr_int(
yasm_intnum_create_uint(op->data.reg & 0x7)),
bc->line), prev_bc, 0))
yasm_internal_error(N_("reg expr too complex?"));
break;
default:
yasm_internal_error(N_("invalid operand conversion"));
}
break;
default:
yasm_internal_error(N_("unknown operand action"));
}
/* Clear so it doesn't get destroyed */
op->type = YASM_INSN__OPERAND_REG;
}
if (insn->imm_type == LC3B_IMM_9_PC) {
if (insn->imm.seg_of || insn->imm.rshift > 1
|| insn->imm.curpos_rel)
yasm_error_set(YASM_ERROR_VALUE, N_("invalid jump target"));
insn->imm.curpos_rel = 1;
}
}
/* Transform the bytecode */
yasm_lc3b__bc_transform_insn(bc, insn);
}
/* re2c scanner interface.  The generated scanners in this file walk the
 * identifier through a local pointer named `id`, which serves as both the
 * cursor and the limit; YYFILL does nothing (it only evaluates its argument),
 * so no input refilling ever takes place.
 * NOTE(review): YYMARKER names a `marker` variable whose declarations are
 * commented out in both scanner functions - presumably the generated code
 * never needs backtracking; confirm before adding rules.
 */
#define YYCTYPE unsigned char
#define YYCURSOR id
#define YYLIMIT id
#define YYMARKER marker
#define YYFILL(n) (void)(n)
/* Check whether an identifier names an LC-3b register.
 *
 * arch   - unused here
 * oid    - identifier text to classify (scanned as unsigned chars; the
 *          catch-all rules suggest it is expected to be NUL-terminated -
 *          TODO confirm against callers)
 * id_len - unused here
 * data   - on a register match, receives the register number, computed from
 *          the digit in oid[1]
 *
 * Returns YASM_ARCH_REG for 'r' followed by a digit 0-7 (re2c single-quoted
 * literals match case-insensitively), YASM_ARCH_NOTREGTMOD for anything else
 * including the empty string.  *data is only written on a match.
 */
yasm_arch_regtmod
yasm_lc3b__parse_check_regtmod(yasm_arch *arch, const char *oid, size_t id_len,
uintptr_t *data)
{
const YYCTYPE *id = (const YYCTYPE *)oid;
/*const char *marker;*/
/*!re2c
/* integer registers */
'r' [0-7] {
*data = (oid[1]-'0');
return YASM_ARCH_REG;
}
/* catchalls */
[\001-\377]+ {
return YASM_ARCH_NOTREGTMOD;
}
[\000] {
return YASM_ARCH_NOTREGTMOD;
}
*/
}
/* Scanner action helper: select instruction group <g>_insn with modifier data
 * m, record the group's element count, and jump to the `done` label.  Only
 * usable inside a function that declares the locals `group`, `mod` and
 * `nelems` and provides a `done:` label.
 */
#define RET_INSN(g, m) \
do { \
group = g##_insn; \
mod = m; \
nelems = NELEMS(g##_insn); \
goto done; \
} while(0)
/* Check whether an identifier is an LC-3b instruction mnemonic and, if so,
 * create the bytecode that will hold the parsed instruction.
 *
 * arch   - unused here
 * oid    - identifier text to classify
 * id_len - unused here
 * line   - line number passed on to the created bytecode
 * bc     - set to NULL on entry; on a match receives a new bytecode whose
 *          contents is an lc3b_id_insn carrying the mnemonic's group, its
 *          modifier data and the number of forms in the group
 * prefix - always set to 0 (no prefixes are recognized here)
 *
 * Returns YASM_ARCH_INSN when a mnemonic rule matches, otherwise
 * YASM_ARCH_NOTINSNPREFIX (and *bc stays NULL).  The modifier value given to
 * RET_INSN is what lc3b_id_insn_finalize() later adds to the upper or lower
 * opcode byte, depending on the form's MOD_* flags.
 */
yasm_arch_insnprefix
yasm_lc3b__parse_check_insnprefix(yasm_arch *arch, const char *oid,
size_t id_len, unsigned long line,
yasm_bytecode **bc, uintptr_t *prefix)
{
const YYCTYPE *id = (const YYCTYPE *)oid;
const lc3b_insn_info *group = empty_insn;
unsigned long mod = 0;
unsigned int nelems = NELEMS(empty_insn);
lc3b_id_insn *id_insn;
*bc = (yasm_bytecode *)NULL;
*prefix = 0;
/*const char *marker;*/
/*!re2c
/* instructions */
'add' { RET_INSN(addand, 0x00); }
'and' { RET_INSN(addand, 0x40); }
'br' { RET_INSN(br, 0x00); }
'brn' { RET_INSN(br, 0x08); }
'brz' { RET_INSN(br, 0x04); }
'brp' { RET_INSN(br, 0x02); }
'brnz' { RET_INSN(br, 0x0C); }
'brnp' { RET_INSN(br, 0x0A); }
'brzp' { RET_INSN(br, 0x06); }
'brnzp' { RET_INSN(br, 0x0E); }
'jsr' { RET_INSN(br, 0x40); }
'jmp' { RET_INSN(jmp, 0); }
'lea' { RET_INSN(lea, 0); }
'ld' { RET_INSN(ldst, 0x20); }
'ldi' { RET_INSN(ldst, 0xA0); }
'st' { RET_INSN(ldst, 0x30); }
'sti' { RET_INSN(ldst, 0xB0); }
'ldb' { RET_INSN(ldstb, 0x60); }
'stb' { RET_INSN(ldstb, 0x70); }
'not' { RET_INSN(not, 0); }
'ret' { RET_INSN(nooperand, 0xCE); }
'rti' { RET_INSN(nooperand, 0x80); }
'nop' { RET_INSN(nooperand, 0); }
'lshf' { RET_INSN(shift, 0x00); }
'rshfl' { RET_INSN(shift, 0x10); }
'rshfa' { RET_INSN(shift, 0x30); }
'trap' { RET_INSN(trap, 0); }
/* catchalls */
[\001-\377]+ {
return YASM_ARCH_NOTINSNPREFIX;
}
[\000] {
return YASM_ARCH_NOTINSNPREFIX;
}
*/
/* Reached only through RET_INSN: wrap the selected group in a bytecode. */
done:
id_insn = yasm_xmalloc(sizeof(lc3b_id_insn));
yasm_insn_initialize(&id_insn->insn);
id_insn->group = group;
id_insn->mod_data = mod;
id_insn->num_info = nelems;
*bc = yasm_bc_create_common(&lc3b_id_insn_callback, id_insn, line);
return YASM_ARCH_INSN;
}
/*
 * Destroy callback: tears down the generic instruction embedded in an
 * lc3b_id_insn and then frees the structure itself.
 */
static void
lc3b_id_insn_destroy(void *contents)
{
    yasm_insn_delete(&((lc3b_id_insn *)contents)->insn,
                     yasm_lc3b__ea_destroy);
    yasm_xfree(contents);
}
/*
 * Print callback: writes the generic instruction part of an lc3b_id_insn to
 * f at the given indentation level.
 */
static void
lc3b_id_insn_print(const void *contents, FILE *f, int indent_level)
{
    yasm_insn_print(&((const lc3b_id_insn *)contents)->insn, f,
                    indent_level);
    /* TODO: the group, modifier data and form count are not printed */
}
/*
 * Create a bytecode for an instruction with no mnemonic: an lc3b_id_insn
 * that refers to the empty_insn group and carries no modifier data.
 *
 * arch - unused here
 * line - line number passed on to the created bytecode
 *
 * Returns the new bytecode, which uses lc3b_id_insn_callback.
 */
/*@only@*/ yasm_bytecode *
yasm_lc3b__create_empty_insn(yasm_arch *arch, unsigned long line)
{
    lc3b_id_insn *blank = yasm_xmalloc(sizeof(*blank));

    yasm_insn_initialize(&blank->insn);
    blank->num_info = NELEMS(empty_insn);
    blank->mod_data = 0;
    blank->group = empty_insn;

    return yasm_bc_create_common(&lc3b_id_insn_callback, blank, line);
}