/* * LC-3b identifier recognition and instruction handling * * Copyright (C) 2003-2007 Peter Johnson * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND OTHER CONTRIBUTORS ``AS IS'' * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR OTHER CONTRIBUTORS BE * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. */ #include #include #include "modules/arch/lc3b/lc3barch.h" /* Opcode modifiers. The opcode bytes are in "reverse" order because the * parameters are read from the arch-specific data in LSB->MSB order. * (only for asthetic reasons in the lexer code below, no practical reason). */ #define MOD_OpHAdd (1UL<<0) /* Parameter adds to upper 8 bits of insn */ #define MOD_OpLAdd (1UL<<1) /* Parameter adds to lower 8 bits of insn */ /* Operand types. These are more detailed than the "general" types for all * architectures, as they include the size, for instance. * Bit Breakdown (from LSB to MSB): * - 1 bit = general type (must be exact match, except for =3): * 0 = immediate * 1 = register * * MSBs than the above are actions: what to do with the operand if the * instruction matches. Essentially describes what part of the output bytecode * gets the operand. This may require conversion (e.g. a register going into * an ea field). Naturally, only one of each of these may be contained in the * operands of a single insn_info structure. * - 2 bits = action: * 0 = does nothing (operand data is discarded) * 1 = DR field * 2 = SR field * 3 = immediate * * Immediate operands can have different sizes. * - 3 bits = size: * 0 = no immediate * 1 = 4-bit immediate * 2 = 5-bit immediate * 3 = 6-bit index, word (16 bit)-multiple * 4 = 6-bit index, byte-multiple * 5 = 8-bit immediate, word-multiple * 6 = 9-bit signed immediate, word-multiple * 7 = 9-bit signed offset from next PC ($+2), word-multiple */ #define OPT_Imm 0x0 #define OPT_Reg 0x1 #define OPT_MASK 0x1 #define OPA_None (0<<1) #define OPA_DR (1<<1) #define OPA_SR (2<<1) #define OPA_Imm (3<<1) #define OPA_MASK (3<<1) #define OPI_None (LC3B_IMM_NONE<<3) #define OPI_4 (LC3B_IMM_4<<3) #define OPI_5 (LC3B_IMM_5<<3) #define OPI_6W (LC3B_IMM_6_WORD<<3) #define OPI_6B (LC3B_IMM_6_BYTE<<3) #define OPI_8 (LC3B_IMM_8<<3) #define OPI_9 (LC3B_IMM_9<<3) #define OPI_9PC (LC3B_IMM_9_PC<<3) #define OPI_MASK (7<<3) typedef struct lc3b_insn_info { /* Opcode modifiers for variations of instruction. As each modifier reads * its parameter in LSB->MSB order from the arch-specific data[1] from the * lexer data, and the LSB of the arch-specific data[1] is reserved for the * count of insn_info structures in the instruction grouping, there can * only be a maximum of 3 modifiers. */ unsigned int modifiers; /* The basic 2 byte opcode */ unsigned int opcode; /* The number of operands this form of the instruction takes */ unsigned char num_operands; /* The types of each operand, see above */ unsigned int operands[3]; } lc3b_insn_info; typedef struct lc3b_id_insn { yasm_insn insn; /* base structure */ /* instruction parse group - NULL if empty instruction (just prefixes) */ /*@null@*/ const lc3b_insn_info *group; /* Modifier data */ unsigned long mod_data; /* Number of elements in the instruction parse group */ unsigned int num_info:8; } lc3b_id_insn; static void lc3b_id_insn_destroy(void *contents); static void lc3b_id_insn_print(const void *contents, FILE *f, int indent_level); static void lc3b_id_insn_finalize(yasm_bytecode *bc, yasm_bytecode *prev_bc); static const yasm_bytecode_callback lc3b_id_insn_callback = { lc3b_id_insn_destroy, lc3b_id_insn_print, lc3b_id_insn_finalize, NULL, yasm_bc_calc_len_common, yasm_bc_expand_common, yasm_bc_tobytes_common, YASM_BC_SPECIAL_INSN }; /* * Instruction groupings */ static const lc3b_insn_info empty_insn[] = { { 0, 0, 0, {0, 0, 0} } }; static const lc3b_insn_info addand_insn[] = { { MOD_OpHAdd, 0x1000, 3, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Reg|OPA_Imm|OPI_5} }, { MOD_OpHAdd, 0x1020, 3, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_5} } }; static const lc3b_insn_info br_insn[] = { { MOD_OpHAdd, 0x0000, 1, {OPT_Imm|OPA_Imm|OPI_9PC, 0, 0} } }; static const lc3b_insn_info jmp_insn[] = { { 0, 0xC000, 2, {OPT_Reg|OPA_DR, OPT_Imm|OPA_Imm|OPI_9, 0} } }; static const lc3b_insn_info lea_insn[] = { { 0, 0xE000, 2, {OPT_Reg|OPA_DR, OPT_Imm|OPA_Imm|OPI_9PC, 0} } }; static const lc3b_insn_info ldst_insn[] = { { MOD_OpHAdd, 0x0000, 3, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_6W} } }; static const lc3b_insn_info ldstb_insn[] = { { MOD_OpHAdd, 0x0000, 3, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_6B} } }; static const lc3b_insn_info not_insn[] = { { 0, 0x903F, 2, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, 0} } }; static const lc3b_insn_info nooperand_insn[] = { { MOD_OpHAdd, 0x0000, 0, {0, 0, 0} } }; static const lc3b_insn_info shift_insn[] = { { MOD_OpLAdd, 0xD000, 3, {OPT_Reg|OPA_DR, OPT_Reg|OPA_SR, OPT_Imm|OPA_Imm|OPI_4} } }; static const lc3b_insn_info trap_insn[] = { { 0, 0xF000, 1, {OPT_Imm|OPA_Imm|OPI_8, 0, 0} } }; static void lc3b_id_insn_finalize(yasm_bytecode *bc, yasm_bytecode *prev_bc) { lc3b_id_insn *id_insn = (lc3b_id_insn *)bc->contents; lc3b_insn *insn; int num_info = id_insn->num_info; const lc3b_insn_info *info = id_insn->group; unsigned long mod_data = id_insn->mod_data; int found = 0; yasm_insn_operand *op; int i; yasm_insn_finalize(&id_insn->insn); /* Just do a simple linear search through the info array for a match. * First match wins. */ for (; num_info>0 && !found; num_info--, info++) { int mismatch = 0; /* Match # of operands */ if (id_insn->insn.num_operands != info->num_operands) continue; if (id_insn->insn.num_operands == 0) { found = 1; /* no operands -> must have a match here. */ break; } /* Match each operand type and size */ for(i = 0, op = yasm_insn_ops_first(&id_insn->insn); op && inum_operands && !mismatch; op = yasm_insn_op_next(op), i++) { /* Check operand type */ switch ((int)(info->operands[i] & OPT_MASK)) { case OPT_Imm: if (op->type != YASM_INSN__OPERAND_IMM) mismatch = 1; break; case OPT_Reg: if (op->type != YASM_INSN__OPERAND_REG) mismatch = 1; break; default: yasm_internal_error(N_("invalid operand type")); } if (mismatch) break; } if (!mismatch) { found = 1; break; } } if (!found) { /* Didn't find a matching one */ yasm_error_set(YASM_ERROR_TYPE, N_("invalid combination of opcode and operands")); return; } /* Copy what we can from info */ insn = yasm_xmalloc(sizeof(lc3b_insn)); yasm_value_initialize(&insn->imm, NULL, 0); insn->imm_type = LC3B_IMM_NONE; insn->opcode = info->opcode; /* Apply modifiers */ if (info->modifiers & MOD_OpHAdd) { insn->opcode += ((unsigned int)(mod_data & 0xFF))<<8; mod_data >>= 8; } if (info->modifiers & MOD_OpLAdd) { insn->opcode += (unsigned int)(mod_data & 0xFF); /*mod_data >>= 8;*/ } /* Go through operands and assign */ if (id_insn->insn.num_operands > 0) { for(i = 0, op = yasm_insn_ops_first(&id_insn->insn); op && inum_operands; op = yasm_insn_op_next(op), i++) { switch ((int)(info->operands[i] & OPA_MASK)) { case OPA_None: /* Throw away the operand contents */ if (op->type == YASM_INSN__OPERAND_IMM) yasm_expr_destroy(op->data.val); break; case OPA_DR: if (op->type != YASM_INSN__OPERAND_REG) yasm_internal_error(N_("invalid operand conversion")); insn->opcode |= ((unsigned int)(op->data.reg & 0x7)) << 9; break; case OPA_SR: if (op->type != YASM_INSN__OPERAND_REG) yasm_internal_error(N_("invalid operand conversion")); insn->opcode |= ((unsigned int)(op->data.reg & 0x7)) << 6; break; case OPA_Imm: insn->imm_type = (info->operands[i] & OPI_MASK)>>3; switch (op->type) { case YASM_INSN__OPERAND_IMM: if (insn->imm_type == LC3B_IMM_6_WORD || insn->imm_type == LC3B_IMM_8 || insn->imm_type == LC3B_IMM_9 || insn->imm_type == LC3B_IMM_9_PC) op->data.val = yasm_expr_create(YASM_EXPR_SHR, yasm_expr_expr(op->data.val), yasm_expr_int(yasm_intnum_create_uint(1)), op->data.val->line); if (yasm_value_finalize_expr(&insn->imm, op->data.val, prev_bc, 0)) yasm_error_set(YASM_ERROR_TOO_COMPLEX, N_("immediate expression too complex")); break; case YASM_INSN__OPERAND_REG: if (yasm_value_finalize_expr(&insn->imm, yasm_expr_create_ident(yasm_expr_int( yasm_intnum_create_uint(op->data.reg & 0x7)), bc->line), prev_bc, 0)) yasm_internal_error(N_("reg expr too complex?")); break; default: yasm_internal_error(N_("invalid operand conversion")); } break; default: yasm_internal_error(N_("unknown operand action")); } /* Clear so it doesn't get destroyed */ op->type = YASM_INSN__OPERAND_REG; } if (insn->imm_type == LC3B_IMM_9_PC) { if (insn->imm.seg_of || insn->imm.rshift > 1 || insn->imm.curpos_rel) yasm_error_set(YASM_ERROR_VALUE, N_("invalid jump target")); insn->imm.curpos_rel = 1; } } /* Transform the bytecode */ yasm_lc3b__bc_transform_insn(bc, insn); } #define YYCTYPE unsigned char #define YYCURSOR id #define YYLIMIT id #define YYMARKER marker #define YYFILL(n) (void)(n) yasm_arch_regtmod yasm_lc3b__parse_check_regtmod(yasm_arch *arch, const char *oid, size_t id_len, uintptr_t *data) { const YYCTYPE *id = (const YYCTYPE *)oid; /*const char *marker;*/ /*!re2c /* integer registers */ 'r' [0-7] { *data = (oid[1]-'0'); return YASM_ARCH_REG; } /* catchalls */ [\001-\377]+ { return YASM_ARCH_NOTREGTMOD; } [\000] { return YASM_ARCH_NOTREGTMOD; } */ } #define RET_INSN(g, m) \ do { \ group = g##_insn; \ mod = m; \ nelems = NELEMS(g##_insn); \ goto done; \ } while(0) yasm_arch_insnprefix yasm_lc3b__parse_check_insnprefix(yasm_arch *arch, const char *oid, size_t id_len, unsigned long line, yasm_bytecode **bc, uintptr_t *prefix) { const YYCTYPE *id = (const YYCTYPE *)oid; const lc3b_insn_info *group = empty_insn; unsigned long mod = 0; unsigned int nelems = NELEMS(empty_insn); lc3b_id_insn *id_insn; *bc = (yasm_bytecode *)NULL; *prefix = 0; /*const char *marker;*/ /*!re2c /* instructions */ 'add' { RET_INSN(addand, 0x00); } 'and' { RET_INSN(addand, 0x40); } 'br' { RET_INSN(br, 0x00); } 'brn' { RET_INSN(br, 0x08); } 'brz' { RET_INSN(br, 0x04); } 'brp' { RET_INSN(br, 0x02); } 'brnz' { RET_INSN(br, 0x0C); } 'brnp' { RET_INSN(br, 0x0A); } 'brzp' { RET_INSN(br, 0x06); } 'brnzp' { RET_INSN(br, 0x0E); } 'jsr' { RET_INSN(br, 0x40); } 'jmp' { RET_INSN(jmp, 0); } 'lea' { RET_INSN(lea, 0); } 'ld' { RET_INSN(ldst, 0x20); } 'ldi' { RET_INSN(ldst, 0xA0); } 'st' { RET_INSN(ldst, 0x30); } 'sti' { RET_INSN(ldst, 0xB0); } 'ldb' { RET_INSN(ldstb, 0x60); } 'stb' { RET_INSN(ldstb, 0x70); } 'not' { RET_INSN(not, 0); } 'ret' { RET_INSN(nooperand, 0xCE); } 'rti' { RET_INSN(nooperand, 0x80); } 'nop' { RET_INSN(nooperand, 0); } 'lshf' { RET_INSN(shift, 0x00); } 'rshfl' { RET_INSN(shift, 0x10); } 'rshfa' { RET_INSN(shift, 0x30); } 'trap' { RET_INSN(trap, 0); } /* catchalls */ [\001-\377]+ { return YASM_ARCH_NOTINSNPREFIX; } [\000] { return YASM_ARCH_NOTINSNPREFIX; } */ done: id_insn = yasm_xmalloc(sizeof(lc3b_id_insn)); yasm_insn_initialize(&id_insn->insn); id_insn->group = group; id_insn->mod_data = mod; id_insn->num_info = nelems; *bc = yasm_bc_create_common(&lc3b_id_insn_callback, id_insn, line); return YASM_ARCH_INSN; } static void lc3b_id_insn_destroy(void *contents) { lc3b_id_insn *id_insn = (lc3b_id_insn *)contents; yasm_insn_delete(&id_insn->insn, yasm_lc3b__ea_destroy); yasm_xfree(contents); } static void lc3b_id_insn_print(const void *contents, FILE *f, int indent_level) { const lc3b_id_insn *id_insn = (const lc3b_id_insn *)contents; yasm_insn_print(&id_insn->insn, f, indent_level); /*TODO*/ } /*@only@*/ yasm_bytecode * yasm_lc3b__create_empty_insn(yasm_arch *arch, unsigned long line) { lc3b_id_insn *id_insn = yasm_xmalloc(sizeof(lc3b_id_insn)); yasm_insn_initialize(&id_insn->insn); id_insn->group = empty_insn; id_insn->mod_data = 0; id_insn->num_info = NELEMS(empty_insn); return yasm_bc_create_common(&lc3b_id_insn_callback, id_insn, line); }