diff options
Diffstat (limited to 'lib/inst.c')
-rw-r--r-- | lib/inst.c | 455 |
1 files changed, 455 insertions, 0 deletions
diff --git a/lib/inst.c b/lib/inst.c new file mode 100644 index 0000000..5be2438 --- /dev/null +++ b/lib/inst.c @@ -0,0 +1,455 @@ +/* Copyright (C) 2023 Aryadev Chavali + + * You may distribute and modify this code under the terms of the + * GPLv2 license. You should have received a copy of the GPLv2 + * license with this file. If not, please write to: + * aryadev@aryadevchavali.com. + + * Created: 2023-10-15 + * Author: Aryadev Chavali + * Description: Implementation of bytecode for instructions + */ + +#include <assert.h> +#include <stdbool.h> +#include <stdio.h> +#include <string.h> + +#include "./inst.h" + +const char *opcode_as_cstr(opcode_t code) +{ + switch (code) + { + case OP_NOOP: + return "NOOP"; + break; + case OP_PUSH_BYTE: + return "PUSH_BYTE"; + break; + case OP_PUSH_WORD: + return "PUSH_WORD"; + break; + case OP_PUSH_HWORD: + return "PUSH_HWORD"; + break; + case OP_PUSH_REGISTER_BYTE: + return "PUSH_REGISTER_BYTE"; + break; + case OP_PUSH_REGISTER_WORD: + return "PUSH_REGISTER_WORD"; + break; + case OP_PUSH_REGISTER_HWORD: + return "PUSH_REGISTER_HWORD"; + break; + case OP_POP_BYTE: + return "POP_BYTE"; + break; + case OP_POP_WORD: + return "POP_WORD"; + break; + case OP_POP_HWORD: + return "POP_HWORD"; + break; + case OP_MOV_BYTE: + return "MOV_BYTE"; + break; + case OP_MOV_WORD: + return "MOV_WORD"; + break; + case OP_MOV_HWORD: + return "MOV_HWORD"; + break; + case OP_DUP_BYTE: + return "DUP_BYTE"; + break; + case OP_DUP_HWORD: + return "DUP_HWORD"; + break; + case OP_DUP_WORD: + return "DUP_WORD"; + break; + case OP_NOT_BYTE: + return "NOT_BYTE"; + break; + case OP_NOT_HWORD: + return "NOT_HWORD"; + break; + case OP_NOT_WORD: + return "NOT_WORD"; + break; + case OP_OR_BYTE: + return "OR_BYTE"; + break; + case OP_OR_HWORD: + return "OR_HWORD"; + break; + case OP_OR_WORD: + return "OR_WORD"; + break; + case OP_AND_BYTE: + return "AND_BYTE"; + break; + case OP_AND_HWORD: + return "AND_HWORD"; + break; + case OP_AND_WORD: + return "AND_WORD"; + break; + case OP_XOR_BYTE: + return "XOR_BYTE"; + break; + case OP_XOR_HWORD: + return "XOR_HWORD"; + break; + case OP_XOR_WORD: + return "XOR_WORD"; + break; + case OP_EQ_BYTE: + return "EQ_BYTE"; + break; + case OP_EQ_CHAR: + return "EQ_CHAR"; + break; + case OP_EQ_INT: + return "EQ_INT"; + break; + case OP_EQ_HWORD: + return "EQ_HWORD"; + break; + case OP_EQ_LONG: + return "EQ_LONG"; + break; + case OP_EQ_WORD: + return "EQ_WORD"; + break; + case OP_LT_BYTE: + return "LT_BYTE"; + break; + case OP_LT_CHAR: + return "LT_CHAR"; + break; + case OP_LT_HWORD: + return "LT_HWORD"; + break; + case OP_LT_INT: + return "LT_INT"; + break; + case OP_LT_LONG: + return "LT_LONG"; + break; + case OP_LT_WORD: + return "LT_WORD"; + break; + case OP_LTE_BYTE: + return "LTE_BYTE"; + break; + case OP_LTE_CHAR: + return "LTE_CHAR"; + break; + case OP_LTE_HWORD: + return "LTE_HWORD"; + break; + case OP_LTE_INT: + return "LTE_INT"; + break; + case OP_LTE_LONG: + return "LTE_LONG"; + break; + case OP_LTE_WORD: + return "LTE_WORD"; + break; + case OP_GT_BYTE: + return "GT_BYTE"; + break; + case OP_GT_CHAR: + return "GT_CHAR"; + break; + case OP_GT_HWORD: + return "GT_HWORD"; + break; + case OP_GT_INT: + return "GT_INT"; + break; + case OP_GT_LONG: + return "GT_LONG"; + break; + case OP_GT_WORD: + return "GT_WORD"; + break; + case OP_GTE_BYTE: + return "GTE_BYTE"; + break; + case OP_GTE_CHAR: + return "GTE_CHAR"; + break; + case OP_GTE_HWORD: + return "GTE_HWORD"; + break; + case OP_GTE_INT: + return "GTE_INT"; + break; + case OP_GTE_LONG: + return "GTE_LONG"; + break; + case OP_GTE_WORD: + return "GTE_WORD"; + break; + case OP_PLUS_BYTE: + return "PLUS_BYTE"; + break; + case OP_PLUS_HWORD: + return "PLUS_HWORD"; + break; + case OP_PLUS_WORD: + return "PLUS_WORD"; + break; + case OP_JUMP_ABS: + return "JUMP_ABS"; + break; + case OP_JUMP_STACK: + return "JUMP_STACK"; + break; + case OP_JUMP_REGISTER: + return "JUMP_REGISTER"; + break; + case OP_JUMP_IF_BYTE: + return "JUMP_IF_BYTE"; + break; + case OP_JUMP_IF_HWORD: + return "JUMP_IF_HWORD"; + break; + case OP_JUMP_IF_WORD: + return "JUMP_IF_WORD"; + break; + case OP_PRINT_CHAR: + return "PRINT_CHAR"; + break; + case OP_PRINT_BYTE: + return "PRINT_BYTE"; + break; + case OP_PRINT_INT: + return "PRINT_INT"; + break; + case OP_PRINT_HWORD: + return "PRINT_HWORD"; + break; + case OP_PRINT_LONG: + return "PRINT_LONG"; + break; + case OP_PRINT_WORD: + return "PRINT_WORD"; + break; + case OP_HALT: + return "HALT"; + break; + case NUMBER_OF_OPCODES: + return ""; + break; + } + return ""; +} + +void data_print(data_t datum, data_type_t type, FILE *fp) +{ + switch (type) + { + case DATA_TYPE_NIL: + break; + case DATA_TYPE_BYTE: + fprintf(fp, "%X", datum.as_byte); + break; + case DATA_TYPE_HWORD: + fprintf(fp, "%X", datum.as_hword); + break; + case DATA_TYPE_WORD: + fprintf(fp, "%lX", datum.as_word); + break; + } +} + +void inst_print(inst_t instruction, FILE *fp) +{ + static_assert(NUMBER_OF_OPCODES == 73, "inst_bytecode_size: Out of date"); + fprintf(fp, "%s(", opcode_as_cstr(instruction.opcode)); + if (OPCODE_IS_TYPE(instruction.opcode, OP_PUSH)) + { + data_type_t type = (data_type_t)instruction.opcode; + fprintf(fp, "datum=0x"); + data_print(instruction.operand, type, fp); + } + else if (OPCODE_IS_TYPE(instruction.opcode, OP_PUSH_REGISTER) || + OPCODE_IS_TYPE(instruction.opcode, OP_MOV) || + instruction.opcode == OP_JUMP_REGISTER) + { + fprintf(fp, "reg=0x"); + data_print(instruction.operand, DATA_TYPE_BYTE, fp); + } + else if (OPCODE_IS_TYPE(instruction.opcode, OP_DUP)) + { + fprintf(fp, "n=%lu", instruction.operand.as_word); + } + else if (instruction.opcode == OP_JUMP_ABS || + OPCODE_IS_TYPE(instruction.opcode, OP_JUMP_IF)) + { + fprintf(fp, "address=0x"); + data_print(instruction.operand, DATA_TYPE_WORD, fp); + } + fprintf(fp, ")"); +} + +size_t inst_bytecode_size(inst_t inst) +{ + static_assert(NUMBER_OF_OPCODES == 73, "inst_bytecode_size: Out of date"); + size_t size = 1; // for opcode + if (OPCODE_IS_TYPE(inst.opcode, OP_PUSH)) + { + if (inst.opcode == OP_PUSH_BYTE) + ++size; + else if (inst.opcode == OP_PUSH_HWORD) + size += HWORD_SIZE; + else if (inst.opcode == OP_PUSH_WORD) + size += WORD_SIZE; + } + else if (OPCODE_IS_TYPE(inst.opcode, OP_PUSH_REGISTER) || + OPCODE_IS_TYPE(inst.opcode, OP_MOV) || + inst.opcode == OP_JUMP_REGISTER) + // Only need a byte for the register + ++size; + else if (OPCODE_IS_TYPE(inst.opcode, OP_DUP) || inst.opcode == OP_JUMP_ABS || + OPCODE_IS_TYPE(inst.opcode, OP_JUMP_IF)) + size += WORD_SIZE; + return size; +} + +void inst_write_bytecode(inst_t inst, darr_t *darr) +{ + static_assert(NUMBER_OF_OPCODES == 73, "inst_write_bytecode: Out of date"); + // Append opcode + darr_append_byte(darr, inst.opcode); + // Then append 0 or more operands + data_type_t to_append = DATA_TYPE_NIL; + if (OPCODE_IS_TYPE(inst.opcode, OP_PUSH)) + to_append = (data_type_t)inst.opcode; + else if (OPCODE_IS_TYPE(inst.opcode, OP_PUSH_REGISTER) || + OPCODE_IS_TYPE(inst.opcode, OP_MOV) || + inst.opcode == OP_JUMP_REGISTER) + to_append = DATA_TYPE_BYTE; + else if (OPCODE_IS_TYPE(inst.opcode, OP_DUP) || inst.opcode == OP_JUMP_ABS || + OPCODE_IS_TYPE(inst.opcode, OP_JUMP_IF)) + to_append = DATA_TYPE_WORD; + + switch (to_append) + { + case DATA_TYPE_NIL: + break; + case DATA_TYPE_BYTE: + darr_append_byte(darr, inst.operand.as_byte); + break; + case DATA_TYPE_HWORD: + darr_append_bytes(darr, (byte *)&inst.operand.as_hword, HWORD_SIZE); + break; + case DATA_TYPE_WORD: + darr_append_bytes(darr, (byte *)&inst.operand.as_word, WORD_SIZE); + break; + } +} + +void insts_write_bytecode(inst_t *insts, size_t size, darr_t *darr) +{ + for (size_t i = 0; i < size; ++i) + inst_write_bytecode(insts[i], darr); +} + +data_t read_type_from_darr(darr_t *darr, data_type_t type) +{ + switch (type) + { + case DATA_TYPE_NIL: + break; + case DATA_TYPE_BYTE: + if (darr->used > darr->available) + // TODO: Error (darr has no space left) + return DBYTE(0); + return DBYTE(darr->data[darr->used++]); + break; + case DATA_TYPE_HWORD: + if (darr->used + HWORD_SIZE > darr->available) + // TODO: Error (darr has no space left) + return DWORD(0); + hword u = 0; + memcpy(&u, darr->data + darr->used, HWORD_SIZE); + darr->used += HWORD_SIZE; + return DHWORD(u); + break; + case DATA_TYPE_WORD: + if (darr->used + WORD_SIZE > darr->available) + // TODO: Error (darr has no space left) + return DWORD(0); + word w = 0; + memcpy(&w, darr->data + darr->used, WORD_SIZE); + darr->used += WORD_SIZE; + return DWORD(w); + break; + } + // TODO: Error (unrecognised type) + return DBYTE(0); +} + +inst_t inst_read_bytecode(darr_t *darr) +{ + static_assert(NUMBER_OF_OPCODES == 73, "inst_read_bytecode: Out of date"); + if (darr->used >= darr->available) + return (inst_t){0}; + inst_t inst = {0}; + opcode_t opcode = darr->data[darr->used++]; + if (opcode > OP_HALT || opcode == NUMBER_OF_OPCODES || opcode < OP_NOOP) + return INST_NOOP; + // Read operands + if (OPCODE_IS_TYPE(opcode, OP_PUSH)) + inst.operand = read_type_from_darr(darr, (data_type_t)opcode); + // Read register (as a byte) + else if (OPCODE_IS_TYPE(opcode, OP_PUSH_REGISTER) || + OPCODE_IS_TYPE(opcode, OP_MOV) || opcode == OP_JUMP_REGISTER) + inst.operand = read_type_from_darr(darr, DATA_TYPE_BYTE); + else if (OPCODE_IS_TYPE(opcode, OP_DUP) || opcode == OP_JUMP_ABS || + OPCODE_IS_TYPE(opcode, OP_JUMP_IF)) + inst.operand = read_type_from_darr(darr, DATA_TYPE_WORD); + // Otherwise opcode doesn't take operands + + inst.opcode = opcode; + + return inst; +} + +inst_t *insts_read_bytecode(darr_t *bytes, size_t *ret_size) +{ + *ret_size = 0; + // NOTE: Here we use the darr as a dynamic array of inst_t. + darr_t instructions = {0}; + darr_init(&instructions, sizeof(inst_t)); + while (bytes->used < bytes->available) + { + inst_t instruction = inst_read_bytecode(bytes); + darr_append_bytes(&instructions, (byte *)&instruction, sizeof(instruction)); + } + *ret_size = instructions.used / sizeof(inst_t); + return (inst_t *)instructions.data; +} + +void insts_write_bytecode_file(inst_t *instructions, size_t size, FILE *fp) +{ + darr_t darr = {0}; + darr_init(&darr, 0); + insts_write_bytecode(instructions, size, &darr); + darr_write_file(&darr, fp); + free(darr.data); +} + +inst_t *insts_read_bytecode_file(FILE *fp, size_t *ret) +{ + darr_t darr = darr_read_file(fp); + inst_t *instructions = insts_read_bytecode(&darr, ret); + free(darr.data); + return instructions; +} |