eaxhla/source/assembler.c
2024-07-16 19:42:26 -04:00

446 lines
15 KiB
C

#include "assembler.h"
#include <stdlib.h>
#include <string.h>
// Inclusive first and last operation codes of every instruction family.
// assemble () dispatches on these ranges and the encoders subtract the
// *_BEGIN value to obtain a zero-based index inside the family. The operation
// names themselves are not defined in this file (presumably assembler.h).
#define REGULAR_BEGIN (ADD)
#define REGULAR_END (CMP)
#define IRREGULAR_BEGIN (INC)
#define IRREGULAR_END (IDIV)
#define SPECIAL_1_BEGIN (NOP)
#define SPECIAL_1_END (HLT)
#define SPECIAL_2_BEGIN (SYSENTER)
#define SPECIAL_2_END (CPUID)
#define JUMP_IF_BEGIN (JO)
#define JUMP_IF_END (JG)
#define MOVE_IF_BEGIN (CMOVO)
#define MOVE_IF_END (CMOVG)
// Number of operation codes in every family (length of the inclusive range).
// The trailing number on each line is the original author's annotation.
// NOTE(review): the encoder comments for the regular and irregular families
// list eight mnemonics each, so the "16" on those two lines should be
// confirmed against the operation enumeration.
#define REGULAR_COUNT (REGULAR_END - REGULAR_BEGIN + 1) // 16
#define IRREGULAR_COUNT (IRREGULAR_END - IRREGULAR_BEGIN + 1) // 16
#define SPECIAL_1_COUNT (SPECIAL_1_END - SPECIAL_1_BEGIN + 1) // 6
#define SPECIAL_2_COUNT (SPECIAL_2_END - SPECIAL_2_BEGIN + 1) // 6
#define JUMP_IF_COUNT (JUMP_IF_END - JUMP_IF_BEGIN + 1) // 16
#define MOVE_IF_COUNT (MOVE_IF_END - MOVE_IF_BEGIN + 1) // 16
// Non-zero once assemble () has registered assemble_clean_up with atexit.
static int assemble_clean_up_queued = 0;
// Incremented by asmdirmem; not read anywhere in this part of the file.
static next empty_count = 0;
// Number of pending address patches stored in empty_array / empty_imbue.
static next empty_holes = 0;
// Per patch: text sector offset at which the patch has to be applied.
static next * empty_array = NULL;
// Per patch: index into empty_store of the address that gets added there.
static next * empty_imbue = NULL;
// Text sector offset recorded by asmdirmem for every memory directive code.
static next * empty_store = NULL;
static void input (form when,
                   byte data) {
    // Branch-free conditional emit of one byte into the text sector.
    // The byte is always stored at the current write position; the position
    // then advances by 'when', so a zero 'when' leaves the stored byte to be
    // overwritten by the next call.
    byte * cursor = text_sector_byte + text_sector_size;

    * cursor = data;

    text_sector_size += (next) when;
}
static void input_by (form       when,
                      size_index size,
                      next       data) {
    // Emit 'data' into the text sector, least significant byte first.
    // Four input calls are always made; call number 'lane' commits its byte
    // only when 'when' is non-zero and 'size' is at least required [lane].
    // Bytes above the fourth are never written (64-bit support is pending).
    const size_index required [4] = { D8, D16, D32, D32 };
    const int        enabled      = (when != 0);
    int              lane;

    for (lane = 0; lane < 4; ++lane) {
        input (enabled && (size >= required [lane]),
               (byte) ((data >> (8 * lane)) & 0xff));
    }
}
static void asmdirrel (form when,
                       next data) {
    // Assembler directive: queue a patch for the current text position.
    // The slot is always filled in, but it is only kept (the patch counter
    // advances) when 'when' is non-zero. 'data' is used later by assemble ()
    // as the index into empty_store of the address to add at that position.
    const next slot = empty_holes;

    empty_array [slot] = text_sector_size;
    empty_imbue [slot] = data;

    empty_holes = slot + (next) when;
}
static void asmdirmem (form when,
                       next code) {
    // Assembler directive: remember the current text position under 'code'.
    // The position is stored regardless of 'when'; only the directive
    // counter depends on it.
    next * entry = empty_store + code;

    empty_count += (next) when;

    * entry = text_sector_size;
}
static void asmdirimm (form       when,
                       size_index size,
                       next       data) {
    // Assembler directive: place one immediate value of the given size
    // directly into the text sector. This is a plain forward to input_by.
    input_by (when, size, data);
}
static void input_at (form       when,
                      size_index size,
                      next       data,
                      next       base) {
    // Emit an address field that assemble () patches afterwards.
    // First the current text position is queued as a patch that refers to
    // 'data', then 'base' is written as the initial field content, least
    // significant byte first. The patch pass adds the recorded address on
    // top of 'base'. No dereferencing and no 64-bit support yet.
    const size_index required [4] = { D8, D16, D32, D32 };
    const int        enabled      = (when != 0);
    int              lane;

    asmdirrel (when, data);

    for (lane = 0; lane < 4; ++lane) {
        input (enabled && (size >= required [lane]),
               (byte) ((base >> (8 * lane)) & 0xff));
    }
}
static form front (form data) {
    // Non-zero for indices 4 through 7; the 8-bit encoders use this to
    // decide whether a bare 0x40 prefix has to be emitted.
    return (! ((data < 4) || (data > 7)));
}
static form lower (form data) {
    // Non-zero for indices 0 through 7.
    return (! ((data < 0) || (data > 7)));
}
static form upper (form data) {
    // Non-zero for indices 8 through 15; these need a prefix bit to be
    // encoded (see build_long_prefix).
    return (! ((data < 8) || (data > 15)));
}
static form far (next label) {
    // Tells whether a jump to 'label' needs the far (two byte opcode) form.
    // Placeholder: for now every jump is far, so the answer is always 1.
    // The previous 'label && 1' returned 0 for label 0, which made
    // build_jump_if emit no opcode bytes at all for that label.
    (void) label;

    return (1);
}
static form near (next label) {
    // Tells whether a jump to 'label' may use the near (one byte opcode)
    // form. Placeholder: near jumps are not produced yet, always 0.
    (void) label;

    return (0);
}
static void build_short_prefix (form when) {
    // Emit the 0x66 prefix byte when 'when' is non-zero; the encoders in
    // this file request it for 16-bit operations.
    const byte prefix = 0x66;

    input (when, prefix);
}
static void build_long_prefix (form big_registers,
                               form new_destination,
                               form new_source) {
    // Emit a prefix byte in the 0x40-0x4D range (bit 0x02 is never set)
    // when at least one of the three flags is non-zero:
    //   0x08 - big_registers   (callers pass size == D64)
    //   0x04 - new_source      (callers pass "source is register 8-15")
    //   0x01 - new_destination (callers pass "destination is register 8-15")
    const int  needed = big_registers || new_destination || new_source;
    const byte prefix = (byte) (0x40
                              + 0x08 * big_registers
                              + 0x04 * new_source
                              + 0x01 * new_destination);

    input (needed, prefix);
}
static void build_register_direction (form when,
                                      next destination,
                                      next source) {
    // Emit the register-to-register operand byte (0xC0-0xFF): the low three
    // bits of 'destination' occupy bits 0-2 and the low three bits of
    // 'source' occupy bits 3-5.
    const next low_field  = destination & 0x07;
    const next high_field = (source & 0x07) << 3;

    input (when, (byte) (0xc0 | high_field | low_field));
}
static void build_register_redirection (form when,
                                        next direction) {
    // Emit the register-with-memory operand byte (0x05-0x3D): a fixed 0x05
    // in the low bits with the low three bits of 'direction' in bits 3-5.
    const next field = (direction & 0x07) << 3;

    input (when, (byte) (field | 0x05));
}
static void build_constant (form       when,
                            size_index size) {
    // Emit the opcode used by operations with an immediate operand:
    // 0x80 for 8-bit operations, 0x81 for every other size.
    byte opcode = (byte) 0x80;

    if (size != D8) {
        opcode = (byte) 0x81;
    }

    input (when, opcode);
}
static void build_regular (operation_index operation,
                           size_index      size,
                           type_index      to,
                           next            destination,
                           type_index      from,
                           next            source) {
    // 00-3F : add, or, adc, sbb, and, sub, xor, cmp
    //
    // Encodes one two-operand arithmetic instruction. 'to' / 'from' select
    // the operand kinds (REG, MEM, IMM); 'destination' / 'source' carry the
    // register index or the immediate value. Every input call below is made
    // unconditionally and commits its byte only when its condition holds.
    //
    // NOTE(review): the short accumulator form indexes the family with
    // 'operation & 0x07' while the general form uses
    // 'operation - REGULAR_BEGIN'; both agree only if REGULAR_BEGIN is a
    // multiple of eight - confirm against the operation enumeration.
    const int reg_reg = (to == REG) && (from == REG);
    const int reg_mem = (to == REG) && (from == MEM);
    const int reg_imm = (to == REG) && (from == IMM);
    const int mem_reg = (to == MEM) && (from == REG);
    const int mem_imm = (to == MEM) && (from == IMM);
    // Immediate into register 0 has its own short opcode.
    const int accumulator = reg_imm && (destination == 0);

    build_short_prefix (size == D16);

    build_long_prefix (size == D64,
                       (to   == REG) && (upper ((form) destination)),
                       (from == REG) && (upper ((form) source)));

    // Bare 0x40 prefix for 8-bit operations touching registers 4-7.
    // 'source' is inspected as a register only when it is one; previously an
    // immediate value of 4..7 was mistaken for a register index and produced
    // a spurious prefix for destinations 0..3.
    input ((size == D8)
           && (to == REG)
           && (((from == REG)
                && ((front ((form) destination) && lower ((form) source))
                 || (lower ((form) destination) && front ((form) source))))
            || ((from == IMM) && front ((form) destination))),
           (byte) 0x40);

    // Short accumulator form: 04/05 + 8 * operation.
    input (accumulator,
           (byte) (0x05
                 + 0x08 * (operation & 0x07)
                 - 0x01 * (size == D8)));

    // 80/81 opcode for every other immediate form.
    build_constant ((from == IMM) && ! ((to == REG) && (destination == 0)),
                    size);

    // Opcode byte for the non-immediate forms, or the operand byte that
    // follows 80/81 for the immediate forms.
    input (! accumulator,
           (byte) (0x08 * (operation - REGULAR_BEGIN)
                 + 0x01 * (mem_imm && (size == D8))
                 - 0x01 * (reg_imm && (size != D8))
                 + 0x01 * (size != D8)
                 + 0x02 * reg_mem
                 + 0x04 * mem_imm
                 + 0xc0 * reg_imm
                 + (destination & 0x07) * reg_imm));

    build_register_direction (reg_reg, destination, source);

    build_register_redirection (reg_mem, destination);
    build_register_redirection (mem_reg, source);

    // Memory operands get an all-ones 32-bit placeholder; immediates are
    // written at the operation size.
    input_by (reg_mem, D32,  (next) ~0);
    input_by (reg_imm, size, source);
    input_by (mem_reg, D32,  (next) ~0);
    input_by (mem_imm, D32,  (next) ~0);
    input_by (mem_imm, size, source);
}
static void build_irregular (operation_index operation,
                             size_index      size,
                             type_index      to,
                             next            destination) {
    // F0-FF : inc, dec, not, neg, mul, imul, div, idiv
    //
    // Encodes one single-operand instruction. The opcode is F6/F7, or FE/FF
    // for inc and dec, with the lower value of each pair used for 8-bit
    // operations. The position of the operation inside the family is placed
    // in bits 3-5 of the operand byte.
    //
    // NOTE(review): the memory form emits no displacement bytes here, unlike
    // build_regular - confirm whether that is pending work.
    byte opcode = (byte) 0xf7;

    if ((operation == INC) || (operation == DEC)) {
        opcode = (byte) 0xff;
    }

    if (size == D8) {
        opcode = (byte) (opcode - 0x01);
    }

    build_short_prefix (size == D16);

    build_long_prefix (size == D64,
                       (to == REG) && (upper ((form) destination)),
                       0);

    // Bare 0x40 prefix for 8-bit operations on registers 4-7.
    input ((size == D8) && (to == REG) && front ((form) destination),
           (byte) 0x40);

    input (1, opcode);

    input (to == REG,
           (byte) (0xc0
                 + 0x08 * (operation - IRREGULAR_BEGIN)
                 + 0x01 * (destination & 0x07)));

    input (to == MEM,
           (byte) (0x05
                 + 0x08 * (operation - IRREGULAR_BEGIN)));
}
static void build_special_1 (operation_index operation) {
    // nop, retn, retf, leave, lock, hlt
    //
    // Single-byte instructions: the opcode is looked up by the position of
    // 'operation' inside the SPECIAL_1 family.
    static const byte opcode_of [SPECIAL_1_COUNT] = {
        0x90, 0xc3, 0xcb, 0xc9, 0xf0, 0xf4
    };

    const byte * opcode = opcode_of + (operation - SPECIAL_1_BEGIN);

    input (1, * opcode);
}
static void build_special_2 (operation_index operation) {
    // sysenter, sysleave, syscall, sysret, pause, cpuid
    //
    // Two-byte instructions: the table stores all first bytes followed by
    // all second bytes, so the two bytes of one instruction are
    // SPECIAL_2_COUNT entries apart.
    static const byte opcode_of [2 * SPECIAL_2_COUNT] = {
        0x0f, 0x0f, 0x0f, 0x0f, 0xf3, 0x0f,
        0x34, 0x35, 0x05, 0x07, 0x90, 0xa2
    };

    const byte * pair = opcode_of + (operation - SPECIAL_2_BEGIN);

    input (1, pair [0]);
    input (1, pair [SPECIAL_2_COUNT]);
}
static void build_jump_if (operation_index operation,
                           size_index      size,
                           next            location) {
    // j**
    //
    // Conditional jump opcode: 0F 80+cc in the far form, 70+cc in the near
    // form, where cc is the position of 'operation' inside the JUMP_IF
    // family. 'size' is ignored for now and no displacement is emitted yet.
    const form use_far   = far (location);
    const form use_near  = near (location);
    const byte condition = (byte) (operation - JUMP_IF_BEGIN);

    (void) size;

    input (use_far,  0x0f);
    input (use_far,  (byte) (0x80 + condition));
    input (use_near, (byte) (0x70 + condition));
}
static void build_move_if (operation_index operation,
                           size_index      size,
                           type_index      to,
                           next            destination,
                           type_index      from,
                           next            source) {
    // cmov**
    //
    // Conditional move: optional prefixes, then 0F 40+cc where cc is the
    // position of 'operation' inside the MOVE_IF family, then the operand
    // byte. The displacement of the memory form is not implemented yet.
    const int  to_register = (to == REG);
    const byte condition   = (byte) (operation - MOVE_IF_BEGIN);

    build_short_prefix (size == D16);

    build_long_prefix (size == D64,
                       to_register   && (upper ((form) destination)),
                       (from == REG) && (upper ((form) source)));

    input (1, 0x0f);
    input (1, (byte) (0x40 + condition));

    build_register_direction (to_register && (from == REG),
                              destination, source);

    build_register_redirection (to_register && (from == MEM), destination);
}
static void build_jump (size_index size,
                        type_index to,
                        next       destination) {
    // jmp
    //
    // Unconditional jump opcode bytes for the three supported targets:
    //   REL - E9, or EB when 'size' is D8
    //   REG - FF E0+register, preceded by 0x41 for registers 8-15
    //   MEM - FF 25
    // No displacement is emitted here yet.
    const int by_register = (to == REG);
    const int by_memory   = (to == MEM);
    const int by_relative = (to == REL);

    input (by_register && upper ((form) destination), (byte) 0X41);

    input (by_relative, (byte) (0xe9 + 0x02 * (size == D8)));

    input (by_register, (byte) 0xff);
    input (by_register, (byte) (0xe0 + 0x01 * (destination & 0x07)));

    input (by_memory, (byte) 0xff);
    input (by_memory, (byte) 0x25);
}
static void build_move (size_index size,
                        type_index to,
                        next       destination,
                        type_index from,
                        next       source) {
    // mov
    //
    // Encodes one move. 'to' / 'from' select the operand kinds (REG, MEM,
    // IMM, REL); 'destination' / 'source' carry the register index, the
    // immediate value or the reference that gets patched in later. Every
    // input call is made unconditionally and commits its byte only when its
    // condition holds.
    build_short_prefix (size == D16);

    build_long_prefix (size == D64,
                       (to   == REG) && (upper ((form) destination)),
                       (from == REG) && (upper ((form) source)));

    // Opcode for the register / memory forms: 88/89 and 8A/8B.
    input ((to == REG) && (from == REG), (byte) (0x88 + (size != D8)));
    input ((to == REG) && (from == MEM), (byte) (0x8a + (size != D8)));
    input ((to == MEM) && (from == REG), (byte) (0x88 + (size != D8)));

    // Operand byte. The register-to-register form needs one as well (it was
    // missing, leaving 88/89 without operands), encoded the same way as in
    // build_regular and build_move_if.
    build_register_direction ((to == REG) && (from == REG),
                              destination, source);

    build_register_redirection ((to == REG) && (from == MEM), destination);
    build_register_redirection ((to == MEM) && (from == REG), source);

    // Load into register: B0+r takes a one byte immediate, B8+r a wider
    // one. The 8-bit immediate form used to get B8+r while only one
    // immediate byte was written. REL always writes four bytes below, so it
    // keeps B8+r whatever the size.
    input ((to == REG) && ((from == IMM) || (from == REL)),
           (byte) (0xb0
                 + 0x08 * ((size != D8) || (from == REL))
                 + 0x01 * (destination & 0x07)));

    // Store immediate to memory: C6/C7 followed by operand byte 05.
    input ((to == MEM) && (from == IMM), (byte) (0xc6 + (size != D8)));
    input ((to == MEM) && (from == IMM), (byte) (0x05));

    // Operand data: addresses are queued for patching, immediates are
    // written at the operation size.
    input_at ((to == REG) && (from == MEM), D32,  source,    0);
    input_by ((to == REG) && (from == IMM), size, source);
    input_at ((to == MEM) && (from == REG), D32,  (next) ~0, (next) ~0);
    input_at ((to == MEM) && (from == IMM), D32,  (next) ~0, (next) ~0);
    input_by ((to == MEM) && (from == IMM), size, source);
    // NOTE(review): 0x4010b0 is a hard-coded base added to the patched
    // address - presumably the load address of the output; confirm.
    input_at ((to == REG) && (from == REL), D32,  source,    0x4010b0);
}
static void build_call (type_index from,
                        next       source) {
    // call
    //
    // Relative call: E8 followed by a 32-bit field that is patched later.
    // The field starts out as minus the text position right behind itself
    // (position after the opcode plus four), so adding the recorded address
    // of 'source' in the patch pass gives the distance to the target.
    const int relative = (from == REL);
    next      behind;

    input (relative, (byte) 0xe8);

    // Has to be read after the opcode byte went in.
    behind = text_sector_size + 4;

    input_at (relative, D32, source, (next) -behind);
}
static void assemble_clean_up (void) {
    // Exit handler: release the buffers allocated by assemble ().
    // Does nothing unless assemble () marked the handler as queued.
    if (assemble_clean_up_queued != 0) {
        free (empty_store);
        free (empty_imbue);
        free (empty_array);
        free (text_sector_byte);
    }
}
// Number of bytes committed to the text sector so far (the write position).
next text_sector_size = 0;
// Text sector buffer, allocated by assemble () and freed at program exit.
byte * text_sector_byte = NULL;
// Set to 1 when assemble () is called with no instructions (zero count or
// NULL array); never reset in this file.
int was_instruction_array_empty = 0;
// Text position recorded for memory directive 0, set at the end of assemble ().
unsigned int text_entry_point = 0;
void assemble (next   count,
               next * array) {
    // Main batched assembling procedure.
    //
    // 'array' holds 'count' words: an operation or directive code followed
    // by its operands, repeated. Every record is encoded into the text
    // sector, then the entry point is taken from memory directive 0 and all
    // queued address patches are applied.
    //
    // With an empty input only was_instruction_array_empty is set. If the
    // working buffers cannot be allocated, nothing is assembled and
    // text_sector_byte is left NULL. An unknown code stops the procedure
    // before the entry point and the patches are processed.
    //
    // NOTE(review): operands are read without checking them against 'count'
    // and the buffers have fixed capacities (1440 text bytes, 144 entries)
    // that are not checked while writing.
    next index;

    if ((count == 0) || (array == NULL)) {
        was_instruction_array_empty = 1;
        return;
    }

    // Right now, batching is not supported, it will be soon.
    // In that case, realloc function will be used with memset.
    text_sector_byte = calloc (1440UL, sizeof (* text_sector_byte));
    empty_array      = calloc (144UL,  sizeof (* empty_array));
    empty_imbue      = calloc (144UL,  sizeof (* empty_imbue));
    empty_store      = calloc (144UL,  sizeof (* empty_store));

    // Every encoder writes through these pointers without checking them, so
    // an allocation failure has to stop the procedure right here.
    if ((text_sector_byte == NULL) || (empty_array == NULL)
    ||  (empty_imbue      == NULL) || (empty_store == NULL)) {
        free (text_sector_byte);
        free (empty_array);
        free (empty_imbue);
        free (empty_store);

        // Cleared so that the exit handler does not free them again.
        text_sector_byte = NULL;
        empty_array      = NULL;
        empty_imbue      = NULL;
        empty_store      = NULL;

        return;
    }

    if (assemble_clean_up_queued == 0) {
        atexit (assemble_clean_up);
        assemble_clean_up_queued = ! assemble_clean_up_queued;
    }

    // Each branch consumes its operands by advancing 'index' past them; the
    // loop increment then steps over the code word itself.
    for (index = 0; index < count; ++index) {
        if (array [index] == ASMDIRREL) {
            // code, reference
            asmdirrel (1, array [index + 1]);
            index += 1;
        } else if (array [index] == ASMDIRMEM) {
            // code, memory directive code
            asmdirmem (1, array [index + 1]);
            index += 1;
        } else if (array [index] == ASMDIRIMM) {
            // code, size, amount, then 'amount' values
            next repeat;
            for (repeat = 0; repeat < array [index + 2]; ++repeat) {
                asmdirimm (1, array [index + 1],
                              array [index + 3 + repeat]);
            }
            index += 2 + array [index + 2];
        // ASMDIRREP is not handled yet.
        } else if ((array [index] >= REGULAR_BEGIN)
               &&  (array [index] <= REGULAR_END)) {
            // operation, size, to, destination, from, source
            build_regular (array [index + 0], array [index + 1],
                           array [index + 2], array [index + 3],
                           array [index + 4], array [index + 5]);
            index += 5;
        } else if ((array [index] >= IRREGULAR_BEGIN)
               &&  (array [index] <= IRREGULAR_END)) {
            // operation, size, to, destination
            build_irregular (array [index + 0], array [index + 1],
                             array [index + 2], array [index + 3]);
            index += 3;
        } else if ((array [index] >= SPECIAL_1_BEGIN)
               &&  (array [index] <= SPECIAL_1_END)) {
            // operation only
            build_special_1 (array [index + 0]);
            index += 0;
        } else if ((array [index] >= SPECIAL_2_BEGIN)
               &&  (array [index] <= SPECIAL_2_END)) {
            // operation only
            build_special_2 (array [index + 0]);
            index += 0;
        } else if ((array [index] >= JUMP_IF_BEGIN)
               &&  (array [index] <= JUMP_IF_END)) {
            // operation, size, location
            build_jump_if (array [index + 0], array [index + 1],
                           array [index + 2]);
            index += 2;
        } else if ((array [index] >= MOVE_IF_BEGIN)
               &&  (array [index] <= MOVE_IF_END)) {
            // operation, size, to, destination, from, source
            build_move_if (array [index + 0], array [index + 1],
                           array [index + 2], array [index + 3],
                           array [index + 4], array [index + 5]);
            index += 5;
        } else if (array [index] == JMP) {
            // code, size, to, destination
            build_jump (array [index + 1], array [index + 2],
                        array [index + 3]);
            index += 3;
        } else if (array [index] == MOV) {
            // code, size, to, destination, from, source
            build_move (array [index + 1], array [index + 2],
                        array [index + 3], array [index + 4],
                        array [index + 5]);
            index += 5;
        } else if (array [index] == CALL) {
            // code, from, source
            build_call (array [index + 1], array [index + 2]);
            index += 2;
        } else {
            // Unknown code: give up.
            return;
        }
    }

    text_entry_point = empty_store [0];

    // Patch pass: add the recorded address of the referenced memory
    // directive to the value already present at every queued position.
    // memcpy is used because the positions are not necessarily aligned.
    for (index = 0; index < empty_holes; ++index) {
        next set = 0, get = empty_array [index];
        memcpy (& set, & text_sector_byte [get], sizeof (set));
        set += empty_store [empty_imbue [index]];
        memcpy (& text_sector_byte [get], & set, sizeof (set));
    }
}