Compare commits

..

2 Commits

Author SHA1 Message Date
veclav talica
bd19a43c0d gdb.sh 2023-09-19 09:13:57 +05:00
veclav talica
958a89272d opCall, return stack, r12 for thread pointer 2023-09-19 09:13:46 +05:00
5 changed files with 81 additions and 30 deletions

3
gdb.sh Executable file
View File

@ -0,0 +1,3 @@
#!/bin/sh
gdb ./zig-out/bin/nmvm -ex 'b arch.x86-64.execute' -ex 'layout asm' -ex 'r'

View File

@ -1,2 +1,8 @@
# .nmvm Near Metal Virtual Machine # .nmvm Near Metal Virtual Machine
Exercise in building low overhead VM via architecture specific means. Exercise in building low overhead VM via architecture specific means.
## Cases
- Native stack usage for virtual machine.
- Specific permutations of instructions for case optimizations.
- Array processing instructions.
- Absolute addressing for interpreter state, in TLS.

View File

@ -1,5 +1,10 @@
// todo: Use r12, r13, ... instead? They're preserved in Sys V abi which might make it more confortable,
// but they might increase binary size, gotta test.
// todo: Try using something else that has lesser opcode size.
// Execution thread convention: // Execution thread convention:
// rdi <- binary thread // r12 <- binary thread pointer
// r13 <- return stack pointer
// Resources used: // Resources used:
// https://mort.coffee/home/fast-interpreters/ // https://mort.coffee/home/fast-interpreters/
@ -10,14 +15,17 @@
// https://csiflabs.cs.ucdavis.edu/~ssdavis/50/att-syntax.htm // https://csiflabs.cs.ucdavis.edu/~ssdavis/50/att-syntax.htm
pub const Word = u64; pub const Word = u64;
pub const RecursionLimit = 1024;
threadlocal var return_stack: [RecursionLimit + 1]Word = undefined;
// todo: Variant that pushes array of words. // todo: Variant that pushes array of words.
/// (iw | -- iw) /// (iw | -- iw)
pub fn opPushWord() callconv(.Naked) noreturn { pub fn opPushWord() callconv(.Naked) noreturn {
asm volatile ( asm volatile (
\\ add $0x10, %%rdi \\ add $0x10, %%r12
\\ pushq -8(%%rdi) \\ pushq -8(%%r12)
\\ jmpq *(%%rdi) \\ jmpq *(%%r12)
); );
} }
@ -25,9 +33,9 @@ pub fn opPushWord() callconv(.Naked) noreturn {
/// (w --) /// (w --)
pub fn opSinkWord() callconv(.Naked) noreturn { pub fn opSinkWord() callconv(.Naked) noreturn {
asm volatile ( asm volatile (
\\ add $0x08, %%rdi \\ add $0x08, %%r12
\\ addq $0x08, %%rsp \\ addq $0x08, %%rsp
\\ jmpq *(%%rdi) \\ jmpq *(%%r12)
); );
} }
@ -53,13 +61,13 @@ pub fn opSumWordsWithOverflow() callconv(.Naked) noreturn {
// https://www.felixcloutier.com/x86/setcc // https://www.felixcloutier.com/x86/setcc
// idea: Could https://www.felixcloutier.com/x86/cmovcc be better for overflow push? // idea: Could https://www.felixcloutier.com/x86/cmovcc be better for overflow push?
asm volatile ( asm volatile (
\\ addq $0x08, %%r12
\\ movq (%%rsp), %%rax \\ movq (%%rsp), %%rax
\\ adcq 8(%%rsp), %%rax \\ adcq 8(%%rsp), %%rax
\\ movq %%rax, 8(%%rsp) \\ movq %%rax, 8(%%rsp)
\\ setc %%al \\ setc %%al
\\ movb %%al, 7(%%rsp) \\ movb %%al, (%%rsp)
\\ addq $0x08, %%rdi \\ jmpq *(%%r12)
\\ jmpq *(%%rdi)
); );
} }
@ -72,20 +80,47 @@ pub fn opSumWordsWithOverflow() callconv(.Naked) noreturn {
// @call(.always_tail, binary[offset].function, .{ &binary[offset], cond }); // @call(.always_tail, binary[offset].function, .{ &binary[offset], cond });
// } // }
/// (addr) // todo: Complex call op that would receive immediate mask that would tell
pub fn opReturn() callconv(.Naked) noreturn { // which positions of stack to duplicate, as well as mixing of plain immediate operands.
// https://www.felixcloutier.com/x86/ret // Or we could decouple it from call, it might be useful at other places.
asm volatile ("ret"); /// (iw |)
} pub fn opCall() callconv(.Naked) noreturn {
pub fn execute(binary: []const Word, entry_addr: usize) void {
// todo: Ensure correctness.
// https://wiki.osdev.org/System_V_ABI
// https://www.felixcloutier.com/x86/call
asm volatile ( asm volatile (
\\ call *(%%rdi) \\ leaq 16(%%r12), %%rax
: \\ subq $0x8, %%r13
: [thread] "rdi" (&binary[entry_addr]), \\ movq %%rax, (%%r13)
: "rflags", "rax", "rbx", "rsp", "rbp", "r12", "r13", "r14", "r15", "rsi", "rdx", "rcx", "r8", "r9", "r10", "r11", "memory" \\ movq 8(%%r12), %%r12
\\ jmpq *(%%r12)
);
}
/// (addr)
pub fn opReturn() callconv(.Naked) noreturn {
asm volatile (
\\ movq (%%r13), %%r12
\\ addq $0x08, %%r13
\\ jmpq *(%%r12)
);
}
// todo: Make sure it's non reentry in one given thread.
pub fn execute(binary: []const Word, entry_addr: usize) void {
@setCold(true);
// todo: Ensure correctness.
// https://wiki.osdev.org/System_V_ABI
// todo: Use remaining stack as return.
// Such device is used so that opReturn could be used for return.
asm volatile (
\\ movq $0f, 8(%%r13)
\\ leaq 8(%%r13), %%rax
\\ movq %%rax, (%%r13)
\\ jmpq *(%%r12)
\\ 0:
:
: [thread] "r" (&binary[entry_addr]),
[retstk] "r" (&return_stack[return_stack.len - 2]),
: "rflags", "rax", "rbx", "rsp", "rdi", "rbp", "r14", "r15", "rsi", "rdx", "rcx", "r8", "r9", "r10", "r11", "memory"
); );
} }

View File

@ -14,4 +14,4 @@
// idea: 'JIT' could be done by simple op* compiled binary copying up until `jmpq *(%%rdi)`, // idea: 'JIT' could be done by simple op* compiled binary copying up until `jmpq *(%%rdi)`,
// with immediate operand prelude modified, which could be done procedurally. // with immediate operand prelude modified, which could be done procedurally.
usingnamespace @import("arch/x86-64.zig"); pub usingnamespace @import("arch/x86-64.zig");

View File

@ -1,16 +1,23 @@
const int = @import("interpreter.zig"); const int = @import("interpreter.zig");
pub fn main() !void { pub fn main() !void {
const binary = [_]int.Word{ // todo: Mixing return addresses in stack poses a challenge, hm.
@as(int.Word, @intFromPtr(&int.opPushWord)), const add = [_]int.Word{
~@as(int.Word, 1),
@as(int.Word, @intFromPtr(&int.opPushWord)),
~@as(int.Word, 1),
@as(int.Word, @intFromPtr(&int.opSumWordsWithOverflow)), @as(int.Word, @intFromPtr(&int.opSumWordsWithOverflow)),
@as(int.Word, @intFromPtr(&int.opReturn)),
};
const entry = [_]int.Word{
@as(int.Word, @intFromPtr(&int.opPushWord)),
1,
@as(int.Word, @intFromPtr(&int.opPushWord)),
2,
@as(int.Word, @intFromPtr(&int.opCall)),
@as(int.Word, @intFromPtr(&add)),
@as(int.Word, @intFromPtr(&int.opSinkWord)), @as(int.Word, @intFromPtr(&int.opSinkWord)),
@as(int.Word, @intFromPtr(&int.opSinkWord)), @as(int.Word, @intFromPtr(&int.opSinkWord)),
@as(int.Word, @intFromPtr(&int.opReturn)), @as(int.Word, @intFromPtr(&int.opReturn)),
}; };
int.execute(&binary, 0); int.execute(&entry, 0);
} }