aboutsummaryrefslogtreecommitdiff
path: root/src/interp.c
diff options
context:
space:
mode:
authorXavier Del Campo Romero <xavi.dcr@tutanota.com>2023-11-26 22:43:30 +0100
committerXavier Del Campo Romero <xavi.dcr@tutanota.com>2024-04-21 01:51:24 +0200
commitf25b015e5b668028c34974bbb22faa4105c26690 (patch)
tree28f2b08c17b3585d06694ad74004d0617eadb785 /src/interp.c
downloadnanowasm-sync-f25b015e5b668028c34974bbb22faa4105c26690.tar.gz
First commit
Diffstat (limited to 'src/interp.c')
-rw-r--r--src/interp.c516
1 files changed, 516 insertions, 0 deletions
diff --git a/src/interp.c b/src/interp.c
new file mode 100644
index 0000000..3a32df0
--- /dev/null
+++ b/src/interp.c
@@ -0,0 +1,516 @@
+/*
+ * nanowasm, a tiny WebAssembly/Wasm interpreter
+ * Copyright (C) 2023-2024 Xavier Del Campo Romero
+ *
+ * This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at https://mozilla.org/MPL/2.0/.
+ */
+
+#include <nanowasm/nw.h>
+#include <nw/log.h>
+#include <nw/interp.h>
+#include <nw/opcodes.h>
+#include <nw/ops.h>
+#include <nw/sections.h>
+#include <nw/types.h>
+#include <errno.h>
+#include <limits.h>
+#include <inttypes.h>
+#include <stdbool.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+
+static const enum opcode initexpr_opcodes[] =
+{
+ OP_NOP,
+ OP_END,
+ OP_I32_CONST,
+ OP_I64_CONST,
+ OP_F32_CONST,
+ OP_F64_CONST
+};
+
+const struct interp_set interp_initexpr_set =
+{
+ .opcodes = initexpr_opcodes,
+ .n = sizeof initexpr_opcodes / sizeof *initexpr_opcodes
+};
+
+static int (*const ops[])(struct nw_interp *) =
+{
+ [OP_UNREACHABLE] = op_unreachable,
+ [OP_NOP] = op_nop,
+ [OP_BLOCK] = op_block,
+ [OP_LOOP] = op_loop,
+ [OP_IF] = op_if,
+ [OP_ELSE] = op_else,
+ [OP_END] = op_end,
+ [OP_BR] = op_br,
+ [OP_BR_IF] = op_br_if,
+ [OP_BR_TABLE] = op_br_table,
+ [OP_RETURN] = op_return,
+ [OP_CALL] = op_call,
+ [OP_CALL_INDIRECT] = op_call_indirect,
+ [OP_GET_LOCAL] = op_get_local,
+ [OP_SET_LOCAL] = op_set_local,
+ [OP_TEE_LOCAL] = op_tee_local,
+ [OP_GET_GLOBAL] = op_get_global,
+ [OP_SET_GLOBAL] = op_set_global,
+ [OP_I32_LOAD] = op_i32_load,
+ [OP_I32_STORE] = op_i32_store,
+ [OP_I32_CONST] = op_i32_const,
+ [OP_I64_CONST] = op_i64_const,
+ [OP_F32_CONST] = op_f32_const,
+ [OP_F64_CONST] = op_f64_const,
+ [OP_I32_SUB] = op_i32_sub
+};
+
+int interp_run(struct nw_interp *const i)
+{
+ uint8_t op;
+
+ if (!fread(&op, sizeof op, 1, i->f))
+ {
+ LOG("%s: fread(3) failed, feof=%d, ferror=%d\n", __func__, feof(i->f),
+ ferror(i->f));
+ i->exception = "I/O error";
+ return -1;
+ }
+ else if (op >= sizeof ops / sizeof *ops)
+ {
+ LOG("%s: invalid opcode %#" PRIx8 "\n", __func__, op);
+ i->exception = "invalid opcode";
+ return -1;
+ }
+ else if (!ops[op])
+ {
+ LOG("%s: unsupported opcode %#" PRIx8 "\n", __func__, op);
+ i->exception = "invalid opcode";
+ return -1;
+ }
+
+ return ops[op](i);
+}
+
+static int run_opcode_limited(struct nw_interp *const in,
+ const struct interp_set *const set)
+{
+ uint8_t op;
+
+ if (!fread(&op, sizeof op, 1, in->f))
+ {
+ LOG("%s: fread(3) failed, feof=%d, ferror=%d\n",
+ __func__, feof(in->f), ferror(in->f));
+ in->exception = "I/O error";
+ return -1;
+ }
+
+ for (size_t i = 0; i < set->n; i++)
+ if (op == set->opcodes[i])
+ return ops[op](in);
+
+ LOG("%s: unexpected opcode %#" PRIx8 "\n", __func__, op);
+ in->exception = "invalid opcode";
+ return -1;
+}
+
+int interp_run_limited(struct nw_interp *const i,
+ const struct interp_set *const set)
+{
+ while (!i->exit)
+ if (run_opcode_limited(i, set))
+ {
+ LOG("%s: run_opcode_limited failed\n", __func__);
+ return -1;
+ }
+
+ return 0;
+}
+
+int interp_check_opcode(const uint8_t op, FILE *const f)
+{
+ static int (*const checks[])(FILE *) =
+ {
+ [OP_UNREACHABLE] = check_unreachable,
+ [OP_NOP] = check_nop,
+ [OP_BLOCK] = check_block,
+ [OP_LOOP] = check_loop,
+ [OP_IF] = check_if,
+ [OP_ELSE] = check_else,
+ [OP_END] = check_end,
+ [OP_BR] = check_br,
+ [OP_BR_IF] = check_br_if,
+ [OP_BR_TABLE] = check_br_table,
+ [OP_RETURN] = check_return,
+ [OP_CALL] = check_call,
+ [OP_CALL_INDIRECT] = check_call_indirect,
+ [OP_GET_LOCAL] = check_get_local,
+ [OP_SET_LOCAL] = check_set_local,
+ [OP_TEE_LOCAL] = check_tee_local,
+ [OP_GET_GLOBAL] = check_get_global,
+ [OP_SET_GLOBAL] = check_set_global,
+ [OP_I32_LOAD] = check_i32_load,
+ [OP_I32_STORE] = check_i32_store,
+ [OP_I32_CONST] = check_i32_const,
+ [OP_I64_CONST] = check_i64_const,
+ [OP_F32_CONST] = check_f32_const,
+ [OP_F64_CONST] = check_f64_const,
+ [OP_I32_SUB] = check_i32_sub
+ };
+
+ if (op >= sizeof checks / sizeof *checks)
+ {
+ LOG("%s: invalid opcode %#" PRIx8 "\n", __func__, op);
+ return 1;
+ }
+ else if (!checks[op])
+ {
+ LOG("%s: unsupported opcode %#" PRIx8 "\n", __func__, op);
+ return 1;
+ }
+
+ return checks[op](f);
+}
+
+int interp_start(const struct nw_interp_cfg *const cfg, FILE *const f,
+ struct nw_interp *const i)
+{
+ *i = (const struct nw_interp)
+ {
+ .f = f,
+ .cfg = *cfg
+ };
+
+ return 0;
+}
+
+void *interp_stackptr(const struct nw_interp *const i)
+{
+ return (char *)i->cfg.stack.buf + i->stack_i;
+}
+
+static int push_frame(struct nw_interp *const i,
+ const struct nw_frame *const src)
+{
+ struct nw_frame *const dst = interp_stackptr(i);
+
+ if (interp_stack_push(i, src, sizeof (*src)))
+ {
+ LOG("%s: interp_stack_push failed\n", __func__);
+ return -1;
+ }
+ else if (i->fp)
+ i->fp->next = dst;
+
+ i->fp = dst;
+ return 0;
+}
+
+static bool mul_overflow(const size_t a, const size_t b)
+{
+ return a && (a * b) / a != b;
+}
+
+static void init_i32(const varuint32 count, void *const p)
+{
+ for (int32_t *i = p; i - (const int32_t *)p < count; i++)
+ *i = 0;
+}
+
+static void init_i64(const varuint32 count, void *const p)
+{
+ for (int64_t *i = p; i - (const int64_t *)p < count; i++)
+ *i = 0;
+}
+
+static void init_f32(const varuint32 count, void *const p)
+{
+ for (float *i = p; i - (const float *)p < count; i++)
+ *i = 0;
+}
+
+static void init_f64(const varuint32 count, void *const p)
+{
+ for (double *i = p; i - (const double *)p < count; i++)
+ *i = 0;
+}
+
+static void init_locals(const enum value_type type, const varuint32 count,
+ void *const p)
+{
+ static void (*const init[])(varuint32, void *) =
+ {
+ [VALUE_TYPE_I32] = init_i32,
+ [VALUE_TYPE_I64] = init_i64,
+ [VALUE_TYPE_F32] = init_f32,
+ [VALUE_TYPE_F64] = init_f64
+ };
+
+ init[type](count, p);
+}
+
+static int push_locals(struct nw_interp *const i,
+ const struct nw_frame *const f)
+{
+ const enum value_type t = f->local_type;
+ const size_t typesz = get_type_size(t);
+ const unsigned long n = f->n_locals;
+
+ if (mul_overflow(typesz, f->n_locals))
+ {
+ LOG("%s: local variables size mul overflow", __func__);
+ i->exception = "mul overfllow";
+ return -1;
+ }
+
+ const size_t totalsz = typesz * n, max = i->cfg.stack.n;
+
+ if (totalsz > max || i->stack_i > max - totalsz)
+ {
+ LOG("%s: cannot allocate locals\n", __func__);
+ i->exception = "stack overflow";
+ return 1;
+ }
+
+ init_locals(t, n, interp_stackptr(i));
+ i->stack_i += totalsz;
+ return 0;
+}
+
+static int do_push_labels(struct nw_interp *const i,
+ const struct nw_frame *const fr)
+{
+ size_t n = 0;
+
+ for (;;)
+ {
+
+ interp_check_opcode();
+ }
+}
+
+static int push_labels(struct nw_interp *const i,
+ const struct nw_frame *const fr)
+{
+ FILE *const f = i->f;
+ const long orig = ftell(f);
+
+ if (orig < 0)
+ {
+ LOG("%s: ftell(3): %s\n", __func__, strerror(errno));
+ return -1;
+ }
+ else if (do_push_labels(i, fr))
+ {
+ LOG("%s: do_push_labels failed\n", __func__);
+ return -1;
+ }
+ else if (fseek(f, orig, SEEK_SET))
+ {
+ LOG("%s: fseek(3): %s\n", __func__, strerror(errno));
+ return -1;
+ }
+
+ return -1;
+}
+
+int interp_push(struct nw_interp *const i, const struct nw_frame *const f)
+{
+ if (push_frame(i, f))
+ {
+ LOG("%s: push_frame failed\n", __func__);
+ return -1;
+ }
+ else if (push_locals(i, f))
+ {
+ LOG("%s: push_locals failed\n", __func__);
+ return -1;
+ }
+ else if (push_labels(i, f))
+ {
+ LOG("%s: push_labels failed\n", __func__);
+ return -1;
+ }
+
+ return 0;
+}
+
+struct retval_priv
+{
+ enum value_type type;
+
+ union
+ {
+ int32_t i32;
+ int64_t i64;
+ float f32;
+ double f64;
+ } u;
+};
+
+static void get_i32(const void *const buf, struct retval_priv *const rp)
+{
+ rp->u.i32 = *(((const int32_t *)buf) - 1);
+}
+
+static void get_i64(const void *const buf, struct retval_priv *const rp)
+{
+ rp->u.i64 = *(((const int64_t *)buf) - 1);
+}
+
+static void get_f32(const void *const buf, struct retval_priv *const rp)
+{
+ rp->u.f32 = *(((const float *)buf) - 1);
+}
+
+static void get_f64(const void *const buf, struct retval_priv *const rp)
+{
+ rp->u.f64 = *(((const double *)buf) - 1);
+}
+
+static int get_retval(struct nw_interp *const i,
+ struct retval_priv *const rp)
+{
+ const struct retval *const r = &i->fp->retval;
+ const size_t sz = get_type_size(r->type), max = i->cfg.stack.n;
+
+ if (max < sz || i->stack_i >= max - sz)
+ {
+ static const char exc[] = "stack underflow";
+
+ LOG("%s: %s\n", __func__, exc);
+ i->exception = exc;
+ return -1;
+ }
+
+ const void *const buf = (const char *)interp_stackptr(i) - sz;
+ static void (*const get[])(const void *, struct retval_priv *) =
+ {
+ [VALUE_TYPE_I32] = get_i32,
+ [VALUE_TYPE_I64] = get_i64,
+ [VALUE_TYPE_F32] = get_f32,
+ [VALUE_TYPE_F64] = get_f64
+ };
+
+ get[r->type](buf, rp);
+ rp->type = r->type;
+ i->stack_i -= sz;
+ return 0;
+}
+
+int interp_pop(struct nw_interp *const i)
+{
+ if (!i->fp)
+ {
+ static const char exc[] = "no frame pointer";
+
+ LOG("%s: %s\n", __func__, exc);
+ i->exception = exc;
+ return -1;
+ }
+
+ const struct retval *const r = &i->fp->retval;
+ struct retval_priv rp;
+
+ if (r->returns && get_retval(i, &rp))
+ {
+ LOG("%s: get_retval failed\n", __func__);
+ return -1;
+ }
+
+ const char *const stackptr = interp_stackptr(i);
+ const ptrdiff_t diff = stackptr - (const char *)i->fp;
+
+ i->stack_i -= diff;
+
+ if (!(i->fp = i->fp->prev))
+ {
+ /* Entry point is always assumed to return int, which is
+ * defined as an i32 variable according to Wasm. */
+ if (rp.type != VALUE_TYPE_I32)
+ {
+ LOG("%s: expected i32 return type, got %s\n", __func__,
+ value_type_tostr(rp.type));
+ i->exception = "unexpected return type";
+ return -1;
+ }
+
+ i->retval = rp.u.i32;
+ i->exit = true;
+ }
+
+ return 0;
+}
+
+int interp_stack_push(struct nw_interp *const i, const void *const src,
+ const size_t n)
+{
+ void *const dst = interp_stackptr(i);
+
+ if (i->cfg.stack.n < n || i->stack_i > i->cfg.stack.n - n)
+ {
+ LOG("%s: stack overflow\n", __func__);
+ i->exception = "stack overflow";
+ return -1;
+ }
+
+ memcpy(dst, src, n);
+ i->stack_i += n;
+ return 0;
+}
+
+int interp_stack_pop(struct nw_interp *const i, void *const dst,
+ const size_t n)
+{
+ if (i->stack_i < n)
+ {
+ LOG("%s: stack underflow\n", __func__);
+ i->exception = "stack underflow";
+ return -1;
+ }
+
+ i->stack_i -= n;
+ memcpy(dst, interp_stackptr(i), n);
+ return 0;
+}
+
+int interp_heap_store(struct nw_interp *const i, const size_t addr,
+ const void *const src, const size_t n)
+{
+ if (i->cfg.heap.n < n || addr > i->cfg.heap.n - n)
+ {
+ static const char exc[] = "heap overflow";
+
+ LOG("%s: %s\n", __func__, exc);
+ i->exception = exc;
+ return -1;
+ }
+
+ void *const dst = (char *)i->cfg.heap.buf + addr;
+
+ memcpy(dst, src, n);
+ return 0;
+}
+
+int interp_heap_load(struct nw_interp *const i, const size_t addr,
+ void *const dst, const size_t n)
+{
+ const size_t max = i->cfg.heap.n;
+
+ if (max < n || addr > max - n)
+ {
+ static const char exc[] = "heap out-of-bounds access";
+
+ LOG("%s: %s (%lu, max %zu)\n", __func__, exc, (unsigned long)addr, max);
+ i->exception = exc;
+ return -1;
+ }
+
+ const void *const src = (const char *)i->cfg.heap.buf + addr;
+
+ memcpy(dst, src, n);
+ return 0;
+}