From 2a376db307644e272cd0e856a1b0a0aecc1b8f13 Mon Sep 17 00:00:00 2001 From: Filipe Marques Date: Mon, 8 Jul 2024 16:05:36 +0200 Subject: [PATCH] Dealing with the linear memory in external functions --- example/define_host_function/README.md | 119 ++++++++++++++++++++ example/define_host_function/dune | 9 +- example/define_host_function/extern_mem.ml | 51 +++++++++ example/define_host_function/extern_mem.wat | 19 ++++ 4 files changed, 197 insertions(+), 1 deletion(-) create mode 100644 example/define_host_function/extern_mem.ml create mode 100644 example/define_host_function/extern_mem.wat diff --git a/example/define_host_function/README.md b/example/define_host_function/README.md index bea9d513f..74a875b54 100644 --- a/example/define_host_function/README.md +++ b/example/define_host_function/README.md @@ -1,5 +1,7 @@ # Using and defining external functions (host functions) +## Dealing with the Stack + Given the following `extern.wat` file: @@ -104,7 +106,124 @@ $ ./extern.exe 13 ``` +## Dealing with the Linear Memory + +Owi also allows interacting with linear memory through external functions. +This is helpful because it enables the host system to communicate directly +with a Wasm instance through its linear memory. Consider the tiny example +below to illustrate this: + + +```wat +(module $extern_mem + + (import "chorizo" "memset" (func $memset (param i32 i32 i32))) + + (import "chorizo" "print_x64" (func $print_x64 (param i64))) + + (memory 1) + + (func $start + + ;; memset start byte lenght + (call $memset (i32.const 0) (i32.const 0xAA) (i32.const 8)) + + ;; print_x64 ptr + (call $print_x64 (i64.load (i32.const 0))) + ) + + (start $start) +) +``` + +In the module `$extern_mem`, we first import `$memset` and `$print_x64`. Then, +in the `$start` function, we initialize the memory starting at address +`(i32.const 0)` with a sequence of length `(i32.const 8)` with bytes of +`(i32.const 0xAA)`. + +The definition of the external functions follows the same format as the +[previous example]. The difference is that, now, in the GADT definition of +memset to allow the memory to be passed to this function, we need to wrap +the three I32 arguments in a Mem variant. That is, instead of writing +memset as: + +```ocaml +(Func (Arg (I32, (Arg (I32, (Arg (I32, Res))))), R0), memset) +``` + +One should use: + +```ocaml +(Func (Mem (Arg (I32, (Arg (I32, (Arg (I32, Res)))))), R0), memset) +``` + +See the module below for the whole implementation: + + +```ocaml +open Owi + +(* an extern module that will be linked with a wasm module *) +let extern_module : Concrete_value.Func.extern_func Link.extern_module = + (* some custom functions *) + let memset m start c n = + let rec loop offset = + if Int32.le offset n then begin + Concrete_memory.store_8 m ~addr:(Int32.add start offset) c; + loop (Int32.add offset 1l) + end + in loop 0l + in + let print_x64 (i : int64) = Printf.printf "0x%LX\n%!" i in + (* we need to describe their types *) + let functions = + [ ( "print_x64" + , Concrete_value.Func.Extern_func (Func (Arg (I64, Res), R0), print_x64) + ) + ; ( "memset" + , Concrete_value.Func.Extern_func + (Func (Mem (Arg (I32, (Arg (I32, (Arg (I32, Res)))))), R0), memset) ) + ] + in + { functions } + +(* a link state that contains our custom module, available under the name `chorizo` *) +let link_state = + Link.extern_module Link.empty_state ~name:"chorizo" extern_module + +(* a pure wasm module refering to `$extern_mem` *) +let pure_wasm_module = + match Parse.Text.Module.from_file (Fpath.v "extern_mem.wat") with + | Error e -> Result.failwith e + | Ok modul -> modul + +(* our pure wasm module, linked with `chorizo` *) +let module_to_run, link_state = + match + Compile.Text.until_link link_state ~unsafe:false ~optimize:true ~name:None + pure_wasm_module + with + | Error e -> Result.failwith e + | Ok v -> v + +(* let's run it ! it will print the values as defined in the print_i64 function *) +let () = + match Interpret.Concrete.modul link_state.envs module_to_run with + | Error e -> Result.failwith e + | Ok () -> () +``` + +Running the above program should yield: + +```sh +$ ./extern_mem.exe +0xAAAAAAAAAAAAAAAA +``` + +## Advanced Usage + To learn more, see our advanced [Game of Life] example based on the famous cellular automaton by Conway. It show how to link several modules from different `.wat` files. [Game of Life]: ./life_game +[previous example]: ./README.md#dealing-with-the-stack diff --git a/example/define_host_function/dune b/example/define_host_function/dune index 64ad65a0f..d78a500f1 100644 --- a/example/define_host_function/dune +++ b/example/define_host_function/dune @@ -2,11 +2,18 @@ (name extern) (libraries owi)) +(executable + (name extern_mem) + (libraries owi)) + (mdx (libraries owi fpath) (deps %{bin:owi} (file extern.exe) (file extern.ml) - (file extern.wat)) + (file extern.wat) + (file extern_mem.exe) + (file extern_mem.ml) + (file extern_mem.wat)) (files README.md)) diff --git a/example/define_host_function/extern_mem.ml b/example/define_host_function/extern_mem.ml new file mode 100644 index 000000000..06ae83ba3 --- /dev/null +++ b/example/define_host_function/extern_mem.ml @@ -0,0 +1,51 @@ +open Owi + +(* an extern module that will be linked with a wasm module *) +let extern_module : Concrete_value.Func.extern_func Link.extern_module = + (* some custom functions *) + let memset m start byte length = + let rec loop offset = + if Int32.le offset length then begin + Concrete_memory.store_8 m ~addr:(Int32.add start offset) byte; + loop (Int32.add offset 1l) + end + in + loop 0l + in + let print_x64 (i : int64) = Printf.printf "0x%LX\n%!" i in + (* we need to describe their types *) + let functions = + [ ( "print_x64" + , Concrete_value.Func.Extern_func (Func (Arg (I64, Res), R0), print_x64) + ) + ; ( "memset" + , Concrete_value.Func.Extern_func + (Func (Mem (Arg (I32, Arg (I32, Arg (I32, Res)))), R0), memset) ) + ] + in + { functions } + +(* a link state that contains our custom module, available under the name `chorizo` *) +let link_state = + Link.extern_module Link.empty_state ~name:"chorizo" extern_module + +(* a pure wasm module refering to `$extern_mem` *) +let pure_wasm_module = + match Parse.Text.Module.from_file (Fpath.v "extern_mem.wat") with + | Error e -> Result.failwith e + | Ok modul -> modul + +(* our pure wasm module, linked with `chorizo` *) +let module_to_run, link_state = + match + Compile.Text.until_link link_state ~unsafe:false ~optimize:true ~name:None + pure_wasm_module + with + | Error e -> Result.failwith e + | Ok v -> v + +(* let's run it ! it will print the values as defined in the print_i64 function *) +let () = + match Interpret.Concrete.modul link_state.envs module_to_run with + | Error e -> Result.failwith e + | Ok () -> () diff --git a/example/define_host_function/extern_mem.wat b/example/define_host_function/extern_mem.wat new file mode 100644 index 000000000..b5590a344 --- /dev/null +++ b/example/define_host_function/extern_mem.wat @@ -0,0 +1,19 @@ +(module $extern_mem + + (import "chorizo" "memset" (func $memset (param i32 i32 i32))) + + (import "chorizo" "print_x64" (func $print_x64 (param i64))) + + (memory 1) + + (func $start + + ;; memset 0 0xAA 8 + (call $memset (i32.const 0) (i32.const 0xAA) (i32.const 8)) + + ;; print_x64 ptr + (call $print_x64 (i64.load (i32.const 0))) + ) + + (start $start) +)