From 3ae88c0c5a4e298de6efb63f0a7374ab0523a9b9 Mon Sep 17 00:00:00 2001 From: Luke Wagner Date: Sat, 8 Jun 2024 18:13:03 -0500 Subject: [PATCH] Define the wasm32 build target --- README.md | 5 +- design/mvp/BuildTargets.md | 452 ++++++++++++++++++++++++ design/mvp/CanonicalABI.md | 77 ++-- design/mvp/canonical-abi/definitions.py | 61 ++-- design/mvp/canonical-abi/run_tests.py | 6 +- 5 files changed, 551 insertions(+), 50 deletions(-) create mode 100644 design/mvp/BuildTargets.md diff --git a/README.md b/README.md index 2f8c6320..ca34e4a2 100644 --- a/README.md +++ b/README.md @@ -5,8 +5,8 @@ user-focused explanation, take a look at the **[Component Model Documentation]** This repository contains the high-level [goals], [use cases], [design choices] and [FAQ] of the Component Model as well as more-detailed, low-level explainer -docs describing the [IDL], [text format], [binary format], [concurrency model] -and [Canonical ABI]. +docs describing the [IDL], [text format], [binary format], [concurrency model], +[Canonical ABI] and [Core WebAssembly Build Targets]. In the future, this repository will additionally contain a [formal spec], reference interpreter and test suite. @@ -34,6 +34,7 @@ To contribute to any of these repositories, see the Community Group's [Binary Format]: design/mvp/Binary.md [Concurrency Model]: design/mvp/Async.md [Canonical ABI]: design/mvp/CanonicalABI.md +[Core WebAssembly Build Targets]: design/mvp/BuildTargets.md [formal spec]: spec/ [W3C WebAssembly Community Group]: https://www.w3.org/community/webassembly/ [Contributing Guidelines]: https://webassembly.org/community/contributing/ diff --git a/design/mvp/BuildTargets.md b/design/mvp/BuildTargets.md new file mode 100644 index 00000000..6b4e6d27 --- /dev/null +++ b/design/mvp/BuildTargets.md @@ -0,0 +1,452 @@ +# Core WebAssembly Build Targets Explainer + +For any given WIT [`world`], the Component Model defines multiple **Core +WebAssembly build targets** that all logically represent the same world but +provide Core WebAssembly producer toolchains different low-level representation +choices. + +* [Motivation](#motivation) +* [Build Targets](#build-targets) +* [Target World](#target-world) +* [Imports and Exports](#imports-and-exports) + * [WIT-derived Function Imports](#wit-derived-function-imports) + * [WIT-derived Function Exports](#wit-derived-function-exports) + * [Memory Exports](#memory-exports) + * [Initialization Export](#initialization-export) +* [Support Definitions](#supporting-definitions) + * [Interface Name Canonicalization](#interface-name-canonicalization) + * [ABI Options](#abi-options) + * [Current Component Instance and Task](#current-component-instance-and-task) +* [Example](#example) +* [Relation to Compiler Flags](#relation-to-compiler-flags) + + +## Motivation + +While the Component Model's [binary format] provides more [linking] +functionality and optimization choices than the Core WebAssembly build targets +listed below, there are several reasons for having the Component Model +additionally define build targets that use the existing standard [Core +WebAssembly Binary Format]: +* It allows *interface authors* (e.g., in [WASI]) to write their interface + just once (in WIT) to target both core and component runtimes. +* It allows existing *Core WebAssembly producer toolchains* to more easily + and incrementally target the Component Model. +* It allows existing *Core WebAssembly runtimes* to implement WIT-defined + interfaces without having to implement the full Component Model, providing an + incremental implementation step towards the full Component Model. + +Furthermore, any module matching a Core WebAssembly build target can be +trivially wrapped (e.g., by [`wasm-tools component new`]) to become a +semantically-equivalent component and thus these modules can be considered +**simple components**. + + +## Build Targets + +Currently, there is only one build target defined: +* `wasm32`: uses one 32-bit linear memory + +Other build targets can be added as needed in the future. In particular, the +following additional build targets are anticipated: +* `wasm64`: uses one 64-bit linear memory (based on [memory64]). +* `wasmgc`: uses managed memory (based on [wasm-gc]). + +When the [async] and [shared-everything-threads] proposals stabilize, they +could either be added backwards-compatibly to existing build targets or added +as separate build targets. + + +## Target World + +The rest of this document assumes a single, fixed "target world". This target +world determines a fixed list of import and export names, each with associated +component-level types. For example, if a runtime wants to support "all of WASI +Preview 2", the target world (currently) would be: +```wit +world all-of-WASI { + include wasi:http/proxy@0.2.0; + include wasi:cli/command@0.2.0; +} +``` +However, a runtime can also choose to support just `wasi:http/proxy` or +`wasi:cli/command` or a subset of one of these worlds: this is a choice every +producer and consumer gets to make independently. WASI and the Component Model +only establish a fixed set of names that *MAY* appear in imports and exports +and, when present, what the agreed-upon semantics *MUST* be. + +Additionally, we assume that the target world has been fully resolved into a +pure [`componenttype`] in the same way as when creating a [WIT package] which +means that `include`s have been inlined and `use`d types have been replaced by +direct aliases to the resolved type. + + +## Imports and Exports + +Every build target defines the following set of imports: + 1. [WIT-derived function imports](#wit-derived-imports) + +and the union of the following sets of exports: + 1. [WIT-derived function exports](#wit-derived-exports) + 2. [Memory exports](#memory-exports) + 3. [Initialization export](#initialization-export) + +Every Core WebAssembly import and export name defined by the build target +starts with a `prefix` string that incorporates the build target: +* For `wasm32` this `prefix` string is `cm32p2`. + +The leading `cm` of the `prefix` indicates that this import or export is using +the Component Model's Canonical ABI. The trailing `p2` of the `prefix` +indicates the version of the Canonical ABI assumed by the compiled module, +allowing the Canonical ABI to change as part of future Component Model Preview +or RC releases without ambiguity. Thus, `p2` is distinct from the version of +any particular WASI or other WIT interface and is instead more analogous to the +`version` field of the Component Model [binary format]. + +A Core WebAssembly module *MAY* include imports and exports other than those +defined by the build target for the target world. However, if an import or +export starts with the `prefix`, it *MUST* be included in the [target world]'s +set of imports and exports defined by the build target and rejected by the +runtime otherwise. + +The runtime behavior of the WIT-derived imports and exports is entirely defined +by the [Canonical ABI], as explained in detail below. The only additional +global runtime behavioral rule that does not strictly follow from the Canonical +ABI is: + * Modules *MUST NOT* call any imports during the Core WebAssembly [`start`] + function that needs memory (as defined by whether [`flatten_functype`] + sets `needs.memory`). Hosts *MUST* trap eagerly (at the start of the import + call) in this case. + +This rule allows modules to be run in a wide variety of runtimes (such as +browsers) which do not expose memory until after the `start` function returns. +This matches the general Core WebAssembly toolchain convention that `start` +functions should only be used for module-internal initialization. +General-purpose initialization code that may call imports should instead run +during [initialization](#initialization-export). + +Other runtime behaviors that are implied by the Canonical ABI but are worth +stating explicitly here are: + * The host may not reenter guest wasm code on the same callstack (i.e., once + a wasm module calls a host import, the host may not recursively call back + into the calling wasm module instance). + * Once a module instance traps, the host *MUST NOT* execute any code with + that module instance in the future. + * Any WIT-derived export *MAY* be called repeatedly and in any + order by the host. Producer toolchains *MUST* handle this case without + trapping or triggering Undefined Behavior (but *MAY* eagerly return an error + value according to the declared return type). + +The following subsections specify the sets of imports and exports enumerated +above: + +### WIT-derived Function Imports + +The Core WebAssembly function *imports* derived from the [target world] are +defined as follows (with [`prefix`](#imports-and-exports) as defined above and +the [ABI Options] and [current component instance and task] as defined below): + +* For each import of a WIT interface `i` with [canonicalized interface name] `cin`: + * For each function in `i` with name `fn` and type `ft`, the build target includes: + * `(import "|" "" )`, where: + * `flat-type` is [`flatten_functype`]`(ft, 'lower')`, + * the runtime behavior is defined by [`canon_lower`]. + * For each *original* resource type in `i` with name `rn`, the build target includes: + * `(import "|" "_drop" (func (param i32)))`, where: + * the runtime behavior is defined by [`canon_resource_drop`]. +* For each import of a function with name `fn` and type `ft`, the build target includes: + * `(import "" "" )`, where: + * `flat-type` and the runtime behavior are defined the same as in the + interface case above. +* For each export of a WIT interface `i` with [canonicalized interface name] `cin`: + * For each *original* resource type in `i` with name `rn`, the build target includes: + * `(import "|_ex_" "_drop" (func (param i32)))`, + * `(import "|_ex_" "_new" (func (param i32) (result i32)))`, and + * `(import "|_ex_" "_rep" (func (param i32) (result i32)))`, where: + * the runtime behavior is defined by [`canon_resource_drop`], + [`canon_resource_new`] and [`canon_resource_rep`], resp. + +Above, the word "original" in "*original* resource type" means a resource type +that isn't defined to be equal to another resource type (using `type foo = bar` +in WIT). + +### WIT-derived Function Exports + +The Core WebAssembly function *exports* derived from the [target world] are +defined as follows (with [`prefix`](#imports-and-exports) as defined above and +the [ABI Options] and [current component instance and task] as defined below): + +* For each export of a WIT interface `i` with [canonicalized interface name] `cin`: + * For each function in `i` with name `fn` and type `ft`, the build target includes: + * `(export "||" )` and + * `(export "||_post" (func (params )))`, where: + * `flat-type` is [`flatten_functype`]`(ft, 'lift')`, + * `flat-params` is `flat-type.results`, and + * the runtime behavior is defined by [`canon_lift`] with `None` as the + `caller`, a no-op `on_block` callback, an `on_start` callback that + provides the host's arguments to the callee and an `on_return` callback + that returns the callee's results back to the host. + * For each *original* resource type in `i` with name `rn`, the build target includes: + * `(export "||_dtor" (func (param i32)))`, which is: + * called by the host when an owned handle returned by a previous export + call is dropped by the host, + * passed the same `i32` value that was passed by the guest to `_new` + for the resource that is now being destroyed. +* For each export of a function with name `fn` and type `ft`, the build target includes: + * `(export "||" )` and + * `(export "||_post" (func (params )))`, where: + * `flat-type`, `flat-params` and the runtime behavior are defined the same + as in the interface case above. + +These exports are not *required* to exist in a module (if they aren't present, +they just won't be called), but if an export *is* present with the given name, +it *MUST* have the given type. If there is a `_post` function export, +though, there *MUST* also be a corresponding exported ``. This `_post` +function *MUST* only be called by the host immediately following a call to +`` as defined by `canon_lift`. + +### Memory Exports + +If [`flatten_functype`] sets `needs.memory` for any WIT-derived function import +or export *used by the module*, the following export *MUST* be present: + +* `(export "_memory" (memory 0))` + +This exported linear memory is used as the `memory` field of [`canonopt`] in +the Canonical ABI. + +If [`flatten_functype`] sets `needs.realloc` for any WIT-derived function +import or export *used by the module*, the following export *MUST* be present: + +* `(export "_realloc" (func (param i32 i32 i32 i32) (result i32)))` + +This exported allocation function is used as the `realloc` field of +[`canonopt`] in the Canonical ABI. + +### Initialization Export + +*Every* build target includes the following optional Core WebAssembly function +export: + +* `(export "_initialize" (func))` + +A producer toolchain can rely on this initialization function being called some +time before any other export call. + +## Supporting Definitions + +The following supporting definitions are referenced above as part of defining +the WIT-derived imports and exports: + +### Interface Name Canonicalization + +Given an [`interfacename`] `in`, the **canonicalization** of `in` is given by: +* If `in` has no trailing `@`, the canonicalization is just `in`. +* Otherwise, the canonicalization is `@` where: + * `in` is split into `@`, + * `version` is split into `..` followed by the optional + `-` and `+` fields, as defined by [SemVer 2.0], and + * `canonicalized-version` is: + * if the optional `prerelease` field is present: + * `..-` + * otherwise, if `major` and `minor` are `0`: + * `0.0.` + * otherwise, if `major` is `0`: + * `0.` + * otherwise: + * ``. + +For example: + +| Interface name | Canonicalized interface name | +| --------------------------- | ---------------------------- | +| `a:b/c` | `a:b/c` | +| `a:b/c@1.2.3+alpha` | `a:b/c@1` | +| `a:b/c@0.1.2+alpha` | `a:b/c@0.1` | +| `a:b/c@0.0.1+alpha` | `a:b/c@0.0.1` | +| `a:b/c@1.2.3-nightly+alpha` | `a:b/c@1.2.3-nightly` | + +The reason for this canonicalization is to avoid requiring every runtime to +implement semver-aware matching wherein all imports of names in the left column +match if they are the same in the right column. Instead, producer toolchains +perform canonicalization at build time so that Core WebAssembly runtimes can +continue to use a simple table of imports matched by string equality. + +### ABI Options + +The Canonical ABI is parameterized by a small set of ABI options +([`canonopt`]) which are set as follows: + +The `memory` and `realloc` options are set by the Memory Exports defined +[above](#memory-exports). + +The `post-return` option for a WIT function named `fn` is set to be the +exported `_post` function defined [above](#wit-derived-function-exports) +if present (otherwise `None`). + +Additionally: +* The `string-encoding` is fixed to `utf8`. +* The (unstable Preview 3) `async` field is unset. + +When `gc` and `memory64` fields are added to `canonopt`, they would be +mentioned here and configured by the build target. + +### Current Component Instance and Task + +The Canonical ABI maintains per-component-instance spec-level state that +affects the lifting and lowering of parameters and results in imports and +exports. As described above, Core WebAssembly build targets treat each Core +WebAssembly module as a simple component, and thus there is always a **current +component instance** created for each Core WebAssembly module instance that is +passed as an argument to each Canonical ABI import. + +Canonical ABI imports also take a **current task** which contains per-call +spec-level state used to dynamically enforce the rules for reentrance, +`borrow`, and, in a Preview 3 timeframe, async calls). Until Preview 3 async is +enabled for a build target, there is only ever *at most one* task per instance +(corresponding to an active synchronous host-to-wasm call, noting that |host → +wasm → host → wasm| reentrance is disallowed) and thus the current component +instance mentioned above also implies the current task. + + +## Example + +Given the following world: +```wit +package ns:pkg@0.2.1; + +interface i { + resource r { + constructor(s: string); + m: func() -> string; + } + frob: func(in: r) -> r; +} + +world w { + import f: func() -> string; + import i; + import j: interface { + resource r { + constructor(s: string); + m: func() -> string; + } + frob: func(in: r) -> r; + } + export g: func() -> string; + export i; + export j: interface { + resource r { + constructor(s: string); + m: func() -> string; + } + frob: func(in: r) -> r; + } +} +``` +the `wasm32` build target includes the following imports and exports (noting +that any particular module can import and export a subset of these, subject to +the requirements mentioned above): +```wat +(module + (import "cm32p2" "f" (func (param i32))) + (import "cm32p2|ns:pkg/i@0.2" "[constructor]r" (func (param i32 i32) (result i32))) + (import "cm32p2|ns:pkg/i@0.2" "[method]r.m" (func (param i32 i32))) + (import "cm32p2|ns:pkg/i@0.2" "frob" (func (result i32) (result i32))) + (import "cm32p2|ns:pkg/i@0.2" "r_drop" (func (param i32))) + (import "cm32p2|j" "[constructor]r" (func (param i32 i32) (result i32))) + (import "cm32p2|j" "[method]r.m" (func (param i32 i32))) + (import "cm32p2|j" "frob" (func (result i32) (result i32))) + (import "cm32p2|j" "r_drop" (func (param i32))) + (import "cm32p2|_ex_ns:pkg/i@0.2" "r_drop" (func (param i32))) + (import "cm32p2|_ex_ns:pkg/i@0.2" "r_new" (func (param i32) (result i32))) + (import "cm32p2|_ex_ns:pkg/i@0.2" "r_rep" (func (param i32) (result i32))) + (import "cm32p2|_ex_j" "r_drop" (func (param i32))) + (import "cm32p2|_ex_j" "r_new" (func (param i32) (result i32))) + (import "cm32p2|_ex_j" "r_rep" (func (param i32) (result i32))) + (export "cm32p2||g" (func (result i32))) + (export "cm32p2||g_post" (func (param i32))) + (export "cm32p2|ns:pkg/i@0.2|[constructor]r" (func (param i32 i32) (result i32))) + (export "cm32p2|ns:pkg/i@0.2|[method]r.m" (func (param i32) (result i32))) + (export "cm32p2|ns:pkg/i@0.2|frob" (func (result i32) (result i32))) + (export "cm32p2|ns:pkg/i@0.2|r_dtor" (func (param i32))) + (export "cm32p2|j|[constructor]r" (func (param i32 i32) (result i32))) + (export "cm32p2|j|[method]r.m" (func (param i32) (result i32))) + (export "cm32p2|j|frob" (func (param i32) (result i32))) + (export "cm32p2|j|r_dtor" (func (param i32) (result i32))) + (export "cm32p2_memory" (memory 0)) + (export "cm32p2_realloc" (func (param i32 i32 i32 i32) (result i32))) + (export "cm32p2_initialize" (func)) +) +``` +As defined by the Component Model, but worth calling out explicitly: this world +contains 4 distinct resource types with 4 distinct resource tables that have +overlapping index spaces, even though all 4 resources are syntactically named +`r` in the WIT: +1. The `r` in the imported `ns:pkg/i` interface, used by the imported + `ns:pkg/i@0.2` functions. +2. The `r` in the imported anonymous `j` interface, used by the imported `j` + functions. +3. The `r` in the exported `ns:pkg/i` interface, used by the exported + `ns:pkg/i@0.2` functions *and* the imported `_ex_ns:pkg/i@0.2` functions. +4. The `r` in the exported anonymous `j` interface, used by the exported `j` + functions *and* the imported `_ex_j` functions. + +Each resource type has a unique `*_drop` function import, so the number of +`*_drop` functions is the number of resource tables. + + +## Relation to Compiler Flags + +One option for producer toolchains is to always emit a Core WebAssembly build +target and then optionally wrap the result into a component binary as a final +build step (which aligns well with the overall [linking] toolchain pipeline). +In this case, the toolchain unconditionally takes the Core WebAssembly build +target as an argument and then takes an independent flag specifying whether to +emit a Core WebAssembly module or a component. + +For example: +* For `wasi-libc`-based toolchains like `wasi-sdk` or `rustc`: + * The `--target` is `wasm32-wasip2`, combining the `wasm32` build target + defined in this document with the additional information that the language + runtime can import [WASI Preview 2]-defined interfaces. + * The default output is a component, but `-Wl,--emit-module` can be passed to + instruct the linker to only emit a module. +* For Go: + * The `GOARCH` is `wasm32` and the `GOOS` is `wasip2` + * The `-buildmode` would select whether to emit a module or component + + +[Target World]: #target-world +[Canonicalized Interface Name]: #interface-name-canonicalization +[ABI Options]: #abi-options +[Current Component Instance and Task]: #current-component-instance-and-task + +[Async]: Async.md +[Binary Format]: Binary.md +[Canonical ABI]: CanonicalABI.md +[`flatten_functype`]: CanonicalABI.md#flattening +[`canon_lift`]: CanonicalABI.md#canon-lift +[`canon_lower`]: CanonicalABI.md#canon-lower +[`canon_resource_drop`]: CanonicalABI.md#canon-resourcedrop +[`canon_resource_new`]: CanonicalABI.md#canon-resourcenew +[`canon_resource_rep`]: CanonicalABI.md#canon-resourcerep +[`componenttype`]: Explainer.md#type-definitions +[`canonopt`]: Explainer.md#canonical-abi +[`interfacename`]: Explainer.md#import-and-export-definitions +[Linking]: Linking.md +[`world`]: WIT.md#wit-worlds +[WIT Package]: WIT.md#package-format + +[Core WebAssembly Binary Format]: https://webassembly.github.io/spec/core/binary/index.html +[`start`]: https://webassembly.github.io/spec/core/syntax/modules.html#start-function + +[memory64]: https://github.com/webAssembly/memory64 +[wasm-gc]: https://github.com/WebAssembly/gc +[shared-everything-threads]: https://github.com/webAssembly/shared-everything-threads +[WASI]: https://github.com/webAssembly/wasi +[WASI Preview 2]: https://github.com/WebAssembly/WASI/blob/main/preview2/README.md + +[`wasm-tools component new`]: https://github.com/bytecodealliance/wasm-tools#tools-included + +[SemVer 2.0]: https://semver.org/spec/v2.0.0.html diff --git a/design/mvp/CanonicalABI.md b/design/mvp/CanonicalABI.md index 5109865c..d0e0a24b 100644 --- a/design/mvp/CanonicalABI.md +++ b/design/mvp/CanonicalABI.md @@ -1535,13 +1535,26 @@ Given all this, the top-level definition of `flatten_functype` is: MAX_FLAT_PARAMS = 16 MAX_FLAT_RESULTS = 1 -def flatten_functype(opts, ft, context): - flat_params = flatten_types(ft.param_types()) - flat_results = flatten_types(ft.result_types()) +class Needs: + memory: bool = False + realloc: bool = False + +def reverse_context(context): + match context: + case 'lift' : return 'lower' + case 'lower' : return 'lift' + +def flatten_functype(opts, ft, context, needs): + flat_params = flatten_types(ft.param_types(), reverse_context(context), needs) + flat_results = flatten_types(ft.result_types(), context, needs) if opts.sync: if len(flat_params) > MAX_FLAT_PARAMS: + needs.memory = True + if context == 'lift': + needs.realloc = True flat_params = ['i32'] if len(flat_results) > MAX_FLAT_RESULTS: + needs.memory = True match context: case 'lift': flat_results = ['i32'] @@ -1556,23 +1569,29 @@ def flatten_functype(opts, ft, context): flat_results = [] case 'lower': if len(flat_params) > 1: + needs.memory = True flat_params = ['i32'] if len(flat_results) > 0: + needs.memory = True flat_params += ['i32'] flat_results = ['i32'] return CoreFuncType(flat_params, flat_results) - -def flatten_types(ts): - return [ft for t in ts for ft in flatten_type(t)] ``` +The `Needs` object tracks whether a Canonical ABI call requires the +`memory` or `realloc` `canonopt`s to be set, as required by Component +Model validation. + As shown here, the core signatures `async` functions use a lower limit on the maximum number of parameters (1) and results (0) passed as scalars before falling back to passing through memory. -Presenting the definition of `flatten_type` piecewise, we start with the +Presenting the definition of `flatten_type(s)` piecewise, we start with the top-level case analysis: ```python -def flatten_type(t): +def flatten_types(ts, context, needs): + return [ft for t in ts for ft in flatten_type(t, context, needs)] + +def flatten_type(t, context, needs): match despecialize(t): case Bool() : return ['i32'] case U8() | U16() | U32() : return ['i32'] @@ -1581,19 +1600,29 @@ def flatten_type(t): case F32() : return ['f32'] case F64() : return ['f64'] case Char() : return ['i32'] - case String() | List(_) : return ['i32', 'i32'] - case Record(fields) : return flatten_record(fields) - case Variant(cases) : return flatten_variant(cases) + case Record(fields) : return flatten_record(fields, context, needs) + case Variant(cases) : return flatten_variant(cases, context, needs) case Flags(labels) : return ['i32'] * num_i32_flags(labels) case Own(_) | Borrow(_) : return ['i32'] -``` + case String() | List(_): + needs.memory = True + if context == 'lower': + needs.realloc = True + return ['i32', 'i32'] +``` +Note that `context` refers to whether the particular *value* is being lifted or +lowered, not whether this is part of a lifted or lowered call to a function. In +particular, `flatten_functype` above reverses the direction of parameters since +a lifted function call lowers its parameters. Thus, `needs.realloc` is only set +for the string/list parameters of lifted exports and results of lowered +imports. Record flattening simply flattens each field in sequence. ```python -def flatten_record(fields): +def flatten_record(fields, context, needs): flat = [] for f in fields: - flat += flatten_type(f.t) + flat += flatten_type(f.t, context, needs) return flat ``` @@ -1606,16 +1635,16 @@ case, all flattened variants are passed with the same static set of core types, which may involve, e.g., reinterpreting an `f32` as an `i32` or zero-extending an `i32` into an `i64`. ```python -def flatten_variant(cases): +def flatten_variant(cases, context, needs): flat = [] for c in cases: if c.t is not None: - for i,ft in enumerate(flatten_type(c.t)): + for i,ft in enumerate(flatten_type(c.t, context, needs)): if i < len(flat): flat[i] = join(flat[i], ft) else: flat.append(ft) - return flatten_type(discriminant_type(cases)) + flat + return flatten_type(discriminant_type(cases), context, needs) + flat def join(a, b): if a == b: return a @@ -1727,7 +1756,7 @@ reinterprets between the different types appropriately and also traps if the high bits of an `i64` are set for a 32-bit type: ```python def lift_flat_variant(cx, vi, cases): - flat_types = flatten_variant(cases) + flat_types = flatten_variant(cases, 'lift', Needs()) assert(flat_types.pop(0) == 'i32') case_index = vi.next('i32') trap_if(case_index >= len(cases)) @@ -1837,14 +1866,14 @@ manually coercing the otherwise-incompatible type pairings allowed by `join`: ```python def lower_flat_variant(cx, v, cases): case_index, case_value = match_case(v, cases) - flat_types = flatten_variant(cases) + flat_types = flatten_variant(cases, 'lower', Needs()) assert(flat_types.pop(0) == 'i32') c = cases[case_index] if c.t is None: payload = [] else: payload = lower_flat(cx, case_value, c.t) - for i,(fv,have) in enumerate(zip(payload, flatten_type(c.t))): + for i,(fv,have) in enumerate(zip(payload, flatten_type(c.t, 'lower', Needs()))): want = flat_types.pop(0) match (have, want): case ('f32', 'i32') : payload[i] = encode_float_as_i32(fv) @@ -1876,7 +1905,7 @@ parameters or results (given by the `CoreValueIter` `vi`) into a tuple of component-level values with types `ts`. ```python def lift_flat_values(cx, max_flat, vi, ts): - flat_types = flatten_types(ts) + flat_types = flatten_types(ts, 'lift', Needs()) if len(flat_types) > max_flat: return lift_heap_values(cx, vi, ts) else: @@ -1900,7 +1929,7 @@ out-param: def lower_flat_values(cx, max_flat, vs, ts, out_param = None): assert(cx.inst.may_leave) cx.inst.may_leave = False - flat_types = flatten_types(ts) + flat_types = flatten_types(ts, 'lower', Needs()) if len(flat_types) > max_flat: flat_vals = lower_heap_values(cx, vs, ts, out_param) else: @@ -2297,7 +2326,7 @@ caller and lowers them into the current instance: async def canon_task_start(task, core_ft, flat_args): assert(len(core_ft.params) == len(flat_args)) trap_if(task.opts.sync) - trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType([], task.ft.params), 'lower')) + trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType([], task.ft.params), 'lower', Needs())) task.start() args = task.on_start() flat_results = lower_flat_values(task, MAX_FLAT_RESULTS, args, task.ft.param_types(), CoreValueIter(flat_args)) @@ -2327,7 +2356,7 @@ current instance and passes them to the caller: async def canon_task_return(task, core_ft, flat_args): assert(len(core_ft.params) == len(flat_args)) trap_if(task.opts.sync) - trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType(task.ft.results, []), 'lower')) + trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType(task.ft.results, []), 'lower', Needs())) task.return_() results = lift_flat_values(task, MAX_FLAT_PARAMS, CoreValueIter(flat_args), task.ft.result_types()) task.on_return(results) diff --git a/design/mvp/canonical-abi/definitions.py b/design/mvp/canonical-abi/definitions.py index 1911db67..f4f3ea2c 100644 --- a/design/mvp/canonical-abi/definitions.py +++ b/design/mvp/canonical-abi/definitions.py @@ -1058,13 +1058,26 @@ def lower_borrow(cx, rep, t): MAX_FLAT_PARAMS = 16 MAX_FLAT_RESULTS = 1 -def flatten_functype(opts, ft, context): - flat_params = flatten_types(ft.param_types()) - flat_results = flatten_types(ft.result_types()) +class Needs: + memory: bool = False + realloc: bool = False + +def reverse_context(context): + match context: + case 'lift' : return 'lower' + case 'lower' : return 'lift' + +def flatten_functype(opts, ft, context, needs): + flat_params = flatten_types(ft.param_types(), reverse_context(context), needs) + flat_results = flatten_types(ft.result_types(), context, needs) if opts.sync: if len(flat_params) > MAX_FLAT_PARAMS: + needs.memory = True + if context == 'lift': + needs.realloc = True flat_params = ['i32'] if len(flat_results) > MAX_FLAT_RESULTS: + needs.memory = True match context: case 'lift': flat_results = ['i32'] @@ -1079,16 +1092,18 @@ def flatten_functype(opts, ft, context): flat_results = [] case 'lower': if len(flat_params) > 1: + needs.memory = True flat_params = ['i32'] if len(flat_results) > 0: + needs.memory = True flat_params += ['i32'] flat_results = ['i32'] return CoreFuncType(flat_params, flat_results) -def flatten_types(ts): - return [ft for t in ts for ft in flatten_type(t)] +def flatten_types(ts, context, needs): + return [ft for t in ts for ft in flatten_type(t, context, needs)] -def flatten_type(t): +def flatten_type(t, context, needs): match despecialize(t): case Bool() : return ['i32'] case U8() | U16() | U32() : return ['i32'] @@ -1097,28 +1112,32 @@ def flatten_type(t): case F32() : return ['f32'] case F64() : return ['f64'] case Char() : return ['i32'] - case String() | List(_) : return ['i32', 'i32'] - case Record(fields) : return flatten_record(fields) - case Variant(cases) : return flatten_variant(cases) + case Record(fields) : return flatten_record(fields, context, needs) + case Variant(cases) : return flatten_variant(cases, context, needs) case Flags(labels) : return ['i32'] * num_i32_flags(labels) case Own(_) | Borrow(_) : return ['i32'] + case String() | List(_): + needs.memory = True + if context == 'lower': + needs.realloc = True + return ['i32', 'i32'] -def flatten_record(fields): +def flatten_record(fields, context, needs): flat = [] for f in fields: - flat += flatten_type(f.t) + flat += flatten_type(f.t, context, needs) return flat -def flatten_variant(cases): +def flatten_variant(cases, context, needs): flat = [] for c in cases: if c.t is not None: - for i,ft in enumerate(flatten_type(c.t)): + for i,ft in enumerate(flatten_type(c.t, context, needs)): if i < len(flat): flat[i] = join(flat[i], ft) else: flat.append(ft) - return flatten_type(discriminant_type(cases)) + flat + return flatten_type(discriminant_type(cases), context, needs) + flat def join(a, b): if a == b: return a @@ -1194,7 +1213,7 @@ def lift_flat_record(cx, vi, fields): return record def lift_flat_variant(cx, vi, cases): - flat_types = flatten_variant(cases) + flat_types = flatten_variant(cases, 'lift', Needs()) assert(flat_types.pop(0) == 'i32') case_index = vi.next('i32') trap_if(case_index >= len(cases)) @@ -1274,14 +1293,14 @@ def lower_flat_record(cx, v, fields): def lower_flat_variant(cx, v, cases): case_index, case_value = match_case(v, cases) - flat_types = flatten_variant(cases) + flat_types = flatten_variant(cases, 'lower', Needs()) assert(flat_types.pop(0) == 'i32') c = cases[case_index] if c.t is None: payload = [] else: payload = lower_flat(cx, case_value, c.t) - for i,(fv,have) in enumerate(zip(payload, flatten_type(c.t))): + for i,(fv,have) in enumerate(zip(payload, flatten_type(c.t, 'lower', Needs()))): want = flat_types.pop(0) match (have, want): case ('f32', 'i32') : payload[i] = encode_float_as_i32(fv) @@ -1305,7 +1324,7 @@ def lower_flat_flags(v, labels): ### Lifting and Lowering Values def lift_flat_values(cx, max_flat, vi, ts): - flat_types = flatten_types(ts) + flat_types = flatten_types(ts, 'lift', Needs()) if len(flat_types) > max_flat: return lift_heap_values(cx, vi, ts) else: @@ -1321,7 +1340,7 @@ def lift_heap_values(cx, vi, ts): def lower_flat_values(cx, max_flat, vs, ts, out_param = None): assert(cx.inst.may_leave) cx.inst.may_leave = False - flat_types = flatten_types(ts) + flat_types = flatten_types(ts, 'lower', Needs()) if len(flat_types) > max_flat: flat_vals = lower_heap_values(cx, vs, ts, out_param) else: @@ -1490,7 +1509,7 @@ async def canon_task_backpressure(task, flat_args): async def canon_task_start(task, core_ft, flat_args): assert(len(core_ft.params) == len(flat_args)) trap_if(task.opts.sync) - trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType([], task.ft.params), 'lower')) + trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType([], task.ft.params), 'lower', Needs())) task.start() args = task.on_start() flat_results = lower_flat_values(task, MAX_FLAT_RESULTS, args, task.ft.param_types(), CoreValueIter(flat_args)) @@ -1502,7 +1521,7 @@ async def canon_task_start(task, core_ft, flat_args): async def canon_task_return(task, core_ft, flat_args): assert(len(core_ft.params) == len(flat_args)) trap_if(task.opts.sync) - trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType(task.ft.results, []), 'lower')) + trap_if(core_ft != flatten_functype(CanonicalOptions(), FuncType(task.ft.results, []), 'lower', Needs())) task.return_() results = lift_flat_values(task, MAX_FLAT_PARAMS, CoreValueIter(flat_args), task.ft.result_types()) task.on_return(results) diff --git a/design/mvp/canonical-abi/run_tests.py b/design/mvp/canonical-abi/run_tests.py index 3d4de578..7179daeb 100644 --- a/design/mvp/canonical-abi/run_tests.py +++ b/design/mvp/canonical-abi/run_tests.py @@ -319,13 +319,13 @@ def test_flatten(t, params, results): if len(results) > definitions.MAX_FLAT_RESULTS: expect.results = ['i32'] - got = flatten_functype(CanonicalOptions(), t, 'lift') + got = flatten_functype(CanonicalOptions(), t, 'lift', Needs()) assert(got == expect) if len(results) > definitions.MAX_FLAT_RESULTS: expect.params += ['i32'] expect.results = [] - got = flatten_functype(CanonicalOptions(), t, 'lower') + got = flatten_functype(CanonicalOptions(), t, 'lower', Needs()) assert(got == expect) test_flatten(FuncType([U8(),F32(),F64()],[]), ['i32','f32','f64'], []) @@ -355,7 +355,7 @@ async def callee(task, x): caller_inst = ComponentInstance() caller_task = Task(caller_opts, caller_inst, None, lambda:()) - return_in_heap = len(flatten_types([t])) > definitions.MAX_FLAT_RESULTS + return_in_heap = len(flatten_types([t], 'lift', Needs())) > definitions.MAX_FLAT_RESULTS asyncio.run(caller_task.enter())