mirror of
https://github.com/fluencelabs/wasm-bindgen
synced 2025-06-23 17:51:33 +00:00
Rewrite wasm-bindgen with updated interface types proposal (#1882)
This commit is a pretty large scale rewrite of the internals of wasm-bindgen. No user-facing changes are expected as a result of this PR, but due to the scale of changes here it's likely inevitable that at least something will break. I'm hoping to get more testing in though before landing! The purpose of this PR is to update wasm-bindgen to the current state of the interface types proposal. The wasm-bindgen tool was last updated when it was still called "WebIDL bindings" so it's been awhile! All support is now based on https://github.com/bytecodealliance/wasm-interface-types which defines parsers/binary format/writers/etc for wasm-interface types. This is a pretty massive PR and unfortunately can't really be split up any more afaik. I don't really expect realistic review of all the code here (or commits), but some high-level changes are: * Interface types now consists of a set of "adapter functions". The IR in wasm-bindgen is modeled the same way not. * Each adapter function has a list of instructions, and these instructions work at a higher level than wasm itself, for example with strings. * The wasm-bindgen tool has a suite of instructions which are specific to it and not present in the standard. (like before with webidl bindings) * The anyref/multi-value transformations are now greatly simplified. They're simply "optimization passes" over adapter functions, removing instructions that are otherwise present. This way we don't have to juggle so much all over the place, and instructions always have the same meaning.
This commit is contained in:
360
crates/cli-support/src/wit/nonstandard.rs
Normal file
360
crates/cli-support/src/wit/nonstandard.rs
Normal file
@ -0,0 +1,360 @@
|
||||
use crate::intrinsic::Intrinsic;
|
||||
use crate::wit::AdapterId;
|
||||
use std::borrow::Cow;
|
||||
use std::collections::{HashMap, HashSet};
|
||||
use std::path::PathBuf;
|
||||
use walrus::TypedCustomSectionId;
|
||||
|
||||
/// A synthetic custom section which is not standardized, never will be, and
|
||||
/// cannot be serialized or parsed. This is synthesized from all of the
|
||||
/// compiler-emitted wasm-bindgen sections and then immediately removed to be
|
||||
/// processed in the JS generation pass.
|
||||
#[derive(Default, Debug)]
|
||||
pub struct WasmBindgenAux {
|
||||
/// Extra typescript annotations that should be appended to the generated
|
||||
/// TypeScript file. This is provided via a custom attribute in Rust code.
|
||||
pub extra_typescript: String,
|
||||
|
||||
/// A map from identifier to the contents of each local module defined via
|
||||
/// the `#[wasm_bindgen(module = "/foo.js")]` import options.
|
||||
pub local_modules: HashMap<String, String>,
|
||||
|
||||
/// A map from unique crate identifier to the list of inline JS snippets for
|
||||
/// that crate identifier.
|
||||
pub snippets: HashMap<String, Vec<String>>,
|
||||
|
||||
/// A list of all `package.json` files that are intended to be included in
|
||||
/// the final build.
|
||||
pub package_jsons: HashSet<PathBuf>,
|
||||
|
||||
/// A map from exported function id to where it's expected to be exported
|
||||
/// to.
|
||||
pub export_map: HashMap<AdapterId, AuxExport>,
|
||||
|
||||
/// A map from imported function id to what it's expected to import.
|
||||
pub import_map: HashMap<AdapterId, AuxImport>,
|
||||
|
||||
/// Small bits of metadata about imports.
|
||||
pub imports_with_catch: HashSet<AdapterId>,
|
||||
pub imports_with_variadic: HashSet<AdapterId>,
|
||||
pub imports_with_assert_no_shim: HashSet<AdapterId>,
|
||||
|
||||
/// Auxiliary information to go into JS/TypeScript bindings describing the
|
||||
/// exported enums from Rust.
|
||||
pub enums: Vec<AuxEnum>,
|
||||
|
||||
/// Auxiliary information to go into JS/TypeScript bindings describing the
|
||||
/// exported structs from Rust and their fields they've got exported.
|
||||
pub structs: Vec<AuxStruct>,
|
||||
|
||||
/// Information about various internal functions used to manage the `anyref`
|
||||
/// table, later used to process JS bindings.
|
||||
pub anyref_table: Option<walrus::TableId>,
|
||||
pub anyref_alloc: Option<walrus::FunctionId>,
|
||||
pub anyref_drop_slice: Option<walrus::FunctionId>,
|
||||
}
|
||||
|
||||
pub type WasmBindgenAuxId = TypedCustomSectionId<WasmBindgenAux>;
|
||||
|
||||
#[derive(Debug)]
|
||||
pub struct AuxExport {
|
||||
/// When generating errors about this export, a helpful name to remember it
|
||||
/// by.
|
||||
pub debug_name: String,
|
||||
/// Comments parsed in Rust and forwarded here to show up in JS bindings.
|
||||
pub comments: String,
|
||||
/// Argument names in Rust forwarded here to configure the names that show
|
||||
/// up in TypeScript bindings.
|
||||
pub arg_names: Option<Vec<String>>,
|
||||
/// What kind of function this is and where it shows up
|
||||
pub kind: AuxExportKind,
|
||||
}
|
||||
|
||||
/// All possible kinds of exports from a wasm module.
|
||||
///
|
||||
/// This `enum` says where to place an exported wasm function. For example it
|
||||
/// may want to get hooked up to a JS class, or it may want to be exported as a
|
||||
/// free function (etc).
|
||||
///
|
||||
/// TODO: it feels like this should not really be here per se. We probably want
|
||||
/// to either construct the JS object itself from within wasm or somehow move
|
||||
/// more of this information into some other section. Really what this is is
|
||||
/// sort of an "export map" saying how to wire up all the free functions from
|
||||
/// the wasm module into the output expected JS module. All our functions here
|
||||
/// currently take integer parameters and require a JS wrapper, but ideally
|
||||
/// we'd change them one day to taking/receiving `anyref` which then use some
|
||||
/// sort of webidl import to customize behavior or something like that. In any
|
||||
/// case this doesn't feel quite right in terms of priviledge separation, so
|
||||
/// we'll want to work on this. For now though it works.
|
||||
#[derive(Debug)]
|
||||
pub enum AuxExportKind {
|
||||
/// A free function that's just listed on the exported module
|
||||
Function(String),
|
||||
|
||||
/// A function that's used to create an instane of a class. The function
|
||||
/// actually return just an integer which is put on an JS object currently.
|
||||
Constructor(String),
|
||||
|
||||
/// This function is intended to be a getter for a field on a class. The
|
||||
/// first argument is the internal pointer and the returned value is
|
||||
/// expected to be the field.
|
||||
Getter { class: String, field: String },
|
||||
|
||||
/// This function is intended to be a setter for a field on a class. The
|
||||
/// first argument is the internal pointer and the second argument is
|
||||
/// expected to be the field's new value.
|
||||
Setter { class: String, field: String },
|
||||
|
||||
/// This is a free function (ish) but scoped inside of a class name.
|
||||
StaticFunction { class: String, name: String },
|
||||
|
||||
/// This is a member function of a class where the first parameter is the
|
||||
/// implicit integer stored in the class instance.
|
||||
Method {
|
||||
class: String,
|
||||
name: String,
|
||||
/// Whether or not this is calling a by-value method in Rust and should
|
||||
/// clear the internal pointer in JS automatically.
|
||||
consumed: bool,
|
||||
},
|
||||
}
|
||||
|
||||
#[derive(Debug)]
|
||||
pub struct AuxEnum {
|
||||
/// The name of this enum
|
||||
pub name: String,
|
||||
/// The copied Rust comments to forward to JS
|
||||
pub comments: String,
|
||||
/// A list of variants with their name and value
|
||||
pub variants: Vec<(String, u32)>,
|
||||
}
|
||||
|
||||
#[derive(Debug)]
|
||||
pub struct AuxStruct {
|
||||
/// The name of this struct
|
||||
pub name: String,
|
||||
/// The copied Rust comments to forward to JS
|
||||
pub comments: String,
|
||||
/// Whether to generate helper methods for inspecting the class
|
||||
pub is_inspectable: bool,
|
||||
}
|
||||
|
||||
/// All possible types of imports that can be imported by a wasm module.
|
||||
///
|
||||
/// This `enum` is intended to map out what an imported value is. For example
|
||||
/// this contains a ton of shims and various ways you can call a function. The
|
||||
/// base variant here is `Value` which simply means "hook this up to the import"
|
||||
/// and the signatures will match up.
|
||||
///
|
||||
/// Note that this is *not* the same as the webidl bindings section. This is
|
||||
/// intended to be coupled with that to map out what actually gets hooked up to
|
||||
/// an import in the wasm module. The two work in tandem.
|
||||
///
|
||||
/// Some of these items here are native to JS (like `Value`, indexing
|
||||
/// operations, etc). Others are shims generated by wasm-bindgen (like `Closure`
|
||||
/// or `Instanceof`).
|
||||
#[derive(Debug)]
|
||||
pub enum AuxImport {
|
||||
/// This import is expected to simply be whatever is the value that's
|
||||
/// imported
|
||||
Value(AuxValue),
|
||||
|
||||
/// A static method on a class is being imported, and the `this` of the
|
||||
/// function call is expected to always be the class.
|
||||
ValueWithThis(JsImport, String),
|
||||
|
||||
/// This import is expected to be a function that takes an `anyref` and
|
||||
/// returns a `bool`. It's expected that it tests if the argument is an
|
||||
/// instance of (using `instanceof`) the name specified.
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
Instanceof(JsImport),
|
||||
|
||||
/// This import is expected to be a shim that returns the JS value named by
|
||||
/// `JsImport`.
|
||||
Static(JsImport),
|
||||
|
||||
/// This import is intended to manufacture a JS closure with the given
|
||||
/// signature and then return that back to Rust.
|
||||
Closure {
|
||||
mutable: bool, // whether or not this was a `FnMut` closure
|
||||
dtor: u32, // table element index of the destructor function
|
||||
adapter: AdapterId, // the adapter which translates the types for this closure
|
||||
nargs: usize,
|
||||
},
|
||||
|
||||
/// This import is expected to be a shim that simply calls the `foo` method
|
||||
/// on the first object, passing along all other parameters and returning
|
||||
/// the resulting value.
|
||||
StructuralMethod(String),
|
||||
|
||||
/// This import is a "structural getter" which simply returns the `.field`
|
||||
/// value of the first argument as an object.
|
||||
///
|
||||
/// e.g. `function(x) { return x.foo; }`
|
||||
StructuralGetter(String),
|
||||
|
||||
/// This import is a "structural getter" which simply returns the `.field`
|
||||
/// value of the specified class
|
||||
///
|
||||
/// e.g. `function() { return TheClass.foo; }`
|
||||
StructuralClassGetter(JsImport, String),
|
||||
|
||||
/// This import is a "structural setter" which simply sets the `.field`
|
||||
/// value of the first argument to the second argument.
|
||||
///
|
||||
/// e.g. `function(x, y) { x.foo = y; }`
|
||||
StructuralSetter(String),
|
||||
|
||||
/// This import is a "structural setter" which simply sets the `.field`
|
||||
/// value of the specified class to the first argument of the function.
|
||||
///
|
||||
/// e.g. `function(x) { TheClass.foo = x; }`
|
||||
StructuralClassSetter(JsImport, String),
|
||||
|
||||
/// This import is expected to be a shim that is an indexing getter of the
|
||||
/// JS class here, where the first argument of the function is the field to
|
||||
/// look up. The return value is the value of the field.
|
||||
///
|
||||
/// e.g. `function(x) { return TheClass[x]; }`
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
IndexingGetterOfClass(JsImport),
|
||||
|
||||
/// This import is expected to be a shim that is an indexing getter of the
|
||||
/// first argument interpreted as an object where the field to look up is
|
||||
/// the second argument.
|
||||
///
|
||||
/// e.g. `function(x, y) { return x[y]; }`
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
IndexingGetterOfObject,
|
||||
|
||||
/// This import is expected to be a shim that is an indexing setter of the
|
||||
/// JS class here, where the first argument of the function is the field to
|
||||
/// set and the second is the value to set it to.
|
||||
///
|
||||
/// e.g. `function(x, y) { TheClass[x] = y; }`
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
IndexingSetterOfClass(JsImport),
|
||||
|
||||
/// This import is expected to be a shim that is an indexing setter of the
|
||||
/// first argument interpreted as an object where the next two fields are
|
||||
/// the field to set and the value to set it to.
|
||||
///
|
||||
/// e.g. `function(x, y, z) { x[y] = z; }`
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
IndexingSetterOfObject,
|
||||
|
||||
/// This import is expected to be a shim that is an indexing deleter of the
|
||||
/// JS class here, where the first argument of the function is the field to
|
||||
/// delete.
|
||||
///
|
||||
/// e.g. `function(x) { delete TheClass[x]; }`
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
IndexingDeleterOfClass(JsImport),
|
||||
|
||||
/// This import is expected to be a shim that is an indexing deleter of the
|
||||
/// first argument interpreted as an object where the second argument is
|
||||
/// the field to delete.
|
||||
///
|
||||
/// e.g. `function(x, y) { delete x[y]; }`
|
||||
///
|
||||
/// TODO: can we use `Reflect` or something like that to avoid an extra kind
|
||||
/// of import here?
|
||||
IndexingDeleterOfObject,
|
||||
|
||||
/// This import is a generated shim which will wrap the provided pointer in
|
||||
/// a JS object corresponding to the Class name given here. The class name
|
||||
/// is one that is exported from the Rust/wasm.
|
||||
///
|
||||
/// TODO: sort of like the export map below we should ideally create the
|
||||
/// `anyref` from within Rust itself and then return it directly rather than
|
||||
/// requiring an intrinsic here to do so.
|
||||
WrapInExportedClass(String),
|
||||
|
||||
/// This is an intrinsic function expected to be implemented with a JS glue
|
||||
/// shim. Each intrinsic has its own expected signature and implementation.
|
||||
Intrinsic(Intrinsic),
|
||||
}
|
||||
|
||||
/// Values that can be imported verbatim to hook up to an import.
|
||||
#[derive(Debug)]
|
||||
pub enum AuxValue {
|
||||
/// A bare JS value, no transformations, just put it in the slot.
|
||||
Bare(JsImport),
|
||||
|
||||
/// A getter function for the class listed for the field, acquired using
|
||||
/// `getOwnPropertyDescriptor`.
|
||||
Getter(JsImport, String),
|
||||
|
||||
/// Like `Getter`, but accesses a field of a class instead of an instance
|
||||
/// of the class.
|
||||
ClassGetter(JsImport, String),
|
||||
|
||||
/// Like `Getter`, except the `set` property.
|
||||
Setter(JsImport, String),
|
||||
|
||||
/// Like `Setter`, but for class fields instead of instance fields.
|
||||
ClassSetter(JsImport, String),
|
||||
}
|
||||
|
||||
/// What can actually be imported and typically a value in each of the variants
|
||||
/// above of `AuxImport`
|
||||
///
|
||||
/// A `JsImport` is intended to indicate what exactly is being imported for a
|
||||
/// particular operation.
|
||||
#[derive(Debug, Hash, Eq, PartialEq, Clone)]
|
||||
pub struct JsImport {
|
||||
/// The base of whatever is being imported, either from a module, the global
|
||||
/// namespace, or similar.
|
||||
pub name: JsImportName,
|
||||
/// Various field accesses (like `.foo.bar.baz`) to hang off the `name`
|
||||
/// above.
|
||||
pub fields: Vec<String>,
|
||||
}
|
||||
|
||||
/// Return value of `determine_import` which is where we look at an imported
|
||||
/// function AST and figure out where it's actually being imported from
|
||||
/// (performing some validation checks and whatnot).
|
||||
#[derive(Debug, Hash, Eq, PartialEq, Clone)]
|
||||
pub enum JsImportName {
|
||||
/// An item is imported from the global scope. The `name` is what's
|
||||
/// imported.
|
||||
Global { name: String },
|
||||
/// Same as `Global`, except the `name` is imported via an ESM import from
|
||||
/// the specified `module` path.
|
||||
Module { module: String, name: String },
|
||||
/// Same as `Module`, except we're importing from a local module defined in
|
||||
/// a local JS snippet.
|
||||
LocalModule { module: String, name: String },
|
||||
/// Same as `Module`, except we're importing from an `inline_js` attribute
|
||||
InlineJs {
|
||||
unique_crate_identifier: String,
|
||||
snippet_idx_in_crate: usize,
|
||||
name: String,
|
||||
},
|
||||
/// A global import which may have a number of vendor prefixes associated
|
||||
/// with it, like `webkitAudioPrefix`. The `name` is the name to test
|
||||
/// whether it's prefixed.
|
||||
VendorPrefixed { name: String, prefixes: Vec<String> },
|
||||
}
|
||||
|
||||
impl walrus::CustomSection for WasmBindgenAux {
|
||||
fn name(&self) -> &str {
|
||||
"wasm-bindgen custom section"
|
||||
}
|
||||
|
||||
fn data(&self, _: &walrus::IdsToIndices) -> Cow<[u8]> {
|
||||
panic!("shouldn't emit custom sections just yet");
|
||||
}
|
||||
}
|
Reference in New Issue
Block a user