summaryrefslogtreecommitdiff
path: root/crates/typst-library/src/foundations/plugin.rs
diff options
context:
space:
mode:
authorLaurenz <laurmaedje@gmail.com>2024-10-27 19:04:55 +0100
committerGitHub <noreply@github.com>2024-10-27 18:04:55 +0000
commitbe7cfc85d08c545abfac08098b7b33b4bd71f37e (patch)
treef4137fa2aaa57babae1f7603a9b2ed7e688f43d8 /crates/typst-library/src/foundations/plugin.rs
parentb8034a343831e8609aec2ec81eb7eeda57aa5d81 (diff)
Split out four new crates (#5302)
Diffstat (limited to 'crates/typst-library/src/foundations/plugin.rs')
-rw-r--r--crates/typst-library/src/foundations/plugin.rs365
1 files changed, 365 insertions, 0 deletions
diff --git a/crates/typst-library/src/foundations/plugin.rs b/crates/typst-library/src/foundations/plugin.rs
new file mode 100644
index 00000000..31107dc3
--- /dev/null
+++ b/crates/typst-library/src/foundations/plugin.rs
@@ -0,0 +1,365 @@
+use std::fmt::{self, Debug, Formatter};
+use std::hash::{Hash, Hasher};
+use std::sync::{Arc, Mutex};
+
+use ecow::{eco_format, EcoString};
+use typst_syntax::Spanned;
+use wasmi::{AsContext, AsContextMut};
+
+use crate::diag::{bail, At, SourceResult, StrResult};
+use crate::engine::Engine;
+use crate::foundations::{func, repr, scope, ty, Bytes};
+use crate::World;
+
+/// A WebAssembly plugin.
+///
+/// Typst is capable of interfacing with plugins compiled to WebAssembly. Plugin
+/// functions may accept multiple [byte buffers]($bytes) as arguments and return
+/// a single byte buffer. They should typically be wrapped in idiomatic Typst
+/// functions that perform the necessary conversions between native Typst types
+/// and bytes.
+///
+/// Plugins run in isolation from your system, which means that printing,
+/// reading files, or anything like that will not be supported for security
+/// reasons. To run as a plugin, a program needs to be compiled to a 32-bit
+/// shared WebAssembly library. Many compilers will use the
+/// [WASI ABI](https://wasi.dev/) by default or as their only option (e.g.
+/// emscripten), which allows printing, reading files, etc. This ABI will not
+/// directly work with Typst. You will either need to compile to a different
+/// target or [stub all functions](https://github.com/astrale-sharp/wasm-minimal-protocol/blob/master/wasi-stub).
+///
+/// # Plugins and Packages
+/// Plugins are distributed as packages. A package can make use of a plugin
+/// simply by including a WebAssembly file and loading it. Because the
+/// byte-based plugin interface is quite low-level, plugins are typically
+/// exposed through wrapper functions, that also live in the same package.
+///
+/// # Purity
+/// Plugin functions must be pure: Given the same arguments, they must always
+/// return the same value. The reason for this is that Typst functions must be
+/// pure (which is quite fundamental to the language design) and, since Typst
+/// function can call plugin functions, this requirement is inherited. In
+/// particular, if a plugin function is called twice with the same arguments,
+/// Typst might cache the results and call your function only once.
+///
+/// # Example
+/// ```example
+/// #let myplugin = plugin("hello.wasm")
+/// #let concat(a, b) = str(
+/// myplugin.concatenate(
+/// bytes(a),
+/// bytes(b),
+/// )
+/// )
+///
+/// #concat("hello", "world")
+/// ```
+///
+/// # Protocol
+/// To be used as a plugin, a WebAssembly module must conform to the following
+/// protocol:
+///
+/// ## Exports
+/// A plugin module can export functions to make them callable from Typst. To
+/// conform to the protocol, an exported function should:
+///
+/// - Take `n` 32-bit integer arguments `a_1`, `a_2`, ..., `a_n` (interpreted as
+/// lengths, so `usize/size_t` may be preferable), and return one 32-bit
+/// integer.
+///
+/// - The function should first allocate a buffer `buf` of length
+/// `a_1 + a_2 + ... + a_n`, and then call
+/// `wasm_minimal_protocol_write_args_to_buffer(buf.ptr)`.
+///
+/// - The `a_1` first bytes of the buffer now constitute the first argument, the
+/// `a_2` next bytes the second argument, and so on.
+///
+/// - The function can now do its job with the arguments and produce an output
+/// buffer. Before returning, it should call
+/// `wasm_minimal_protocol_send_result_to_host` to send its result back to the
+/// host.
+///
+/// - To signal success, the function should return `0`.
+///
+/// - To signal an error, the function should return `1`. The written buffer is
+/// then interpreted as an UTF-8 encoded error message.
+///
+/// ## Imports
+/// Plugin modules need to import two functions that are provided by the runtime.
+/// (Types and functions are described using WAT syntax.)
+///
+/// - `(import "typst_env" "wasm_minimal_protocol_write_args_to_buffer" (func (param i32)))`
+///
+/// Writes the arguments for the current function into a plugin-allocated
+/// buffer. When a plugin function is called, it
+/// [receives the lengths](#exports) of its input buffers as arguments. It
+/// should then allocate a buffer whose capacity is at least the sum of these
+/// lengths. It should then call this function with a `ptr` to the buffer to
+/// fill it with the arguments, one after another.
+///
+/// - `(import "typst_env" "wasm_minimal_protocol_send_result_to_host" (func (param i32 i32)))`
+///
+/// Sends the output of the current function to the host (Typst). The first
+/// parameter shall be a pointer to a buffer (`ptr`), while the second is the
+/// length of that buffer (`len`). The memory pointed at by `ptr` can be freed
+/// immediately after this function returns. If the message should be
+/// interpreted as an error message, it should be encoded as UTF-8.
+///
+/// # Resources
+/// For more resources, check out the
+/// [wasm-minimal-protocol repository](https://github.com/astrale-sharp/wasm-minimal-protocol).
+/// It contains:
+///
+/// - A list of example plugin implementations and a test runner for these
+/// examples
+/// - Wrappers to help you write your plugin in Rust (Zig wrapper in
+/// development)
+/// - A stubber for WASI
+#[ty(scope, cast)]
+#[derive(Clone)]
+pub struct Plugin(Arc<Repr>);
+
+/// The internal representation of a plugin.
+struct Repr {
+ /// The raw WebAssembly bytes.
+ bytes: Bytes,
+ /// The function defined by the WebAssembly module.
+ functions: Vec<(EcoString, wasmi::Func)>,
+ /// Owns all data associated with the WebAssembly module.
+ store: Mutex<Store>,
+}
+
+/// Owns all data associated with the WebAssembly module.
+type Store = wasmi::Store<StoreData>;
+
+/// If there was an error reading/writing memory, keep the offset + length to
+/// display an error message.
+struct MemoryError {
+ offset: u32,
+ length: u32,
+ write: bool,
+}
+/// The persistent store data used for communication between store and host.
+#[derive(Default)]
+struct StoreData {
+ args: Vec<Bytes>,
+ output: Vec<u8>,
+ memory_error: Option<MemoryError>,
+}
+
+#[scope]
+impl Plugin {
+ /// Creates a new plugin from a WebAssembly file.
+ #[func(constructor)]
+ pub fn construct(
+ /// The engine.
+ engine: &mut Engine,
+ /// Path to a WebAssembly file.
+ ///
+ /// For more details, see the [Paths section]($syntax/#paths).
+ path: Spanned<EcoString>,
+ ) -> SourceResult<Plugin> {
+ let Spanned { v: path, span } = path;
+ let id = span.resolve_path(&path).at(span)?;
+ let data = engine.world.file(id).at(span)?;
+ Plugin::new(data).at(span)
+ }
+}
+
+impl Plugin {
+ /// Create a new plugin from raw WebAssembly bytes.
+ #[comemo::memoize]
+ #[typst_macros::time(name = "load plugin")]
+ pub fn new(bytes: Bytes) -> StrResult<Plugin> {
+ let engine = wasmi::Engine::default();
+ let module = wasmi::Module::new(&engine, bytes.as_slice())
+ .map_err(|err| format!("failed to load WebAssembly module ({err})"))?;
+
+ let mut linker = wasmi::Linker::new(&engine);
+ linker
+ .func_wrap(
+ "typst_env",
+ "wasm_minimal_protocol_send_result_to_host",
+ wasm_minimal_protocol_send_result_to_host,
+ )
+ .unwrap();
+ linker
+ .func_wrap(
+ "typst_env",
+ "wasm_minimal_protocol_write_args_to_buffer",
+ wasm_minimal_protocol_write_args_to_buffer,
+ )
+ .unwrap();
+
+ let mut store = Store::new(&engine, StoreData::default());
+ let instance = linker
+ .instantiate(&mut store, &module)
+ .and_then(|pre_instance| pre_instance.start(&mut store))
+ .map_err(|e| eco_format!("{e}"))?;
+
+ // Ensure that the plugin exports its memory.
+ if !matches!(
+ instance.get_export(&store, "memory"),
+ Some(wasmi::Extern::Memory(_))
+ ) {
+ bail!("plugin does not export its memory");
+ }
+
+ // Collect exported functions.
+ let functions = instance
+ .exports(&store)
+ .filter_map(|export| {
+ let name = export.name().into();
+ export.into_func().map(|func| (name, func))
+ })
+ .collect();
+
+ Ok(Plugin(Arc::new(Repr { bytes, functions, store: Mutex::new(store) })))
+ }
+
+ /// Call the plugin function with the given `name`.
+ #[comemo::memoize]
+ #[typst_macros::time(name = "call plugin")]
+ pub fn call(&self, name: &str, args: Vec<Bytes>) -> StrResult<Bytes> {
+ // Find the function with the given name.
+ let func = self
+ .0
+ .functions
+ .iter()
+ .find(|(v, _)| v == name)
+ .map(|&(_, func)| func)
+ .ok_or_else(|| {
+ eco_format!("plugin does not contain a function called {name}")
+ })?;
+
+ let mut store = self.0.store.lock().unwrap();
+ let ty = func.ty(store.as_context());
+
+ // Check function signature.
+ if ty.params().iter().any(|&v| v != wasmi::core::ValType::I32) {
+ bail!(
+ "plugin function `{name}` has a parameter that is not a 32-bit integer"
+ );
+ }
+ if ty.results() != [wasmi::core::ValType::I32] {
+ bail!("plugin function `{name}` does not return exactly one 32-bit integer");
+ }
+
+ // Check inputs.
+ let expected = ty.params().len();
+ let given = args.len();
+ if expected != given {
+ bail!(
+ "plugin function takes {expected} argument{}, but {given} {} given",
+ if expected == 1 { "" } else { "s" },
+ if given == 1 { "was" } else { "were" },
+ );
+ }
+
+ // Collect the lengths of the argument buffers.
+ let lengths = args
+ .iter()
+ .map(|a| wasmi::Val::I32(a.len() as i32))
+ .collect::<Vec<_>>();
+
+ // Store the input data.
+ store.data_mut().args = args;
+
+ // Call the function.
+ let mut code = wasmi::Val::I32(-1);
+ func.call(store.as_context_mut(), &lengths, std::slice::from_mut(&mut code))
+ .map_err(|err| eco_format!("plugin panicked: {err}"))?;
+ if let Some(MemoryError { offset, length, write }) =
+ store.data_mut().memory_error.take()
+ {
+ return Err(eco_format!(
+ "plugin tried to {kind} out of bounds: pointer {offset:#x} is out of bounds for {kind} of length {length}",
+ kind = if write { "write" } else { "read" }
+ ));
+ }
+
+ // Extract the returned data.
+ let output = std::mem::take(&mut store.data_mut().output);
+
+ // Parse the functions return value.
+ match code {
+ wasmi::Val::I32(0) => {}
+ wasmi::Val::I32(1) => match std::str::from_utf8(&output) {
+ Ok(message) => bail!("plugin errored with: {message}"),
+ Err(_) => {
+ bail!("plugin errored, but did not return a valid error message")
+ }
+ },
+ _ => bail!("plugin did not respect the protocol"),
+ };
+
+ Ok(output.into())
+ }
+
+ /// An iterator over all the function names defined by the plugin.
+ pub fn iter(&self) -> impl Iterator<Item = &EcoString> {
+ self.0.functions.as_slice().iter().map(|(func_name, _)| func_name)
+ }
+}
+
+impl Debug for Plugin {
+ fn fmt(&self, f: &mut Formatter) -> fmt::Result {
+ f.pad("Plugin(..)")
+ }
+}
+
+impl repr::Repr for Plugin {
+ fn repr(&self) -> EcoString {
+ "plugin(..)".into()
+ }
+}
+
+impl PartialEq for Plugin {
+ fn eq(&self, other: &Self) -> bool {
+ self.0.bytes == other.0.bytes
+ }
+}
+
+impl Hash for Plugin {
+ fn hash<H: Hasher>(&self, state: &mut H) {
+ self.0.bytes.hash(state);
+ }
+}
+
+/// Write the arguments to the plugin function into the plugin's memory.
+fn wasm_minimal_protocol_write_args_to_buffer(
+ mut caller: wasmi::Caller<StoreData>,
+ ptr: u32,
+) {
+ let memory = caller.get_export("memory").unwrap().into_memory().unwrap();
+ let arguments = std::mem::take(&mut caller.data_mut().args);
+ let mut offset = ptr as usize;
+ for arg in arguments {
+ if memory.write(&mut caller, offset, arg.as_slice()).is_err() {
+ caller.data_mut().memory_error = Some(MemoryError {
+ offset: offset as u32,
+ length: arg.len() as u32,
+ write: true,
+ });
+ return;
+ }
+ offset += arg.len();
+ }
+}
+
+/// Extracts the output of the plugin function from the plugin's memory.
+fn wasm_minimal_protocol_send_result_to_host(
+ mut caller: wasmi::Caller<StoreData>,
+ ptr: u32,
+ len: u32,
+) {
+ let memory = caller.get_export("memory").unwrap().into_memory().unwrap();
+ let mut buffer = std::mem::take(&mut caller.data_mut().output);
+ buffer.resize(len as usize, 0);
+ if memory.read(&caller, ptr as _, &mut buffer).is_err() {
+ caller.data_mut().memory_error =
+ Some(MemoryError { offset: ptr, length: len, write: false });
+ return;
+ }
+ caller.data_mut().output = buffer;
+}