Update the wasi-nn witx files

alexcrichton · abrown · commit 8adc5b9b3bb8 · 2021-02-18T09:56:51.000-08:00
diff --git a/phases/ephemeral/docs.md b/phases/ephemeral/docs.md
@@ -1209,15 +1209,15 @@ Size: 4
 
 Alignment: 4
 
-## <a href="#nn_errno" name="nn_errno"></a> `nn_errno`: Enum(`u16`)
+## <a href="#nn_errno" name="nn_errno"></a> `nn_errno`: `Variant`
 Error codes returned by functions in this API. This is prefixed to avoid conflicts with the `$errno` in
 `typenames.witx`.
 
 Size: 2
 
 Alignment: 2
 
-### Variants
+### Variant cases
 - <a href="#nn_errno.success" name="nn_errno.success"></a> `success`
 No error occurred.
 
@@ -1230,7 +1230,7 @@ Caller module is missing a memory export.
 - <a href="#nn_errno.busy" name="nn_errno.busy"></a> `busy`
 Device or resource busy.
 
-## <a href="#tensor_dimensions" name="tensor_dimensions"></a> `tensor_dimensions`: `Array<u32>`
+## <a href="#tensor_dimensions" name="tensor_dimensions"></a> `tensor_dimensions`: `List<u32>`
 The dimensions of a tensor.
 
 The array length matches the tensor rank and each element in the array
@@ -1240,14 +1240,14 @@ Size: 8
 
 Alignment: 4
 
-## <a href="#tensor_type" name="tensor_type"></a> `tensor_type`: Enum(`u8`)
+## <a href="#tensor_type" name="tensor_type"></a> `tensor_type`: `Variant`
 The type of the elements in a tensor.
 
 Size: 1
 
 Alignment: 1
 
-### Variants
+### Variant cases
 - <a href="#tensor_type.f16" name="tensor_type.f16"></a> `f16`
 
 - <a href="#tensor_type.f32" name="tensor_type.f32"></a> `f32`
@@ -1256,7 +1256,7 @@ Alignment: 1
 
 - <a href="#tensor_type.i32" name="tensor_type.i32"></a> `i32`
 
-## <a href="#tensor_data" name="tensor_data"></a> `tensor_data`: `Array<u8>`
+## <a href="#tensor_data" name="tensor_data"></a> `tensor_data`: `List<u8>`
 The tensor data
 
 Initially conceived as a sparse representation, each empty cell would be filled with zeroes and
@@ -1269,14 +1269,14 @@ Size: 8
 
 Alignment: 4
 
-## <a href="#tensor" name="tensor"></a> `tensor`: Struct
+## <a href="#tensor" name="tensor"></a> `tensor`: `Record`
 A tensor.
 
 Size: 20
 
 Alignment: 4
 
-### Struct members
+### Record members
 - <a href="#tensor.dimensions" name="tensor.dimensions"></a> `dimensions`: [`tensor_dimensions`](#tensor_dimensions)
 Describe the size of the tensor (e.g. 2x2x2x2 -> [2, 2, 2, 2]). To represent a tensor containing a single value,
 use `[1]` for the tensor dimensions.
@@ -1292,55 +1292,55 @@ Contains the tensor data.
 
 Offset: 12
 
-## <a href="#graph_builder" name="graph_builder"></a> `graph_builder`: `Array<u8>`
+## <a href="#graph_builder" name="graph_builder"></a> `graph_builder`: `List<u8>`
 The graph initialization data. This consists of an array of buffers because implementing backends may encode their
 graph IR in parts (e.g. OpenVINO stores its IR and weights separately).
 
 Size: 8
 
 Alignment: 4
 
-## <a href="#graph_builder_array" name="graph_builder_array"></a> `graph_builder_array`: `Array<graph_builder>`
+## <a href="#graph_builder_array" name="graph_builder_array"></a> `graph_builder_array`: `List<graph_builder>`
 
 Size: 8
 
 Alignment: 4
 
-## <a href="#graph" name="graph"></a> `graph`
+## <a href="#graph" name="graph"></a> `graph`: `Handle`
 An execution graph for performing inference (i.e. a model).
 
 Size: 4
 
 Alignment: 4
 
 ### Supertypes
-## <a href="#graph_encoding" name="graph_encoding"></a> `graph_encoding`: Enum(`u8`)
+## <a href="#graph_encoding" name="graph_encoding"></a> `graph_encoding`: `Variant`
 Describes the encoding of the graph. This allows the API to be implemented by various backends that encode (i.e.
 serialize) their graph IR differently.
 
 Size: 1
 
 Alignment: 1
 
-### Variants
+### Variant cases
 - <a href="#graph_encoding.openvino" name="graph_encoding.openvino"></a> `openvino`
 TODO document buffer order
 
-## <a href="#execution_target" name="execution_target"></a> `execution_target`: Enum(`u8`)
+## <a href="#execution_target" name="execution_target"></a> `execution_target`: `Variant`
 Define where the graph should be executed.
 
 Size: 1
 
 Alignment: 1
 
-### Variants
+### Variant cases
 - <a href="#execution_target.cpu" name="execution_target.cpu"></a> `cpu`
 
 - <a href="#execution_target.gpu" name="execution_target.gpu"></a> `gpu`
 
 - <a href="#execution_target.tpu" name="execution_target.tpu"></a> `tpu`
 
-## <a href="#graph_execution_context" name="graph_execution_context"></a> `graph_execution_context`
+## <a href="#graph_execution_context" name="graph_execution_context"></a> `graph_execution_context`: `Handle`
 A $graph_execution_context allows for attaching inputs prior to calling [`compute`](#compute) on a graph and retrieving outputs after
 the computation has completed. TODO a handle may not be the right type but we want it to be opaque to users.
 
@@ -2705,7 +2705,7 @@ Which channels on the socket to shut down.
 
 ---
 
-#### <a href="#load" name="load"></a> `load(builder: graph_builder_array, encoding: graph_encoding, target: execution_target) -> (nn_errno, graph)`
+#### <a href="#load" name="load"></a> `load(builder: graph_builder_array, encoding: graph_encoding, target: execution_target) -> Result<graph, nn_errno>`
 Load an opaque sequence of bytes to use for inference.
 
 This allows runtime implementations to support multiple graph encoding formats. For unsupported graph encodings,
@@ -2722,14 +2722,21 @@ The encoding of the graph.
 Where to execute the graph.
 
 ##### Results
-- <a href="#load.error" name="load.error"></a> `error`: [`nn_errno`](#nn_errno)
+- <a href="#load.error" name="load.error"></a> `error`: `Result<graph, nn_errno>`
+
+###### Variant Layout
+- size: 8
+- align: 4
+- tag_size: 4
+###### Variant cases
+- <a href="#load.error.ok" name="load.error.ok"></a> `ok`: [`graph`](#graph)
 
-- <a href="#load.graph" name="load.graph"></a> `graph`: [`graph`](#graph)
+- <a href="#load.error.err" name="load.error.err"></a> `err`: [`nn_errno`](#nn_errno)
 
 
 ---
 
-#### <a href="#init_execution_context" name="init_execution_context"></a> `init_execution_context(graph: graph) -> (nn_errno, graph_execution_context)`
+#### <a href="#init_execution_context" name="init_execution_context"></a> `init_execution_context(graph: graph) -> Result<graph_execution_context, nn_errno>`
 TODO Functions like `describe_graph_inputs` and `describe_graph_outputs` (returning
 an array of `$tensor_description`s) might be useful for introspecting the graph but are not yet included here.
 Create an execution instance of a loaded graph.
@@ -2739,14 +2746,21 @@ TODO this may need to accept flags that might affect the compilation or executio
 - <a href="#init_execution_context.graph" name="init_execution_context.graph"></a> `graph`: [`graph`](#graph)
 
 ##### Results
-- <a href="#init_execution_context.error" name="init_execution_context.error"></a> `error`: [`nn_errno`](#nn_errno)
+- <a href="#init_execution_context.error" name="init_execution_context.error"></a> `error`: `Result<graph_execution_context, nn_errno>`
+
+###### Variant Layout
+- size: 8
+- align: 4
+- tag_size: 4
+###### Variant cases
+- <a href="#init_execution_context.error.ok" name="init_execution_context.error.ok"></a> `ok`: [`graph_execution_context`](#graph_execution_context)
 
-- <a href="#init_execution_context.context" name="init_execution_context.context"></a> `context`: [`graph_execution_context`](#graph_execution_context)
+- <a href="#init_execution_context.error.err" name="init_execution_context.error.err"></a> `err`: [`nn_errno`](#nn_errno)
 
 
 ---
 
-#### <a href="#set_input" name="set_input"></a> `set_input(context: graph_execution_context, index: u32, tensor: tensor) -> nn_errno`
+#### <a href="#set_input" name="set_input"></a> `set_input(context: graph_execution_context, index: u32, tensor: tensor) -> Result<(), nn_errno>`
 Define the inputs to use for inference.
 
 This should return an $nn_errno (TODO define) if the input tensor does not match the expected dimensions and type.
@@ -2761,12 +2775,21 @@ The index of the input to change.
 The tensor to set as the input.
 
 ##### Results
-- <a href="#set_input.error" name="set_input.error"></a> `error`: [`nn_errno`](#nn_errno)
+- <a href="#set_input.error" name="set_input.error"></a> `error`: `Result<(), nn_errno>`
+
+###### Variant Layout
+- size: 8
+- align: 4
+- tag_size: 4
+###### Variant cases
+- <a href="#set_input.error.ok" name="set_input.error.ok"></a> `ok`
+
+- <a href="#set_input.error.err" name="set_input.error.err"></a> `err`: [`nn_errno`](#nn_errno)
 
 
 ---
 
-#### <a href="#get_output" name="get_output"></a> `get_output(context: graph_execution_context, index: u32, out_buffer: Pointer<u8>, out_buffer_max_size: buffer_size) -> (nn_errno, buffer_size)`
+#### <a href="#get_output" name="get_output"></a> `get_output(context: graph_execution_context, index: u32, out_buffer: Pointer<u8>, out_buffer_max_size: buffer_size) -> Result<buffer_size, nn_errno>`
 Extract the outputs after inference.
 
 This should return an $nn_errno (TODO define) if the inference has not yet run.
@@ -2785,15 +2808,22 @@ tensor metadata (i.e. dimension, element type) but this should be added at some
 - <a href="#get_output.out_buffer_max_size" name="get_output.out_buffer_max_size"></a> `out_buffer_max_size`: [`buffer_size`](#buffer_size)
 
 ##### Results
-- <a href="#get_output.error" name="get_output.error"></a> `error`: [`nn_errno`](#nn_errno)
-
-- <a href="#get_output.bytes_written" name="get_output.bytes_written"></a> `bytes_written`: [`buffer_size`](#buffer_size)
+- <a href="#get_output.error" name="get_output.error"></a> `error`: `Result<buffer_size, nn_errno>`
 The number of bytes of tensor data written to the `$out_buffer`.
 
+###### Variant Layout
+- size: 8
+- align: 4
+- tag_size: 4
+###### Variant cases
+- <a href="#get_output.error.ok" name="get_output.error.ok"></a> `ok`: [`buffer_size`](#buffer_size)
+
+- <a href="#get_output.error.err" name="get_output.error.err"></a> `err`: [`nn_errno`](#nn_errno)
+
 
 ---
 
-#### <a href="#compute" name="compute"></a> `compute(context: graph_execution_context) -> nn_errno`
+#### <a href="#compute" name="compute"></a> `compute(context: graph_execution_context) -> Result<(), nn_errno>`
 Compute the inference on the given inputs (see [`set_input`](#set_input)).
 
 This should return an $nn_errno (TODO define) if the inputs are not all defined.
@@ -2802,5 +2832,14 @@ This should return an $nn_errno (TODO define) if the inputs are not all defined.
 - <a href="#compute.context" name="compute.context"></a> `context`: [`graph_execution_context`](#graph_execution_context)
 
 ##### Results
-- <a href="#compute.error" name="compute.error"></a> `error`: [`nn_errno`](#nn_errno)
+- <a href="#compute.error" name="compute.error"></a> `error`: `Result<(), nn_errno>`
+
+###### Variant Layout
+- size: 8
+- align: 4
+- tag_size: 4
+###### Variant cases
+- <a href="#compute.error.ok" name="compute.error.ok"></a> `ok`
+
+- <a href="#compute.error.err" name="compute.error.err"></a> `err`: [`nn_errno`](#nn_errno)
 
diff --git a/phases/ephemeral/witx/wasi_ephemeral_nn.witx b/phases/ephemeral/witx/wasi_ephemeral_nn.witx
@@ -15,7 +15,7 @@
 ;;; Error codes returned by functions in this API. This is prefixed to avoid conflicts with the `$errno` in
 ;;; `typenames.witx`.
 (typename $nn_errno
-  (enum u16
+  (enum (@witx tag u16)
     ;;; No error occurred.
     $success
     ;;; Caller module passed an invalid argument.
@@ -31,11 +31,11 @@
 ;;;
 ;;; The array length matches the tensor rank and each element in the array
 ;;; describes the size of each dimension.
-(typename $tensor_dimensions (array u32))
+(typename $tensor_dimensions (list u32))
 
 ;;; The type of the elements in a tensor.
 (typename $tensor_type
-  (enum u8
+  (enum (@witx tag u8)
     $f16
     $f32
     $u8
@@ -50,11 +50,11 @@
 ;;; tensor with 4-byte f32 elements would have a data array of length 16). Naturally, this representation requires
 ;;; some knowledge of how to lay out data in memory--e.g. using row-major ordering--and could perhaps be improved
 ;;; by future witx features (TODO).
-(typename $tensor_data (array u8))
+(typename $tensor_data (list u8))
 
 ;;; A tensor.
 (typename $tensor
-  (struct
+  (record
     ;;; Describe the size of the tensor (e.g. 2x2x2x2 -> [2, 2, 2, 2]). To represent a tensor containing a single value,
     ;;; use `[1]` for the tensor dimensions.
     (field $dimensions $tensor_dimensions)
@@ -69,24 +69,24 @@
 
 ;;; The graph initialization data. This consists of an array of buffers because implementing backends may encode their
 ;;; graph IR in parts (e.g. OpenVINO stores its IR and weights separately).
-(typename $graph_builder (array u8))
-(typename $graph_builder_array (array $graph_builder))
+(typename $graph_builder (list u8))
+(typename $graph_builder_array (list $graph_builder))
 
 ;;; An execution graph for performing inference (i.e. a model).
 (typename $graph (handle))
 
 ;;; Describes the encoding of the graph. This allows the API to be implemented by various backends that encode (i.e.
 ;;; serialize) their graph IR differently.
 (typename $graph_encoding
-  (enum u8
+  (enum (@witx tag u8)
     ;;; TODO document buffer order
     $openvino
   )
 )
 
 ;;; Define where the graph should be executed.
 (typename $execution_target
-  (enum u8
+  (enum (@witx tag u8)
     $cpu
     $gpu
     $tpu
@@ -113,8 +113,7 @@
     ;;; Where to execute the graph.
     (param $target $execution_target)
 
-    (result $error $nn_errno)
-    (result $graph $graph)
+    (result $error (expected $graph (error $nn_errno)))
   )
 
   ;;; TODO Functions like `describe_graph_inputs` and `describe_graph_outputs` (returning
@@ -124,8 +123,7 @@
   ;;; TODO this may need to accept flags that might affect the compilation or execution of the graph.
   (@interface func (export "init_execution_context")
     (param $graph $graph)
-    (result $error $nn_errno)
-    (result $context $graph_execution_context)
+    (result $error (expected $graph_execution_context (error $nn_errno)))
   )
 
   ;;; Define the inputs to use for inference.
@@ -138,7 +136,7 @@
     ;;; The tensor to set as the input.
     (param $tensor $tensor)
 
-    (result $error $nn_errno)
+    (result $error (expected (error $nn_errno)))
   )
 
   ;;; Extract the outputs after inference.
@@ -154,16 +152,15 @@
     (param $out_buffer (@witx pointer u8))
     (param $out_buffer_max_size $buffer_size)
 
-    (result $error $nn_errno)
     ;;; The number of bytes of tensor data written to the `$out_buffer`.
-    (result $bytes_written $buffer_size)
+    (result $error (expected $buffer_size (error $nn_errno)))
   )
 
   ;;; Compute the inference on the given inputs (see `set_input`).
   ;;;
   ;;; This should return an $nn_errno (TODO define) if the inputs are not all defined.
   (@interface func (export "compute")
     (param $context $graph_execution_context)
-    (result $error $nn_errno)
+    (result $error (expected (error $nn_errno)))
   )
 )
diff --git a/tools/witx/tests/wasi-docs.rs b/tools/witx/tests/wasi-docs.rs
@@ -9,7 +9,7 @@ fn validate_docs() {
         witx::phases::ephemeral().unwrap(),
         witx::phases::old::snapshot_0().unwrap(),
     ] {
-        let doc = witx::load(&phase).unwrap_or_else(|e| panic!("failed to parse: {}", e));
+        let doc = witx::load(&phase).unwrap_or_else(|e| panic!("failed to parse: {:?}", e));
         diff_against_filesystem(&doc.to_md(), &witx::phases::docs_path(&phase));
     }
 }
diff --git a/tools/witx/tests/witxt/wasi.witxt b/tools/witx/tests/witxt/wasi.witxt
@@ -24,3 +24,10 @@
 (witx
   (load
     "../../../../phases/ephemeral/witx/wasi_ephemeral_fd.witx"))
+
+;; wasi-nn should work
+(witx
+  (load
+    "../../../../phases/ephemeral/witx/wasi_ephemeral_nn.witx"
+  )
+)

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -9,7 +9,7 @@ fn validate_docs() {` |
| `9` | `9` | `witx::phases::ephemeral().unwrap(),` |
| `10` | `10` | `witx::phases::old::snapshot_0().unwrap(),` |
| `11` | `11` | `] {` |
| `12` | | `- let doc = witx::load(&phase).unwrap_or_else(\|e\| panic!("failed to parse: {}", e));` |
| | `12` | `+ let doc = witx::load(&phase).unwrap_or_else(\|e\| panic!("failed to parse: {:?}", e));` |
| `13` | `13` | `diff_against_filesystem(&doc.to_md(), &witx::phases::docs_path(&phase));` |
| `14` | `14` | `}` |
| `15` | `15` | `}` |