PyPI - xmos-ai-tools - Versions diffs - 1.2.1.dev20__py3-none-win_amd64.whl → 1.3.2.dev180__py3-none-win_amd64.whl - Mend

xmos-ai-tools 1.2.1.dev20__py3-none-win_amd64.whl → 1.3.2.dev180__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (229) hide show

xmos_ai_tools/__init__.py CHANGED Viewed

@@ -1,7 +1,7 @@
-from importlib.metadata import version, PackageNotFoundError
-try:
-    __version__ = version(__name__)
-except PackageNotFoundError:
-    # package is not installed
-    pass
+from importlib.metadata import version, PackageNotFoundError
+try:
+    __version__ = version(__name__)
+except PackageNotFoundError:
+    # package is not installed
+    pass

xmos_ai_tools/io_server/__init__.py CHANGED Viewed

@@ -1,151 +1,151 @@
-# Copyright (c) 2020, XMOS Ltd, All rights reserved
-import usb
-from typing import Tuple
-import numpy as np
-IOSERVER_INVOKE = int(0x01)
-IOSERVER_TENSOR_SEND_OUTPUT = int(0x02)
-IOSERVER_TENSOR_RECV_INPUT = int(0x03)
-IOSERVER_RESET = int(0x07)
-IOSERVER_EXIT = int(0x08)
-class IOServerError(Exception):
-    """Error from device"""
-    pass
-class IOError(IOServerError):
-    """IO Error from device"""
-    pass
-def handle_usb_error(func):
-    def wrapper(*args, **kwargs):
-        try:
-            return func(*args, **kwargs)
-        except usb.core.USBError as e:
-            print(f"USB error {e}")
-            if e.backend_error_code == usb.backend.libusb1.LIBUSB_ERROR_PIPE:
-                raise IOError()
-            else:
-                raise IOServerError(f"Wow...") from e
-    return wrapper
-class IOServer:
-    def __init__(self, output_details: Tuple[dict, ...] = None, timeout=5000):
-        self.__out_ep = None
-        self.__in_ep = None
-        self._dev = None
-        self._output_details = output_details
-        self._timeout = timeout
-        self._max_block_size = 512  # TODO read from (usb) device?
-        super().__init__()
-    def bytes_to_arr(self, data_bytes, tensor_num):
-        if self._output_details:
-            d = self._output_details[tensor_num]
-            s = d["shape"]
-            return np.frombuffer(data_bytes, dtype=d["dtype"])[: np.prod(s)].reshape(s)
-        return np.frombuffer(data_bytes, dtype=np.uint8)
-    def write_input_tensor(self, raw_img, tensor_num=0, model_num=0):
-        self._download_data(
-            IOSERVER_TENSOR_RECV_INPUT,
-            raw_img,
-            tensor_num=tensor_num,
-            model_num=model_num,
-        )
-    def read_output_tensor(self, tensor_num=0, model_num=0):
-        # Retrieve result from device
-        data_read = self._upload_data(
-            IOSERVER_TENSOR_SEND_OUTPUT,
-            model_num=model_num,
-            tensor_num=tensor_num,
-        )
-        assert type(data_read) is bytearray
-        return self.bytes_to_arr(data_read, tensor_num)
-    def close(self):
-        if self._dev is not None:
-            self._dev.write(self._out_ep, bytes([IOSERVER_EXIT, 0, 0]), 1000)
-            usb.util.dispose_resources(self._dev)
-            self._dev = None
-    @handle_usb_error
-    def _download_data(self, cmd, data_bytes, tensor_num=0, model_num=0):
-        # TODO rm this extra CMD packet
-        self._out_ep.write(bytes([cmd, model_num, tensor_num]))
-        self._out_ep.write(data_bytes, 1000)
-        if (len(data_bytes) % self._max_block_size) == 0:
-            self._out_ep.write(bytearray(), 1000)
-    @handle_usb_error
-    def _upload_data(self, cmd, tensor_num=0, model_num=0):
-        read_data = bytearray()
-        self._out_ep.write(bytes([cmd, model_num, tensor_num]), self._timeout)
-        buff = usb.util.create_buffer(self._max_block_size)
-        read_len = self._dev.read(self._in_ep, buff, 10000)
-        read_data.extend(buff[:read_len])
-        while read_len == self._max_block_size:
-            read_len = self._dev.read(self._in_ep, buff, 10000)
-            read_data.extend(buff[:read_len])
-        return read_data
-    def _clear_error(self):
-        self._dev.clear_halt(self._out_ep)
-        self._dev.clear_halt(self._in_ep)
-    def connect(self):
-        self._dev = None
-        while self._dev is None:
-            # TODO - more checks that we have the right device..
-            self._dev = usb.core.find(idVendor=0x20B1, product="xAISRV")
-        # set the active configuration. With no arguments, the first
-        # configuration will be the active one
-        self._dev.set_configuration()
-        # get an endpoint instance
-        cfg = self._dev.get_active_configuration()
-        intf = cfg[(0, 0)]
-        self._out_ep = usb.util.find_descriptor(
-            intf,
-            # match the first OUT endpoint
-            custom_match=lambda e: usb.util.endpoint_direction(e.bEndpointAddress)
-            == usb.util.ENDPOINT_OUT,
-        )
-        self._in_ep = usb.util.find_descriptor(
-            intf,
-            # match the first IN endpoint
-            custom_match=lambda e: usb.util.endpoint_direction(e.bEndpointAddress)
-            == usb.util.ENDPOINT_IN,
-        )
-        assert self._out_ep is not None
-        assert self._in_ep is not None
-        print("Connected to XCORE_IO_SERVER via USB")
-    # TODO move to super()
-    def start_inference(self):
-        # Send cmd
-        self._out_ep.write(bytes([IOSERVER_INVOKE, 0, 0]), 1000)
-        # Send out a 0 length packet
-        self._out_ep.write(bytes([]), 1000)
-    def reset(self):
-        # Send cmd
-        self._out_ep.write(bytes([IOSERVER_RESET, 0, 0]), 1000)
-        # Send out a 0 length packet
-        self._out_ep.write(bytes([]), 1000)
+# Copyright (c) 2020, XMOS Ltd, All rights reserved
+import usb
+from typing import Tuple
+import numpy as np
+IOSERVER_INVOKE = int(0x01)
+IOSERVER_TENSOR_SEND_OUTPUT = int(0x02)
+IOSERVER_TENSOR_RECV_INPUT = int(0x03)
+IOSERVER_RESET = int(0x07)
+IOSERVER_EXIT = int(0x08)
+class IOServerError(Exception):
+    """Error from device"""
+    pass
+class IOError(IOServerError):
+    """IO Error from device"""
+    pass
+def handle_usb_error(func):
+    def wrapper(*args, **kwargs):
+        try:
+            return func(*args, **kwargs)
+        except usb.core.USBError as e:
+            print(f"USB error {e}")
+            if e.backend_error_code == usb.backend.libusb1.LIBUSB_ERROR_PIPE:
+                raise IOError()
+            else:
+                raise IOServerError(f"Wow...") from e
+    return wrapper
+class IOServer:
+    def __init__(self, output_details: Tuple[dict, ...] = None, timeout=5000):
+        self.__out_ep = None
+        self.__in_ep = None
+        self._dev = None
+        self._output_details = output_details
+        self._timeout = timeout
+        self._max_block_size = 512  # TODO read from (usb) device?
+        super().__init__()
+    def bytes_to_arr(self, data_bytes, tensor_num):
+        if self._output_details:
+            d = self._output_details[tensor_num]
+            s = d["shape"]
+            return np.frombuffer(data_bytes, dtype=d["dtype"])[: np.prod(s)].reshape(s)
+        return np.frombuffer(data_bytes, dtype=np.uint8)
+    def write_input_tensor(self, raw_img, tensor_num=0, model_num=0):
+        self._download_data(
+            IOSERVER_TENSOR_RECV_INPUT,
+            raw_img,
+            tensor_num=tensor_num,
+            model_num=model_num,
+        )
+    def read_output_tensor(self, tensor_num=0, model_num=0):
+        # Retrieve result from device
+        data_read = self._upload_data(
+            IOSERVER_TENSOR_SEND_OUTPUT,
+            model_num=model_num,
+            tensor_num=tensor_num,
+        )
+        assert type(data_read) is bytearray
+        return self.bytes_to_arr(data_read, tensor_num)
+    def close(self):
+        if self._dev is not None:
+            self._dev.write(self._out_ep, bytes([IOSERVER_EXIT, 0, 0]), 1000)
+            usb.util.dispose_resources(self._dev)
+            self._dev = None
+    @handle_usb_error
+    def _download_data(self, cmd, data_bytes, tensor_num=0, model_num=0):
+        # TODO rm this extra CMD packet
+        self._out_ep.write(bytes([cmd, model_num, tensor_num]))
+        self._out_ep.write(data_bytes, 1000)
+        if (len(data_bytes) % self._max_block_size) == 0:
+            self._out_ep.write(bytearray(), 1000)
+    @handle_usb_error
+    def _upload_data(self, cmd, tensor_num=0, model_num=0):
+        read_data = bytearray()
+        self._out_ep.write(bytes([cmd, model_num, tensor_num]), self._timeout)
+        buff = usb.util.create_buffer(self._max_block_size)
+        read_len = self._dev.read(self._in_ep, buff, 10000)
+        read_data.extend(buff[:read_len])
+        while read_len == self._max_block_size:
+            read_len = self._dev.read(self._in_ep, buff, 10000)
+            read_data.extend(buff[:read_len])
+        return read_data
+    def _clear_error(self):
+        self._dev.clear_halt(self._out_ep)
+        self._dev.clear_halt(self._in_ep)
+    def connect(self):
+        self._dev = None
+        while self._dev is None:
+            # TODO - more checks that we have the right device..
+            self._dev = usb.core.find(idVendor=0x20B1, product="xAISRV")
+        # set the active configuration. With no arguments, the first
+        # configuration will be the active one
+        self._dev.set_configuration()
+        # get an endpoint instance
+        cfg = self._dev.get_active_configuration()
+        intf = cfg[(0, 0)]
+        self._out_ep = usb.util.find_descriptor(
+            intf,
+            # match the first OUT endpoint
+            custom_match=lambda e: usb.util.endpoint_direction(e.bEndpointAddress)
+            == usb.util.ENDPOINT_OUT,
+        )
+        self._in_ep = usb.util.find_descriptor(
+            intf,
+            # match the first IN endpoint
+            custom_match=lambda e: usb.util.endpoint_direction(e.bEndpointAddress)
+            == usb.util.ENDPOINT_IN,
+        )
+        assert self._out_ep is not None
+        assert self._in_ep is not None
+        print("Connected to XCORE_IO_SERVER via USB")
+    # TODO move to super()
+    def start_inference(self):
+        # Send cmd
+        self._out_ep.write(bytes([IOSERVER_INVOKE, 0, 0]), 1000)
+        # Send out a 0 length packet
+        self._out_ep.write(bytes([]), 1000)
+    def reset(self):
+        # Send cmd
+        self._out_ep.write(bytes([IOSERVER_RESET, 0, 0]), 1000)
+        # Send out a 0 length packet
+        self._out_ep.write(bytes([]), 1000)

xmos_ai_tools/runtime/buildfiles/aitoolslib.cmake CHANGED Viewed

@@ -1,13 +1,13 @@
-set(XMOS_AITOOLSLIB_DEFINITIONS
-        "TF_LITE_STATIC_MEMORY"
-		"TF_LITE_STRIP_ERROR_STRINGS"
-		"XCORE"
-		"NO_INTERPRETER"
-    )
-if("${APP_BUILD_ARCH}" STREQUAL xs3a OR ${CMAKE_SYSTEM_PROCESSOR} STREQUAL XCORE_XS3A)
-	set(XMOS_AITOOLSLIB_LIBRARIES "${CMAKE_CURRENT_LIST_DIR}/../lib/libxtflitemicro.a")
-else()
-	set(XMOS_AITOOLSLIB_LIBRARIES "${CMAKE_CURRENT_LIST_DIR}/../lib/libhost_xtflitemicro.a")
-endif()
-set(XMOS_AITOOLSLIB_INCLUDES "${CMAKE_CURRENT_LIST_DIR}/../include")
+set(XMOS_AITOOLSLIB_DEFINITIONS
+        "TF_LITE_STATIC_MEMORY"
+		"TF_LITE_STRIP_ERROR_STRINGS"
+		"XCORE"
+		"NO_INTERPRETER"
+    )
+if("${APP_BUILD_ARCH}" STREQUAL xs3a OR ${CMAKE_SYSTEM_PROCESSOR} STREQUAL XCORE_XS3A)
+	set(XMOS_AITOOLSLIB_LIBRARIES "${CMAKE_CURRENT_LIST_DIR}/../lib/libxtflitemicro.a")
+else()
+	set(XMOS_AITOOLSLIB_LIBRARIES "${CMAKE_CURRENT_LIST_DIR}/../lib/libhost_xtflitemicro.a")
+endif()
+set(XMOS_AITOOLSLIB_INCLUDES "${CMAKE_CURRENT_LIST_DIR}/../include")

xmos_ai_tools/runtime/buildfiles/aitoolslib.make CHANGED Viewed

@@ -1,8 +1,8 @@
-XMOS_AITOOLSLIB_DEFINITIONS = \
--DTF_LITE_STATIC_MEMORY \
--DTF_LITE_STRIP_ERROR_STRINGS \
--DXCORE \
--DNO_INTERPRETER
-XMOS_AITOOLSLIB_LIBRARIES = $(XMOS_AITOOLSLIB_PATH)/lib/libxtflitemicro.a
-XMOS_AITOOLSLIB_INCLUDES = -I$(XMOS_AITOOLSLIB_PATH)/include
+XMOS_AITOOLSLIB_DEFINITIONS = \
+-DTF_LITE_STATIC_MEMORY \
+-DTF_LITE_STRIP_ERROR_STRINGS \
+-DXCORE \
+-DNO_INTERPRETER
+XMOS_AITOOLSLIB_LIBRARIES = $(XMOS_AITOOLSLIB_PATH)/lib/libxtflitemicro.a
+XMOS_AITOOLSLIB_INCLUDES = -I$(XMOS_AITOOLSLIB_PATH)/include

xmos_ai_tools/runtime/include/flash_server.h CHANGED Viewed

@@ -26,9 +26,8 @@ typedef struct flash {
 typedef enum flash_command {
   FLASH_READ_PARAMETERS =
       0, ///< Read a set of parameters.   // TODO: share with lib_tflite_micro
-  FLASH_READ_MODEL = 1, ///< Read a whole model.
-  FLASH_READ_OPERATORS =
-      2, ///< Read the binary for an operator - future extension
+  FLASH_READ_PARAMETERS_ASYNC = 1, ///< Read parameters asynchronously.
+  FLASH_READ_SYNCHRONIZE      = 2, ///< Complete async read.
   FLASH_READ_XIP =
       3, ///< Read code to execute-in-place through L2 cache - future extension
   FLASH_SERVER_QUIT = 4,

xmos_ai_tools/runtime/include/lib_nn/api/add_int16_transform.h CHANGED Viewed

@@ -29,7 +29,8 @@
 C_API int add_int16_tensor_blob(void *output,
                           float input1_scaler,
                           float input2_scaler,
-                          float output_scaler);
+                          float output_scaler,
+                          char *err_msg);
 /**
  * Macro that calculates the number of int16_t that should be allocated to

xmos_ai_tools/runtime/include/lib_nn/api/dequantize_int16_transform.h CHANGED Viewed

@@ -21,7 +21,8 @@
  * @returns 1 on success, 0 on fail (fallback required)
  */
 C_API int dequantize_int16_tensor_blob(void *output,
-                                 float input_scaler);
+                                 float input_scaler,
+                                 char *err_msg);
 /**
  * Macro that calculates the number of int16_t that should be allocated to

xmos_ai_tools/runtime/include/lib_nn/api/multiply_int16_transform.h CHANGED Viewed

@@ -25,7 +25,8 @@
  */
 C_API int requantize_int16_tensor_blob(void *output,
                                  float input_scaler,
-                                 float output_scaler);
+                                 float output_scaler,
+                                 char *err_msg);
 /**
  * Macro that calculates the number of int16_t that should be allocated to
  * store the output of ``quantise_int16_tensor_blob()``
@@ -56,7 +57,8 @@ C_API int requantize_int16_tensor_blob(void *output,
 C_API int multiply_int16_tensor_blob(void *output,
                                float input1_scaler,
                                float input2_scaler,
-                               float output_scaler);
+                               float output_scaler,
+                               char *err_msg);
 /**
  * Macro that calculates the number of int16_t that should be allocated to

xmos_ai_tools/runtime/include/lib_nn/api/nn_api.h CHANGED Viewed

@@ -8,6 +8,8 @@
 #define C_API EXTERN_C
+#define ERR_MSG_DESCRIPTOR_FAIL_BYTES() (128)
 #ifndef __has_builtin
 #define __has_builtin(x) 0
 #endif

xmos_ai_tools/runtime/include/lib_nn/api/nn_layers.h CHANGED Viewed

@@ -109,50 +109,6 @@ typedef struct padding_sizes_t {
   int32_t right;
 } padding_sizes_t;
-/**
- * @brief Execute @oper{pad_prepare} function.
- *
- * `plan` points to the output vector @tensor{y} with length @math{N}.
- *
- * `p` struct describing the padding to be applied to the input tensor.
- *
- * `x` parameters describing the input tensor to be padded.
- *
- * `bytes_per_pixel` the bytes per pixel for tensor x.
- *
- * @param plan             [out]  The output vector @tensor{y}
- * @param p                [in]   The input vector @tensor{x}
- * @param x                [in]   Look-up table @tensor{T}
- * @param bytes_per_pixel  [in]   Length @math{N} of input and output vectors
- */
-C_API void pad_prepare(nn_pad_plan_t *plan, const padding_sizes_t *p,
-                       const nn_image_params_t *x,
-                       const unsigned bytes_per_pixel);
-/**
- * @brief Execute @oper{pad_run} job.
- *
- * See @oper_ref{pad_run} for more details about the @oper{requantize_16_to_8}
- * operator.
- *
- * `Y` points to the output vector @tensor{y}.
- *
- * `X` points to the input vector @tensor{x}.
- *
- * `plan` points to the (initialized) plan.
- *
- * @requires_word_alignment{Y,X}
- *
- * @param y   [out]    The output vector @tensor{y}
- * @param x   [in]     The input vector @tensor{x}
- * @param plan [in]    The prameters describing how to pad.
- */
-void pad_run(char *y, char *x, const nn_pad_plan_t *p, uint32_t pad_value);
-void pad_ref(char *y, char *x, const padding_sizes_t *p,
-             const nn_image_params_t *xp, const unsigned bytes_per_pixel,
-             uint32_t pad_value);
 /**
  * Func to calculate n_3
  */
@@ -336,12 +292,16 @@ void softmax_generate_exp_lut(int zero_point, float scale, float *lut);
 void softmax_ref(int8_t *Y, const int8_t *X, const float zero_point,
                  const float scale, const int length);
-void slice_memcpy(int8_t *dst, int8_t *src, int32_t *in_offsets,
-                  int32_t *out_offsets, int32_t *begin, int32_t *end,
-                  void (*memcpy_func)(void *, void *, size_t));
+void softmax_single(int8_t *Y, const int8_t *X, const float *lut,
+                    const int offset);
+void mean_int8(const int8_t *input, int8_t *output, const int start_dim_size,
+               const int mean_dim_size, const int end_dim_size,
+               const float in_zero_point, const float out_zero_point,
+               const float scale_mul);
+void mean_int16(const int16_t *input, int16_t *output, const int start_dim_size,
+                const int mean_dim_size, const int end_dim_size,
+                const float scale_mul);
-void slice_memcpy_get_params(int *begin_dst, int *end_dst, int *in_offsets,
-                             int *out_offsets, int *shape_dst, const int *begin,
-                             const int *size, const int *shape,
-                             const int dtype_size, const int rank);
 #endif // LAYERS_H_

xmos_ai_tools/runtime/include/lib_nn/api/nn_op_utils.h CHANGED Viewed

@@ -8,6 +8,9 @@
 #include "xs3_vpu.h"
+C_API int calculateAlignedThreadSplit(int tc, int split_size, int split_start[], int split_end[]);
+C_API int calculateThreadSplit(int tc, int split_size, int split_start[], int split_end[], int alignment);
 #ifdef __XC__
 extern "C" {
 #endif

xmos_ai_tools/runtime/include/lib_nn/api/quadratic_approximation.h CHANGED Viewed

@@ -78,5 +78,6 @@ C_API float approximation_function_tanh(float x);
 C_API float approximation_function_logistics(float x);
 C_API float approximation_function_elu(float x);
 C_API float approximation_function_relu(float x);
+C_API float approximation_function_relu6(float x);
 #endif

xmos_ai_tools/runtime/include/lib_nn/api/version.h CHANGED Viewed

@@ -1,11 +1,11 @@
-// Copyright (c) 2020, XMOS Ltd, All rights reserved
+// Copyright (c) 2024, XMOS Ltd, All rights reserved
 #ifndef LIB_NN_VERSION_H_
 #define LIB_NN_VERSION_H_
 namespace lib_nn {
 static const unsigned major_version = 0;
-static const unsigned minor_version = 3;
+static const unsigned minor_version = 4;
 static const unsigned patch_version = 0;
 }  // namespace lib_nn

xmos_ai_tools/runtime/include/lib_nn/api/vpu_memmove_word_aligned.h ADDED Viewed

@@ -0,0 +1,15 @@
+#ifndef _vpu_memmove_word_aligned_h_
+#define _vpu_memmove_word_aligned_h_
+/**
+ * Function that copies a block of memory. Both source and destination
+ * address must be word aligned. Any number of bytes can be copied. There
+ * may be an overlap between the destination and source.
+ *
+ * @param     dst         Destination address, must be word aligned.
+ * @param     src         Source address, must be word aligned.
+ * @param     byte_count  Number of bytes to copy - may be zero
+ */
+void vpu_memmove_word_aligned(void * dst, const void * src, unsigned int byte_count);
+#endif

xmos_ai_tools/runtime/include/lib_nn/api/vpu_memset_256.h ADDED Viewed

@@ -0,0 +1,55 @@
+#include <stdint.h>
+#ifndef _vpu_memset_256_h_
+#define _vpu_memset_256_h_
+/**
+ * Function that replicates a vector. The source address must be word
+ * aligned, the destination address is assumed to be aligned with the
+ * replication pattern in the source. Any number of bytes can be copied.
+ * There should not be an overlap between the destination and source.
+ *
+ * It is assumed that the source address contains 32 replicated bytes (if
+ * the destination address is byte aligned), or that it contains 16
+ * replicated shorts (if the destination address is 16-bit aligned), or
+ * that it contains 8 replicated ints.
+ *
+ * broadcast_32_to_256() and BROADCAST_8_TO_32() can be used to
+ * create the source vector
+ *
+ * @param     dst         Destination address
+ * @param     src         Source address, must be word aligned.
+ * @param     byte_count  Number of bytes to copy - may be zero
+ */
+void vpu_memset_256(void *dst, const void *src, unsigned int byte_count);
+/**
+ * Function that replicates an int over a vector. The vector must be
+ * aligned on an 8-byte boundary. In order to replicate a byte or short over
+ * a vector, combine this with a call to BROADCAST_8_TO_32() or
+ * BROADCAST_16_TO_32(). Declare the vector as a uint64_t x[] in order to
+ * guarantee 8-byte alignment.
+ *
+ * @param     dst         Destination address, must be 8-byte aligned
+ * @param     from        Value to be replicated
+ */
+void broadcast_32_to_256(void *dst, uint32_t from);
+/**
+ * Macro that replicates a byte over an int.
+ * Use with broadcast_32_to_256() in order to replicate a byte over a vector
+ */
+#define BROADCAST_8_TO_32(f) (((uint8_t)f) * 0x01010101)
+/**
+ * Macro that replicates a short over an int
+ * Use with broadcast_32_to_256() in order to replicate a short over a vector
+ */
+#define BROADCAST_16_TO_32(f) (((uint16_t)f) * 0x00010001)
+/**
+ * Macro that replicates a byte over a short
+ */
+#define BROADCAST_8_TO_16(f) (((uint8_t)f) * 0x00000101)
+#endif

xmos_ai_tools/runtime/include/lib_tflite_micro/api/fast_flash.h CHANGED Viewed

@@ -3,6 +3,7 @@
 #include <quadflash.h>
+#ifdef __XC__
 /** Fast flash library.
  * Before calling any of the functions in here, lib_quad_flash must be initialised as normal by using
  * fl_connectToDevice(qspi, flash_spec, n_flash_spec).
@@ -44,4 +45,9 @@ int fast_flash_init(fl_QSPIPorts &qspi);
  */
 void fast_flash_read(fl_QSPIPorts &qspi, unsigned addr, unsigned word_count, unsigned read_data[], chanend ?c_data_out);
+#else
+int fast_flash_init(fl_QSPIPorts *qspi);
+void fast_flash_read(fl_QSPIPorts *qspi, unsigned addr, unsigned word_count, unsigned read_data[], chanend_t c_data_out);
+#endif
 #endif