Merge pull request #312 from v923z/norm

v923z · web-flow · commit 5f716a788343 · 2021-02-09T18:57:11.000+01:00
improved linalg.norm
diff --git a/code/ndarray.c b/code/ndarray.c
@@ -632,7 +632,7 @@ ndarray_obj_t *ndarray_new_dense_ndarray(uint8_t ndim, size_t *shape, uint8_t dt
     int32_t *strides = m_new(int32_t, ULAB_MAX_DIMS);
     strides[ULAB_MAX_DIMS-1] = dtype == NDARRAY_BOOL ? 1 : mp_binary_get_size('@', dtype, NULL);
     for(size_t i=ULAB_MAX_DIMS; i > 1; i--) {
-        strides[i-2] = strides[i-1] * shape[i-1];
+        strides[i-2] = strides[i-1] * MAX(1, shape[i-1]);
     }
     return ndarray_new_ndarray(ndim, shape, strides, dtype);
 }
diff --git a/code/numpy/linalg/linalg.c b/code/numpy/linalg/linalg.c
@@ -354,7 +354,23 @@ MP_DEFINE_CONST_FUN_OBJ_1(linalg_inv_obj, linalg_inv);
 //|    ...
 //|
 
-static mp_obj_t linalg_norm(mp_obj_t x) {
+static mp_obj_t linalg_norm(size_t n_args, const mp_obj_t *pos_args, mp_map_t *kw_args) {
+    static const mp_arg_t allowed_args[] = {
+        { MP_QSTR_, MP_ARG_REQUIRED | MP_ARG_OBJ, { .u_rom_obj = mp_const_none} } ,
+        { MP_QSTR_axis, MP_ARG_OBJ, { .u_rom_obj = mp_const_none } },
+    };
+
+    mp_arg_val_t args[MP_ARRAY_SIZE(allowed_args)];
+    mp_arg_parse_all(n_args, pos_args, kw_args, MP_ARRAY_SIZE(allowed_args), allowed_args, args);
+
+    mp_obj_t x = args[0].u_obj;
+    mp_obj_t axis = args[1].u_obj;
+    if((axis != mp_const_none) && (!MP_OBJ_IS_INT(axis))) {
+        mp_raise_TypeError(translate("axis must be None, or an integer"));
+    }
+
+
+// static mp_obj_t linalg_norm(mp_obj_t x) {
     mp_float_t dot = 0.0, value;
     size_t count = 1;
 
@@ -370,33 +386,74 @@ static mp_obj_t linalg_norm(mp_obj_t x) {
         return mp_obj_new_float(MICROPY_FLOAT_C_FUN(sqrt)(dot * (count - 1)));
     } else if(MP_OBJ_IS_TYPE(x, &ulab_ndarray_type)) {
         ndarray_obj_t *ndarray = MP_OBJ_TO_PTR(x);
-        if((ndarray->ndim != 1) && (ndarray->ndim != 2)) {
-            mp_raise_ValueError(translate("norm is defined for 1D and 2D arrays"));
-        }
         uint8_t *array = (uint8_t *)ndarray->array;
-
+        // always get a float, so that we don't have to resolve the dtype later
         mp_float_t (*func)(void *) = ndarray_get_float_function(ndarray->dtype);
+        shape_strides _shape_strides = tools_reduce_axes(ndarray, axis);
+        mp_float_t *rarray = NULL;
+        ndarray_obj_t *results = NULL;
+        if((axis != mp_const_none) && (ndarray->ndim > 1)) {
+            results = ndarray_new_dense_ndarray(MAX(1, ndarray->ndim-1), _shape_strides.shape, NDARRAY_FLOAT);
+            rarray = results->array;
+        } else {
+            rarray = m_new(mp_float_t, 1);
+        }
 
-        size_t k = 0;
+        #if ULAB_MAX_DIMS > 3
+        size_t i = 0;
         do {
-            size_t l = 0;
+        #endif
+            #if ULAB_MAX_DIMS > 2
+            size_t j = 0;
             do {
-                value = func(array);
-                dot = dot + (value * value - dot) / count++;
-                array += ndarray->strides[ULAB_MAX_DIMS - 1];
-                l++;
-            } while(l < ndarray->shape[ULAB_MAX_DIMS - 1]);
-            array -= ndarray->strides[ULAB_MAX_DIMS - 1] * ndarray->shape[ULAB_MAX_DIMS - 1];
-            array += ndarray->strides[ULAB_MAX_DIMS - 2];
-            k++;
-        } while(k < ndarray->shape[ULAB_MAX_DIMS - 2]);
-        return mp_obj_new_float(MICROPY_FLOAT_C_FUN(sqrt)(dot * (count - 1)));
-    } else {
-        mp_raise_TypeError(translate("argument must be an interable or ndarray"));
+            #endif
+                #if ULAB_MAX_DIMS > 1
+                size_t k = 0;
+                do {
+                #endif
+                    size_t l = 0;
+                    if(axis != mp_const_none) {
+                        count = 1;
+                        dot = 0.0;
+                    }
+                    do {
+                        value = func(array);
+                        dot = dot + (value * value - dot) / count++;
+                        array += _shape_strides.strides[0];
+                        l++;
+                    } while(l < _shape_strides.shape[0]);
+                    *rarray = MICROPY_FLOAT_C_FUN(sqrt)(dot * (count - 1));
+                    if(results != NULL) {
+                        rarray++;
+                    }
+                #if ULAB_MAX_DIMS > 1
+                    array -= _shape_strides.strides[0] * _shape_strides.shape[0];
+                    array += _shape_strides.strides[ULAB_MAX_DIMS - 1];
+                    k++;
+                } while(k < _shape_strides.shape[ULAB_MAX_DIMS - 1]);
+                #endif
+            #if ULAB_MAX_DIMS > 2
+                array -= _shape_strides.strides[ULAB_MAX_DIMS - 1] * _shape_strides.shape[ULAB_MAX_DIMS-1];
+                array += _shape_strides.strides[ULAB_MAX_DIMS - 2];
+                j++;
+            } while(j < _shape_strides.shape[ULAB_MAX_DIMS - 2]);
+            #endif
+        #if ULAB_MAX_DIMS > 3
+            array -= _shape_strides.strides[ULAB_MAX_DIMS - 2] * _shape_strides.shape[ULAB_MAX_DIMS-2];
+            array += _shape_strides.strides[ULAB_MAX_DIMS - 3];
+            i++;
+        } while(i < _shape_strides.shape[ULAB_MAX_DIMS - 3]);
+        #endif
+        if(results == NULL) {
+            return mp_obj_new_float(*rarray);
+        }
+        return results;
     }
+    return mp_const_none; // we should never reach this point
 }
 
-MP_DEFINE_CONST_FUN_OBJ_1(linalg_norm_obj, linalg_norm);
+MP_DEFINE_CONST_FUN_OBJ_KW(linalg_norm_obj, 1, linalg_norm);
+// MP_DEFINE_CONST_FUN_OBJ_1(linalg_norm_obj, linalg_norm);
 
 #if ULAB_MAX_DIMS > 1
 #if ULAB_LINALG_HAS_TRACE
diff --git a/code/numpy/linalg/linalg.h b/code/numpy/linalg/linalg.h
@@ -24,5 +24,5 @@ MP_DECLARE_CONST_FUN_OBJ_1(linalg_eig_obj);
 MP_DECLARE_CONST_FUN_OBJ_1(linalg_inv_obj);
 MP_DECLARE_CONST_FUN_OBJ_1(linalg_trace_obj);
 MP_DECLARE_CONST_FUN_OBJ_2(linalg_dot_obj);
-MP_DECLARE_CONST_FUN_OBJ_2(linalg_norm_obj);
+MP_DECLARE_CONST_FUN_OBJ_KW(linalg_norm_obj);
 #endif
diff --git a/code/numpy/numerical/numerical.c b/code/numpy/numerical/numerical.c
@@ -63,38 +63,6 @@ static void numerical_reduce_axes(ndarray_obj_t *ndarray, int8_t axis, size_t *s
     }
 }
 
-static shape_strides numerical_reduce_axes_(ndarray_obj_t *ndarray, mp_obj_t axis) {
-    // TODO: replace numerical_reduce_axes with this function, wherever applicable
-    int8_t ax = mp_obj_get_int(axis);
-    if(ax < 0) ax += ndarray->ndim;
-    if((ax < 0) || (ax > ndarray->ndim - 1)) {
-        mp_raise_ValueError(translate("index out of range"));
-    }
-    shape_strides _shape_strides;
-    _shape_strides.index = ULAB_MAX_DIMS - ndarray->ndim + ax;
-    size_t *shape = m_new(size_t, ULAB_MAX_DIMS);
-    memset(shape, 0, sizeof(size_t)*ULAB_MAX_DIMS);
-    _shape_strides.shape = shape;
-    int32_t *strides = m_new(int32_t, ULAB_MAX_DIMS);
-    memset(strides, 0, sizeof(uint32_t)*ULAB_MAX_DIMS);
-    _shape_strides.strides = strides;
-    if((ndarray->ndim == 1) && (_shape_strides.axis == 0)) {
-        _shape_strides.index = 0;
-        _shape_strides.shape[ULAB_MAX_DIMS - 1] = 1;
-    } else {
-        for(uint8_t i = ULAB_MAX_DIMS - 1; i > 0; i--) {
-            if(i > _shape_strides.index) {
-                _shape_strides.shape[i] = ndarray->shape[i];
-                _shape_strides.strides[i] = ndarray->strides[i];
-            } else {
-                _shape_strides.shape[i] = ndarray->shape[i-1];
-                _shape_strides.strides[i] = ndarray->strides[i-1];
-            }
-        }
-    }
-    return _shape_strides;
-}
-
 #if ULAB_NUMPY_HAS_ALL | ULAB_NUMPY_HAS_ANY
 static mp_obj_t numerical_all_any(mp_obj_t oin, mp_obj_t axis, uint8_t optype) {
     bool anytype = optype == NUMERICAL_ALL ? 1 : 0;
@@ -130,25 +98,25 @@ static mp_obj_t numerical_all_any(mp_obj_t oin, mp_obj_t axis, uint8_t optype) {
                             l++;
                         } while(l < ndarray->shape[ULAB_MAX_DIMS - 1]);
                     #if ULAB_MAX_DIMS > 1
-                        array -= ndarray->strides[ULAB_MAX_DIMS - 1] * ndarray->shape[ULAB_MAX_DIMS-1];
+                        array -= ndarray->strides[ULAB_MAX_DIMS - 1] * ndarray->shape[ULAB_MAX_DIMS - 1];
                         array += ndarray->strides[ULAB_MAX_DIMS - 2];
                         k++;
                     } while(k < ndarray->shape[ULAB_MAX_DIMS - 2]);
                     #endif
                 #if ULAB_MAX_DIMS > 2
-                    array -= ndarray->strides[ULAB_MAX_DIMS - 2] * ndarray->shape[ULAB_MAX_DIMS-2];
+                    array -= ndarray->strides[ULAB_MAX_DIMS - 2] * ndarray->shape[ULAB_MAX_DIMS - 2];
                     array += ndarray->strides[ULAB_MAX_DIMS - 3];
                     j++;
                 } while(j < ndarray->shape[ULAB_MAX_DIMS - 3]);
                 #endif
             #if ULAB_MAX_DIMS > 3
-                array -= ndarray->strides[ULAB_MAX_DIMS - 3] * ndarray->shape[ULAB_MAX_DIMS-3];
+                array -= ndarray->strides[ULAB_MAX_DIMS - 3] * ndarray->shape[ULAB_MAX_DIMS - 3];
                 array += ndarray->strides[ULAB_MAX_DIMS - 4];
                 i++;
             } while(i < ndarray->shape[ULAB_MAX_DIMS - 4]);
             #endif
         } else {
-            shape_strides _shape_strides = numerical_reduce_axes_(ndarray, axis);
+            shape_strides _shape_strides = tools_reduce_axes(ndarray, axis);
             ndarray_obj_t *results = ndarray_new_dense_ndarray(MAX(1, ndarray->ndim-1), _shape_strides.shape, NDARRAY_BOOL);
             uint8_t *rarray = (uint8_t *)results->array;
             if(optype == NUMERICAL_ALL) {
@@ -173,33 +141,33 @@ static mp_obj_t numerical_all_any(mp_obj_t oin, mp_obj_t axis, uint8_t optype) {
                                 // optype == NUMERICAL_ANY
                                 *rarray = 1;
                                 // since we are breaking out of the loop, move the pointer forward
-                                array += ndarray->strides[_shape_strides.index] * (ndarray->shape[_shape_strides.index] - l);
+                                array += _shape_strides.strides[0] * (_shape_strides.shape[0] - l);
                                 break;
                             } else if((value == MICROPY_FLOAT_CONST(0.0)) & anytype) {
                                 // optype == NUMERICAL_ALL
                                 *rarray = 0;
                                 // since we are breaking out of the loop, move the pointer forward
-                                array += ndarray->strides[_shape_strides.index] * (ndarray->shape[_shape_strides.index] - l);
+                                array += _shape_strides.strides[0] * (_shape_strides.shape[0] - l);
                                 break;
                             }
-                            array += ndarray->strides[_shape_strides.index];
+                            array += _shape_strides.strides[0];
                             l++;
-                        } while(l < ndarray->shape[_shape_strides.index]);
+                        } while(l < _shape_strides.shape[0]);
                     #if ULAB_MAX_DIMS > 1
                         rarray++;
-                        array -= ndarray->strides[_shape_strides.index] * ndarray->shape[_shape_strides.index];
+                        array -= _shape_strides.strides[0] * _shape_strides.shape[0];
                         array += _shape_strides.strides[ULAB_MAX_DIMS - 1];
                         k++;
                     } while(k < _shape_strides.shape[ULAB_MAX_DIMS - 1]);
                     #endif
                 #if ULAB_MAX_DIMS > 2
-                    array -= _shape_strides.strides[ULAB_MAX_DIMS - 1] * _shape_strides.shape[ULAB_MAX_DIMS-1];
+                    array -= _shape_strides.strides[ULAB_MAX_DIMS - 1] * _shape_strides.shape[ULAB_MAX_DIMS - 1];
                     array += _shape_strides.strides[ULAB_MAX_DIMS - 2];
                     j++;
                 } while(j < _shape_strides.shape[ULAB_MAX_DIMS - 2]);
                 #endif
             #if ULAB_MAX_DIMS > 3
-                array -= _shape_strides.strides[ULAB_MAX_DIMS - 2] * _shape_strides.shape[ULAB_MAX_DIMS-2];
+                array -= _shape_strides.strides[ULAB_MAX_DIMS - 2] * _shape_strides.shape[ULAB_MAX_DIMS - 2];
                 array += _shape_strides.strides[ULAB_MAX_DIMS - 3];
                 i++;
             } while(i < _shape_strides.shape[ULAB_MAX_DIMS - 3])
diff --git a/code/numpy/numerical/numerical.h b/code/numpy/numerical/numerical.h
@@ -17,13 +17,6 @@
 
 // TODO: implement cumsum
 
-typedef struct {
-    uint8_t index;
-    int8_t axis;
-    size_t *shape;
-    int32_t *strides;
-} shape_strides;
-
 #define RUN_ARGMIN1(ndarray, type, array, results, rarray, index, op)\
 ({\
     uint16_t best_index = 0;\
diff --git a/code/ulab.c b/code/ulab.c
@@ -33,7 +33,7 @@
 
 #include "user/user.h"
 
-#define ULAB_VERSION 2.3.2
+#define ULAB_VERSION 2.3.3
 #define xstr(s) str(s)
 #define str(s) #s
 #define ULAB_VERSION_STRING xstr(ULAB_VERSION) xstr(-) xstr(ULAB_MAX_DIMS) xstr(D)
diff --git a/code/ulab_tools.c b/code/ulab_tools.c
@@ -9,7 +9,7 @@
  */
 
 
-
+#include <string.h>
 #include "py/runtime.h"
 
 #include "ulab.h"
@@ -158,3 +158,36 @@ void *ndarray_set_float_function(uint8_t dtype) {
     }
 }
 #endif /* NDARRAY_BINARY_USES_FUN_POINTER */
+
+shape_strides tools_reduce_axes(ndarray_obj_t *ndarray, mp_obj_t axis) {
+    // Returns freshly allocated copies of ndarray's shape and strides. If axis is an integer,
+    // that axis is moved to position 0, and the entries to its left are shifted right by one.
+    // TODO: replace numerical_reduce_axes with this function, wherever applicable
+    if(!mp_obj_is_int(axis) && (axis != mp_const_none)) {
+        mp_raise_TypeError(translate("axis must be None, or an integer"));
+    }
+    shape_strides _shape_strides = { 0 }; // index and axis carry no information here; keep them defined
+    _shape_strides.shape = m_new(size_t, ULAB_MAX_DIMS);
+    _shape_strides.strides = m_new(int32_t, ULAB_MAX_DIMS);
+
+    memcpy(_shape_strides.shape, ndarray->shape, sizeof(size_t) * ULAB_MAX_DIMS);
+    memcpy(_shape_strides.strides, ndarray->strides, sizeof(int32_t) * ULAB_MAX_DIMS);
+    // for axis == mp_const_none, simply return the original shape and strides
+    if(axis != mp_const_none) {
+        mp_int_t ax = mp_obj_get_int(axis); // full width, so that a large value cannot wrap into the valid range
+        if(ax < 0) ax += ndarray->ndim;
+        if((ax < 0) || (ax > ndarray->ndim - 1)) {
+            mp_raise_ValueError(translate("index out of range"));
+        }
+        // move the axis to the leftmost position, and align everything else to the right
+        uint8_t index = (uint8_t)(ULAB_MAX_DIMS - ndarray->ndim + ax);
+        _shape_strides.shape[0] = ndarray->shape[index];
+        _shape_strides.strides[0] = ndarray->strides[index];
+        for(uint8_t i = 0; i < index; i++) {
+            // read from the untouched ndarray, so the shift cannot overwrite its own input
+            _shape_strides.shape[i + 1] = ndarray->shape[i];
+            _shape_strides.strides[i + 1] = ndarray->strides[i];
+        }
+    }
+    return _shape_strides;
+}
diff --git a/code/ulab_tools.h b/code/ulab_tools.h
@@ -11,8 +11,17 @@
 #ifndef _TOOLS_
 #define _TOOLS_
 
+#include "ndarray.h"
+
 #define SWAP(t, a, b) { t tmp = a; a = b; b = tmp; }
 
+typedef struct _shape_strides_t { // shape/strides pair returned by tools_reduce_axes
+    uint8_t index; // tools_reduce_axes does not store an axis position here
+    int8_t axis; // tools_reduce_axes does not store the requested axis here
+    size_t *shape; // ULAB_MAX_DIMS lengths; slot 0 holds the reduced axis when one is given
+    int32_t *strides; // ULAB_MAX_DIMS strides, arranged like shape
+} shape_strides;
+
 mp_float_t ndarray_get_float_uint8(void *);
 mp_float_t ndarray_get_float_int8(void *);
 mp_float_t ndarray_get_float_uint16(void *);
@@ -23,4 +32,5 @@ void *ndarray_get_float_function(uint8_t );
 uint8_t ndarray_upcast_dtype(uint8_t , uint8_t );
 void *ndarray_set_float_function(uint8_t );
 
+shape_strides tools_reduce_axes(ndarray_obj_t *, mp_obj_t );
 #endif
diff --git a/docs/ulab-change-log.md b/docs/ulab-change-log.md
@@ -1,3 +1,9 @@
+Tue, 9 Feb 2021
+
+version 2.3.3
+
+    linalg.norm should now work with the axis keyword argument
+
 Mon, 8 Feb 2021
 
 version 2.3.2

Original file line number	Diff line number	Diff line change
`@@ -632,7 +632,7 @@ ndarray_obj_t *ndarray_new_dense_ndarray(uint8_t ndim, size_t *shape, uint8_t dt`
`632`	`632`	`int32_t *strides = m_new(int32_t, ULAB_MAX_DIMS);`
`633`	`633`	`strides[ULAB_MAX_DIMS-1] = dtype == NDARRAY_BOOL ? 1 : mp_binary_get_size('@', dtype, NULL);`
`634`	`634`	`for(size_t i=ULAB_MAX_DIMS; i > 1; i--) {`
`635`		`- strides[i-2] = strides[i-1] * shape[i-1];`
	`635`	`+ strides[i-2] = strides[i-1] * MAX(1, shape[i-1]);`
`636`	`636`	`}`
`637`	`637`	`return ndarray_new_ndarray(ndim, shape, strides, dtype);`
`638`	`638`	`}`