🕵️ testing + 🏗️ build & 🚀 release (#3)

jvdd · web-flow · commit 0dc8d56f5b2f · 2022-11-26T14:38:15.000+01:00
* 🕵️ first tests

* 🙈

* 🙏 add build

* 🌔 nightly rust toolchain

* 🙈 typo

* 🚀 add release

* 🙃 bump version

* 🧹 update readme

* 🖊️ update readme
diff --git a/.github/workflows/ci-tsdownsample.yml b/.github/workflows/ci-tsdownsample.yml
@@ -40,4 +40,160 @@ jobs:
       - run: make lint  # Lint Python & Rust
       - run: make mypy  # Type check Python
 
+  Test:  # run the Python test suite on every OS / Python version combination
+    runs-on: ${{ matrix.os }}
+    strategy:
+      fail-fast: false  # keep the remaining combinations running when one fails
+      matrix:
+        os: ['windows-latest', 'macOS-latest', 'ubuntu-latest']
+        rust: ['nightly']  # ['stable', 'beta']
+        python-version: ['3.7', '3.8', '3.9', '3.10', '3.11']
+
+    env:
+      PYTHON: ${{ matrix.python-version }}
+
+    steps:
+      - uses: actions/checkout@v3
+      - uses: actions/setup-python@v4
+        with:
+          python-version: ${{ matrix.python-version }}
+      # test requirements are installed once, right before `make test` (below)
+
+      - name: Install Rust toolchain
+        uses: actions-rs/toolchain@v1
+        with:
+          profile: minimal
+          toolchain: ${{ matrix.rust }}  # follow the matrix instead of hard-coding
+          components: clippy, rustfmt
+      - name: Setup Rust
+        run: |
+          rustup update ${{ matrix.rust }} --no-self-update
+          rustup default ${{ matrix.rust }}
+      - name: Cache rust
+        uses: Swatinem/rust-cache@v2
+
+      - name: install develop version
+        run: make install
+      # python setup.py develop
+
+      - run: pip install -r tests/requirements.txt
+
+      - run: pip freeze
+
+      - run: make test  # Test Python
+
+      - name: Upload coverage to Codecov
+        uses: codecov/codecov-action@v3
+
+  Build:  # build the sdist and wheels with maturin and upload them as one artifact
+  # Perhaps something more in line with this: https://github.com/messense/crfs-rs/blob/main/.github/workflows/Python.yml
+    name: build on ${{ matrix.os }} (${{ matrix.target }} - ${{ matrix.manylinux || 'auto' }})
+    # only run when the ref is a tag or the main branch, or when the pull request carries the 'Full Build' label
+    if: "success() && (startsWith(github.ref, 'refs/tags/') || github.ref == 'refs/heads/main' || contains(github.event.pull_request.labels.*.name, 'Full Build'))"
+    strategy:
+      fail-fast: false
+      matrix:
+        os: [ubuntu, macos, windows]  # expanded to `<os>-latest` in `runs-on` below
+        target: [x86_64, aarch64]
+        manylinux: [auto]
+        include:
+          - os: windows
+            ls: dir  # listing command used by the `dist/` listing step below
+          - os: windows
+            ls: dir
+            target: i686
+            python-architecture: x86  # NOTE(review): only referenced by the commented-out `architecture` input below
+          - os: macos
+            target: aarch64
+          - os: ubuntu
+            target: i686
+          # GCC 4.8.5 in manylinux2014 container doesn't support c11 atomic
+          # we use manylinux_2_24 container for aarch64 and armv7 targets instead,
+          - os: ubuntu
+            target: aarch64
+            container: messense/manylinux_2_24-cross:aarch64
+          - os: ubuntu
+            target: armv7
+            container: messense/manylinux_2_24-cross:armv7
+          - os: ubuntu
+            target: ppc64le
+            container: messense/manylinux_2_24-cross:ppc64le
+          - os: ubuntu
+            target: s390x
+            container: messense/manylinux_2_24-cross:s390x
+          # musllinux
+          - os: ubuntu
+            target: x86_64
+            manylinux: musllinux_1_1
+          - os: ubuntu
+            target: aarch64
+            manylinux: musllinux_1_1
+        exclude:
+          # this fails
+          - os: windows
+            target: aarch64
+
+    runs-on: ${{ matrix.os }}-latest
+    steps:
+    - uses: actions/checkout@v3
+
+    - name: set up python
+      uses: actions/setup-python@v4
+      # with:
+        # python-version: '3.11'
+        # architecture: ${{ matrix.python-architecture || 'x64' }}
+
+    - name: build sdist
+      if: ${{ matrix.os == 'ubuntu' && matrix.target == 'x86_64' && matrix.manylinux == 'auto' }}
+      uses: PyO3/maturin-action@v1
+      with:
+        command: sdist  # source distribution; restricted to one matrix combination by the `if` above
+        args: --out dist
+
+    - name: build wheels
+      uses: PyO3/maturin-action@v1
+      with:
+        rust-toolchain: nightly
+        target: ${{ matrix.target }}
+        manylinux: ${{ matrix.manylinux || 'auto' }}
+        container: ${{ matrix.container }}
+        args: --release --out dist --interpreter ${{ matrix.interpreter || '3.7 3.8 3.9 3.10 3.11' }}  # NOTE(review): no matrix entry sets `interpreter`, so the default list applies
+
+    - run: ${{ matrix.ls || 'ls -lh' }} dist/
+
+    - uses: actions/upload-artifact@v3
+      with:
+        name: pypi_files  # shared artifact name; the Release job downloads it
+        path: dist
+
+  Release:
+    # Publish the artifacts produced by Build to PyPI; gated on tag refs only.
+    runs-on: ubuntu-latest
+    needs: [Lint_and_Check, Test, Build]
+    if: ${{ success() && startsWith(github.ref, 'refs/tags/') }}
+    steps:
+      - uses: actions/checkout@v3
+
+      - uses: actions/setup-python@v4
+        name: set up python
+        # with:
+          # python-version: '3.10'
+
+      - run: pip install -U twine
+
+      - uses: actions/download-artifact@v3
+        name: get dist artifacts
+        with:
+          path: dist
+          name: pypi_files
+
+      - run: twine check dist/*
+
+      - env:
+          TWINE_USERNAME: __token__
+          TWINE_PASSWORD: ${{ secrets.pypi_token }}
+        name: upload to pypi
+        run: twine upload dist/*
+
 # https://github.com/samuelcolvin/rtoml/blob/main/.github/workflows/ci.yml
+# https://github.com/messense/rjmespath-py/blob/main/.github/workflows/CI.yml
diff --git a/Makefile b/Makefile
@@ -2,6 +2,9 @@
 isort = isort tsdownsample tests
 black = black tsdownsample tests
 
+.PHONY: install
+install:  # requirements first, then the package itself in editable mode
+	pip install -r requirements.txt && pip install -e .
 
 .PHONY: format
 format:
@@ -29,8 +32,14 @@ lint: lint-python lint-rust
 mypy:
 	mypy tsdownsample
 
+
+.PHONY: test
+test:  # run pytest with coverage for `tsdownsample` (terminal, HTML and XML reports)
+	pytest --cov=tsdownsample --cov-report=term-missing --cov-report=html --cov-report=xml
+
+
 .PHONY: all
-all: lint mypy testcov
+all: lint mypy test
 
 .PHONY: clean
 clean:
diff --git a/README.md b/README.md
@@ -9,17 +9,31 @@
 
 ## Features ✨
 
-* **Fast**: written in rust with pyo3 bindings  
+* **Fast**: written in rust with PyO3 bindings  
   - leverages optimized [argminmax](https://github.com/jvdd/argminmax) - which is SIMD accelerated with runtime feature detection
   - scales linearly with the number of data points
-  - scales multi-threaded with rayon (rust)
+  - multithreaded with Rayon (in Rust)
+    <details>
+      <summary><i>Why we do not use Python multiprocessing</i></summary>
+      Citing the <a href="https://pyo3.rs/v0.17.3/parallelism.html">PyO3 docs on parallelism</a>:<br>
+      <blockquote>
+          CPython has the infamous Global Interpreter Lock, which prevents several threads from executing Python bytecode in parallel. This makes threading in Python a bad fit for CPU-bound tasks and often forces developers to accept the overhead of multiprocessing.
+      </blockquote>
+      In Rust - which is a compiled language - there is no GIL, so CPU-bound tasks can be parallelized (with <a href="https://github.com/rayon-rs/rayon">Rayon</a>) with little to no overhead.
+    </details>
 * **Efficient**: memory efficient
   - works on views of the data (no copies)
   - no intermediate data structures are created
 * **Flexible**: works on any type of data
-    - supported datatypes are `f16`, `f32`, `f64`, `i16`, `i32`, `i64`, `u16`, `u32`, `u64`  
-    *!! 🚀 `f16` [argminmax](https://github.com/jvdd/argminmax) is 200-300x faster than numpy*
-* **Easy to use**: simple API
+    - supported datatypes are `f16`, `f32`, `f64`, `i16`, `i32`, `i64`, `u16`, `u32`, `u64`
+    <details>
+      <summary><i>!! 🚀 <code>f16</code> <a href="https://github.com/jvdd/argminmax">argminmax</a> is 200-300x faster than numpy</i></summary>
+      In contrast with all other data types above, <code>f16</code> is <i>not</i> hardware supported (i.e., no instructions for <code>f16</code>) by most modern CPUs!! <br>
+      🐌 Programming languages facilitate support for this datatype by either (i) upcasting to <code>f32</code> or (ii) using a software implementation. <br>
+      💡 As for argminmax, only comparisons are needed - and thus no arithmetic operations - creating a <ins>symmetrical ordinal mapping from <code>f16</code> to <code>i16</code></ins> is sufficient. This mapping allows using the hardware-supported scalar and SIMD <code>i16</code> instructions - while not producing any memory overhead 🎉 <br>
+      <i>More details are described in <a href="https://github.com/jvdd/argminmax/pull/1">argminmax PR #1</a>.</i>
+    </details>
+* **Easy to use**: simple & flexible API
 
 ## Install
 
@@ -33,15 +47,15 @@ pip install tsdownsample
 ## Usage
 
 ```python
-import tsdownsample as tsds
+from tsdownsample import MinMaxLTTBDownsampler
 import pandas as pd; import numpy as np
 
 # Create a time series
 y = np.random.randn(10_000_000)
 s = pd.Series(y)
 
 # Downsample to 1000 points
-s_ds = tsds.minmaxlttb(s, n_out=1000)
+s_ds = MinMaxLTTBDownsampler.downsample(s, n_out=1000)
 ```
 
 ---
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,9 +1,10 @@
 [build-system]
-requires = ["setuptools", "wheel", "setuptools-rust"]
+requires = ["setuptools", "wheel", "setuptools-rust"] #, "maturin"]
+# build-backend = "maturin"  # TODO: this works as well!
 
 [project]
 name = "tsdownsample"
-version = "0.1.0a1"
+version = "0.1.0a2"
 requires-python = ">=3.7"
 description = "Time series downsampling in rust"
 authors = [{name = "Jeroen Van Der Donckt"}]
@@ -15,7 +16,6 @@ classifiers = [
     'License :: OSI Approved :: MIT License',
     'Intended Audience :: Developers',
     'Programming Language :: Python :: 3',
-    'Programming Language :: Python :: 3.6',  # TODO?
     'Programming Language :: Python :: 3.7',
     'Programming Language :: Python :: 3.8',
     'Programming Language :: Python :: 3.9',
diff --git a/requirements.txt b/requirements.txt
@@ -1,4 +1,5 @@
 numpy
 pandas
 # Build dependencies
-setuptools_rust
+setuptools_rust
+# maturin
diff --git a/tests/requirements.txt b/tests/requirements.txt
@@ -0,0 +1,2 @@
+pytest
+pytest-cov
diff --git a/tests/test_tsdownsample.py b/tests/test_tsdownsample.py
diff --git a/tsdownsample/__init__.py b/tsdownsample/__init__.py
diff --git a/tsdownsample/downsampling_interface.py b/tsdownsample/downsampling_interface.py