aai-institute
diff --git a/‎.bumpversion.cfg‎
Lines changed: 1 addition & 1 deletion b/‎.bumpversion.cfg‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.gitattributes‎
Lines changed: 1 addition & 0 deletions b/‎.gitattributes‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎.github/workflows/main.yaml‎
Lines changed: 38 additions & 15 deletions b/‎.github/workflows/main.yaml‎
Lines changed: 38 additions & 15 deletions
diff --git a/‎.github/workflows/publish.yaml‎
Lines changed: 13 additions & 7 deletions b/‎.github/workflows/publish.yaml‎
Lines changed: 13 additions & 7 deletions
diff --git a/‎.github/workflows/run-notebook-tests-workflow.yaml‎
Lines changed: 2 additions & 1 deletion b/‎.github/workflows/run-notebook-tests-workflow.yaml‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎.gitignore‎
Lines changed: 10 additions & 1 deletion b/‎.gitignore‎
Lines changed: 10 additions & 1 deletion
diff --git a/‎.test_durations‎
Lines changed: 0 additions & 4 deletions b/‎.test_durations‎
Lines changed: 0 additions & 4 deletions
diff --git a/‎CHANGELOG.md‎
Lines changed: 36 additions & 2 deletions b/‎CHANGELOG.md‎
Lines changed: 36 additions & 2 deletions
diff --git a/‎CLAUDE.local.md‎ b/‎CLAUDE.local.md‎
diff --git a/‎CONTRIBUTING.md‎
Lines changed: 15 additions & 6 deletions b/‎CONTRIBUTING.md‎
Lines changed: 15 additions & 6 deletions
@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 0.9.3.dev0
+current_version = 0.10.1.dev0
 commit = False
 tag = False
 allow_dirty = False
 
@@ -2,3 +2,4 @@ notebooks/*.ipynb -linguist-detectable
 *.png filter=lfs diff=lfs merge=lfs -text
 *.svg filter=lfs diff=lfs merge=lfs -text
 logo.svg -filter=lfs -diff=lfs -merge=lfs text
+*.pkl filter=lfs diff=lfs merge=lfs -text
@@ -112,13 +112,13 @@ jobs:
       group_number: ${{ matrix.group_number }}
     needs: [ code-quality ]
 
-  push-docs-and-release-testpypi:
-    name: Publish documentation # and maybe release package to TestPyPI
+  publish-docs:
+    name: Publish documentation
     runs-on: ubuntu-22.04
     needs: [docs, group-tests, notebook-tests]
-    if: ${{ github.ref == 'refs/heads/develop' }}
+    if: ${{ github.ref == 'refs/heads/develop' && github.event_name != 'pull_request'  }}
     concurrency:
-      group: publish
+      group: publish-docs
     steps:
       - uses: actions/checkout@v4
         with:
@@ -140,14 +140,37 @@ jobs:
           title: Development
           email: ${{ env.GITHUB_BOT_EMAIL }}
           username: ${{ env.GITHUB_BOT_USERNAME }}
-      # Deactivated until we solve the issue with the credentials (Jan. 2025)
-      # - name: Build and publish to TestPyPI
-      #   env:
-      #     TWINE_USERNAME: __token__
-      #     TWINE_PASSWORD: ${{ secrets.TEST_PYPI_PASSWORD }}
-      #   run: |
-      #     set -x
-      #     export BUILD_NUMBER=$GITHUB_RUN_NUMBER
-      #     bump2version --no-tag --no-commit --verbose --serialize '{major}.{minor}.{patch}.{release}{$BUILD_NUMBER}' boguspart
-      #     python setup.py sdist bdist_wheel
-      #     twine upload -r testpypi --verbose --non-interactive dist/*
+
+
+  publish-testpypi:
+    name: Publish package to TestPyPI
+    runs-on: ubuntu-22.04
+    needs: [group-tests, notebook-tests]
+    if: ${{ github.ref == 'refs/heads/develop' && github.event_name != 'pull_request' }}
+    concurrency:
+      group: publish-testpypi  # one TestPyPI upload at a time
+    permissions:
+      id-token: write  # OIDC token for the publish action (no stored password is passed)
+    environment:
+      name: testpypi
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0  # full history, not a shallow clone
+          lfs: true  # also download Git LFS files
+      - name: Setup Python 3.9
+        uses: ./.github/actions/python
+        with:
+          python_version: "3.9"  # quoted so YAML keeps it a string, not a float
+      - name: Bump version and build package
+        run: |
+          set -x
+          export BUILD_NUMBER=$GITHUB_RUN_NUMBER
+          bump2version --no-tag --no-commit --verbose --serialize '{major}.{minor}.{patch}.{release}{$BUILD_NUMBER}' boguspart
+          python setup.py sdist bdist_wheel
+      - name: Publish to TestPyPI
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          repository-url: https://test.pypi.org/legacy/
+          print-hash: true
+          verbose: true
@@ -23,8 +23,13 @@ env:
 jobs:
   publish:
     runs-on: ubuntu-22.04
+    environment:
+      name: publish
+      url: https://pypi.org/p/pydvl  # PyPI short link to the project page
     concurrency:
       group: publish
+    permissions:
+      id-token: write
     steps:
       - name: Checking out last commit in release
         if: ${{ github.event_name != 'workflow_dispatch' }}
@@ -54,6 +59,14 @@ jobs:
           # Make the version available as env variable for next steps
           echo CURRENT_VERSION=$CURRENT_VERSION >> $GITHUB_ENV
         shell: bash
+      - name: Build dist
+        run: |
+          python setup.py sdist bdist_wheel
+      - name: Publish to PyPI
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          verbose: true
+          print-hash: true
       - name: Deploy Docs
         uses: ./.github/actions/deploy-docs
         with:
@@ -63,10 +76,3 @@ jobs:
           email: ${{ env.GITHUB_BOT_EMAIL }}
           username: ${{ env.GITHUB_BOT_USERNAME }}
           set-default: 'true'
-      - name: Build and publish to PyPI
-        env:
-          TWINE_USERNAME: ${{ secrets.PYPI_USERNAME }}
-          TWINE_PASSWORD: ${{ secrets.PYPI_PASSWORD }}
-        run: |
-          python setup.py sdist bdist_wheel
-          twine upload --verbose --non-interactive dist/*
 
@@ -26,11 +26,12 @@ jobs:
     - name: Free Disk Space (Ubuntu)
       uses: jlumbroso/free-disk-space@main
       with:
-        large-packages: false
+        large-packages: true
         docker-images: false
     - uses: actions/checkout@v4
       with:
         fetch-depth: 0
+        lfs: true
     - name: Setup Python ${{ inputs.python_version }}
       uses: ./.github/actions/python
       with:
 
@@ -110,7 +110,7 @@ celerybeat.pid
 .venv
 env/
 venv/
-venv38/
+venv39/
 ENV/
 env.bak/
 venv.bak/
@@ -141,9 +141,18 @@ pylint.html
 runs/
 data/models/
 *.pkl
+!data/*.pkl
 
 # Docs
 docs_build
 
 # pytest-profiling
 prof/
+
+# JS tooling
+node_modules/
+package.json
+package-lock.json
+
+# Serena tooling
+.serena
@@ -1781,10 +1781,6 @@
     "tests/value/shapley/test_montecarlo.py::test_linear_montecarlo_with_outlier[owen-kwargs1-scorer0-0.2-2-0-21]": 6.573138832000012,
     "tests/value/shapley/test_montecarlo.py::test_linear_montecarlo_with_outlier[owen_antithetic-kwargs2-scorer0-0.2-2-0-21]": 10.124256999999972,
     "tests/value/shapley/test_montecarlo.py::test_linear_montecarlo_with_outlier[permutation_montecarlo-kwargs0-scorer0-0.2-2-0-21]": 2.7115268339999545,
-    "tests/value/shapley/test_montecarlo.py::test_montecarlo_shapley_housing_dataset[12-3-12-combinatorial_montecarlo-kwargs0]": 0.16786966001382098,
-    "tests/value/shapley/test_montecarlo.py::test_montecarlo_shapley_housing_dataset[12-3-12-owen-kwargs1]": 17.011920137971174,
-    "tests/value/shapley/test_montecarlo.py::test_montecarlo_shapley_housing_dataset[12-3-12-owen_antithetic-kwargs2]": 35.88025256394758,
-    "tests/value/shapley/test_montecarlo.py::test_montecarlo_shapley_housing_dataset[12-3-4-group_testing-kwargs3]": 0.25901710899779573,
     "tests/value/shapley/test_montecarlo.py::test_seed[combinatorial_montecarlo-kwargs0-test_game0]": 0.04085670800000685,
     "tests/value/shapley/test_montecarlo.py::test_seed[group_testing-kwargs3-test_game0]": 0.23488145900003587,
     "tests/value/shapley/test_montecarlo.py::test_seed[owen-kwargs1-test_game0]": 0.30296191700003305,
 
@@ -2,13 +2,40 @@
 
 ## Unreleased
 
+### Added
+
+- Support for `torch.Tensor` as underlying data type in `Dataset` and
+  `GroupedDataset`
+  [PR #673](https://github.com/aai-institute/pyDVL/pull/673)
+- Support for pytorch models in most valuation methods when wrapped in
+  classes implementing the protocol `TorchSupervisedModel`, e.g. by using
+  [skorch.NeuralNetClassifier](https://skorch.readthedocs.io/en/stable/classifier.html)
+  models
+  [PR #673](https://github.com/aai-institute/pyDVL/pull/673)
+- Improved documentation and examples using DeepSets for Data Utility Learning 
+  [PR #674](https://github.com/aai-institute/pyDVL/pull/674)
+
+### Fixed
+
+- Issues with `Dataset` indexing
+  [PR #673](https://github.com/aai-institute/pyDVL/pull/673)
+
+### Changed
+
+
+## v0.10.0 - 💥📚🐞🆕 New valuation interface, improved docs, new methods, breaking changes and tons of improvements
+
 
 ### Added
 
+- Simple result serialization to resume computation of values
+  [PR #666](https://github.com/aai-institute/pyDVL/pull/666)
 - Simple memory monitor / reporting
   [PR #663](https://github.com/aai-institute/pyDVL/pull/663)
 - New stopping criterion `MaxSamples`
   [PR #661](https://github.com/aai-institute/pyDVL/pull/661)
+- New pseudo-stopping criterion `History` to record value updates during fitting
+  [PR #653](https://github.com/aai-institute/pyDVL/pull/653)
 - Introduced `UtilityModel` and two implementations `IndicatorUtilityModel`
   and `DeepSetsUtilityModel` for data utility learning
   [PR #650](https://github.com/aai-institute/pyDVL/pull/650)
@@ -29,6 +56,7 @@
 - Refactor MSR Banzhaf semivalues with the new sampler architecture.
   [PR #605](https://github.com/aai-institute/pyDVL/pull/605)
   [PR #641](https://github.com/aai-institute/pyDVL/pull/641)
+  [PR #653](https://github.com/aai-institute/pyDVL/pull/653)
 - Refactor group-testing shapley values with new sampler architecture
   [PR #602](https://github.com/aai-institute/pyDVL/pull/602)
 - Refactor least-core data valuation methods with more supported sampling
@@ -89,9 +117,13 @@
 
 ### Changed
 
+- Major rewrite of the documentation for the new interface in 0.10.0
+  [PR #653](https://github.com/aai-institute/pyDVL/pull/653)
 - Slicing, comparing and setting of `ValuationResult` behave in a more 
-  natural way
-  [PR #660](https://github.com/aai-institute/pyDVL/pull/660)
+  natural and consistent way. Several bug fixes.
+  [PR #653](https://github.com/aai-institute/pyDVL/pull/653)
+  [PR #660](https://github.com/aai-institute/pyDVL/pull/660) 
+  [PR #666](https://github.com/aai-institute/pyDVL/pull/666)
 - Switched all semi-value coefficients and sampler weights to log-space in
   order to avoid overflows
   [PR #643](https://github.com/aai-institute/pyDVL/pull/643)
@@ -160,6 +192,8 @@
     - renaming `PreConditioner` -> `Preconditioner`
     - fit to `TensorOperator`
     [PR #601](https://github.com/aai-institute/pyDVL/pull/601)
+  - Bumped `zarr` dependency to v3
+    [PR #668](https://github.com/aai-institute/pyDVL/pull/668) 
 
 
 ## 0.9.2 - 🏗  Bug fixes, logging improvement
 
@@ -415,7 +415,7 @@ To add a citation inside a markdown file, use the notation `[@ citekey]` (with
 no space). Alas,
 because of when mkdocs-bibtex enters the pipeline, it won't process docstrings.
 For module documentation, we manually inject html into the markdown files. For
-example, in `pydvl.value.shapley.montecarlo` we have:
+example, in `pydvl.valuation.methods.shapley` we have:
 
 ```markdown
 """
@@ -676,8 +676,18 @@ part):
 ```shell
 build_scripts/release-version.sh 0.1.6
 ```
+This will:
 
-To find out how to use the script, pass the `-h` or `--help` flags:
+ - Pull latest remote version of develop (fast-forward only) from origin
+ - Create a branch `release/v0.1.6`
+ - Bump version number: 0.1.5.dev1234 ⟶   0.1.6
+ - Merge release branch into master locally and on origin
+ - Tag as `v0.1.6`
+ - Bump version number again to next development pre-release
+ - Merge release branch into develop locally and on origin
+ - Delete release branch
+
+For usage details, pass the `-h` or `--help` flags:
 
 ```shell
 build_scripts/release-version.sh --help
@@ -687,11 +697,10 @@ If running in interactive mode (without `-y|--yes`), the script will output a
 summary of pending changes and ask for confirmation before executing the
 actions.
 
-Once this is done, a tag will be created on the repository. You should then
-create a GitHub
+Once the script is done, you should then create a GitHub
 [release](https://docs.github.com/en/repositories/releasing-projects-on-github/managing-releases-in-a-repository#creating-a-release)
-for that tag. That will a trigger a CI pipeline that will automatically create a
-package and publish it from CI to PyPI.
+for the tag that was created. That will trigger a CI pipeline that will
+automatically create a package and publish it from CI to PyPI.
 
 ### Manual release process