
Commit 3e410ac

Authored by youdongguo and timholy
Yg/add read me (#3)
* deal with Inf case, change jump
* add CI.yml and dependabot.yml
* update CI and Codecov badges
* add description for functions
* add demo to readme
* resize the figure in readme
* resize figure in readme
* finish readme, test file. finish everything
* fix demo dir issue
* fix test ci failing issue: issue better than gsvd
* change the api and reorganize the code, haven't update doc
* update the api and redesign the doc (Co-authored-by: Tim Holy <[email protected]>)
* change api move initial NMF step
* add Docstring in ? mode

---------

Co-authored-by: youdongguo <[email protected]>
Co-authored-by: Tim Holy <[email protected]>
1 parent e4ad263 commit 3e410ac

File tree

10 files changed: +411 −32 lines


.github/dependabot.yml

Lines changed: 7 additions & 0 deletions
@@ -0,0 +1,7 @@
# https://docs.github.com/github/administering-a-repository/configuration-options-for-dependency-updates
version: 2
updates:
  - package-ecosystem: "github-actions"
    directory: "/" # Location of package manifests
    schedule:
      interval: "weekly"

.github/workflows/CI.yml

Lines changed: 77 additions & 0 deletions
@@ -0,0 +1,77 @@
name: CI
on:
  push:
    branches:
      - main
    tags: ['*']
  pull_request:
  workflow_dispatch:
concurrency:
  # Skip intermediate builds: always.
  # Cancel intermediate builds: only if it is a pull request build.
  group: ${{ github.workflow }}-${{ github.ref }}
  cancel-in-progress: ${{ startsWith(github.ref, 'refs/pull/') }}
jobs:
  test:
    name: Julia ${{ matrix.version }} - ${{ matrix.os }} - ${{ matrix.arch }} - ${{ github.event_name }}
    runs-on: ${{ matrix.os }}
    timeout-minutes: 60
    permissions: # needed to allow julia-actions/cache to proactively delete old caches that it has created
      actions: write
      contents: read
    strategy:
      fail-fast: false
      matrix:
        version:
          - '1.10'
          - '1'
        os:
          - ubuntu-latest
        arch:
          - x64
    steps:
      - uses: actions/checkout@v4
      - uses: julia-actions/setup-julia@v2
        with:
          version: ${{ matrix.version }}
          arch: ${{ matrix.arch }}
      - uses: julia-actions/cache@v2
      - uses: julia-actions/julia-buildpkg@v1
      - uses: julia-actions/julia-runtest@v1
      - uses: julia-actions/julia-processcoverage@v1
      - uses: codecov/codecov-action@v4
        with:
          files: lcov.info
          token: ${{ secrets.CODECOV_TOKEN }}
          fail_ci_if_error: false
  # docs:
  #   name: Documentation
  #   runs-on: ubuntu-latest
  #   permissions:
  #     actions: write # needed to allow julia-actions/cache to proactively delete old caches that it has created
  #     contents: write
  #     statuses: write
  #   steps:
  #     - uses: actions/checkout@v4
  #     - uses: julia-actions/setup-julia@v2
  #       with:
  #         version: '1'
  #     - uses: julia-actions/cache@v2
  #     - name: Configure doc environment
  #       shell: julia --project=docs --color=yes {0}
  #       run: |
  #         using Pkg
  #         Pkg.develop(PackageSpec(path=pwd()))
  #         Pkg.instantiate()
  #     - uses: julia-actions/julia-buildpkg@v1
  #     - uses: julia-actions/julia-docdeploy@v1
  #       env:
  #         GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
  #         DOCUMENTER_KEY: ${{ secrets.DOCUMENTER_KEY }}
  #     - name: Run doctests
  #       shell: julia --project=docs --color=yes {0}
  #       run: |
  #         using Documenter: DocMeta, doctest
  #         using GsvdInitialization
  #         DocMeta.setdocmeta!(GsvdInitialization, :DocTestSetup, :(using GsvdInitialization); recursive=true)
  #         doctest(GsvdInitialization)
Project.toml

Lines changed: 6 additions & 2 deletions
@@ -7,14 +7,18 @@ version = "0.1.0"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 NMF = "6ef6ca0d-6ad7-5ff6-b225-e928bfa0a386"
 NonNegLeastSquares = "b7351bd1-99d9-5c5d-8786-f205a815c4d7"
+TSVD = "9449cd9e-2762-5aa3-a617-5413e99d722e"

 [compat]
+LinearAlgebra = "1"
 NMF = "1"
 NonNegLeastSquares = "0.4"
-julia = "1"
+TSVD = "0.4"
+julia = "1.10"

 [extras]
+NMF = "6ef6ca0d-6ad7-5ff6-b225-e928bfa0a386"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"

 [targets]
-test = ["Test"]
+test = ["NMF", "Test"]

README.md

Lines changed: 146 additions & 0 deletions
@@ -1 +1,147 @@
# GsvdInitialization

[![CI](https://github.com/HolyLab/GsvdInitialization.jl/actions/workflows/CI.yml/badge.svg)](https://github.com/HolyLab/GsvdInitialization.jl/actions/workflows/CI.yml)
[![codecov](https://codecov.io/gh/HolyLab/GsvdInitialization.jl/graph/badge.svg?token=LxqRCsZIvn)](https://codecov.io/gh/HolyLab/GsvdInitialization.jl)

This package contains the code for the paper "GSVD-NMF: Recovering Missing Features in Non-negative Matrix Factorization".
It recovers non-negative matrix factorization (NMF) components from a low-dimensional space to a higher-dimensional space by exploiting the generalized singular value decomposition (GSVD) between an existing NMF result and the SVD of X.
This method allows incremental expansion of the number of components, which can be convenient and effective for interactive analysis of large-scale data.

See also [NMFMerge](https://github.com/HolyLab/NMFMerge.jl) for the converse operation. Together, the two yield a substantial improvement in the quality and consistency of NMF factorizations.

---------------------------

Demo:

To run this demo, NMF.jl and LinearAlgebra.jl are also required.

Install and load the packages:
```julia
julia> ] add GsvdInitialization;

julia> using GsvdInitialization, NMF, LinearAlgebra;
```

Generate the ground truth with 10 features:

```julia
julia> include("demo/generate_ground_truth.jl")

julia> W_GT, H_GT = generate_ground_truth();

julia> X = W_GT*H_GT;
```

<img src="demo/GroundTruth.png" alt="Sample Figure" width="400"/>

Run standard NMF (HALS) on X, using NNDSVD as initialization. Here, we're taking a couple of precautions to try to ensure the best possible result from NMF:
- we prevent premature convergence by setting `maxiter` to something that is practically infinite
- we use the full `svd`, rather than `rsvd`, for initializing NNDSVD, as `svd` gives higher-quality results than `rsvd`

Despite these precautions, we'll see that the NMF result leaves much to be desired:

```julia
julia> result_hals = nnmf(X, 10; init=:nndsvd, alg = :cd, tol = 1e-4, maxiter=10^12, initdata = svd(X));

julia> sum(abs2, X-result_hals.W*result_hals.H)/sum(abs2, X)
0.0999994991270576
```

The result is given by

<img src="demo/ResultHals.png" alt="Sample Figure" width="400"/>

This factorization is not perfect: two of the components are identical, and two features share a single component.
Now run GSVD-NMF on X (also using NNDSVD as initialization):

```julia
julia> Wgsvd, Hgsvd = gsvdnmf(X, 9=>10; alg = :cd, tol_final = 1e-4, tol_intermediate = 1e-2, maxiter = 10^12);

julia> sum(abs2, X-Wgsvd*Hgsvd)/sum(abs2, X)
1.2322603074132593e-10
```

Judging by both the relative fitting errors and the figures, GSVD-NMF factorizes the ground truth well.

<img src="demo/ResultGsvdNMF.png" alt="Sample Figure" width="400"/>

---------------------------

## Functions

W, H = **gsvdnmf**(X::AbstractMatrix, ncomponents::Pair{Int,Int}; tol_final=1e-4, tol_intermediate=1e-4, kwargs...)

This function performs GSVD-NMF on the 2D data matrix ``X``.

Arguments:

``X``: non-negative 2D data matrix

``ncomponents::Pair{Int,Int}``: in the form ``n1 => n2``, augments from ``n1`` components to ``n2`` components, where ``n1`` is the number of components for the initial NMF (under-complete NMF) and ``n2`` is the number of components for the final NMF.

Alternatively, ``ncomponents`` can be an integer denoting the number of components for the final NMF.
In this case, ``gsvdnmf`` defaults to augmenting the initial NMF solution by 1 component.

Keyword arguments:

``tol_final``: the tolerance of the final NMF, default: ``10^{-4}``

``tol_intermediate``: the tolerance of the initial NMF (under-complete NMF), default: ``tol_final``

Other keyword arguments are passed to ``NMF.nnmf``.
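A minimal usage sketch based on the signature above; here ``X`` is the data matrix from the demo, and the component counts and tolerances are illustrative choices rather than required values:

```julia
# Augment an 8-component NMF of X to 10 components, using a looser tolerance
# for the intermediate (under-complete) NMF:
W, H = gsvdnmf(X, 8 => 10; tol_final=1e-4, tol_intermediate=1e-2)

# Integer form: start from a 9-component initial NMF and augment by 1,
# ending with 10 components:
W, H = gsvdnmf(X, 10)
```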

-----

W, H = **gsvdnmf**(X::AbstractMatrix, W::AbstractMatrix, H::AbstractMatrix, f; n2 = size(first(f), 2), tol_nmf=1e-4, kwargs...)

This function augments components for ``W`` and ``H``, and subsequently polishes the new ``W`` and ``H`` by NMF.

Arguments:

``X``: non-negative 2D data matrix

``W``: solution of the initial (under-complete) NMF

``H``: solution of the initial (under-complete) NMF

``f``: SVD (or truncated SVD) of ``X``; ``f`` needs to be written explicitly in ``Tuple`` form.

Keyword arguments:

``n2``: the number of components in the augmented matrix

``tol_nmf``: the tolerance of the NMF polishing step, default: ``10^{-4}``

Other keyword arguments are passed to ``NMF.nnmf``.
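A minimal sketch of this method under stated assumptions: ``result9`` is an existing 9-component NMF result for ``X`` (for example from ``NMF.nnmf``), and the SVD is passed as the tuple ``(U, S, V)`` taken from ``LinearAlgebra.svd``. The exact ordering expected inside ``f`` is an assumption here, so consult the docstring (``?gsvdnmf``) if in doubt; the names ``result9``, ``F``, ``W10``, and ``H10`` are illustrative.

```julia
using GsvdInitialization, LinearAlgebra, NMF

result9 = nnmf(X, 9; init=:nndsvd, alg=:cd, tol=1e-4)  # under-complete NMF of X
F = svd(X)
f = (F.U, F.S, F.V)      # SVD passed explicitly as a Tuple; (U, S, V) ordering assumed
W10, H10 = gsvdnmf(X, result9.W, result9.H, f; n2=10, tol_nmf=1e-4)
```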

-----

Wadd, Hadd, S = **gsvdrecover**(X, W0, H0, kadd, f)

This function augments components for ``W0`` and ``H0`` without the final NMF polishing step.

Outputs:

``Wadd``: augmented NMF solution

``Hadd``: augmented NMF solution

``S``: the related generalized singular values

Arguments:

``X``: non-negative 2D data matrix

``W0``: NMF solution

``H0``: NMF solution

``kadd``: number of new components

``f``: SVD (or truncated SVD) of ``X``; ``f`` needs to be indexable.
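A minimal sketch based on the signature above, assuming ``W0`` and ``H0`` are an existing NMF solution for ``X`` (for instance ``result_hals.W`` and ``result_hals.H`` from the demo); a tuple is used for ``f`` because tuples are indexable, and the ``(U, S, V)`` ordering is an assumption:

```julia
F = svd(X)            # or a truncated SVD of X (e.g. TSVD.tsvd)
f = (F.U, F.S, F.V)   # assumed ordering; tuples satisfy the "indexable" requirement
# Add one component to the existing solution, skipping the NMF polishing step:
Wadd, Hadd, S = gsvdrecover(X, W0, H0, 1, f)
```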

-----

## Citation

You are welcome to use this code in your publications; please cite the GSVD-NMF paper referenced above.
demo/GroundTruth.png (72.1 KB)

demo/ResultGsvdNMF.png (73.2 KB)

demo/ResultHals.png (74.4 KB)

demo/generate_ground_truth.jl

Lines changed: 44 additions & 0 deletions
@@ -0,0 +1,44 @@
# Build a synthetic ground-truth factorization X = W*H: each column of W is a
# Gaussian bump, and each row of H is a block of ones.
function generate_ground_truth()
    m, n, nfeatures = 150, 120, 10
    feature_sigmas = 2*ones(nfeatures)
    feature_centers = [i*10+10 for i in 1:nfeatures]
    feature_intensity = ones(nfeatures)
    W = W_init_gauss(m, feature_centers, feature_sigmas, feature_intensity)
    H = zeros(nfeatures, n)
    for r in 1:nfeatures
        h_start = r*10+7
        h_length = 10
        h_end = h_start+h_length-1
        H[r, h_start:h_end] .+= ones(1, h_length)'
    end
    return W, H
end

# Place a Gaussian bump of width sigmas[i] and height intensity[i] at centers[i]
# in the i-th column of W.
function W_init_gauss(n, centers, sigmas, intensity)
    W = []
    nc, ns, ni = length(centers), length(sigmas), length(intensity)
    nc == ns && ns == ni || throw(ArgumentError("centers, sigmas and intensity should have same length"))
    for i in 1:nc
        w = zeros(n)
        gauss_template = gaussiantemplate(sigmas[i])
        δ = Int(round((length(gauss_template)-1)/2))
        template_start = centers[i]-δ
        template_end = template_start + length(gauss_template)-1
        w[template_start:template_end] .+= intensity[i]*gauss_template
        push!(W, w)
    end
    return hcat(W...)
end

# Discretized Gaussian with standard deviation r, sampled on an odd-length grid.
function gaussiantemplate(T::Type, r::Real)
    len = round(Int, 8*r+1)
    w = (len - 1) ÷ 2
    template = Array{T}(undef, len)
    R2 = 2*r*r
    for x = -w:w
        template[x+w+1] = exp(-(x*x)/R2)
    end
    return template
end
gaussiantemplate(r::Real) = gaussiantemplate(Float64, r)
