softmin
diff --git a/‎doc/source/example.rst‎
Lines changed: 3 additions & 1 deletion b/‎doc/source/example.rst‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎doc/source/examples/MF.ipynb‎
Lines changed: 413 additions & 0 deletions b/‎doc/source/examples/MF.ipynb‎
Lines changed: 413 additions & 0 deletions
diff --git a/‎doc/source/tutorials.rst‎
Lines changed: 1 addition & 0 deletions b/‎doc/source/tutorials.rst‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎doc/source/tutorials/ReHLine_MF.rst‎
Lines changed: 294 additions & 1 deletion b/‎doc/source/tutorials/ReHLine_MF.rst‎
Lines changed: 294 additions & 1 deletion
diff --git a/‎rehline/__init__.py‎
Lines changed: 5 additions & 1 deletion b/‎rehline/__init__.py‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎rehline/_base.py‎
Lines changed: 14 additions & 0 deletions b/‎rehline/_base.py‎
Lines changed: 14 additions & 0 deletions
@@ -16,6 +16,7 @@ Example Gallery
    examples/Path_solution.ipynb
    examples/Warm_start.ipynb
    examples/Sklearn_Mixin.ipynb   
+   examples/MF.ipynb  
 
 List of Examples
 ----------------
@@ -30,4 +31,5 @@ List of Examples
    examples/RankRegression.ipynb
    examples/Path_solution.ipynb
    examples/Warm_start.ipynb
-   examples/Sklearn_Mixin.ipynb 
+   examples/Sklearn_Mixin.ipynb 
+   examples/MF.ipynb  
@@ -63,4 +63,5 @@ List of Tutorials
    ./tutorials/constraint
    ./tutorials/ReHLine_sklearn
    ./tutorials/warmstart
+   ./tutorials/ReHLine_MF
 
@@ -1,2 +1,295 @@
 ReHLine: Matrix Factorization
-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+This tutorial illustrates how to conduct Matrix Factorization (MF) with multiple PLQ loss functions through ReHLine. 
+We provide 2 versions of prediction methods:
+
+.. math::
+    \begin{aligned}
+    &\text{Including bias terms:}     && \hat{r}_{ui} = \mathbf{p}_u^T \mathbf{q}_i + \alpha_u + \beta_i \\
+    &\text{Excluding bias terms:}   && \hat{r}_{ui} = \mathbf{p}_u^T \mathbf{q}_i \\
+    \end{aligned}
+
+
+Mathematical Formulation
+------------------------
+
+Considering a User-Item-Rating triplet dataset :math:`(u, i, r_{ui})` derived from target sparse matrix, the optimization problem corresponding to this scenario is:
+
+.. math::
+        \min_{\substack{
+            \mathbf{P} \in \mathbb{R}^{n \times r}\ 
+            \pmb{\alpha} \in \mathbb{R}^n \\
+            \mathbf{Q} \in \mathbb{R}^{m \times r}\ 
+            \pmb{\beta} \in \mathbb{R}^m
+        }} 
+        \left[
+            \sum_{(u,i)\in \Omega} C \cdot \text{PLQ}(r_{ui}, \ \mathbf{p}_u^T \mathbf{q}_i + \alpha_u + \beta_i) 
+        \right]  
+        + 
+        \left[ 
+            \frac{\rho}{n}\sum_{u=1}^n(\|\mathbf{p}_u\|_2^2 + \alpha_u^2) 
+            + \frac{1-\rho}{m}\sum_{i=1}^m(\|\mathbf{q}_i\|_2^2 + \beta_i^2) 
+        \right]
+
+.. math::
+        \ \text{ s.t. } \ 
+        \mathbf{A} \begin{bmatrix}
+                        \pmb{\alpha} & \mathbf{P}
+                    \end{bmatrix}^T + 
+                    \mathbf{b}\mathbf{1}_{n}^T \geq \mathbf{0}
+        \ \text{ and } \ 
+        \mathbf{A} \begin{bmatrix}
+                        \pmb{\beta} & \mathbf{Q}
+                    \end{bmatrix}^T + 
+                    \mathbf{b}\mathbf{1}_{m}^T \geq \mathbf{0}
+
+
+where
+
+- :math:`\text{PLQ}(\cdot , \cdot)` 
+  is a convex piecewise linear-quadratic loss function. You can find built-in loss functions in the `Loss <./loss.rst>`_ section.
+  
+- :math:`\mathbf{A}` is a :math:`K \times r` matrix and :math:`\mathbf{b}` is a :math:`K`-dimensional vector 
+  representing :math:`K` linear constraints. See `Constraints <./constraint.rst>`_ for more details.
+
+- :math:`\Omega`
+  is a user-item collection that records all training data
+
+- :math:`n` is number of users, :math:`m` is number of items
+
+- :math:`r` is length of latent factors (rank of MF) 
+
+- :math:`C` is regularization parameter, :math:`\rho` balances regularization strength between user and item
+
+- :math:`\mathbf{p}_u` and :math:`\alpha_u`
+  are latent vector and individual bias of u-th user. Specifically, :math:`\mathbf{p}_u` is the u-th row of :math:`\mathbf{P}`, and :math:`\alpha_u` is the u-th element of :math:`\pmb{\alpha}`
+  
+- :math:`\mathbf{q}_i` and :math:`\beta_i`
+  are latent vector and individual bias of i-th item. Specifically, :math:`\mathbf{q}_i` is the i-th row of :math:`\mathbf{Q}`, and :math:`\beta_i` is the i-th element of :math:`\pmb{\beta}`
+
+
+Implementation Guide
+--------------------
+
+A simple synthetic dataset is used for illustration. The implementation can be easily adapted to your specific triplet data, allowing you to experiment with various loss functions.
+
+Setup
+^^^^^
+
+To proceed, ensure that you have already installed :code:`rehline`:
+
+.. code-block:: bash
+
+    pip install rehline
+
+Basic Usage
+^^^^^^^^^^^
+
+.. code-block:: python
+
+   # 1. Necessary Packages
+   import numpy as np
+   from rehline import plqMF_Ridge, make_ratings
+   from sklearn.model_selection import train_test_split
+   from sklearn.metrics import mean_absolute_error
+
+
+   # 2. Data Preparation
+   # Generate synthetic data (replace with your own data in practice)
+   user_num, item_num = 1200, 4000 
+   ratings = make_ratings(n_users=user_num, n_items=item_num, 
+                         n_interactions=50000, seed=42)
+   
+   # Split into training and testing sets
+   X_train, X_test, y_train, y_test = train_test_split(
+       ratings['X'], ratings['y'], test_size=0.3, random_state=42)
+
+
+   # 3. Model Construction
+   clf = plqMF_Ridge(
+       C=0.001,                        ## Regularization strength
+       rank=6,                         ## Latent factor dimension
+       loss={'name': 'mae'},           ## Use absolute loss
+       n_users=user_num,               ## Number of users
+       n_items=item_num,               ## Number of items
+   )
+   clf.fit(X_train, y_train)
+
+
+   # 4. Evaluation
+   y_pred = clf.decision_function(X_test)
+   mae_score = mean_absolute_error(y_test, y_pred)
+   print(f"Test MAE: {mae_score:.3f}")
+ 
+Advanced Configuration
+^^^^^^^^^^^^^^^^^^^^^^
+
+Choosing different `loss functions <./loss.rst>`_ through :code:`loss`:
+
+.. code-block:: python
+
+   # Square loss
+   clf_mse = plqMF_Ridge(
+        C=0.001, 
+        rank=6, 
+        loss={'name': 'mse'},          ## Choose square loss
+        n_users=user_num, 
+        n_items=item_num)
+   
+   # Hinge loss (suitable for binary data)
+   clf_hinge = plqMF_Ridge(
+        C=0.001, 
+        rank=6, 
+        loss={'name': 'hinge'},        ## Choose hinge loss
+        n_users=user_num, 
+        n_items=item_num)
+
+`Linear constraints <./constraint.rst>`_ can be applied via :code:`constraint`:
+
+.. code-block:: python
+
+   # Implement a linear constraint 
+   clf_nonnegative = plqMF_Ridge(
+        C=0.001, 
+        rank=6, 
+        loss={'name': 'mae'},
+        n_users=user_num, 
+        n_items=item_num,
+        constraint=[{'name': '>=0'}]   ## Use nonnegative constraint
+    )
+  
+The algorithm includes bias terms by default. To disable them, set: :code:`biased=False`:
+
+.. code-block:: python
+
+   # Exclude user and item biases
+   clf_unbiased = plqMF_Ridge(
+        C=0.001, 
+        rank=6, 
+        loss={'name': 'mae'},
+        n_users=user_num, 
+        n_items=item_num,
+        biased=False                   ## Disable bias terms
+    )
+  
+Imposing different strengths of regularization on items/users through :code:`rho`:
+
+.. code-block:: python
+
+   # Imbalanced penalty 
+   clf_asymmetric = plqMF_Ridge(
+        C=0.001, 
+        rank=6, 
+        loss={'name': 'mae'},
+        n_users=user_num, 
+        n_items=item_num,
+        rho=0.7                        ## Add heavier penalties for user parameters
+    )
+
+Parameter Tuning
+^^^^^^^^^^^^^^^^
+
+The model complexity is mainly controlled by :code:`C` and :code:`rank`. 
+
+.. code-block:: python
+
+   
+   for C_value in [0.0002, 0.001, 0.005]:
+       clf = plqMF_Ridge(
+            C=C_value,                 ## Try different regularization strengths
+            rank=6, 
+            loss={'name': 'mae'},
+            n_users=user_num, 
+            n_items=item_num
+        )
+       clf.fit(X_train, y_train)
+       y_pred = clf.decision_function(X_test)
+       mae = mean_absolute_error(y_test, y_pred)
+       print(f"C={C_value}: MAE = {mae:.3f}")
+
+
+   for rank_value in [4, 8, 12]:
+       clf = plqMF_Ridge(
+            C=0.001, 
+            rank=rank_value,           ## Try different latent factor dimensions
+            loss={'name': 'mae'},
+            n_users=user_num, 
+            n_items=item_num
+        )
+       clf.fit(X_train, y_train)
+       y_pred = clf.decision_function(X_test)
+       mae = mean_absolute_error(y_test, y_pred)
+       print(f"rank={rank_value}: MAE = {mae:.3f}")
+
+Convergence Tracking
+^^^^^^^^^^^^^^^^^^^^
+
+You can customize the optimization process by setting your preferred iteration counts and tolerance levels. 
+Training progress can be monitored either by enabling :code:`verbose` output during fitting or by examining the :code:`history` attribute after fitting.
+
+.. code-block:: python
+
+    clf = plqMF_Ridge(
+        C=0.001,               
+        rank=6,                
+        loss={'name': 'mae'},  
+        n_users=user_num,     
+        n_items=item_num,  
+        max_iter_CD=15,                ## Outer CD iterations
+        tol_CD=1e-5,                   ## Outer CD tolerance  
+        max_iter=8000,                 ## ReHLine solver iterations
+        tol=1e-2,                      ## ReHLine solver tolerance
+        verbose=1,                     ## Enable progress output
+    )
+    clf.fit(X_train, y_train)
+
+    print(clf.history)                 ## Check training trace of cumulative loss and objection value
+
+Different Gaussian initial conditions can be manually set by :code:`init_mean` and :code:`init_sd`:
+
+.. code-block:: python
+
+    # Initialize model with positive shifted normal 
+    clf = plqMF_Ridge(
+        C=0.001,
+        rank=6,
+        loss={'name': 'mae'},
+        n_users=user_num,
+        n_items=item_num,
+        init_mean=1.0,                 ## Manually set mean of normal distribution
+        init_sd=0.5                    ## Manually set sd of normal distribution
+    )
+
+Practical Guidance
+^^^^^^^^^^^^^^^^^^
+
+- The first column of :code:`X` corresponds to **users**, and the second column corresponds to **items**. Please ensure this aligns with your :code:`n_users` and :code:`n_items` parameters.
+- The default penalty strength is relatively weak; it is recommended to set a relatively small :code:`C` value initially.
+- When using larger :code:`C` values, consider increasing :code:`max_iter` to avoid ConvergenceWarning.
+
+
+Regularization Conversion
+-------------------------
+The regularization in this algorithm is tuned via :math:`C` and :math:`\rho`. For users who prefer to set the penalty strength directly, you may achieve conversion through the following formula:
+
+.. math::
+        \lambda_{\text{user}} = \frac{\rho}{Cn}
+        \quad\text{and}\quad  
+        \lambda_{\text{item}} = \frac{(1 - \rho)}{Cm}
+
+
+.. math::
+        C = \frac{1}{m \cdot \lambda_{\text{item}} + n \cdot \lambda_{\text{user}}}
+        \quad\text{and}\quad  
+        \rho = \frac{1}{\frac{m \cdot \lambda_{\text{item}}}{ n \cdot \lambda_{\text{user}}}+1}
+
+
+Example
+-------
+
+.. nblinkgallery::
+   :caption: Empirical Risk Minimization
+   :name: rst-link-gallery
+
+   ../examples/MF.ipynb
@@ -5,14 +5,18 @@
 from ._internal import rehline_internal, rehline_result
 from ._path_sol import plqERM_Ridge_path_sol
 from ._sklearn_mixin import plq_Ridge_Classifier, plq_Ridge_Regressor
+from ._mf_class import plqMF_Ridge
+from ._data import make_ratings 
 
 __all__ = ("_BaseReHLine",
            "ReHLine_solver",
            "ReHLine",
            "plqERM_Ridge",
            "CQR_Ridge",
+           "plqMF_Ridge",
            "plqERM_Ridge_path_sol",
            "plq_Ridge_Classifier",
            "plq_Ridge_Regressor",
            "_make_loss_rehline_param",
-           "_make_constraint_rehline_param")
+           "_make_constraint_rehline_param",
+           "make_ratings")
@@ -393,6 +393,20 @@ def _make_loss_rehline_param(loss, X, y):
         U = np.array([[1.0] * n, [-1.0] * n])
         V = np.array([-y , y])
 
+    elif (loss['name'] == 'SVM square') \
+            or (loss['name'] == 'svm square') \
+            or (loss['name'] == 'hinge square'):
+        Tau = np.inf * np.ones((1, n)) 
+        S = - np.sqrt(2) * y.reshape(1,-1)
+        T = np.sqrt(2) * np.ones((1, n)) 
+
+    elif (loss['name'] == 'MSE') \
+            or (loss['name'] == 'mse') \
+            or (loss['name'] == 'mean square error'):
+        Tau = np.inf * np.ones((2, n)) 
+        S = np.array([[np.sqrt(2)] * n, [-np.sqrt(2)] * n])
+        T = np.array([-np.sqrt(2) * y , np.sqrt(2) * y])
+
 
     else:
         raise Exception("Sorry, ReHLine currently does not support this loss function, \