cloudexplain
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 3 additions & 2 deletions
diff --git a/src/xaiflow/mlflow_plugin.py b/src/xaiflow/mlflow_plugin.py
Lines changed: 25 additions & 173 deletions
diff --git a/src/xaiflow/templates/assets/bundle.js b/src/xaiflow/templates/assets/bundle.js
Lines changed: 5 additions & 5 deletions
diff --git a/src/xaiflow/templates/assets/bundle.js.map b/src/xaiflow/templates/assets/bundle.js.map
Lines changed: 1 addition & 1 deletion
diff --git a/src/xaiflow/templates/components/DeepDiveChart.svelte b/src/xaiflow/templates/components/DeepDiveChart.svelte
Lines changed: 17 additions & 7 deletions
diff --git a/src/xaiflow/templates/components/DeepDiveManager.svelte b/src/xaiflow/templates/components/DeepDiveManager.svelte
Lines changed: 1 addition & 1 deletion
diff --git a/src/xaiflow/templates/utils/utils.ts b/src/xaiflow/templates/utils/utils.ts
Lines changed: 1 addition & 0 deletions
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "xaiflow"
-version = "0.1.0rc5"
+version = "0.1.0rc6"
 description = "MLflow integration library for generating interactive HTML reports with SHAP analysis using Svelte and Chart.js"
 authors = [
     {name = "CloudExplain Team", email = "tobias@cloudexplain.eu"}
@@ -41,7 +41,8 @@ dev = [
     "pytest-cov>=2.12.0",
     "black>=21.0.0",
     "flake8>=3.9.0",
-    "playwright"
+    "playwright",
+    "pytest-mock",
 ]
 
 [project.urls]
 
@@ -5,6 +5,7 @@
 
 import os
 import json
+import warnings
 import tempfile
 import shutil
 import mlflow
@@ -33,7 +34,8 @@ def log_feature_importance_report(
         importance_values: List[float] | np.ndarray = None,
         run_id: Optional[str] = None,
         artifact_path: str = "reports",
-        report_name: str = "feature_importance_report.html"
+        report_name: str = "feature_importance_report.html",
+        round_decimals: int = 4
     ) -> str:
         """
         Log an interactive feature importance report as an MLflow artifact
@@ -45,16 +47,33 @@ def log_feature_importance_report(
             run_id: MLflow run ID (uses active run if None)
             artifact_path: Path within MLflow artifacts to store the report
             report_name: Name of the HTML report file
+            round_decimals: Number of decimals to round feature values and SHAP values
             
         Returns:
             str: Path to the logged artifact
         """
 
         if not isinstance(shap_values, Explanation):
             raise ValueError("shap_values must be an instance of shap.Explanation. Pls call explainer(X) or similar to get a valid Explanation object.")
-        feature_values = shap_values.data
-        base_values = shap_values.base_values
-        shap_values = shap_values.values
+        if np.issubdtype(shap_values.data.dtype, np.floating):
+            feature_values = np.round(shap_values.data, round_decimals)
+        else:
+            feature_values = shap_values.data
+        base_values = np.round(shap_values.base_values, round_decimals)[0]
+        shap_values = np.round(shap_values.values, round_decimals)
+        if feature_values.ndim != shap_values.ndim:
+            if shap_values.ndim - feature_values.ndim > 1:
+                NotImplementedError("It looks like you're using multi-target regression or multi-output classification. Currently we don't support this."
+                              " You can still use the plugin, just hand over shap_values[..., <target_index>] to get the SHAP values for a specific target/class."
+                              " Please ensure that the shap_values.dim - feature_values.dim is 1 or less.")
+            else:
+                warnings.warn("Feature values and SHAP values dimensions do not match. This can be due to multi-target regression or (multi-target) classification."
+                              " If you want a specific target/class, please hand over shap_values[..., <target_index>] to get the SHAP values for that target/class."
+                              " We fall back to shap_values[..., -1] in this case."
+                )
+                shap_values = shap_values[..., -1]
+                base_values = float(base_values[-1])
+
         # Use active run if no run_id provided
         if run_id is None:
             active_run = mlflow.active_run()
@@ -95,8 +114,8 @@ def log_feature_importance_report(
             with open(temp_path, 'w', encoding='utf-8') as f:
                 f.write(html_content)
 
-            with open('test_report.html', 'w', encoding='utf-8') as f:
-                f.write(html_content)
+            # with open('test_report.html', 'w', encoding='utf-8') as f:
+            #     f.write(html_content)
 
             # Log the report as an MLflow artifact
             artifact_full_path = f"{artifact_path}/{report_name}"
@@ -119,104 +138,6 @@ def log_feature_importance_report(
             if os.path.exists(temp_path):
                 os.unlink(temp_path)
 
-    def log_model_explanation_report(
-        self,
-        model,
-        X_test: np.ndarray,
-        y_test: np.ndarray,
-        feature_names: List[str],
-        model_name: str = "model",
-        run_id: Optional[str] = None,
-        artifact_path: str = "reports",
-        report_name: str = "model_explanation_report.html"
-    ) -> str:
-        """
-        Log a comprehensive model explanation report with SHAP analysis
-        
-        Args:
-            model: Trained model object
-            X_test: Test data features
-            y_test: Test data targets
-            feature_names: List of feature names
-            model_name: Name of the model
-            run_id: MLflow run ID (uses active run if None)
-            artifact_path: Path within MLflow artifacts to store the report
-            report_name: Name of the HTML report file
-            
-        Returns:
-            str: Path to the logged artifact
-        """
-        
-        try:
-            import shap
-        except ImportError:
-            raise ImportError("SHAP is required for model explanation reports. Install with: pip install shap")
-        
-        # Use active run if no run_id provided
-        if run_id is None:
-            active_run = mlflow.active_run()
-            if active_run is None:
-                raise ValueError("No active MLflow run found. Please start a run or provide run_id.")
-            run_id = active_run.info.run_id
-        
-        # Calculate feature importance (if model supports it)
-        try:
-            if hasattr(model, 'feature_importances_'):
-                importance_values = model.feature_importances_.tolist()
-            elif hasattr(model, 'coef_'):
-                importance_values = np.abs(model.coef_).flatten().tolist()
-            else:
-                # Use permutation importance as fallback
-                from sklearn.inspection import permutation_importance
-                perm_importance = permutation_importance(model, X_test, y_test, random_state=42)
-                importance_values = perm_importance.importances_mean.tolist()
-        except Exception as e:
-            print(f"Warning: Could not calculate feature importance: {e}")
-            importance_values = [1.0 / len(feature_names)] * len(feature_names)
-        
-        # Calculate SHAP values
-        try:
-            # Use TreeExplainer for tree-based models, LinearExplainer for linear models
-            if hasattr(model, 'tree_'):
-                explainer = shap.TreeExplainer(model)
-            else:
-                explainer = shap.LinearExplainer(model, X_test)
-            
-            # Calculate SHAP values for a subset of test data (for performance)
-            sample_size = min(100, len(X_test))
-            sample_indices = np.random.choice(len(X_test), sample_size, replace=False)
-            X_sample = X_test[sample_indices]
-            
-            shap_values_matrix = explainer.shap_values(X_sample)
-            
-            # Handle multi-class case (take first class for now)
-            if isinstance(shap_values_matrix, list):
-                shap_values_matrix = shap_values_matrix[0]
-            
-            shap_values = shap_values_matrix.tolist()
-            
-        except Exception as e:
-            print(f"Warning: Could not calculate SHAP values: {e}")
-            # Generate dummy SHAP values
-            sample_size = min(100, len(X_test))
-            shap_values = []
-            for _ in range(sample_size):
-                sample_shap = [
-                    np.random.normal(0, abs(imp_val) * 0.1) 
-                    for imp_val in importance_values
-                ]
-                shap_values.append(sample_shap)
-        
-        # Log the report
-        return self.log_feature_importance_report(
-            feature_names=feature_names,
-            importance_values=importance_values,
-            shap_values=shap_values,
-            run_id=run_id,
-            artifact_path=artifact_path,
-            report_name=report_name
-        )
-    
     def _generate_html_content(
         self,
         importance_data: Dict[str, Any],
@@ -289,72 +210,3 @@ def _generate_html_content(
         )
 
         return html_content
-        # Write to file
-    
-    def get_report_url(self, run_id: str, artifact_path: str = "reports", report_name: str = "feature_importance_report.html") -> str:
-        """
-        Get the MLflow UI URL for viewing the report
-        
-        Args:
-            run_id: MLflow run ID
-            artifact_path: Path within MLflow artifacts where the report is stored
-            report_name: Name of the HTML report file
-            
-        Returns:
-            str: URL to view the report in MLflow UI
-        """
-        
-        # Get the MLflow tracking URI
-        tracking_uri = mlflow.get_tracking_uri()
-        
-        # Construct the artifact URL
-        artifact_full_path = f"{artifact_path}/{report_name}"
-        
-        if tracking_uri.startswith("http"):
-            # Remote MLflow server
-            base_url = tracking_uri.rstrip('/')
-            url = f"{base_url}/#/experiments/runs/{run_id}/artifacts/{artifact_full_path}"
-        else:
-            # Local MLflow server (assume default port 5000)
-            url = f"http://localhost:5000/#/experiments/runs/{run_id}/artifacts/{artifact_full_path}"
-        
-        return url
-
-
-# Convenience functions for easy usage
-def log_feature_importance(
-    feature_names: List[str],
-    importance_values: List[float],
-    shap_values: Optional[List[List[float]]] = None,
-    **kwargs
-) -> str:
-    """
-    Convenience function to log feature importance report to MLflow
-    """
-    plugin = XaiflowPlugin()
-    return plugin.log_feature_importance_report(
-        feature_names=feature_names,
-        importance_values=importance_values,
-        shap_values=shap_values,
-        **kwargs
-    )
-
-
-def log_model_explanation(
-    model,
-    X_test: np.ndarray,
-    y_test: np.ndarray,
-    feature_names: List[str],
-    **kwargs
-) -> str:
-    """
-    Convenience function to log model explanation report to MLflow
-    """
-    plugin = XaiflowPlugin()
-    return plugin.log_model_explanation_report(
-        model=model,
-        X_test=X_test,
-        y_test=y_test,
-        feature_names=feature_names,
-        **kwargs
-    )
@@ -10,6 +10,7 @@
   
     // Register the necessary components
     Chart.register(BarController, BarElement, CategoryScale, LinearScale, Title, Tooltip, Legend);
+    console.log("DeepDiveChart: NEWNEWNEW Initialized Chart.js components");
 
     interface Props {
       shapValues: number[][];
@@ -85,11 +86,11 @@
     }
   
     function updateChart(singleShapValues: number[]) {
-      console.log("updateChart called with singleShapValues:", singleShapValues, "and singleFeatureValues:", singleFeatureValues);
+      console.log("DeepDiveChart: updateChart called with singleShapValues:", singleShapValues, "and singleFeatureValues:", singleFeatureValues);
       maxOfData = Math.max(...singleShapValues);
       minOfData = Math.min(...singleShapValues);
       const screen = getScreenSizeFlags();
-      console.log("Screen size flags:", screen);
+      console.log("DeepDiveChart: Screen size flags:", screen);
       
       // Color mapping based on isHigherOutputBetter prop
       pointBackgroundColor = singleShapValues.map(d => {
@@ -99,20 +100,29 @@
         // If higher output is NOT better, use normal color mapping (red=high, green=low)
         const colorValue = isHigherOutputBetter ? (100 - normalizedValue) : normalizedValue;
         
+        console.log("Normalized Value:", normalizedValue, "Color Value:", colorValue);
         return colorMap(colorValue);
         // return colorValue;
       });
       
       console.log("Max of Data", maxOfData);
       console.log("Min of Data", minOfData);
-  
+
       if (chart) {
         chart.data.labels = featureNames;
+        console.log("DeepDiveChart: NEW Updating chart with new data", singleShapValues, featureNames, base_value);
         cumulativeValues = createCumulativeStartEndRangesFromValues(singleShapValues, base_value)
+        console.log("DeepDiveChart: NEW 2 Updating chart with new data", cumulativeValues);
         chart.data.datasets[0].data = cumulativeValues;
         maxCumulativeValue = Math.max(...cumulativeValues.map(d => d[1]));
-        console.log("Max Cumulative Value", maxCumulativeValue);
         chart.data.datasets[0].backgroundColor = pointBackgroundColor;
+        // Dynamically update y-axis min and max
+        console.log("DeepDiveChart: Updating chart with new data", cumulativeValues, pointBackgroundColor);
+        if (chart.options.scales?.y) {
+          console.log("DeepDiveChart: Updating y-axis min and max to ", Math.floor(minOfData), Math.ceil(maxOfData * 1.05));
+          chart.options.scales.y.min = Math.floor(minOfData);
+          chart.options.scales.y.max = Math.ceil(maxOfData * 1.05);
+        }
         // Update x-axis rotation based on screen size
         if (chart.options.scales?.x?.ticks) {
           chart.options.scales.x.ticks.maxRotation = screen.isLargeScreen ? 45 : 90;
@@ -247,8 +257,8 @@
               }
             },
             y: {
-              min: 0,
-              max: Math.floor(maxCumulativeValue * 1.3),
+              min: Math.floor(minOfData * 0.95),
+              max: Math.ceil(maxOfData * 1.05),
               ticks: {
                 font: {
                   size: window.innerWidth < 768 ? 8 : window.innerWidth < 1024 ? 10 : 12
@@ -401,7 +411,7 @@
     });
   </script>
 
-  <canvas bind:this={chartCanvas}></canvas>
+  <canvas id="deepdive-canvas" bind:this={chartCanvas}></canvas>
 
   <style>
     canvas {
 
@@ -104,7 +104,7 @@
 </script>
 
 <div>
-<div class="observation-dropdown" style="position:relative;max-width:300px;">
+<div class="deepdive-observation-dropdown" style="position:relative;max-width:300px;">
     <label for="observation-filter">Filter Observations:</label>
     <input id="observation-filter" type="text" bind:value={filterText} placeholder="Type to filter..."
         on:focus={handleInputFocus} on:blur={handleInputBlur} autocomplete="off" />
 
@@ -1,6 +1,7 @@
 export function createCumulativeStartEndRangesFromValues(array: number[], base_value: number): [number, number][] {
   let cumulative = 0;
   return array.map((value, index) => {
+    console.log("createCumulativeStartEndRangesFromValues: index", index, "value", value, "cumulative", cumulative, "base_value", base_value);
     if (index === 0) {
       cumulative = base_value;
     }
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,7 @@`
`1`	`1`	`export function createCumulativeStartEndRangesFromValues(array: number[], base_value: number): [number, number][] {`
`2`	`2`	`let cumulative = 0;`
`3`	`3`	`return array.map((value, index) => {`
	`4`	`+ console.log("createCumulativeStartEndRangesFromValues: index", index, "value", value, "cumulative", cumulative, "base_value", base_value);`
`4`	`5`	`if (index === 0) {`
`5`	`6`	`cumulative = base_value;`
`6`	`7`	`}`