instadeepai
diff --git a/‎src/mlipaudit/benchmarks/nudged_elastic_band/nudged_elastic_band.py‎
Lines changed: 1 addition & 0 deletions b/‎src/mlipaudit/benchmarks/nudged_elastic_band/nudged_elastic_band.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/mlipaudit/benchmarks/sampling/helpers.py‎
Lines changed: 2 additions & 2 deletions b/‎src/mlipaudit/benchmarks/sampling/helpers.py‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎src/mlipaudit/ui/bond_length_distribution.py‎
Lines changed: 5 additions & 16 deletions b/‎src/mlipaudit/ui/bond_length_distribution.py‎
Lines changed: 5 additions & 16 deletions
diff --git a/‎src/mlipaudit/ui/conformer_selection.py‎
Lines changed: 9 additions & 5 deletions b/‎src/mlipaudit/ui/conformer_selection.py‎
Lines changed: 9 additions & 5 deletions
diff --git a/‎src/mlipaudit/ui/dihedral_scan.py‎
Lines changed: 16 additions & 8 deletions b/‎src/mlipaudit/ui/dihedral_scan.py‎
Lines changed: 16 additions & 8 deletions
diff --git a/‎src/mlipaudit/ui/folding_stability.py‎
Lines changed: 64 additions & 54 deletions b/‎src/mlipaudit/ui/folding_stability.py‎
Lines changed: 64 additions & 54 deletions
diff --git a/‎src/mlipaudit/ui/noncovalent_interactions.py‎
Lines changed: 7 additions & 3 deletions b/‎src/mlipaudit/ui/noncovalent_interactions.py‎
Lines changed: 7 additions & 3 deletions
@@ -160,6 +160,7 @@ class NEBResult(BenchmarkResult):
     Attributes:
         reaction_results: A list of the individual reaction results,
             with one entry per reaction.
+        convergence_rate: The fraction of converged reactions.
     """
 
     reaction_results: list[NEBReactionResult]
 
@@ -117,13 +117,13 @@ def calculate_distribution_hellinger_distance(
         reference_hist: Reference histogram array
         sampled_hist: Sampled histogram array
         normalize: Whether to normalize histograms before comparison (only
-        set this to False if the histograms are already normalized).
+            set this to False if the histograms are already normalized).
 
     Raises:
         ValueError: If the histograms have different shapes.
 
     Returns:
-        float: Hellinger distance between the two distributions
+        The Hellinger distance between the two distributions.
     """
     if reference_hist.shape != sampled_hist.shape:
         raise ValueError("Histograms must have the same shape")
 
@@ -92,31 +92,20 @@ def bond_length_distribution_page(
     distribution_data = [
         {
             "Model name": model_name,
-            "Average deviation": result.avg_deviation,
+            "Average deviation (Å)": result.avg_deviation,
             "Score": result.score,
         }
         for model_name, result in data.items()
         if model_name in selected_models
     ]
 
+    st.markdown("## Summary statistics")
+
     df = pd.DataFrame(distribution_data)
 
     df.sort_values("Score", ascending=False, inplace=True)
     display_model_scores(df)
 
-    st.markdown("## Best model summary")
-
-    # Get best model
-    best_model_row = df.loc[df["Score"].idxmax()]
-    best_model_name = best_model_row["Model name"]
-
-    st.markdown(f"The best model is **{best_model_name}**.")
-
-    st.metric(
-        "Total average deviation (absolute)",
-        f"{float(best_model_row['Average deviation']):.3f}",
-    )
-
     st.markdown("## Bond length deviation distribution per model")
 
     # Get all unique ring types from the data
@@ -154,7 +143,7 @@ def bond_length_distribution_page(
                 .encode(
                     x=alt.X(
                         "Model name:N",
-                        title="Model name",
+                        title="Model",
                         axis=alt.Axis(labelAngle=-45, labelLimit=100),
                     ),
                     y=alt.Y(
@@ -164,7 +153,7 @@ def bond_length_distribution_page(
                     ),
                     color=alt.Color(
                         "Model name:N",
-                        title="Model name",
+                        title="Model",
                         legend=alt.Legend(orient="top"),
                     ),
                 )
 
@@ -115,8 +115,6 @@ def conformer_selection_page(
     with col3:
         create_st_image(CONFORMER_IMG_DIR / "rsz_efa00.png", "Efavirenz")
 
-    st.markdown("## Summary statistics")
-
     # Download data and get model names
     if "conformer_selection_cached_data" not in st.session_state:
         st.session_state.conformer_selection_cached_data = data_func()
@@ -137,13 +135,15 @@ def conformer_selection_page(
         return
 
     df = _process_data_into_dataframe(data, selected_models)
+
+    st.markdown("## Summary statistics")
+
     df_display = df.copy()
     df_display.index.name = "Model name"
     df_display.sort_values("Score", ascending=False, inplace=True)
     display_model_scores(df_display)
 
     st.markdown("## MAE and RMSE per model")
-    st.markdown("")
 
     # Melt the dataframe to prepare for Altair chart
     chart_df = (
@@ -202,7 +202,11 @@ def conformer_selection_page(
             alt.Chart(error_chart_df)
             .mark_bar()
             .encode(
-                x=alt.X("Molecule:N", title="Molecule"),
+                x=alt.X(
+                    "Molecule:N",
+                    title="Molecule",
+                    axis=alt.Axis(labelAngle=-45, labelLimit=100),
+                ),
                 y=alt.Y("Value:Q", title="Error (kcal/mol)"),
                 color="Metric:N",
                 xOffset="Metric:N",
@@ -258,7 +262,7 @@ def conformer_selection_page(
         .mark_circle(size=80, opacity=0.7)
         .encode(
             x=alt.X("Reference Energy:Q", title="Reference Energy (kcal/mol)"),
-            y=alt.Y("Predicted Energy:Q", title="Inferred Energy (kcal/mol)"),
+            y=alt.Y("Predicted Energy:Q", title="Predicted Energy (kcal/mol)"),
             tooltip=["Reference Energy:Q", "Energy:Q"],
         )
         .properties(
 
@@ -150,9 +150,10 @@ def dihedral_scan_page(
         {
             "Model name": model_name,
             "Score": result.score,
-            "MAE": result.avg_mae * conversion_factor,
-            "RMSE": result.avg_rmse * conversion_factor,
-            "Barrier Height Error": result.mae_barrier_height * conversion_factor,
+            f"MAE ({selected_energy_unit})": result.avg_mae * conversion_factor,
+            f"RMSE ({selected_energy_unit})": result.avg_rmse * conversion_factor,
+            f"Barrier Height MAE ({selected_energy_unit})": result.mae_barrier_height
+            * conversion_factor,
             "Pearson Correlation": result.avg_pearson_r,
         }
         for model_name, result in data.items()
@@ -174,20 +175,27 @@ def dihedral_scan_page(
 
     st.markdown("## Mean barrier height error")
     df_barrier = df[df["Model name"].isin(selected_models)][
-        ["Model name", "Barrier Height Error"]
+        ["Model name", f"Barrier Height MAE ({selected_energy_unit})"]
     ]
 
     barrier_chart = (
         alt.Chart(df_barrier)
         .mark_bar()
         .encode(
-            x=alt.X("Model name:N", title="Model ID"),
+            x=alt.X(
+                "Model name:N",
+                title="Model",
+                axis=alt.Axis(labelAngle=-45, labelLimit=100),
+            ),
             y=alt.Y(
-                "Barrier Height Error:Q",
+                f"Barrier Height MAE ({selected_energy_unit}):Q",
                 title=f"Mean Barrier Height Error ({selected_energy_unit})",
             ),
-            color=alt.Color("Model name:N", title="Model ID"),
-            tooltip=["Model name:N", "Barrier Height Error:Q"],
+            color=alt.Color("Model name:N", title="Model"),
+            tooltip=[
+                alt.Tooltip("Model name:N", title="Model"),
+                f"Barrier Height MAE ({selected_energy_unit}):Q",
+            ],
         )
         .properties(
             width=600,
 
@@ -34,37 +34,39 @@ def _data_to_dataframes(
     agg_data = []
 
     for model_name, result in data.items():
-        if model_name in selected_models:
-            for molecule_result in result.molecules:
-                if not molecule_result.failed:
-                    for idx in range(len(molecule_result.rmsd_trajectory)):  # type: ignore
-                        rad_of_gyr_dev = (
-                            molecule_result.radius_of_gyration_deviation[idx]  # type: ignore
-                        )
-                        plot_data.append({
-                            "Model": model_name,
-                            "Structure": molecule_result.structure_name,
-                            "Frame": idx,
-                            "RMSD": molecule_result.rmsd_trajectory[idx],  # type: ignore
-                            "TM score": molecule_result.tm_score_trajectory[idx],  # type: ignore
-                            "Rad of Gyr Dev": rad_of_gyr_dev,
-                            "DSSP match": molecule_result.match_secondary_structure[
-                                idx
-                            ],  # type: ignore
-                        })
-                        # Next line is to stay within max. line length below
-                        max_dev_rad_of_gyr = (
-                            molecule_result.max_abs_deviation_radius_of_gyration
-                        )
-                        agg_data.append({
-                            "Model": model_name,
-                            "Score": result.score,
-                            "Structure": molecule_result.structure_name,
-                            "avg. RMSD": molecule_result.avg_rmsd,
-                            "avg. TM score": molecule_result.avg_tm_score,
-                            "avg. DSSP match": molecule_result.avg_match,
-                            "max. abs. dev. Rad. of Gyr.": max_dev_rad_of_gyr,
-                        })
+        if model_name not in selected_models:
+            continue
+
+        for molecule_result in result.molecules:
+            if molecule_result.failed:
+                continue
+
+            for idx in range(len(molecule_result.rmsd_trajectory)):  # type: ignore
+                plot_data.append({
+                    "Model": model_name,
+                    "Structure": molecule_result.structure_name,
+                    "Frame": idx,
+                    "RMSD": molecule_result.rmsd_trajectory[idx],  # type: ignore
+                    "TM score": molecule_result.tm_score_trajectory[idx],  # type: ignore
+                    "Rad of Gyr Dev": molecule_result.radius_of_gyration_deviation[  # type: ignore
+                        idx
+                    ],
+                    "DSSP match": molecule_result.match_secondary_structure[idx],  # type: ignore
+                })
+                # Next line is to stay within max. line length below
+                max_dev_rad_of_gyr = (
+                    molecule_result.max_abs_deviation_radius_of_gyration
+                )
+                agg_data.append({
+                    "Model": model_name,
+                    "Score": result.score,
+                    "Structure": molecule_result.structure_name,
+                    "Average RMSD (Å)": molecule_result.avg_rmsd,
+                    "Average TM score": molecule_result.avg_tm_score,
+                    "Average DSSP match": molecule_result.avg_match,
+                    "Maximum absolute deviation"
+                    " of the radius of gyration (Å)": max_dev_rad_of_gyr,
+                })
 
     df = pd.DataFrame(plot_data)
     df_agg = pd.DataFrame(agg_data)
@@ -91,10 +93,10 @@ def _transform_dataframes_for_visualization(
         df_agg_filtered.groupby("Model")
         .agg({
             "Score": "mean",
-            "avg. RMSD": "mean",
-            "avg. TM score": "mean",
-            "avg. DSSP match": "mean",
-            "max. abs. dev. Rad. of Gyr.": "mean",
+            "Average RMSD (Å)": "mean",
+            "Average TM score": "mean",
+            "Average DSSP match": "mean",
+            "Maximum absolute deviation of the radius of gyration (Å)": "mean",
         })
         .round(4)
         .reset_index()
@@ -114,27 +116,32 @@ def _transform_dataframes_for_visualization(
 
     # Ensure numeric values for aggregation
     df_agg_filtered_numeric = df_agg_filtered.copy()
-    df_agg_filtered_numeric["avg. RMSD"] = pd.to_numeric(
-        df_agg_filtered_numeric["avg. RMSD"], errors="coerce"
+    df_agg_filtered_numeric["Average RMSD (Å)"] = pd.to_numeric(
+        df_agg_filtered_numeric["Average RMSD (Å)"], errors="coerce"
     )
-    df_agg_filtered_numeric["avg. TM score"] = pd.to_numeric(
-        df_agg_filtered_numeric["avg. TM score"], errors="coerce"
+    df_agg_filtered_numeric["Average TM score"] = pd.to_numeric(
+        df_agg_filtered_numeric["Average TM score"], errors="coerce"
     )
-    df_agg_filtered_numeric["avg. DSSP match"] = pd.to_numeric(
-        df_agg_filtered_numeric["avg. DSSP match"], errors="coerce"
+    df_agg_filtered_numeric["Average DSSP match"] = pd.to_numeric(
+        df_agg_filtered_numeric["Average DSSP match"], errors="coerce"
     )
-    df_agg_filtered_numeric["max. abs. dev. Rad. of Gyr."] = pd.to_numeric(
-        df_agg_filtered_numeric["max. abs. dev. Rad. of Gyr."], errors="coerce"
+    df_agg_filtered_numeric[
+        "Maximum absolute deviation of the radius of gyration (Å)"
+    ] = pd.to_numeric(
+        df_agg_filtered_numeric[
+            "Maximum absolute deviation of the radius of gyration (Å)"
+        ],
+        errors="coerce",
     )
 
     # Calculate averages across structures for each model
     avg_metrics = (
         df_agg_filtered_numeric.groupby("Model")
         .agg({
-            "avg. RMSD": "mean",
-            "avg. TM score": "mean",
-            "avg. DSSP match": "mean",
-            "max. abs. dev. Rad. of Gyr.": "mean",
+            "Average RMSD (Å)": "mean",
+            "Average TM score": "mean",
+            "Average DSSP match": "mean",
+            "Maximum absolute deviation of the radius of gyration (Å)": "mean",
         })
         .reset_index()
     )
@@ -146,10 +153,10 @@ def _transform_dataframes_for_visualization(
     metrics_long = avg_metrics.melt(
         id_vars=["Model"],
         value_vars=[
-            "avg. RMSD",
-            "avg. TM score",
-            "avg. DSSP match",
-            "max. abs. dev. Rad. of Gyr.",
+            "Average RMSD (Å)",
+            "Average TM score",
+            "Average DSSP match",
+            "Maximum absolute deviation of the radius of gyration (Å)",
         ],
         var_name="Metric",
         value_name="Value",
@@ -236,10 +243,13 @@ def folding_stability_page(
     #  the lower/closer to 0 the value the better
     #  and one for  the closer to 1 the value the better
     metrics_long_0 = metrics_long[
-        metrics_long["Metric"].isin(["avg. RMSD", "max. abs. dev. Rad. of Gyr."])
+        metrics_long["Metric"].isin([
+            "Average RMSD (Å)",
+            "Maximum absolute deviation of the radius of gyration (Å)",
+        ])
     ].copy()
     metrics_long_1 = metrics_long[
-        metrics_long["Metric"].isin(["avg. TM score", "avg. DSSP match"])
+        metrics_long["Metric"].isin(["Average TM score", "Average DSSP match"])
     ].copy()
     st.markdown("### RMSD and Radius of Gyration")
     # Create a grouped bar chart
@@ -253,7 +263,7 @@ def folding_stability_page(
                 sort=None,
                 axis=alt.Axis(labelAngle=-45, labelLimit=100),
             ),
-            y=alt.Y("Value:Q", title="Value"),
+            y=alt.Y("Value:Q", title="Metric"),
             color=alt.Color("Metric:N", title="Metric"),
             xOffset=alt.XOffset("Metric:N"),
             tooltip=["Model:N", "Metric:N", "Value:Q"],
 
@@ -227,7 +227,7 @@ def noncovalent_interactions_page(
     )
 
     # Drop the score for the rest of processing
-    df_subset.drop(columns=["Score"])
+    df_subset = df_subset.drop(columns=["Score"])
 
     # Reshape dataframe for Altair plotting
     df_melted = (
@@ -251,9 +251,13 @@ def noncovalent_interactions_page(
             ),
             x=alt.X("RMSE:Q", title="RMSE (kcal/mol)"),
             yOffset=alt.YOffset("Model name:N"),
-            color=alt.Color("Model name:N", title="Model Name"),
+            color=alt.Color("Model name:N", title="Model"),
             opacity=alt.condition(selection, alt.value(0.8), alt.value(0.3)),
-            tooltip=["Model name:N", "Interaction type:N", "RMSE:Q"],
+            tooltip=[
+                alt.Tooltip("Model name:N", title="Model"),
+                "Interaction type:N",
+                "RMSE:Q",
+            ],
         )
         .resolve_scale(color="independent")
         .properties(