1 change: 1 addition & 0 deletions octopus/study/data_preparator.py
@@ -106,6 +106,7 @@ def _transform_bool_to_int(self):
     def _create_row_id_col(self):
         """Create a unique row identifier if not provided."""
         if not self.row_id_col:
+            self.data = self.data.copy()
Copilot AI Mar 11, 2026
This copy() rebinds self.data to a new DataFrame only when row_id_col is not provided. In OctoStudy.fit, the original data object is later persisted as data_raw.parquet, so this change will stop the auto-generated row_id column from appearing in data_raw.parquet (previously it did). If data_raw.parquet is expected to include row_id, you’ll need to adjust how/when the copy happens (or how raw vs prepared data is written) to keep outputs consistent.

Suggested change:
-            self.data = self.data.copy()

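The rebinding issue this comment describes can be reproduced in a few lines. This is a hypothetical sketch, not code from the PR: `Preparator` stands in for the real data preparator class, and `raw` for the DataFrame that OctoStudy.fit would later persist as data_raw.parquet.

```python
import pandas as pd

# Hypothetical stand-in for the DataFrame later written to data_raw.parquet.
raw = pd.DataFrame({"a": [10, 20, 30]})

class Preparator:
    def __init__(self, data):
        self.data = data  # the caller still holds its own reference to `raw`

    def create_row_id(self):
        self.data = self.data.copy()  # rebinds self.data to a NEW DataFrame
        self.data["row_id"] = list(range(len(self.data)))

prep = Preparator(raw)
prep.create_row_id()

print("row_id" in prep.data.columns)  # True
print("row_id" in raw.columns)        # False: the caller's object never gains the column
```

Because the copy rebinds the attribute rather than mutating the shared object, anything that still writes out the caller's original DataFrame will no longer contain the auto-generated row_id column.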
             self.data["row_id"] = list(range(len(self.data)))
Comment on lines +109 to 110
Copilot AI Mar 11, 2026
self.data = self.data.copy() performs a deep copy of the entire DataFrame, which can be very memory- and time-expensive on large datasets and may negate the performance win from defragmentation. Consider an approach that avoids copying the full underlying data (e.g., a shallow copy followed by assignment of the new column) while still preventing fragmentation warnings, and document the intended tradeoff here if the deep copy is required.

Suggested change:
-            self.data = self.data.copy()
-            self.data["row_id"] = list(range(len(self.data)))
+            # Use a shallow copy to avoid the cost of a full deep copy of the DataFrame
+            # while still ensuring we don't mutate any external references to the original object.
+            self.data = self.data.copy(deep=False)
+            self.data["row_id"] = np.arange(len(self.data))

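A quick sanity check on the suggested shallow copy (a minimal sketch assuming plain pandas semantics, not code from the PR): assigning a new column to a `deep=False` copy does not appear on the original object, and the existing column payload is not duplicated up front.

```python
import numpy as np
import pandas as pd

big = pd.DataFrame(np.zeros((100_000, 5)), columns=list("abcde"))

shallow = big.copy(deep=False)           # new DataFrame object, shared column data
shallow["row_id"] = np.arange(len(shallow))

print("row_id" in shallow.columns)  # True
print("row_id" in big.columns)      # False: the original's schema is untouched
```

The caveat the comment alludes to: on pre-Copy-on-Write pandas, in-place edits to an *existing* column of a shallow copy can still be visible on the original, which is exactly the tradeoff worth documenting if this route is taken.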
Copilot AI Mar 11, 2026
list(range(len(self.data))) materializes a Python list of all row ids, which is avoidable overhead for large datasets. Prefer generating row ids with a vectorized range (e.g., via NumPy/Pandas range types) to reduce memory pressure and speed up column creation.

Suggested change:
-            self.data["row_id"] = list(range(len(self.data)))
+            self.data["row_id"] = pd.RangeIndex(len(self.data))

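The three variants discussed in this thread produce the same values; the difference is only in how the range is materialized. A quick illustrative check (the `id_*` column names are hypothetical, not from the PR):

```python
import numpy as np
import pandas as pd

df = pd.DataFrame({"x": list("abcdef")})

df["id_list"] = list(range(len(df)))   # original: materializes a full Python list
df["id_np"] = np.arange(len(df))       # vectorized NumPy range, one contiguous array
df["id_ri"] = pd.RangeIndex(len(df))   # pandas range type, O(1) to construct

same = (df["id_list"] == df["id_np"]).all() and (df["id_np"] == df["id_ri"]).all()
print(same)  # True
```

For small frames the difference is negligible; the vectorized forms matter when the row count is large enough that a Python list of `n` boxed ints is measurable overhead.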
             self.row_id_col = "row_id"
