Merge pull request #25 from szepeviktor/typos

dholzmueller · web-flow · commit 5d9e26a39457 · 2025-08-14T12:02:56.000+02:00
Fix typos
diff --git a/docs/source/bench/03_code.md b/docs/source/bench/03_code.md
@@ -14,7 +14,7 @@ a list of the most important hyperparameters.
 
 ## Datasets
 
-We represent our datasets using the `DictDatset` class from `tab_models`.
+We represent our datasets using the `DictDataset` class from `tab_models`.
 These datasets can be loaded as follows:
 
 ```python
diff --git a/docs/source/models/01_sklearn_interfaces.rst b/docs/source/models/01_sklearn_interfaces.rst
@@ -112,7 +112,7 @@ but fails to run predict() due to pytorch-lightning device issues.
 
 .. code-block:: language
     import torch
-    import dill  # might also work with pickle instad
+    import dill  # might also work with pickle instead
     torch.save(model, 'model.pkl', pickle_module=dill, _use_new_zipfile_serialization=False)
     model = torch.load('model.pkl', map_location='cpu', pickle_module=dill)
 
diff --git a/docs/source/models/nn_classes.md b/docs/source/models/nn_classes.md
@@ -35,7 +35,7 @@ for continuous and categorical variables.
 Moreover, during training, we also pass the labels 'y' through the Layer, 
 which allows to implement mixup, label smoothing, 
 and output standardization as Layer objects.
-- `Fitter` classes initialize the NN based on a single foward pass 
+- `Fitter` classes initialize the NN based on a single forward pass 
 on the (subsampled) training (and possibly validation) set. 
 This is done using the `fit()` or `fit_transform()` functions 
 similar to scikit-learn preprocessing classes, 
diff --git a/pytabkit/bench/data/get_uci.py b/pytabkit/bench/data/get_uci.py
@@ -621,7 +621,7 @@ def get_metro_interstate_traffic_volume():
     replace_chars_in_file('metro_interstate_traffic_volume.data', '  ', ' ')
     
     
-    # Now we are in the position ot read the data, convert the time and date, and movel the labels
+    # Now we are in the position to read the data, convert the time and date, and move the labels
     
     
     data = load_raw_data('metro_interstate_traffic_volume_short.data', ',', description_columns = 0, date_column = 16, date_sep = '-', date_order = 'Ymd', time_column = 17, time_sep = ':')
@@ -736,7 +736,7 @@ def get_tarvel_review_ratings():
     prepare_new_data_set_group_id()
     
     
-    # Download the data and correct the mispelling of its name
+    # Download the data and correct the misspelling of its name
     
     download_and_save('http://archive.ics.uci.edu/ml/machine-learning-databases/00485/google_review_ratings.csv', 'travel_review_ratings.data')
     
@@ -1332,8 +1332,8 @@ def get_smartphone_human_activity():
 def get_artificial_characters():
     
     prepare_new_data_set_group_id()
-    #download_and_save('https://archive.ics.uci.edu/ml/machine-learning-databases/artificial-characters/character.tar.Z', 'artficial_characters.tar.Z')
-    #download_and_save('https://archive.ics.uci.edu/ml/machine-learning-databases/artificial-characters/character.names', 'artficial_characters.description')
+    #download_and_save('https://archive.ics.uci.edu/ml/machine-learning-databases/artificial-characters/character.tar.Z', 'artificial_characters.tar.Z')
+    #download_and_save('https://archive.ics.uci.edu/ml/machine-learning-databases/artificial-characters/character.names', 'artificial_characters.description')
 
     print("Artificial Characters is currently not processed since:")
     print("  - the data comes in a rather convoluted form")
@@ -1534,7 +1534,7 @@ def get_thyroids():
     download_and_save('https://archive.ics.uci.edu/ml/machine-learning-databases/thyroid-disease/dis.test', 'thyroid_dis.test.data') 
     download_and_save('https://archive.ics.uci.edu/ml/machine-learning-databases/thyroid-disease/dis.names', 'thyroid_dis.description')
 
-    # new-thyroid.data only contains 215 samples and is thus ommitted
+    # new-thyroid.data only contains 215 samples and is thus omitted
 
     download_and_save('http://archive.ics.uci.edu/ml/machine-learning-databases/thyroid-disease/hypothyroid.data', 'thyroid_hypo.data') 
     download_and_save('http://archive.ics.uci.edu/ml/machine-learning-databases/thyroid-disease/hypothyroid.names', 'thyroid_hypo.description')
@@ -2819,7 +2819,7 @@ def get_wave_energy():
 
     # For each of the 4 data sets, the last column contains the sum of columns 32 to 47.
     # I assume the last column is the label and columns 32 to 47 are intermediate results
-    # and that only the first 32 colums should be used as features.
+    # and that only the first 32 columns should be used as features.
     indices = range(32, 48)
 
     data_adelaide = load_raw_data('WECs_DataSet/Adelaide_Data.csv', sep=',')
diff --git a/pytabkit/bench/scheduling/jobs.py b/pytabkit/bench/scheduling/jobs.py
@@ -17,12 +17,12 @@ def __init__(self, job_id: int, time_s: float,
         """
         :param job_id: Job id.
         :param time_s: Time in seconds that the job ran for.
-        :param oom_cpu: Whether an out-of-memory error occured on the CPU.
-        :param oom_gpu: Whether an out-of-memory error occured on the GPU.
+        :param oom_cpu: Whether an out-of-memory error occurred on the CPU.
+        :param oom_gpu: Whether an out-of-memory error occurred on the GPU.
         :param finished_normally: Whether the job ran normally,
             such that its time and RAM values are representative of how it would normally run.
             For example, if the job ran faster because the results were already partially precomputed,
-            it should not count towards the time estimation. Of course, if an exception occured,
+            it should not count towards the time estimation. Of course, if an exception occurred,
             we should have finished_normally=False.
         :param exception_msg: Exception message (if there was any).
         """
diff --git a/pytabkit/models/alg_interfaces/catboost_interfaces.py b/pytabkit/models/alg_interfaces/catboost_interfaces.py
@@ -252,7 +252,7 @@ def _fit(self, train_ds: DictDataset, val_ds: Optional[DictDataset], params: Dic
             # with these parameters, catboost will reload from the model automatically if it is there
         bst = catboost.CatBoost(params)
         with warnings.catch_warnings():
-            warnings.filterwarnings('ignore', message='Can\'t optimze method "evaluate" because self argument is used')
+            warnings.filterwarnings('ignore', message='Can\'t optimize method "evaluate" because self argument is used')
             bst.fit(self._convert_ds(train_ds), eval_set=None if val_ds is None else self._convert_ds(val_ds))
 
         if val_ds is not None:
diff --git a/pytabkit/models/alg_interfaces/nn_interfaces.py b/pytabkit/models/alg_interfaces/nn_interfaces.py
@@ -307,7 +307,7 @@ def __init__(self, space: Optional[Union[str, Dict[str, Any]]] = None, n_hyperop
             }
             utils.update_dict(default_config, remove_keys=list(space.keys()))
         elif not isinstance(space, dict):
-            print(f'Unkown hyperparameter space: {space}')
+            print(f'Unknown hyperparameter space: {space}')
 
         config = utils.update_dict(default_config, config)
         opt_class = SMACOptimizer if opt_method == 'smac' else HyperoptOptimizer
diff --git a/pytabkit/models/alg_interfaces/other_interfaces.py b/pytabkit/models/alg_interfaces/other_interfaces.py
@@ -1053,7 +1053,7 @@ def fit(self, X, y, X_val, y_val, cat_features: Optional[List[str]] = None):
             'learning_rate_weights': 0.005,  # learning rate for leaf weights
             'learning_rate_index': 0.01,  # learning rate for split indices
             'learning_rate_values': 0.01,  # learning rate for split values
-            'learning_rate_leaf': 0.01,  # learning rate for leafs (logits)
+            'learning_rate_leaf': 0.01,  # learning rate for leaves (logits)
 
             'optimizer': 'adam',  # optimizer
             'cosine_decay_steps': 0,  # decay steps for lr schedule (CosineDecayRestarts)
diff --git a/pytabkit/models/alg_interfaces/tabm_interface.py b/pytabkit/models/alg_interfaces/tabm_interface.py
@@ -334,7 +334,7 @@ def evaluate(part: str) -> float:
         }
         best_params = [p.clone() for p in model.parameters()]
         # Early stopping: the training stops when
-        # there are more than `patience` consequtive bad updates.
+        # there are more than `patience` consecutive bad updates.
         remaining_patience = patience
 
         try:
diff --git a/pytabkit/models/alg_interfaces/xgboost_interfaces.py b/pytabkit/models/alg_interfaces/xgboost_interfaces.py
@@ -498,7 +498,7 @@ def _sample_params(self, is_classification: bool, seed: int, n_train: int):
                 # 'max_bin'  # also makes things slower
             }
         elif hpo_space_name == 'large-v3':
-            # shrunk verion of large-v2: removed gamma, colsample_bytree
+            # shrunk version of large-v2: removed gamma, colsample_bytree
             params = {
                 'n_estimators': 1000,
                 'early_stopping_rounds': 50,
@@ -513,7 +513,7 @@ def _sample_params(self, is_classification: bool, seed: int, n_train: int):
                 'grow_policy': rng.choice(['depthwise', 'lossguide']),
             }
         elif hpo_space_name == 'large-v4':
-            # modified verion of large-v3
+            # modified version of large-v3
             params = {
                 'n_estimators': 1000,
                 'early_stopping_rounds': 50,
@@ -529,7 +529,7 @@ def _sample_params(self, is_classification: bool, seed: int, n_train: int):
                 'max_leaves': round(np.exp(rng.uniform(np.log(2.0), np.log(2048.0))))  # added
             }
         elif hpo_space_name == 'large-v5':
-            # shrunk verion of large-v3 but without the extra stuff from large-v4
+            # shrunk version of large-v3 but without the extra stuff from large-v4
             params = {
                 'n_estimators': 1000,
                 'early_stopping_rounds': 50,
@@ -543,7 +543,7 @@ def _sample_params(self, is_classification: bool, seed: int, n_train: int):
                 'reg_lambda': np.exp(rng.uniform(np.log(1e-3), np.log(20.0))),  # modified
             }
         elif hpo_space_name == 'large-v6':
-            # shrunk verion of large-v4
+            # shrunk version of large-v4
             params = {
                 'n_estimators': 1000,
                 'early_stopping_rounds': 50,
diff --git a/pytabkit/models/nn_models/activations.py b/pytabkit/models/nn_models/activations.py
@@ -31,7 +31,7 @@ def backward(ctx, grad_output):
         return _swish_jit_bwd(x, grad_output)
 
 
-# don't use the optimized version since this seems to behave slighty differently for Pytorch Lightning
+# don't use the optimized version since this seems to behave slightly differently for Pytorch Lightning
 # def swish(x): return _SwishJitAutoFn.apply(x)
 def swish(x): return x * torch.sigmoid(x)
 
@@ -59,7 +59,7 @@ def backward(ctx, grad_output):
         return _mish_jit_bwd(x, grad_output)
 
 
-# don't use the optimized version since this seems to behave slighty differently for Pytorch Lightning
+# don't use the optimized version since this seems to behave slightly differently for Pytorch Lightning
 # def mish(x): return MishJitAutoFn.apply(x)
 def mish(x): return x.mul(torch.tanh(F.softplus(x)))
 
diff --git a/pytabkit/models/nn_models/rtdl_resnet.py b/pytabkit/models/nn_models/rtdl_resnet.py
@@ -796,7 +796,7 @@ class NeuralNetClassifierWrapped(NeuralNetClassifier):
     def __init__(self, *args, **kwargs):
         super().__init__(*args, **kwargs)
         self.categorical_indicator = None
-        self.n_classes = None  # automatically infered from train if not set
+        self.n_classes = None  # automatically inferred from train if not set
 
     def set_categorical_indicator(self, categorical_indicator):
         self.categorical_indicator = categorical_indicator
@@ -843,7 +843,7 @@ def initialize_optimizer_ft_transformer(self, triggered_directly=None):
         Deprecated, don't use it anymore.
 
     """
-    # handle deprecated paramter
+    # handle deprecated parameter
     # if triggered_directly is not None:
     #     warnings.warn(
     #         "The 'triggered_directly' argument to 'initialize_optimizer' is "
diff --git a/pytabkit/models/nn_models/tabm.py b/pytabkit/models/nn_models/tabm.py
@@ -528,7 +528,7 @@ def __init__(
                 else 'normal'
                 if arch_type in ('tabm-mini-normal', 'tabm-normal')
                 # For other arch_types, the initialization depends
-                # on the presense of num_embeddings.
+                # on the presence of num_embeddings.
                 else 'random-signs'
                 if num_embeddings is None
                 else 'normal'
diff --git a/pytabkit/models/nn_models/tabr_lib.py b/pytabkit/models/nn_models/tabr_lib.py
@@ -821,7 +821,7 @@ def cat(data: List[T], /, dim: int = 0) -> T:
     The same works for sequences of named tuples, dataclasses, tensors and
     nested combinations of all mentioned collection types.
 
-    *Below, additinal technical examples are provided.*
+    *Below, additional technical examples are provided.*
 
     The common setup:
 
diff --git a/pytabkit/models/sklearn/sklearn_interfaces.py b/pytabkit/models/sklearn/sklearn_interfaces.py
@@ -136,7 +136,7 @@ def __init__(self, device: Optional[str] = None, random_state: Optional[Union[in
         :param verbosity: Verbosity level (default=0, higher means more verbose).
             Set to 2 to see logs from intermediate epochs.
         :param train_metric_name: Name of the training metric
-            (default='cross_entropy' for clasification and 'mse' for regression).
+            (default='cross_entropy' for classification and 'mse' for regression).
             Currently most other metrics are not available for training.
         :param val_metric_name: Name of the validation metric (used for selecting the best epoch).
             Defaults are 'class_error' for classification and 'rmse' for regression.
diff --git a/pytabkit/models/torch_utils.py b/pytabkit/models/torch_utils.py
@@ -54,7 +54,7 @@ def cat_if_necessary(tensors: List[torch.Tensor], dim: int):
     This can make it faster if no copying behavior is needed.
     :param tensors: Tensors to be concatenated.
     :param dim: Dimension in which the tensor should be concatenated.
-    :return: The concatendated tensor.
+    :return: The concatenated tensor.
     """
     if len(tensors) == 1:
         return tensors[0]
diff --git a/scripts/create_probclass_plots.py b/scripts/create_probclass_plots.py
@@ -98,7 +98,7 @@ def plot_barscatter_ax(ax: plt.Axes, df: pd.DataFrame, xlabel: Optional[str], yl
     hue_order = hues
 
     # Make sure to remove the 'facecolor': 'w' property here, otherwise
-    # the palette gets overrided
+    # the palette gets overridden
     boxprops = {'edgecolor': 'k', 'linewidth': 1}
     lineprops = {'color': 'k', 'linewidth': 1}
 
diff --git a/tests/test_rtdl_nns.py b/tests/test_rtdl_nns.py
@@ -70,9 +70,9 @@
 #     predictions = clf.predict(X_test)
 #     # If no error is raised, the classifier can handle unseen categories
 #
-# @pytest.mark.parametrize("tranformed_target", [True, False])
+# @pytest.mark.parametrize("transformed_target", [True, False])
 # @pytest.mark.parametrize("model_name", ["resnet", "mlp", "ft_transformer"])
-# def test_regressor_numerical_categorical(tranformed_target, model_name):
+# def test_regressor_numerical_categorical(transformed_target, model_name):
 #     # Generate synthetic data with a mix of numerical and categorical features
 #     X, y = make_regression(n_samples=1000, n_features=3, n_informative=2, random_state=43)
 #     cat_feature = np.random.choice([1, 2, 3], size=X.shape[0])
@@ -84,11 +84,11 @@
 #     X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=43)
 #
 #     if model_name == "resnet":
-#         regressor = Resnet_RTDL_D_Regressor(transformed_target=tranformed_target, random_state=41, device="cpu")
+#         regressor = Resnet_RTDL_D_Regressor(transformed_target=transformed_target, random_state=41, device="cpu")
 #     elif model_name == "mlp":
-#         regressor = MLP_RTDL_D_Regressor(transformed_target=tranformed_target, random_state=41, device="cpu")
+#         regressor = MLP_RTDL_D_Regressor(transformed_target=transformed_target, random_state=41, device="cpu")
 #     elif model_name == "ft_transformer":
-#         regressor = FTT_D_Regressor(transformed_target=tranformed_target, random_state=41, device="cpu")
+#         regressor = FTT_D_Regressor(transformed_target=transformed_target, random_state=41, device="cpu")
 #     regressor.fit(X_train, y_train, cat_indicator=cat_features)
 #     predictions = regressor.predict(X_test)
 #
diff --git a/tests/test_tabr.py b/tests/test_tabr.py
@@ -57,8 +57,8 @@
 #     # If no error is raised, the classifier can handle unseen categories
 #
 #
-# @pytest.mark.parametrize("tranformed_target", [True, False])
-# def test_regressor_numerical_categorical(tranformed_target):
+# @pytest.mark.parametrize("transformed_target", [True, False])
+# def test_regressor_numerical_categorical(transformed_target):
 #     # Generate synthetic data with a mix of numerical and categorical features
 #     X, y = make_regression(n_samples=1000, n_features=5, n_informative=3, random_state=42)
 #     cat_feature = np.random.choice([1, 2, 3], size=X.shape[0])
@@ -70,7 +70,7 @@
 #     X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
 #
 #     # Train the regressor
-#     regressor = TabR_S_D_Regressor(n_epochs=20, transformed_target=tranformed_target)
+#     regressor = TabR_S_D_Regressor(n_epochs=20, transformed_target=transformed_target)
 #     regressor.fit(X_train, y_train, cat_features=cat_features)
 #     predictions = regressor.predict(X_test)
 #

Original file line number	Diff line number	Diff line change
`@@ -307,7 +307,7 @@ def __init__(self, space: Optional[Union[str, Dict[str, Any]]] = None, n_hyperop`
`307`	`307`	`}`
`308`	`308`	`utils.update_dict(default_config, remove_keys=list(space.keys()))`
`309`	`309`	`elif not isinstance(space, dict):`
`310`		`- print(f'Unkown hyperparameter space: {space}')`
	`310`	`+ print(f'Unknown hyperparameter space: {space}')`
`311`	`311`
`312`	`312`	`config = utils.update_dict(default_config, config)`
`313`	`313`	`opt_class = SMACOptimizer if opt_method == 'smac' else HyperoptOptimizer`
Original file line number	Diff line number	Diff line change
`@@ -334,7 +334,7 @@ def evaluate(part: str) -> float:`
`334`	`334`	`}`
`335`	`335`	`best_params = [p.clone() for p in model.parameters()]`
`336`	`336`	`# Early stopping: the training stops when`
`337`		- # there are more than `patience` consequtive bad updates.
	`337`	+ # there are more than `patience` consecutive bad updates.
`338`	`338`	`remaining_patience = patience`
`339`	`339`
`340`	`340`	`try:`