NxNiki
diff --git a/‎.gitignore‎
Lines changed: 1 addition & 0 deletions b/‎.gitignore‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎scripts/save_config.py‎
Lines changed: 60 additions & 0 deletions b/‎scripts/save_config.py‎
Lines changed: 60 additions & 0 deletions
diff --git a/‎…vie_decoding/dataloader/save_patients.py‎ ‎scripts/save_patients.py‎src/movie_decoding/dataloader/save_patients.py renamed to scripts/save_patients.py
Lines changed: 1 addition & 3 deletions b/‎…vie_decoding/dataloader/save_patients.py‎ ‎scripts/save_patients.py‎src/movie_decoding/dataloader/save_patients.py renamed to scripts/save_patients.py
Lines changed: 1 addition & 3 deletions
diff --git a/‎src/movie_decoding/batch_main.sh‎
Lines changed: 1 addition & 5 deletions b/‎src/movie_decoding/batch_main.sh‎
Lines changed: 1 addition & 5 deletions
diff --git a/‎src/movie_decoding/config/__init__.py‎ b/‎src/movie_decoding/config/__init__.py‎
diff --git a/‎src/movie_decoding/config/config.py‎
Lines changed: 150 additions & 0 deletions b/‎src/movie_decoding/config/config.py‎
Lines changed: 150 additions & 0 deletions
diff --git a/‎src/movie_decoding/config/file_path.py‎
Lines changed: 8 additions & 0 deletions b/‎src/movie_decoding/config/file_path.py‎
Lines changed: 8 additions & 0 deletions
@@ -34,5 +34,6 @@ src/movie_decoding/__pycache__/
 
 data/
 ._data
+config/*.yaml
 results/
 wandb/
@@ -0,0 +1,60 @@
+"""
+This script is used to define the basic config parameters for a movie decoding project.
+Custom parameters can be added to any of the three fields of config (experiment, model, data).
+"""
+
+from movie_decoding.config.config import ExperimentConfig, PipelineConfig
+from movie_decoding.config.file_path import CONFIG_FILE_PATH, DATA_PATH, RESULT_PATH
+
+if __name__ == "__main__":
+    # Settings for each config section, listed in the order they are applied.
+    model_settings = {
+        "architecture": "multi-vit",
+        "learning_rate": 1e-4,
+        "batch_size": 128,
+        "weight_decay": 1e-4,
+        "epochs": 5,
+        "lr_drop": 50,
+        "validation_step": 25,
+        "early_stop": 75,
+        "num_labels": 8,
+        "merge_label": True,
+        "img_embedding_size": 192,
+        "hidden_size": 256,
+        "num_hidden_layers": 6,
+        "num_attention_heads": 8,
+        "patch_size": (1, 5),
+        "intermediate_size": 192 * 2,
+        "classifier_proj_size": 192,
+    }
+    experiment_settings = {
+        "seed": 42,
+        "use_spike": True,
+        "use_lfp": False,
+        "use_combined": False,
+        "use_shuffle": True,
+        "use_bipolar": False,
+        "use_sleep": False,
+        "use_overlap": False,
+        "use_long_input": False,
+        "use_spontaneous": False,
+        "use_augment": False,
+        "use_shuffle_diagnostic": True,
+        "model_aggregate_type": "sum",
+    }
+    data_settings = {
+        "result_path": str(RESULT_PATH),
+        "spike_path": str(DATA_PATH),
+        "lfp_path": "undefined",
+        "lfp_data_mode": "sf2000-bipolar-region-clean",
+        "spike_data_mode": "notch CAR-quant-neg",
+        "spike_data_mode_inference": "notch CAR-quant-neg",
+        "spike_data_sd": [3.5],
+        "spike_data_sd_inference": 3.5,
+        "use_augment": False,
+        "use_long_input": False,
+        "use_shuffle_diagnostic": False,
+        "model_aggregate_type": "sum",
+        "movie_label_path": str(DATA_PATH / "8concepts_merged.npy"),
+        "movie_sampling_rate": 30,
+    }
+
+    config = PipelineConfig(experiment=ExperimentConfig(name="test", patient=562))
+
+    # setattr() takes the same path as ``section.key = value``, so aliases such
+    # as ``lr_drop`` and undeclared custom parameters are handled by the
+    # section's own attribute-assignment logic.
+    sections = (
+        (config.model, model_settings),
+        (config.experiment, experiment_settings),
+        (config.data, data_settings),
+    )
+    for section, settings in sections:
+        for key, value in settings.items():
+            setattr(section, key, value)
+
+    # Write the assembled configuration into the project's config directory.
+    config.export_config(CONFIG_FILE_PATH)
@@ -5,11 +5,9 @@
 import numpy as np
 import pandas as pd
 
+from movie_decoding.config.file_path import PATIENTS_FILE_PATH, SURROGATE_FILE_PATH
 from movie_decoding.dataloader.patients import Patients
 
-PATIENTS_FILE_PATH = Path(__file__).resolve().parents[3] / "data/patients"
-SURROGATE_FILE_PATH = Path(__file__).resolve().parents[3] / "data/surrogate_windows"
-
 
 def read_annotation(annotation_file: str) -> List[int]:
     """
 
@@ -1,4 +1,3 @@
-### common_average_job.sh START ###
 #!/bin/bash
 #$ -cwd
 # error = Merged with joblog
@@ -30,7 +29,7 @@ conda activate movie_decoding
 
 # in the following two lines substitute the command with the
 # needed command below:
-python main.py 
+python main.py
 
 # echo job info on joblog:
 echo "Job $JOB_ID ended on:   " `hostname -s`
@@ -39,6 +38,3 @@ echo " "
 ### extract_clusterless_parallel.job STOP ###
 # this site shows how to do array jobs: https://info.hpc.sussex.ac.uk/hpc-guide/how-to/array.html
 # (better than the Hoffman site https://www.hoffman2.idre.ucla.edu/Using-H2/Computing/Computing.html#how-to-build-a-submission-script)
-
-
- 
@@ -0,0 +1,150 @@
+from datetime import datetime
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Tuple, Union
+
+import yaml
+from pydantic import BaseModel, Field
+
+
+class BaseConfig(BaseModel):
+    """Pydantic model that also supports aliases and free-form parameters.
+
+    Declared fields behave like ordinary pydantic fields. A name listed in
+    ``alias`` is redirected to the field it maps to, and any other name
+    assigned on an instance is stored in ``param``. Values can be read and
+    written with attribute syntax (``cfg.lr``) or item syntax (``cfg["lr"]``).
+    """
+
+    # Maps an alternative name to the declared field name it stands for.
+    alias: Dict[str, str] = {}
+    # Custom parameters that are not declared as fields.
+    param: Dict[str, Any] = {}
+
+    def __getitem__(self, key: str) -> Any:
+        """Return the custom parameter, field, or aliased field named ``key``.
+
+        Raises:
+            AttributeError: If ``key`` matches nothing on this config.
+        """
+        if key in self.param:
+            return self.param[key]
+        return getattr(self, key)
+
+    def __setitem__(self, key: str, value: Any) -> None:
+        """Assign ``value`` to ``key`` exactly as ``self.<key> = value`` would."""
+        # Delegating to attribute assignment keeps alias resolution in one
+        # place: ``cfg["lr"] = x`` updates the aliased field instead of
+        # creating a custom parameter that would shadow it on item reads.
+        setattr(self, key, value)
+
+    def __getattr__(self, name: str) -> Any:
+        """Resolve aliases and custom parameters once normal lookup has failed.
+
+        Raises:
+            AttributeError: If ``name`` is neither an alias nor a custom parameter.
+        """
+        # Read the instance dict directly. Going through ``self.alias`` or
+        # ``self.param`` would re-enter this method without end whenever those
+        # fields are not populated yet (e.g. on a half-constructed instance).
+        state = self.__dict__
+        aliases = state.get("alias") or {}
+        if name in aliases:
+            return getattr(self, aliases[name])
+        params = state.get("param") or {}
+        if name in params:
+            return params[name]
+        raise AttributeError(f"'{type(self).__name__}' object has no attribute '{name}'")
+
+    def __setattr__(self, name: str, value: Any) -> None:
+        """Set a declared field (directly or via its alias) or a custom parameter."""
+        name = self.alias.get(name, name)
+
+        # ``model_fields`` is looked up on the class; instance access is
+        # deprecated in recent pydantic releases.
+        if name in type(self).model_fields:
+            super().__setattr__(name, value)
+        else:
+            # Anything that is not a declared field is kept as a custom parameter.
+            self.param[name] = value
+
+    def __contains__(self, key: str) -> bool:
+        """Return True if ``key`` is a custom parameter or any reachable attribute."""
+        return key in self.param or hasattr(self, key)
+
+
+class ExperimentConfig(BaseConfig):
+    """
+    Configuration describing the experiment.
+
+    Only ``name`` and ``patient`` are declared fields; any other attribute
+    assigned on an instance is kept as a custom parameter by ``BaseConfig``.
+    """
+
+    # Experiment label; it also becomes part of the exported config file name.
+    name: Optional[str] = None
+    # A single patient id or a list of patient ids.
+    patient: Optional[Union[List[int], int]] = None
+
+
+class ModelConfig(BaseConfig):
+    """Model-related settings (architecture name, optimisation and size parameters).
+
+    ``lr`` and ``lr_drop`` are short names for ``learning_rate`` and
+    ``learning_rate_drop``; both spellings are accepted when constructing,
+    reading, and assigning.
+    """
+
+    # The pydantic aliases on the fields below would otherwise make ``lr`` /
+    # ``lr_drop`` the only accepted constructor keys. A config written with
+    # ``model_dump()`` is keyed by field name, so without this option its
+    # ``learning_rate`` / ``learning_rate_drop`` entries would be silently
+    # ignored when the file is loaded again and the defaults used instead.
+    model_config = {"populate_by_name": True}
+
+    name: Optional[str] = None
+    learning_rate: Optional[float] = Field(1e-4, alias="lr")
+    learning_rate_drop: Optional[int] = Field(50, alias="lr_drop")
+    batch_size: Optional[int] = 128
+    epochs: Optional[int] = 100
+    hidden_size: Optional[int] = 192
+    num_hidden_layers: Optional[int] = 4
+    num_attention_heads: Optional[int] = 6
+    patch_size: Optional[Tuple[int, int]] = None
+
+    # Attribute/item-level aliases resolved by ``BaseConfig``.
+    alias: Dict[str, str] = {
+        "lr": "learning_rate",
+        "lr_drop": "learning_rate_drop",
+    }
+
+
+class DataConfig(BaseConfig):
+    # Configuration describing the input data. Undeclared attributes assigned
+    # on an instance are kept as custom parameters by ``BaseConfig``.
+
+    # Label for the kind of data; it also becomes part of the exported config file name.
+    data_type: Optional[str] = None
+    # NOTE(review): presumably a threshold in standard deviations - confirm with the data loader.
+    sd: Optional[float] = None
+    # Both paths accept either a string or a ``pathlib.Path``.
+    root_path: Optional[Union[str, Path]] = None
+    data_path: Optional[Union[str, Path]] = None
+
+
+class PipelineConfig(BaseModel):
+    """Top-level configuration grouping the experiment, model and data sections."""
+
+    experiment: Optional[ExperimentConfig] = ExperimentConfig()
+    model: Optional[ModelConfig] = ModelConfig()
+    data: Optional[DataConfig] = DataConfig()
+
+    @classmethod
+    def read_config(cls, config_file: Union[str, Path]) -> "PipelineConfig":
+        """Read a YAML configuration file and return a ``PipelineConfig``.
+
+        Args:
+            config_file: Path of the YAML file to load.
+
+        Returns:
+            A config built from the file; sections missing from the file keep
+            their defaults.
+        """
+        with open(config_file, "r", encoding="utf-8") as file:
+            # An empty YAML document parses to None, which cannot be unpacked
+            # as keyword arguments; treat it as "no overrides".
+            config_dict = yaml.safe_load(file) or {}
+        return cls(**config_dict)
+
+    def export_config(self, output_file: Union[str, Path] = "config.yaml") -> None:
+        """Write the current configuration to a tagged YAML file.
+
+        Args:
+            output_file: Target file, or a directory (any path without a
+                suffix) in which ``config.yaml`` is used as the base name.
+                The experiment/model/data names and a timestamp are inserted
+                before the extension, and missing parent directories are
+                created.
+        """
+        output_file = Path(output_file)
+
+        # A path without a suffix is treated as a directory.
+        if not output_file.suffix:
+            output_file = output_file / "config.yaml"
+
+        # Insert the tag between the stem and the extension.
+        output_file = output_file.with_name(f"{output_file.stem}{self._file_tag}{output_file.suffix}")
+        output_file.parent.mkdir(parents=True, exist_ok=True)
+
+        with open(output_file, "w", encoding="utf-8") as file:
+            # mode="json" turns values such as Path objects into plain types
+            # that yaml.safe_dump is able to represent.
+            yaml.safe_dump(self.model_dump(mode="json"), file)
+
+    @property
+    def _file_tag(self) -> str:
+        """Return the ``_<experiment>-<model>-<data>_<timestamp>`` file-name tag."""
+        # Use '-' between the time fields: ':' is not allowed in Windows file names.
+        formatted_time = datetime.now().strftime("%Y-%m-%d-%H-%M-%S")
+        return f"_{self.experiment.name}-{self.model.name}-{self.data.data_type}_{formatted_time}"
+
+
+if __name__ == "__main__":
+    # Small demonstration of the config classes; it runs only when this
+    # module is executed directly.
+    pipeline_config = PipelineConfig()
+    pipeline_config.model.name = "vit"
+    pipeline_config.model.learning_rate = 0.001
+    pipeline_config.experiment.name = "movie-decoding"
+
+    # Access and print properties
+    print(f"Experiment Name: {pipeline_config.experiment.name}")
+    print(f"Patient ID: {pipeline_config.experiment.patient}")
+    print(f"Model Name: {pipeline_config.model.name}")
+    print(f"Learning Rate: {pipeline_config.model.learning_rate}")
+    print(f"Batch Size: {pipeline_config.model.batch_size}")
+
+    # Access using aliases: item access and attribute access both resolve
+    # 'lr' to the learning_rate field.
+    print(f"Learning Rate (alias 'lr'): {pipeline_config.model['lr']}")
+    print(f"Learning Rate (alias 'lr'): {pipeline_config.model.lr}")
+
+    # Set new custom parameters: names that are not declared fields are
+    # stored in the section's ``param`` dict.
+    pipeline_config.model["new_param"] = "custom_value"
+    print(f"Custom Parameter 'new_param': {pipeline_config.model['new_param']}")
+    pipeline_config.model.new_param2 = "custom_value"
+    print(f"Custom Parameter 'new_param2': {pipeline_config.model.new_param2}")
+
+    # Try to access a non-existent field (will raise AttributeError)
+    try:
+        print(pipeline_config.model.some_non_existent_field)
+    except AttributeError as e:
+        print(e)
+
+    # Export config: with no argument this writes a tagged, timestamped
+    # "config_<tag>.yaml" relative to the current working directory.
+    pipeline_config.export_config()
@@ -0,0 +1,8 @@
+from pathlib import Path
+
+# Repository root: three levels above the directory that contains this file.
+ROOT_PATH = Path(__file__).resolve().parents[3]
+
+# Top-level project directories.
+CONFIG_FILE_PATH = ROOT_PATH / "config"
+RESULT_PATH = ROOT_PATH / "results"
+DATA_PATH = ROOT_PATH / "data"
+
+# Locations inside the data directory.
+PATIENTS_FILE_PATH = ROOT_PATH / "data/patients"
+SURROGATE_FILE_PATH = ROOT_PATH / "data/surrogate_windows"