Skip to content

Commit 011ce61

Browse files
committed
update project config
1 parent 34ab501 commit 011ce61

File tree

2 files changed

+10
-2
lines changed

2 files changed

+10
-2
lines changed

scripts/2_process_data.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@
2121
train_set, test_set = data_processor.split_data(test_size=0.2, random_state=42)
2222

2323
processed_gcs_bucket_connector = GCSConnector(bucket_name=config.gcs_processed_taxi_data_bucket_name)
24-
train_file_name = "green_taxi_train_set.parquet"
24+
train_file_name = config.train_file_name
2525
processed_gcs_bucket_connector.upload(train_set, train_file_name)
26-
test_file_name = "green_taxi_test_set.parquet"
26+
test_file_name = config.test_file_name
2727
processed_gcs_bucket_connector.upload(test_set, test_file_name)

src/project_config.py

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -16,10 +16,18 @@ class ProjectConfig(BaseModel):
1616
num_features: list[str]
1717
cat_features: Optional[list[str]]
1818
target: list[str]
19+
train_file_name: str
20+
test_file_name: str
21+
experiment_name: str
1922

2023
@classmethod
2124
def from_yaml(cls, config_path: str):
2225
"""Load configuration from yaml file"""
2326
with open(config_path, "r") as f:
2427
config_dict = yaml.safe_load(f)
2528
return cls(**config_dict)
29+
30+
31+
class Tags(BaseModel):
32+
git_sha: str
33+
branch: str

0 commit comments

Comments
 (0)