Skip to content

Commit 616b057

Browse files
authored
Merge pull request #94 from ciaran28/main
Bug Fix: Databricks Workflows
2 parents 883b1f5 + bb01321 commit 616b057

File tree

4 files changed

+54
-38
lines changed

4 files changed

+54
-38
lines changed

.github/workflows/taskDatabricks.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -90,10 +90,10 @@ jobs:
9090
#################################/
9191
## Deploy Azure Infrastructure.
9292
#################################/
93-
- name: Deploy Azure Resources
94-
run: ${{ inputs.SCRIPT_LANGUAGE }} infrastructure/databricks/databricks_utils/${{ inputs.SCRIPT_LANGUAGE }}/utils_create_azure_resources.py
95-
env:
96-
ENVIRONMENT: ${{ inputs.ENVIRONMENT }}
93+
#- name: Deploy Azure Resources
94+
# run: ${{ inputs.SCRIPT_LANGUAGE }} infrastructure/databricks/databricks_utils/${{ inputs.SCRIPT_LANGUAGE }}/utils_create_azure_resources.py
95+
# env:
96+
# ENVIRONMENT: ${{ inputs.ENVIRONMENT }}
9797

9898

9999

data_science/src_nyc_taxi/training/__init__.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -207,8 +207,8 @@ def set_mlflow(
207207
):
208208
if namespace.env is not None:
209209
params = yaml.safe_load(pathlib.Path(namespace.env).read_text())
210-
experiment_name = params['ML_PIPELINE_FILES']['TRAIN_REGISTER']['PARAMETERS']['EXPERIMENT_NAME']
211-
track_in_azure_ml = params['ML_PIPELINE_FILES']['TRAIN_REGISTER']['PARAMETERS']['TRACK_IN_AZURE_ML']
210+
experiment_name = params['Global']['ExperimentName']
211+
track_in_azure_ml = params['Global']['AMLTraking']
212212

213213
if track_in_azure_ml:
214214
if track_in_azure_ml:
Lines changed: 47 additions & 31 deletions
Original file line number | Diff line number | Diff line change
@@ -1,32 +1,48 @@
1-
ModelOne:
2-
objective": "regression"
3-
"metric": "rmse"
4-
"num_leaves": 25
5-
"learning_rate": 0.2
6-
"bagging_fraction": 0.9
7-
"feature_fraction": 0.9
8-
"bagging_seed": 42
9-
"verbosity": -1
10-
"seed": 42
1+
Global:
2+
ExperimentName: "nyc_taxi_dbx_job"
3+
AMLTraking: False
114

12-
ModelTwo:
13-
objective": "regression"
14-
"metric": "rmse"
15-
"num_leaves": 27
16-
"learning_rate": 0.3
17-
"bagging_fraction": 0.9
18-
"feature_fraction": 0.9
19-
"bagging_seed": 42
20-
"verbosity": -1
21-
"seed": 42
22-
23-
ModelThree:
24-
objective": "regression"
25-
"metric": "rmse"
26-
"num_leaves": 30
27-
"learning_rate": 0.4
28-
"bagging_fraction": 0.9
29-
"feature_fraction": 0.9
30-
"bagging_seed": 42
31-
"verbosity": -1
32-
"seed": 42
5+
ModelConfigs: [
6+
{
7+
"ModelName": "ModelOne",
8+
"ModelParams": {
9+
"objective": "regression",
10+
"metric": "rmse",
11+
"num_leaves": 25,
12+
"learning_rate": 0.2,
13+
"bagging_fraction": 0.9,
14+
"feature_fraction": 0.9,
15+
"bagging_seed": 42,
16+
"verbosity": -1,
17+
"seed": 42
18+
}
19+
},
20+
{
21+
"ModelName": "ModelTwo",
22+
"ModelParams": {
23+
"objective": "regression",
24+
"metric": "rmse",
25+
"num_leaves": 27,
26+
"learning_rate": 0.3,
27+
"bagging_fraction": 0.9,
28+
"feature_fraction": 0.9,
29+
"bagging_seed": 42,
30+
"verbosity": -1,
31+
"seed": 42
32+
}
33+
},
34+
{
35+
"ModelName": "ModelThree",
36+
"ModelParams": {
37+
"objective": "regression",
38+
"metric": "rmse",
39+
"num_leaves": 30,
40+
"learning_rate": 0.4,
41+
"bagging_fraction": 0.9,
42+
"feature_fraction": 0.9,
43+
"bagging_seed": 42,
44+
"verbosity": -1,
45+
"seed": 42
46+
}
47+
}
48+
]

mlOps/nyc_taxi/databricks_pipelines/workflow.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ custom:
22

33
# Cluster configs for each environment
44
default-cluster-spec: &default-cluster-spec
5-
spark_version: '11.3.x-cpu-ml-scala2.12'
5+
spark_version: '13.0.x-cpu-ml-scala2.12'
66
node_type_id: 'Standard_DS3_v2'
77
driver_node_type_id: 'Standard_DS3_v2'
88
num_workers: 1

0 commit comments

Comments
 (0)