Skip to content

Commit 5c6d87b

Browse files
committed
Get datasets from web instead of blob
Signed-off-by: Keith Battocchi <[email protected]>
1 parent b0936ac commit 5c6d87b

11 files changed: +16 -16 lines changed

econml/tests/test_dominicks.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@ def test_dominicks():
2020
if not os.path.isfile(file_name):
2121
print("Downloading file (this might take a few seconds)...")
2222
urllib.request.urlretrieve(
23-
"https://msalicedatapublic.blob.core.windows.net/datasets/OrangeJuice/oj_large.csv", file_name)
23+
"https://msalicedatapublic.z5.web.core.windows.net/datasets/OrangeJuice/oj_large.csv", file_name)
2424
oj_data = pd.read_csv(file_name)
2525

2626
brands = sorted(set(oj_data["brand"]))

notebooks/Causal Forest and Orthogonal Random Forest Examples.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1510,7 +1510,7 @@
15101510
"\n",
15111511
"if not os.path.isfile(file_name):\n",
15121512
" print(\"Downloading file (this might take a few seconds)...\")\n",
1513-
" urllib.request.urlretrieve(\"https://msalicedatapublic.blob.core.windows.net/datasets/OrangeJuice/oj_large.csv\", file_name)\n",
1513+
" urllib.request.urlretrieve(\"https://msalicedatapublic.z5.web.core.windows.net/datasets/OrangeJuice/oj_large.csv\", file_name)\n",
15141514
"oj_data = pd.read_csv(file_name)\n",
15151515
"oj_data.head()"
15161516
]

notebooks/CustomerScenarios/Case Study - Customer Segmentation at An Online Media Company - EconML + DoWhy.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -137,7 +137,7 @@
137137
"outputs": [],
138138
"source": [
139139
"# Import the sample pricing data\n",
140-
"file_url = \"https://msalicedatapublic.blob.core.windows.net/datasets/Pricing/pricing_sample.csv\"\n",
140+
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/Pricing/pricing_sample.csv\"\n",
141141
"train_data = pd.read_csv(file_url)"
142142
]
143143
},

notebooks/CustomerScenarios/Case Study - Customer Segmentation at An Online Media Company.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -122,7 +122,7 @@
122122
"execution_count": 2,
123123
"source": [
124124
"# Import the sample pricing data\n",
125-
"file_url = \"https://msalicedatapublic.blob.core.windows.net/datasets/Pricing/pricing_sample.csv\"\n",
125+
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/Pricing/pricing_sample.csv\"\n",
126126
"train_data = pd.read_csv(file_url)"
127127
],
128128
"outputs": [],

notebooks/CustomerScenarios/Case Study - Multi-investment Attribution at A Software Company - EconML + DoWhy.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -128,7 +128,7 @@
128128
"outputs": [],
129129
"source": [
130130
"# Import the sample multi-attribution data\n",
131-
"file_url = \"https://msalicedatapublic.blob.core.windows.net/datasets/ROI/multi_attribution_sample.csv\"\n",
131+
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/ROI/multi_attribution_sample.csv\"\n",
132132
"multi_data = pd.read_csv(file_url)"
133133
]
134134
},

notebooks/CustomerScenarios/Case Study - Multi-investment Attribution at A Software Company.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -107,7 +107,7 @@
107107
"execution_count": 2,
108108
"source": [
109109
"# Import the sample multi-attribution data\n",
110-
"file_url = \"https://msalicedatapublic.blob.core.windows.net/datasets/ROI/multi_attribution_sample.csv\"\n",
110+
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/ROI/multi_attribution_sample.csv\"\n",
111111
"multi_data = pd.read_csv(file_url)"
112112
],
113113
"outputs": [],

notebooks/CustomerScenarios/Case Study - Recommendation AB Testing at An Online Travel Company - EconML + DoWhy.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -150,7 +150,7 @@
150150
"outputs": [],
151151
"source": [
152152
"# Import the sample AB data\n",
153-
"file_url = \"https://msalicedatapublic.blob.core.windows.net/datasets/RecommendationAB/ab_sample.csv\" \n",
153+
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/RecommendationAB/ab_sample.csv\" \n",
154154
"ab_data = pd.read_csv(file_url)"
155155
]
156156
},

notebooks/CustomerScenarios/Case Study - Recommendation AB Testing at An Online Travel Company.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -129,7 +129,7 @@
129129
"execution_count": 2,
130130
"source": [
131131
"# Import the sample AB data\n",
132-
"file_url = \"https://msalicedatapublic.blob.core.windows.net/datasets/RecommendationAB/ab_sample.csv\" \n",
132+
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/RecommendationAB/ab_sample.csv\" \n",
133133
"ab_data = pd.read_csv(file_url)"
134134
],
135135
"outputs": [],

notebooks/CustomerScenarios/Case Study - Using EconML to evaluate the treatment effect of training program - Lalonde dataset.ipynb

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -336,7 +336,7 @@
336336
"# Data\n",
337337
"## female\n",
338338
"### read in and slice data\n",
339-
"female_data = pd.read_csv('https://msalicedatapublic.blob.core.windows.net/datasets/Lalonde/calonico_smith_all.csv')\n",
339+
"female_data = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/calonico_smith_all.csv')\n",
340340
"female_data[\"haschild\"]=(female_data[\"nchildren75\"]>0)*1\n",
341341
"female_data = female_data[pd.notnull(female_data.re75) & pd.notnull(female_data.re79)]\n",
342342
"female_treatment = female_data[female_data.treated==1.].copy()\n",
@@ -349,13 +349,13 @@
349349
"\n",
350350
"## male\n",
351351
"### read in and slice data\n",
352-
"male_data = pd.read_csv('https://msalicedatapublic.blob.core.windows.net/datasets/Lalonde/smith_todd.csv')\n",
352+
"male_data = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/smith_todd.csv')\n",
353353
"male_treatment = male_data[male_data.treated==1.].copy()\n",
354354
"male_control = male_data[male_data.treated==0.].copy()\n",
355-
"male_cps1 = pd.read_csv('https://msalicedatapublic.blob.core.windows.net/datasets/Lalonde/cps_controls.csv')\n",
356-
"male_psid1 = pd.read_csv('https://msalicedatapublic.blob.core.windows.net/datasets/Lalonde/psid_controls.csv')\n",
357-
"male_cps3 = pd.read_csv('https://msalicedatapublic.blob.core.windows.net/datasets/Lalonde/cps_controls3.csv')\n",
358-
"male_psid3 = pd.read_csv('https://msalicedatapublic.blob.core.windows.net/datasets/Lalonde/psid_controls3.csv')\n",
355+
"male_cps1 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/cps_controls.csv')\n",
356+
"male_psid1 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/psid_controls.csv')\n",
357+
"male_cps3 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/cps_controls3.csv')\n",
358+
"male_psid3 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/psid_controls3.csv')\n",
359359
"### some preprocessing\n",
360360
"for df in [male_psid1,male_psid3,male_cps1,male_cps3]:\n",
361361
" df.rename(columns={'treat':'treated', 'education':'educ', 'hispanic':'hisp'}, inplace=True)"

notebooks/Double Machine Learning Examples.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1925,7 +1925,7 @@
19251925
"\n",
19261926
"if not os.path.isfile(file_name):\n",
19271927
" print(\"Downloading file (this might take a few seconds)...\")\n",
1928-
" urllib.request.urlretrieve(\"https://msalicedatapublic.blob.core.windows.net/datasets/OrangeJuice/oj_large.csv\", file_name)\n",
1928+
" urllib.request.urlretrieve(\"https://msalicedatapublic.z5.web.core.windows.net/datasets/OrangeJuice/oj_large.csv\", file_name)\n",
19291929
"oj_data = pd.read_csv(file_name)"
19301930
]
19311931
},

0 commit comments

Comments
 (0)