Skip to content

Commit da45e91

Browse files
authored
update datasets host url for notebooks (#959)
Signed-off-by: kgao <kevin.leo.gao@gmail.com>
1 parent: 7b08a47, commit: da45e91

11 files changed, with 16 additions and 16 deletions.

econml/tests/test_dominicks.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@ def test_dominicks():
1919
if not os.path.isfile(file_name):
2020
print("Downloading file (this might take a few seconds)...")
2121
urllib.request.urlretrieve(
22-
"https://msalicedatapublic.z5.web.core.windows.net/datasets/OrangeJuice/oj_large.csv", file_name)
22+
"https://econmldata.azurewebsites.net/datasets/OrangeJuice/oj_large.csv", file_name)
2323
oj_data = pd.read_csv(file_name)
2424

2525
brands = sorted(set(oj_data["brand"]))

notebooks/Causal Forest and Orthogonal Random Forest Examples.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -1514,7 +1514,7 @@
15141514
"\n",
15151515
"if not os.path.isfile(file_name):\n",
15161516
" print(\"Downloading file (this might take a few seconds)...\")\n",
1517-
" urllib.request.urlretrieve(\"https://msalicedatapublic.z5.web.core.windows.net/datasets/OrangeJuice/oj_large.csv\",\n",
1517+
" urllib.request.urlretrieve(\"https://econmldata.azurewebsites.net/datasets/OrangeJuice/oj_large.csv\",\n",
15181518
" file_name)\n",
15191519
"oj_data = pd.read_csv(file_name)\n",
15201520
"oj_data.head()"

notebooks/CustomerScenarios/Case Study - Customer Segmentation at An Online Media Company - EconML + DoWhy.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -136,7 +136,7 @@
136136
"outputs": [],
137137
"source": [
138138
"# Import the sample pricing data\n",
139-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/Pricing/pricing_sample.csv\"\n",
139+
"file_url = \"https://econmldata.azurewebsites.net/datasets/Pricing/pricing_sample.csv\"\n",
140140
"train_data = pd.read_csv(file_url)"
141141
]
142142
},

notebooks/CustomerScenarios/Case Study - Customer Segmentation at An Online Media Company.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -122,7 +122,7 @@
122122
"outputs": [],
123123
"source": [
124124
"# Import the sample pricing data\n",
125-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/Pricing/pricing_sample.csv\"\n",
125+
"file_url = \"https://econmldata.azurewebsites.net/datasets/Pricing/pricing_sample.csv\"\n",
126126
"train_data = pd.read_csv(file_url)"
127127
]
128128
},

notebooks/CustomerScenarios/Case Study - Multi-investment Attribution at A Software Company - EconML + DoWhy.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -125,7 +125,7 @@
125125
"outputs": [],
126126
"source": [
127127
"# Import the sample multi-attribution data\n",
128-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/ROI/multi_attribution_sample.csv\"\n",
128+
"file_url = \"https://econmldata.azurewebsites.net/datasets/ROI/multi_attribution_sample.csv\"\n",
129129
"multi_data = pd.read_csv(file_url)"
130130
]
131131
},

notebooks/CustomerScenarios/Case Study - Multi-investment Attribution at A Software Company.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -108,7 +108,7 @@
108108
"outputs": [],
109109
"source": [
110110
"# Import the sample multi-attribution data\n",
111-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/ROI/multi_attribution_sample.csv\"\n",
111+
"file_url = \"https://econmldata.azurewebsites.net/datasets/ROI/multi_attribution_sample.csv\"\n",
112112
"multi_data = pd.read_csv(file_url)"
113113
]
114114
},

notebooks/CustomerScenarios/Case Study - Recommendation AB Testing at An Online Travel Company - EconML + DoWhy.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -145,7 +145,7 @@
145145
"outputs": [],
146146
"source": [
147147
"# Import the sample AB data\n",
148-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/RecommendationAB/ab_sample.csv\"\n",
148+
"file_url = \"https://econmldata.azurewebsites.net/datasets/RecommendationAB/ab_sample.csv\"\n",
149149
"ab_data = pd.read_csv(file_url)"
150150
]
151151
},

notebooks/CustomerScenarios/Case Study - Recommendation AB Testing at An Online Travel Company.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -133,7 +133,7 @@
133133
"outputs": [],
134134
"source": [
135135
"# Import the sample AB data\n",
136-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/RecommendationAB/ab_sample.csv\"\n",
136+
"file_url = \"https://econmldata.azurewebsites.net/datasets/RecommendationAB/ab_sample.csv\"\n",
137137
"ab_data = pd.read_csv(file_url)"
138138
]
139139
},

notebooks/CustomerScenarios/Case Study - Using EconML to evaluate the treatment effect of training program - Lalonde dataset.ipynb

+6-6
Original file line number | Diff line number | Diff line change
@@ -337,7 +337,7 @@
337337
"# Data\n",
338338
"## female\n",
339339
"### read in and slice data\n",
340-
"female_data = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/calonico_smith_all.csv')\n",
340+
"female_data = pd.read_csv('https://econmldata.azurewebsites.net/datasets/Lalonde/calonico_smith_all.csv')\n",
341341
"female_data[\"haschild\"]=(female_data[\"nchildren75\"]>0)*1\n",
342342
"female_data = female_data[pd.notnull(female_data.re75) & pd.notnull(female_data.re79)]\n",
343343
"female_treatment = female_data[female_data.treated==1.].copy()\n",
@@ -350,13 +350,13 @@
350350
"\n",
351351
"## male\n",
352352
"### read in and slice data\n",
353-
"male_data = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/smith_todd.csv')\n",
353+
"male_data = pd.read_csv('https://econmldata.azurewebsites.net/datasets/Lalonde/smith_todd.csv')\n",
354354
"male_treatment = male_data[male_data.treated==1.].copy()\n",
355355
"male_control = male_data[male_data.treated==0.].copy()\n",
356-
"male_cps1 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/cps_controls.csv')\n",
357-
"male_psid1 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/psid_controls.csv')\n",
358-
"male_cps3 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/cps_controls3.csv')\n",
359-
"male_psid3 = pd.read_csv('https://msalicedatapublic.z5.web.core.windows.net/datasets/Lalonde/psid_controls3.csv')\n",
356+
"male_cps1 = pd.read_csv('https://econmldata.azurewebsites.net/datasets/Lalonde/cps_controls.csv')\n",
357+
"male_psid1 = pd.read_csv('https://econmldata.azurewebsites.net/datasets/Lalonde/psid_controls.csv')\n",
358+
"male_cps3 = pd.read_csv('https://econmldata.azurewebsites.net/datasets/Lalonde/cps_controls3.csv')\n",
359+
"male_psid3 = pd.read_csv('https://econmldata.azurewebsites.net/datasets/Lalonde/psid_controls3.csv')\n",
360360
"### some preprocessing\n",
361361
"for df in [male_psid1,male_psid3,male_cps1,male_cps3]:\n",
362362
" df.rename(columns={'treat':'treated', 'education':'educ', 'hispanic':'hisp'}, inplace=True)"

notebooks/Double Machine Learning Examples.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -1923,7 +1923,7 @@
19231923
"\n",
19241924
"if not os.path.isfile(file_name):\n",
19251925
" print(\"Downloading file (this might take a few seconds)...\")\n",
1926-
" urllib.request.urlretrieve(\"https://msalicedatapublic.z5.web.core.windows.net/datasets/OrangeJuice/oj_large.csv\",\n",
1926+
" urllib.request.urlretrieve(\"https://econmldata.azurewebsites.net/datasets/OrangeJuice/oj_large.csv\",\n",
19271927
" file_name)\n",
19281928
"oj_data = pd.read_csv(file_name)"
19291929
]

notebooks/Solutions/Causal Interpretation for Employee Attrition Dataset.ipynb

+1-1
Original file line number | Diff line number | Diff line change
@@ -375,7 +375,7 @@
375375
}
376376
],
377377
"source": [
378-
"file_url = \"https://msalicedatapublic.z5.web.core.windows.net/datasets/EmployeeAttrition/Employee-Attrition.csv\"\n",
378+
"file_url = \"https://econmldata.azurewebsites.net/datasets/EmployeeAttrition/Employee-Attrition.csv\"\n",
379379
"attritionData = pd.read_csv(file_url)\n",
380380
"attritionData.head(5)"
381381
]

0 commit comments

Comments (0)