File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 22 "cells" : [
33 {
44 "cell_type" : " markdown" ,
5- "id" : " 342e73df " ,
5+ "id" : " 0 " ,
66 "metadata" : {},
77 "source" : [
88 " # Lifelines Modelling\n " ,
1212 {
1313 "cell_type" : " code" ,
1414 "execution_count" : null ,
15- "id" : " c1dc8173 " ,
15+ "id" : " 1 " ,
1616 "metadata" : {},
1717 "outputs" : [],
1818 "source" : [
2525 },
2626 {
2727 "cell_type" : " markdown" ,
28- "id" : " b457091b " ,
28+ "id" : " 2 " ,
2929 "metadata" : {},
3030 "source" : [
3131 " ## Prepare the Input Data\n " ,
3535 {
3636 "cell_type" : " code" ,
3737 "execution_count" : null ,
38- "id" : " 43c007ae " ,
38+ "id" : " 3 " ,
3939 "metadata" : {},
4040 "outputs" : [],
4141 "source" : [
42- " df = su.read_sales_data()\n " ,
42+ " df = su.read_sales_data(\" ../data/sales_df.csv \" )\n " ,
4343 " len_b = len(df)\n " ,
4444 " df = df.drop_duplicates()\n " ,
4545 " len_a = len(df)\n " ,
4949 },
5050 {
5151 "cell_type" : " markdown" ,
52- "id" : " 55e9800a " ,
52+ "id" : " 4 " ,
5353 "metadata" : {},
5454 "source" : [
5555 " ## Build, Fit, and Rank with the Cox Model\n " ,
5959 {
6060 "cell_type" : " code" ,
6161 "execution_count" : null ,
62- "id" : " 361fe200 " ,
62+ "id" : " 5 " ,
6363 "metadata" : {},
6464 "outputs" : [],
6565 "source" : [
114114 },
115115 {
116116 "cell_type" : " markdown" ,
117- "id" : " eaaab92d " ,
117+ "id" : " 6 " ,
118118 "metadata" : {},
119119 "source" : [
120120 " ## Check Cox Assumptions\n " ,
124124 {
125125 "cell_type" : " code" ,
126126 "execution_count" : null ,
127- "id" : " 8498ea11 " ,
127+ "id" : " 7 " ,
128128 "metadata" : {},
129129 "outputs" : [],
130130 "source" : [
133133 },
134134 {
135135 "cell_type" : " markdown" ,
136- "id" : " d21572b9 " ,
136+ "id" : " 8 " ,
137137 "metadata" : {},
138138 "source" : [
139139 " ## Evaluate Cox Performance\n " ,
143143 {
144144 "cell_type" : " code" ,
145145 "execution_count" : null ,
146- "id" : " c06844c7 " ,
146+ "id" : " 9 " ,
147147 "metadata" : {},
148148 "outputs" : [],
149149 "source" : [
162162 },
163163 {
164164 "cell_type" : " markdown" ,
165- "id" : " c477b0e5 " ,
165+ "id" : " 10 " ,
166166 "metadata" : {},
167167 "source" : [
168168 " ## Compare Weibull and Log-Normal AFT Variants\n " ,
172172 {
173173 "cell_type" : " code" ,
174174 "execution_count" : null ,
175- "id" : " 9308a7a9 " ,
175+ "id" : " 11 " ,
176176 "metadata" : {},
177177 "outputs" : [],
178178 "source" : [
249249 },
250250 {
251251 "cell_type" : " markdown" ,
252- "id" : " 85f53f3a " ,
252+ "id" : " 12 " ,
253253 "metadata" : {},
254254 "source" : [
255255 " We look at recall since we are only interested in a list of customers who will order in a certain interval. We are not actually interested in the absolute order of the priority list. Recall tells us how many of the actual top k have been correctly included in the predicted top k."
258258 {
259259 "cell_type" : " code" ,
260260 "execution_count" : null ,
261- "id" : " 007521ed " ,
261+ "id" : " 13 " ,
262262 "metadata" : {},
263263 "outputs" : [],
264264 "source" : [
282282 ],
283283 "metadata" : {
284284 "kernelspec" : {
285- "display_name" : " sme-kt-zh-collaboration-forecasting" ,
285+ "display_name" : " sme-kt-zh-collaboration-forecasting (3.12.3) " ,
286286 "language" : " python" ,
287287 "name" : " python3"
288288 },
296296 "name" : " python" ,
297297 "nbconvert_exporter" : " python" ,
298298 "pygments_lexer" : " ipython3" ,
299- "version" : " 3.11.14 "
299+ "version" : " 3.12.3 "
300300 }
301301 },
302302 "nbformat" : 4 ,
Original file line number Diff line number Diff line change 22 "cells" : [
33 {
44 "cell_type" : " markdown" ,
5- "id" : " 1y6kpzwajfw " ,
5+ "id" : " 0 " ,
66 "metadata" : {},
77 "source" : [
88 " # RSF Modelling\n " ,
1212 {
1313 "cell_type" : " code" ,
1414 "execution_count" : null ,
15- "id" : " b31030b6 " ,
15+ "id" : " 1 " ,
1616 "metadata" : {},
1717 "outputs" : [],
1818 "source" : [
2727 },
2828 {
2929 "cell_type" : " markdown" ,
30- "id" : " u1in2aq63no " ,
30+ "id" : " 2 " ,
3131 "metadata" : {},
3232 "source" : [
3333 " ## Prepare the Input Data\n " ,
3737 {
3838 "cell_type" : " code" ,
3939 "execution_count" : null ,
40- "id" : " dc65164f " ,
40+ "id" : " 3 " ,
4141 "metadata" : {},
4242 "outputs" : [],
4343 "source" : [
44- " df = su.read_sales_data()\n " ,
44+ " df = su.read_sales_data(\" ../data/sales_df.csv \" )\n " ,
4545 " len_b = len(df)\n " ,
4646 " df = df.drop_duplicates()\n " ,
4747 " len_a = len(df)\n " ,
5151 },
5252 {
5353 "cell_type" : " markdown" ,
54- "id" : " enodf5zrb9r " ,
54+ "id" : " 4 " ,
5555 "metadata" : {},
5656 "source" : [
5757 " ## Feature Engineering\n " ,
6161 {
6262 "cell_type" : " code" ,
6363 "execution_count" : null ,
64- "id" : " 09b14307 " ,
64+ "id" : " 5 " ,
6565 "metadata" : {},
6666 "outputs" : [],
6767 "source" : [
9999 },
100100 {
101101 "cell_type" : " markdown" ,
102- "id" : " vr70gk02d8 " ,
102+ "id" : " 6 " ,
103103 "metadata" : {},
104104 "source" : [
105105 " ## Train / Test Split and Survival Data Preparation\n " ,
109109 {
110110 "cell_type" : " code" ,
111111 "execution_count" : null ,
112- "id" : " pqym5f9y31 " ,
112+ "id" : " 7 " ,
113113 "metadata" : {},
114114 "outputs" : [],
115115 "source" : [
131131 },
132132 {
133133 "cell_type" : " markdown" ,
134- "id" : " oy1837j4h7 " ,
134+ "id" : " 8 " ,
135135 "metadata" : {},
136136 "source" : [
137137 " ## Fit the RSF Model\n " ,
141141 {
142142 "cell_type" : " code" ,
143143 "execution_count" : null ,
144- "id" : " b232d36ftrd " ,
144+ "id" : " 9 " ,
145145 "metadata" : {},
146146 "outputs" : [],
147147 "source" : [
177177 },
178178 {
179179 "cell_type" : " markdown" ,
180- "id" : " l4zik5zvi7o " ,
180+ "id" : " 10 " ,
181181 "metadata" : {},
182182 "source" : [
183183 " ## Evaluate RSF Performance\n " ,
187187 {
188188 "cell_type" : " code" ,
189189 "execution_count" : null ,
190- "id" : " ihs8vbovjn " ,
190+ "id" : " 11 " ,
191191 "metadata" : {},
192192 "outputs" : [],
193193 "source" : [
216216 },
217217 {
218218 "cell_type" : " markdown" ,
219- "id" : " dljgu0g217 " ,
219+ "id" : " 12 " ,
220220 "metadata" : {},
221221 "source" : [
222222 " ## Tune Hyperparameters\n " ,
226226 {
227227 "cell_type" : " code" ,
228228 "execution_count" : null ,
229- "id" : " 9b9e4549 " ,
229+ "id" : " 13 " ,
230230 "metadata" : {},
231231 "outputs" : [],
232232 "source" : [
256256 },
257257 {
258258 "cell_type" : " markdown" ,
259- "id" : " 2hyfphb325k " ,
259+ "id" : " 14 " ,
260260 "metadata" : {},
261261 "source" : [
262262 " ## Evaluate Tuned RSF and Compare\n " ,
266266 {
267267 "cell_type" : " code" ,
268268 "execution_count" : null ,
269- "id" : " 2ybvzmao1vr " ,
269+ "id" : " 15 " ,
270270 "metadata" : {},
271271 "outputs" : [],
272272 "source" : [
290290 },
291291 {
292292 "cell_type" : " markdown" ,
293- "id" : " 15c7317e " ,
293+ "id" : " 16 " ,
294294 "metadata" : {},
295295 "source" : [
296296 " ## Results Discussion Optimized vs Unoptimized\n " ,
300300 {
301301 "cell_type" : " code" ,
302302 "execution_count" : null ,
303- "id" : " a6fl4aargf8 " ,
303+ "id" : " 17 " ,
304304 "metadata" : {},
305305 "outputs" : [],
306306 "source" : [
323323 ],
324324 "metadata" : {
325325 "kernelspec" : {
326- "display_name" : " sme-kt-zh-collaboration-forecasting" ,
326+ "display_name" : " sme-kt-zh-collaboration-forecasting (3.12.3) " ,
327327 "language" : " python" ,
328328 "name" : " python3"
329329 },
337337 "name" : " python" ,
338338 "nbconvert_exporter" : " python" ,
339339 "pygments_lexer" : " ipython3" ,
340- "version" : " 3.11.14 "
340+ "version" : " 3.12.3 "
341341 }
342342 },
343343 "nbformat" : 4 ,
You can’t perform that action at this time.
0 commit comments