Skip to content

Commit 8037583

Browse files
committed
WORKSHOP8: Tweaking the summary slides for the final workshop
1 parent b9d0120 commit 8037583

11 files changed

+127
-72
lines changed

build_models.html

+18-18
Large diffs are not rendered by default.

exploring_graph_data.html

+2-2
Original file line numberDiff line numberDiff line change
@@ -222,7 +222,7 @@ <h2><a href="#content">Alternative Explorations of the Online Retail Dataset</a>
222222
</div>
223223
<div id="postamble" data-toggle="wy-nav-shift" class="status">
224224
<p class="author"><span class="glyphicon glyphicon-user"></span> Mick Cooney <a href="mailto:mickcooney@gmail.com" class="email">mickcooney@gmail.com</a></p>
225-
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: November 23, 2021</p>
225+
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: December 06, 2021</p>
226226
</div>
227227
</div>
228228

@@ -691,7 +691,7 @@ <h1><span class="header-section-number">5</span> R Environment</h1>
691691
## collate en_US.UTF-8
692692
## ctype en_US.UTF-8
693693
## tz Etc/UTC
694-
## date 2021-11-23
694+
## date 2021-12-06
695695
##
696696
## ─ Packages ───────────────────────────────────────────────────────────────────
697697
## package * version date lib source

exploring_retail_data.html

+2-2
Original file line numberDiff line numberDiff line change
@@ -283,7 +283,7 @@ <h2><a href="#content">Exploring the Online Retail Dataset</a></h2>
283283
</div>
284284
<div id="postamble" data-toggle="wy-nav-shift" class="status">
285285
<p class="author"><span class="glyphicon glyphicon-user"></span> Mick Cooney <a href="mailto:mickcooney@gmail.com" class="email">mickcooney@gmail.com</a></p>
286-
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: November 23, 2021</p>
286+
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: December 06, 2021</p>
287287
</div>
288288
</div>
289289

@@ -1978,7 +1978,7 @@ <h1><span class="header-section-number">11</span> R Environment</h1>
19781978
## collate en_US.UTF-8
19791979
## ctype en_US.UTF-8
19801980
## tz Etc/UTC
1981-
## date 2021-11-23
1981+
## date 2021-12-06
19821982
##
19831983
## ─ Packages ───────────────────────────────────────────────────────────────────
19841984
## package * version date lib source

exploring_retail_dataexplorer.html

+2-2
Original file line numberDiff line numberDiff line change
@@ -218,7 +218,7 @@ <h2><a href="#content">Exploring the Cleaned Online Retail Dataset with DataExpl
218218
</div>
219219
<div id="postamble" data-toggle="wy-nav-shift" class="status">
220220
<p class="author"><span class="glyphicon glyphicon-user"></span> Mick Cooney <a href="mailto:mickcooney@gmail.com" class="email">mickcooney@gmail.com</a></p>
221-
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: November 23, 2021</p>
221+
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: December 06, 2021</p>
222222
</div>
223223
</div>
224224

@@ -337,7 +337,7 @@ <h1><span class="header-section-number">4</span> R Environment</h1>
337337
## collate en_US.UTF-8
338338
## ctype en_US.UTF-8
339339
## tz Etc/UTC
340-
## date 2021-11-23
340+
## date 2021-12-06
341341
##
342342
## ─ Packages ───────────────────────────────────────────────────────────────────
343343
## package * version date lib source

initial_arules_models.html

+11-11
Large diffs are not rendered by default.

initial_btyd_models.html

+2-2
Original file line numberDiff line numberDiff line change
@@ -240,7 +240,7 @@ <h2><a href="#content">Using Buy-Till-You-Die (BTYD) Models on the Online Retail Da
240240
</div>
241241
<div id="postamble" data-toggle="wy-nav-shift" class="status">
242242
<p class="author"><span class="glyphicon glyphicon-user"></span> Mick Cooney <a href="mailto:mickcooney@gmail.com" class="email">mickcooney@gmail.com</a></p>
243-
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: November 23, 2021</p>
243+
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: December 06, 2021</p>
244244
</div>
245245
</div>
246246

@@ -1205,7 +1205,7 @@ <h1><span class="header-section-number">5</span> R Environment</h1>
12051205
## collate en_US.UTF-8
12061206
## ctype en_US.UTF-8
12071207
## tz Etc/UTC
1208-
## date 2021-11-23
1208+
## date 2021-12-06
12091209
##
12101210
## ─ Packages ───────────────────────────────────────────────────────────────────
12111211
## package * version date lib source

initial_rfm_models.html

+2-2
Original file line numberDiff line numberDiff line change
@@ -229,7 +229,7 @@ <h2><a href="#content">Using RFM Models on the Online Retail Dataset</a></h2>
229229
</div>
230230
<div id="postamble" data-toggle="wy-nav-shift" class="status">
231231
<p class="author"><span class="glyphicon glyphicon-user"></span> Mick Cooney <a href="mailto:mickcooney@gmail.com" class="email">mickcooney@gmail.com</a></p>
232-
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: November 23, 2021</p>
232+
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: December 06, 2021</p>
233233
</div>
234234
</div>
235235

@@ -651,7 +651,7 @@ <h1><span class="header-section-number">4</span> R Environment</h1>
651651
## collate en_US.UTF-8
652652
## ctype en_US.UTF-8
653653
## tz Etc/UTC
654-
## date 2021-11-23
654+
## date 2021-12-06
655655
##
656656
## ─ Packages ───────────────────────────────────────────────────────────────────
657657
## package * version date lib source

initial_timeseries_models.html

+2-2
Original file line numberDiff line numberDiff line change
@@ -217,7 +217,7 @@ <h2><a href="#content">Time Series Analysis of the Online Retail Dataset</a></h2
217217
</div>
218218
<div id="postamble" data-toggle="wy-nav-shift" class="status">
219219
<p class="author"><span class="glyphicon glyphicon-user"></span> Mick Cooney <a href="mailto:mickcooney@gmail.com" class="email">mickcooney@gmail.com</a></p>
220-
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: November 23, 2021</p>
220+
<p class="date"><span class="glyphicon glyphicon-calendar"></span> Last updated: December 06, 2021</p>
221221
</div>
222222
</div>
223223

@@ -443,7 +443,7 @@ <h1><span class="header-section-number">3</span> R Environment</h1>
443443
## collate en_US.UTF-8
444444
## ctype en_US.UTF-8
445445
## tz Etc/UTC
446-
## date 2021-11-23
446+
## date 2021-12-06
447447
##
448448
## ─ Packages ───────────────────────────────────────────────────────────────────
449449
## package * version date lib source

retrieve_retail_data.html

+1-1
Original file line numberDiff line numberDiff line change
@@ -326,7 +326,7 @@ <h1><span class="header-section-number">2</span> R Environment</h1>
326326
## collate en_US.UTF-8
327327
## ctype en_US.UTF-8
328328
## tz Etc/UTC
329-
## date 2021-11-23
329+
## date 2021-12-06
330330
##
331331
## ─ Packages ───────────────────────────────────────────────────────────────────
332332
## package * version date lib source

summary_slides.Rmd

+51-15
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
---
22
title: "Project Overview: Results and Conclusions"
33
author: "Mick Cooney <mickcooney@gmail.com>"
4-
date: "Wednesday, 8 December 2021"
4+
date: "Monday, 6 December 2021"
55
output:
66
revealjs::revealjs_presentation:
77
theme: night
@@ -66,6 +66,21 @@ product_group_tokens_tbl <- read_rds("data/product_group_tokens_tbl.rds")
6666
```
6767

6868

69+
# Key Findings
70+
71+
---
72+
73+
Information in data
74+
75+
\
76+
77+
RFM modelling is useful
78+
79+
\
80+
81+
More work to be done
82+
83+
6984

7085
# Transaction Data
7186

@@ -140,17 +155,21 @@ ggplot(plot_tbl, aes(x = invoice_date, y = customer_id, group = customer_id)) +
140155

141156

142157
```{r plot_customer_segment_count, echo=FALSE}
158+
n_customer <- customer_segments_tbl %>% nrow()
159+
143160
plot_tbl <- customer_segments_tbl %>%
144161
count(segment, name = "count", sort = TRUE)
145162
146163
ggplot(plot_tbl) +
147164
geom_col(aes(x = segment, y = count, fill = segment)) +
165+
scale_y_continuous(labels = label_comma()) +
148166
scale_fill_brewer(type = "qual", palette = "Set1") +
149167
labs(
150-
x = "Segment",
151-
y = "Count"
168+
x = "Segment",
169+
y = "Count",
170+
title = "RFM Modelling Segmentation Sizes",
171+
subtitle = glue("{cust_count} Customers", cust_count = label_comma()(n_customer))
152172
) +
153-
ggtitle("RFM Modelling Segmentation Sizes") +
154173
theme(
155174
axis.text.x = element_text(angle = 20, vjust = 0.5),
156175
legend.position = "none"
@@ -185,7 +204,7 @@ segment_plot <- ggplot(plot_tbl) +
185204
x = "Customer Segment",
186205
y = "Value"
187206
) +
188-
ggtitle("Segmentation Metrics for Recent Data") +
207+
ggtitle("Segmentation Metrics for Validation Data") +
189208
theme(
190209
axis.text.x = element_text(angle = 20, vjust = 0.5, size = 8),
191210
legend.position = "none"
@@ -209,16 +228,20 @@ segment_plot + scale_y_log10(labels = label_comma())
209228
---
210229

211230
```{r plot_product_group_splits, echo=FALSE}
231+
n_product <- product_group_tnxgroups_tbl %>% nrow()
232+
212233
plot_tbl <- product_group_tnxgroups_tbl %>%
213234
count(product_group, name = "cluster_count")
214235
215236
ggplot(plot_tbl) +
216237
geom_col(aes(x = product_group, y = cluster_count)) +
238+
scale_y_continuous(labels = label_comma()) +
217239
labs(
218-
x = "Product Group",
219-
y = "Cluster Size"
220-
) +
221-
ggtitle("Product Cluster Sizes")
240+
x = "Product Group",
241+
y = "Cluster Size",
242+
title = "Product Cluster Sizes",
243+
subtitle = glue("{prod_count} Unique Products", prod_count = label_comma()(n_product))
244+
)
222245
```
223246

224247
---
@@ -258,18 +281,31 @@ wc_plot %>% plot()
258281

259282
---
260283

261-
* Lack of stakeholder input
262-
* Returns not properly analysed
263-
* RFM Models are simplistic
264-
* Clustering requires more work
265-
* Product data lacks depth
284+
Lack of stakeholder input
285+
286+
\
266287

288+
Sales returns not analysed properly
267289

290+
\
268291

269-
# Thank You
292+
Product data lacks depth
270293

271294
---
272295

296+
RFM models are simplistic (BTYD worth exploring)
297+
298+
\
299+
300+
Clustering can be expanded
301+
302+
303+
304+
305+
## Thank You
306+
307+
\
308+
273309

274310
mickcooney@gmail.com
275311

summary_slides.html

+34-15
Large diffs are not rendered by default.

0 commit comments

Comments
 (0)