This time I am sharing an analysis of the most popular movies / TV shows across Netflix, Disney+, Hulu and HBOmax on a weekly basis, instead of daily, in the hope of catching trends better.
So, let's count how many movies made the Top5; I assume it is fewer than 5 * 60…
library(tidyverse)
library(gt)

# Display names of the platforms; used later as the column names of the
# summary table, so the order here must match the order of the counts.
platforms <- c("Disney+", "HBOmax", "Hulu", "Netflix")

# additionally, load CSV data using readr

# Wrangle raw data – reverse (fresh date first), take top 5, take last 60 days
# Keep the five top-ranked rows for the 60 most recent days of one platform's
# ranking grid. rev() on a data frame reverses the column order, so this
# assumes one column per day with the oldest day first — TODO confirm.
take_recent_top5 <- function(raw_dt) {
  raw_dt %>%
    rev() %>%
    slice(1:5) %>%
    select(1:60)
}

# NOTE(review): the right-hand sides of these assignments were lost when the
# post was extracted (only fragments like `fjune_dt % rev () ...` survived).
# The raw input names used below (fjune, fdjune, hdjune, hulu) are assumed
# from the `_dt` naming — confirm them against the readr loading code.
fjune_dt <- take_recent_top5(fjune) # Netflix
fdjune_dt <- take_recent_top5(fdjune) # Disney+
hdjune_dt <- take_recent_top5(hdjune) # HBO Max
hulu_dt <- take_recent_top5(hulu) # Hulu

# Gather it together and count the number of unique titles in Top5 for 60 days
# Reshape each platform's Top5 grid to long format; gather() with no column
# selection stacks every column into a `key` / `value` pair, so `value` holds
# the titles.
fjune_dt_gathered <- gather(fjune_dt)
fdjune_dt_gathered <- gather(fdjune_dt)
hdjune_dt_gathered <- gather(hdjune_dt)
hulu_dt_gathered <- gather(hulu_dt)

# Number of distinct titles per platform.
# NOTE(review): the `<- unique(...) %>` part of these four assignments was
# lost in extraction; it is reconstructed here from the surrounding text
# ("count the number of unique titles") — confirm against the original script.
unique_fjune_gathered <- unique(fjune_dt_gathered$value) %>% length()
unique_fdjune_gathered <- unique(fdjune_dt_gathered$value) %>% length()
unique_hdjune_gathered <- unique(hdjune_dt_gathered$value) %>% length()
unique_hulu_gathered <- unique(hulu_dt_gathered$value) %>% length()

# Assemble a one-row data frame; the order of the counts must match `platforms`
# (Disney+, HBOmax, Hulu, Netflix).
unique_gathered <- c(
  unique_fdjune_gathered,
  unique_hdjune_gathered,
  unique_hulu_gathered,
  unique_fjune_gathered
)
unique_gathered <- as.data.frame(t(unique_gathered), stringsAsFactors = FALSE)
colnames(unique_gathered) <- platforms

# Let's make a nice table for the results
# Render the per-platform counts as a gt table with colored column labels.
# NOTE(review): the `<- gt(unique_gathered) %>%` part of this assignment was
# lost in extraction and is reconstructed here — confirm against the original.
unique_gathered_gt <- gt(unique_gathered) %>%
  tab_header(title = "Number of unique movies (titles) in Top5") %>%
  tab_style(
    style = list(cell_text(color = "purple")),
    locations = cells_column_labels(columns = vars(HBOmax))
  ) %>%
  tab_style(
    style = list(cell_text(color = "green")),
    locations = cells_column_labels(columns = vars(Hulu))
  ) %>%
  tab_style(
    style = list(cell_text(color = "red")),
    locations = cells_column_labels(columns = vars(Netflix))
  )

# Print the table.
unique_gathered_gt
data:image/s3,"s3://crabby-images/b5797/b57972e5af04940a0f88e6a96ff2abd2030b3a6b" alt=""
Using similar code, we can count the number of unique titles that were #1 for one or more days.
data:image/s3,"s3://crabby-images/63cef/63cef853fc4a3edca29fe22b4dfaad3400bc9c37" alt=""
Which movie stayed the longest in the Top5 / at #1?
# Top5: for each platform, count how many times every title appears in the
# gathered Top5 data and order the counts from most to least frequent.
table_fjune_top5 <- sort(table(fjune_dt_gathered$value), decreasing = TRUE)
table_fdjune_top5 <- sort(table(fdjune_dt_gathered$value), decreasing = TRUE)
table_hdjune_top5 <- sort(table(hdjune_dt_gathered$value), decreasing = TRUE)
table_hulu_top5 <- sort(table(hulu_dt_gathered$value), decreasing = TRUE)

# Plotting the results
# Draw a bar chart of the `n` most frequent titles in `counts` (a table sorted
# in decreasing order) and print each count just above its bar.
#
# counts  sorted frequency table of titles
# main    plot title
# col     bar color
# n       maximum number of bars; fewer are drawn when `counts` is shorter,
#         instead of padding the chart with NA bars
# ylim    y-axis range; the upper limit leaves room for a label placed at
#         count + 2 even when a title was present on all 60 days
# ...     further arguments passed on to barplot() (e.g. cex.names)
#
# Returns (invisibly) the bar midpoints reported by barplot().
plot_days_in_top <- function(counts, main, col, n = 5, ylim = c(0, 62), ...) {
  top <- counts[seq_len(min(n, length(counts)))]
  mids <- barplot(top, ylim = ylim, main = main, las = 1, col = col, ...)
  text(mids, top + 2, labels = as.character(top))
  invisible(mids)
}

bb5fdjune <- plot_days_in_top(table_fdjune_top5, "Days in Top5, Disney+", "blue")
# HBO Max uses smaller bar labels (cex.names = 0.7).
bb5hdjune <- plot_days_in_top(
  table_hdjune_top5, "Days in Top5, HBO Max", "grey",
  cex.names = 0.7
)
bb5hulu <- plot_days_in_top(table_hulu_top5, "Days in Top5, Hulu", "green")
bb5fjune <- plot_days_in_top(table_fjune_top5, "Days in Top5, Netflix", "red")
data:image/s3,"s3://crabby-images/1640d/1640d9b20395029b75d4d4df4c4c042d57d6930e" alt=""
data:image/s3,"s3://crabby-images/e1e55/e1e55257ca8e891ffb3a3ef43ca518d150fcfaf5" alt=""
data:image/s3,"s3://crabby-images/43239/432395d336ba92ef7e1c4ea207377de955055b61" alt=""
data:image/s3,"s3://crabby-images/cded7/cded70cffa15d950a8de927c9ce6c8d2373488de" alt=""
The same for the movies / TV shows that reached first place in the weekly count
data:image/s3,"s3://crabby-images/fec39/fec391f1523617f636ddfa65b19bba2a9713a790" alt=""
data:image/s3,"s3://crabby-images/d46f8/d46f801423d0cdd9118d7c6602c6c01393be4bf7" alt=""
data:image/s3,"s3://crabby-images/ac7f0/ac7f072b0b4deb3b4fe5e5b629f81fea8d31c101" alt=""
data:image/s3,"s3://crabby-images/51ddb/51ddb860e4d45393c9ad1d880c05f1be5ebe3e07" alt=""
Distribution of the number of days in the top
# top 5
# Convert each frequency table to a data frame; the per-title counts end up in
# the `Freq` column. The argument was previously misspelled
# (`stringsAsFActrors`), so the option never took effect.
ad5_fjune <- as.data.frame(table_fjune_top5, stringsAsFactors = FALSE)
ad5_fdjune <- as.data.frame(table_fdjune_top5, stringsAsFactors = FALSE)
ad5_hdjune <- as.data.frame(table_hdjune_top5, stringsAsFactors = FALSE)
ad5_hulu <- as.data.frame(table_hulu_top5, stringsAsFactors = FALSE)

# Show the four distributions side by side on a shared 0-20 scale, then put
# the previous plot layout back so later plots are not squeezed into a
# 1 x 4 grid.
old_par <- par(mfcol = c(1, 4))
boxplot(ad5_fdjune$Freq, ylim = c(0, 20), main = "Days in Top5, Disney+")
boxplot(ad5_hdjune$Freq, ylim = c(0, 20), main = "Days in Top5, HBO Max")
boxplot(ad5_hulu$Freq, ylim = c(0, 20), main = "Days in Top5, Hulu")
boxplot(ad5_fjune$Freq, ylim = c(0, 20), main = "Days in Top5, Netflix")
par(old_par)
data:image/s3,"s3://crabby-images/765a7/765a73bd42fe5e3948e4fe70229a40538544677c" alt=""
The same for the movies / TV shows that reached first place in the weekly count (#1)
data:image/s3,"s3://crabby-images/127d5/127d50452c9f4c4a55f232b44265296432ed2a0d" alt=""