Le cas de mars 2017

## Loading tidyverse: ggplot2
## Loading tidyverse: tibble
## Loading tidyverse: tidyr
## Loading tidyverse: readr
## Loading tidyverse: purrr
## Loading tidyverse: dplyr
## Conflicts with tidy packages ----------------------------------------------
## filter(): dplyr, stats
## lag():    dplyr, stats
## Parsed with column specification:
## cols(
##   date = col_character(),
##   label = col_character(),
##   nb_visits = col_integer(),
##   entry_nb_visits = col_integer(),
##   exit_nb_visits = col_integer()
## )

sur une plus longue durée ?

## Parsed with column specification:
## cols(
##   year = col_integer(),
##   month = col_character(),
##   label = col_character(),
##   nb_visits = col_integer(),
##   entry_nb_visits = col_integer(),
##   exit_nb_visits = col_integer()
## )
## Warning: 1 parsing failure.
##     row             col               expected actual                                                       file
## 1115205 entry_nb_visits no trailing characters     e3 './data/data.gouv.fr/20140101_20170331_parmois_parurl.csv'

Les blockbusters

urls_mois %>%
  filter(stringr::str_detect(label, "datasets")) %>% 
  filter(!stringr::str_detect(label, "Autres")) %>% 
  filter(nb_visits > 10) %>% 
  mutate(url = stringr::str_replace(label, "fr/datasets/", "")) %>% 
  mutate(url = stringr::str_replace(url, "/index", "")) %>% 
  group_by(url) %>% 
  summarise(nb_visits = round(mean(nb_visits, na.rm = TRUE), digits = 0)) %>%
  mutate(rank = dense_rank(desc(nb_visits))) %>% 
  filter(rank < 500) %>% 
  arrange(desc(nb_visits)) %>% 
  DT::datatable()