library(generalconference)
#> Loading required package: dplyr
#>
#> Attaching package: 'dplyr'
#> The following objects are masked from 'package:stats':
#>
#> filter, lag
#> The following objects are masked from 'package:base':
#>
#> intersect, setdiff, setequal, union
#> Loading required package: furrr
#> Loading required package: future
#> Loading required package: glue
#>
#> Attaching package: 'glue'
#> The following object is masked from 'package:dplyr':
#>
#> collapse
#> Loading required package: purrr
#> Loading required package: stringr
#> Loading required package: readr
#> Loading required package: rvest
#>
#> Attaching package: 'rvest'
#> The following object is masked from 'package:readr':
#>
#> guess_encoding
#> Loading required package: tictoc
#> Loading required package: tidyr
#> Loading required package: xml2
Use the following code for a one-off download of a single conference's sessions and talks:
# Conference to download: `year` and `month` are passed to the scraper and
# also make up the name of the .rds file.
year <- 2021
month <- 4
# Zero-padded two-digit month for the file name, derived from `month` so the
# scraped conference and the file name cannot drift apart (4 -> "04").
mo_str <- sprintf("%02d", month)

# Define the file path
path <- glue("/home/rstudio/generalconference/data/sessions/{year}{mo_str}.rds")

# Scrape the conference. NOTE(review): presumably this writes its result to
# `path`, since the file is read back from there below -- confirm against the
# package documentation.
generalconference::scrape_conference_talks(year, month, path)

# Read the dataframe in
df_conf <- readr::read_rds(path)

# Expand the nested `sessions` and then `talks` columns so that each row is a
# single talk; the result is printed rather than assigned.
df_conf %>%
  unnest(sessions) %>%
  unnest(talks)
#> # A tibble: 37 × 13
#> year month session_name session_id session_url talk_urls talk_session_id
#> <dbl> <dbl> <chr> <int> <chr> <chr> <int>
#> 1 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 1
#> 2 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 2
#> 3 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 3
#> 4 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 4
#> 5 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 5
#> 6 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 6
#> 7 2021 4 Saturday Mor… 1 /study/gener… /study/ge… 7
#> 8 2021 4 Saturday Aft… 2 /study/gener… /study/ge… 1
#> 9 2021 4 Saturday Aft… 2 /study/gener… /study/ge… 2
#> 10 2021 4 Saturday Aft… 2 /study/gener… /study/ge… 3
#> # … with 27 more rows, and 6 more variables: url <chr>, title1 <chr>,
#> # author1 <chr>, author2 <chr>, kicker1 <chr>, paragraphs <list>