Bechdel Test 📽️

Plot No. 1

By Liam Bailey

Plot No. 2

By Long Nguyen

# Load the raw Bechdel-test records. Per `col_types`, the five columns are
# parsed as integer, integer, character, character and integer.
# NOTE(review): the path given to read_csv() is an empty string here; the
# location of the data has to be filled in before this can run.
raw_bechdel <- read_csv("",
  col_types = "iicci"
) %>%
  # Prefix IDs with "tt", but keep missing IDs as NA: paste0() would turn an
  # NA into the bogus literal ID "ttNA".
  mutate(
    imdb_id = if_else(is.na(imdb_id), NA_character_, paste0("tt", imdb_id))
  )

# Look up the genres of every movie and cache the result on disk.
#
# Rows are split into consecutive chunks of up to 1000 and the chunks are
# paired element-wise with `omdb_api_keys` by future_map2_dfr(), so
# `omdb_api_keys` must hold exactly one key per chunk.
bechdel <- raw_bechdel %>%
  # Chunk number derived from the row position of the piped data itself
  # (rows 1-1000 -> 1, rows 1001-2000 -> 2, ...).
  mutate(group = (row_number() - 1L) %/% 1000L + 1L) %>%
  group_split(group) %>%
  future_map2_dfr(.y = omdb_api_keys, ~ mutate(.x, genre = map(
    imdb_id,
    # possibly() turns a failed lookup into NULL for that movie instead of
    # aborting the whole run.
    possibly(function(id) {
      get_genres(find_by_id(id, api_key = .y))
    }, otherwise = NULL)
  ))) %>%
  # The chunk number is only a helper for splitting; drop it again.
  select(-group)

# Persist the enriched data so the lookups do not have to be repeated.
saveRDS(bechdel, here::here("2021_11_bechdel_test/bechdel.RDS"))
# Source:
# Fill palette for the stripes: the ColorBrewer "Reds" ramp in reversed order
# followed by the "Blues" ramp, using entries 2 to 8 of each 9-colour ramp
# (14 colours in total).
stripes_pal <- c(
  brewer_pal(palette = "Reds", direction = -1)(9)[2:8],
  brewer_pal(palette = "Blues")(9)[2:8]
)

# Reload the cached data set from disk
bechdel <- readRDS(here::here("2021_11_bechdel_test/bechdel.RDS"))

# Inspect duplicates: print every row whose (year, title) pair occurs more
# than once; `n` is the number of rows sharing that pair.
filter(add_count(bechdel, year, title), n > 1)
#> # A tibble: 17 x 7
#>     year    id imdb_id     title                  rating genre         n
#>    <int> <int> <chr>       <chr>                   <int> <list>    <int>
#>  1  1931  1985 tt0021814   Dracula                     2 <chr [3]>     2
#>  2  1931  8213 tt0021815   Dracula                     3 <chr [3]>     2
#>  3  1959  9209 tt0053285   Sleeping Beauty             3 <chr [5]>     2
#>  4  1959   474 tt53285     Sleeping Beauty             3 <NULL>        2
#>  5  1983  4449 tt0086425   Terms of Endearment         3 <chr [2]>     2
#>  6  1983  4448 tt0086425   Terms of Endearment         1 <chr [2]>     2
#>  7  1997  4380 tt0117056   Ayneh                       3 <chr [1]>     2
#>  8  1997  4381 tt0117056   Ayneh                       3 <chr [1]>     2
#>  9  2011  4889 tt2043900   Last Call at the Oasis      3 <chr [1]>     2
#> 10  2011  4907 tt2043900   Last Call at the Oasis      3 <chr [1]>     2
#> 11  2014  6000 tt2180411   Into the Woods              3 <chr [5]>     2
#> 12  2014  8702 tt002180411 Into the Woods              3 <NULL>        2
#> 13  2015  6655 tt0810819   The Danish Girl             3 <chr [3]>     2
#> 14  2015  9081 ttNA        The Danish Girl             3 <NULL>        2
#> 15  2017  7241 tt0451279   Wonder Woman                3 <chr [5]>     3
#> 16  2017  9294 ttNA        Wonder Woman                3 <NULL>        3
#> 17  2017  9293 ttNA        Wonder Woman                3 <NULL>        3
# There were actually two different Dracula (Drácula) movies in 1931 :D
# What's up with Terms of Endearment tho?

# Long format with one row per movie-genre pair.
#
# Movies without any genre (NULL or empty list entries) are dropped first,
# then repeated (year, title, rating) combinations are reduced to their first
# row, and finally the `genre` list column is expanded into one row per genre.
bechdel_long <- bechdel %>%
  filter(lengths(genre) > 0) %>%
  distinct(year, title, rating, .keep_all = TRUE) %>%
  tidyr::unnest(genre)

# Number of rows per genre, rarest genres first
bechdel_long %>%
  count(genre) %>%
  arrange(n)
#> # A tibble: 27 x 2
#>    genre           n
#>    <chr>       <int>
#>  1 Game-Show       1
#>  2 Adult           3
#>  3 N/A             5
#>  4 News            8
#>  5 Film-Noir      68
#>  6 Documentary    98
#>  7 Short         121
#>  8 Western       139
#>  9 Sport         185
#> 10 Music         323
#> # … with 17 more rows

# Session-wide ggplot2 theme: a void theme with white text on a black
# background and the legend on top.
# NOTE(review): presumably the "Inter" and "Metropolis" font families must be
# installed and registered with the graphics device - confirm.
theme_set(
  theme_void(base_size = 13, base_family = "Inter Medium") +
    theme(
      text = element_text(colour = "white"),
      legend.position = "top",
      strip.text = element_text(
        family = "Inter Semi Bold",
        size = rel(1),
        margin = margin(b = 1)
      ),
      plot.title = element_text(
        family = "Metropolis Extra Bold",
        size = rel(2)
      ),
      # Text box element so that the long subtitle wraps to the plot width
      plot.subtitle = ggtext::element_textbox_simple(
        size = rel(1.4),
        margin = margin(t = 10, b = 15)
      ),
      plot.caption = element_text(
        margin = margin(t = 20)
      ),
      plot.background = element_rect(fill = "black"),
      plot.margin = margin(15, 20, 15, 20)
    )
)

# "Stripes" plot: one tile per year, filled by the share of rows with
# rating == 3, in one facet per genre plus an "OVERALL" facet.
stripes <- bechdel_long %>%
  # Keep only genres that occur on more than 10 rows
  add_count(genre) %>%
  filter(n > 10) %>%
  mutate(pass = if_else(rating == 3, 1L, 0L)) %>%
  # Duplicate every row in place and relabel the second copy as "OVERALL", so
  # the overall share is summarised alongside the per-genre shares. Indexing
  # by n() uses the row count of the filtered data being piped.
  slice(rep(seq_len(n()), each = 2)) %>%
  mutate(genre = if_else(row_number() %% 2 == 0, "OVERALL", genre)) %>%
  group_by(genre, year) %>%
  summarise(prop_pass = mean(pass)) %>%
  ungroup() %>%
  ggplot(aes(year, 1, fill = prop_pass)) +
  geom_tile() +
  scale_fill_gradientn(
    colours = stripes_pal,
    breaks = c(0, 1),
    labels = label_percent(),
    guide = guide_colourbar(
      title = NULL,
      label.hjust = c(1.5, -.3),
      label.vjust = 6.5,
      barwidth = 7,
      barheight = .3,
      ticks = FALSE
    )
  ) +
  # Facets ordered by mean pass share, with "OVERALL" moved to the end
  facet_wrap(~ fct_reorder(genre, prop_pass, mean) %>%
    fct_relevel("OVERALL", after = Inf),
  ncol = 6
  ) +
  # NOTE(review): the caption reads "IMDb/OMDb & —"; a source name appears to
  # be missing after the "&" - confirm.
  labs(
    title = "Cooling Stripes?",
    subtitle = glue::glue("Percentage of movies having at least two women who talk to each other about something other than a man, {min(bechdel$year)}–{max(bechdel$year)}"),
    caption = "Data: IMDb/OMDb & — Graphic: Long Nguyen (@long39ng) — #TidyTuesday"
  )


