Data

http://langcog.github.io/wordbankr/

Packages

library(tidyverse)
library(wordbankr)
library(here)
# Animal-sound item definitions to keep.
my_sounds <- c("meow", "woof woof", "cockadoodledoo")

# Pull the item table for the English (American) "WG" form and keep only the
# rows whose `definition` is one of the sounds listed in `my_sounds`.
sounds <- filter(
  get_item_data(language = "English (American)", form = "WG"),
  definition %in% my_sounds
)

# Download the responses for just the selected items, asking for the
# administration and item information to be included alongside each response.
sounds_data <- get_instrument_data(
  language = "English (American)",
  form = "WG",
  items = sounds$item_id,
  administrations = TRUE,
  iteminfo = TRUE
) %>%
  mutate(
    # TRUE only when the recorded value is exactly "produces"; a missing
    # value stays NA here.
    produces = value == "produces",
    # A "produces" response also counts as understanding. `%in%` never
    # returns NA, so a missing value yields FALSE.
    understands = value %in% c("produces", "understands")
  ) %>%
  # Discard the rows with no recorded value (those where `produces` is NA).
  filter(!is.na(produces)) %>%
  rename(sound = uni_lemma)

# What proportion of kids at each age understand/produce each word?
# For every age-by-sound cell: tally the `produces` and `understands`
# responses, count the distinct respondents (`data_id`), and divide the
# tallies by that count to get proportions.
sounds_summary <- sounds_data %>%
  group_by(age, sound) %>%
  summarise(
    kids_produce = sum(produces, na.rm = TRUE),
    kids_understand = sum(understands, na.rm = TRUE),
    kids_respond = n_distinct(data_id),
    prop_produce = kids_produce / kids_respond,
    prop_understand = kids_understand / kids_respond
  ) %>%
  # summarise() only removes the last grouping level, so without this the
  # result would stay grouped by `age` and any later verb applied to
  # `sounds_summary` would silently operate per age.
  ungroup()

Now let's export both data frames for the lab.

# Save the row-level data and the per-age summary as CSV files; here::here()
# builds each path from the "data" folder name and the file name.
write_csv(sounds_data, here::here("data", "animal_sounds_data.csv"))
write_csv(sounds_summary, here::here("data", "animal_sounds_summary.csv"))
LS0tCnRpdGxlOiAiTGFiIDAzYTogQW5pbWFsIFdvcmQgQ2xlYW5pbmciCnN1YnRpdGxlOiAiQk1JIDUvNjI1IgphdXRob3I6ICJBbGlzb24gSGlsbCIKb3V0cHV0OgogIGh0bWxfZG9jdW1lbnQ6CiAgICB0aGVtZTogZmxhdGx5CiAgICBjb2RlX2Rvd25sb2FkOiB0cnVlCi0tLQoKYGBge3Igc2V0dXAsIGluY2x1ZGUgPSBGQUxTRSwgY2FjaGUgPSBGQUxTRX0Ka25pdHI6Om9wdHNfY2h1bmskc2V0KGVycm9yID0gVFJVRSwgY29tbWVudCA9IE5BLCB3YXJuaW5nID0gRkFMU0UsIGVycm9ycyA9IEZBTFNFLCBtZXNzYWdlID0gRkFMU0UsIHRpZHkgPSBGQUxTRSwgY2FjaGUgPSBGQUxTRSkKYGBgCgojIERhdGEKaHR0cDovL2xhbmdjb2cuZ2l0aHViLmlvL3dvcmRiYW5rci8KCiMgUGFja2FnZXMKCmBgYHtyfQpsaWJyYXJ5KHRpZHl2ZXJzZSkKbGlicmFyeSh3b3JkYmFua3IpCmxpYnJhcnkoaGVyZSkKYGBgCgpgYGB7cn0KbXlfc291bmRzIDwtIGMoIm1lb3ciLCAid29vZiB3b29mIiwgImNvY2thZG9vZGxlZG9vIikKCiMgZmlyc3QgZ2V0IHRoZSBpdGVtcyBpbiB0aGUgYW5pbWFsIGNhdGVnb3J5CnNvdW5kcyA8LSBnZXRfaXRlbV9kYXRhKGxhbmd1YWdlID0gIkVuZ2xpc2ggKEFtZXJpY2FuKSIsIAogICAgICAgICAgICAgICAgICAgICAgICAgZm9ybSA9ICJXRyIpICU+JQogIGZpbHRlcihkZWZpbml0aW9uICVpbiUgbXlfc291bmRzKSAKCiMgdGhlbiBnZXQgaW5zdHJ1bWVudCBkYXRhIGZvciB0aG9zZSBpdGVtcwpzb3VuZHNfZGF0YSA8LSBnZXRfaW5zdHJ1bWVudF9kYXRhKAogIGxhbmd1YWdlID0gIkVuZ2xpc2ggKEFtZXJpY2FuKSIsCiAgZm9ybSA9ICJXRyIsCiAgaXRlbXMgPSBzb3VuZHMkaXRlbV9pZCwKICBhZG1pbmlzdHJhdGlvbnMgPSBUUlVFLAogIGl0ZW1pbmZvID0gVFJVRQogICkgJT4lIAogIG11dGF0ZShwcm9kdWNlcyA9IHZhbHVlID09ICJwcm9kdWNlcyIsCiAgICAgICAgIHVuZGVyc3RhbmRzID0gY2FzZV93aGVuKAogICAgICAgICAgIHByb2R1Y2VzID09IFRSVUUgfCB2YWx1ZSA9PSAidW5kZXJzdGFuZHMiIH4gVFJVRSwKICAgICAgICAgICBUUlVFIH4gRkFMU0UKICAgICAgICAgKSkgJT4lIAogIGRyb3BfbmEocHJvZHVjZXMpICU+JSAKICByZW5hbWUoc291bmQgPSB1bmlfbGVtbWEpCgojIHdoYXQgcHJvcG9ydGlvbiBvZiBraWRzIGF0IGVhY2ggYWdlIHVuZGVyc3RhbmQvcHJvZHVjZSBlYWNoIHdvcmQ/CnNvdW5kc19zdW1tYXJ5IDwtIHNvdW5kc19kYXRhICU+JSAKICBncm91cF9ieShhZ2UsIHNvdW5kKSAlPiUKICBzdW1tYXJpc2Uoa2lkc19wcm9kdWNlID0gc3VtKHByb2R1Y2VzLCBuYS5ybSA9IFRSVUUpLAogICAgICAgICAgICBraWRzX3VuZGVyc3RhbmQgPSBzdW0odW5kZXJzdGFuZHMsIG5hLnJtID0gVFJVRSksCiAgICAgICAgICAgIGtpZHNfcmVzcG9uZCA9IG5fZGlzdGluY3QoZGF0YV9pZCksCiAgICAgICAgICAgIHByb3BfcHJvZHVjZSA9IGtpZHNfcHJvZHVjZSAvIGtpZHNfcmVzcG9uZCwKICAgICAg
ICAgICAgcHJvcF91bmRlcnN0YW5kID0ga2lkc191bmRlcnN0YW5kIC8ga2lkc19yZXNwb25kKQpgYGAKCgpOb3cgbGV0J3MgZXhwb3J0IGJvdGggZGF0YSBmcmFtZXMgZm9yIHRoZSBsYWIuCgpgYGB7cn0Kd3JpdGVfY3N2KHNvdW5kc19kYXRhLCBoZXJlOjpoZXJlKCJkYXRhIiwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgImFuaW1hbF9zb3VuZHNfZGF0YS5jc3YiKSkKd3JpdGVfY3N2KHNvdW5kc19zdW1tYXJ5LCBoZXJlOjpoZXJlKCJkYXRhIiwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICJhbmltYWxfc291bmRzX3N1bW1hcnkuY3N2IikpCmBgYAoK

Creative Commons License