## ----include = FALSE---------------------------------------------------------- knitr::opts_chunk$set( collapse = TRUE, comment = "#>" ) ## ----setup, include=FALSE----------------------------------------------------- knitr::opts_chunk$set(warning = FALSE, message = FALSE) library(nycOpenData) library(ggplot2) library(dplyr) ## ----small-sample------------------------------------------------------------- small_sample <- nyc_pull_dataset(dataset = "gakf-suji", limit = 3) small_sample # Seeing what columns are in the dataset names(small_sample) ## ----filter-incident---------------------------------------------------------- incident_slash_stab <- nyc_pull_dataset("gakf-suji", limit = 3, filters = list(incident_type = "Stabbing")) head(incident_slash_stab) # Checking to see the filtering worked incident_slash_stab |> distinct(incident_type) ## ----slashing-stabbing-------------------------------------------------------- # Creating the datasets slash <- nyc_pull_dataset("gakf-suji", limit = 50, filters = list(facility = "AMKC", incident_type = "Slashing")) stab <- nyc_pull_dataset("gakf-suji", limit = 50, filters = list(facility = "AMKC", incident_type = "Stabbing")) # Calling head of our new dataset slash |> slice_head(n = 6) stab |> slice_head(n = 6) # Quick check to make sure our filtering worked slash |> summarize(rows = n()) stab |> summarize(rows = n()) ## ----fig.cap="This figure shows incident types by facility."------------------ data <- nyc_pull_dataset("gakf-suji", limit = 100) |> filter(incident_type %in% c("Slashing", "Stabbing")) |> count(incident_type, name = "count") ggplot(data, aes(x = incident_type, y = count)) + geom_col(position = "dodge") + theme_minimal() + labs( title = "Slashing vs Stabbing Incidents by Facility", x = "Incident Type", y = "Number of Incidents", fill = "Facility" )