library(tidyverse)
library(janitor)
library(lubridate)
Combining the Datasets
Set up
Loading the libraries
Importing VERSA
versa_data <- read_rds("data-processed/01-clean-versa.rds") |> glimpse()
Rows: 17,256
Columns: 18
$ primary_key <chr> "TX20234", "TX20234", "TX20235", "TX20237", "TX202…
$ charge <chr> "Poss Marij < 2OZ", "Poss CS PG 2 >= 1G < 4G", "WA…
$ charge_count <dbl> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,…
$ ethnicity <chr> "H", "H", "H", "H", "H", "H", "H", "H", "H", "H", …
$ charge_date <date> 2023-01-03, 2023-01-03, 2023-01-21, 2023-01-22, 2…
$ person_age <dbl> 27, 27, 50, 37, NA, 26, 21, NA, 29, NA, 30, 21, 25…
$ person_first_name <chr> "CRISPIN", "CRISPIN", "MOISES", "FERMIN", "JOSE", …
$ person_second_name <chr> "III", "III", NA, NA, "CARLOS", NA, "GUADALUPE", "…
$ person_third_name <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
$ person_last_name <chr> "MERCADO", "MERCADO", "DE LA CRUZ LOPEZ", "RODRIGU…
$ officer_id <dbl> 15882, 15882, 15969, 15001, 15001, 15001, 15001, 1…
$ arrest_county <chr> "Dimmit", "Dimmit", "Dimmit", "Kinney", "Kinney", …
$ code <chr> "HS", "HS", "CP", "PC", "PC", "PC", "PC", "PC", "P…
$ severity_code <chr> "Versa Misdemeanor Charges", "VT Felony Charges", …
$ severity_code_clean <chr> "Misdemeanor Charges", "Felony Charges", "Federal/…
$ person_race_abbr <chr> "H", "H", "H", "H", "H", "H", "H", "H", "H", "H", …
$ person_gender_abbr <chr> "M", "M", "M", "M", "M", "F", "M", "M", "M", "M", …
$ arrest_state <chr> "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXA…
Import SPURS
spurs_data <- read_rds("data-processed/01-clean-spurs.rds") |> glimpse()
Rows: 41,379
Columns: 19
$ arrest_county <chr> "Aransas", "Bee", "Bee", "Cameron", "Cameron", "Ec…
$ arrest_division <chr> "Texas Highway Patrol", "Texas Highway Patrol", "T…
$ arrest_id <dbl> 209274810, 210182331, 223969513, 213772403, 213772…
$ arrest_state <chr> "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXA…
$ arrest_urn <chr> "CMAR00171811", "CMAR00172979", "CMAR00183927", "C…
$ arresting_officer <chr> "Kaitlynn King", "Luke William Kanz", "Justin K Ja…
$ spurs_officer_id <chr> "Kk26997", "Lk23525", "Jj25825", "Jc05699", "Jc056…
$ statute <chr> "46.02(A)", "481.121(B)(1)", "46.02(A)", "481.121(…
$ code <chr> "Penal Code", "Health And Safety Code", "Penal Cod…
$ inv_number <chr> "2022I-THP3-149480", "2022I-THP3-149608", "2022I-T…
$ severity_code_clean <chr> "Misdemeanor Charges", "Misdemeanor Charges", "Mis…
$ charge <chr> "Unl Carrying Weapon", "Possession Of Marihuana <2…
$ person_first_name <chr> "WESLIN", "JOEL", "JESUS", "SERGIO", "SERGIO", "KI…
$ person_last_name <chr> "LEMKE", "CASAS", "CADENA", "ARMENDAREZ-GARCA", "A…
$ person_age <dbl> 23, 27, 52, 23, 23, 29, 29, 45, 29, 17, 24, 24, 24…
$ charge_date <date> 2022-01-01, 2022-01-01, 2022-01-01, 2022-01-01, 2…
$ person_race_abbr <chr> "W", "H", "H", "H", "H", "H", "H", "H", "H", "H", …
$ person_gender_abbr <chr> "M", "M", "M", "M", "M", "F", "F", "M", "M", "M", …
$ charge_count <dbl> 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1,…
Combine both clean data sets
# Stack the cleaned VERSA rows on top of the cleaned SPURS rows.
# bind_rows() matches columns by name; a column present in only one
# input is filled with NA for the rows that come from the other input.
data_combine <- bind_rows(versa_data, spurs_data)
data_combine
Export combined file
# Save the combined table as an RDS file.
write_rds(data_combine, "data-processed/02-combine.rds")