Combining the Datasets

Set up

Loading the libraries

library(tidyverse)
library(janitor)
library(lubridate)

Importing VERSA

# Read the VERSA file from data-processed/ into `versa_data`, then print a
# column-by-column preview (name, type, first values) to check the load.
versa_data <- read_rds("data-processed/01-clean-versa.rds")
glimpse(versa_data)
Rows: 17,256
Columns: 18
$ primary_key         <chr> "TX20234", "TX20234", "TX20235", "TX20237", "TX202…
$ charge              <chr> "Poss Marij < 2OZ", "Poss CS PG 2 >= 1G < 4G", "WA…
$ charge_count        <dbl> 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,…
$ ethnicity           <chr> "H", "H", "H", "H", "H", "H", "H", "H", "H", "H", …
$ charge_date         <date> 2023-01-03, 2023-01-03, 2023-01-21, 2023-01-22, 2…
$ person_age          <dbl> 27, 27, 50, 37, NA, 26, 21, NA, 29, NA, 30, 21, 25…
$ person_first_name   <chr> "CRISPIN", "CRISPIN", "MOISES", "FERMIN", "JOSE", …
$ person_second_name  <chr> "III", "III", NA, NA, "CARLOS", NA, "GUADALUPE", "…
$ person_third_name   <chr> NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA…
$ person_last_name    <chr> "MERCADO", "MERCADO", "DE LA CRUZ LOPEZ", "RODRIGU…
$ officer_id          <dbl> 15882, 15882, 15969, 15001, 15001, 15001, 15001, 1…
$ arrest_county       <chr> "Dimmit", "Dimmit", "Dimmit", "Kinney", "Kinney", …
$ code                <chr> "HS", "HS", "CP", "PC", "PC", "PC", "PC", "PC", "P…
$ severity_code       <chr> "Versa Misdemeanor Charges", "VT Felony Charges", …
$ severity_code_clean <chr> "Misdemeanor Charges", "Felony Charges", "Federal/…
$ person_race_abbr    <chr> "H", "H", "H", "H", "H", "H", "H", "H", "H", "H", …
$ person_gender_abbr  <chr> "M", "M", "M", "M", "M", "F", "M", "M", "M", "M", …
$ arrest_state        <chr> "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXA…

Importing SPURS

# Read the SPURS file from data-processed/ into `spurs_data`, then print a
# column-by-column preview (name, type, first values) to check the load.
spurs_data <- read_rds("data-processed/01-clean-spurs.rds")
glimpse(spurs_data)
Rows: 41,379
Columns: 19
$ arrest_county       <chr> "Aransas", "Bee", "Bee", "Cameron", "Cameron", "Ec…
$ arrest_division     <chr> "Texas Highway Patrol", "Texas Highway Patrol", "T…
$ arrest_id           <dbl> 209274810, 210182331, 223969513, 213772403, 213772…
$ arrest_state        <chr> "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXAS", "TEXA…
$ arrest_urn          <chr> "CMAR00171811", "CMAR00172979", "CMAR00183927", "C…
$ arresting_officer   <chr> "Kaitlynn King", "Luke William Kanz", "Justin K Ja…
$ spurs_officer_id    <chr> "Kk26997", "Lk23525", "Jj25825", "Jc05699", "Jc056…
$ statute             <chr> "46.02(A)", "481.121(B)(1)", "46.02(A)", "481.121(…
$ code                <chr> "Penal Code", "Health And Safety Code", "Penal Cod…
$ inv_number          <chr> "2022I-THP3-149480", "2022I-THP3-149608", "2022I-T…
$ severity_code_clean <chr> "Misdemeanor Charges", "Misdemeanor Charges", "Mis…
$ charge              <chr> "Unl Carrying Weapon", "Possession Of Marihuana <2…
$ person_first_name   <chr> "WESLIN", "JOEL", "JESUS", "SERGIO", "SERGIO", "KI…
$ person_last_name    <chr> "LEMKE", "CASAS", "CADENA", "ARMENDAREZ-GARCA", "A…
$ person_age          <dbl> 23, 27, 52, 23, 23, 29, 29, 45, 29, 17, 24, 24, 24…
$ charge_date         <date> 2022-01-01, 2022-01-01, 2022-01-01, 2022-01-01, 2…
$ person_race_abbr    <chr> "W", "H", "H", "H", "H", "H", "H", "H", "H", "H", …
$ person_gender_abbr  <chr> "M", "M", "M", "M", "M", "F", "F", "M", "M", "M", …
$ charge_count        <dbl> 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1,…

Combine both cleaned datasets

# Stack the VERSA rows first and the SPURS rows after them. bind_rows()
# matches columns by name, so a column that exists in only one source
# (e.g. `primary_key` in VERSA, `arrest_id` in SPURS) is NA for the rows
# that came from the other source.
# NOTE(review): the previews show `code` abbreviated in VERSA ("HS", "PC")
# but spelled out in SPURS ("Penal Code") -- confirm whether the values
# should be harmonized before analysis.
# NOTE(review): no column records which source a row came from -- confirm
# that downstream steps do not need one.
data_combine <- bind_rows(versa_data, spurs_data)

# Show the combined table as a visual check.
data_combine

Export combined file

# Save the combined table as an RDS file in data-processed/.
write_rds(data_combine, "data-processed/02-combine.rds")