CLiREN-LMS
Data Visualization and Dashboards

Visualizing Missingness and Data Quality

Code Example 1

30-45 minutes Applied Step 6 of 9
Code

Code Example 1

6 / 9
Code

Code Example 1

r

missing_by_variable <- prepared_data |>
  summarise(
    consent_date = sum(is.na(consent_date)),
    age_years = sum(is.na(age_years_derived)),
    day28_outcome = sum(is.na(day28_outcome)),
    discharge_date = sum(is.na(discharge_date))
  ) |>
  pivot_longer(
    cols = everything(),
    names_to = "variable",
    values_to = "missing_count"
  )

missing_by_variable |>
  ggplot(aes(x = reorder(variable, missing_count), y = missing_count)) +
  geom_col() +
  coord_flip() +
  labs(
    title = "Missing Values in Key Variables",
    x = "Variable",
    y = "Missing records"
  )