fixed likert stacked bars

2025-08-08 05:24:09 +00:00 · 2021-12-13 10:31:37 +00:00 · 2021-12-13 10:31:37 +00:00 · 38da21b4b0
commit 38da21b4b0
parent eb62ab07e5
2 changed files with 191 additions and 18 deletions
--- a/TODO.taskpaper
+++ b/TODO.taskpaper
@ -1,12 +1,12 @@
 # Prep work (JK):
-	- JK: aggregation of free-text answers: Q17, Q18 so that they can be used for subsetting
+	- JK: aggregation of free-text answers: Q17, Q18 so that they can be used for subsetting @done

 # Basic summary visualisations (RH):
- Q2 (respondent age)
- Q3 (year of study)
- Q16 (gender identity)
- Q17 (ethnic self-id)
- Q18 (religion)
+- Q2 (respondent age) @done
+- Q3 (year of study) @done
+- Q16 (gender identity) @done
+- Q17 (ethnic self-id) @done
+- Q18 (religion) @done

 # Visualisations of LIKERT responses (RH):
 - For questions Q6 (subject interest) / Q5 (subject knowledge) / Q7 employability prospects: 
@ -27,6 +27,13 @@
 	- Q17
 	- Q18

+# Dataset corrections:
+- typo in Interest_data$InterestinstudyingSociaology
+- adapt Interest_data$InterestedinStudyingPsychology to be consistent and others
+
+# Visualisation formatting:
+- Add colour to bar charts with colorbrewer()
+
 For later:
 - JK: calcuate baseline comparator using UCAS application data for Q5/6, stack with UOB application data for key subjects + 2-3 other samples

--- a/tsr_survey_analysis.Rmd
+++ b/tsr_survey_analysis.Rmd
@ -16,7 +16,7 @@ library(RColorBrewer)
 library("stringr")    # Load stringr package, used for wrapping label text in plots
 library(dplyr)        # Used for filtering below
 library(scales)       # Used for adding percentages to bar charts
-library(kable)        # Used for generating markdown tables
+# library(kable)        # Used for generating markdown tables

 # Define colour palettes for plots below
 coul3 <- brewer.pal(3, "RdYlBu") # Using RdYlBu range to generate 3 colour palette: https://colorbrewer2.org/#type=diverging&scheme=RdYlBu&n=5
@ -25,9 +25,13 @@ TSR_data <- read.csv("./data/TSR data complete.csv")
 subject_data <- read.csv("./data/Subject data.csv")

 # Set up local workspace, as needed:
+
 if (dir.exists("data") == FALSE) {
  dir.create("data") 
 }
+
+# These paths are excluded from github as it is best practice for end-user to generate their own
+
 if (dir.exists("figures") == FALSE) {
  dir.create("figures") 
 }
@ -109,9 +113,9 @@ TSR_data_rs_positive_summaries_ethnicity <- factor(TSR_data_rs_positive$Ethnicit

 TSR_data_rs_positive_summaries_ethnicity <- str_wrap(TSR_data_rs_positive_summaries_ethnicity, width = 30)

-TSR_data__theology_positive_summaries_gender <- factor(TSR_data_theology_positive$Gender, levels = c(1, 2, 3, 4), labels = c("Male", "Female", "I identify my gender in another way", "Prefer not to say"))
+TSR_data_theology_positive_summaries_gender <- factor(TSR_data_theology_positive$Gender, levels = c(1, 2, 3, 4), labels = c("Male", "Female", "I identify my gender in another way", "Prefer not to say"))
 # JK note: using stringr here to wrap axis titles
-TSR_data__theology_positive_summaries_gender <- str_wrap(TSR_data__theology_positive_summaries_gender, width = 10)
+TSR_data_theology_positive_summaries_gender <- str_wrap(TSR_data_theology_positive_summaries_gender, width = 10)

 TSR_data_rs_positive_summaries_gender <- factor(TSR_data_rs_positive$Gender, levels = c(1, 2, 3, 4), labels = c("Male", "Female", "I identify my gender in another way", "Prefer not to say"))
 # JK note: using stringr here to wrap axis titles
@ -180,14 +184,9 @@ ggsave("figures/TSR_data_summaries_ethnicity3.png")
 	- visualisation as summaries for all subjects LIKERT data as stacked bar chart (colours for bar segments from cool to warm)
 	
 ```{r Visualization by Subject}
-### Each Subject is a different column so will need to figure out how to code the columns together into one graph
-  # Higher score indicates less agreement...need to reverse score
-
-## 1=5, 2=4, 3=3, 4=2, 5=1, 6=0 --- Not done yet. See what they look like without reverse scoring

 ## Files have been reverse scored - Higher score now indicates more agreement

-
 #Q5 Subject Knowledge/Understanding
 subject_data$Subject <- factor(subject_data$Subject, levels = c(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12), labels = c("Philosophy", "Sociology", "Psychology", "History", "Ethics", "Theology", "Religious Studies", "Politics", "English", "Math", "Computer Science", "Business"))

@ -216,17 +215,184 @@ employability_bar + labs(title = "please rate ... employability prospects", x =
 # save to png file for reports
 ggsave("figures/TSR_data_subject_employability.png")

-### Categorical Graph ###
+### Likert Stacked Bar Chart ###

-#devtools::install_github('jbryer/likert')
-
-#likert_test <- likert(subject_data)
+# Take selection of data re: understanding
 Understanding_data <- TSR_data[, 6:17]
+# Convert each column to factors
+Understanding_data$GoodunderstandingofPhilosophy = factor(Understanding_data$GoodunderstandingofPhilosophy,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofSociology = factor(Understanding_data$GoodunderstandingofSociology,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofPsychology = factor(Understanding_data$GoodunderstandingofPsychology,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofHistory = factor(Understanding_data$GoodunderstandingofHistory,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofEthics = factor(Understanding_data$GoodunderstandingofEthics,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofTheology = factor(Understanding_data$GoodunderstandingofTheology,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofReligiousStudies = factor(Understanding_data$GoodunderstandingofReligiousStudies,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofPolitics = factor(Understanding_data$GoodunderstandingofPolitics,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofEnglish = factor(Understanding_data$GoodunderstandingofEnglish,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofMath = factor(Understanding_data$GoodunderstandingofMath,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofComputerScience = factor(Understanding_data$GoodunderstandingofComputerScience,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Understanding_data$GoodunderstandingofBusiness = factor(Understanding_data$GoodunderstandingofBusiness,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+names(Understanding_data) <- c("Philosophy", "Sociology", "Psychology", "History", "Ethics", "Theology", "Religious Studies", "Politics", "English", "Math", "Computer Science", "Business")
+
+str(Understanding_data)
+levels(Understanding_data)
+summary(Understanding_data)
 likert_test_understand <- likert(Understanding_data)
+plot(likert_test_understand)
+# save to png file for reports
+ggsave("figures/understanding_likert.png")

 Interest_data <- TSR_data[, 18:29]
+# Convert each column to factors
+Interest_data$InterestinstudyingPhilosophy = factor(Interest_data$InterestinstudyingPhilosophy,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestinstudyingSociaology = factor(Interest_data$InterestinstudyingSociaology,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinStudyingPsychology = factor(Interest_data$InterestedinStudyingPsychology,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingHistory = factor(Interest_data$InterestedinstudyingHistory,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingEthics = factor(Interest_data$InterestedinstudyingEthics,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingTheology = factor(Interest_data$InterestedinstudyingTheology,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingReligiousStudies = factor(Interest_data$InterestedinstudyingReligiousStudies,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingPolitics = factor(Interest_data$InterestedinstudyingPolitics,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingEnglish = factor(Interest_data$InterestedinstudyingEnglish,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingMath = factor(Interest_data$InterestedinstudyingMath,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingComputerScience = factor(Interest_data$InterestedinstudyingComputerScience,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Interest_data$InterestedinstudyingBusiness = factor(Interest_data$InterestedinstudyingBusiness,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+names(Interest_data) <- c("Philosophy", "Sociology", "Psychology", "History", "Ethics", "Theology", "Religious Studies", "Politics", "English", "Math", "Computer Science", "Business")
+
+likert_test_interest <- likert(Interest_data)
+plot(likert_test_interest)
+# save to png file for reports
+ggsave("figures/interest_likert.png")
+

 Employability_data <- TSR_data[, 30:41]
+# Convert each column to factors
+Employability_data$Philosophyemployability = factor(Employability_data$Philosophyemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Sociologyemployability = factor(Employability_data$Sociologyemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$PsychologyEmployability = factor(Employability_data$PsychologyEmployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Historyemployability = factor(Employability_data$Historyemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Ethicsemployability = factor(Employability_data$Ethicsemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Theologyemployability = factor(Employability_data$Theologyemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$ReligiousStudiesemployability = factor(Employability_data$ReligiousStudiesemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Politicsemployability = factor(Employability_data$Politicsemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Englishemployability = factor(Employability_data$Englishemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Mathemployability = factor(Employability_data$Mathemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$ComputerScienceemployability = factor(Employability_data$ComputerScienceemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+Employability_data$Businessemployability = factor(Employability_data$Businessemployability,
+                       ordered = TRUE,
+                       levels = c("1", "2", "3", "4", "5")
+                       )
+names(Employability_data) <- c("Philosophy", "Sociology", "Psychology", "History", "Ethics", "Theology", "Religious Studies", "Politics", "English", "Math", "Computer Science", "Business")
+
+likert_test_employability <- likert(Employability_data)
+plot(likert_test_employability)
+# save to png file for reports
+ggsave("figures/employability_likert.png")
+

 ```