Spaces:

robertvidigal
/

CGD

Sleeping

App Files Files Community

robertvidigal commited on Jan 29

Commit

d86b4f7

verified ·

1 Parent(s): 8ba63ef

Upload 11 files

Browse files

Files changed (12) hide show

.RData +3 -0
.Rhistory +512 -0
.gitattributes +4 -0
.gitignore +8 -1
app.R +1566 -0
cses-shiny.Rproj +17 -0
cses_labs.rds +0 -0
cses_labs_sec.rds +0 -0
cses_shiny_data.rda +3 -0
cses_shiny_data.rds +3 -0
cses_variable_labels.csv +52 -0
world.rda +3 -0

.RData ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1f6725ad5536f6ac30971212826b4956210c8ed27a6f18e7a3a37bcb293557ca
+size 34939611

.Rhistory ADDED Viewed

	@@ -0,0 +1,512 @@

+# REMOVING SOME SPECIFIC CATEGORIES FOR SIMPLICITY OF DATA PRESENTATION
+# # -----------------------------------------------------------------------
+#cses_imd$IMD3010[cses_imd$IMD3010==6]<-3;
+#cses_imd$IMD2004[cses_imd$IMD2004==5]<-NA
+#cses_imd$IMD5007[cses_imd$IMD5007==5]<-0; # 4-point
+#cses_imd$IMD5052_2<-round(cses_imd$IMD5052_2, 1)
+# # -----------------------------------------------------------------------
+# WEIGHTS
+# # -----------------------------------------------------------------------
+cses_imd$no_weight <- 1 # UNWEIGHTED (RAW DATA)
+table(cses_imd$no_weight)
+table(cses_imd$IMD1010_1) # SAMPLE (SELECTION BIAS)
+cses_imd$weight_sample <- cses_imd$IMD1010_1
+table(cses_imd$IMD1010_2) # DEMOGRAPHIC (NON-RESPONSE BIAS)
+cses_imd$weight_demographic <- cses_imd$IMD1010_2 # PREFERRED WEIGHT (DEFAULT)
+#table(cses_imd$IMD1010_3) # POLITICAL (VOTING)- NOT USING IT
+#cses_imd$weight_political <- cses_imd$IMD1010_3
+# # -----------------------------------------------------------------------
+# SELECTING VARIABLES FOR DATA PLAYGROUND
+# # -----------------------------------------------------------------------
+vars <- c(
+"gendermc",
+"wealthf",
+"edrerf",
+"age",
+"ur",
+"labor_force",
+"compulsory_vote",
+"pais",
+"wave",
+"pais_num",
+"pais_lab",
+"no_weight",
+"weight_sample",
+"weight_demographic",
+"IMD1008_MOD"
+)
+# --- Variable Labels
+vars_labels <- read.csv("./Data preprocessing/cses_variable_labels_raw.csv",
+encoding = "latin1")
+# Variable Display for Dropdown Menu (category + question + name)
+vars_labels$display_en <- paste0(vars_labels$category_short_en, ": ",
+vars_labels$question_short_en,
+" (", vars_labels$column_name, ")", sep = "")
+vars2 <- vars_labels$column_name
+vars3 <- c(vars2, vars)
+# Check if all variables are present and subset dataset for shinyapp
+vars3 %in% names(cses_imd)
+cses_out <- cses_imd[vars3]
+# CHECKING INDIVIDUAL VARIABLES
+#table(cses_out$IMD2005_1) # remove 7 8 9; 6-point
+#table(cses_out$IMD2005_2) # remove 7 8 9; 4-point
+#table(cses_out$IMD2016) # remove 7:9 values; 5-point
+#table(cses_out$IMD2019_1) # remove 7:9 values; 2-point
+#table(cses_out$IMD3001_PR_1) # remove  9999993 9999995 9999996 9999997 9999998 9999999; 2-point
+#table(cses_out$IMD3001_PR_2) # remove  9999993 9999995 9999996 9999997 9999998 9999999; 2-point
+#table(cses_out$IMD3001_LH) # remove  9999993 9999995 9999996 9999997 9999998 9999999; 2-point
+#table(cses_out$IMD3001_UH) # remove 9999993 9999995 9999996 9999997 9999998 9999999; 2-point
+#table(cses_out$IMD3001_TS) # remove 9; 6-point
+#table(cses_out$IMD3002_OUTGOV) # remove  9999996 9999997 9999998 9999999; 2-point
+#table(cses_out$IMD3002_VS_1) # remove 9; 2-point
+#table(cses_out$IMD3002_LR_CSES) # remove  9; 3-point
+#table(cses_out$IMD3005_1) # remove  7 8 9; 2-point
+#table(cses_out$IMD3010) # remove 7 8 9, 6 should be recoded to 3; 5-point
+#table(cses_out$IMD3011) # remove 7 8 9; 5-point
+#table(cses_out$IMD3012) # remove 7 8 9; 5-point
+#table(cses_out$IMD3013_1) # remove 7 8 9; 3-point with 1,3,5
+#table(cses_out$IMD3013_2) # remove 7 8 9; 2-point with 1,2
+#table(cses_out$IMD3013_3) # remove 7 8 9; 2-point with 4 and 5
+#table(cses_out$IMD3014) # remove 6 7 8 9; 4-point
+#table(cses_out$IMD5006_1) # remove 999; TOO MANY
+#table(cses_out$IMD5006_2) # remove 999; TOO MANY
+#table(cses_out$IMD5013) # ok; 3-point
+#table(cses_out$IMD5014) # remove 7; 5-point
+#table(cses_out$IMD5032_4) # remove 9; 3-point
+#table(cses_out$IMD5033) # remove 9; 3-point
+#table(cses_out$IMD5034_2) # remove 6 9; 2-point
+#table(cses_out$IMD5035) # remove 999; TOO MANY
+#table(cses_out$IMD5048) # ok; 3-point
+#table(cses_out$IMD5049) # remove 999; TOO MANY
+#table(cses_out$IMD5050_1) # ok; 7-point
+#table(cses_out$IMD5051_1) # remove 99 and -88; 10-point
+#table(cses_out$IMD5052_2) # remove 99; TOO MANY
+#table(cses_out$IMD5053_1) # remove 999999; TOO MANY
+#table(cses_out$IMD5054_2) # remove 999; TOO MANY
+#table(cses_out$IMD5055_1) # remove 999; TOO MANY
+#table(cses_out$IMD5056_2) # remove 99999; TOO MANY
+#table(cses_out$IMD5057_1) # remove 9999999999; TOO MANY
+#table(cses_out$IMD5058_1) # remove 997   999; TOO MANY
+#table(cses_imd$IMD3001_TS) # REMOVE 9
+#table(cses_imd$IMD5054_2) # REMOVE 999
+#table(cses_imd$IMD5057_1) # REMOVE 9999999999
+#table(cses_imd$IMD5035) # REMOVE 999
+#table(cses_imd$IMD5056_2)  # REMOVE 99999
+#table(cses_imd$IMD5055_1) # remove 999
+#table(cses_imd$IMD5053_1) # remove 999999
+#table(cses_imd$IMD5052_2) # remove 99
+#table(cses_imd$IMD5006_2) # REMOVE 999
+#table(cses_imd$IMD5006_1) # REMOVE 999
+#table(cses_imd$IMD5058_1) # REMOVE 997 999
+#table(cses_imd$IMD5049) # REMOVE 999
+# # -----------------------------------------------------------------------
+# REMOVING NAs/NRs/DKs
+# # -----------------------------------------------------------------------
+# 95. VOLUNTEERED: HAVEN'T HEARD OF LEFT-RIGHT
+# 97. VOLUNTEERED: REFUSED
+# 98. VOLUNTEERED: DON'T KNOW WHERE TO PLACE
+# 99. MISSING
+cses_out <- cses_out %>%
+mutate(across(c(IMD2014, IMD3006,
+IMD5051_1, IMD5052_2,
+IMD2014, IMD3006), ~
+replace(.x, .x %in% c(-88, -77, -66, 95:99), NA)))
+# FIX NEGATIVE VALUES
+#cses_out$IMD5051_1<-(cses_out$IMD5051_1+10)/2
+cses_out <- cses_out %>%
+mutate(across(c(IMD3001, IMD3001_PR_1, IMD3001_PR_2,
+IMD3001_LH, IMD3001_UH, IMD2001_2,
+IMD3002_OUTGOV, IMD3002_LR_CSES), ~
+replace(.x, .x %in% c(9999993:9999999, 9997:9999), NA)))
+cses_out <- cses_out %>%
+mutate(across(c(IMD5006_1, IMD5006_2, IMD5035,
+IMD5049, IMD5053_1, IMD5054_2,
+IMD5045_1, IMD5055_1, IMD5056_2,
+IMD5057_1, IMD5058_1,
+IMD5054_2), ~
+replace(.x, .x %in% c(9999999999, 999999, 99999, 997, 998, 999), NA)))
+cses_out <- cses_out %>%
+mutate(across(c(IMD3001_TS, IMD3002_VS_1, IMD5032_4,
+IMD5033, IMD3002_LR_CSES), ~ replace(.x, .x %in% c(9), NA)))
+cses_out <- cses_out %>%
+mutate(across(c(IMD2005_1, IMD2005_2, IMD2016,
+IMD2019_1, IMD3005_1, IMD3011,
+IMD3012, IMD3013_1, IMD3013_2,
+IMD3010, IMD3013_3, IMD2002, IMD5036_3,
+IMD2004, IMD2007), ~ replace(.x, .x %in% c(7:9), NA)))
+cses_out <- cses_out %>%
+mutate(across(c(IMD3014, IMD5014, IMD5034_2, IMD2003, IMD2006), ~
+replace(.x, .x %in% c(6:9), NA)))
+# # -----------------------------------------------------------------------
+# CONTINUOUS VARIABLES RECODE INTO QUINTILES (~20% per category)
+# # -----------------------------------------------------------------------
+# Quintiles (5 groups) — overwrite the column with a factor that shows pretty labels.
+# The factor's internal codes are 1..5 in order,
+# so as.integer(df[[col]]) returns 1..5.
+# Bin a numeric column into quantile groups (quintiles when the data has
+# enough distinct values) and overwrite the column with a labelled factor.
+#
+# Args:
+#   data:           data frame containing `value_col`.
+#   value_col:      name of the numeric column to bin (overwritten).
+#   digits:         decimals shown for cut points in the labels.
+#   big_mark:       thousands separator used in the labels.
+#   include_lowest: not used by the body; kept so existing calls still work.
+#   type:           quantile algorithm passed to quantile() (7 = linear
+#                   interpolation of the empirical CDF).
+#
+# Returns `data` with `value_col` replaced by a factor whose levels follow
+# ascending bin order; the cut points are stored in its "breaks" attribute.
+quantile_cut_quintiles <- function(
+    data, value_col, digits = 0, big_mark = ",",
+    include_lowest = TRUE, type = 7) {
+  stopifnot(is.data.frame(data), value_col %in% names(data))
+  x <- data[[value_col]]
+  # Cut points at the 0/20/40/60/80/100th percentiles. Tied quantiles
+  # collapse under unique(), so the result is already strictly increasing
+  # and may describe fewer than five bins.
+  br <- as.numeric(quantile(x, probs = seq(0, 1, 0.2), na.rm = TRUE, type = type))
+  br <- unique(br[is.finite(br)])
+  # Edge cases: all-NA or constant column => single level (code 1) or all NA
+  if (length(br) < 2) {
+    all_missing <- all(is.na(x))
+    rng <- if (all_missing) c(NA, NA) else range(x, na.rm = TRUE)
+    lab <- if (all_missing) NA_character_ else paste0("[", rng[1], ", ", rng[2], "]")
+    f <- factor(ifelse(is.na(x), NA_character_, lab), levels = lab)
+    data[[value_col]] <- f
+    attr(data[[value_col]], "breaks") <- br
+    return(data)
+  }
+  # Formatting
+  fmt <- function(v) formatC(v, format = "f", digits = digits, big.mark = big_mark)
+  edges <- fmt(br)
+  n_bins <- length(br) - 1L
+  # Labels: one per actual bin, with open-ended text for the first and last.
+  # With six break points this reproduces the five quintile labels.
+  if (n_bins == 1L) {
+    labs <- paste0(edges[1], " to ", edges[2])
+  } else {
+    inner <- if (n_bins > 2L) {
+      paste0(edges[2:(n_bins - 1L)], " to ", edges[3:n_bins])
+    } else {
+      character(0)
+    }
+    labs <- c(
+      paste0("Less than ", edges[2]),
+      inner,
+      paste0("More than ", edges[n_bins])
+    )
+  }
+  # Rounding can make neighbouring cut points print identically, which
+  # factor() would reject with a less helpful message.
+  if (anyDuplicated(labs) > 0) {
+    stop(sprintf("Bin labels for '%s' are not unique; increase `digits`.", value_col),
+         call. = FALSE)
+  }
+  # Bin codes 1..n_bins (top bin closed on the right), then map to labels
+  codes <- as.integer(findInterval(x, br, rightmost.closed = TRUE, all.inside = TRUE))
+  codes[is.na(x)] <- NA_integer_
+  # Levels are given in bin order so as.integer(factor) returns the bin code
+  f <- factor(ifelse(is.na(codes), NA_character_, labs[codes]), levels = labs)
+  data[[value_col]] <- f
+  attr(data[[value_col]], "breaks") <- br
+  data
+}
+# Check the new factor labels (built from raw cutpoints)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5054_2")
+table(cses_out$IMD5054_2); levels(cses_out$IMD5054_2)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5057_1")
+table(cses_out$IMD5057_1); levels(cses_out$IMD5057_1)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5035")
+table(cses_out$IMD5035); levels(cses_out$IMD5035)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5056_2")
+table(cses_out$IMD5056_2); levels(cses_out$IMD5056_2)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5055_1", digits=2)
+table(cses_out$IMD5055_1); levels(cses_out$IMD5055_1)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5053_1")
+table(cses_out$IMD5053_1); levels(cses_out$IMD5053_1)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5052_2")
+table(cses_out$IMD5052_2); levels(cses_out$IMD5052_2)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5006_2")
+table(cses_out$IMD5006_2); levels(cses_out$IMD5006_2)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5006_1")
+table(cses_out$IMD5006_1); levels(cses_out$IMD5006_1)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5058_1")
+table(cses_out$IMD5058_1); levels(cses_out$IMD5058_1)
+cses_out <- quantile_cut_quintiles(cses_out, "IMD5049")
+table(cses_out$IMD5049); levels(cses_out$IMD5049)
+# Turn factor quintiles into labelled numerics 1..5 using the factor's own levels as value labels
+# Convert 5-level factor columns into haven-labelled integers 1..5, using the
+# factor's own levels as the value labels. Columns named in `vars` that are
+# absent from `df` are ignored; columns that are not factors or do not have
+# exactly five levels are left untouched with a warning.
+factor_quintiles_to_labelled <- function(df, vars) {
+  stopifnot(is.data.frame(df))
+  present <- vars[vars %in% names(df)]
+  for (col_name in present) {
+    column <- df[[col_name]]
+    if (!is.factor(column)) {
+      warning(sprintf("'%s' is not a factor; skipping.", col_name))
+      next
+    }
+    level_names <- levels(column)
+    n_levels <- length(level_names)
+    if (n_levels != 5) {
+      warning(sprintf("'%s' has %d levels (expected 5); skipping.", col_name, n_levels))
+      next
+    }
+    value_labels <- stats::setNames(1:5, level_names)
+    df[[col_name]] <- haven::labelled(as.integer(column), labels = value_labels)
+  }
+  df
+}
+qvars <- c("IMD5054_2","IMD5057_1","IMD5035","IMD5056_2",
+"IMD5055_1","IMD5053_1","IMD5052_2","IMD5006_2","IMD5006_1",
+"IMD5058_1","IMD5049")
+cses_out <- factor_quintiles_to_labelled(cses_out, qvars)
+# REMOVING CONTINUOUS VARS FOR NOW...
+#labs <- labs[!labs %in% c("IMD3001_TS", "IMD5054_2", "IMD5057_1", "IMD5035",
+#                          "IMD5056_2", "IMD5055_1", "IMD5053_1", "IMD5052_2",
+#                          "IMD5006_2", "IMD5006_1", "IMD5058_1", "IMD5049")]
+# # -----------------------------------------------------------------------
+# OUTCOME VARIABLES RECODE (NUMERIC TO LABELS)
+# # -----------------------------------------------------------------------
+# Function to convert labels to sentence case
+# Convert strings to sentence case: lower-case everything, then capitalise
+# the first letter that follows a ")" or "." and the very first character
+# when it is a word character.
+#
+# Args:
+#   x: character vector (NA elements stay NA).
+# Returns a character vector of the same length as `x`; empty input gives
+# character(0) rather than the list() that sapply() would produce.
+to_sentence_case <- function(x) {
+  # tolower(), gsub() and sub() are vectorized, so no per-element loop is needed
+  lowered <- tolower(x)
+  # Capitalize first letter after ) or .
+  capped <- gsub("([).]\\s*)([a-z])", "\\1\\U\\2", lowered, perl = TRUE)
+  # Also capitalize the very first character if needed
+  sub("^(\\w)", "\\U\\1", capped, perl = TRUE)
+}
+#  Label output dataset to include the labels through haven package
+# Safer: won't touch your quintile-binned columns
+# Attach value labels to the numeric columns of `data_out`, taking them from
+# the "label.table" attribute of `data`.
+#
+# Args:
+#   data:         object carrying a "label.table" attribute (a list keyed by
+#                 column name; each entry is a named vector of codes).
+#   data_out:     data frame whose columns should receive the labels.
+#   exclude_vars: optional character vector of column names to leave as-is.
+#
+# Returns a copy of `data_out` in which every eligible column is a
+# haven::labelled vector. Columns are skipped when they are excluded, are
+# factors, carry a quantile-break attribute, have no label table entry, or
+# are not numeric.
+label_all_for_haven <- function(data, data_out, exclude_vars = NULL) {
+  label_table <- attr(data, "label.table", exact = TRUE)
+  data_labeled <- data_out
+  for (var in names(data_out)) {
+    column <- data_out[[var]]
+    # 1) explicit exclude list (`%in% NULL` is FALSE, so NULL excludes nothing)
+    if (var %in% exclude_vars) next
+    # 2) skip if already a factor (e.g., quintile pretty labels)
+    if (is.factor(column)) next
+    # 3) skip if marked as binned: quantile_cut_quintiles() stores its cut
+    #    points under "breaks"; "q5_breaks" is still honoured for older data
+    if (!is.null(attr(column, "breaks", exact = TRUE)) ||
+        !is.null(attr(column, "q5_breaks", exact = TRUE))) {
+      next
+    }
+    values <- label_table[[var]]
+    # Nothing to attach, or a non-numeric target that must not be clobbered
+    if (is.null(values) || !is.numeric(column)) next
+    # Clean labels: remove number prefixes, apply sentence case
+    clean_labels <- sub("^\\d+\\.\\s*", "", names(values))
+    clean_labels <- to_sentence_case(clean_labels)
+    # Build named vector: names = labels, values = numeric codes
+    labelled_vec <- setNames(as.numeric(values), clean_labels)
+    data_labeled[[var]] <- haven::labelled(column, labels = labelled_vec)
+  }
+  data_labeled
+}
+cses_out_labels <- label_all_for_haven(cses_imd, cses_out,
+exclude_vars = c("IMD5054_2","IMD5057_1","IMD5035","IMD5056_2",
+"IMD5055_1","IMD5053_1","IMD5052_2","IMD5006_2",
+"IMD5006_1","IMD5058_1","IMD5049"))
+# # -----------------------------------------------------------------------
+# CUSTOM FIXES FOR NOW
+# # -----------------------------------------------------------------------
+cses_out_labels$IMD2004[cses_out_labels$IMD2004==5]<-NA
+cses_out_labels$IMD3010 <- labelled(
+x = replace(cses_out_labels$IMD3010, cses_out_labels$IMD3010 == 6, 3),
+labels = c(
+"Very satisfied"         = 1,
+"Satisfied"              = 2,
+"Neither"                = 3,
+"Not very satisfied"     = 4,
+"Not all satisfied"      = 5
+)
+)
+cses_out_labels$IMD5007 <- labelled(
+x = replace(cses_out_labels$IMD5007, cses_out_labels$IMD5007 == 5, 0),
+labels = c(
+"No"                     = 0,
+"Yes; no sanctions"      = 3,
+"Yes; weakly enforced"   = 2,
+"Yes; strictly enforced" = 1
+)
+)
+cses_out_labels$IMD5052_2<-round(cses_out_labels$IMD5052_2, 1)
+# # -----------------------------------------------------------------------
+# Exporting DATA (.rds lighter file storage)
+# # -----------------------------------------------------------------------
+# MERGE PAIS_LAB TO CSES_OUT BEFORE EXPORT
+pais_lab_merge<-subset(pais_lab, select=c("pais_lab", "pais_nam"))
+cses_out_labels <- merge(cses_out_labels, pais_lab_merge, by = "pais_lab")
+str(cses_out_labels)
+# REMOVING CONTINUOUS VARS FOR NOW...
+#cses_out_labels<-subset(cses_out_labels, select=-c(IMD3001_TS, IMD5054_2, IMD5057_1, IMD5035,
+#                                     IMD5056_2, IMD5055_1, IMD5053_1, IMD5052_2,
+#                                     IMD5006_2, IMD5006_1, IMD5058_1, IMD5049))
+# EXPORT RDS
+saveRDS(cses_out_labels, "./cses_shiny_data.rds")
+# EXPORT RDA (MAX COMPRESSION)
+cses_shiny_data<-cses_out_labels
+save(cses_shiny_data, file="cses_shiny_data.rda")
+tools::resaveRdaFiles("./cses_shiny_data.rda", compress = "xz")
+tools::checkRdaFiles("./cses_shiny_data.rda")
+# # -----------------------------------------------------------------------
+# EXTRACTING RESPONSE OPTIONS FOR VARS_LABELS DATA
+# # -----------------------------------------------------------------------
+# Define the format_labels function to extract and format ROs
+# Render a named vector of response codes as "(code) label" pairs joined by
+# single spaces, keeping only codes strictly between -15 and 90 (special
+# codes such as DK / NA / NR fall outside that window).
+format_labels <- function(label_table) {
+  in_window <- label_table > -15 & label_table < 90
+  kept <- label_table[in_window]
+  pieces <- vapply(
+    seq_along(kept),
+    function(idx) paste0("(", kept[idx], ") ", names(kept)[idx]),
+    character(1)
+  )
+  paste(pieces, collapse = " ")
+}
+# Extract Response Options from Dataset Attributes (label.table)
+for (var in names(cses_imd)) {
+if (var %in% vars_labels$column_name) {
+label_table <- attr(cses_imd, "label.table", exact=T)[[var]]
+if (!is.null(label_table)) {
+vars_labels$responses_en[vars_labels$column_name == var] <- format_labels(label_table)
+}
+}
+}
+table(vars_labels$responses_en=="" | is.na(vars_labels$responses_en))
+# # -----------------------------------------------------------------------
+# FILLING "Question Wording" & "Response Options" for Variables.
+# # -----------------------------------------------------------------------
+qword_ro<-read.csv("./Data preprocessing/cses_qwording.csv", header=T)
+vars_labels <- vars_labels %>%
+left_join(qword_ro, by = "column_name", suffix = c(".old", "")) %>%
+# Select columns from qword_ro and non-duplicated columns from vars_labels
+select(-contains(".old"))
+table(vars_labels$responses_en=="" | is.na(vars_labels$responses_en))
+# REMOVING NAs/NRs/DKs from ROs and other CLEANING (mojibake/encoding errors)
+#vars_labels$responses_en<-gsub("â€“", ":", vars_labels$responses_en)
+#vars_labels$responses_en<-gsub("00.", "0.", vars_labels$responses_en)
+#vars_labels$question_short_en<-gsub("ÃƒÆ’Ã‚Â¢ÃƒÂ¢Ã¢â‚¬Å¡Ã‚Â¬ÃƒÂ¢Ã¢â€šÂ¬Ã…â€œ", ":", vars_labels$question_short_en)
+#vars_labels$question_short_en<-gsub("ÃƒÆ’Ã†â€™Ãƒâ€šÃ‚Â¢ÃƒÆ’Ã‚Â¢ÃƒÂ¢Ã¢â€šÂ¬Ã…Â¡Ãƒâ€šÃ‚Â¬ÃƒÆ’Ã‚Â¢ÃƒÂ¢Ã¢â‚¬Å¡Ã‚Â¬Ãƒâ€¦Ã¢â‚¬Å“", "", vars_labels$question_short_en)
+vars_labels$responses_en<-trimws(vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(7\\) 7. VOLUNTEERED: REFUSED", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(8\\) 8. VOLUNTEERED: DON'T KNOW", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(9\\) 9. MISSING", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(6\\) 6. OTHER", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(6\\) 6. \\[SEE ELECTION STUDY NOTES\\]", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(7\\) 7. NOT APPLICABLE \\[NO ALLIANCES PERMITTED\\]", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(6\\) 6. NO INTERNATIONAL ELECTION OBSERVERS", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub(" \\(7\\) 7. NOT APPLICABLE", "", vars_labels$responses_en)
+vars_labels$responses_en<-gsub("\\(1\\) 1. VERY SATISFIED \\(2\\) 2. FAIRLY SATISFIED \\(4\\) 4. NOT VERY SATISFIED \\(5\\) 5. NOT AT ALL SATISFIED \\(6\\) 6. NEITHER SATISFIED NOR DISSATISFIED",
+"\\(1\\) 1. VERY SATISFIED \\(2\\) 2. FAIRLY SATISFIED \\(3\\) 3. NEITHER SATISFIED NOR DISSATISFIED \\(4\\) 4. NOT VERY SATISFIED \\(5\\) 5. NOT AT ALL SATISFIED",
+vars_labels$responses_en)
+vars_labels$responses_en<-trimws(vars_labels$responses_en)
+# Remove leftover numeric prefixes (e.g. "1. ") and collapse extra whitespace, respectively
+vars_labels$responses_en <- gsub("(\\s|^)-?\\d+\\.\\s", "\\1", vars_labels$responses_en)
+vars_labels$responses_en <- gsub("([).])\\s+", "\\1 ", vars_labels$responses_en)
+vars_labels$responses_en<-gsub("\\(5\\) NO", "\\(0\\) NO", vars_labels$responses_en) # COMPULSORY VOTE IMD5007
+# Create responses_en_rec
+vars_labels$responses_en_rec<-to_sentence_case(vars_labels$responses_en)
+vars_labels$question_short_en<-to_sentence_case(vars_labels$question_short_en)
+vars_labels$question_short_en <- gsub("([).-])\\s+", "\\1 ", vars_labels$question_short_en)
+# # -----------------------------------------------------------------------
+# EXPORT CSES LABELS
+# # -----------------------------------------------------------------------
+# REMOVING CONTINUOUS VARS FOR NOW...
+#vars_labels <- vars_labels[!vars_labels$column_name %in%
+#                                   c("IMD3001_TS", "IMD5054_2", "IMD5057_1", "IMD5035",
+#                                     "IMD5056_2", "IMD5055_1", "IMD5053_1", "IMD5052_2",
+#                                     "IMD5006_2", "IMD5006_1", "IMD5058_1", "IMD5049"), ]
+write.csv(vars_labels, "./cses_variable_labels.csv", row.names=F)
+# # -----------------------------------------------------------------------
+# LABS VECTOR
+# # -----------------------------------------------------------------------
+labs <- vars_labels$column_name
+names(labs) <- vars_labels$display_en
+labs[order(names(labs))]
+names(vars_labels$column_name) <- vars_labels$display_en
+vars_labels$labs2 <- labs
+# Full question text followed by its recoded response options. paste0() has
+# no `sep` argument (" " would simply be appended as a third string), so
+# paste() is used to put the space between the two fields.
+vars_labels$question_en_comp <- paste(vars_labels$question_en,
+                                      vars_labels$responses_en_rec,
+                                      sep = " ")
+# Dropping MACRO Variables from Outcomes but keeping at secondary vars
+drop_macro <- grep("Macro Data:", names(labs), value = TRUE)
+labs_sec <- labs
+labs <- labs[!(names(labs) %in% drop_macro)]
+# # -----------------------------------------------------------------------
+# FINAL EXPORT OF LABELS
+# # -----------------------------------------------------------------------
+saveRDS(labs, "./cses_labs.rds")
+saveRDS(labs_sec, "./cses_labs_sec.rds")
+# END
+# # -----------------------------------------------------------------------
+message("Code ended succesfully")
+# # -----------------------------------------------------------------------
+### CSES DATA PLAYGROUND
+# Date: November 10th, 2025
+# Author: Robert Vidigal, PhD
+# Purpose: CSES Shiny Data Playground based on LAPOP Lab Data Playground
+# Prev file: ./shiny_preprocessing.R
+# Machine: Windows OS
+# Status: On-going
+# # -----------------------------------------------------------------------
+### Data In:
+# 1. cses_shiny_data.rda
+# 2. cses_variable_labels.csv
+# 3. cses_labs.rds
+# 4. and fonts from /www/
+### Data Out: N/A
+# # -----------------------------------------------------------------------
+options(shiny.useragg = TRUE) # speed it up
+# # -----------------------------------------------------------------------
+# Packages loading
+# # -----------------------------------------------------------------------
+library(lapop); library(bslib); library(htmltools); require(bsplus)
+suppressPackageStartupMessages(library(dplyr))
+library(tidyr); library(stringr); library(haven)
+require(shiny); library(shinyWidgets); require(shinyjs)
+suppressPackageStartupMessages(library(Hmisc, exclude = c("src", "summarize", "units", "format.pval")))
+lapop_fonts() # LAPOP GRAPH STYLE
+# IMD CSES Data (only preselected variables)
+# # -----------------------------------------------------------------------
+# RDA FILE BEST COMPRESSION FOR RSHINY
+load(file="./cses_shiny_data.rda"); dstrata<-cses_shiny_data; rm(cses_shiny_data)
+# Labels data (for DP display)
+vars_labels <- read.csv("./cses_variable_labels.csv", encoding = "latin1")
+# Labs vector (for DP display outcomes versus secondary vars that include macro vars)
+labs <- readRDS("./cses_labs.rds")
+labs_sec <- readRDS("./cses_labs_sec.rds")
+# Dropping Demographics (OLD, ALLOW USERS TO USE BOTH RAW AND RECODE DEMOG VARS)
+#drop_demoglabs <- c("IMD2001_2", "IMD2002", "IMD2003", "IMD2006", "IMD2007") # Demographics
+#labs_sec <- labs[ !(unname(labs) %in% drop_demoglabs) ]
+# Error handling function (so app does not break easily)
+# Evaluate `x` and return its value; if evaluation raises an error, return
+# FALSE instead so the caller can carry on.
+Error <- function(x) {
+  on_failure <- function(e) FALSE
+  tryCatch(x, error = on_failure)
+}
+# CSES election-year vector for TS
+waves_total = c("1996", "1997", "1998", "1999", "2000", "2001", "2002",
+"2003", "2004", "2005", "2006", "2007", "2008", "2009",
+"2010", "2011", "2012", "2013", "2014", "2015", "2016",
+"2017", "2018", "2019", "2020",  "2021")
+# Escape stuff that ggtext/markdown treats specially
+# Replace characters that HTML or markdown would interpret with their
+# entity codes. Input is coerced to character first.
+sanitize_for_ggtext <- function(x) {
+  # "&" must be handled first so the entities inserted below are not
+  # escaped a second time.
+  escapes <- c(
+    "&" = "&amp;",
+    "<" = "&lt;",
+    ">" = "&gt;",
+    "[" = "&#91;",
+    "]" = "&#93;",
+    "(" = "&#40;",
+    ")" = "&#41;",
+    "*" = "&#42;",
+    "_" = "&#95;",
+    "`" = "&#96;"
+  )
+  out <- as.character(x)
+  for (target in names(escapes)) {
+    out <- gsub(target, escapes[[target]], out, fixed = TRUE)
+  }
+  out
+}
+# # -----------------------------------------------------------------------
+# Helper function for TS (handle missing values at end or middle of series)
+# # -----------------------------------------------------------------------
+# Trim leading and trailing rows that contain any NA, keeping every row
+# between the first and last complete rows (interior rows with NA are kept).
+#
+# Args:
+#   df: data frame.
+# Returns a data frame; zero rows when no row is complete.
+omit_na_edges <- function(df) {
+  # TRUE for rows with at least one missing value
+  na_rows <- rowSums(is.na(df)) > 0
+  complete_idx <- which(!na_rows)
+  # No complete row: previously this built the range NA:NA and errored
+  if (length(complete_idx) == 0L) {
+    return(df[0, , drop = FALSE])
+  }
+  first_non_na <- complete_idx[1]
+  last_non_na <- complete_idx[length(complete_idx)]
+  # drop = FALSE keeps a one-column data frame from collapsing to a vector
+  df[first_non_na:last_non_na, , drop = FALSE]
+}
+### MOVE IT TO LAPOP_TS???
+View(dstrata)
+View(vars_labels)
+View(pais_lab_merge)
+View(qword_ro)
+grep("Not at all", qword_ro$responses_en)
+grep("Not at all", qword_ro$responses_en, value = T)
+grep("all", qword_ro$responses_en, value = T)
+grep("not", qword_ro$responses_en, value = T)
+grep("none", qword_ro$responses_en, value = T)
+grep("never", qword_ro$responses_en, value = T)
+grep("never", qword_ro$responses_en, value = T)
+grepl("never", qword_ro$responses_en, value = T)
+grep("(1)", qword_ro$responses_en, value = T)
+grep("no", qword_ro$responses_en, value = T)
+grep("NOT AT ALL", qword_ro$responses_en, value = T)
+grep("NOT AT ALL", qword_ro$responses_en)
+devtools::install_github("lapop-central/lapop",
+force = TRUE,
+build_vignettes = TRUE)
+shiny::runApp()
+runApp()

.gitattributes CHANGED Viewed

@@ -45,3 +45,7 @@ cses-shiny/www/Roboto-Bold.ttf filter=lfs diff=lfs merge=lfs -text
 cses-shiny/www/Roboto-Light.ttf filter=lfs diff=lfs merge=lfs -text
 cses-shiny/www/Roboto-Medium.ttf filter=lfs diff=lfs merge=lfs -text
 cses-shiny/www/Roboto-Regular.ttf filter=lfs diff=lfs merge=lfs -text

 cses-shiny/www/Roboto-Light.ttf filter=lfs diff=lfs merge=lfs -text
 cses-shiny/www/Roboto-Medium.ttf filter=lfs diff=lfs merge=lfs -text
 cses-shiny/www/Roboto-Regular.ttf filter=lfs diff=lfs merge=lfs -text
+.RData filter=lfs diff=lfs merge=lfs -text
+cses_shiny_data.rda filter=lfs diff=lfs merge=lfs -text
+cses_shiny_data.rds filter=lfs diff=lfs merge=lfs -text
+world.rda filter=lfs diff=lfs merge=lfs -text

.gitignore CHANGED Viewed

	@@ -1 +1,8 @@
1	- .~~DS_Store~~

+.Rproj.user
+.Rhistory
+.RData
+.Ruserdata
+*.dcf
+rsconnect/shinyapps.io/centerforglobaldemocracy/cses-shiny.dcf
+app_old_warning.R
+app_w_stack.R

app.R ADDED Viewed

	@@ -0,0 +1,1566 @@

+### CSES DATA PLAYGROUND
+# Date: November 10th, 2025
+# Author: Robert Vidigal, PhD
+# Purpose: CSES Shiny Data Playground based on LAPOP Lab Data Playground
+# Prev file: ./shiny_preprocessing.R
+# Machine: Windows OS
+# Status: On-going
+# # -----------------------------------------------------------------------
+### Data In:
+# 1. cses_shiny_data.rda
+# 2. cses_variable_labels.csv
+# 3. cses_labs.rds
+# 4. and fonts from /www/
+### Data Out: N/A
+# # -----------------------------------------------------------------------
+options(shiny.useragg = TRUE) # speed it up
+# # -----------------------------------------------------------------------
+# Packages loading
+# # -----------------------------------------------------------------------
+library(lapop); library(bslib); library(htmltools); require(bsplus)
+suppressPackageStartupMessages(library(dplyr))
+library(tidyr); library(stringr); library(haven)
+require(shiny); library(shinyWidgets); require(shinyjs); require(ggtext)
+suppressPackageStartupMessages(library(Hmisc, exclude = c("src", "summarize", "units", "format.pval")))
+lapop_fonts() # LAPOP GRAPH STYLE
+# IMD CSES Data (only preselected variables)
+# # -----------------------------------------------------------------------
+# RDA FILE BEST COMPRESSION FOR RSHINY
+load(file="./cses_shiny_data.rda");
+# Labels data (for DP display)
+vars_labels <- read.csv("./cses_variable_labels.csv", encoding = "latin1")
+# Labs vector (for DP display outcomes versus secondary vars that include macro vars)
+labs <- readRDS("./cses_labs.rds")
+labs_sec <- readRDS("./cses_labs_sec.rds")
+load(file="./world.rda")
+# Dropping Demographics (OLD, ALLOW USERS TO USE BOTH RAW AND RECODE DEMOG VARS)
+#drop_demoglabs <- c("IMD2001_2", "IMD2002", "IMD2003", "IMD2006", "IMD2007") # Demographics
+#labs_sec <- labs[ !(unname(labs) %in% drop_demoglabs) ]
+# # -----------------------------------------------------------------------
+# Error handling function (so app does not break easily)
+# # -----------------------------------------------------------------------
+# Evaluate `x` and return its value; if evaluation raises an error, return
+# FALSE instead so the caller can carry on.
+Error <- function(x) {
+  on_failure <- function(e) FALSE
+  tryCatch(x, error = on_failure)
+}
+# CSES election-year vector for TS
+waves_total = c("1996", "1997", "1998", "1999", "2000", "2001", "2002",
+                "2003", "2004", "2005", "2006", "2007", "2008", "2009",
+                "2010", "2011", "2012", "2013", "2014", "2015", "2016",
+                "2017", "2018", "2019", "2020",  "2021")
+# Escape stuff that ggtext/markdown treats specially
+# Replace characters that HTML or markdown would interpret with their
+# entity codes. Input is coerced to character first.
+sanitize_for_ggtext <- function(x) {
+  # "&" must be handled first so the entities inserted below are not
+  # escaped a second time.
+  escapes <- c(
+    "&" = "&amp;",
+    "<" = "&lt;",
+    ">" = "&gt;",
+    "[" = "&#91;",
+    "]" = "&#93;",
+    "(" = "&#40;",
+    ")" = "&#41;",
+    "*" = "&#42;",
+    "_" = "&#95;",
+    "`" = "&#96;"
+  )
+  out <- as.character(x)
+  for (target in names(escapes)) {
+    out <- gsub(target, escapes[[target]], out, fixed = TRUE)
+  }
+  out
+}
+# # -----------------------------------------------------------------------
+# Helper function for TS
+# # -----------------------------------------------------------------------
+# (handle missing values at end or middle of series)
+# Trim leading and trailing rows that contain any NA, keeping every row
+# between the first and last complete rows (interior rows with NA are kept).
+#
+# Args:
+#   df: data frame.
+# Returns a data frame; zero rows when no row is complete.
+omit_na_edges <- function(df) {
+  # TRUE for rows with at least one missing value
+  na_rows <- rowSums(is.na(df)) > 0
+  complete_idx <- which(!na_rows)
+  # No complete row: previously this built the range NA:NA and errored
+  if (length(complete_idx) == 0L) {
+    return(df[0, , drop = FALSE])
+  }
+  first_non_na <- complete_idx[1]
+  last_non_na <- complete_idx[length(complete_idx)]
+  # drop = FALSE keeps a one-column data frame from collapsing to a vector
+  df[first_non_na:last_non_na, , drop = FALSE]
+}
+# # -----------------------------------------------------------------------
+# Custom weighted averages & CIs, much faster than survey_mean() etc
+# # -----------------------------------------------------------------------
+# Weighted mean with a 95% t-based confidence interval.
+#
+# Args:
+#   x:       numeric vector of values.
+#   weights: numeric vector of weights, one per element of `x`.
+# Returns a one-row data frame with columns `prop` (weighted mean), `lb` and
+# `ub` (interval bounds).
+weighted.ttest.ci <- function(x, weights) {
+  # Use only pairs where both value and weight are observed, so the sample
+  # size matches what the mean and variance are computed from.
+  observed <- !is.na(x) & !is.na(weights)
+  x <- x[observed]
+  weights <- weights[observed]
+  nx <- length(x)
+  vx <- Hmisc::wtd.var(x, weights, normwt = TRUE, na.rm = TRUE) # Weighted variance
+  mx <- weighted.mean(x, weights, na.rm = TRUE) # Weighted mean
+  stderr <- sqrt(vx / nx)
+  # Build the interval directly as mean +/- t * SE. Going through the t
+  # statistic (mx / stderr) yields NaN bounds whenever the standard error is
+  # 0, i.e. when every value in the group is identical.
+  half_width <- qt(1 - 0.05 / 2, nx - 1) * stderr
+  data.frame(prop = mx, lb = mx - half_width, ub = mx + half_width)
+}
+# # -----------------------------------------------------------------------
+# Helper for missing country-year by outcome_var
+# # -----------------------------------------------------------------------
+# List the country-wave pairs that have no usable data for an outcome.
+#
+# Args:
+#   data:               data frame with a `pais_nam` column plus the columns
+#                       named by `outcome_var` and `wave_var`.
+#   outcome_var:        name of the outcome column.
+#   wave_var:           name of the wave column (converted to text through
+#                       haven::as_factor()).
+#   selected_waves:     waves to check.
+#   selected_countries: country names to check.
+# Returns a data frame with columns `pais_nam` and `wave` (character), one
+# row per pair whose outcome has no value that is both non-missing and
+# different from 0.
+get_missing_combinations <- function(data, outcome_var, wave_var,
+                                     selected_waves, selected_countries) {
+  # Convert wave values to string using haven labels
+  data <- data %>%
+    mutate(wave_str = as.character(haven::as_factor(.data[[wave_var]])))
+  # Build the full country-wave grid. Waves are coerced to character so the
+  # join below matches `wave_str` even when numeric waves are passed in.
+  all_combos <- expand.grid(
+    pais_nam = selected_countries,
+    wave = as.character(selected_waves),
+    stringsAsFactors = FALSE
+  )
+  # Subset only relevant countries
+  data <- data %>%
+    filter(pais_nam %in% selected_countries)
+  # Count valid (non-NA and not 0) values per country-wave pair
+  valid_counts <- data %>%
+    group_by(pais_nam, wave = wave_str) %>%
+    summarise(
+      n_valid = sum(!is.na(.data[[outcome_var]]) & .data[[outcome_var]] != 0),
+      .groups = "drop"
+    )
+  # Pairs absent from the counts, or present with zero valid values
+  all_combos %>%
+    left_join(valid_counts, by = c("pais_nam", "wave")) %>%
+    filter(is.na(n_valid) | n_valid == 0) %>%
+    select(pais_nam, wave)
+}
+# # -----------------------------------------------------------------------
+# Helper function for mover plot (weighting and handling NAs)
+# # -----------------------------------------------------------------------
+# Builds one panel of the breakdown ("mover") plot: for each category of
+# `group_var`, the weighted percentage of respondents whose outcome lies
+# inside `recode_range`, with its confidence interval.
+#   data:         respondent-level data frame.
+#   outcome_var:  name (string) of the outcome column.
+#   recode_range: length-2 numeric; inclusive bounds of the values coded 100.
+#   group_var:    name (string) of the grouping column; NULL returns NULL.
+#   var_label:    text stored in the `varlabel` column of the result.
+#   weight_var:   name (string) of the weight column.
+# Returns a data frame with vallabel, prop, lb, ub, varlabel and proplabel;
+# rows containing any missing value are dropped.
+process_data <- function(data, outcome_var, recode_range,
+                         group_var, var_label, weight_var) {
+  if (is.null(group_var)) {
+    return(NULL)
+  }
+  data %>%
+    # Drop cases lacking the outcome or the weight, as the time-series and
+    # cross-country summaries do; a single NA weight would otherwise turn
+    # the whole group's weighted mean into NA.
+    drop_na(!!sym(outcome_var), !!sym(weight_var)) %>%
+    mutate(outcome_rec = case_when(
+      !!sym(outcome_var) >= recode_range[1] & !!sym(outcome_var) <= recode_range[2] ~ 100,
+      TRUE ~ 0
+    )) %>%
+    group_by(vallabel = haven::as_factor(haven::zap_missing(!!sym(group_var)))) %>%
+    # weighted.ttest.ci() returns a one-row data frame (prop, lb, ub), stored
+    # here as a data-frame column and spread into columns just below.
+    summarise(
+      outcome_rec = weighted.ttest.ci(outcome_rec, !!sym(weight_var)),
+      .groups = "drop"
+    ) %>%
+    unnest_wider(col = "outcome_rec") %>%
+    mutate(
+      varlabel = var_label,
+      proplabel = paste0(round(prop), "%")
+    ) %>%
+    drop_na()
+}
+# # -----------------------------------------------------------------------
+# BOOTSTRAP THEME
+# # -----------------------------------------------------------------------
+# Bootstrap 5 theme based on the Bootswatch "cosmo" preset. Primary and
+# secondary share the app's orange accent; warning and danger share one red.
+cses_theme <- bs_theme(
+  version = 5,
+  bootswatch = "cosmo",
+  bg = "#ffffff",
+  fg = "#212529",
+  primary = "#C4722A",
+  secondary = "#C4722A",
+  success = "#28a745",
+  info = "#0066cc",
+  warning = "#dc3545",
+  danger = "#dc3545"
+  # No trailing comma above: it would pass an empty argument to bs_theme().
+  # Optional font settings, currently disabled (add a comma after `danger`
+  # when re-enabling any of them):
+  #base_font = font_google("Open Sans"),
+  #heading_font = font_google("Roboto Slab"),
+  #code_font = font_google("Fira Mono"),
+  #font_scale = 1
+)
+# # -----------------------------------------------------------------------
+# HOVER POP-UP FOR LEFTSIDE MENU
+# # -----------------------------------------------------------------------
+# Label with an orange info icon that carries a bsplus popover.
+#   text:    label shown next to the icon.
+#   title:   forwarded as the popover title.
+#   content: forwarded as the popover content.
+# Returns the tag produced by bsplus::bs_embed_popover().
+info_badge <- function(text, title, content) {
+  info_icon <- tags$span(icon("info-circle"), class = "me-1",  style = "color:#C4722A;")
+  labelled <- tags$span(text, info_icon)
+  bsplus::bs_embed_popover(
+    labelled,
+    title = title,
+    content = content,
+    placement = "right",
+    trigger = "click",
+    container = "body"
+  )
+}
+# # -----------------------------------------------------------------------
+# N-SIZE FUNCTION TO PULL COUNTRY-YEAR COMBOS (CHATGPT)
+# # -----------------------------------------------------------------------
+# Counts rows with a non-missing outcome, overall and broken down by wave,
+# by country and by country-wave pair.
+#   data:               data frame to count in.
+#   outcome_var:        name (string) of the outcome column.
+#   wave_var:           name (string) of the wave column.
+#   country_var:        name (string) of the country column.
+#   selected_waves:     optional wave values to keep (NULL keeps all).
+#   selected_countries: optional country values to keep (NULL keeps all).
+#   complete_grid:      if TRUE, every country-wave pair appears in
+#                       per_country_wave (n = 0 where absent) and the
+#                       per-wave/per-country totals are derived from that grid.
+# Returns a list: overall (row count), per_wave (wave, n), per_country
+# (pais, n) and per_country_wave (pais, wave, n).
+get_sample_counts <- function(
+    data, outcome_var,
+    wave_var = "wave", country_var = "pais_nam",
+    selected_waves = NULL, selected_countries = NULL,
+    complete_grid = FALSE
+) {
+  kept <- data
+  if (!is.null(selected_waves)) {
+    kept <- dplyr::filter(kept, .data[[wave_var]] %in% selected_waves)
+  }
+  if (!is.null(selected_countries)) {
+    kept <- dplyr::filter(kept, .data[[country_var]] %in% selected_countries)
+  }
+  kept <- dplyr::filter(kept, !is.na(.data[[outcome_var]]))
+  by_pair <- dplyr::arrange(
+    dplyr::count(kept, pais = .data[[country_var]], wave = .data[[wave_var]], name = "n"),
+    pais, wave
+  )
+  if (complete_grid) {
+    # Fall back to every value found in the unfiltered data when no
+    # explicit selection was given.
+    grid_waves <- if (is.null(selected_waves)) sort(unique(data[[wave_var]])) else selected_waves
+    grid_countries <- if (is.null(selected_countries)) sort(unique(data[[country_var]])) else selected_countries
+    by_pair <- by_pair |>
+      tidyr::complete(pais = grid_countries, wave = grid_waves, fill = list(n = 0)) |>
+      dplyr::arrange(pais, wave)
+    by_country <- by_pair |>
+      dplyr::group_by(pais) |>
+      dplyr::summarise(n = sum(n), .groups = "drop") |>
+      dplyr::arrange(pais)
+    by_wave <- by_pair |>
+      dplyr::group_by(wave) |>
+      dplyr::summarise(n = sum(n), .groups = "drop") |>
+      dplyr::arrange(wave)
+  } else {
+    by_wave <- dplyr::arrange(
+      dplyr::count(kept, wave = .data[[wave_var]], name = "n"),
+      wave
+    )
+    by_country <- dplyr::arrange(
+      dplyr::count(kept, pais = .data[[country_var]], name = "n"),
+      pais
+    )
+  }
+  list(
+    overall = nrow(kept),
+    per_wave = by_wave,
+    per_country = by_country,
+    per_country_wave = by_pair
+  )
+}
+# # -----------------------------------------------------------------------
+# # -----------------------------------------------------------------------
+# # -----------------------------------------------------------------------
+# # -----------------------------------------------------------------------
+# Creating User Interface UI!
+# # -----------------------------------------------------------------------
+# Page layout: a title, a sidebar holding the selection controls (outcome,
+# module, countries, years, weights, recode slider, breakdown options) and a
+# main panel with the caption texts, five plot tabs, the download buttons and
+# the sample-size card.
+ui <- fluidPage(
+  useShinyjs(),
+  theme = cses_theme,
+  tags$h2("CSES Data Playground",
+          style = "color: #C4722A; font-weight: bold; font-size: 36px;"),
+  sidebarLayout(
+    # ----- Sidebar panel for inputs
+    sidebarPanel(width = 3,
+      selectInput("variable", "Outcome",
+                  labs[order(names(labs))],
+                  selected = "IMD3010"),
+      # ----- MODULE ("MODULE 5" is preselected)
+      # NOTE(review): info_badge() is declared as (text, title, content); the
+      # calls in this file pass the long help text as `title` and the short
+      # label as `content` -- confirm this ordering is intended.
+      pickerInput(inputId = "module",
+                  label = tagList(info_badge("Module",
+                          HTML("Please select which CSES Modules to be available in the analysis. Then, select which countries and years below."),
+                          "Module")),
+                  choices = sort(levels(as_factor(cses_shiny_data$IMD1008_MOD)[!is.na(cses_shiny_data$IMD1008_MOD)])),
+                  selected = c("MODULE 5"),
+                  options = list(`actions-box` = TRUE),
+                  multiple = TRUE),
+      # ----- COUNTRY
+      pickerInput(inputId = "pais",
+                  label = "Countries",
+                    #tagList(info_badge("Countries",
+                    #HTML("Please select which countries to be included in the analysis."),
+                    #"Countries")),
+                  choices = sort(levels(as_factor(cses_shiny_data$pais)[!is.na(cses_shiny_data$pais)])),
+                  options = list(`actions-box` = TRUE),
+                  multiple = TRUE),
+      # ----- WAVE (initial choices are the years 1996-2021)
+      pickerInput(inputId = "wave",
+                  label = "Years",
+                  #tagList(info_badge("Years",
+                  #                           HTML("Please select which years to be included in the analysis."),
+                  #                           "Years")),
+                  choices = c("1996" = "1996", "1997" = "1997", "1998" = "1998",
+                              "1999" = "1999", "2000" = "2000", "2001" = "2001",
+                              "2002" = "2002", "2003" = "2003", "2004" = "2004",
+                              "2005" = "2005", "2006" = "2006", "2007" = "2007",
+                              "2008" = "2008", "2009" = "2009", "2010" = "2010",
+                              "2011" = "2011", "2012" = "2012", "2013" = "2013",
+                              "2014" = "2014", "2015" = "2015", "2016" = "2016",
+                              "2017" = "2017", "2018" = "2018", "2019" = "2019",
+                              "2020" = "2020", "2021" = "2021"),
+                  options = list(`actions-box` = TRUE),
+                  multiple = TRUE),
+      # ----- WEIGHT selection radio buttons ("no_weight" is the default)
+      bsplus::use_bs_popover(),
+      radioButtons(
+        inputId = "weight_type",
+        label = tagList(info_badge("Weights",
+                        HTML("Further information on weights is available in <b>Part 6</b> of CSES Module 4."),
+                        "Weights")),
+        # For a link, add:
+        # HTML('Further information on weights is available in <b>Part 6</b> of CSES Module 4. <br><a href=\"#\" target=\"_blank\">Open doc</a>')
+        choiceValues = c("no_weight", "weight_demographic", "weight_sample"),
+        choiceNames  = list(
+          info_badge("Unweighted", "No weights applied. Raw proportions/percentages.",
+                     "Unweighted"),
+          info_badge("Demographic weight", "Post-stratification targets.",
+                     "Demographic weight"),
+          info_badge("Sample weight", "Design/selection probability weights.",
+                     "Sample weight")
+        ),
+        selected = "no_weight"),
+      # CSS: fixes a formatting issue with checkboxGroupInput() below and
+      # sizes/positions the Shiny notification box
+      tags$head(
+        tags$style(
+          HTML("
+          .checkbox-inline {
+                    margin-left: 0px;
+                    margin-right: 10px;
+          }
+         .checkbox-inline+.checkbox-inline {
+                    margin-left: 0px;
+                    margin-right: 10px;
+         }
+    .shiny-notification {
+      width: 615px !important; /* max width */
+      max-height: 140px; /* max height */
+      word-wrap: break-word;
+      white-space: normal;
+      overflow-y: auto; /* scrollbar */
+      right: 330px !important; /* shift away from right edge */
+      box-sizing: border-box;
+      font-size: 14px;
+    }"))),
+      # Custom message handler: when the server sends 'clickGenerateButton',
+      # the hidden "Generate" button (#go) is clicked
+      tags$script(HTML("
+      Shiny.addCustomMessageHandler('clickGenerateButton', function(message) {
+    $('#go').click();
+  });
+")),
+      # Collapses the slider's small grid tick marks (height 0)
+      tags$style(type = "text/css", ".irs-grid-pol.small {height: 0px;}"),
+      # White popover styling
+      tags$style(HTML("
+  .popover {
+    --bs-popover-bg: #ffffff;
+    --bs-popover-border-color: #dddddd;
+    --bs-popover-header-bg: #ffffff;
+    --bs-popover-header-color: #212529;
+    --bs-popover-body-color: #212529;
+    border-color: #dddddd;
+  }
+  .popover .popover-header,
+  .popover .popover-body {
+    background-color: #ffffff;
+    color: #212529;
+  }
+")),
+      # Hover-driven popovers: on DOMContentLoaded each popover element has
+      # its data-toggle attribute renamed to data-bs-toggle, gets a Bootstrap
+      # popover instance with a manual trigger, opens on mouseenter, closes
+      # 150 ms after the pointer leaves the icon or the popover, and is
+      # auto-dismissed after 10 s. Clicks are suppressed.
+      tags$script(HTML("
+(function() {
+  function upgradeDataAttr(el){
+  // Force manual disable
+    if (el.getAttribute('data-toggle') === 'popover') {
+      el.setAttribute('data-bs-toggle','popover');
+      el.removeAttribute('data-toggle');
+    }
+  }
+  function getPopover(el){
+    // Force manual trigger so we fully control hover behavior
+    return bootstrap.Popover.getOrCreateInstance(el, {
+      container: 'body',
+      trigger: 'manual',
+      html: true, sanitize: false
+    });
+  }
+  function addHoverBehavior(el){
+    var timer = null;
+    var inst  = getPopover(el);
+    function startHide(delay){
+      if (timer) clearTimeout(timer);
+      timer = setTimeout(function(){
+        inst.hide();
+      }, delay);
+    }
+    function cancelHide(){
+      if (timer) { clearTimeout(timer); timer = null; }
+    }
+    // Show on hover
+    el.addEventListener('mouseenter', function(){
+      cancelHide();
+      inst.show();
+      // Auto-dismiss after 10s (unless user is hovering the popover)
+      startHide(10000);
+    });
+    // Hide shortly after leaving the icon (unless pointer is on the popover)
+    el.addEventListener('mouseleave', function(){
+      // small delay to allow moving into the popover
+      setTimeout(function(){
+        var pop = document.getElementById(el.getAttribute('aria-describedby'));
+        if (!pop || !pop.matches(':hover')) inst.hide();
+      }, 150);
+    });
+    // Keep open while hovering the popover; hide when leaving it
+    el.addEventListener('shown.bs.popover', function(){
+      var pop = document.getElementById(el.getAttribute('aria-describedby'));
+      if (!pop) return;
+      pop.addEventListener('mouseenter', cancelHide);
+      pop.addEventListener('mouseleave', function(){
+        startHide(150);  // quick close after leaving the box
+      });
+    });
+    // Prevent click toggling from fighting our hover logic
+    el.addEventListener('click', function(e){ e.preventDefault(); });
+  }
+  document.addEventListener('DOMContentLoaded', function(){
+    document.querySelectorAll('[data-bs-toggle=\"popover\"], [data-toggle=\"popover\"]').forEach(function(el){
+      upgradeDataAttr(el);
+      getPopover(el);       // ensure BS5 instance exists
+      addHoverBehavior(el); // wire hover behavior + auto-dismiss
+    });
+  });
+})();
+")),
+      # Show the recode slider on the Time Series, Cross Country, World Map
+      # and Breakdown tabs (not on the Histogram tab)
+      conditionalPanel(
+        'input.tabs == "Time Series" |
+        input.tabs == "Cross Country" |
+        input.tabs == "World Map" |
+        input.tabs == "Breakdown"',
+        uiOutput("sliderUI"),
+        # Mean Value toggle (disabled)
+       # checkboxInput("use_mean", "Mean value", FALSE),
+      ),
+      # Breakdown tab only: optional secondary variable and the demographic
+      # variables to split by
+      conditionalPanel(
+        'input.tabs == "Breakdown"',
+        selectInput("variable_sec",
+                    label = tagList(
+          info_badge("Subgroup for analysis",
+                    HTML("Optionally split the Breakdown plot by another subgroup from the dataset.
+                 Select <b>None</b> to disable."), "Secondary Variable")),
+                    c("None" = "None",
+                      labs_sec[order(names(labs_sec))])),
+        checkboxGroupInput("demog", "Demographic Variables",
+                           c("Gender" = "gendermc",
+                             "Age" = "age",
+                             "Income" = "wealth",
+                             "Education" = "edre",
+                             "Urban/Rural" = "ur"),
+                           selected = c("gendermc", "age", "edre"),
+                           inline = TRUE)),
+      # "Generate" button kept in the page but hidden (display: none); it is
+      # clicked programmatically through the 'clickGenerateButton' handler
+      #actionButton("go", "Generate")
+      tags$div(
+        style = "display: none;",
+        actionButton("go", "Generate"))),
+    # Main panel for displaying outputs ----
+    # # -----------------------------------------------------------------------
+    mainPanel(
+      # Output: caption, question wording and response options as text ----
+      h3(textOutput("caption")),
+      h5(textOutput("wording")),
+      h5(textOutput("response")),
+      tabsetPanel(id = "tabs",
+                  tabPanel("Histogram", plotOutput("hist")),
+                  tabPanel("Time Series", plotOutput("ts")),
+                  tabPanel("Cross Country", plotOutput("cc")),
+                  tabPanel("Breakdown", plotOutput("mover")),
+                  tabPanel("World Map", plotOutput("map"))),
+      br(),
+      fluidRow(column(12,
+                      tags$div(style = "margin-top:-15px"),
+                      downloadButton(outputId = "downloadPlot", label = "Download Figure"),
+                      downloadButton(outputId = "downloadTable", label = "Download Table"),
+                      tags$div(style = "height:10px"),
+                      uiOutput("ns_card"),
+                      #uiOutput("missing_warning_card"),
+        )
+      )
+    )
+  )
+)
+# # -----------------------------------------------------------------------
+# # -----------------------------------------------------------------------
+# # -----------------------------------------------------------------------
+# # -----------------------------------------------------------------------
+# Define SERVER logic
+# # -----------------------------------------------------------------------
+# The server function will be called when each client (browser) loads the app.
+server <- function(input, output, session) {
+  # Warn when the selected outcome or weight is not a column of the data.
+  observe({
+    # Both inputs are needed: a NULL weight would make the membership test
+    # below zero-length and `if` would fail on it.
+    req(input$variable, input$weight_type)
+    if (!input$variable %in% names(cses_shiny_data)) {
+      showNotification("Selected variable not found in data!", type = "error")
+    }
+    if (!input$weight_type %in% names(cses_shiny_data)) {
+      showNotification("Selected weight column not found!", type = "error")
+    }
+  })
+  # Once module, countries and years all have a selection, ask the browser to
+  # click the hidden "go" button so the plots are generated
+  observe({
+    selection_incomplete <- is.null(input$module) ||
+      is.null(input$pais) ||
+      is.null(input$wave)
+    if (!selection_incomplete) {
+      isolate(session$sendCustomMessage("clickGenerateButton", list()))
+    }
+  })
+  # Warn when more than three demographic variables are ticked for the breakdown
+   observeEvent(input$demog, {
+     too_many <- length(input$demog) > 3
+     if (too_many) {
+       showNotification(
+         HTML("You should only select a maximum of 3 demographic variables to plot."),
+         type = "warning"
+       )
+     }
+   })
+  # MAKE IT REACTIVE
+  # # -----------------------------------------------------------------------
+  # Thin reactive accessors around the inputs
+  formulaText <- reactive(paste(input$variable))
+  outcome <- reactive(input$variable)
+  wave <- reactive(input$wave)
+  # Code and short label of the selected outcome, looked up in vars_labels
+  outcome_code <- reactive({
+    hit <- which(vars_labels$column_name == paste(outcome()))
+    vars_labels$column_name[hit]
+  })
+  outcome_lab <- reactive({
+    hit <- which(vars_labels$column_name == paste(outcome()))
+    vars_labels$question_short_en[hit]
+  })
+  # Secondary (breakdown) variable and its short label
+  variable_sec <- reactive(input$variable_sec)
+  variable_sec_lab <- reactive({
+    hit <- which(vars_labels$column_name == paste(variable_sec()))
+    vars_labels$question_short_en[hit]
+  })
+  # Current default range of the recode slider
+  sliderParams <- reactiveValues(valuex = c(1, 1))
+  # Rows of the dataset that belong to the selected module(s)
+  # # -----------------------------------------------------------------------
+  filtered_data <- reactive({
+    req(input$module)
+    dplyr::filter(cses_shiny_data, IMD1008_MOD %in% input$module)
+  })
+# Whenever the module-filtered data changes, offer only the waves present in
+# the selected module(s) in the year picker and preselect all of them.
+# NOTE(review): the observer on input$module below also updates the "wave"
+# picker; confirm which of the two updates is meant to win.
+  observeEvent(filtered_data(), {
+    wave_choices <- sort(unique(filtered_data()$wave))
+    updatePickerInput(
+      session = session,
+      inputId = "wave",
+      choices = wave_choices,
+      selected = wave_choices  # you can leave this empty if no preselection
+    )
+# OLD CODE THAT WOULD FORCE COUNTRY PRESELECTION; DISABLED BECAUSE IT BREAKS
+# THE APP WITH THE FULL DATASET
+#    pais_choices <- sort(unique(filtered_data()$pais))
+#    updatePickerInput(
+#      session = session,
+#      inputId = "pais",
+#      choices = pais_choices,
+#      selected = pais_choices
+#    )
+})
+  # Every wave / country in the full dataset; used as the fixed list of choices
+  all_waves  <- sort(unique(cses_shiny_data$wave))
+  all_paises <- sort(unique(cses_shiny_data$pais))
+  # On a module change, keep all waves and countries listed but grey out and
+  # disable those absent from the selected module(s); the valid ones are
+  # selected automatically.
+  observeEvent(input$module, {
+    req(input$module)
+    module_rows <- dplyr::filter(cses_shiny_data, IMD1008_MOD %in% input$module)
+    valid_waves  <- sort(unique(module_rows$wave))
+    valid_paises <- sort(unique(module_rows$pais))
+    # Per-choice options: disabled flag plus grey text for unavailable entries
+    grey_out <- function(all_values, valid_values) {
+      unavailable <- !(all_values %in% valid_values)
+      list(
+        disabled = unavailable,
+        style    = ifelse(unavailable, "color:#999;", "")
+      )
+    }
+    shinyWidgets::updatePickerInput(
+      session, "wave",
+      choices = all_waves,
+      selected = valid_waves,
+      choicesOpt = grey_out(all_waves, valid_waves)
+    )
+    shinyWidgets::updatePickerInput(
+      session, "pais",
+      choices = all_paises,
+      selected = valid_paises,
+      choicesOpt = grey_out(all_paises, valid_paises)
+    )
+  })
+# Set default recode slider values:
+# # -----------------------------------------------------------------------
+# 2-point: 1-1
+# 3-point: 3-3
+# 4-point: 1-2
+# 5-point: 4-5
+# 6-point: 3-3
+# 7-point: 5-7
+# 10-point: 8-10
+# ALL OTHER: MEAN
+# UPDATE SLIDER DEFAULTS AND MEAN BEHAVIOR
+# -----------------------------------------------------------------------
+# Recomputes the default recode range when the outcome (or the "use mean"
+# toggle) changes, stores it in sliderParams$valuex and pushes it to the
+# "recode" slider.
+observeEvent({
+  list(input$variable, input$use_mean)
+}, {
+  req(input$variable)
+  # compute numeric vector safely
+  xvals <- suppressWarnings(as.numeric(cses_shiny_data[[formulaText()]]))
+  # An unknown column or one without any numeric value has no usable scale:
+  # max() would return -Inf and the mean NaN, so leave the slider untouched.
+  req(any(!is.na(xvals)))
+  maxval <- max(xvals, na.rm = TRUE)
+  mean_val <- mean(xvals, na.rm = TRUE)
+  # --- DEFAULT RECODE RANGES, keyed by the scale maximum ---
+  default_ranges <- list(
+    "1"  = c(1, 1),
+    "2"  = c(1, 1),
+    "3"  = c(3, 3),
+    "4"  = c(1, 2),
+    "5"  = c(4, 5),
+    "6"  = c(3, 3),
+    "7"  = c(5, 7),
+    "10" = c(8, 10)
+  )
+  preset <- default_ranges[[as.character(maxval)]]
+  # Any other maximum, or an explicit "use mean value" request, falls back
+  # to the mean of the variable.
+  if (is.null(preset) || isTRUE(input$use_mean)) {
+    sliderParams$valuex <- c(mean_val, mean_val)
+  } else {
+    sliderParams$valuex <- preset
+  }
+  # force slider update
+  updateSliderInput(
+    session,
+    inputId = "recode",
+    value = sliderParams$valuex
+  )
+})
+# RECODE SLIDER
+# # -----------------------------------------------------------------------
+# Recode slider spanning the observed range of the selected outcome, with the
+# current default range preselected.
+output$sliderUI <- renderUI({
+  outcome_values <- as.numeric(cses_shiny_data[[formulaText()]])
+  slider_label <- tagList(
+    info_badge(
+      "Which values do you want to graph?",
+      HTML("Please select which outcome values to be displayed."),
+      "Which values do you want to graph?"
+    )
+  )
+  sliderInput(
+    inputId = "recode",
+    label = slider_label,
+    min = min(outcome_values, na.rm = TRUE),
+    max = max(outcome_values, na.rm = TRUE),
+    value = sliderParams$valuex,
+    step = 1
+  )
+})
+# Data restricted to the selected years and countries; recomputed when the
+# "go" button fires (and once at start-up, since NULL events are not ignored)
+dff <- eventReactive(input$go, {
+  cses_shiny_data %>%
+    dplyr::filter(
+      as_factor(wave) %in% input$wave, # year
+      pais_nam %in% input$pais         # country
+    )
+}, ignoreNULL = FALSE)
+# Short caption of the selected outcome variable
+cap <- renderText({
+  is_selected <- vars_labels$column_name == formulaText()
+  vars_labels$question_short_en[which(is_selected)]
+})
+output$caption <- renderText(cap())
+# Upper-cased variable code followed by the full question wording
+word <- renderText({
+  var_code <- vars_labels$column_name[which(vars_labels$column_name == formulaText())]
+  wording <- vars_labels$question_en[which(vars_labels$column_name == formulaText())]
+  paste0(toupper(var_code), ". ", wording)
+})
+output$wording <- renderText(word())
+# Response options of the selected outcome variable
+resp <- renderText({
+  is_selected <- vars_labels$column_name == formulaText()
+  vars_labels$responses_en_rec[which(is_selected)]
+})
+output$response <- renderText(resp())
+# Response options of the secondary (breakdown) variable
+resp_sec <- renderText({
+  is_selected <- vars_labels$column_name == input$variable_sec
+  vars_labels$responses_en_rec[which(is_selected)]
+})
+output$response_sec <- renderText(resp_sec())
+# Text describing the recode value or range picked on the slider
+slider_values <- renderText({
+  bounds <- input$recode
+  if (bounds[1] != bounds[2]) {
+    paste0("(range: ", paste(bounds, collapse = " to "), ")")
+  } else {
+    paste0("(value: ", unique(bounds), ")")
+  }
+})
+output$selected_values <- renderText(slider_values())
+# Toggle recode slider
+# # -----------------------------------------------------------------------
+# The recode slider is enabled unless the "use mean" option is switched on
+observe({
+  shinyjs::toggleState("recode", condition = !isTRUE(input$use_mean))
+})
+# # -----------------------------------------------------------------------
+# N-SIZE CARD
+# # -----------------------------------------------------------------------
+# Sample-size card: the total N of the current selection followed by one
+# collapsible <details> section per wave, listing the N of every country
+# with non-missing data on the selected outcome.
+output$ns_card <- renderUI({
+  req(dff(), outcome(), input$wave, input$pais)
+  ns <- get_sample_counts(
+    data = dff(),
+    outcome_var = outcome(),
+    wave_var = "wave",
+    country_var = "pais_nam",
+    selected_waves = as.character(input$wave),
+    selected_countries = as.character(input$pais)
+  )
+  # With no non-missing observations, show a short note instead of the card
+  if (is.null(ns$overall) || ns$overall == 0) {
+    return(tags$div(
+      style = "border:2px solid #17a2b8; border-radius:8px; padding:14px; background:#e9f7ff; margin-bottom:20px;",
+      HTML(paste0("ℹ️ <b>Ns</b> for <b>", outcome(), "</b>: No non-missing observations in the current selection."))
+    ))
+  }
+  # get_sample_counts() returns per_country_wave with columns pais, wave, n
+  pCW <- ns$per_country_wave
+  # Zero-count rows are hidden; set to TRUE to list them in grey
+  show_zeros <- FALSE
+  # Sort waves numerically when every value parses as a number, otherwise
+  # fall back to the default sort order
+  waves <- unique(pCW$wave)
+  wave_num <- suppressWarnings(as.numeric(as.character(waves)))
+  waves <- if (!anyNA(wave_num)) waves[order(wave_num)] else sort(waves)
+  # Lookup of the total N per wave, keyed by the wave as a string
+  per_wave_tbl <- ns$per_wave |>
+    dplyr::mutate(wave_chr = as.character(wave)) |>
+    dplyr::select(wave_chr, n)
+  # Build one <details> block per wave
+  blocks <- lapply(seq_along(waves), function(i) {
+    w_chr <- as.character(waves[i])
+    wt <- per_wave_tbl$n[match(w_chr, per_wave_tbl$wave_chr)]
+    if (is.na(wt)) wt <- 0
+    rows <- dplyr::filter(pCW, as.character(wave) == w_chr)
+    if (!show_zeros) rows <- dplyr::filter(rows, n > 0)
+    rows <- dplyr::arrange(rows, dplyr::desc(n), .by_group = FALSE)
+    items <- lapply(seq_len(nrow(rows)), function(j) {
+      n_j <- format(rows$n[j], big.mark = ",")
+      li_style <- if (isTRUE(rows$n[j] == 0)) "color:#6c757d;" else NULL
+      tags$li(
+        tags$span(HTML(paste0("<b>", rows$pais[j], "</b>: N=", n_j))),
+        style = li_style
+      )
+    })
+    tags$details(
+      # Only the first wave starts expanded. `open` is a boolean HTML
+      # attribute: its mere presence opens the block, so a FALSE value must
+      # not be written out. NA emits the bare attribute, NULL omits it.
+      open = if (i == 1) NA else NULL,
+      class = "ns-year",
+      tags$summary(
+        HTML(paste0("<b>", w_chr, "</b> — Total N=", format(wt, big.mark=",")))
+      ),
+      tags$ul(items)
+    )
+  })
+  tags$div(
+    style = "border:2px solid #17a2b8;
+      border-radius:8px;
+      padding:14px;
+      background:#e9f7ff;
+      margin-bottom:20px;
+      max-height:180px;
+      overflow-y:auto;",
+    # Title + grand total
+    tags$div(
+      HTML(paste0(
+        "📊 <b>Sample sizes</b> (non-missing <b>", outcome(), "</b>)<br>",
+        "<b>Total across selection:</b> ", format(ns$overall, big.mark = ",")
+      )),
+      style = "margin-bottom:6px;"
+    ),
+    tags$hr(style="margin:8px 0;"),
+    # Small CSS polish for the dropdowns
+    tags$style(HTML("
+      details.ns-year { margin-bottom: 8px; }
+      details > summary { cursor: pointer; list-style: none; }
+      details > summary::-webkit-details-marker { display: none; }
+    ")),
+    blocks
+  )
+})
+# -----------------------------------------------------------------------
+# SOURCE INFO WITH ACTUAL DATA AVAILABILITY (not just user selections)
+# -----------------------------------------------------------------------
+# Figure caption naming the module(s), years and countries that actually
+# have data on the selected outcome, followed by the question wording and
+# response options. Returns a single string.
+source_info_both <- reactive({
+  req(dff(), outcome(), input$wave, input$pais, input$module)
+  ns <- get_sample_counts(
+    data = dff(),
+    outcome_var = outcome(),
+    wave_var = "wave",
+    country_var = "pais_nam",
+    selected_waves = input$wave,
+    selected_countries = input$pais
+  )
+  # Country-wave pairs with at least one non-missing observation
+  valid_combos <- ns$per_country_wave %>%
+    dplyr::filter(n > 0)
+  valid_waves <- sort(unique(valid_combos$wave))
+  valid_countries <- sort(unique(valid_combos$pais))
+  # Several modules may be selected at once; collapse them so the caption
+  # stays one string instead of one caption per module.
+  selected_module <- paste(input$module, collapse = ", ")
+  # Abbreviations of these countries, in the order of valid_countries
+  pais_abbr <- cses_shiny_data %>%
+    dplyr::filter(pais_nam %in% valid_countries) %>%
+    distinct(pais_nam, pais_lab) %>%
+    arrange(match(pais_nam, valid_countries)) %>%
+    pull(pais_lab)
+  paste0(
+    "Source: CSES Data Playground\n\n",
+    str_wrap(paste0("CSES ", selected_module,
+      " - Years: ", paste(valid_waves, collapse = ", "),
+      ". Countries: ", paste(pais_abbr, collapse = ", ")
+    ), 130),
+    "\n\n",
+    str_wrap(paste0(word(), " ", resp()), 130)
+  )
+})
+# -----------------------------------------------------------------------
+# Figure caption listing the countries that have data on the selected
+# outcome, followed by the question wording and response options.
+source_info_pais <- reactive({
+  req(dff(), outcome(), input$wave, input$pais)
+  counts <- get_sample_counts(
+    data = dff(),
+    outcome_var = outcome(),
+    wave_var = "wave",
+    country_var = "pais_nam",
+    selected_waves = input$wave,
+    selected_countries = input$pais
+  )
+  with_data <- dplyr::filter(counts$per_country_wave, n > 0)
+  valid_countries <- sort(unique(with_data$pais))
+  # Abbreviations, ordered like valid_countries
+  abbr_tbl <- cses_shiny_data %>%
+    dplyr::filter(pais_nam %in% valid_countries) %>%
+    distinct(pais_nam, pais_lab)
+  abbr_tbl <- arrange(abbr_tbl, match(pais_nam, valid_countries))
+  country_line <- str_wrap(paste(pull(abbr_tbl, pais_lab), collapse = ", "), 130)
+  question_line <- str_wrap(paste0(word(), " ", resp()), 130)
+  paste0(
+    "Source: CSES Data Playground\n",
+    "Countries: ", country_line,
+    "\n\n",
+    question_line
+  )
+})
+# -----------------------------------------------------------------------
+# Figure caption naming the module(s) and the years that actually have data
+# on the selected outcome, followed by the question wording and response
+# options. Returns a single string.
+source_info_wave <- reactive({
+  req(dff(), outcome(), input$wave, input$pais, input$module)
+  ns <- get_sample_counts(
+    data = dff(),
+    outcome_var = outcome(),
+    wave_var = "wave",
+    country_var = "pais_nam",
+    selected_waves = input$wave,
+    selected_countries = input$pais
+  )
+  # Waves with at least one non-missing observation
+  valid_combos <- ns$per_country_wave %>%
+    dplyr::filter(n > 0)
+  valid_waves <- sort(unique(valid_combos$wave))
+  # Several modules may be selected at once; collapse them so the caption
+  # stays one string instead of one caption per module.
+  selected_module <- paste(input$module, collapse = ", ")
+  paste0(
+    "Source: CSES Data Playground\n", "CSES ", selected_module,
+    " - Years: ", str_wrap(paste(valid_waves, collapse = ", "), 130),
+    "\n\n",
+    str_wrap(paste0(word(), " ", resp()), 130)
+  )
+})
+# # -----------------------------------------------------------------------
+# PLOTS
+# # -----------------------------------------------------------------------
+# Histogram
+# # -----------------------------------------------------------------------
+# must break into data event, graph event, and renderPlot to get download to work
+  # Histogram data: weighted share (%) of each response category.
+  # Returns NULL when a required column is absent or the summary fails.
+  histd <- reactive({
+    req(dff(), input$variable, input$weight_type)
+    needed_cols <- c(input$variable, input$weight_type)
+    if (!all(needed_cols %in% names(dff()))) {
+      return(NULL)
+    }
+    tryCatch(
+      {
+        var_col <- sym(input$variable)
+        wt_col <- sym(input$weight_type)
+        weighted_totals <- dff() %>%
+          drop_na(!!var_col, !!wt_col) %>%
+          group_by(cat = haven::as_factor(!!var_col)) %>%
+          summarise(w = sum(!!wt_col, na.rm = TRUE))
+        mutate(
+          weighted_totals,
+          prop = w / sum(w) * 100,
+          proplabel = paste0(round(prop), "%"),
+          cat = str_wrap(as.character(cat), width = 25)
+        )
+      },
+      error = function(e) NULL
+    )
+  })
+  # Histogram plot object. histd() returns NULL when the summary could not
+  # be computed; show a message then instead of passing NULL to lapop_hist().
+  histg <- reactive({
+    hist_data <- histd()
+    validate(
+      need(!is.null(hist_data), "Error: no data available. Please verify that this question was asked in this country/year combination.")
+    )
+    # Leave headroom above the bars when any bar exceeds 90%
+    lapop_hist(hist_data,
+               ymax = if (any(hist_data$prop > 90)) 110 else 100,
+               source_info = "Source: CSES Data Playground")
+  })
+  output$hist <- renderPlot({
+    req(dff(), nrow(dff()) > 0, input$variable, input$variable %in% names(dff()))
+    histg()
+  })
+# Time-series
+# # -----------------------------------------------------------------------
+  # Time-series data: per wave, the weighted % of respondents whose outcome
+  # lies inside the recode range, with its confidence interval.
+  tsd <- reactive({
+    dta_ts <- Error({
+      outcome_col <- sym(outcome())
+      weight_col <- sym(input$weight_type)
+      dff() %>%
+        drop_na(!!outcome_col, !!weight_col) %>%
+        mutate(outcome_rec = case_when(
+          !!outcome_col >= input$recode[1] & !!outcome_col <= input$recode[2] ~ 100,
+          TRUE ~ 0
+        )) %>%
+        group_by(wave = as.character(as_factor(wave))) %>%
+        summarise_at(
+          vars("outcome_rec"),
+          list(~weighted.ttest.ci(., !!weight_col))
+        ) %>%
+        unnest_wider(col = "outcome_rec") %>%
+        mutate(proplabel = paste0(round(prop), "%")) %>%
+        dplyr::filter(prop != 0)
+    })
+    validate(
+      need(dta_ts, "Error: no data available. Please verify that this question was asked in this country/year combination.")
+    )
+    # Align with the full list of waves, then keep only waves that have an
+    # estimate, so years outside the selection are excluded (the remaining
+    # years need not be sequential)
+    wave_frame <- data.frame(wave = as.character(waves_total), empty = 1)
+    aligned <- merge(dta_ts, wave_frame, by = "wave", all.y = TRUE)
+    dta_ts <- dplyr::filter(aligned, !is.na(prop))
+    omit_na_edges(dta_ts)
+  })
+  # Time-series plot object. High estimates get a taller axis (110 when any
+  # value exceeds 85) and a smaller label offset (-1.1 when any exceeds 80).
+  tsg <- reactive({
+    ts_tbl <- tsd()
+    y_top <- if (any(ts_tbl$prop > 85, na.rm = TRUE)) 110 else 100
+    label_shift <- if (any(ts_tbl$prop > 80, na.rm = TRUE)) -1.1 else -1.5
+    lapop_ts(
+      ts_tbl,
+      ymax = y_top,
+      label_vjust = label_shift,
+      source_info = "Source: CSES Data Playground",
+      subtitle = "% in selected category",
+      ci_type = "errorbar"
+    )
+  })
+  # Render the time-series plot produced by tsg().
+  output$ts <- renderPlot({
+    tsg()
+  })
+# Cross Country
+# # -----------------------------------------------------------------------
+# Variables that ccd() and ccg() summarise as a per-country mean rather than
+# as a weighted percentage.
+continuous_vars <- c(
+  "IMD3001_TS",
+  "IMD5054_2",
+  "IMD5057_1",
+  "IMD5035",
+  "IMD5056_2",
+  "IMD5055_1",
+  "IMD5053_1",
+  "IMD5052_2"
+)
+  # Cross-country table with one row per country (vallabel).
+  #  - Variables listed in continuous_vars: unweighted mean of the values that
+  #    fall inside the recode range; lb/ub are set to NA.
+  #  - All other variables: weighted estimate of the share of respondents
+  #    inside the recode range, as returned by weighted.ttest.ci().
+  ccd <- reactive({
+    var_sel <- outcome()
+    rec_min <- input$recode[1]
+    rec_max <- input$recode[2]
+    if (!(var_sel %in% continuous_vars)) {
+      # Individual-level variable: 100 inside the selected range, 0 outside
+      dta_cc <- dff() %>%
+        drop_na(!!sym(var_sel), !!sym(input$weight_type)) %>%
+        mutate(
+          outcome_rec = case_when(
+            .data[[var_sel]] >= rec_min & .data[[var_sel]] <= rec_max ~ 100,
+            TRUE ~ 0
+          )
+        ) %>%
+        group_by(vallabel = pais_lab) %>%
+        summarise_at(
+          vars("outcome_rec"),
+          list(~weighted.ttest.ci(., !!sym(input$weight_type)))
+        ) %>%
+        unnest_wider(col = "outcome_rec") %>%
+        filter(prop != 0) %>%
+        mutate(proplabel = paste0(round(prop), "%"))
+    } else {
+      # Macro-level variable: values outside the range become NA before averaging
+      dta_cc <- dff() %>%
+        mutate(tmp_val = as.numeric(.data[[var_sel]])) %>%
+        mutate(
+          tmp_val = ifelse(tmp_val >= rec_min & tmp_val <= rec_max,
+                           tmp_val, NA_real_)
+        ) %>%
+        group_by(vallabel = pais_lab) %>%
+        summarise(prop = mean(tmp_val, na.rm = TRUE), .groups = "drop") %>%
+        filter(!is.na(prop)) %>%
+        mutate(
+          lb = NA_real_,
+          ub = NA_real_,
+          proplabel = ifelse(is.na(prop), "", sprintf("%.2f", prop))
+        )
+    }
+    validate(
+      need(nrow(dta_cc) > 0,
+           "Error: no data available. Please verify that this question was asked in this country/year combination.")
+    )
+    dta_cc
+  })
+  # Cross-country plot object.
+  #  - Continuous macro variables (continuous_vars) show country means, so the
+  #    axis ceiling is derived from the data instead of a fixed 6: it stays at
+  #    6 for small values and grows to 110% of the largest mean otherwise
+  #    (e.g. IMD5035 is documented as ranging from 1 to 900).
+  #  - Percentage variables keep the 100 / 110 ceiling.
+  ccg <- reactive({
+    cc_tbl <- ccd()
+    if (outcome() %in% continuous_vars) {
+      cc_subtitle <- "Countries (within selected range)"
+      # ccd() already drops NA means and validates that rows remain
+      cc_ymax <- max(6, ceiling(max(cc_tbl$prop, na.rm = TRUE) * 1.1))
+    } else {
+      cc_subtitle <- "% in selected category"
+      cc_ymax <- if (any(cc_tbl$prop > 90, na.rm = TRUE)) 110 else 100
+    }
+    lapop_cc(
+      cc_tbl,
+      sort = "hi-lo",
+      subtitle = cc_subtitle,
+      ymax = cc_ymax,
+      source_info = "Source: CSES Data Playground"
+    )
+  })
+  # Render the cross-country plot produced by ccg().
+  output$cc <- renderPlot({
+    cc_plot <- ccg()
+    cc_plot
+  })
+# World Map
+# # -----------------------------------------------------------------------
+  # World-map table with one row per country (pais_lab) and a `value` column.
+  #  - Variables in continuous_vars: unweighted mean of the values inside the
+  #    recode range.
+  #  - All other variables: weighted estimate of the share inside the recode
+  #    range (the `prop` field returned by weighted.ttest.ci(), renamed).
+  # Only one module may be selected at a time; otherwise a validation message
+  # is shown instead of the map.
+  mapd <- reactive({
+    var_sel <- outcome()
+    rec_min <- input$recode[1]
+    rec_max <- input$recode[2]
+    req(input$module)
+    validate(
+      need(
+        length(input$module) == 1,
+        "Please select only ONE module to display a map."
+      )
+    )
+    # continuous_vars is the server-level vector shared with ccd()/ccg(); the
+    # local duplicate that used to shadow it here was removed.
+    if (var_sel %in% continuous_vars) {
+      # CASE 1: continuous macro variable (mean values)
+      dta_map <- dff() %>%
+        mutate(
+          tmp_val = as.numeric(.data[[var_sel]]),
+          tmp_val = ifelse(tmp_val >= rec_min & tmp_val <= rec_max,
+                           tmp_val, NA_real_)
+        ) %>%
+        group_by(pais_lab) %>%
+        summarise(
+          value = mean(tmp_val, na.rm = TRUE),
+          .groups = "drop"
+        ) %>%
+        filter(!is.na(value))
+    } else {
+      # CASE 2: categorical / proportion variables
+      dta_map <- dff() %>%
+        # drop_na() selects columns with tidyselect, where `.data` is
+        # deprecated; all_of() is the supported way to pass column names
+        drop_na(all_of(c(var_sel, input$weight_type))) %>%
+        mutate(outcome_rec = case_when(
+          .data[[var_sel]] >= rec_min & .data[[var_sel]] <= rec_max ~ 100,
+          TRUE ~ 0
+        )) %>%
+        group_by(pais_lab) %>%
+        summarise_at(
+          vars("outcome_rec"),
+          list(~weighted.ttest.ci(., .data[[input$weight_type]]))
+        ) %>%
+        unnest_wider(col = "outcome_rec") %>%
+        filter(prop > 0) %>%
+        rename(value = prop)
+    }
+    validate(
+      need(nrow(dta_map) > 0,
+           "Error: no map data available for this country/year/variable selection.")
+    )
+    dta_map
+  })
+  # World-map plot object built from the mapd() table.
+  mapg <- reactive({
+    map_tbl <- mapd()
+    lapop_map(map_tbl,
+              survey = "CSES",
+              source_info = "\nSource: CSES Data Playground")
+  })
+  # Render the world map produced by mapg().
+  output$map <- renderPlot({
+    map_plot <- mapg()
+    map_plot
+  })
+# Breakdown
+# # -----------------------------------------------------------------------
+# Use function for each demographic breakdown variable
+  # Breakdown of the outcome by the user-chosen secondary variable, refreshed
+  # when input$go fires. Yields NULL when no secondary variable is chosen or
+  # when it equals the outcome (an error notification is shown in that case).
+  secdf <- eventReactive(input$go, {
+    if (input$variable_sec == "None") {
+      return(NULL)
+    }
+    if (variable_sec() == outcome()) {
+      showNotification(HTML("You cannot break the outcome variable by itself."), type = "error")
+      return(NULL)
+    }
+    wrapped_label <- stringr::str_wrap(variable_sec_lab(), width = 25)
+    process_data(
+      data = dff(),
+      outcome_var = outcome(),
+      recode_range = input$recode,
+      group_var = input$variable_sec,
+      weight_var = input$weight_type,
+      var_label = wrapped_label
+    )
+  }, ignoreNULL = FALSE)
+  # Breakdown of the outcome by gender, refreshed when input$go fires;
+  # NULL unless "gendermc" is ticked in input$demog.
+  genderdf <- eventReactive(input$go, {
+    if (!("gendermc" %in% input$demog)) {
+      return(NULL)
+    }
+    process_data(
+      data = dff(),
+      outcome_var = outcome(),
+      recode_range = input$recode,
+      group_var = "gendermc",
+      weight_var = input$weight_type,
+      var_label = "Gender"
+    )
+  }, ignoreNULL = FALSE)
+  # Breakdown of the outcome by wealth (column wealthf), refreshed when
+  # input$go fires; NULL unless "wealth" is ticked in input$demog.
+  wealthdf <- eventReactive(input$go, {
+    if (!("wealth" %in% input$demog)) {
+      return(NULL)
+    }
+    process_data(
+      data = dff(),
+      outcome_var = outcome(),
+      recode_range = input$recode,
+      group_var = "wealthf",
+      weight_var = input$weight_type,
+      var_label = "Wealth"
+    )
+  }, ignoreNULL = FALSE)
+  # Breakdown of the outcome by education (column edrerf), refreshed when
+  # input$go fires; NULL unless "edre" is ticked in input$demog.
+  eddf <- eventReactive(input$go, {
+    if (!("edre" %in% input$demog)) {
+      return(NULL)
+    }
+    process_data(
+      data = dff(),
+      outcome_var = outcome(),
+      recode_range = input$recode,
+      group_var = "edrerf",
+      weight_var = input$weight_type,
+      var_label = "Education"
+    )
+  }, ignoreNULL = FALSE)
+  # Breakdown of the outcome by age, refreshed when input$go fires;
+  # NULL unless "age" is ticked in input$demog.
+  agedf <- eventReactive(input$go, {
+    if (!("age" %in% input$demog)) {
+      return(NULL)
+    }
+    process_data(
+      data = dff(),
+      outcome_var = outcome(),
+      recode_range = input$recode,
+      group_var = "age",
+      weight_var = input$weight_type,
+      var_label = "Age"
+    )
+  }, ignoreNULL = FALSE)
+  # Breakdown of the outcome by place of residence (column ur), refreshed
+  # when input$go fires; NULL unless "ur" is ticked in input$demog.
+  urdf <- eventReactive(input$go, {
+    if (!("ur" %in% input$demog)) {
+      return(NULL)
+    }
+    process_data(
+      data = dff(),
+      outcome_var = outcome(),
+      recode_range = input$recode,
+      group_var = "ur",
+      weight_var = input$weight_type,
+      var_label = "Place of\nResidence"
+    )
+  }, ignoreNULL = FALSE)
+  # Combine demographic data frames into one df
+  # Combined breakdown table: row-binds one process_data() result per selected
+  # grouping variable, in the order secondary variable, gender, age, wealth,
+  # education, place of residence. Groupings that are not selected contribute
+  # NULL, which rbind() drops. A validation message is shown when nothing
+  # usable comes back.
+  moverd <- reactive({
+    req(dff(), input$recode, input$weight_type)
+    # Single call site for process_data(). Arguments are passed by name (the
+    # same names used by the named calls elsewhere in this file), so the result
+    # does not depend on the positional order of its parameters.
+    breakdown <- function(group_var, var_label) {
+      process_data(
+        data = dff(),
+        outcome_var = outcome(),
+        recode_range = input$recode,
+        group_var = group_var,
+        weight_var = input$weight_type,
+        var_label = var_label
+      )
+    }
+    dta_mover <- Error(rbind(
+      if (input$variable_sec != "None" && input$variable_sec != outcome()) {
+        breakdown(input$variable_sec, str_wrap(variable_sec_lab(), width = 25))
+      },
+      if ("gendermc" %in% input$demog) {
+        breakdown("gendermc", "Gender")
+      },
+      if ("age" %in% input$demog) {
+        breakdown("age", "Age")
+      },
+      if ("wealth" %in% input$demog) {
+        breakdown("wealthf", "Wealth")
+      },
+      if ("edre" %in% input$demog) {
+        breakdown("edrerf", "Education")
+      },
+      if ("ur" %in% input$demog) {
+        breakdown("ur", "Place of\nResidence")
+      }
+    ))
+    validate(
+      need(dta_mover, "Error: no data available. Please verify that this question was asked in this country/year combination")
+    )
+    dta_mover$vallabel <- as.character(dta_mover$vallabel)
+    dta_mover
+  })
+  # Breakdown plot object. The axis ceiling steps up with the largest
+  # estimate: 119 above 90, 109 above 80, otherwise 100.
+  moverg <- reactive({
+    mover_tbl <- moverd()
+    y_top <- if (any(mover_tbl$prop > 90, na.rm = TRUE)) {
+      119
+    } else if (any(mover_tbl$prop > 80, na.rm = TRUE)) {
+      109
+    } else {
+      100
+    }
+    lapop_mover(
+      mover_tbl,
+      subtitle = "% in selected category",
+      ymax = y_top,
+      source_info = "Source: CSES Data Playground"
+    )
+  })
+  # Render the breakdown plot produced by moverg().
+  output$mover <- renderPlot({
+    moverg()
+  })
+# # -----------------------------------------------------------------------
+# DOWNLOAD SECTION
+# # -----------------------------------------------------------------------
+# Download Plot
+# # -----------------------------------------------------------------------
+  # Export the plot of the active tab through lapop_save().
+  #  - filename: "<plot type>_<outcome>_<weight label>.svg", where the plot type
+  #    is hist / ts / cc / map and any other tab falls back to "mover".
+  #  - content: rebuilds the plot with a main title and source note, saves it
+  #    to the path Shiny supplies, then shows a confirmation notification.
+  output$downloadPlot <- downloadHandler(
+    # Shiny calls filename() without arguments, so none are declared
+    filename = function() {
+      weight_suffix <- switch(input$weight_type, # Add weight type to plot export
+                              "no_weight" = "unweighted",
+                              "weight_demographic" = "demogweighted",
+                              "weight_sample" = "sampleweighted")
+      tab <- input$tabs
+      plot_prefix <- if (identical(tab, "Histogram")) {
+        "hist"
+      } else if (identical(tab, "Time Series")) {
+        "ts"
+      } else if (identical(tab, "Cross Country")) {
+        "cc"
+      } else if (identical(tab, "World Map")) {
+        "map"
+      } else {
+        "mover"
+      }
+      paste0(plot_prefix, "_", outcome(), "_", weight_suffix, ".svg")
+    },
+    content = function(file) {
+      tab <- input$tabs
+      title_text <- isolate(cap())
+      if (identical(tab, "Histogram")) {
+        hist_to_save <- lapop_hist(
+          histd(),
+          main_title = title_text,
+          subtitle = "% in selected category ",
+          ymax = if (any(histd()$prop > 90, na.rm = TRUE)) 110 else 100,
+          source_info = source_info_both()
+        )
+        lapop_save(hist_to_save, file)
+        showNotification(HTML("Histogram plot download complete ✓ "), type = "message")
+      } else if (identical(tab, "Time Series")) {
+        subtitle_text <- slider_values()
+        # NOTE(review): the on-screen plot (tsg) raises the axis above 85,
+        # this export above 88 - confirm which threshold is intended.
+        ts_to_save <- lapop_ts(
+          tsd(),
+          main_title = title_text,
+          subtitle = paste0("% in selected category ", subtitle_text),
+          ymax = if (any(tsd()$prop > 88, na.rm = TRUE)) 110 else 100,
+          label_vjust = if (any(tsd()$prop > 80, na.rm = TRUE)) -1.1 else -1.5,
+          source_info = source_info_pais()
+        )
+        lapop_save(ts_to_save, file)
+        showNotification(HTML("Time series plot download complete ✓ "), type = "message")
+      } else if (identical(tab, "Cross Country")) {
+        subtitle_text <- slider_values()
+        cc_tbl <- ccd()
+        # Continuous macro variables are country means, not percentages, so
+        # they get the same subtitle as the on-screen plot and an axis that
+        # fits the data instead of the 100 / 110 percentage ceiling.
+        if (outcome() %in% continuous_vars) {
+          cc_subtitle <- "Countries (within selected range)"
+          cc_ymax <- max(6, ceiling(max(cc_tbl$prop, na.rm = TRUE) * 1.1))
+        } else {
+          cc_subtitle <- paste0("% in selected category ", subtitle_text)
+          cc_ymax <- if (any(cc_tbl$prop > 90, na.rm = TRUE)) 110 else 100
+        }
+        cc_to_save <- lapop_cc(
+          cc_tbl,
+          sort = "hi-lo",
+          main_title = title_text,
+          subtitle = cc_subtitle,
+          ymax = cc_ymax,
+          label_angle = 90,
+          source_info = source_info_wave()
+        )
+        lapop_save(cc_to_save, file)
+        showNotification(HTML("Cross country plot download complete ✓ "), type = "message")
+      } else if (identical(tab, "World Map")) {
+        subtitle_text <- slider_values()
+        map_to_save <- lapop_map(
+          mapd(),
+          main_title = title_text,
+          subtitle = paste0("% in selected category ", subtitle_text),
+          source_info = paste0("\n", source_info_both()),
+          survey = "CSES"
+        )
+        lapop_save(map_to_save, file)
+        showNotification(HTML("Map plot download complete ✓ "), type = "message")
+      } else {
+        subtitle_text <- slider_values()
+        mover_to_save <- lapop_mover(
+          moverd(),
+          main_title = title_text,
+          subtitle = paste0("% in selected category ", subtitle_text),
+          ymax = if (any(moverd()$prop > 90, na.rm = TRUE)) {
+            119
+          } else if (any(moverd()$prop > 80, na.rm = TRUE)) {
+            109
+          } else {
+            100
+          },
+          source_info = source_info_both()
+        )
+        lapop_save(mover_to_save, file)
+        showNotification(HTML("Break down plot download complete ✓ "), type = "message")
+      }
+    }
+  )
+# DOWNLOAD TABLE
+ # -----------------------------------------------------------------------
+  # Export the data table behind the active tab as CSV.
+  #  - filename: "<plot type>_<outcome>_<weight label>.csv", where the plot type
+  #    is hist / ts / cc / map and any other tab falls back to "mover".
+  #  - content: writes the matching reactive table without row names, then
+  #    shows a confirmation notification.
+  output$downloadTable <- downloadHandler(
+    # Shiny calls filename() without arguments, so none are declared
+    filename = function() {
+      weight_suffix <- switch(input$weight_type, # Add weight type to file export
+                              "no_weight" = "unweighted",
+                              "weight_demographic" = "demogweighted",
+                              "weight_sample" = "sampleweighted")
+      tab <- input$tabs
+      table_prefix <- if (identical(tab, "Histogram")) {
+        "hist"
+      } else if (identical(tab, "Time Series")) {
+        "ts"
+      } else if (identical(tab, "Cross Country")) {
+        "cc"
+      } else if (identical(tab, "World Map")) {
+        "map"
+      } else {
+        "mover"
+      }
+      paste0(table_prefix, "_", outcome(), "_", weight_suffix, ".csv")
+    },
+    content = function(file) {
+      tab <- input$tabs
+      # Pick the table and the wording of the confirmation for the active tab
+      if (identical(tab, "Histogram")) {
+        export_tbl <- histd()
+        export_name <- "Histogram"
+      } else if (identical(tab, "Time Series")) {
+        export_tbl <- tsd()
+        export_name <- "Time series"
+      } else if (identical(tab, "Cross Country")) {
+        export_tbl <- ccd()
+        export_name <- "Cross country"
+      } else if (identical(tab, "World Map")) {
+        export_tbl <- mapd()
+        export_name <- "Map"
+      } else {
+        export_tbl <- moverd()
+        export_name <- "Break down"
+      }
+      # FALSE rather than F: F is an ordinary variable that can be reassigned
+      write.csv(export_tbl, file, row.names = FALSE)
+      showNotification(HTML(paste0(export_name, " file download complete ✓ ")),
+                       type = "message")
+    }
+  )
+}
+# RUN APP
+# # -----------------------------------------------------------------------
+shinyApp(ui = ui, server = server)
+# # -----------------------------------------------------------------------
+# END
+# # -----------------------------------------------------------------------

cses-shiny.Rproj ADDED Viewed

	@@ -0,0 +1,17 @@

+Version: 1.0
+ProjectId: 77d77540-4c5c-492a-b2c3-65b0f1499688
+RestoreWorkspace: Default
+SaveWorkspace: Default
+AlwaysSaveHistory: Default
+EnableCodeIndexing: Yes
+UseSpacesForTab: Yes
+NumSpacesForTab: 2
+Encoding: UTF-8
+RnwWeave: Sweave
+LaTeX: pdfLaTeX
+AutoAppendNewline: Yes
+StripTrailingWhitespace: Yes

cses_labs.rds ADDED Viewed

Binary file (864 Bytes). View file

cses_labs_sec.rds ADDED Viewed

Binary file (1.44 kB). View file

cses_shiny_data.rda ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e3cad18ac3c75feeb3b170223f2ba6e11bfa690c08bb3bfa53e1ed9379381692
+size 3058556

cses_shiny_data.rds ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:698677f42d76fca9de837613d8b303e192033d81f1db33fd1f30f011244ed906
+size 4950894

cses_variable_labels.csv ADDED Viewed

	@@ -0,0 +1,52 @@

+"column_name","question_short_en","category_short_en","display_en","question_en","responses_en","responses_en_rec"
+"IMD2001_2","Age of respondent (in categories)","Demographic Data","Demographic Data: AGE OF RESPONDENT (IN CATEGORIES) (IMD2001_2)","Age of respondent (in categories listed below).","(1) YOUNGEST - 24 YEARS (2) 25-34 YEARS (3) 35-44 YEARS (4) 45-54 YEARS (5) 55-64 YEARS (6) 65 - OLDEST","(1) Youngest - 24 years (2) 25-34 years (3) 35-44 years (4) 45-54 years (5) 55-64 years (6) 65 - oldest"
+"IMD2002","Gender","Demographic Data","Demographic Data: GENDER (IMD2002)","Gender of Respondent.","(1) MALE (2) FEMALE (3) OTHER","(1) Male (2) Female (3) Other"
+"IMD2003","Education","Demographic Data","Demographic Data: EDUCATION (IMD2003)","Education of Respondent.","(0) NONE (NO EDUCATION) / ILLITERATE (1) PRIMARY EDUCATION/LOWER SECONDARY EDUCATION (2) HIGHER SECONDARY EDUCATION (3) POST-SECONDARY (NON-UNIVERSITY) EDUCATION (4) UNIVERSITY EDUCATION","(0) None (no education) / illiterate (1) Primary education/lower secondary education (2) Higher secondary education (3) Post-secondary (non-university) Education (4) University education"
+"IMD2004","Marital status","Demographic Data","Demographic Data: MARITAL STATUS (IMD2004)","Respondent's marital or civil union status.","(1) MARRIED OR LIVING TOGETHER AS MARRIED (2) WIDOWED (3) DIVORCED OR SEPARATED (MARRIED BUT SEPARATED/NOT LIVING WITH LEGAL SPOUSE) (4) SINGLE, NEVER MARRIED (5) [SEE ELECTION STUDY NOTES]","(1) Married or living together as married (2) Widowed (3) Divorced or separated (married but separated/not living with legal spouse) (4) Single, never married (5) [see election study notes]"
+"IMD2005_1","Religious services attendance","Demographic Data","Demographic Data: RELIGIOUS SERVICES ATTENDANCE (IMD2005_1)","Religious denomination.","(1) NEVER (2) ONCE A YEAR (3) TWO TO ELEVEN TIMES A YEAR (4) ONCE A MONTH (5) TWO OR MORE TIMES A MONTH (6) ONCE A WEEK/MORE THAN ONCE A WEEK","(1) Never (2) Once a year (3) Two to eleven times a year (4) Once a month (5) Two or more times a month (6) Once a week/more than once a week"
+"IMD2005_2","Religiosity","Demographic Data","Demographic Data: RELIGIOSITY (IMD2005_2)","Religiosity.","(1) HAVE NO RELIGIOUS BELIEFS (2) NOT VERY RELIGIOUS (3) SOMEWHAT RELIGIOUS (4) VERY RELIGIOUS","(1) Have no religious beliefs (2) Not very religious (3) Somewhat religious (4) Very religious"
+"IMD2006","Household income","Demographic Data","Demographic Data: HOUSEHOLD INCOME (IMD2006)","Household income quintile appropriate to the respondent.","(1) LOWEST HOUSEHOLD INCOME QUINTILE (2) SECOND HOUSEHOLD INCOME QUINTILE (3) THIRD HOUSEHOLD INCOME QUINTILE (4) FOURTH HOUSEHOLD INCOME QUINTILE (5) HIGHEST HOUSEHOLD INCOME QUINTILE","(1) Lowest household income quintile (2) Second household income quintile (3) Third household income quintile (4) Fourth household income quintile (5) Highest household income quintile"
+"IMD2007","Rural or urban residence","Demographic Data","Demographic Data: RURAL OR URBAN RESIDENCE (IMD2007)","Rural/Urban Residence.","(1) RURAL AREA OR VILLAGE (2) SMALL OR MIDDLE-SIZED TOWN (3) SUBURBS OF LARGE TOWN OR CITY (4) LARGE TOWN OR CITY","(1) Rural area or village (2) Small or middle-sized town (3) Suburbs of large town or city (4) Large town or city"
+"IMD2014","Current employment status","Demographic Data","Demographic Data: CURRENT EMPLOYMENT STATUS (IMD2014)","Current employment status of respondent.","(0) EMPLOYED : NO HOURS SPECIFIED (1) EMPLOYED : FULL-TIME (32 OR MORE HOURS WEEKLY) (2) EMPLOYED : PART-TIME (15-32 HOURS WEEKLY) (3) EMPLOYED : LESS THAN 15 HOURS (4) HELPING FAMILY MEMBER (5) UNEMPLOYED (6) STUDENT, IN SCHOOL, IN VOCATIONAL TRAINING (7) RETIRED (8) HOMEMAKER, HOME DUTIES (9) PERMANENTLY DISABLED (10) OTHERS, NOT IN LABOR FORCE (11) ON TEMPORARY JOB LEAVE (MATERNITY LEAVE, SICK LEAVE, ETC.) (12) CIVIL / MILITARY SERVICE","(0) Employed : no hours specified (1) Employed : full-time (32 or more hours weekly) (2) Employed : part-time (15-32 hours weekly) (3) Employed : less than 15 hours (4) Helping family member (5) Unemployed (6) Student, in school, in vocational training (7) Retired (8) Homemaker, home duties (9) Permanently disabled (10) Others, not in labor force (11) On temporary job leave (maternity leave, sick leave, etc.) (12) Civil / military service"
+"IMD2016","Socio economic status","Demographic Data","Demographic Data: SOCIO ECONOMIC STATUS (IMD2016)","Respondent's socio-economic status.","(1) WHITE COLLAR (2) WORKER (3) FARMER (4) SELF-EMPLOYED (5) OTHER","(1) White collar (2) Worker (3) Farmer (4) Self-employed (5) Other"
+"IMD2019_1","Union membership of respondent","Demographic Data","Demographic Data: UNION MEMBERSHIP OF RESPONDENT (IMD2019_1)","Union membership of respondent.","(0) R IS NOT A MEMBER OF A UNION (1) R IS MEMBER OF A UNION","(0) R is not a member of a union (1) R is member of a union"
+"IMD3001","Turnout: main election","Survey Data","Survey Data: TURNOUT: MAIN ELECTION (IMD3001)","Whether or not the respondent cast a ballot in the main election.","(0) RESPONDENT DID NOT CAST A BALLOT (1) RESPONDENT CAST A BALLOT","(0) Respondent did not cast a ballot (1) Respondent cast a ballot"
+"IMD3001_PR_1","Turnout: current presidential election - round 1","Survey Data","Survey Data: TURNOUT: CURRENT PRESIDENTIAL ELECTION - ROUND 1 (IMD3001_PR_1)","Whether or not the respondent cast a ballot in the first/second round of the Presidential elections.","(0) RESPONDENT DID NOT CAST A BALLOT (1) RESPONDENT CAST A BALLOT","(0) Respondent did not cast a ballot (1) Respondent cast a ballot"
+"IMD3001_PR_2","Turnout: current presidential election - round 2","Survey Data","Survey Data: TURNOUT: CURRENT PRESIDENTIAL ELECTION - ROUND 2 (IMD3001_PR_2)","Whether or not the respondent cast a ballot in the first/second round of the Presidential elections.","(0) RESPONDENT DID NOT CAST A BALLOT (1) RESPONDENT CAST A BALLOT","(0) Respondent did not cast a ballot (1) Respondent cast a ballot"
+"IMD3001_LH","Turnout: current lower house election","Survey Data","Survey Data: TURNOUT: CURRENT LOWER HOUSE ELECTION (IMD3001_LH)","Whether or not the respondent cast a ballot in the lower house election.","(0) RESPONDENT DID NOT CAST A BALLOT (1) RESPONDENT CAST A BALLOT","(0) Respondent did not cast a ballot (1) Respondent cast a ballot"
+"IMD3001_UH","Turnout: current upper house election","Survey Data","Survey Data: TURNOUT: CURRENT UPPER HOUSE ELECTION (IMD3001_UH)","Whether or not the respondent cast a ballot in the upper house election.","(0) RESPONDENT DID NOT CAST A BALLOT (1) RESPONDENT CAST A BALLOT","(0) Respondent did not cast a ballot (1) Respondent cast a ballot"
+"IMD3001_TS","Turnout: turnout switcher between current","Survey Data","Survey Data: TURNOUT: TURNOUT SWITCHER BETWEEN CURRENT (IMD3001_TS)","Whether or not the respondent reports voting in the current and previous election.","(0) RESPONDENT ABSTAINED IN BOTH ELECTIONS (1) RESPONDENT ABSTAINED IN CURRENT ELECTION BUT VOTED IN PREVIOUS ELECTION (2) RESPONDENT VOTED IN CURRENT ELECTION BUT ABSTAINED IN PREVIOUS ELECTION (3) RESPONDENT VOTED IN BOTH CURRENT AND PREVIOUS ELECTION (5) RESPONDENT ABSTAINED IN CURRENT ELECTION BUT INELIGIBLE TO VOTE IN PREVIOUS ELECTION (6) RESPONDENT VOTED IN CURRENT ELECTION BUT INELIGIBLE TO VOTE IN PREVIOUS ELECTION","(0) Respondent abstained in both elections (1) Respondent abstained in current election but voted in previous election (2) Respondent voted in current election but abstained in previous election (3) Respondent voted in both current and previous election (5) Respondent abstained in current election but ineligible to vote in previous election (6) Respondent voted in current election but ineligible to vote in previous election"
+"IMD3002_OUTGOV","Vote choice: current main election - vote for outgoing government (incumbent)","Survey Data","Survey Data: VOTE CHOICE: CURRENT MAIN ELECTION - VOTE FOR OUTGOING GOVERNMENT (INCUMBENT) (IMD3002_OUTGOV)","Whether or not the respondent cast a ballot for the outgoing incumbent.","(0) DID NOT VOTE FOR THE OUTGOING GOVERNMENT (INCUMBENT) (1) VOTED FOR THE OUTGOING GOVERNMENT (INCUMBENT)","(0) Did not vote for the outgoing government (incumbent) (1) Voted for the outgoing government (incumbent)"
+"IMD3002_VS_1","Vote choice: vote switcher between current election and previous election","Survey Data","Survey Data: VOTE CHOICE: VOTE SWITCHER BETWEEN CURRENT ELECTION AND PREVIOUS ELECTION (IMD3002_VS_1)"," Whether or not the respondent reports voting for the same party/coalition in the current and previous main election.","(0) DID NOT SWITCH (VOTED FOR SAME PARTY/COALITION IN CURRENT & PREVIOUS ELECTION) (1) SWITCHER (CHANGED VOTE IN CURRENT ELECTION FROM PREVIOUS ELECTION)","(0) Did not switch (voted for same party/coalition in current & previous election) (1) Switcher (changed vote in current election from previous election)"
+"IMD3002_LR_CSES","Vote choice: current main election - vote for leftist/center/rightist - cses","Survey Data","Survey Data: VOTE CHOICE: CURRENT MAIN ELECTION - VOTE FOR LEFTIST/CENTER/RIGHTIST - CSES (IMD3002_LR_CSES)","Whether or not the respondent reports voting for a leftist/center/rightist party/candidate of the party, based on CSES Collaborators experts' judgment of parties' ideology.","(1) VOTED FOR LEFTIST PARTY/CANDIDATE (2) VOTED FOR CENTER PARTY/CANDIDATE (3) VOTED FOR RIGHTIST PARTY/CANDIDATE","(1) Voted for leftist party/candidate (2) Voted for center party/candidate (3) Voted for rightist party/candidate"
+"IMD3005_1","Party identification: are you close to any political party","Survey Data","Survey Data: PARTY IDENTIFICATION: ARE YOU CLOSE TO ANY POLITICAL PARTY (IMD3005_1)","Do you usually think of yourself as close to any particular party?","(0) NO (1) YES","(0) No (1) Yes"
+"IMD3006","Ideology: left-right - self","Survey Data","Survey Data: IDEOLOGY: LEFT-RIGHT -  SELF (IMD3006)","Respondents' self-placement on a 0-10 left-right scale.","(0) LEFT (10) RIGHT","(0) Left (10) Right"
+"IMD3010","Satisfaction with democracy","Survey Data","Survey Data: SATISFACTION WITH DEMOCRACY (IMD3010)","On the whole, are you very satisfied, fairly satisfied, not very satisfied, or not at all satisfied with the way democracy works in [COUNTRY]?","(1) VERY SATISFIED (2) FAIRLY SATISFIED (3) NEITHER SATISFIED NOR DISSATISFIED (4) NOT VERY SATISFIED (0) NOT AT ALL SATISFIED","(1) Very satisfied (2) Fairly satisfied (3) Neither satisfied nor dissatisfied (4) Not very satisfied (0) Not at all satisfied"
+"IMD3011","Efficacy: who is in power can make a difference","Survey Data","Survey Data: EFFICACY: WHO IS IN POWER CAN MAKE A DIFFERENCE (IMD3011)","Some people say that it doesn't make any difference who is in power. Others say that it makes a big difference who is in power. Using the scale on this card, (where ONE means that it doesn't make any difference who is in power and FIVE means that it makes a big difference who is in power), where would you place yourself?","(1) IT DOESN'T MAKE ANY DIFFERENCE WHO IS IN POWER (5) IT MAKES A BIG DIFFERENCE WHO IS IN POWER","(1) It doesn't make any difference who is in power (5) It makes a big difference who is in power"
+"IMD3012","Efficacy: who people vote for makes a difference","Survey Data","Survey Data: EFFICACY: WHO PEOPLE VOTE FOR MAKES A DIFFERENCE (IMD3012)","Some people say that no matter who people vote for, it won't make any difference to what happens. Others say that who people vote for can make a big difference to what happens. Using the scale on this card, (where ONE means that voting won't make any difference to what happens and FIVE means that voting can make a big difference), where would you place yourself?","(1) WHO PEOPLE VOTE FOR WON'T MAKE ANY DIFFERENCE (5) WHO PEOPLE VOTE FOR CAN MAKE A BIG DIFFERENCE","(1) Who people vote for won't make any difference (5) Who people vote for can make a big difference"
+"IMD3013_1","State of economy (over past 12 months)","Survey Data","Survey Data: STATE OF ECONOMY (OVER PAST 12 MONTHS) (IMD3013_1)","Would you say that over the past twelve months, the state of the economy in [COUNTRY] has gotten better, stayed about the same, or gotten worse?","(1) GOTTEN BETTER (3) STAYED THE SAME (5) GOTTEN WORSE","(1) Gotten better (3) Stayed the same (5) Gotten worse"
+"IMD3013_2","State of economy - better","Survey Data","Survey Data: STATE OF ECONOMY - BETTER (IMD3013_2)","Would you say much better or somewhat better?","(1) MUCH BETTER (2) SOMEWHAT BETTER","(1) Much better (2) Somewhat better"
+"IMD3013_3","State of economy - worse","Survey Data","Survey Data: STATE OF ECONOMY - WORSE (IMD3013_3)","Would you say much worse or somewhat worse?","(4) SOMEWHAT WORSE (5) MUCH WORSE","(4) Somewhat worse (5) Much worse"
+"IMD3014","Government performance: general","Survey Data","Survey Data: GOVERNMENT PERFORMANCE: GENERAL (IMD3014)","Now thinking about the performance of the [government in [CAPITAL]/President] in general, how good or bad a job do you think the [government/President in [CAPITAL]] has done over the past [NUMBER OF YEARS SINCE LAST GOVERNMENT TOOK OFFICE, BEFORE THE CURRENT ELECTION] years? Has [it/he/she] done a very good job? A good job? A bad job? A very bad job?","(1) VERY GOOD JOB (2) GOOD JOB (3) BAD JOB (4) VERY BAD JOB","(1) Very good job (2) Good job (3) Bad job (4) Very bad job"
+"IMD5006_1","Electoral turnout - turnout as a percentage of registered voters (er)","Macro Data","Macro Data: ELECTORAL TURNOUT - TURNOUT AS A PERCENTAGE OF REGISTERED VOTERS (ER) (IMD5006_1)","Official voter turnout - Percentage of the registered voters (ER).","(0 to 100). PERCENT OF REGISTERED VOTERS (ER) WHO VOTED","(0 to 100). Percent of registered voters (er) Who voted"
+"IMD5006_2","Electoral turnout - turnout as a percentage of the voting age population (vap)","Macro Data","Macro Data: ELECTORAL TURNOUT - TURNOUT AS A PERCENTAGE OF THE VOTING AGE POPULATION (VAP) (IMD5006_2)","Official voter turnout - Percentage of Voting Age Population (VAP).","(0 to 100). PERCENT OF VOTING AGE POPULATION (VAP) WHO VOTED","(0 to 100). Percent of voting age population (vap) Who voted"
+"IMD5007","Compulsory voting","Macro Data","Macro Data: COMPULSORY VOTING (IMD5007)","Is voting compulsory?","(1) YES; STRICTLY ENFORCED SANCTIONS (2) YES; WEAKLY ENFORCED SANCTIONS (3) YES; WITHOUT SANCTION FOR VIOLATION (0) NO","(1) Yes; strictly enforced sanctions (2) Yes; weakly enforced sanctions (3) Yes; without sanction for violation (0) No"
+"IMD5013","Electoral formula in all segments: lower house","Macro Data","Macro Data: ELECTORAL FORMULA IN ALL SEGMENTS: LOWER HOUSE (IMD5013)","Whether the country uses a majoritarian formula, a proportional formula, or a mixed formula in all of its electoral segments/tiers.","(1) MAJORITARIAN (2) PROPORTIONAL (3) MIXED","(1) Majoritarian (2) Proportional (3) Mixed"
+"IMD5014","Electoral formula: presidential election","Macro Data","Macro Data: ELECTORAL FORMULA: PRESIDENTIAL ELECTION (IMD5014)","The electoral formula used to elect the President that is elected by popular vote.","(1) PLURALITY (2) ABSOLUTE MAJORITY RULE (3) QUALIFIED MAJORITY RULE (4) ELECTORAL COLLEGE (5) ALTERNATIVE VOTE","(1) Plurality (2) Absolute majority rule (3) Qualified majority rule (4) Electoral college (5) Alternative vote"
+"IMD5032_4","Post-election protest","Macro Data","Macro Data: POST-ELECTION PROTEST (IMD5032_4)","To what extent was there protest following the election?","(1) NO PROTEST AT ALL (2) SPORADIC PROTEST (3) SIGNIFICANT PROTEST","(1) No protest at all (2) Sporadic protest (3) Significant protest"
+"IMD5033","Fairness of the election","Macro Data","Macro Data: FAIRNESS OF THE ELECTION (IMD5033)","How impartial was the body that administered the election law?","(1) VERY IMPARTIAL (2) MOSTLY IMPARTIAL (3) NOT VERY IMPARTIAL (4) NOT IMPARTIAL AT ALL","(1) Very impartial (2) Mostly impartial (3) Not very impartial (4) Not impartial at all"
+"IMD5034_2","Election irregularities reported","Macro Data","Macro Data: ELECTION IRREGULARITIES REPORTED (IMD5034_2)","Were there irregularities reported by international election observers?","(0) NO (1) YES","(0) No (1) Yes"
+"IMD5035","Number of parties participating in election","Macro Data","Macro Data: NUMBER OF PARTIES PARTICIPATING IN ELECTION (IMD5035)","How many political parties received votes in the election?","(1 to 900). NUMBER OF PARTIES","(1 to 900). Number of parties"
+"IMD5036_3","Did any electoral alliance form?","Macro Data","Macro Data: DID ANY ELECTORAL ALLIANCE FORM? (IMD5036_3)","(If yes to IMD5036_1 or IMD5036_2) Did any electoral alliances form?","(0) NO (1) YES","(0) No (1) Yes"
+"IMD5045_1","Average district magnitude - lowest segment (tier) - lower house","Macro Data","Macro Data: AVERAGE DISTRICT MAGNITUDE - LOWEST SEGMENT (TIER) - LOWER HOUSE (IMD5045_1)","Average district magnitude in the first or lowest electoral segment (tier).","(1 to 900). NUMBER OF SEATS ELECTED PER DISTRICT","(1 to 900). Number of seats elected per district"
+"IMD5048","Regime: type of executive","Macro Data","Macro Data: REGIME: TYPE OF EXECUTIVE (IMD5048)","Classification of political regimes.","(1) PARLIAMENTARY REGIME (2) MIXED REGIME (3) PRESIDENTIAL REGIME","(1) Parliamentary regime (2) Mixed regime (3) Presidential regime"
+"IMD5049","Age of current regime","Macro Data","Macro Data: AGE OF CURRENT REGIME (IMD5049)","The number of years since the most recent regime change.","(0 to 500). AGE OF THE REGIME (YEARS)","(0 to 500). Age of the regime (years)"
+"IMD5050_1","Freedom house rating - time t","Macro Data","Macro Data: FREEDOM HOUSE RATING - TIME T (IMD5050_1)","Freedom House's rating at three time periods (average of the ""Political Rights"" and ""Civil Liberties"" scores).","(1 to 7). FREEDOM HOUSE RATING SCORE","(1 to 7). Freedom house rating score"
+"IMD5051_1","Democracy-autocracy - polity iv rating - time t","Macro Data","Macro Data: DEMOCRACY-AUTOCRACY - POLITY IV RATING - TIME T (IMD5051_1)","The POLITY IV ratings of institutionalized democracy versus autocracy in a country at three time periods.","(-10) AUTOCRATIC (10) DEMOCRATIC","(-10) Autocratic (10) Democratic"
+"IMD5052_2","Gdp growth annual % (world bank) - time t-1 year","Macro Data","Macro Data: GDP GROWTH ANNUAL % (WORLD BANK) - TIME T-1 YEAR (IMD5052_2)","World Bank estimate of the annual GDP growth at three time periods.","(-20 to +25). PERCENT ANNUAL GROWTH","(-20 to +25). Percent annual growth"
+"IMD5053_1","Gdp per capita, ppp (world bank) - time t","Macro Data","Macro Data: GDP PER CAPITA, PPP (WORLD BANK) - TIME T (IMD5053_1)","World Bank estimate of the GDP per capita at three time periods.","(0 to 899,999). GDP PER CAPITA","(0 to 899,999). GDP per capita"
+"IMD5054_2","Unemployment, total (world bank) - time t-1 year","Macro Data","Macro Data: UNEMPLOYMENT, TOTAL (WORLD BANK) - TIME T-1 YEAR (IMD5054_2)","World Bank estimates of the unemployment rate (% of total labor force) at three time periods.","(0 to 100). UNEMPLOYMENT RATE (% OF TOTAL LABOR FORCE)","(0 to 100). Unemployment rate (% of total labor force)"
+"IMD5055_1","Human development index (undp) - time t","Macro Data","Macro Data: HUMAN DEVELOPMENT INDEX (UNDP) - TIME T (IMD5055_1)","UNDP Human Development Index (HDI) at three time periods.","(0 to 1). HUMAN DEVELOPMENT INDEX","(0 to 1). Human development index"
+"IMD5056_2","Inflation, gdp deflator (annual %) (world bank) - time t-1 year","Macro Data","Macro Data: INFLATION, GDP DEFLATOR (ANNUAL %) (WORLD BANK) - TIME T-1 YEAR (IMD5056_2)","World Bank estimate of Inflation at three time periods.","(-100 to 10000). INFLATION (ANNUAL %)","(-100 to 10000). Inflation (annual %)"
+"IMD5057_1","Population, total (world bank) - time t","Macro Data","Macro Data: POPULATION, TOTAL (WORLD BANK) - TIME T (IMD5057_1)","World Bank estimates of the total population size, at three time periods.","(1000 to 9,999,999,999). POPULATION SIZE","(1000 to 9,999,999,999). Population size"
+"IMD5058_1","Effective number of electoral parties","Macro Data","Macro Data: EFFECTIVE NUMBER OF ELECTORAL PARTIES (IMD5058_1)","Effective Number of Electoral Parties (ENEP).","(0 to 1500). EFFECTIVE NUMBER OF ELECTORAL PARTIES","(0 to 1500). Effective number of electoral parties"

world.rda ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:16b3c603996b162bed809ca5a638e7e8baca0bdabe08b9dea4f52b21557d5742
+size 504800