singnalfuncPNCNB.R

library(dplyr)
library(foreign)
library(labelled)
library(pollster)
library(survey)
library(openxlsx)
library(ggplot2)
library(olsrr)
pkdhs <- read.dta("//Users//sulailfatima//Desktop//GoogleDrive//MGWR_DHS//PKKR71FL.DTA")
# creating the sampling weight variable. 
pkdhs$wt <- pkdhs$v005/1000000 

## Descriptive
# Recreating PDHS Table 9.14 Content of postnatal care for the newborn
# cord examination
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    cord = case_when(
      m78a %in% c("no","don't know") ~ 0,
      m78a == "yes" ~ 1)) %>% 
  set_value_labels(cord = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(cord = "Cord examined")
cord_pct <- topline(pkdhs, variable = cord, weight = wt)

# measure temp
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    temp = case_when(
      m78b %in% c("no","don't know") ~ 0,
      m78b == "yes" ~ 1)) %>% 
  set_value_labels(temp = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(temp = "Temperature measured")
temp_pct <- topline(pkdhs, variable = temp, weight = wt)

# Counseling on danger signs
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    dang = case_when(
      m78c %in% c("no","don't know") ~ 0,
      m78c == "yes" ~ 1)) %>% 
  set_value_labels(dang = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(dang = "Counselling on danger signs")
dang_pct <- topline(pkdhs, variable = dang, weight = wt)

# Counseling on breastfeeding
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    c_bf = case_when(
      m78d %in% c("no","don't know") ~ 0,
      m78d == "yes" ~ 1)) %>% 
  set_value_labels(c_bf = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(c_bf = "Counselling on breastfeeding")
cBF_pct <- topline(pkdhs, variable = c_bf, weight = wt)

# Observing breastfeeding
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    obs_bf = case_when(
      m78e %in% c("no","don't know") ~ 0,
      m78e == "yes" ~ 1)) %>% 
  set_value_labels(obs_bf = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(obs_bf = "Observation of breastfeeding")
obsBF_pct <- topline(pkdhs, variable = obs_bf, weight = wt)

# Weighed
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    weighed = case_when(
      m19a %in% c("not weighed","don't know") ~ 0,
      m19a %in% c("from written card", "from mother's recall") ~ 1)) %>% 
  set_value_labels(weighed = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(weighed = "Weighed")
w_pct <- topline(pkdhs, variable = weighed, weight = wt)


# Percentage with at least two signal functions performed during the
# first 2 days after birth

pkdhs <- pkdhs %>%
  rowwise() %>%
  mutate(yes_count = sum(cord, temp, dang, c_bf, obs_bf, weighed)) %>%
  mutate(
    signalfunc = case_when(
      yes_count >= 2 ~ 1,
      TRUE ~ 0)) %>%
  set_value_labels(signalfunc = c("At least 2 SFs" = 1, "Less than 2 SFs" = 0)) %>%
  set_variable_labels(signalfunc = "Signal functions for NB-PNC")
sf_pct <- topline(pkdhs, variable = signalfunc, weight = wt)
## Creating bar graph for 6 signal functions and at least 2 function performed
sep_signalfun <- c("cord_pct", "temp_pct", "dang_pct", "cBF_pct",
                   "obsBF_pct", "w_pct")
freq <- c(cord_pct$Frequency[cord_pct$Response == "Yes"],
          temp_pct$Frequency[temp_pct$Response == "Yes"],
          dang_pct$Frequency[dang_pct$Response == "Yes"],
          cBF_pct$Frequency[cBF_pct$Response == "Yes"],
          obsBF_pct$Frequency[obsBF_pct$Response == "Yes"],
          w_pct$Frequency[w_pct$Response == "Yes"])
pct <- c(cord_pct$Percent[cord_pct$Response == "Yes"],
         temp_pct$Percent[temp_pct$Response == "Yes"],
         dang_pct$Percent[dang_pct$Response == "Yes"],
         cBF_pct$Percent[cBF_pct$Response == "Yes"],
         obsBF_pct$Percent[obsBF_pct$Response == "Yes"],
         w_pct$Percent[w_pct$Response == "Yes"])
sep_signalfun <- c(
  "Cord examined",
  "Temperature measured",
  "Counseling on danger signs",
  "Counseling on breastfeeding",
  "Observed breastfeeding",
  "Weighed"
)
sum_signalfun <- data.frame(
  Variable = sep_signalfun,
  Frequency = freq,
  Percent = pct
)
# Calculate the percentage of births with "At least 2 SFs"
percent_at_least_two <- sf_pct %>%
  filter(Response == "At least 2 SFs") %>%
  summarize(percent = (Frequency / sum(sf_pct$Frequency)) * 100) %>%
  pull(percent)

# Print the result to verify
percent_at_least_two

df_signalfun <- data.frame(
  signal_function = c("Cord examined", "At least two signal functions", "Temperature measured", 
                      "Counseling on breastfeeding", "Counseling on danger signs", 
                      "Observed breastfeeding", "Weighed"),
  percentage = c(64.1, 57.8, 46.1, 45.2, 26.9, 25.8, 18.9)
)

df_signalfun <- df_signalfun %>%
  mutate(signal_function = factor(signal_function, 
                                  levels = c("At least two signal functions",
                                             "Weighed", "Observed breastfeeding",
                                             "Counseling on danger signs",
                                             "Counseling on breastfeeding", 
                                             "Temperature measured",
                                             "Cord examined")))


signalfunPlot <- ggplot(df_signalfun, 
                        aes(x = signal_function,
                            y = percentage, 
                            fill = percentage)) + 
  geom_bar(stat = "identity") +
  geom_text(aes(label = paste0(round(percentage, 1), "%")),  # Add percentage labels
            hjust = -0.2,   # Position labels slightly to the right of bars
            size = 5,
            fontface = "bold.italic") +
  scale_fill_gradient(high = "#003388", low = "#ff292f") +
  coord_flip() +
  ylim(0, 100) +  # Set y-axis maximum to 100%
  labs(title = "Percentage of Newborns Receiving Six Signal Functions of Postnatal Care",
       x = NULL,
       y = "Percentage (%)") +
  theme_minimal() +
  theme(legend.position = "none") +
  theme(
    legend.position = "none", title = element_text(face = "bold", size = 20),
    axis.text.x = element_text(size = 16),  # Increase x-axis label font size
    axis.text.y = element_text(size = 16)
  )
ggsave("signalfunPlot.png", signalfunPlot, dpi = 600 )

# Not included in the current analysis
# Media & Internet use
# Newspaper
pkdhs <- pkdhs %>% 
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(medx_newsp = case_when(
    v157 %in% c("at least once a week", "almost every day") ~ 1,
    v157 %in% c("not at all", "less than once a week") ~ 0,
    is.na(v157) ~ 0)) %>%
  set_value_labels(medx_newsp = c("Yes" = 1, "No" = 0)) %>%
  set_variable_labels(medx_newsp = "Reads a newspaper at least once a week")
topline(pkdhs, variable = medx_newsp, weight = wt)
# TV
pkdhs <- pkdhs %>% 
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(medx_tv = case_when(
    v159 %in% c("at least once a week", "almost every day") ~ 1,
    v159 %in% c("not at all", "less than once a week") ~ 0,
    is.na(v159) ~ 0)) %>%
  set_value_labels(medx_tv = c("Yes" = 1, "No" = 0)) %>%
  set_variable_labels(medx_tv = "Watches television at least once a week")
topline(pkdhs, variable = medx_tv, weight = wt)
# Radio
pkdhs <- pkdhs %>% 
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(medx_rad = case_when(
    v158 %in% c("at least once a week", "almost every day") ~ 1,
    v158 %in% c("not at all", "less than once a week") ~ 0,
    is.na(v158) ~ 0)) %>%
  set_value_labels(medx_rad = c("Yes" = 1, "No" = 0)) %>%
  set_variable_labels(medx_rad = "Listens to the radio at least once a week")
topline(pkdhs, variable = medx_rad, weight = wt)
# Internet
pkdhs <- pkdhs %>% 
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(medx_int = case_when(
    v171a == "yes, last 12 months" | v171a == "yes, before last 12 months" | v171a == "yes, can't establish when" ~ 1,
    v171a == "never" ~ 0)) %>%
  set_value_labels(medx_int = c("Yes" = 1, "No" = 0)) %>%
  set_variable_labels(medx_int = "Ever used the internetk")
topline(pkdhs, variable = medx_int, weight = wt)
# Overall media exposure
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(media_exp = case_when(
    medx_newsp == 1 | medx_tv == 1 | medx_rad == 1 | medx_int == 1 ~ 1,
    TRUE ~ 0)) %>%
  set_value_labels(media_exp = c("Yes" = 1, "No" = 0)) %>%
  set_variable_labels(media_exp = "Media & Internet Exposure")
topline(pkdhs, media_exp, weight = wt)
xtab.mediaexp <- crosstab(pkdhs, media_exp, signalfunc, weight = wt,
                       pct_type = "row", unwt_n = T, format = "wide", n = T)


# Problems in accessing healthcare facility
pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    v467b_bi = case_when(
      v467b == "big problem" ~ 1,
      TRUE ~ 0)) %>%
  set_value_labels(v467b_bi = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(v467b_bi = "Getting permission to go for treatment")

pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    v467c_bi = case_when(
      v467c == "big problem" ~ 1,
      TRUE ~ 0)) %>%
  set_value_labels(v467c_bi = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(v467c_bi = "Getting money for treatment")
topline(pkdhs, v467c_bi, weight = wt)

pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    v467d_bi = case_when(
      v467d == "big problem" ~ 1,
      TRUE ~ 0)) %>%
  set_value_labels(v467d_bi = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(v467d_bi = "Distance to health facility")

pkdhs <- pkdhs %>%
  filter(v101 != "gb" & v101 != "ajk" & midx == 1 & b19 < 24) %>%
  mutate(
    v467f_bi = case_when(
      v467f == "big problem" ~ 1,
      TRUE ~ 0)) %>%
  set_value_labels(v467f_bi = c("Yes" = 1, "No"=0)) %>%
  set_variable_labels(v467f_bi = "Not wanting to go alone")

## Percentage with at least one problem in accessing HF
pkdhs <- pkdhs %>%
  rowwise() %>%
  mutate(
    yes_count = sum(v467b_bi, v467c_bi, v467d_bi, v467f_bi)) %>%
  mutate(
    accHF = case_when(yes_count >= 1 ~ 1,
    TRUE ~ 0)) %>%
  set_value_labels(accHF = c("Yes" = 1, "No" = 0)) %>%
  set_variable_labels(accHF = "At least one problem in accessing healthcare
                      facility")
topline(pkdhs, accHF, weight = wt)

# Cross Tabulations with maternal age (m_age_cat), birth order (bord_cat), place
# of delivery (b_HF), education (v106), region (v101), place of residence (v102),
# wealth index (v190), sex of child (b4), anc visits (anc), c-section performed 
# (cs), healthcare access (accHF) & owns a mobile phone (v169a) 
# 
# Mother's age @ birth
pkdhs <- pkdhs %>% 
  mutate(m_age = (b3 - v011)/12) %>% 
  mutate(
    m_age_cat = case_when(
      m_age < 20 ~ 0,
      m_age >= 20 & m_age < 35 ~ 1,
      m_age >= 35 ~ 2)) %>%
  set_value_labels(m_age_cat = c("< 20" = 0, "20 - 34" = 1, "35 - 49" = 2)) %>%
  set_variable_labels(m_age_cat = "Maternal age at birth")
#topline(pkdhs, m_age_cat, wt)
pkdhs$m_age_cat <- as.factor(pkdhs$m_age_cat)
xtab.m_age <- crosstab(pkdhs, m_age_cat, signalfunc, weight = wt,
                       pct_type = "row", unwt_n = T, format = "wide", n = T)
# birth order 
pkdhs <- pkdhs %>% mutate(
  bord_cat = case_when(
    bord == 1 ~ 1,
    bord >= 2 & bord <= 3 ~ 2,
    bord >= 4 & bord <= 5 ~ 3,
    bord >= 6 ~ 4)) %>%
  set_value_labels(bord_cat = c("1" = 1, "2-3" = 2, "4-5" = 3, ">6" = 4)) %>%
  set_variable_labels(bord_cat = "Birth order")
#topline(pkdhs, bord_cat, wt)
xtab.bord_cat <- crosstab(pkdhs, bord_cat, signalfunc, weight = wt,
                          pct_type = "row", unwt_n = T, format = "wide", n = T)
pkdhs$bord_cat <- as.factor(pkdhs$bord_cat)


# place of delivery
pkdhs <- pkdhs %>% 
  mutate(
  b_HF = case_when(
    m15 %in% c("government hospital", "rural health centre/mother child health centre",
               "bhu(basic health unit)","community midwife", "other public sector",
               "private hospital/clinic", "other private medical sector") ~ 1,
    TRUE ~ 0)) %>% 
  set_value_labels(b_HF = c("Institional delivery" = 1, "Elsewhere" = 0)) %>%
  set_variable_labels(b_HF = "Place of delivery")
#topline(pkdhs, b_HF, wt)
xtab.b_HF <- crosstab(pkdhs, b_HF, signalfunc, weight = wt,
                      pct_type = "row", unwt_n = T, format = "wide", n = T)
# education v106
xtab.v106 <- crosstab(pkdhs, v106, signalfunc, weight = wt,
                      pct_type = "row", unwt_n = T, format = "wide", n = T)
# region v101
xtab.v101 <- crosstab(pkdhs, v101, signalfunc, weight = wt,
                      pct_type = "row", unwt_n = T, format = "wide", n = T)
# place of residence v102
xtab.v102 <- crosstab(pkdhs, v102, signalfunc, weight = wt,
                      pct_type = "row", unwt_n = T, format = "wide", n = T)
# wealth index v190
xtab.v190 <- crosstab(pkdhs, v190, signalfunc, weight = wt,
                      pct_type = "row", unwt_n = T, format = "wide", n = T)
# sex of child b4
xtab.b4 <- crosstab(pkdhs, b4, signalfunc, weight = wt,
                    pct_type = "row", unwt_n = T, format = "wide", n = T)
# anc visits
pkdhs <- pkdhs %>%
  mutate(
    anc = case_when(
      m14 == 0 ~ 0,
      m14 >= 1 & m14 < 4 ~ 1,
      TRUE ~ 2)) %>%
  set_value_labels(anc = c("None" = 0, "1-3" = 1, "4 and more" = 2)) %>%
  set_variable_labels(anc = "Antenatal care visits") 
xtab.anc <- crosstab(pkdhs, anc, signalfunc, weight = wt,
                     pct_type = "row", unwt_n = T, format = "wide", n = T)
pkdhs$anc <- as.factor(pkdhs$anc)
# quality of anc
pkdhs <- pkdhs %>%
  mutate(
    m42cbi = case_when(
      m42c == "yes" ~ 1,
      TRUE ~ 0)) %>%
  mutate(
    m42dbi = case_when(
      m42d == "yes" ~ 1,
      TRUE ~ 0)) %>%
  mutate(
    m42ebi = case_when(
      m42e == "yes" ~ 1,
      TRUE ~ 0)) %>%
  mutate(
      m45bi = case_when(
        m45 == "yes" ~ 1,
        TRUE ~ 0)) %>%
  mutate(
    m60bi = case_when(
      m60 == "yes" ~ 1,
      TRUE ~ 0)) %>%
  rowwise() %>%
  mutate(
    yes_count = sum(m42cbi, m42dbi, m42ebi, m45bi, m60bi)) %>%
  mutate(
    ancqua = case_when(
      yes_count >= 4 ~1,
      TRUE ~ 0))%>%
  set_value_labels(ancqua = c("Poor" = 0, "Good" = 1)) %>%
  set_variable_labels(ancqua = "Quality of ANC") 
xtab.ancqua <- crosstab(pkdhs, ancqua, signalfunc, weight = wt,
                     pct_type = "row", unwt_n = T, format = "wide", n = T)

# v743a (women's participation in decision making)
pkdhs <- pkdhs %>%
  mutate(
    healthdecision = case_when(
      v743a == "respondent alone" ~ 1,
      v743a == "respondent and husband/partner" ~ 1,
      v743a == "respondent and other person" ~ 0,
      v743a == "husband/partner alone" ~ 0,
      v743a == "someone else" ~ 0,
      v743a == "other" ~ 0,
    )) %>%
  set_value_labels(healthdecision = c("Respondent Decides" = 1, "Respondent Does not Decide" = 0)) %>%
  set_variable_labels(healthdecision = "Participation in Decision-making for Health")
xtab.healthdecision <- crosstab(pkdhs, healthdecision, signalfunc, weight = wt,
                     pct_type = "row", unwt_n = T, format = "wide", n = T)

# delivery by csection (m17)
xtab.cs <- crosstab(pkdhs, m17, signalfunc, weight = wt,
                    pct_type = "row", unwt_n = T, format = "wide", n = T)

# Skilled Birth Attendence
pkdhs <- pkdhs %>%
  mutate(
    sba = case_when(
      m3a == "yes" ~ 1, # doctor
      m3b == "yes" ~ 1, # Nurse
      m3c == "yes" ~ 1, # Midwife
      m3d == "yes" ~ 1, # Lady health visitor
      m3e == "yes" ~ 1, # Community midwife 
      m3g == "yes" ~ 0, # Dai/traditional birth attendant
      m3h == "yes" ~ 0, # Family welfare wk
      m3i == "yes" ~ 0, # LHW
      m3j == "yes" ~ 0, # Homeopath 
      m3k == "yes" ~ 0, # other
      m3l == "yes" ~ 0, # Hakim
      m3m == "yes" ~ 0, # Relative/friend
      )) %>%
  set_value_labels(sba = c("Skilled" = 1, "Unskilled" = 0)) %>%
  set_variable_labels(sba = "Birth assisted by a skilled provider")
xtab.sba <- crosstab(pkdhs, sba, signalfunc, weight = wt,
                    pct_type = "row", unwt_n = T, format = "wide", n = T)
xtab.accHF <- crosstab(pkdhs, accHF, signalfunc, weight = wt,
                       pct_type = "row", unwt_n = T, format = "wide", n = T)
# Owns a mobile phone (v169a)
xtab.mobile <- crosstab(pkdhs, v169a, signalfunc, weight = wt,
                    pct_type = "row", unwt_n = T, format = "wide", n = T)


# exporting bivar analysis to MS Excel
library(openxlsx)
# storing all bivar analysis in one list
crosstab_results <- list(xtab.m_age, xtab.bord_cat, xtab.b_HF, 
                         xtab.v106, xtab.v101, xtab.v102, 
                         xtab.v190, xtab.b4, xtab.anc, xtab.ancqua, xtab.cs, xtab.sba,
                         xtab.accHF, xtab.mediaexp, xtab.mobile, xtab.healthdecision)
# Specify sheet names (modify as needed)
sheet_names <- c("Sheet1", "Sheet2", "Sheet3", "Sheet4", "Sheet5",
                 "Sheet6", "Sheet7", "Sheet8", "Sheet9", "Sheet10", "Sheet11",
                 "Sheet12", "Sheet13", "Sheet14", "Sheet15", "Sheet16")
# Create a new Excel workbook
wb <- createWorkbook()

# Loop through the list of results and write them to separate sheets
for (i in 1:length(crosstab_results)) {
  addWorksheet(wb, sheetName = sheet_names[i])
  writeData(wb, sheet = i, x = crosstab_results[[i]])
}
excel_file_path <- "output_crosstabs_Nov13.xlsx"

saveWorkbook(wb, file = excel_file_path, overwrite = TRUE)

# Running bivariate logistic regression
# Create a new Excel workbook
wb <- createWorkbook()
# Listing all Xs in one object
x_vars <- c("m_age_cat", "bord_cat", "b_HF", "v106", 
            "v101",  "v102","v190", "b4", "anc", "m17",
            "sba", "accHF",  "media_exp", "v169a", 
            "healthdecision", "ancqua")

model_list <- list()

for (var in x_vars) {
  formula <- formula(paste("signalfunc ~", var))
  model <- glm(formula, data = pkdhs, family = binomial)
  odds_ratios <- exp(cbind(OR = coef(model), confint(model)))
  #model_list[[var]] <- list(model = model, odds_ratios = odds_ratios)
  # Create a new sheet for each model
  addWorksheet(wb, sheetName = var)
  
  # Write the model summary to the sheet
  writeData(wb, sheet = var, x = model)
  # Write the odds ratios to the sheet
  writeData(wb, sheet = var, x = odds_ratios, startCol = "B", startRow = 10)
}

saveWorkbook(wb, file = "BivarLogRegNov13.xlsx", overwrite = TRUE)

adj.model <- glm(signalfunc ~ m_age_cat+ bord_cat+ b_HF+ v106+ 
                 v101+ v102+ v190 + b4 + anc + m17+
                 sba+ accHF + media_exp+ v169a+
                 healthdecision+ ancqua, data = pkdhs, 
                 family = binomial)
summary(adj.model)
adj.ORs <- exp(cbind(OR = coef(adj.model), confint(adj.model)))
wb <- createWorkbook()
addWorksheet(wb, sheetName = "adjModel")
writeData(wb, sheet = "adjModel", x = adj.model)
writeData(wb, sheet = "adjModel", x = adj.ORs, startCol = "H", rowNames = TRUE)
saveWorkbook(wb, file = "AdjLogReg_results14Nov.xlsx", overwrite = TRUE)

## Plotting Adj ORs as a forest plot
library(MASS)

or_CI <- adj.ORs %>%
  as.data.frame() %>%
  mutate(variable = rownames(adj.ORs))

or_CI <- rename(or_CI, c("AOR" = "OR",
                         "Lower_bound" = "2.5 %",
                         "Upper_bound" = "97.5 %"))

col_order <- c("variable", "AOR", "Lower_bound", "Upper_bound")
or_CI <- or_CI[, col_order]
or_CI$variable <- recode_factor(or_CI$variable,
                                "m_age_cat1" = "Mother's Age 20-34",
                                "m_age_cat2" = "Mother's Age 35-49",
                                "v106primary" = "Mother's Education: Primary",
                                "v106secondary" = "Mother's Education: Secondary",
                                "v106higher" = "Mother's Education: Higher",
                                "v102rural" = "Place of Residence: Rural",
                                "v101sindh" = "Sindh",
                                "v101kpk" = "KPK",
                                "v101balochistan" = "Balochistan",
                                "v101ict" = "ICT",
                                "v101fata" = "FATA",
                                "v190poorer" = "WI: Poorer",
                                "v190middle" = "WI: Middle",
                                "v190richer" = "WI: Richer",
                                "v190richest" = "WI: Richest",
                                "media_exp" = "Media Exposure: Yes",
                                "v169ayes" = "Owns a Mobile Phone",
                                "accHF" = "Access to HF: Yes",
                                "healthdecision" = "Decision-making: Health",
                                "anc1" = "ANC Visit: 1-3",
                                "anc2" = "ANC Visit: 4+",
                                "ancqua" = "ANC Quality: Good",
                                "sba" = "SBA",
                                "b_HF" = "Institutional Delivery",
                                "m17yes" = "CS Performed",
                                "b4female" = "Sex of Child: Female",
                                "bord_cat2" = "Birth Order 2-3",
                                "bord_cat3" = "Birth Order 4-5",
                                "bord_cat4" = "Birth Order 6+")


## Plotting AORs with 95%CI as a forestplot
custom_order <- c("Mother's Age 20-34",
                  "Mother's Age 35-49",
                  "Mother's Education: Primary",
                  "Mother's Education: Secondary",
                  "Mother's Education: Higher",
                  "Place of Residence: Rural",
                  "Sindh",
                  "KPK",
                  "Balochistan",
                  "ICT",
                  "FATA",
                  "WI: Poorer",
                  "WI: Middle",
                  "WI: Richer",
                  "WI: Richest",
                  "Media Exposure: Yes",
                  "Owns a Mobile Phone",
                  "Access to HF: Yes",
                  "Decision-making: Health",
                  "ANC Visit: 1-3",
                  "ANC Visit: 4+",
                  "ANC Quality: Good",
                  "SBA",
                  "Institutional Delivery",
                  "CS Performed",
                  "Sex of Child: Female",
                  "Birth Order 2-3",
                  "Birth Order 4-5",
                  "Birth Order 6+")
custom_colors <- (rev(c(
  "#FF4500", "#FF4500", "#1E90FF", "#1E90FF", "#1E90FF", "#32CD32", "#32CD32",
  "#32CD32", "#FF1493", "#768200", "#A52A2A", "#A52A2A", "#A52A2A", "#A52A2A",
  "#A52A2A", "#5F9EA0", "#FFD700", "#FFD700", "#FFD700", "#FFD700", "#dd9977",
  "#889900", "#889900", "#8A2BE2","#FF4500", "#FF4500", "#1E90FF", "#1E90FF",
  "#bf4599")))

plot_logit_model <- or_CI[-1,] %>%
  mutate(variable = factor(variable, levels = rev(custom_order))) %>%
  ggplot(aes(x = variable, y = AOR, color = variable)) +
  geom_point(shape = 16, size = 4, position = position_dodge(width = 1)) +
  geom_errorbar(aes(ymin = Lower_bound, ymax = Upper_bound),
                width = 0.2, linewidth = 0.7, position = position_dodge(width = 1)) +
  scale_color_manual(values = custom_colors) + # Custom colors for each variable
  xlab(NULL) +
  ylab("Adjusted Odds Ratios with 95% CI") +
  geom_hline(yintercept = 1, color = "red", size = 0.6, linetype='dashed') +
  theme_minimal() +
  theme(axis.title = element_text(size = 14, face = "bold"),
        axis.text = element_text(size = 12),
        legend.position = "none",
        panel.grid.minor = element_blank()) +
  coord_flip(ylim = c(0, 3.5))
plot_logit_model
ggsave("AORsForestPlot.png", plot_logit_model, dpi = 600 )


### For assessing interaction
##### Visualizing Interaction without running Regression
custom_colors1 <- rev(c(
  "#16722c", "#66d280", "#8199ba",
  "#88292f", "#c96480"))
df_summary <- pkdhs %>%
  filter(!is.na(v102)) %>%
  group_by(v190, v102) %>%
  summarise(proportion = mean(signalfunc))
df_summary$v190 <- factor(df_summary$v190,
                          levels = c("poorest", "poorer", "middle", "richer", "richest"),
                          labels = c("Poorest", "Poorer", "Middle", "Richer", "Richest"))
EMPlot <- ggplot(df_summary, aes(x = v102 , y = proportion,
                                 group = v190, color = v190)) +
  geom_line(size = 2, alpha = 0.5) +  # Line plot to show interaction
  geom_point(size = 8) +  # Adding points for each value
  labs(title = "Visualizing Interaction between Place of\n        Residence and Wealth Index",
       x = NULL,
       y = "Proportion of At least 2 Signal Functions",
       color = "Wealth Index") +
  scale_color_manual(values = custom_colors1,   # Custom color palette for legend
                     labels = c("Poorest", "Poorer", "Middle", "Richer", "Richest")) +  # Custom legend labels
  scale_x_discrete(labels = c("Urban", "Rural")) +
  theme_minimal() +
  theme(plot.title = element_text(size = rel(1.6)),
        axis.title.y = element_text(size = rel(1.5)),
        axis.text.x = element_text(hjust = 0.5, size = rel(1.5)),
        axis.text.y = element_text(hjust = 0.5, size = rel(1.5)))  # Rotate x-axis labels for readability
ggsave("InteractionPlot1.png", EMPlot, dpi = 600 )


## Not included in the current analysis
### stepwise regression
fullMod <- glm(signalfunc ~ m_age_cat+ bord_cat+ b_HF+ v106+ 
                 v101+ v102+ v190 + b4 + anc + m17+
                 sba+ accHF + media_exp+ v169a+
                 healthdecision+ ancqua, data = pkdhs, family = binomial)

#  Apply stepwise regression using both directions (forward and backward)
stepwise_model <- stepAIC(fullMod, direction = "both")
# Display the summary of the final model
summary(stepwise_model)

nullMod <- glm(signalfunc ~ 1, data = pkdhs, family = binomial)
summary(nullMod)

fullMod$deviance; nullMod$deviance
backMod <- step(fullMod, direction = "backward")


library(olsrr)
pncNBmod <- glm(signalfunc ~ m_age_cat+ bord_cat+ b_HF+ v106+ 
                 v101+ v102+ v190 + b4 + anc + m17+
                 sba+ accHF + media_exp+ v169a+
                 healthdecision+ ancqua, data = pkdhs)

pncNB.step_model <- ols_step_both_p(pncNBmod, p_remove = 0.2)
aic_plot <- plot(pncNB.step_model)
ggsave("aic_plot.png", aic_plot, dpi = 1200 )

## only plotting dropping AICs
# Load necessary libraries
library(ggplot2)

# Create the data frame
stepwise_data <- data.frame(
  Step = 0:11,
  Variable = c("Base Model", "HF_birth", "csec", "h_decision", "ancqua", 
               "region", "anc", "resid", "wealth", "sba", "accHF", "media_exp"),
  AIC = c(5566.557, 5031.286, 4825.383, 4728.731, 4648.601, 4362.371, 
          4319.873, 4307.091, 4281.959, 4275.854, 4273.231, 4271.377)
)

# Create the plot
aic_drop <- ggplot(stepwise_data, 
                   aes(x = Step, y = AIC)) + 
  geom_line(color = "skyblue", size = 3) + 
  geom_point(size = 5, color = "darkblue") + 
  geom_text(aes(label = Variable), 
            vjust = -1.15, 
            hjust = -1.01, 
            size = 4) + 
  labs(title = "Drop in AIC Across Stepwise Regression Steps", 
       x = "Step", 
       y = "AIC") + 
  theme_minimal(base_size = 12) + 
  theme(plot.title = element_text(hjust = 0.5, 
                                  face = "bold"), 
        axis.title = element_text(face = "bold"))
ggsave("aic_dropplot.png", aic_drop, dpi = 1200 )


ols_step_forward_p(pncNBmod, 0.2, hierarchical = T)


#########################
#########################

survey_design <- svydesign(
  id = ~v001,          # Replace PSU with your PSU variable
  strata = ~v022,   # Replace strata with your strata variable
  weights = ~wt,  # Replace weight with your weight variable
  data = pkdhs,   # Replace with your data frame
  nest = TRUE         # If sampling is nested, set to TRUE
)

pncNBmod <- svyglm(
  signalfunc ~ m_age_cat+ bord_cat+ b_HF+ v106+ 
    v101+ v102+ v190 + b4 + anc + m17+
    sba+ accHF + media_exp+ v169a+
    healthdecision+ ancqua,  # Specify your model formula
  design = survey_design,
  family=quasibinomial(link = "logit")              # Use binomial for logistic regression, or other families as needed
)

nbcare.stepw <- ols_step_both_p(
  pncNBmod,
  p_remove = 0.2)