Last updated: 2020-06-08

Checks: 7 0

Knit directory: Fiber_Intervention_Study/

This page contains the summary statistics of participants’ data across the study.

# get data
Participant Demographics

Summarize by Week

# Derive the analysis covariates from the sample metadata.
mydata <- microbiome_data$meta.dat %>%
  mutate(
    # 1 when Gender is "F", 0 otherwise.
    female = ifelse(Gender == "F", 1, 0),
    # Age centered on the mean of Age over every row of the metadata.
    c.age = Age - mean(Age),
    # 1 when Intervention is "B", 0 otherwise.
    IntB = ifelse(Intervention == "B", 1, 0),
    # Shorter alias for the stress scale score.
    Stress = Stress.Scale,
    # NOTE(review): this flag is 1 for "White", "Asian" and "Native America",
    # which looks inverted for a variable named `hispanic` -- confirm the
    # intended coding (and the "Native America" spelling) against the data.
    hispanic = ifelse(
      Ethnicity %in% c("White", "Asian", "Native America"), 1, 0
    ),
    # Weight divided by squared height in metres.
    # NOTE(review): uses Weight_pre while the summaries below use Weight_kg;
    # presumably both are kilograms -- confirm.
    BMI = Weight_pre / ((Height_cm / 100)^2)
  )

# Per-week sample size plus mean and SD of age, weight and height.
sumTab <- dplyr::summarise(
  dplyr::group_by(mydata, Week),
  N = n(),
  Age_Mean = mean(Age),
  Age_SD = sd(Age),
  Weight_kg_M = mean(Weight_kg),
  Weight_kg_SD = sd(Weight_kg),
  Height_cm_M = mean(Height_cm),
  Height_cm_SD = sd(Height_cm)
)

# Render the weekly summary as a full-width HTML table with one decimal place.
# TRUE is spelled out because `T` is an ordinary variable that can be reassigned.
kable(sumTab, format = "html", digits = 1) %>%
  kable_styling(full_width = TRUE)
Week N Age_Mean Age_SD Weight_kg_M Weight_kg_SD Height_cm_M Height_cm_SD
1 11 27.8 2.0 71.2 10.7 164.0 8.2
4 10 28.0 2.1 71.5 11.3 164.1 8.6
8 7 27.9 2.3 73.3 8.8 162.6 5.7
12 9 28.0 2.2 69.8 10.5 161.9 5.2

Baseline Only for Significance Test

# Baseline (Week 1) descriptives for each intervention group. Columns ending
# in `_Mean`/`_M` hold means and columns ending in `_SD` hold standard
# deviations; the reshaping code that follows relies on these suffixes.
sumTab <- mydata %>%
  dplyr::filter(Week == 1) %>%
  dplyr::group_by(Intervention) %>%
  dplyr::summarise(
    N = n(),
    # `female` is a 0/1 indicator, so 1 - mean(female) is the male proportion.
    PercentMale = (1 - mean(female)) * 100,
    Age_Mean = mean(Age),
    Age_SD = sd(Age),
    Weight_kg_M = mean(Weight_kg),
    Weight_kg_SD = sd(Weight_kg),
    Height_cm_M = mean(Height_cm),
    Height_cm_SD = sd(Height_cm),
    BMI_M = mean(BMI),
    BMI_SD = sd(BMI),
    VFL_M = mean(Visceral_Fat_Level_pre),
    VFL_SD = sd(Visceral_Fat_Level_pre),
    PercBF_M = mean(Perc_Body_Fat_pre),
    PercBF_SD = sd(Perc_Body_Fat_pre),
    # NOTE(review): labelled PercLF but computed from LBM_pre -- confirm the
    # label matches the measure.
    PercLF_M = mean(LBM_pre),
    PercLF_SD = sd(LBM_pre),
    # HEI_Total is the only measure summarised with missing values dropped.
    HEI_Total_M = mean(HEI_Total, na.rm = TRUE),
    HEI_Total_SD = sd(HEI_Total, na.rm = TRUE)
  )

# Reshape the per-group summary into one row per measure with Mean/SD columns
# for each group. After t(), the row names are the summary column names and
# each column is one intervention group.
sumTab <- t(sumTab)

# Pick the mean and SD rows by name suffix. The patterns are anchored at the
# end of the name so a row can only match on its suffix, and drop = FALSE
# keeps a matrix even if only one row matches.
M <- sumTab[grepl("_M(ean)?$", rownames(sumTab)), , drop = FALSE]
SD <- sumTab[grepl("_SD$", rownames(sumTab)), , drop = FALSE]
tab <- cbind(M, SD)
# cbind() yields (group 1 mean, group 2 mean, group 1 SD, group 2 SD);
# interleave to (group 1 mean, group 1 SD, group 2 mean, group 2 SD).
# This assumes exactly two intervention groups.
tab <- tab[, c(1, 3, 2, 4)]

# Look up N and PercentMale by row name rather than by position, so adding or
# reordering summary columns cannot silently pick the wrong row. These rows
# have no SD, hence the NA fillers.
Ng <- c(sumTab["N", 1], NA, sumTab["N", 2], NA)
PercentMale <- c(sumTab["PercentMale", 1], NA, sumTab["PercentMale", 2], NA)

tab <- rbind(Ng, PercentMale, tab)
# NOTE(review): the A/B labels assume the first summary row is group A and the
# second is group B -- confirm against the Intervention values.
colnames(tab) <- c("GroupA_Mean", "GroupA_SD", "GroupB_Mean", "GroupB_SD")

# t() produced a character matrix; convert every cell back to numeric.
tab <- apply(tab, 1:2, as.numeric)

Next, we conducted a Mann-Whitney U test on each measure to compare its distribution between the intervention and placebo groups.

# Baseline (Week 1) rows only.
dat <- dplyr::filter(mydata, Week == 1)

# Variables compared between groups. The order must match the measure rows of
# `tab`, because the p-values are attached to it by position below.
VAR <- c(
  "Age", "Weight_kg", "Height_cm", "BMI", "Visceral_Fat_Level_pre",
  "Perc_Body_Fat_pre", "LBM_pre", "HEI_Total"
)

# One p-value per variable from wilcox.test() of the variable against the
# IntB indicator. `[[` extracts a plain vector whether `dat` is a data.frame
# or a tibble.
out <- vapply(
  VAR,
  function(v) wilcox.test(dat[[v]] ~ dat$IntB)$p.value,
  numeric(1)
)

# The Ng and PercentMale rows of `tab` have no test, so pad with two NAs.
out <- c(NA, NA, out)
out <- matrix(out, ncol = 1)
colnames(out) <- "P_Value"
tab <- cbind(tab, out)

# Render the baseline comparison table as full-width HTML, three decimals.
# TRUE is spelled out because `T` is an ordinary variable that can be reassigned.
kable(tab, format = "html", digits = 3) %>%
  kable_styling(full_width = TRUE)
GroupA_Mean GroupA_SD GroupB_Mean GroupB_SD P_Value
Ng 6.000 NA 5.000 NA NA
PercentMale 33.333 NA 40.000 NA NA
Age_Mean 27.333 1.506 28.400 2.608 0.638
Weight_kg_M 68.967 12.199 73.880 9.238 0.537
Height_cm_M 164.267 10.067 163.584 6.309 0.927
BMI_M 25.460 3.127 27.516 1.724 0.247
VFL_M 8.833 4.309 10.200 2.950 0.405
PercBF_M 29.750 8.551 32.340 4.999 0.464
PercLF_M 26.867 6.908 27.860 3.996 0.407
HEI_Total_M 89.364 0.446 89.817 0.365 0.201
# NOTE(review): the right-hand side of this assignment is not present on the
# page; restore it from the original analysis file before running.
tab <-
# Disabled export of the table to CSV under `w.d`.
#write.csv(tab,paste0(w.d, "/tab/table_1_results.csv"))

numbers by ASA24, FFQ, Stool, and Blood Samples


# Start from the full sample metadata for the ASA24 counts.
asa24 <- microbiome_data$meta.dat

# If the recall number is missing, the participant did not respond, so those
# rows need to be excluded from the count.

# NOTE(review): the steps that follow this pipe are not shown on the page;
# the printed result has columns Week and N -- restore them from the original
# analysis file.
asa24 %>%
# A tibble: 4 x 2
  Week      N
  <fct> <int>
1 1         9
2 4         7
3 8         4
4 12        2

Food Frequency Questionnaire (FFQ)

HEI scores were gathered at only one time point, so we subset the data to Week 1 and then exclude the missing observations.

# Count the participants with an FFQ-derived HEI score at Week 1.
ffq <- microbiome_data$meta.dat

ffq %>%
  # NOTE(review): the second filter condition was garbled on the page. It is
  # reconstructed here as "HEI_Total is not missing", following the text that
  # says missing observations are excluded -- confirm against the original
  # analysis file.
  dplyr::filter(Week == 1, !is.na(HEI_Total)) %>%
  dplyr::summarise(N = n())
1 9

Stool Samples

# Stool-sample counts: one row for the overall total and one per study week.
Nvec <- matrix(
  nrow = 5, ncol = 1,
  dimnames = list(c("Total", "Week1", "Week4", "Week8", "Week12"), c("N"))
)

# All samples in the phyloseq object.
Nvec["Total", "N"] <- nsamples(phylo_data)

# Samples collected at week 1.
subph <- subset_samples(phylo_data, Week == 1)
Nvec["Week1", "N"] <- nsamples(subph)

# Samples collected at week 4.
subph <- subset_samples(phylo_data, Week == 4)
Nvec["Week4", "N"] <- nsamples(subph)

# Samples collected at week 8.
subph <- subset_samples(phylo_data, Week == 8)
Nvec["Week8", "N"] <- nsamples(subph)

# Samples collected at week 12.
subph <- subset_samples(phylo_data, Week == 12)
Nvec["Week12", "N"] <- nsamples(subph)

Total  37
Week1  11
Week4  10
Week8   7
Week12  9

Blood Samples

# Blood Samples
# Read the blood measures and attach the baseline participant covariates.
blood_data <- read_excel("data/Blood measures data/Copy of Fiber Study Blood Results.xlsx")

meta_data <- microbiome_data$meta.dat

# Keep only the participant-level covariates, taken from the Week 1 rows.
keepVar <- c("SubjectID", "Week", "Intervention", "Stress.Scale", "Ethnicity", "Gender", "Age")
meta_data <- meta_data[, keepVar] %>%
  dplyr::filter(Week == 1)

# NOTE(review): no `by` is given, so the join uses every column name the two
# tables share -- confirm the intended key (presumably SubjectID).
blood_data <- full_join(blood_data, meta_data)
# Keep one row per participant and time point, retaining all other columns.
blood_data <- distinct(blood_data, SubjectID, time, .keep_all = TRUE)

# Number of blood-sample rows at each time point.
# NOTE(review): the final step was missing on the page (the pipeline ended in
# a dangling pipe). It is restored here as a row count named N, matching the
# printed columns `time` and `N` -- confirm against the original analysis file.
blood_data %>%
  dplyr::group_by(time) %>%
  dplyr::summarise(N = n())
# A tibble: 2 x 2
  time      N
  <chr> <int>
1 Post     11
2 Pre      11

