An extensive amount of data management is obscured from this document, goal is to inform code writing, figure generation, and etc. not to evaluate these actual data.

library(knitr)
library(tidyverse)
library(readxl)
library(rio)
library(broom)
library(GGally)
library(ggridges)
library(lme4)
library(modelr)
library(nlme)
library(ggrepel)
library(broom.mixed)
library(ggrepel)
library(ggpubr)
library(drc)
library(mgcv)
library(purrr)
library(ggpmisc)
library(equatiomatic)
library(marginaleffects)
library(modelsummary)
library(sjPlot)
library(emmeans)
library(magic)
library(lemon)

###! Tread Carefully Here !##
options(dplyr.summarise.inform=F)
### This turns off the tidyverse summarize/summarise messages indicating default grouping patterns in resultant tibbles ##
### If you don't know what this means, check out https://stackoverflow.com/questions/62140483/how-to-interpret-dplyr-message-summarise-regrouping-output-by-x-override
### Implications of this being false are unknown errors and impacts in other activities in this R session!

summary plots

cbcolors <- c(
  "PFOS" = "#999999", 
  "PFOA" = "#E69F00", 
  "PFHxS" = "#56B4E9",
  "PFHxA" = "#999933",
  "PFNA" = "#F0E442",
  "PFBS" = "#0072B2",
  "6:2 FTS" = "#D55E00",
  "8:2 FTS" = "#CC79A7"
)

notsampleddf <- data.frame(
  treatment=c(rep("PFBS",3),rep("PFNA",3)),
  Tissue=c(rep(c("Brain","Kidney","Liver"),2)),
  COMPOUND=c("NA"),
  mean=c(rep(10,3),rep(10000,3)),
  label="NA",
  Sex="M"
)
reposition_legend(
  ggplot(data=bigplotstacker3|>filter(inmixture=="yes", singletoncompound=="yes"), aes(x=Tissue, y=Concentration, fill=Sex)) +
    geom_dotplot(binaxis="y",  stackdir="center")+
    facet_wrap(~fct_relevel(treatment, "PFOS","PFOA","PFHxS","PFNA","8:2 FTS","PFBS","PFHxA","6:2 FTS"), scales="free_y", axes="all") +
  geom_text(data=notsampleddf, aes(y=mean, label=label), color="black", show.legend=F)+
    scale_y_log10(labels=scales::label_comma())+
    theme_classic(base_size = 20) +
    labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", x=NULL)+
    theme(axis.text=element_text(color="black"), strip.background=element_rect(fill="white",color="white",linewidth=1), strip.text=element_text(face="bold"), legend.text=element_text(size=20), legend.title=element_text(size=20)) +
    guides(fill=guide_legend(override.aes=list(size=15))),
  position='center', panel='panel-3-3')

ggplot(data=bigplotstacker3|>filter(inmixture=="yes", singletoncompound=="no"), aes(x=Tissue, y=Concentration, fill=COMPOUND)) +
  geom_dotplot(binaxis="y",  stackdir="center", dotsize=1)+
  facet_wrap(~treatment, scales="free_y", axes="all") +
  scale_y_log10(labels=scales::label_comma())+
  theme_classic(base_size = 20) +
  labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", fill="", x=NULL) +
  guides(fill=guide_legend(title="PFAS"))+
  #scale_color_manual(values=cbcolors)+
  scale_fill_manual(values=cbcolors) +
  theme(axis.text=element_text(color="black"), strip.background=element_rect(fill="white",color="white",linewidth=1), strip.text=element_text(face="bold"), legend.text=element_text(size=14), legend.position="bottom") +
  guides(fill=guide_legend(override.aes=list(size=12), nrow=1))

cbcolors2 <- c(
  "PFOS" = "#999999", 
  "PFOA" = "#E69F00", 
  "PFHxS" = "#56B4E9",
  "PFHxA" = "#999933",
  "PFNA" = "#F0E442",
  "PFBS" = "#0072B2",
  "6:2 FTS" = "#D55E00",
  "8:2 FTS" = "#CC79A7",
  
  "PFPeA"="#AA0DFE",
  "PFPeS"="#3283FE",
  "PFTeDA"="#85660D",
  "PFTrDA"="#782AB6",
  "PFUnA"="#565656",
  "PFDS"="#1C8356",
  "PFDoA"="#16FF32",
  "PFDoS"="#F7E1A0",
  "PFHpA"="#E2E2E2",
  "PFHpS"="#1CBE4F",
  "PFMBA"="#C4451C",
  "PFNS"="#DEA0FD",
  "7:3 FTCA"="#FE00FA",
  "4:2 FTS"="#009e73",
  "EtFOSAA"="#325A9B",
  "MeFOSAA"="#FEAF16",
  "N-EtFOSE"="#F8A19F",
  "N-MeFOSE"="#90AD1C",
  "PFBA"="#F6222E",
  "PFDA"="#1CFFCE"
)



bigplotstacker3 <- bigplotstacker3 |>
  mutate(
    logConcentration=log(Concentration),
    logDose=log(dose)
  )


sumplot2 <- ggplot(data=bigplotstacker3, aes(x=dose, y=Concentration, color=COMPOUND)) +
  geom_point(size=3, alpha=0.25) +
  geom_smooth(method="lm", formula=y~x, se=F, linewidth=2) +
  facet_wrap(~Tissue) +
  scale_y_log10(labels=scales::label_comma())+
  scale_x_log10(labels=scales::label_comma())+
  theme_classic(base_size = 22) +
  labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", caption="", x="Dose (mg/kg-d)") +
  scale_color_manual(values=cbcolors2) +
  theme(strip.background=element_rect(fill="white",color="white",linewidth=1)) #+
  #scale_fill_manual(values=cbcolors2)

reposition_legend(sumplot2, 'center', panel='panel-3-2')

reposition_legend(
ggplot(data=bigplotstacker3, aes(x=dose, y=Concentration, color=COMPOUND)) +
  geom_point(size=3, alpha=0.25) +
  geom_smooth(method="lm", formula=y~x, se=F, linewidth=2) +
  facet_wrap(~Tissue*Sex) +
  scale_y_log10(labels=scales::label_comma())+
  scale_x_log10(labels=scales::label_comma())+
  theme_classic(base_size = 22) +
  labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", caption=NULL, color=NULL,x="Dose (mg/kg-d)") +
  scale_color_manual(values=cbcolors2) +
  theme(strip.background=element_rect(fill="white",color="white",linewidth=1)),
 'center', panel='panel-4-3')

all tissues all mixture using broom

fullmixedmodelsdosebased <- bigplotstacker3|>filter(!is.na(logDose)) |>
  nest(data=-Tissue) |>
  mutate(
    fit=map(data, ~ lmer(logConcentration ~logDose+Sex+(logDose|COMPOUND), data=.x)),
    tidied=map(fit, tidy),
    glanced=map(fit, glance),
    augmented=map(fit, augment)
  )
## boundary (singular) fit: see help('isSingular')
fullmixedmodelsdosebased |>
  unnest(tidied) 
fullmixedmodelsdosebased |>
  unnest(tidied) |>
  dplyr::select(Tissue, effect, term, estimate, std.error)|>
  group_by(Tissue, effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 
fullmixedmodelsdosebased |>
  unnest(glanced) 
#fullmixedmodelsdosebased|>
#  unnest(augmented)



ggplot(data=fullmixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

ggplot(data=fullmixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue*Sex) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

all tissues all mixed to get random effect param values

Whole Body

mixallWB <- lmer(logConcentration ~logDose+Sex+(logDose|COMPOUND), data = bigplotstacker3|>filter(Tissue=="Wholebody",!is.na(logConcentration)), REML=T)
summary(mixallWB)
## Linear mixed model fit by REML ['lmerMod']
## Formula: logConcentration ~ logDose + Sex + (logDose | COMPOUND)
##    Data: 
## filter(bigplotstacker3, Tissue == "Wholebody", !is.na(logConcentration))
## 
## REML criterion at convergence: 1493.6
## 
## Scaled residuals: 
##     Min      1Q  Median      3Q     Max 
## -6.9700 -0.3582  0.0128  0.4269  4.0496 
## 
## Random effects:
##  Groups   Name        Variance Std.Dev. Corr
##  COMPOUND (Intercept) 7.99624  2.8278       
##           logDose     0.04017  0.2004   0.88
##  Residual             0.22966  0.4792       
## Number of obs: 1010, groups:  COMPOUND, 11
## 
## Fixed effects:
##             Estimate Std. Error t value
## (Intercept)  7.67585    0.86576   8.866
## logDose      0.83113    0.06435  12.916
## SexM         0.31552    0.03031  10.409
## 
## Correlation of Fixed Effects:
##         (Intr) logDos
## logDose  0.870       
## SexM    -0.015  0.011
fixef(mixallWB)
## (Intercept)     logDose        SexM 
##   7.6758520   0.8311269   0.3155191
ranef(mixallWB)
## $COMPOUND
##         (Intercept)     logDose
## 6:2 FTS  -0.5043785 -0.19609479
## 8:2 FTS   1.4884508  0.05694876
## PFBS     -3.6437169 -0.30698430
## PFHpS     2.4612902  0.26647197
## PFHxA    -6.0778594 -0.27626678
## PFHxS     1.6868963  0.13368940
## PFNA      1.3178685  0.01177662
## PFNS      1.5408796  0.06594370
## PFOA      1.7498237  0.13916327
## PFOS      2.0978518  0.16504180
## PFPeS    -2.1171061 -0.05968965
## 
## with conditional variances for "COMPOUND"
coef(mixallWB) 
## $COMPOUND
##         (Intercept)   logDose      SexM
## 6:2 FTS    7.171474 0.6350321 0.3155191
## 8:2 FTS    9.164303 0.8880757 0.3155191
## PFBS       4.032135 0.5241426 0.3155191
## PFHpS     10.137142 1.0975989 0.3155191
## PFHxA      1.597993 0.5548602 0.3155191
## PFHxS      9.362748 0.9648163 0.3155191
## PFNA       8.993721 0.8429035 0.3155191
## PFNS       9.216732 0.8970706 0.3155191
## PFOA       9.425676 0.9702902 0.3155191
## PFOS       9.773704 0.9961687 0.3155191
## PFPeS      5.558746 0.7714373 0.3155191
## 
## attr(,"class")
## [1] "coef.mer"
mixallWB |>
  tidy() |>
  #dplyr::select(effect, term, estimate, std.error)|>
  group_by(effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 
extract_eq(mixallWB, use_coefs=F, mean_separate=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

\[ \begin{aligned} \operatorname{ln(Whole\ Body,\ ng/g)}_{i} &\sim N \left(\mu, \sigma^2 \right) \\ \mu &=\alpha_{j[i]} + \beta_{1j[i]}(\operatorname{ln(Dose,\ mg/kg-d)}) + \beta_{2}(\operatorname{Sex}_{\operatorname{Male}}) \\ \left( \begin{array}{c} \begin{aligned} &\alpha_{j} \\ &\beta_{1j} \end{aligned} \end{array} \right) &\sim N \left( \left( \begin{array}{c} \begin{aligned} &\mu_{\alpha_{j}} \\ &\mu_{\beta_{1j}} \end{aligned} \end{array} \right) , \left( \begin{array}{cc} \sigma^2_{\alpha_{j}} & \rho_{\alpha_{j}\beta_{1j}} \\ \rho_{\beta_{1j}\alpha_{j}} & \sigma^2_{\beta_{1j}} \end{array} \right) \right) \text{, for COMPOUND j = 1,} \dots \text{,J} \end{aligned} \]

extract_eq(mixallWB, use_coefs=T, mean_separate=T, index_factors=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

\[ \begin{aligned} \operatorname{\widehat{ln(Whole\ Body,\ ng/g)}}_{i} &\sim N \left(\mu, \sigma^2 \right) \\ \mu &=7.68_{\alpha_{j[i]}} + 0.83_{\beta_{1j[i]}}(\operatorname{ln(Dose,\ mg/kg-d)}) + 0.32_{\beta_{2}}(\operatorname{Sex}_{\operatorname{Male}}) \\ \left( \begin{array}{c} \begin{aligned} &\alpha_{j} \\ &\beta_{1j} \end{aligned} \end{array} \right) &\sim N \left( \left( \begin{array}{c} \begin{aligned} &0 \\ &0 \end{aligned} \end{array} \right) , \left( \begin{array}{cc} 2.83 & 0.88 \\ 0.88 & 0.2 \end{array} \right) \right) \text{, for COMPOUND j = 1,} \dots \text{,J} \end{aligned} \]

tab_model(mixallWB)
  logConcentration
Predictors Estimates CI p
(Intercept) 7.68 5.98 – 9.37 <0.001
logDose 0.83 0.70 – 0.96 <0.001
Sex [M] 0.32 0.26 – 0.38 <0.001
Random Effects
σ2 0.23
τ00 COMPOUND 8.00
τ11 COMPOUND.logDose 0.04
ρ01 COMPOUND 0.88
ICC 0.96
N COMPOUND 11
Observations 1010
Marginal R2 / Conditional R2 0.460 / 0.979
modelsummary(dvnames(mixallWB), 
             estimate="{estimate} [{conf.low}, {conf.high}]", 
             statistic=NULL,
             coef_rename=coef_rename)
logConcentration
(Intercept) 7.676 [5.977, 9.375]
logDose 0.831 [0.705, 0.957]
SexM 0.316 [0.256, 0.375]
SD (Intercept COMPOUND) 2.828
SD (logDose COMPOUND) 0.200
Cor (Intercept~logDose COMPOUND) 0.881
SD (Observations) 0.479
Num.Obs. 1010
R2 Marg. 0.460
R2 Cond. 0.979
AIC 1507.6
BIC 1542.0
ICC 1.0
RMSE 0.47
plot_predictions(mixallWB, condition=list("logDose","COMPOUND")) +
  theme_classic() +
  labs(y="Estimated logConcentration")

plot_predictions(mixallWB, condition=list("logDose","COMPOUND")) +
  facet_wrap(~COMPOUND)+
  theme_classic() +
  labs(y="Estimated logConcentration")

all tissues no mixture using broom

nonemixedmodelsdosebased <- bigplotstacker3|>filter(!is.na(logDose)) |>
  nest(data=-Tissue) |>
  mutate(
    fit=map(data, ~ lmer(logConcentration ~logDose+Sex+(1|COMPOUND), data=.x)),
    tidied=map(fit, tidy),
    glanced=map(fit, glance),
    augmented=map(fit, augment)
  )

nonemixedmodelsdosebased |>
  unnest(tidied) 
nonemixedmodelsdosebased |>
  unnest(tidied) |>
  dplyr::select(Tissue, effect, term, estimate, std.error)|>
  group_by(Tissue, effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 
nonemixedmodelsdosebased |>
  unnest(glanced) 
#nonemixedmodelsdosebased|>
#  unnest(augmented)


ggplot(data=nonemixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

ggplot(data=nonemixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue*Sex) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

all tissues no mixed to get random effect param values

Whole Body

nomixallWB <- lmer(logConcentration ~logDose+Sex+(1|COMPOUND), data = bigplotstacker3|>filter(Tissue=="Wholebody",!is.na(logConcentration)), REML=T)
summary(nomixallWB)
## Linear mixed model fit by REML ['lmerMod']
## Formula: logConcentration ~ logDose + Sex + (1 | COMPOUND)
##    Data: 
## filter(bigplotstacker3, Tissue == "Wholebody", !is.na(logConcentration))
## 
## REML criterion at convergence: 1763.2
## 
## Scaled residuals: 
##     Min      1Q  Median      3Q     Max 
## -6.5698 -0.3434  0.0374  0.4403  5.7816 
## 
## Random effects:
##  Groups   Name        Variance Std.Dev.
##  COMPOUND (Intercept) 6.5691   2.5630  
##  Residual             0.3071   0.5541  
## Number of obs: 1010, groups:  COMPOUND, 11
## 
## Fixed effects:
##             Estimate Std. Error t value
## (Intercept) 7.716252   0.773705   9.973
## logDose     0.908548   0.008793 103.323
## SexM        0.326414   0.035007   9.324
## 
## Correlation of Fixed Effects:
##         (Intr) logDos
## logDose  0.033       
## SexM    -0.022  0.037
fixef(nomixallWB)
## (Intercept)     logDose        SexM 
##   7.7162521   0.9085479   0.3264141
ranef(nomixallWB)
## $COMPOUND
##         (Intercept)
## 6:2 FTS  -0.1624136
## 8:2 FTS   1.4996219
## PFBS     -3.7808041
## PFHpS     1.5836937
## PFHxA    -5.6084134
## PFHxS     1.5314868
## PFNA      1.4245553
## PFNS      1.5908916
## PFOA      1.4490210
## PFOS      1.9662436
## PFPeS    -1.4938828
## 
## with conditional variances for "COMPOUND"
coef(nomixallWB) 
## $COMPOUND
##         (Intercept)   logDose      SexM
## 6:2 FTS    7.553839 0.9085479 0.3264141
## 8:2 FTS    9.215874 0.9085479 0.3264141
## PFBS       3.935448 0.9085479 0.3264141
## PFHpS      9.299946 0.9085479 0.3264141
## PFHxA      2.107839 0.9085479 0.3264141
## PFHxS      9.247739 0.9085479 0.3264141
## PFNA       9.140807 0.9085479 0.3264141
## PFNS       9.307144 0.9085479 0.3264141
## PFOA       9.165273 0.9085479 0.3264141
## PFOS       9.682496 0.9085479 0.3264141
## PFPeS      6.222369 0.9085479 0.3264141
## 
## attr(,"class")
## [1] "coef.mer"
nomixallWB |> glance()
nomixallWB |>
  tidy() |>
  #dplyr::select(effect, term, estimate, std.error)|>
  group_by(effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 
extract_eq(nomixallWB, use_coefs=F, mean_separate=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

\[ \begin{aligned} \operatorname{ln(Whole\ Body,\ ng/g)}_{i} &\sim N \left(\mu, \sigma^2 \right) \\ \mu &=\alpha_{j[i]} + \beta_{1}(\operatorname{ln(Dose,\ mg/kg-d)}) + \beta_{2}(\operatorname{Sex}_{\operatorname{Male}}) \\ \alpha_{j} &\sim N \left(\mu_{\alpha_{j}}, \sigma^2_{\alpha_{j}} \right) \text{, for COMPOUND j = 1,} \dots \text{,J} \end{aligned} \]

extract_eq(nomixallWB, use_coefs=T, mean_separate=T, index_factors=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

\[ \begin{aligned} \operatorname{\widehat{ln(Whole\ Body,\ ng/g)}}_{i} &\sim N \left(\mu, \sigma^2 \right) \\ \mu &=7.72_{\alpha_{j[i]}} + 0.91_{\beta_{1}}(\operatorname{ln(Dose,\ mg/kg-d)}) + 0.33_{\beta_{2}}(\operatorname{Sex}_{\operatorname{Male}}) \\ \alpha_{j} &\sim N \left(0, 2.56 \right) \text{, for COMPOUND j = 1,} \dots \text{,J} \end{aligned} \]

tab_model(nomixallWB)
  logConcentration
Predictors Estimates CI p
(Intercept) 7.72 6.20 – 9.23 <0.001
logDose 0.91 0.89 – 0.93 <0.001
Sex [M] 0.33 0.26 – 0.40 <0.001
Random Effects
σ2 0.31
τ00 COMPOUND 6.57
ICC 0.96
N COMPOUND 11
Observations 1010
Marginal R2 / Conditional R2 0.464 / 0.976
modelsummary(dvnames(nomixallWB), 
             estimate="{estimate} [{conf.low}, {conf.high}]", 
             statistic=NULL,
             coef_rename=coef_rename)
logConcentration
(Intercept) 7.716 [6.198, 9.235]
logDose 0.909 [0.891, 0.926]
SexM 0.326 [0.258, 0.395]
SD (Intercept COMPOUND) 2.563
SD (Observations) 0.554
Num.Obs. 1010
R2 Marg. 0.464
R2 Cond. 0.976
AIC 1773.2
BIC 1797.8
ICC 1.0
RMSE 0.55
plot_predictions(nomixallWB, condition=list("logDose","COMPOUND")) +
  theme_classic() +
  labs(y="Estimated logConcentration")

plot_predictions(nomixallWB, condition=list("logDose","COMPOUND")) +
  facet_wrap(~COMPOUND)+
  theme_classic() +
  labs(y="Estimated logConcentration")

matrix(c(rownames(as.data.frame(coef(nomixallWB)$COMPOUND)),
         rep(" & ", NROW(coef(nomixallWB)$COMPOUND)),
         round(as.data.frame(coef(nomixallWB)$COMPOUND),2)[,1],
         rep(" \\", NROW(coef(nomixallWB)$COMPOUND))), ncol=4)
##       [,1]      [,2]  [,3]   [,4] 
##  [1,] "6:2 FTS" " & " "7.55" " \\"
##  [2,] "8:2 FTS" " & " "9.22" " \\"
##  [3,] "PFBS"    " & " "3.94" " \\"
##  [4,] "PFHpS"   " & " "9.3"  " \\"
##  [5,] "PFHxA"   " & " "2.11" " \\"
##  [6,] "PFHxS"   " & " "9.25" " \\"
##  [7,] "PFNA"    " & " "9.14" " \\"
##  [8,] "PFNS"    " & " "9.31" " \\"
##  [9,] "PFOA"    " & " "9.17" " \\"
## [10,] "PFOS"    " & " "9.68" " \\"
## [11,] "PFPeS"   " & " "6.22" " \\"
bmatrix = function(x, digits=NULL, ...) {
  library(xtable)
  default_args = list(include.colnames=FALSE, only.contents=TRUE,
                      include.rownames=FALSE, hline.after=NULL, comment=FALSE,
                      print.results=FALSE)
  passed_args = list(...)
  calling_args = c(list(x=xtable(x, digits=digits)),
                   c(passed_args,
                     default_args[setdiff(names(default_args), names(passed_args))]))
  cat("\\begin{bmatrix}\n",
      do.call(print.xtable, calling_args),
      "\\end{bmatrix}\n")
}

bmatrix(matrix(c(rownames(as.data.frame(coef(nomixallWB)$COMPOUND)),
         round(as.data.frame(coef(nomixallWB)$COMPOUND),2)[,1]), ncol=2))
## \begin{bmatrix}
##   6:2 FTS & 7.55 \\ 
##   8:2 FTS & 9.22 \\ 
##   PFBS & 3.94 \\ 
##   PFHpS & 9.3 \\ 
##   PFHxA & 2.11 \\ 
##   PFHxS & 9.25 \\ 
##   PFNA & 9.14 \\ 
##   PFNS & 9.31 \\ 
##   PFOA & 9.17 \\ 
##   PFOS & 9.68 \\ 
##   PFPeS & 6.22 \\ 
##    \end{bmatrix}

\[ \widehat{ln(Whole\ Body,\ ng/g)} \sim N (\mu, 0.55) \\ \mu =\begin{bmatrix} 6:2 FTS & 7.55 \\ 8:2 FTS & 9.22 \\ PFBS & 3.94 \\ PFHpS & 9.3 \\ PFHxA & 2.11 \\ PFHxS & 9.25 \\ PFNA & 9.14 \\ PFNS & 9.31 \\ PFOA & 9.17 \\ PFOS & 9.68 \\ PFPeS & 6.22 \\ \end{bmatrix} + 0.91(ln(Dose, mg/kg))+ 0.33(Sex_{M=1;F=0}) \]

Comes from:

$$ 
\widehat{ln(Whole\ Body,\ ng/g)}  \sim N (\mu, `r round(as.data.frame(VarCorr(nomixallWB))[2,5],2)`) \\
\mu =\begin{bmatrix}
  6:2 FTS & 7.55 \\ 
  8:2 FTS & 9.22 \\ 
  PFBS & 3.94 \\ 
  PFHpS & 9.3 \\ 
  PFHxA & 2.11 \\ 
  PFHxS & 9.25 \\ 
  PFNA & 9.14 \\ 
  PFNS & 9.31 \\ 
  PFOA & 9.17 \\ 
  PFOS & 9.68 \\ 
  PFPeS & 6.22 \\ 
   \end{bmatrix} + `r round(fixef(nomixallWB),2)[[2]]`(ln(Dose, mg/kg))+ `r round(fixef(nomixallWB),2)[[3]]`(Sex_{M=1;F=0})
$$

written “in line” in the .Rmd file.

---
title: "Prediction of Additive PFAS Exposure in Mice Example"
author: "Andrew East"
date: "`r Sys.Date()`"
output: 
  html_document:
    df_print: paged
    toc: yes
    toc_float: yes
    code_folding: hide
    code_download: yes
---

An extensive amount of data management is obscured from this document, goal is to inform code writing, figure generation, and etc. not to evaluate these actual data.  


```{r, message=F, warning=F}

library(knitr)
library(tidyverse)
library(readxl)
library(rio)
library(broom)
library(GGally)
library(ggridges)
library(lme4)
library(modelr)
library(nlme)
library(ggrepel)
library(broom.mixed)
library(ggrepel)
library(ggpubr)
library(drc)
library(mgcv)
library(purrr)
library(ggpmisc)
library(equatiomatic)
library(marginaleffects)
library(modelsummary)
library(sjPlot)
library(emmeans)
library(magic)
library(lemon)

###! Tread Carefully Here !##
options(dplyr.summarise.inform=F)
### This turns off the tidyverse summarize/summarise messages indicating default grouping patterns in resultant tibbles ##
### If you don't know what this means, check out https://stackoverflow.com/questions/62140483/how-to-interpret-dplyr-message-summarise-regrouping-output-by-x-override
### Implications of this being false are unknown errors and impacts in other activities in this R session!


```



```{r, warning=FALSE, include=FALSE}

SGSfiles <- list.files(path="C:/Users/easta/Desktop/PFAS additivity in mice/Analysis/tissues_copyrawdata",
                       pattern="*.xlsx",
                       recursive=T,
                       full.names=T)

Data1 <- import_list(SGSfiles, rbind=T, rbind_fill=T, rbind_label="file", col_names=T,na="") |>
  dplyr::select(SAMPLE_NO,AXYS_ID,LAB_FLAG,COMPOUND,CONC_FOUND,UNIT,file) |>
  mutate(UNIT=factor(UNIT),
         COMPOUND=factor(COMPOUND)) |>
  filter(!UNIT%in%c("% Recovery")&SAMPLE_NO!="Lab Blank") |>  #insert LAB_FLAG code rejections here
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90704 WG89323 PFAS/V89323PFAS_Database_L41244_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90805 WG89322 PFAS/V89322PFAS_Database_L41244_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90686 WG89324 PFAS/V89324PFAS_Database_L41244_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90651 WG89699 PFAS/WG89699PFAS_Database_1.xlsx") |>
  droplevels()

keyfile <- read_csv("C:/Users/easta/Desktop/PFAS additivity in mice/Analysis/mousemixturesdatakeys/tissueanimalkey.csv") 

Data1 <- merge(Data1, keyfile|>dplyr::select(AnimalID, SAMPLE_NO,Treatment, sampletype, study,PFAS,Sex,Tissue), by="SAMPLE_NO")|>
  mutate(treatment=factor(Treatment, levels=c("PFOS","PFOA","PFHxS","PFHxA","PFNA","PFBS","6:2 FTS","8:2 FTS","C6-8 Low","C6-8 Medium","C6-8 High","FTS Low","FTS Medium","FTS High","Control")),
         sampletype=factor(sampletype),
         study=factor(study),
         singletoncompound=case_when(
           as.character(treatment)==as.character(COMPOUND) ~ "yes",
           T~"no"),
         inmixture=case_when(
           str_detect(PFAS,as.character(COMPOUND)) ~ "yes",
           T~"no"
         )) |>
  mutate(val_qual=
           case_when(
             is.na(LAB_FLAG) ~ "qual",
             LAB_FLAG=="J" ~ "trace",
             LAB_FLAG=="H" ~ "estimated, for info only",
             LAB_FLAG=="K" ~ "bad, maximum possible reported",
             LAB_FLAG=="U" ~ "nondetect",
             LAB_FLAG=="D" ~ "qual via dilution",
             LAB_FLAG=="X" ~ "ignore",
             LAB_FLAG=="D J" ~ "trace via dilution",
             LAB_FLAG=="K J" ~ "max possible, trace",
             LAB_FLAG=="K D J" ~ "max possible, trace, via dilution",
             LAB_FLAG=="U D" ~ "nondetect via dilution",
             LAB_FLAG=="U D H" ~ "nondetect via dilution, for info only",
             LAB_FLAG=="U H" ~ "non detect for info only",
             LAB_FLAG=="D H" ~ "estimated, over",
             T ~ "other, nonqual"
           )
  )


```


```{r include=FALSE}

Data1b <- import_list(SGSfiles, rbind=T, rbind_fill=T, rbind_label="file", col_names=T,na="") |>
  dplyr::select(SAMPLE_NO,AXYS_ID,LAB_FLAG,COMPOUND,CONC_FOUND,DETECTION_LIMIT,UNIT,file) |>
  mutate(UNIT=factor(UNIT),
         COMPOUND=factor(COMPOUND)) |>
  filter(!UNIT%in%c("% Recovery")&SAMPLE_NO!="Lab Blank") |>  #insert LAB_FLAG code rejections here
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90704 WG89323 PFAS/V89323PFAS_Database_L41244_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90805 WG89322 PFAS/V89322PFAS_Database_L41244_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90686 WG89324 PFAS/V89324PFAS_Database_L41244_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/New folder/SGSAxys_tissues_year2_batch/4728 DPWG90651 WG89699 PFAS/WG89699PFAS_Database_1.xlsx") |>
  droplevels()

Data1b <- merge(Data1b, keyfile|>dplyr::select(AnimalID, SAMPLE_NO,Treatment, sampletype, study,PFAS,Sex,Tissue), by="SAMPLE_NO")|>
  mutate(treatment=factor(Treatment, levels=c("PFOS","PFOA","PFHxS","PFHxA","PFNA","PFBS","6:2 FTS","8:2 FTS","C6-8 Low","C6-8 Medium","C6-8 High","FTS Low","FTS Medium","FTS High","Control")),
         sampletype=factor(sampletype),
         study=factor(study),
         singletoncompound=case_when(
           as.character(treatment)==as.character(COMPOUND) ~ "yes",
           T~"no"),
         inmixture=case_when(
           str_detect(PFAS,as.character(COMPOUND)) ~ "yes",
           T~"no"
         )) |>
  mutate(val_qual=
           case_when(
             is.na(LAB_FLAG) ~ "qual",
             LAB_FLAG=="J" ~ "trace",
             LAB_FLAG=="H" ~ "estimated, for info only",
             LAB_FLAG=="K" ~ "bad, maximum possible reported",
             LAB_FLAG=="U" ~ "nondetect",
             LAB_FLAG=="D" ~ "qual via dilution",
             LAB_FLAG=="X" ~ "ignore",
             LAB_FLAG=="D J" ~ "trace via dilution",
             LAB_FLAG=="K J" ~ "max possible, trace",
             LAB_FLAG=="K D J" ~ "max possible, trace, via dilution",
             LAB_FLAG=="U D" ~ "nondetect via dilution",
             LAB_FLAG=="U D H" ~ "nondetect via dilution, for info only",
             LAB_FLAG=="U H" ~ "non detect for info only",
             LAB_FLAG=="D H" ~ "estimated, over",
             T ~ "other, nonqual"
           )
  )




```



```{r, warning=F, include=F}

SGSfiles2 <- list.files(path="C:/Users/easta/Desktop/PFAS additivity in mice/Analysis/waterwholebodyserum_copyrawdata",
                       pattern="*.xlsx",
                       recursive=T,
                       full.names=T)

Data12 <- import_list(SGSfiles2, rbind=T, rbind_fill=T, rbind_label="file", col_names=T,na="") |>
  dplyr::select(SAMPLE_NO,AXYS_ID,LAB_FLAG,COMPOUND,CONC_FOUND,UNIT,file) |>
  bind_rows() |>
  mutate(UNIT=factor(UNIT),
         COMPOUND=factor(COMPOUND)) |>
  filter(!UNIT%in%c("% Recovery")&SAMPLE_NO!="Lab Blank") |>  #insert LAB_FLAG code rejections here
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG87004 WG85096 PFAS/V85096PFAS_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86446 WG85199 PFAS EXTD/V85199PFAS-EXTD_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86452 WG85200 PFAS EXTD/V85200PFAS-EXTD_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86455 WG85201 PFAS EXTD/V85201PFAS-EXTD_Database_2.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86885 WG85051 PFAS/V85051PFAS_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86950 WG85052 PFAS/V85052PFAS_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86878 WG85083 PFAS/V85083PFAS_Database_1.xlsx") |>
  droplevels()

keyfile2 <- read_excel("C:/Users/easta/Desktop/PFAS additivity in mice/Analysis/mousemixturesdatakeys/Data_Key.xlsx", sheet="Sheet1") 

Data12 <- merge(Data12, keyfile2|>dplyr::select(animalnumberonly, SAMPLE_NO,treatment, sampletype, study,PFAS,sex), by="SAMPLE_NO")|>
  mutate(treatment=factor(treatment, levels=c("PFOS","PFOA","PFHxS","PFHxA","PFNA","PFBS","6:2 FTS","8:2 FTS","C68LOW","C68MED","C68HIGH","FTSLOW","FTSMED","FTSHIGH","Control")),
         sampletype=factor(sampletype),
         study=factor(study),
         singletoncompound=case_when(
           as.character(treatment)==as.character(COMPOUND) ~ "yes",
           T~"no"),
         inmixture=case_when(
           str_detect(PFAS,as.character(COMPOUND)) ~ "yes",
           T~"no"
         )) |>
  mutate(val_qual=
           case_when(
             is.na(LAB_FLAG) ~ "qual",
             LAB_FLAG=="J" ~ "trace",
             LAB_FLAG=="H" ~ "estimated",
             LAB_FLAG=="K" ~ "bad, maximum possible reported",
             LAB_FLAG=="U" ~ "nondetect",
             LAB_FLAG=="D" ~ "qual via dilution",
             LAB_FLAG=="X" ~ "ignore",
             LAB_FLAG=="D J" ~ "trace via dilution",
             LAB_FLAG=="D H"&study!="serum"&sampletype!="serum"&treatment!="6:2 FTS"&COMPOUND!="6:2 FTS" ~ "estimated, over",
             study=="serum"&sampletype=="serum"&treatment=="C68MED"&COMPOUND=="PFHxS"&LAB_FLAG=="D H"&str_detect(AXYS_ID,"2$") ~ "qual, over",
             study=="serum"&sampletype=="serum"&treatment=="C68MED"&COMPOUND=="PFHxS"&LAB_FLAG=="D H"&!str_detect(AXYS_ID,"2$") ~ "estimated, over",
             study=="serum"&sampletype=="serum"&treatment=="6:2 FTS"&COMPOUND=="6:2 FTS"&LAB_FLAG=="D H" ~ "qual, over",
             T ~ "other, nonqual"
           )
  )



Data12qualish <- Data12 |>
  filter(val_qual%in%c("qual","trace","qual via dilution","trace via dilution","qual, over")|
           (val_qual=="estimated"&study=="wholebody"&sampletype=="wholebody"&treatment=="PFOA"&COMPOUND=="PFOA")|
           (val_qual=="estimated"&study=="serum"&sampletype=="serum"&treatment=="PFHxS"&COMPOUND=="PFHxS")|
           (val_qual=="estimated, over"&study=="wholebody"&sampletype=="wholebody"&treatment=="PFNA"&COMPOUND=="PFNA")|
           (val_qual=="estimated, over"&study=="wholebody"&sampletype=="wholebody"&treatment=="PFOS"&COMPOUND=="PFOS")|
           (val_qual=="estimated, over"&study=="serum"&sampletype=="serum"&treatment=="C68MED"&COMPOUND=="PFHxS"&str_detect(AXYS_ID,"2$"))|
           (val_qual=="estimated, over"&study=="wholebody"&sampletype=="wholebody"&treatment=="C68MED"&COMPOUND=="PFHxS")|
           (val_qual=="estimated, over"&study=="serum"&sampletype=="serum"&treatment=="C68MED"&COMPOUND=="PFOS")|
           (val_qual=="estimated, over"&study=="wholebody"&sampletype=="wholebody"&(treatment=="C68LOW"|treatment=="C68MED"|treatment=="C68HIGH"|treatment=="FTSLOW"|treatment=="FTSMED"|treatment=="FTSHIGH")&COMPOUND=="PFOS")
  )

########## new stuff on 12JUL2024

serumdata <- Data12qualish |>
  ungroup() |>
  droplevels() |>
  filter(sampletype=="serum") |>
  #filter(inmixture=="yes"|treatment=="Control") |>
  mutate(
    treatment=case_when(
    treatment=="C68LOW" ~ "C6-8 Low",
    treatment=="C68MED" ~ "C6-8 Medium",
    treatment=="C68HIGH" ~ "C6-8 High",
    treatment=="FTSLOW" ~ "FTS Low",
    treatment=="FTSMED" ~ "FTS Medium",
    treatment=="FTSHIGH" ~ "FTS High",
    T ~ treatment
  ) 
  ) |>
  rename(AnimalID=animalnumberonly) |>
  dplyr::select(AnimalID,sex,treatment,COMPOUND,CONC_FOUND,sampletype,singletoncompound,inmixture,val_qual) |>  # include flags in select?
  mutate(sampletype=as.character(sampletype),
         COMPOUND=as.character(COMPOUND))|>
  droplevels() |>
  ungroup()

waterdata <- Data12qualish |>
  #filter(inmixture=="yes"|(treatment=="Control")) |>
  droplevels() |>
  group_by(sampletype,study,COMPOUND,treatment) |>
  mutate(CONC_FOUND=case_when(
    sampletype=="water"~(mean(CONC_FOUND, na.rm=T)/1e8),
    sampletype=="wholebody"~(mean(CONC_FOUND, na.rm=T)),
    T~mean(CONC_FOUND, na.rm=T)
  )
  ) |>
  mutate(
    treatment=case_when(
    treatment=="C68LOW" ~ "C6-8 Low",
    treatment=="C68MED" ~ "C6-8 Medium",
    treatment=="C68HIGH" ~ "C6-8 High",
    treatment=="FTSLOW" ~ "FTS Low",
    treatment=="FTSMED" ~ "FTS Medium",
    treatment=="FTSHIGH" ~ "FTS High",
    T ~ treatment
  ) 
  ) |>
  summarize(mean=mean(CONC_FOUND, na.rm=T)) |>
  pivot_wider(names_from=c(sampletype, study), values_from=mean) |>
  dplyr::select(c(COMPOUND,treatment,water_serum)) |>
  rename(dose=water_serum) |>
  mutate(logdose=log(dose))



waterdataWB <- Data12qualish |>
  #filter(inmixture=="yes"|(treatment=="Control")) |>
  droplevels() |>
  group_by(sampletype,study,COMPOUND,treatment) |>
  mutate(CONC_FOUND=case_when(
    sampletype=="water"~(mean(CONC_FOUND, na.rm=T)/1e8),
    sampletype=="wholebody"~(mean(CONC_FOUND, na.rm=T)),
    T~mean(CONC_FOUND, na.rm=T)
  )
  ) |>
  mutate(
    treatment=case_when(
    treatment=="C68LOW" ~ "C6-8 Low",
    treatment=="C68MED" ~ "C6-8 Medium",
    treatment=="C68HIGH" ~ "C6-8 High",
    treatment=="FTSLOW" ~ "FTS Low",
    treatment=="FTSMED" ~ "FTS Medium",
    treatment=="FTSHIGH" ~ "FTS High",
    T ~ treatment
  ) 
  ) |>
  summarize(mean=mean(CONC_FOUND, na.rm=T)) |>
  pivot_wider(names_from=c(sampletype, study), values_from=mean) |>
  dplyr::select(c(COMPOUND,treatment,water_wholebody)) |>
  rename(dose=water_wholebody) |>
  mutate(logdose=log(dose))



wholebodydata <- Data12qualish |>
  ungroup() |>
  droplevels() |>
  filter(sampletype=="wholebody") |>
  #filter(inmixture=="yes"|treatment=="Control") |>
  mutate(
    treatment=case_when(
    treatment=="C68LOW" ~ "C6-8 Low",
    treatment=="C68MED" ~ "C6-8 Medium",
    treatment=="C68HIGH" ~ "C6-8 High",
    treatment=="FTSLOW" ~ "FTS Low",
    treatment=="FTSMED" ~ "FTS Medium",
    treatment=="FTSHIGH" ~ "FTS High",
    T ~ treatment
  ) 
  ) |>
  rename(AnimalID=animalnumberonly) |>
  dplyr::select(AnimalID,sex,treatment,COMPOUND,CONC_FOUND,sampletype,singletoncompound,inmixture,val_qual) |>  # include flags in select?
  mutate(sampletype=as.character(sampletype),
         COMPOUND=as.character(COMPOUND))|>
  droplevels() |>
  ungroup()

wholebodydata <- merge(wholebodydata, waterdataWB, by=c("treatment","COMPOUND"))

wholebodydata <- wholebodydata |>
  mutate(Wholebody=CONC_FOUND,
         logWholebody=log(Wholebody))|>
  mutate(
    logdmw=case_when( # see https://apps.dtic.mil/sti/pdfs/AD1134355.pdf page 92 of 121 in pdf
      COMPOUND=="PFBS"~2.63,
      COMPOUND=="PFNA"~4.04,
      COMPOUND=="6:2 FTS"~0.92,
      COMPOUND=="8:2 FTS"~2.28,
      COMPOUND=="PFOS"~4.88,
      COMPOUND=="PFHxS"~3.82,
      COMPOUND=="PFOA"~3.51,
      COMPOUND=="PFHxA"~2.31
    )
  )
  

```


 


```{r, include=F}

Data12b <- import_list(SGSfiles2, rbind=T, rbind_fill=T, rbind_label="file", col_names=T,na="") |>
  dplyr::select(SAMPLE_NO,AXYS_ID,LAB_FLAG,COMPOUND,CONC_FOUND,DETECTION_LIMIT,UNIT,file) |>
  bind_rows() |>
  mutate(UNIT=factor(UNIT),
         COMPOUND=factor(COMPOUND)) |>
  filter(!UNIT%in%c("% Recovery")&SAMPLE_NO!="Lab Blank") |>  #insert LAB_FLAG code rejections here
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG87004 WG85096 PFAS/V85096PFAS_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86446 WG85199 PFAS EXTD/V85199PFAS-EXTD_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86452 WG85200 PFAS EXTD/V85200PFAS-EXTD_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86455 WG85201 PFAS EXTD/V85201PFAS-EXTD_Database_2.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86885 WG85051 PFAS/V85051PFAS_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86950 WG85052 PFAS/V85052PFAS_Database_1.xlsx") |>
  # theseareforpdrivefilesonly filter(file!="P:/Tox/SERDP-funded projects/PFAS mixtures mice kestrels/SGS AXYS/Data/FTP_backup/4728 DPWG86878 WG85083 PFAS/V85083PFAS_Database_1.xlsx") |>
  droplevels()


Data12b <- merge(Data12b, keyfile2|>dplyr::select(animalnumberonly, SAMPLE_NO,treatment, sampletype, study,PFAS,sex), by="SAMPLE_NO")|>
  mutate(treatment=factor(treatment, levels=c("PFOS","PFOA","PFHxS","PFHxA","PFNA","PFBS","6:2 FTS","8:2 FTS","C68LOW","C68MED","C68HIGH","FTSLOW","FTSMED","FTSHIGH","Control")),
         sampletype=factor(sampletype),
         study=factor(study),
         singletoncompound=case_when(
           as.character(treatment)==as.character(COMPOUND) ~ "yes",
           T~"no"),
         inmixture=case_when(
           str_detect(PFAS,as.character(COMPOUND)) ~ "yes",
           T~"no"
         )) |>
  mutate(val_qual=
           case_when(
             is.na(LAB_FLAG) ~ "qual",
             LAB_FLAG=="J" ~ "trace",
             LAB_FLAG=="H" ~ "estimated",
             LAB_FLAG=="K" ~ "bad, maximum possible reported",
             LAB_FLAG=="U" ~ "nondetect",
             LAB_FLAG=="D" ~ "qual via dilution",
             LAB_FLAG=="X" ~ "ignore",
             LAB_FLAG=="D J" ~ "trace via dilution",
             LAB_FLAG=="D H"&study!="serum"&sampletype!="serum"&treatment!="6:2 FTS"&COMPOUND!="6:2 FTS" ~ "estimated, over",
             study=="serum"&sampletype=="serum"&treatment=="C68MED"&COMPOUND=="PFHxS"&LAB_FLAG=="D H"&str_detect(AXYS_ID,"2$") ~ "qual, over",
             study=="serum"&sampletype=="serum"&treatment=="C68MED"&COMPOUND=="PFHxS"&LAB_FLAG=="D H"&!str_detect(AXYS_ID,"2$") ~ "estimated, over",
             study=="serum"&sampletype=="serum"&treatment=="6:2 FTS"&COMPOUND=="6:2 FTS"&LAB_FLAG=="D H" ~ "qual, over",
             T ~ "other, nonqual"
           )
  )


```



```{r, include=F}


tissuedatanotNA <- Data1 |>   #change Data1 to Data1qualish or include flags in select
  filter(!is.na(CONC_FOUND))|>
  #filter(inmixture=="yes"|treatment=="Control") |>
  dplyr::select(AnimalID,Sex,treatment,COMPOUND,CONC_FOUND,Tissue,singletoncompound,inmixture,val_qual) |>
  rename(sampletype=Tissue,
         sex=Sex) |>
  mutate(treatment=as.character(treatment),
         COMPOUND=as.character(COMPOUND))|>
  droplevels() |>
  ungroup()
  
datatissueserum <- rbind(serumdata,tissuedatanotNA)
datatissueserumwide <- datatissueserum |>
  pivot_wider(
    id_cols=c("AnimalID","sex","treatment","COMPOUND","singletoncompound","inmixture","val_qual"),
    names_from=c("sampletype"),
    values_from=c("CONC_FOUND")
  )

datatissueserumwide$treatment <- factor(datatissueserumwide$treatment, levels=c("PFOS","PFOA","PFHxS","PFHxA","PFBS","PFNA","6:2 FTS","8:2 FTS","C6-8 Low","C6-8 Medium","C6-8 High","FTS Low","FTS Medium","FTS High","Control"))

#datatissueserumwide$water2 <- datatissueserumwide$water/1e8
#datatissueserumwide <- datatissueserumwide |>
#  rename(dose=water2) |>
#  mutate(logdose=log(dose))

```



```{r, include=F}

dataliv <- read_excel("C:/Users/easta/Desktop/PFAS additivity in mice/Analysis/mousemixturesdatakeys/PFAS_mixtures_combined_bodyweights_organweights_MASTER.xlsx", col_types = c("text", "text", "numeric", "text", "text", "text", "date", "numeric", "date", "numeric", "date", "numeric", "date", "numeric", "date", "numeric", "numeric", "numeric", "numeric", "numeric", "text"), na = "N/A")


dataliv$relliv <- dataliv$liver_weight/(dataliv$SD28_weight-dataliv$liver_weight)
dataliv$relbrain <- dataliv$brain_weight/(dataliv$SD28_weight-dataliv$brain_weight)
dataliv$relkid <- dataliv$kidney_weight/(dataliv$SD28_weight-dataliv$kidney_weight)


#bigplotstacker3 |>
#  group_by(singletoncompound, treatment, Sex, Tissue,COMPOUND) |>
#  dplyr::summarize("Mean (SD)"=paste(round(mean(Concentration, na.rm=T),2),", (",round(sd(Concentration, na.rm=T),2),"), [",sum(!is.na(Concentration)),"]", sep="")) |>
#  pivot_wider(names_from=c(Tissue),values_from="Mean (SD)") |>
#  mutate(info=paste("mean, (SD), [n]")) |>
#  write_csv("FINALsummarizeddata.csv")

datalivlong <- dataliv |>
  pivot_longer(cols=c(SD0_weight,SD7_weight,SD14_weight,SD21_weight,SD28_weight), values_to="weight", names_to="day") |>
  mutate(day=parse_number(day))

#ggplot()+
#  geom_point(data=datalivlong, aes(x=day, y=weight, color=treatment))+
#  geom_smooth(data=datalivlong, aes(x=day, y=weight, color=treatment), method="lm", formula=y~x, se=F) +
#  facet_wrap(~sex)
#
#ggplot()+
#  geom_point(data=datalivlong, aes(x=day, y=weight, color=sex))+
#  geom_smooth(data=datalivlong, aes(x=day, y=weight, color=sex), method="loess", formula=y~x, se=F) +
#  facet_wrap(~treatment)
#
#ggplot()+
#  geom_point(data=datalivlong|>filter(treatment=="PFNA"), aes(x=day, y=weight, color=sex))+
#  geom_smooth(data=datalivlong|>filter(treatment=="PFNA"), aes(x=day, y=weight, color=sex), method="loess", formula=y~x, se=F) 




datalivlong2 <- dataliv |>
  pivot_longer(cols=c(brain_weight,liver_weight,kidney_weight), values_to="weight", names_to="tissue") |>
  mutate(tissue=str_remove(tissue,"_weight"))


#ggplot() + 
#  geom_boxplot(data=datalivlong2|>filter(study_round!="Whole Body"), aes(x=treatment, y=weight, color=sex))+
#  facet_wrap(~tissue, scales="free_y")
#



#datasub2 <- merge(x=ratiodata,y=datasub, by.x="treatment", by.y="treatmentF2", all=T)


dataliv2 <- dataliv |>
  dplyr::select(animal_ID,relliv,relbrain,relkid, SD28_weight,liver_weight,brain_weight,kidney_weight) |>
  rename(AnimalID=animal_ID)
```



```{r, include=F}
datatissueserumwide <- merge(datatissueserumwide,dataliv2,by="AnimalID")

datatissueserumwide <- datatissueserumwide |>
  group_by(AnimalID,COMPOUND) |>
  mutate(
    totalngbodyburden = sum((serum*0.0385*SD28_weight),(Kidney*SD28_weight),(Brain*SD28_weight),(Liver*SD28_weight),na.rm=T),
    logtotalngbodyburden = log(totalngbodyburden),
    totalbodyconcng_g = totalngbodyburden/SD28_weight,
    totalbodyconcmg_kg = totalbodyconcng_g/1000
  ) |>
  ungroup() |>
  data.frame()


datatissueserumwide <- datatissueserumwide |>
  mutate(
    logdmw=case_when( # see https://apps.dtic.mil/sti/pdfs/AD1134355.pdf page 92 of 121 in pdf
    COMPOUND=="PFBS"~2.63,
    COMPOUND=="PFNA"~4.04,
    COMPOUND=="6:2 FTS"~0.92,
    COMPOUND=="8:2 FTS"~2.28,
    COMPOUND=="PFOS"~4.88,
    COMPOUND=="PFHxS"~3.82,
    COMPOUND=="PFOA"~3.51,
    COMPOUND=="PFHxA"~2.31
  )
  )




```



```{r, include=F}

dataclinchem <- read_csv("C:/Users/easta/Desktop/PFAS additivity in mice/Analysis/mousemixturesdatakeys/PFAS_mixtures_clinchemdata.csv", 
    col_types = cols(
        ALB = col_double(), ALB_div_GLOB = col_double(), 
        ALT = col_double(), AST = col_double(), 
        BUN = col_double(), BUN_div_CREA = col_double(), 
        CHOL = col_double(), CREA = col_double(), 
        `GLOB calc.` = col_double(), GLU = col_double(), 
        TP = col_double(), TRIG = col_double()))



dataclinchemlong <- dataclinchem |>
  pivot_longer(cols=c(ALB,ALB_div_GLOB,ALT,AST,BUN,BUN_div_CREA,CHOL,CREA,`GLOB calc.`,GLU,TP,TRIG), values_to="value", names_to="CCparam")


```



```{r, include=F}

dataclinchem$AnimalID <- dataclinchem$animalID

test2 <- merge(datatissueserumwide, dataclinchem, by="AnimalID")

test2 <- merge(test2,waterdata, by=c("treatment","COMPOUND")) #check this if problems



```



```{r, include=F}

bigplotstacker <- test2 |>
  dplyr::select(treatment, COMPOUND, AnimalID, sex.x, singletoncompound, inmixture,val_qual, serum,Kidney,Brain,Liver,dose) |>
  rename(Serum=serum) |>
  pivot_longer(c(Serum,Kidney,Brain,Liver), names_to="Tissue", values_to="Concentration") |>
  rename(Sex=sex.x)

bigplotstacker2 <- wholebodydata |>
  mutate(treatment=factor(treatment, levels=c("PFOS","PFOA","PFHxS","PFHxA","PFBS","PFNA","6:2 FTS","8:2 FTS","C6-8 Low","C6-8 Medium","C6-8 High","FTS Low","FTS Medium","FTS High","Control"))) |>
  dplyr::select(treatment, COMPOUND, AnimalID,sex, singletoncompound, inmixture, val_qual,Wholebody, dose) |>
  pivot_longer(c(Wholebody), names_to="Tissue", values_to="Concentration")|>
  rename(Sex=sex)

bigplotstacker3 <- rbind(bigplotstacker, bigplotstacker2)


bigplotstacker3 <- bigplotstacker3 |>
  mutate(include=case_when(
    (str_detect(val_qual,"trace|nonqual|bad")&Tissue=="Brain")~"no",
    T~"yes")) |>
  filter(include=="yes") |>
  group_by(AnimalID, COMPOUND,Tissue)|>
  summarize_all(~first(na.omit(.))) |>
  dplyr::select(-val_qual) |>
  ungroup()


```

# summary plots

```{r, fig.height=15,fig.width=20}


cbcolors <- c(
  "PFOS" = "#999999", 
  "PFOA" = "#E69F00", 
  "PFHxS" = "#56B4E9",
  "PFHxA" = "#999933",
  "PFNA" = "#F0E442",
  "PFBS" = "#0072B2",
  "6:2 FTS" = "#D55E00",
  "8:2 FTS" = "#CC79A7"
)

notsampleddf <- data.frame(
  treatment=c(rep("PFBS",3),rep("PFNA",3)),
  Tissue=c(rep(c("Brain","Kidney","Liver"),2)),
  COMPOUND=c("NA"),
  mean=c(rep(10,3),rep(10000,3)),
  label="NA",
  Sex="M"
)




```

```{r, fig.height=10, fig.width=18, message=F, warning=F}

reposition_legend(
  ggplot(data=bigplotstacker3|>filter(inmixture=="yes", singletoncompound=="yes"), aes(x=Tissue, y=Concentration, fill=Sex)) +
    geom_dotplot(binaxis="y",  stackdir="center")+
    facet_wrap(~fct_relevel(treatment, "PFOS","PFOA","PFHxS","PFNA","8:2 FTS","PFBS","PFHxA","6:2 FTS"), scales="free_y", axes="all") +
  geom_text(data=notsampleddf, aes(y=mean, label=label), color="black", show.legend=F)+
    scale_y_log10(labels=scales::label_comma())+
    theme_classic(base_size = 20) +
    labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", x=NULL)+
    theme(axis.text=element_text(color="black"), strip.background=element_rect(fill="white",color="white",linewidth=1), strip.text=element_text(face="bold"), legend.text=element_text(size=20), legend.title=element_text(size=20)) +
    guides(fill=guide_legend(override.aes=list(size=15))),
  position='center', panel='panel-3-3')

ggplot(data=bigplotstacker3|>filter(inmixture=="yes", singletoncompound=="no"), aes(x=Tissue, y=Concentration, fill=COMPOUND)) +
  geom_dotplot(binaxis="y",  stackdir="center", dotsize=1)+
  facet_wrap(~treatment, scales="free_y", axes="all") +
  scale_y_log10(labels=scales::label_comma())+
  theme_classic(base_size = 20) +
  labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", fill="", x=NULL) +
  guides(fill=guide_legend(title="PFAS"))+
  #scale_color_manual(values=cbcolors)+
  scale_fill_manual(values=cbcolors) +
  theme(axis.text=element_text(color="black"), strip.background=element_rect(fill="white",color="white",linewidth=1), strip.text=element_text(face="bold"), legend.text=element_text(size=14), legend.position="bottom") +
  guides(fill=guide_legend(override.aes=list(size=12), nrow=1))



```



```{r, fig.height=13,fig.width=20, message=F, warning=F}


cbcolors2 <- c(
  "PFOS" = "#999999", 
  "PFOA" = "#E69F00", 
  "PFHxS" = "#56B4E9",
  "PFHxA" = "#999933",
  "PFNA" = "#F0E442",
  "PFBS" = "#0072B2",
  "6:2 FTS" = "#D55E00",
  "8:2 FTS" = "#CC79A7",
  
  "PFPeA"="#AA0DFE",
  "PFPeS"="#3283FE",
  "PFTeDA"="#85660D",
  "PFTrDA"="#782AB6",
  "PFUnA"="#565656",
  "PFDS"="#1C8356",
  "PFDoA"="#16FF32",
  "PFDoS"="#F7E1A0",
  "PFHpA"="#E2E2E2",
  "PFHpS"="#1CBE4F",
  "PFMBA"="#C4451C",
  "PFNS"="#DEA0FD",
  "7:3 FTCA"="#FE00FA",
  "4:2 FTS"="#009e73",
  "EtFOSAA"="#325A9B",
  "MeFOSAA"="#FEAF16",
  "N-EtFOSE"="#F8A19F",
  "N-MeFOSE"="#90AD1C",
  "PFBA"="#F6222E",
  "PFDA"="#1CFFCE"
)



bigplotstacker3 <- bigplotstacker3 |>
  mutate(
    logConcentration=log(Concentration),
    logDose=log(dose)
  )


sumplot2 <- ggplot(data=bigplotstacker3, aes(x=dose, y=Concentration, color=COMPOUND)) +
  geom_point(size=3, alpha=0.25) +
  geom_smooth(method="lm", formula=y~x, se=F, linewidth=2) +
  facet_wrap(~Tissue) +
  scale_y_log10(labels=scales::label_comma())+
  scale_x_log10(labels=scales::label_comma())+
  theme_classic(base_size = 22) +
  labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", caption="", x="Dose (mg/kg-d)") +
  scale_color_manual(values=cbcolors2) +
  theme(strip.background=element_rect(fill="white",color="white",linewidth=1)) #+
  #scale_fill_manual(values=cbcolors2)

reposition_legend(sumplot2, 'center', panel='panel-3-2')


reposition_legend(
ggplot(data=bigplotstacker3, aes(x=dose, y=Concentration, color=COMPOUND)) +
  geom_point(size=3, alpha=0.25) +
  geom_smooth(method="lm", formula=y~x, se=F, linewidth=2) +
  facet_wrap(~Tissue*Sex) +
  scale_y_log10(labels=scales::label_comma())+
  scale_x_log10(labels=scales::label_comma())+
  theme_classic(base_size = 22) +
  labs(y="Wholebody, liver, brain, or kidney (ng/g); serum (ng/mL)", caption=NULL, color=NULL,x="Dose (mg/kg-d)") +
  scale_color_manual(values=cbcolors2) +
  theme(strip.background=element_rect(fill="white",color="white",linewidth=1)),
 'center', panel='panel-4-3')


```



```{r, fig.height=13,fig.width=20, include=F}

notsampleddf <- data.frame(
  treatment=c(rep("PFBS",3),rep("PFNA",3)),
  Tissue=c(rep(c("Brain","Kidney","Liver"),2)),
  COMPOUND=c("NA"),
  mean=0.1,
  label="NA"
)


```





# all tissues all mixture using broom

```{r, fig.height=8, fig.width=12}

fullmixedmodelsdosebased <- bigplotstacker3|>filter(!is.na(logDose)) |>
  nest(data=-Tissue) |>
  mutate(
    fit=map(data, ~ lmer(logConcentration ~logDose+Sex+(logDose|COMPOUND), data=.x)),
    tidied=map(fit, tidy),
    glanced=map(fit, glance),
    augmented=map(fit, augment)
  )

fullmixedmodelsdosebased |>
  unnest(tidied) 

fullmixedmodelsdosebased |>
  unnest(tidied) |>
  dplyr::select(Tissue, effect, term, estimate, std.error)|>
  group_by(Tissue, effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 


fullmixedmodelsdosebased |>
  unnest(glanced) 

#fullmixedmodelsdosebased|>
#  unnest(augmented)



ggplot(data=fullmixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

ggplot(data=fullmixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue*Sex) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

```

## all tissues all mixed to get random effect param values

### Whole Body

```{r}


mixallWB <- lmer(logConcentration ~logDose+Sex+(logDose|COMPOUND), data = bigplotstacker3|>filter(Tissue=="Wholebody",!is.na(logConcentration)), REML=T)
summary(mixallWB)
fixef(mixallWB)
ranef(mixallWB)
coef(mixallWB) 


mixallWB |>
  tidy() |>
  #dplyr::select(effect, term, estimate, std.error)|>
  group_by(effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 

extract_eq(mixallWB, use_coefs=F, mean_separate=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

extract_eq(mixallWB, use_coefs=T, mean_separate=T, index_factors=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

tab_model(mixallWB)

modelsummary(dvnames(mixallWB), 
             estimate="{estimate} [{conf.low}, {conf.high}]", 
             statistic=NULL,
             coef_rename=coef_rename)

plot_predictions(mixallWB, condition=list("logDose","COMPOUND")) +
  theme_classic() +
  labs(y="Estimated logConcentration")

plot_predictions(mixallWB, condition=list("logDose","COMPOUND")) +
  facet_wrap(~COMPOUND)+
  theme_classic() +
  labs(y="Estimated logConcentration")

```



# all tissues no mixture using broom

```{r, fig.height=8, fig.width=12}

nonemixedmodelsdosebased <- bigplotstacker3|>filter(!is.na(logDose)) |>
  nest(data=-Tissue) |>
  mutate(
    fit=map(data, ~ lmer(logConcentration ~logDose+Sex+(1|COMPOUND), data=.x)),
    tidied=map(fit, tidy),
    glanced=map(fit, glance),
    augmented=map(fit, augment)
  )

nonemixedmodelsdosebased |>
  unnest(tidied) 


nonemixedmodelsdosebased |>
  unnest(tidied) |>
  dplyr::select(Tissue, effect, term, estimate, std.error)|>
  group_by(Tissue, effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 


nonemixedmodelsdosebased |>
  unnest(glanced) 

#nonemixedmodelsdosebased|>
#  unnest(augmented)


ggplot(data=nonemixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)

ggplot(data=nonemixedmodelsdosebased|>unnest(augmented) , aes(x=logConcentration, y=.fitted, color=COMPOUND, shape=Sex))+
  geom_point() +
  geom_abline(slope=1)+
  geom_abline(slope=1, intercept=-1, linetype="dashed")+
  geom_abline(slope=1, intercept=1, linetype="dashed")+
  facet_wrap(~Tissue*Sex) +
  theme_classic(base_size=18) +
  labs(y="Predicted ln(Tissue (ng/g) or serum (ng/mL))", x="Observed ln(Tissue (ng/g) or serum (ng/mL))")+
  scale_color_manual(values=cbcolors2)


```

## all tissues no mixed to get random effect param values

### Whole Body

```{r}

nomixallWB <- lmer(logConcentration ~logDose+Sex+(1|COMPOUND), data = bigplotstacker3|>filter(Tissue=="Wholebody",!is.na(logConcentration)), REML=T)
summary(nomixallWB)
fixef(nomixallWB)
ranef(nomixallWB)
coef(nomixallWB) 
nomixallWB |> glance()

nomixallWB |>
  tidy() |>
  #dplyr::select(effect, term, estimate, std.error)|>
  group_by(effect, term) |>
  summarize(`Mean, SE`=paste(round(estimate,3),", ",round(std.error,3))) |>
  pivot_wider(names_from=c(effect,term), values_from=`Mean, SE`) 

extract_eq(nomixallWB, use_coefs=F, mean_separate=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

extract_eq(nomixallWB, use_coefs=T, mean_separate=T, index_factors=T,
           intercept="beta",
           swap_var_names=c(
             "logDose"="ln(Dose, mg/kg-d)",
             "logConcentration"="ln(Whole Body, ng/g)",
             "Sex"="Sex"),
           swap_subscript_names=c(
             "M"="Male"
           ))

tab_model(nomixallWB)

modelsummary(dvnames(nomixallWB), 
             estimate="{estimate} [{conf.low}, {conf.high}]", 
             statistic=NULL,
             coef_rename=coef_rename)

plot_predictions(nomixallWB, condition=list("logDose","COMPOUND")) +
  theme_classic() +
  labs(y="Estimated logConcentration")

plot_predictions(nomixallWB, condition=list("logDose","COMPOUND")) +
  facet_wrap(~COMPOUND)+
  theme_classic() +
  labs(y="Estimated logConcentration")


matrix(c(rownames(as.data.frame(coef(nomixallWB)$COMPOUND)),
         rep(" & ", NROW(coef(nomixallWB)$COMPOUND)),
         round(as.data.frame(coef(nomixallWB)$COMPOUND),2)[,1],
         rep(" \\", NROW(coef(nomixallWB)$COMPOUND))), ncol=4)


bmatrix = function(x, digits=NULL, ...) {
  library(xtable)
  default_args = list(include.colnames=FALSE, only.contents=TRUE,
                      include.rownames=FALSE, hline.after=NULL, comment=FALSE,
                      print.results=FALSE)
  passed_args = list(...)
  calling_args = c(list(x=xtable(x, digits=digits)),
                   c(passed_args,
                     default_args[setdiff(names(default_args), names(passed_args))]))
  cat("\\begin{bmatrix}\n",
      do.call(print.xtable, calling_args),
      "\\end{bmatrix}\n")
}

bmatrix(matrix(c(rownames(as.data.frame(coef(nomixallWB)$COMPOUND)),
         round(as.data.frame(coef(nomixallWB)$COMPOUND),2)[,1]), ncol=2))

```

$$ 
\widehat{ln(Whole\ Body,\ ng/g)}  \sim N (\mu, `r round(as.data.frame(VarCorr(nomixallWB))[2,5],2)`) \\
\mu =\begin{bmatrix}
  6:2 FTS & 7.55 \\ 
  8:2 FTS & 9.22 \\ 
  PFBS & 3.94 \\ 
  PFHpS & 9.3 \\ 
  PFHxA & 2.11 \\ 
  PFHxS & 9.25 \\ 
  PFNA & 9.14 \\ 
  PFNS & 9.31 \\ 
  PFOA & 9.17 \\ 
  PFOS & 9.68 \\ 
  PFPeS & 6.22 \\ 
   \end{bmatrix} + `r round(fixef(nomixallWB),2)[[2]]`(ln(Dose, mg/kg))+ `r round(fixef(nomixallWB),2)[[3]]`(Sex_{M=1;F=0})
$$


Comes from:  
```{verbatim}
$$ 
\widehat{ln(Whole\ Body,\ ng/g)}  \sim N (\mu, `r round(as.data.frame(VarCorr(nomixallWB))[2,5],2)`) \\
\mu =\begin{bmatrix}
  6:2 FTS & 7.55 \\ 
  8:2 FTS & 9.22 \\ 
  PFBS & 3.94 \\ 
  PFHpS & 9.3 \\ 
  PFHxA & 2.11 \\ 
  PFHxS & 9.25 \\ 
  PFNA & 9.14 \\ 
  PFNS & 9.31 \\ 
  PFOA & 9.17 \\ 
  PFOS & 9.68 \\ 
  PFPeS & 6.22 \\ 
   \end{bmatrix} + `r round(fixef(nomixallWB),2)[[2]]`(ln(Dose, mg/kg))+ `r round(fixef(nomixallWB),2)[[3]]`(Sex_{M=1;F=0})
$$
```
written "in line" in the .Rmd file.

