diff --git a/.gitignore b/.gitignore index 5df29fb..5049c59 100644 --- a/.gitignore +++ b/.gitignore @@ -69,7 +69,7 @@ out *.sav *.sas7bdat wsi -#*.log +dataverse # Temp files _gsdata_/ diff --git a/AEDB.EM.baseline.Rmd b/AEDB.EM.baseline.Rmd new file mode 100644 index 0000000..5cd1f53 --- /dev/null +++ b/AEDB.EM.baseline.Rmd @@ -0,0 +1,1221 @@ +--- +title: "Baseline characteristics" +author: "[Sander W. van der Laan, PhD](https://swvanderlaan.github.io) | @swvanderlaan | s.w.vanderlaan@gmail.com" +date: "`r Sys.Date()`" +output: + html_notebook: + cache: yes + code_folding: hide + collapse: yes + df_print: paged + fig.align: center + fig_caption: yes + fig_height: 6 + fig_retina: 2 + fig_width: 7 + highlight: tango + theme: lumen + toc: yes + toc_float: + collapsed: no + smooth_scroll: yes +mainfont: Arial +subtitle: Accompanying 'EntropyMasker' +editor_options: + chunk_output_type: inline +# bibliography: references.bib +# knit: worcs::cite_all +--- + +# General Setup +We will clean the environment, setup the locations, define colors, and create a datestamp. + +_Clean the environment._ +```{r echo = FALSE} +rm(list = ls()) +``` + +_Set locations and working directories..._ +```{r LocalSystem, echo = FALSE} +source("scripts/local.system.R") + +``` + +_... a package-installation function ..._ +```{r Function: installations} +source("scripts/functions.R") + +``` + + +_... and load those packages._ +```{r loading_packages, message=FALSE, warning=FALSE} +source("scripts/pack01.packages.R") + + +``` + +_We will create a datestamp and define the Utrecht Science Park Colour Scheme_. +```{r Setting: Colors} + +Today = format(as.Date(as.POSIXlt(Sys.time())), "%Y%m%d") +Today.Report = format(as.Date(as.POSIXlt(Sys.time())), "%A, %B %d, %Y") + +source("scripts/colors.R") + +``` + +```{r global_options, include = FALSE} +# further define some knitr-options. +knitr::opts_chunk$set(fig.width = 12, fig.height = 8, fig.path = 'Figures/', + wwarning = TRUE, # show warnings during codebook generation + message = TRUE, # show messages during codebook generation + error = TRUE, # do not interrupt codebook generation in case of errors, + # usually better for debugging + echo = TRUE, # show R code + eval = TRUE) +ggplot2::theme_set(ggplot2::theme_minimal()) +pander::panderOptions("table.split.table", Inf) +``` + +# This notebook + +In this notebook we create a baseline table of the samples used in **`EntropyMasker`**. + +# Athero-Express Biobank Study + +The [*Athero-Express Biobank Study (AE)*](https://doi.org/10.1007/s10564-004-2304-6) contains plaque material of patients that underwent endarterectomyat two Dutch tertiary referral centers. Details of the study design were described before. Briefly, blood and plaque material were obtained during endarterectomy and stored at -80 ℃. All patients provided informed consent and the study was approved by the medical ethics committee. + +## Load relevant samples + +```{r} +EM_samples <- fread(paste0(ANALYSIS_loc, "/dataverse/EntropyMasker_image_files_used.txt")) +``` + +## Load data + +Loading Athero-Express Biobank Study clinical and biobank data. + +```{r LoadAEDB} +cat("* get Athero-Express Biobank Study Database...") +# METHOD 1: It seems this method gives loads of errors and warnings, which all are hard to comprehend +# or debug. We expect 3,527 samples, and 927 variables; we get 927 variables!!! +# AEdata = as.data.table(read.spss(paste0(INP_loc,"/2017-1NEW_AtheroExpressDatabase_ScientificAE_20171306_v1.0.sav"), +# trim.factor.names = TRUE, trim_values = TRUE, # we trim spaces in values +# reencode = TRUE, # we re-encode to the local locale encoding +# add.undeclared.levels = "append", # we do *not* want to convert to R-factors +# use.value.labels = FALSE, # we do *not* convert variables with value labels into R factors +# use.missings = TRUE, sub = "NA", # we will set every missing variable to NA +# duplicated.value.labels = "condense", # we will condense duplicated value labels +# to.data.frame = TRUE)) +# AEdata.labels <- as.data.table(attr(AEdata, "variable.labels")) +# names(AEdata.labels) <- "Variable" + +# METHOD 2: Using library("haven") importing seems flawless; best argument being: +# we expect 3,527 samples and 888 variables, which is what you'd get with this method +# So for now, METHOD 2 is prefered. +# +require(haven) + +# AEDB <- haven::read_sav(paste0(AEDB_loc, "/2022_1_NEW_AtheroExpressDatabase_ScientificAE_15-02-2022.sav")) # something wrong with Age-variable +# AEDB <- haven::read_sav(paste0(AEDB_loc, "/2020_1_NEW_AtheroExpressDatabase_ScientificAE_30-09-2020.sav")) # duplicate studynumbers in it +AEDB <- haven::read_sav(paste0(AEDB_loc, "/2020_1_NEW_AtheroExpressDatabase_ScientificAE_16-03-2020.sav")) + +# writing off the SPSS data to an Excel. +# fwrite(AEdata, file = paste0(INP_loc,"/2017-1NEW_AtheroExpressDatabase_ScientificAE_20171306_v1.0.values.xlsx"), +# sep = ";", na = "NA", dec = ".", col.names = TRUE, row.names = FALSE, +# dateTimeAs = "ISO", showProgress = TRUE, verbose = TRUE) +# warnings() + +AEDB[1:10, 1:10] +dim(AEDB) + +``` + + + + + + + + + + + + + + + + + + + + + + +## Fixing and creating variables + +We have to fix certain clinical parameters: + +- symptoms +- diabetes +- alcohol use +- smoking +- plaque phenotypes + +### Symptoms + +We need to be very strict in defining *symptoms.* Therefore we will fix a new +variable that groups *symptoms* at inclusion. + +Coding of *symptoms* is as follows: + +- missing -999 +- Asymptomatic 0 +- TIA 1 +- minor stroke 2 +- Major stroke 3 +- Amaurosis fugax 4 +- Four vessel disease 5 +- Vertebrobasilary TIA 7 +- Retinal infarction 8 +- Symptomatic, but aspecific symtoms 9 +- Contralateral symptomatic occlusion 10 +- retinal infarction 11 +- armclaudication due to occlusion subclavian artery, CEA needed for bypass + 12 +- retinal infarction + TIAs 13 +- Ocular ischemic syndrome 14 +- ischemisch glaucoom 15 +- subclavian steal syndrome 16 +- TGA 17 + +We will group as follows: + +1. Asymptomatic > 0 +2. TIA > 1, 7, 13 +3. Stroke > 2, 3 +4. Ocular > 4, 14, 15 +5. Retinal infarction > 8, 11 +6. Other > 5, 9, 10, 12, 16, 17 + +```{r FixSymptoms, message=FALSE, warning=FALSE} + +# Fix symptoms + +attach(AEDB) +AEDB[,"Symptoms.5G"] <- NA +AEDB$Symptoms.5G[sympt == 0] <- "Asymptomatic" +AEDB$Symptoms.5G[sympt == 1 | sympt == 7 | sympt == 13] <- "TIA" +AEDB$Symptoms.5G[sympt == 2 | sympt == 3] <- "Stroke" +AEDB$Symptoms.5G[sympt == 4 | sympt == 14 | sympt == 15 ] <- "Ocular" +AEDB$Symptoms.5G[sympt == 8 | sympt == 11] <- "Retinal infarction" +AEDB$Symptoms.5G[sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Other" + + +# AsymptSympt +AEDB[,"AsymptSympt"] <- NA +AEDB$AsymptSympt[sympt == -999] <- NA +AEDB$AsymptSympt[sympt == 0] <- "Asymptomatic" +AEDB$AsymptSympt[sympt == 1 | sympt == 7 | sympt == 13 | sympt == 2 | sympt == 3] <- "Symptomatic" +AEDB$AsymptSympt[sympt == 4 | sympt == 14 | sympt == 15 | sympt == 8 | sympt == 11 | sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Ocular and others" + +# AsymptSympt +AEDB[,"AsymptSympt2G"] <- NA +AEDB$AsymptSympt2G[sympt == -999] <- NA +AEDB$AsymptSympt2G[sympt == 0] <- "Asymptomatic" +AEDB$AsymptSympt2G[sympt == 1 | sympt == 7 | sympt == 13 | sympt == 2 | sympt == 3 | sympt == 4 | sympt == 14 | sympt == 15 | sympt == 8 | sympt == 11 | sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Symptomatic" + +detach(AEDB) + +# table(AEDB$sympt, useNA = "ifany") +# table(AEDB$AsymptSympt2G, useNA = "ifany") +# table(AEDB$Symptoms.5G, useNA = "ifany") +# +# table(AEDB$AsymptSympt2G, AEDB$sympt, useNA = "ifany") +# table(AEDB$Symptoms.5G, AEDB$sympt, useNA = "ifany") +table(AEDB$AsymptSympt2G, AEDB$Symptoms.5G, useNA = "ifany") + +# AEDB.temp <- subset(AEDB, select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "sympt", "Symptoms.5G", "AsymptSympt")) +# require(labelled) +# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender) +# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital) +# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary) +# +# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE) +# +# table(AEDB.temp$Symptoms.5G, AEDB.temp$AsymptSympt) +# +# rm(AEDB.temp) +``` + +### Re-assessed symptoms + +We re-assessed the categorization of symptoms. These are summarized and parsed +in this section. + +Labeling of new symptom categories. + +```{r message=FALSE, warning=FALSE, paged.print=TRUE} + +AEDB$indexsymptoms_worst +AEDB$indexsymptoms_worst_4g +AEDB$indexsymptoms_latest +AEDB$indexsymptoms_latest_4g + +``` + +Getting counts for each of the most important categories. + +```{r} +cat("New 'worst' vs 'latest' symptom categories.\n") +table(as_factor(AEDB$indexsymptoms_worst_4g), as_factor(AEDB$indexsymptoms_latest_4g)) + +cat("\nNew 'worst' symptom categories.\n") +table((AEDB$indexsymptoms_worst_4g)) + +cat("\nNew 'latest' symptom categories.\n") +table(as_factor(AEDB$indexsymptoms_latest_4g)) +``` + +Comparing with the original symptom categories. + +```{r} +cat("New 'latest' vs original symptom 2G categories.\n") +table((AEDB$indexsymptoms_latest_4g), AEDB$AsymptSympt2G) + +cat("\nNew 'latest' vs original symptom 5G categories.\n") +table((AEDB$indexsymptoms_latest_4g), AEDB$Symptoms.5G) + +``` + +We need to be very strict in defining *symptoms.* Therefore we will fix a new +variable that groups *symptoms* at inclusion. + +Coding of *symptoms* is as follows: + +- asympt 0\ +- ocular 1\ +- TIA 2\ +- stroke 3\ +- unclear 9 + +We will group as follows: + +1. Asymptomatic > 0 +2. Symptomatic > 1, 2, 3 +3. NA > 9 + +```{r FixNewSymptoms} + +# Fix symptoms +attach(AEDB) + +# Symptoms.Update2G +AEDB[,"Symptoms.Update2G"] <- NA +AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 0] <- "Asymptomatic" +AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 1 | indexsymptoms_latest_4g == 2 | indexsymptoms_latest_4g == 3] <- "Symptomatic" +AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 9 ] <- NA + +# Symptoms.Update3G +AEDB[,"Symptoms.Update3G"] <- NA +AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 0] <- "Asymptomatic" +AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 1 | indexsymptoms_latest_4g == 2 | indexsymptoms_latest_4g == 3] <- "Symptomatic" +AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 9 ] <- "Unclear" + +detach(AEDB) + +table(AEDB$Symptoms.Update2G, AEDB$Symptoms.5G, useNA = "ifany") +table(AEDB$Symptoms.Update3G, AEDB$Symptoms.5G, useNA = "ifany") + +``` + +### Other clinical characteristics + +We will also fix the *diabetes* status variable. + +```{r FixDiabetes, message=FALSE, warning=FALSE} + +# Fix diabetes +attach(AEDB) +AEDB[,"DiabetesStatus"] <- NA +AEDB$DiabetesStatus[DM.composite == -999] <- NA +AEDB$DiabetesStatus[DM.composite == 0] <- "Control (no Diabetes Dx/Med)" +AEDB$DiabetesStatus[DM.composite == 1] <- "Diabetes" +detach(AEDB) + +table(AEDB$DM.composite, AEDB$DiabetesStatus) +# AEDB.temp <- subset(AEDB, select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "DM.composite", "DiabetesStatus")) +# require(labelled) +# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender) +# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital) +# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary) +# AEDB.temp$DiabetesStatus <- to_factor(AEDB.temp$DiabetesStatus) +# +# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE) +# +# rm(AEDB.temp) + +``` + +We will also fix the *smoking* status variable. We are interested in whether +someone never, ever or is currently (at the time of inclusion) smoking. This is +based on the questionnaire. + +- `diet801`: are you a smoker? +- `diet802`: did you smoke in the past? + +We already have some variables indicating smoking status: + +- `SmokingReported`: patient has reported to smoke. +- `SmokingYearOR`: smoking in the year of surgery? +- `SmokerCurrent`: currently smoking? + +```{r FixSmoking, message=FALSE, warning=FALSE} +require(labelled) +AEDB$diet801 <- to_factor(AEDB$diet801) +AEDB$diet802 <- to_factor(AEDB$diet802) +AEDB$diet805 <- to_factor(AEDB$diet805) +AEDB$SmokingReported <- to_factor(AEDB$SmokingReported) +AEDB$SmokerCurrent <- to_factor(AEDB$SmokerCurrent) +AEDB$SmokingYearOR <- to_factor(AEDB$SmokingYearOR) + +# table(AEDB$diet801) +# table(AEDB$diet802) +# table(AEDB$SmokingReported) +# table(AEDB$SmokerCurrent) +# table(AEDB$SmokingYearOR) +# table(AEDB$SmokingReported, AEDB$SmokerCurrent, useNA = "ifany", dnn = c("Reported smoking", "Current smoker")) +# +# table(AEDB$diet801, AEDB$diet802, useNA = "ifany", dnn = c("Smoker", "Past smoker")) + +cat("\nFixing smoking status.\n") +attach(AEDB) +AEDB[,"SmokerStatus"] <- NA +AEDB$SmokerStatus[diet802 == "don't know"] <- "Never smoked" +AEDB$SmokerStatus[diet802 == "I still smoke"] <- "Current smoker" +AEDB$SmokerStatus[SmokerCurrent == "no" & diet802 == "no"] <- "Never smoked" +AEDB$SmokerStatus[SmokerCurrent == "no" & diet802 == "yes"] <- "Ex-smoker" +AEDB$SmokerStatus[SmokerCurrent == "yes"] <- "Current smoker" +AEDB$SmokerStatus[SmokerCurrent == "no data available/missing"] <- NA +# AEDB$SmokerStatus[is.na(SmokerCurrent)] <- "Never smoked" +detach(AEDB) + +cat("\n* Current smoking status.\n") +table(AEDB$SmokerCurrent, + useNA = "ifany", + dnn = c("Current smoker")) + +cat("\n* Updated smoking status.\n") +table(AEDB$SmokerStatus, + useNA = "ifany", + dnn = c("Updated smoking status")) + +cat("\n* Comparing to 'SmokerCurrent'.\n") +table(AEDB$SmokerStatus, AEDB$SmokerCurrent, + useNA = "ifany", + dnn = c("Updated smoking status", "Current smoker")) + +# AEDB.temp <- subset(AEDB, select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "DM.composite", "DiabetesStatus")) +# require(labelled) +# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender) +# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital) +# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary) +# AEDB.temp$DiabetesStatus <- to_factor(AEDB.temp$DiabetesStatus) +# +# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE) +# +# rm(AEDB.temp) + + +``` + +We will also fix the *alcohol* status variable. + +```{r FixAlcohol, message=FALSE, warning=FALSE} + +# Fix diabetes +attach(AEDB) +AEDB[,"AlcoholUse"] <- NA +AEDB$AlcoholUse[diet810 == -999] <- NA +AEDB$AlcoholUse[diet810 == 0] <- "No" +AEDB$AlcoholUse[diet810 == 1] <- "Yes" +detach(AEDB) + +# AEDB.temp <- subset(AEDB, select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "diet810", "AlcoholUse")) +# require(labelled) +# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender) +# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital) +# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary) +# AEDB.temp$AlcoholUse <- to_factor(AEDB.temp$AlcoholUse) +# +# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE) +# +# rm(AEDB.temp) + + +``` + +We will also fix a history of CAD, stroke or peripheral intervention status variable. This will be based on `CAD_history`, `Stroke_history`, and `Peripheral.interv` + +```{r FixCAD_History, message=FALSE, warning=FALSE} + +# Fix diabetes +attach(AEDB) +AEDB[,"MedHx_CVD"] <- NA +AEDB$MedHx_CVD[CAD_history == 0 | Stroke_history == 0 | Peripheral.interv == 0] <- "No" +AEDB$MedHx_CVD[CAD_history == 1 | Stroke_history == 1 | Peripheral.interv == 1] <- "yes" +detach(AEDB) + +table(AEDB$CAD_history) +table(AEDB$Stroke_history) +table(AEDB$Peripheral.interv) +table(AEDB$MedHx_CVD) + +# AEDB.temp <- subset(AEDB, select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "diet810", "AlcoholUse")) +# require(labelled) +# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender) +# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital) +# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary) +# AEDB.temp$AlcoholUse <- to_factor(AEDB.temp$AlcoholUse) +# +# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE) +# +# rm(AEDB.temp) + + +``` + +### Plaque phenotypes + +We will also fix the *plaquephenotypes* variable. + +Coding of symptoms is as follows: + +- missing -999\ +- not relevant -888 +- fibrous 1\ +- fibroatheromatous 2\ +- atheromatous 3 + +```{r FixPlaquePhenotypes, message=FALSE, warning=FALSE} + +# Fix plaquephenotypes +attach(AEDB) +AEDB[,"OverallPlaquePhenotype"] <- NA +AEDB$OverallPlaquePhenotype[plaquephenotype == -999] <- NA +AEDB$OverallPlaquePhenotype[plaquephenotype == -999] <- NA +AEDB$OverallPlaquePhenotype[plaquephenotype == 1] <- "fibrous" +AEDB$OverallPlaquePhenotype[plaquephenotype == 2] <- "fibroatheromatous" +AEDB$OverallPlaquePhenotype[plaquephenotype == 3] <- "atheromatous" +detach(AEDB) + +# AEDB.temp <- subset(AEDB, select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "plaquephenotype", "OverallPlaquePhenotype")) +# require(labelled) +# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender) +# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital) +# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary) +# +# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE) +# +# rm(AEDB.temp) + +``` + +We will also fix and inverse-rank normal transform the continuous (manually) +scored plaque phenotypes. + +```{r IRNT PlaquePhenotypes} +AEDB$macmean0 <- as.numeric(AEDB$macmean0) +AEDB$smcmean0 <- as.numeric(AEDB$smcmean0) +AEDB$neutrophils <- as.numeric(AEDB$neutrophils) +AEDB$Mast_cells_plaque <- as.numeric(AEDB$Mast_cells_plaque) +AEDB$vessel_density_averaged <- as.numeric(AEDB$vessel_density_averaged) + +AEDB$MAC_rankNorm <- qnorm((rank(AEDB$macmean0, na.last = "keep") - 0.5) / sum(!is.na(AEDB$macmean0))) +AEDB$SMC_rankNorm <- qnorm((rank(AEDB$smcmean0, na.last = "keep") - 0.5) / sum(!is.na(AEDB$smcmean0))) +AEDB$Neutrophils_rankNorm <- qnorm((rank(AEDB$neutrophils, na.last = "keep") - 0.5) / sum(!is.na(AEDB$neutrophils))) +AEDB$MastCells_rankNorm <- qnorm((rank(AEDB$Mast_cells_plaque, na.last = "keep") - 0.5) / sum(!is.na(AEDB$Mast_cells_plaque))) +AEDB$VesselDensity_rankNorm <- qnorm((rank(AEDB$vessel_density_averaged, na.last = "keep") - 0.5) / sum(!is.na(AEDB$vessel_density_averaged))) + +``` + +```{r IRNT PlaquePhenotypes: Visualisation} +library(labelled) +AEDB$Gender <- to_factor(AEDB$Gender) +library(patchwork) + +p1 <- ggpubr::gghistogram(AEDB, "macmean0", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "% of macrophages (CD68)", + xlab = "% per region of interest", + ggtheme = theme_minimal()) + +p2 <- ggpubr::gghistogram(AEDB, "MAC_rankNorm", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "% of macrophages (CD68)", + xlab = "% per region of interest\ninverse-rank normalized number", + ggtheme = theme_minimal()) + +p1 | p2 + +p1 <- ggpubr::gghistogram(AEDB, "smcmean0", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "% of smooth muscle cells (SMA)", + xlab = "% per region of interest", + ggtheme = theme_minimal()) + +p2 <- ggpubr::gghistogram(AEDB, "SMC_rankNorm", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "% of smooth muscle cells (SMA)", + xlab = "% per region of interest\ninverse-rank normalized number", + ggtheme = theme_minimal()) + +p1 | p2 + + +p1 <- ggpubr::gghistogram(AEDB, "neutrophils", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "number of neutrophils (CD66b)", + xlab = "counts per plaque", + ggtheme = theme_minimal()) + +p2 <- ggpubr::gghistogram(AEDB, "Neutrophils_rankNorm", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "number of neutrophils (CD66b)", + xlab = "counts per plaque\ninverse-rank normalized number", + ggtheme = theme_minimal()) + +p1 | p2 + + +p1 <- ggpubr::gghistogram(AEDB, "Mast_cells_plaque", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "number of mast cells", + xlab = "counts per plaque", + ggtheme = theme_minimal()) + +p2 <- ggpubr::gghistogram(AEDB, "MastCells_rankNorm", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "number of mast cells", + xlab = "counts per plaque\ninverse-rank normalized number", + ggtheme = theme_minimal()) + +p1 | p2 + + +p1 <- ggpubr::gghistogram(AEDB, "vessel_density_averaged", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "number of intraplaque neovessels", + xlab = "counts per 3-4 hotspots", + ggtheme = theme_minimal()) + +p2 <- ggpubr::gghistogram(AEDB, "VesselDensity_rankNorm", + # y = "..count..", + color = "white", + fill = "Gender", + palette = c("#1290D9", "#DB003F"), + add = "median", + #add_density = TRUE, + rug = TRUE, + #add.params = list(color = "black", linetype = 2), + title = "number of intraplaque neovessels", + xlab = "counts per 3-4 hotspots\ninverse-rank normalized number", + ggtheme = theme_minimal()) + +p1 | p2 + +rm(p1, p2) +``` + +Here we calculate the *plaque instability/vulnerability* index + +```{r Plaque Vulnerability} +# Plaque vulnerability +require(labelled) +AEDB$Macrophages.bin <- to_factor(AEDB$Macrophages.bin) +AEDB$SMC.bin <- to_factor(AEDB$SMC.bin) +AEDB$IPH.bin <- to_factor(AEDB$IPH.bin) +AEDB$Calc.bin <- to_factor(AEDB$Calc.bin) +AEDB$Collagen.bin <- to_factor(AEDB$Collagen.bin) +AEDB$Fat.bin_10 <- to_factor(AEDB$Fat.bin_10) +AEDB$Fat.bin_40 <- to_factor(AEDB$Fat.bin_40) + +table(AEDB$Macrophages.bin) +table(AEDB$Fat.bin_10) +table(AEDB$Collagen.bin) +table(AEDB$SMC.bin) +table(AEDB$IPH.bin) + +# SPSS code + +# +# *** syntax- Plaque vulnerability**. +# COMPUTE Macro_instab = -999. +# IF macrophages.bin=2 Macro_instab=1. +# IF macrophages.bin=1 Macro_instab=0. +# EXECUTE. +# +# COMPUTE Fat10_instab = -999. +# IF Fat.bin_10=2 Fat10_instab=1. +# IF Fat.bin_10=1 Fat10_instab=0. +# EXECUTE. +# +# COMPUTE coll_instab=-999. +# IF Collagen.bin=2 coll_instab=0. +# IF Collagen.bin=1 coll_instab=1. +# EXECUTE. +# +# +# COMPUTE SMC_instab=-999. +# IF SMC.bin=2 SMC_instab=0. +# IF SMC.bin=1 SMC_instab=1. +# EXECUTE. +# +# COMPUTE IPH_instab=-999. +# IF IPH.bin=0 IPH_instab=0. +# IF IPH.bin=1 IPH_instab=1. +# EXECUTE. +# +# COMPUTE Instability=Macro_instab + Fat10_instab + coll_instab + SMC_instab + IPH_instab. +# EXECUTE. + +# Fix plaquephenotypes +attach(AEDB) +# mac instability +AEDB[,"MAC_Instability"] <- NA +AEDB$MAC_Instability[Macrophages.bin == -999] <- NA +AEDB$MAC_Instability[Macrophages.bin == "no/minor"] <- 0 +AEDB$MAC_Instability[Macrophages.bin == "moderate/heavy"] <- 1 + +# fat instability +AEDB[,"FAT10_Instability"] <- NA +AEDB$FAT10_Instability[Fat.bin_10 == -999] <- NA +AEDB$FAT10_Instability[Fat.bin_10 == " <10%"] <- 0 +AEDB$FAT10_Instability[Fat.bin_10 == " >10%"] <- 1 + +# col instability +AEDB[,"COL_Instability"] <- NA +AEDB$COL_Instability[Collagen.bin == -999] <- NA +AEDB$COL_Instability[Collagen.bin == "no/minor"] <- 1 +AEDB$COL_Instability[Collagen.bin == "moderate/heavy"] <- 0 + +# smc instability +AEDB[,"SMC_Instability"] <- NA +AEDB$SMC_Instability[SMC.bin == -999] <- NA +AEDB$SMC_Instability[SMC.bin == "no/minor"] <- 1 +AEDB$SMC_Instability[SMC.bin == "moderate/heavy"] <- 0 + +# iph instability +AEDB[,"IPH_Instability"] <- NA +AEDB$IPH_Instability[IPH.bin == -999] <- NA +AEDB$IPH_Instability[IPH.bin == "no"] <- 0 +AEDB$IPH_Instability[IPH.bin == "yes"] <- 1 + +detach(AEDB) + +table(AEDB$MAC_Instability, useNA = "ifany") +table(AEDB$FAT10_Instability, useNA = "ifany") +table(AEDB$COL_Instability, useNA = "ifany") +table(AEDB$SMC_Instability, useNA = "ifany") +table(AEDB$IPH_Instability, useNA = "ifany") + +# creating vulnerability index +AEDB <- AEDB %>% mutate(Plaque_Vulnerability_Index = factor(rowSums(.[grep("_Instability", names(.))], na.rm = TRUE)), + ) + +table(AEDB$Plaque_Vulnerability_Index, useNA = "ifany") + +# str(AEDB$Plaque_Vulnerability_Index) + +``` + +## Prepare baseline summary + +We are interested in the following variables at baseline in the whole cohort. + +- Age (years) +- Female sex (N, %) +- Artery type (N, %) +- Hospital (N, %) + + + + + + + + + + + + + + + + + + + + + + + + + + + +```{r Baseline AEDB: preparation} +cat("====================================================================================================\n") +cat("SELECTION THE SHIZZLE\n") + +### Artery levels +# AEdata$Artery_summary: +# value label +# NOT USE - 0 No artery known (yet), no surgery (patient ill, died, exited study), re-numbered to AAA +# USE - 1 carotid (left & right) +# USE - 2 femoral/iliac (left, right or both sides) +# NOT USE - 3 other carotid arteries (common, external) +# NOT USE - 4 carotid bypass and injury (left, right or both sides) +# NOT USE - 5 aneurysmata (carotid & femoral) +# NOT USE - 6 aorta +# NOT USE - 7 other arteries (renal, popliteal, vertebral) +# NOT USE - 8 femoral bypass, angioseal and injury (left, right or both sides) + +### AEdata$informedconsent +# value label +# NOT USE - -999 missing +# NOT USE - 0 no, died +# USE - 1 yes +# USE - 2 yes, health treatment when possible +# USE - 3 yes, no health treatment +# USE - 4 yes, no health treatment, no commercial business +# NOT USE - 5 yes, no tissue, no commerical business +# NOT USE - 6 yes, no tissue, no questionnaires, no medical info, no commercial business +# USE - 7 yes, no questionnaires, no health treatment, no commercial business +# USE - 8 yes, no questionnaires, health treatment when possible +# NOT USE - 9 yes, no tissue, no questionnaires, no health treatment, no commerical business +# USE - 10 yes, no health treatment, no medical info, no commercial business +# NOT USE - 11 yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business +# USE - 12 yes, no questionnaires, no health treatment +# NOT USE - 13 yes, no tissue, no health treatment +# NOT USE - 14 yes, no tissue, no questionnaires +# NOT USE - 15 yes, no tissue, health treatment when possible +# NOT USE - 16 yes, no tissue +# USE - 17 yes, no commerical business +# USE - 18 yes, health treatment when possible, no commercial business +# USE - 19 yes, no medical info, no commercial business +# USE - 20 yes, no questionnaires +# NOT USE - 21 yes, no tissue, no questionnaires, no health treatment, no medical info +# NOT USE - 22 yes, no tissue, no questionnaires, no health treatment, no commercial business +# USE - 23 yes, no medical info +# USE - 24 yes, no questionnaires, no commercial business +# USE - 25 yes, no questionnaires, no health treatment, no medical info +# USE - 26 yes, no questionnaires, health treatment when possible, no commercial business +# USE - 27 yes, no health treatment, no medical info +# NOT USE - 28 no, doesn't want to +# NOT USE - 29 no, unable to sign +# NOT USE - 30 no, no reaction +# NOT USE - 31 no, lost +# NOT USE - 32 no, too old +# NOT USE - 34 yes, no medical info, health treatment when possible +# NOT USE - 35 no (never asked for IC because there was no tissue) +# USE - 36 yes, no medical info, no commercial business, health treatment when possible +# NOT USE - 37 no, endpoint +# USE - 38 wil niets invullen, wel alles gebruiken +# USE - 39 second informed concents: yes, no commercial business +# NOT USE - 40 nooit geincludeerd + +cat("- sanity checking PRIOR to selection") +library(data.table) +require(labelled) +ae.gender <- to_factor(AEDB$Gender) +ae.hospital <- to_factor(AEDB$Hospital) +table(ae.gender, ae.hospital, dnn = c("Sex", "Hospital")) +ae.artery <- to_factor(AEDB$Artery_summary) +table(ae.artery, ae.gender, dnn = c("Sex", "Artery")) + +rm(ae.gender, ae.hospital, ae.artery) + +# I change numeric and factors manually because, well, I wouldn't know how to fix it otherwise +# to have this 'tibble' work with 'tableone'... :-) + +AEDB$Age <- as.numeric(AEDB$Age) +AEDB$diastoli <- as.numeric(AEDB$diastoli) +AEDB$systolic <- as.numeric(AEDB$systolic) + +AEDB$TC_finalCU <- as.numeric(AEDB$TC_finalCU) +AEDB$LDL_finalCU <- as.numeric(AEDB$LDL_finalCU) +AEDB$HDL_finalCU <- as.numeric(AEDB$HDL_finalCU) +AEDB$TG_finalCU <- as.numeric(AEDB$TG_finalCU) + +AEDB$TC_final <- as.numeric(AEDB$TC_final) +AEDB$LDL_final <- as.numeric(AEDB$LDL_final) +AEDB$HDL_final <- as.numeric(AEDB$HDL_final) +AEDB$TG_final <- as.numeric(AEDB$TG_final) + +AEDB$Age <- as.numeric(AEDB$Age) +AEDB$GFR_MDRD <- as.numeric(AEDB$GFR_MDRD) +AEDB$BMI <- as.numeric(AEDB$BMI) +AEDB$eCigarettes <- as.numeric(AEDB$eCigarettes) +AEDB$ePackYearsSmoking <- as.numeric(AEDB$ePackYearsSmoking) +AEDB$EP_composite_time <- as.numeric(AEDB$EP_composite_time) +AEDB$EP_major_time <- as.numeric(AEDB$EP_major_time) + +require(labelled) +AEDB$Artery_summary <- to_factor(AEDB$Artery_summary) +AEDB$ORyear <- to_factor(AEDB$ORyear) +AEDB$Gender <- to_factor(AEDB$Gender) +AEDB$Hospital <- to_factor(AEDB$Hospital) +AEDB$KDOQI <- to_factor(AEDB$KDOQI) +AEDB$BMI_WHO <- to_factor(AEDB$BMI_WHO) +AEDB$DiabetesStatus <- to_factor(AEDB$DiabetesStatus) +AEDB$SmokerStatus <- to_factor(AEDB$SmokerStatus) +AEDB$AlcoholUse <- to_factor(AEDB$AlcoholUse) + +AEDB$Hypertension.selfreport <- to_factor(AEDB$Hypertension1) +AEDB$Hypertension.selfreportdrug <- to_factor(AEDB$Hypertension2) +AEDB$Hypertension.composite <- to_factor(AEDB$Hypertension.composite) +AEDB$Hypertension.drugs <- to_factor(AEDB$Hypertension.drugs) + +AEDB$Med.anticoagulants <- to_factor(AEDB$Med.anticoagulants) +AEDB$Med.all.antiplatelet <- to_factor(AEDB$Med.all.antiplatelet) +AEDB$Med.Statin.LLD <- to_factor(AEDB$Med.Statin.LLD) + +AEDB$Stroke_Dx <- to_factor(AEDB$Stroke_Dx) +AEDB$CAD_history <- to_factor(AEDB$CAD_history) +AEDB$PAOD <- to_factor(AEDB$PAOD) +AEDB$Peripheral.interv <- to_factor(AEDB$Peripheral.interv) + +AEDB$sympt <- to_factor(AEDB$sympt) +AEDB$Symptoms.3g <- to_factor(AEDB$Symptoms.3g) +AEDB$Symptoms.4g <- to_factor(AEDB$Symptoms.4g) +AEDB$Symptoms.5G <- to_factor(AEDB$Symptoms.5G) +AEDB$AsymptSympt <- to_factor(AEDB$AsymptSympt) +AEDB$AsymptSympt2G <- to_factor(AEDB$AsymptSympt2G) +AEDB$Symptoms.Update2G <- to_factor(AEDB$Symptoms.Update2G) +AEDB$Symptoms.Update3G <- to_factor(AEDB$Symptoms.Update3G) + +AEDB$restenos <- to_factor(AEDB$restenos) +AEDB$stenose <- to_factor(AEDB$stenose) +AEDB$EP_composite <- to_factor(AEDB$EP_composite) +AEDB$EP_major <- to_factor(AEDB$EP_major) +AEDB$Macrophages.bin <- to_factor(AEDB$Macrophages.bin) +AEDB$SMC.bin <- to_factor(AEDB$SMC.bin) +AEDB$IPH.bin <- to_factor(AEDB$IPH.bin) +AEDB$Calc.bin <- to_factor(AEDB$Calc.bin) +AEDB$Collagen.bin <- to_factor(AEDB$Collagen.bin) +AEDB$Fat.bin_10 <- to_factor(AEDB$Fat.bin_10) +AEDB$Fat.bin_40 <- to_factor(AEDB$Fat.bin_40) +AEDB$OverallPlaquePhenotype <- to_factor(AEDB$OverallPlaquePhenotype) +AEDB$Plaque_Vulnerability_Index <- to_factor(AEDB$Plaque_Vulnerability_Index) + +AEDB$Artery_summary <- to_factor(AEDB$Artery_summary) + +AEDB$informedconsent <- to_factor(AEDB$informedconsent) + +AEDB.full <- subset(AEDB, + informedconsent != "missing" & # we are really strict in selecting based on 'informed consent'! + informedconsent != "no, died" & + informedconsent != "yes, no tissue, no commerical business" & + informedconsent != "yes, no tissue, no questionnaires, no medical info, no commercial business" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commerical business" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business" & + informedconsent != "yes, no tissue, no health treatment" & + informedconsent != "yes, no tissue, no questionnaires" & + informedconsent != "yes, no tissue, health treatment when possible" & + informedconsent != "yes, no tissue" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commercial business" & + informedconsent != "no, doesn't want to" & + informedconsent != "no, unable to sign" & + informedconsent != "no, no reaction" & + informedconsent != "no, lost" & + informedconsent != "no, too old" & + informedconsent != "yes, no medical info, health treatment when possible" & + informedconsent != "no (never asked for IC because there was no tissue)" & + informedconsent != "no, endpoint" & + informedconsent != "nooit geincludeerd") +# AEDB.CEA[1:10, 1:10] +dim(AEDB.full) + +``` + +```{r Baseline AEDB: creation} +cat("===========================================================================================\n") +cat("CREATE BASELINE TABLE\n") + +# Baseline table variables +basetable_vars = c("Hospital", + "Artery_summary", + "Age", "Gender") + # "ORyear", + # "TC_finalCU", "LDL_finalCU", "HDL_finalCU", "TG_finalCU", + # "TC_final", "LDL_final", "HDL_final", "TG_final", + # "hsCRP_plasma", + # "systolic", "diastoli", "GFR_MDRD", "BMI", + # "KDOQI", "BMI_WHO", + # "SmokerStatus", "AlcoholUse", + # "DiabetesStatus", + # "Hypertension.selfreport", "Hypertension.selfreportdrug", "Hypertension.composite", "Hypertension.drugs", + # "Med.anticoagulants", "Med.all.antiplatelet", "Med.Statin.LLD", + # "Stroke_Dx", "sympt", "Symptoms.5G", "AsymptSympt", "AsymptSympt2G", + # "Symptoms.Update2G", + # "Symptoms.Update3G", + # "restenos", "stenose", + # "CAD_history", "PAOD", "Peripheral.interv", + # "EP_composite", "EP_composite_time", "EP_major", "EP_major_time", + # "MAC_rankNorm", "SMC_rankNorm", "Macrophages.bin", "SMC.bin", + # "Neutrophils_rankNorm", "MastCells_rankNorm", + # "IPH.bin", "VesselDensity_rankNorm", + # "Calc.bin", "Collagen.bin", + # "Fat.bin_10", "Fat.bin_40", + # "OverallPlaquePhenotype", "Plaque_Vulnerability_Index") + +basetable_bin = c("Hospital", + "Artery_summary", + "Gender") +# basetable_bin + +basetable_con = basetable_vars[!basetable_vars %in% basetable_bin] +# basetable_con +``` + +# Athero-Express Biobank Study Baseline Characteristics + +Showing the baseline table of the whole Athero-Express Biobank. + +```{r Baseline AEDB: Visualize AEDB} +# Create baseline tables +# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html +AEDB.tableOne = print(CreateTableOne(vars = basetable_vars, + factorVars = basetable_bin, + # strata = "Symptoms.4g", + data = AEDB.full, includeNA = TRUE), + nonnormal = c(), missing = TRUE, + quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, + format = "pf", + contDigits = 3)[,1:3] +``` + + +## Match samples used + +Here we match the full database with the samples used in **`EntropyMasker`**. + +```{r} +# Remove duplicate rows of the dataframe +library(dplyr) +temp <- EM_samples %>% select(., "Studynumber") %>% + distinct(.) + +AEDB_EM <- merge(temp, + AEDB, + by.x = "Studynumber", + by.y = "STUDY_NUMBER", + sort = FALSE) + +AEDB_EM.full <- subset(AEDB_EM, + informedconsent != "missing" & # we are really strict in selecting based on 'informed consent'! + informedconsent != "no, died" & + informedconsent != "yes, no tissue, no commerical business" & + informedconsent != "yes, no tissue, no questionnaires, no medical info, no commercial business" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commerical business" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business" & + informedconsent != "yes, no tissue, no health treatment" & + informedconsent != "yes, no tissue, no questionnaires" & + informedconsent != "yes, no tissue, health treatment when possible" & + informedconsent != "yes, no tissue" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info" & + informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commercial business" & + informedconsent != "no, doesn't want to" & + informedconsent != "no, unable to sign" & + informedconsent != "no, no reaction" & + informedconsent != "no, lost" & + informedconsent != "no, too old" & + informedconsent != "yes, no medical info, health treatment when possible" & + informedconsent != "no (never asked for IC because there was no tissue)" & + informedconsent != "no, endpoint" & + informedconsent != "nooit geincludeerd") +# AEDB_EM.full[1:10, 1:10] + +rm(temp) +``` + + + +```{r Baseline AEDB: Visualize AEDB EM FULL} +# Create baseline tables +# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html +AEDB_EM.full.tableOne = print(CreateTableOne(vars = basetable_vars, + factorVars = basetable_bin, + # strata = "Symptoms.4g", + data = AEDB_EM.full, includeNA = TRUE), + nonnormal = c(), missing = TRUE, + quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, + format = "pf", + contDigits = 3)[,1:3] +``` + +```{r Baseline AEDB: Visualize AEDB EM} + +basetable_vars = c("Hospital", + "Artery_summary") + +basetable_bin = c("Hospital", + "Artery_summary") + +# Create baseline tables +# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html +AEDB_EM.tableOne = print(CreateTableOne(vars = basetable_vars, + factorVars = basetable_bin, + # strata = "Symptoms.4g", + data = AEDB_EM, includeNA = TRUE), + nonnormal = c(), missing = TRUE, + quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, + format = "pf", + contDigits = 3)[,1:3] +``` + +## Baseline writing + +Let's save the baseline characteristics of the Athero-Express Biobank Study. + +```{r Baseline SampleSelection: write} +# Write basetable + +require(openxlsx) + +write.xlsx(as.data.frame(AEDB.tableOne), + file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.BaselineTable.xlsx"), + rowNames = TRUE, + colNames = TRUE, + sheetName = "AE_Base", overwrite = TRUE) + +write.xlsx(as.data.frame(AEDB_EM.tableOne), + file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.EM.59.BaselineTable.xlsx"), + rowNames = TRUE, + colNames = TRUE, + sheetName = "AE_Base_EM_59", overwrite = TRUE) + +write.xlsx(as.data.frame(AEDB_EM.full.tableOne), + file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.EM.56.BaselineTable.xlsx"), + rowNames = TRUE, + colNames = TRUE, + sheetName = "AE_Base_EM_56", overwrite = TRUE) + +``` + +We will also write the newly prepared AEDB selected for this study which we can use in downstream analyses. + +```{r} +saveRDS(AEDB_EM.full, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.EM.FULL.RDS")) +saveRDS(AEDB.full, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.FULL.RDS")) +saveRDS(AEDB, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.raw.RDS")) + +``` + + +# Session information + +------------------------------------------------------------------------------------------------------------------------ + + Version: v1.0.2 + Last update: 2022-07-12 + Written by: Sander W. van der Laan (s.w.vanderlaan-2[at]umcutrecht.nl). + Description: Script to get some Athero-Express Biobank Study baseline characteristics. + Minimum requirements: R version 3.4.3 (2017-06-30) -- 'Single Candle', Mac OS X El Capitan + + **MoSCoW To-Do List** + The things we Must, Should, Could, and Would have given the time we have. + _M_ + + _S_ + + _C_ + + _W_ + + **Changes log** + * v1.0.2 Simplified the initial script. It now outputs the relevant R-objects (as .RDS). + * v1.0.1 Update to main AEDB (there is an error in the Age-variable in the new version). + * v1.0.0 Initial version. Add 'plaque vulnerability index', Fixed baseline table, added codes, and results. Major update to WORCS system. + +------------------------------------------------------------------------------------------------------------------------ + +```{r eval = TRUE} +sessionInfo() +``` + +# Saving environment + +```{r Saving} +save.image(paste0(PROJECT_loc, "/",Today,".",PROJECTNAME,".AEDB.EM.baseline.RData")) +``` + ++-----------------------------------------------------------------------------------------------------------------------------------------+ +| © 1979-2022 Sander W. van der Laan | s.w.vanderlaan[at]gmail.com | [swvanderlaan.github.io](https://swvanderlaan.github.io). | ++-----------------------------------------------------------------------------------------------------------------------------------------+ diff --git a/AEDB.EM.baseline.nb.html b/AEDB.EM.baseline.nb.html new file mode 100644 index 0000000..6645fca --- /dev/null +++ b/AEDB.EM.baseline.nb.html @@ -0,0 +1,4972 @@ + + + + + + + + + + + + + + + +Baseline characteristics + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + +
+
+
+
+
+ +
+ + + + + + + + +
+

General Setup

+

We will clean the environment, setup the locations, define colors, +and create a datestamp.

+

Clean the environment.

+ + + + +

Set locations and working directories…

+ + + +

+Create a new analysis directories.
+
+- general directory
+
+- for plots
+
+- for output of summary results
+
+- for baseline tables
+ + + +

… a package-installation function …

+ + + +
source("scripts/functions.R")
+ + + +

… and load those packages.

+ + + +
source("scripts/pack01.packages.R")
+ + +

+* General packages...
+ + + +

We will create a datestamp and define the Utrecht Science Park +Colour Scheme.

+ + + +

+Today = format(as.Date(as.POSIXlt(Sys.time())), "%Y%m%d")
+Today.Report = format(as.Date(as.POSIXlt(Sys.time())), "%A, %B %d, %Y")
+
+source("scripts/colors.R")
+ + + + + +
+
+

This notebook

+

In this notebook we create a baseline table of the samples used in +EntropyMasker.

+
+
+

Athero-Express Biobank Study

+

The Athero-Express +Biobank Study (AE) contains plaque material of patients that +underwent endarterectomyat two Dutch tertiary referral centers. Details +of the study design were described before. Briefly, blood and plaque +material were obtained during endarterectomy and stored at -80 ℃. All +patients provided informed consent and the study was approved by the +medical ethics committee.

+
+

Load relevant samples

+ + + +
EM_samples <- fread(paste0(ANALYSIS_loc, "/dataverse/EntropyMasker_image_files_used.txt"))
+ + + +
+
+

Load data

+

Loading Athero-Express Biobank Study clinical and biobank data.

+ + + +
cat("* get Athero-Express Biobank Study Database...")
+ + +
* get Athero-Express Biobank Study Database...
+ + +
# METHOD 1: It seems this method gives loads of errors and warnings, which all are hard to comprehend
+#           or debug. We expect 3,527 samples, and 927 variables; we get 927 variables!!!
+# AEdata = as.data.table(read.spss(paste0(INP_loc,"/2017-1NEW_AtheroExpressDatabase_ScientificAE_20171306_v1.0.sav"),
+#                                  trim.factor.names = TRUE, trim_values = TRUE, # we trim spaces in values
+#                                  reencode = TRUE, # we re-encode to the local locale encoding
+#                                  add.undeclared.levels = "append", # we do *not* want to convert to R-factors
+#                                  use.value.labels = FALSE, # we do *not* convert variables with value labels into R factors
+#                                  use.missings = TRUE, sub = "NA", # we will set every missing variable to NA
+#                                  duplicated.value.labels = "condense", # we will condense duplicated value labels
+#                                  to.data.frame = TRUE))
+# AEdata.labels <- as.data.table(attr(AEdata, "variable.labels"))
+# names(AEdata.labels) <- "Variable"
+
+# METHOD 2: Using library("haven") importing seems flawless; best argument being:
+#           we expect 3,527 samples and 888 variables, which is what you'd get with this method
+#           So for now, METHOD 2 is prefered. 
+#            
+require(haven)
+
+# AEDB <- haven::read_sav(paste0(AEDB_loc, "/2022_1_NEW_AtheroExpressDatabase_ScientificAE_15-02-2022.sav")) # something wrong with Age-variable
+# AEDB <- haven::read_sav(paste0(AEDB_loc, "/2020_1_NEW_AtheroExpressDatabase_ScientificAE_30-09-2020.sav")) # duplicate studynumbers in it
+AEDB <- haven::read_sav(paste0(AEDB_loc, "/2020_1_NEW_AtheroExpressDatabase_ScientificAE_16-03-2020.sav"))
+
+# writing off the SPSS data to an Excel.
+# fwrite(AEdata, file = paste0(INP_loc,"/2017-1NEW_AtheroExpressDatabase_ScientificAE_20171306_v1.0.values.xlsx"), 
+#        sep = ";", na = "NA", dec = ".", col.names = TRUE, row.names = FALSE,
+#        dateTimeAs = "ISO", showProgress = TRUE, verbose = TRUE)
+# warnings()
+
+AEDB[1:10, 1:10]
+ + +
+ +
+ + +
dim(AEDB)
+ + +
[1] 3791 1091
+ + + + + + + + + + + + + + + + + + +
+
+

Fixing and creating variables

+

We have to fix certain clinical parameters:

+
    +
  • symptoms
  • +
  • diabetes
  • +
  • alcohol use
  • +
  • smoking
  • +
  • plaque phenotypes
  • +
+
+

Symptoms

+

We need to be very strict in defining symptoms. Therefore we +will fix a new variable that groups symptoms at inclusion.

+

Coding of symptoms is as follows:

+
    +
  • missing -999
  • +
  • Asymptomatic 0
  • +
  • TIA 1
  • +
  • minor stroke 2
  • +
  • Major stroke 3
  • +
  • Amaurosis fugax 4
  • +
  • Four vessel disease 5
  • +
  • Vertebrobasilary TIA 7
  • +
  • Retinal infarction 8
  • +
  • Symptomatic, but aspecific symtoms 9
  • +
  • Contralateral symptomatic occlusion 10
  • +
  • retinal infarction 11
  • +
  • armclaudication due to occlusion subclavian artery, CEA needed for +bypass 12
  • +
  • retinal infarction + TIAs 13
  • +
  • Ocular ischemic syndrome 14
  • +
  • ischemisch glaucoom 15
  • +
  • subclavian steal syndrome 16
  • +
  • TGA 17
  • +
+

We will group as follows:

+
    +
  1. Asymptomatic > 0
  2. +
  3. TIA > 1, 7, 13
  4. +
  5. Stroke > 2, 3
  6. +
  7. Ocular > 4, 14, 15
  8. +
  9. Retinal infarction > 8, 11
  10. +
  11. Other > 5, 9, 10, 12, 16, 17
  12. +
+ + + +

+# Fix symptoms
+
+attach(AEDB)
+AEDB[,"Symptoms.5G"] <- NA
+AEDB$Symptoms.5G[sympt == 0] <- "Asymptomatic"
+AEDB$Symptoms.5G[sympt == 1 | sympt == 7 | sympt == 13] <- "TIA"
+AEDB$Symptoms.5G[sympt == 2 | sympt == 3] <- "Stroke"
+AEDB$Symptoms.5G[sympt == 4 | sympt == 14 | sympt == 15 ] <- "Ocular"
+AEDB$Symptoms.5G[sympt == 8 | sympt == 11] <- "Retinal infarction"
+AEDB$Symptoms.5G[sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Other"
+
+
+# AsymptSympt
+AEDB[,"AsymptSympt"] <- NA
+AEDB$AsymptSympt[sympt == -999] <- NA
+AEDB$AsymptSympt[sympt == 0] <- "Asymptomatic"
+AEDB$AsymptSympt[sympt == 1 | sympt == 7 | sympt == 13 | sympt == 2 | sympt == 3] <- "Symptomatic"
+AEDB$AsymptSympt[sympt == 4 | sympt == 14 | sympt == 15 | sympt == 8 | sympt == 11 | sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Ocular and others"
+
+# AsymptSympt
+AEDB[,"AsymptSympt2G"] <- NA
+AEDB$AsymptSympt2G[sympt == -999] <- NA
+AEDB$AsymptSympt2G[sympt == 0] <- "Asymptomatic"
+AEDB$AsymptSympt2G[sympt == 1 | sympt == 7 | sympt == 13 | sympt == 2 | sympt == 3 | sympt == 4 | sympt == 14 | sympt == 15 | sympt == 8 | sympt == 11 | sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Symptomatic"
+
+detach(AEDB)
+
+# table(AEDB$sympt, useNA = "ifany")
+# table(AEDB$AsymptSympt2G, useNA = "ifany")
+# table(AEDB$Symptoms.5G, useNA = "ifany")
+# 
+# table(AEDB$AsymptSympt2G, AEDB$sympt, useNA = "ifany")
+# table(AEDB$Symptoms.5G, AEDB$sympt, useNA = "ifany")
+table(AEDB$AsymptSympt2G, AEDB$Symptoms.5G, useNA = "ifany")
+ + +
              
+               Asymptomatic Ocular Other Retinal infarction Stroke  TIA <NA>
+  Asymptomatic          333      0     0                  0      0    0    0
+  Symptomatic             0    416   119                 43    732 1045    0
+  <NA>                    0      0     0                  0      0    0 1103
+ + +
# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "sympt", "Symptoms.5G", "AsymptSympt"))
+# require(labelled)
+# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
+# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
+# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
+# 
+# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
+# 
+# table(AEDB.temp$Symptoms.5G, AEDB.temp$AsymptSympt)
+# 
+# rm(AEDB.temp)
+ + + +
+
+

Re-assessed symptoms

+

We re-assessed the categorization of symptoms. These are summarized +and parsed in this section.

+

Labeling of new symptom categories.

+ + + +

+AEDB$indexsymptoms_worst
+ + +
<labelled<double>[3791]>: Latest cerebrovascular symptoms (indication CEA).
+   [1]  2  3  2  0  0  2  0  3 NA  0  0  0  2  1  0  0  0  0 NA  0  1  0  0  0  0  2  0  0 NA  0  0 NA  1  0  9  2  0  9  0  1  0  9  0  0  3  2  0 NA
+  [49]  0  0  1  9  2  9  1  0  0  2  2  2  0  9  2  0  0  0  2 NA  0  0  0  0  0  0  2  0  0  2  3  0  1  3  0 NA  0  0  9  2  3  3 NA  2  0  0  3 NA
+  [97] NA  3  1  0  9  1  2  0  0  0  2  0  0 NA NA  0  0  9 NA  2  2  1  1  2  0  0  9  2  0  3 NA  0 NA  2  0  0  0 NA  9  2  2 NA  0  3  2  0  2  0
+ [145]  1  1  0  0  0 NA NA  2 NA NA  3  0  9  0  0 NA  0  9  1  3  2  2  1  0  2 NA  0  1  0 NA  2  2  1  1 NA  0 NA  3  0  3 NA NA  0 NA NA NA NA  2
+ [193]  0  2  0  0  0  3 NA  2  0  0  0  0  0  0 NA  0 NA  3 NA  2  0 NA  2  0  3 NA NA  3 NA NA NA NA NA NA  0 NA  3  9 NA  0 NA  0 NA NA  1  0  2  3
+ [241] NA NA NA  0 NA NA  1 NA  2 NA NA NA NA  0  1  2  0 NA  0 NA  3  0  3  0  0 NA NA  2  3 NA NA NA NA  1 NA  2  2  3  0  0  0 NA NA  0  0  3  1  1
+ [289]  0  9  2  0  2  2 NA NA  1 NA NA NA  0  0 NA NA  3 NA  0 NA NA  1 NA  9 NA  0  3 NA NA NA NA NA  0 NA  1 NA  0  3  2 NA NA  2  1 NA NA NA NA  2
+ [337]  0  0  0  2 NA  1  1 NA  0  0 NA NA  1  3 NA  0 NA  2  1 NA NA  9 NA NA NA NA NA NA  9  0 NA  2  0 NA NA NA NA NA  2 NA NA NA  2  0  1  2  9  9
+ [385]  0 NA  3  0 NA  2 NA  3  9  9  2  0 NA NA  1  2 NA NA  0  3 NA NA NA NA NA NA  2  0 NA NA NA NA NA NA  9  0 NA NA NA NA NA NA  3 NA  0  2  9 NA
+ [433]  0  1 NA  0  2  1 NA NA  1  0  2  0 NA  0  3  3  1  0  3 NA  3  0 NA  2 NA  1  2  0 NA  0 NA NA NA NA  0  9  2  0 NA NA NA NA NA NA  0 NA NA  0
+ [481]  0  2 NA NA  0 NA  1 NA  2  3  0  2  2  0  0  1  2  3  9 NA  9 NA  2  2  1  2  2  1  2  0  1  3 NA NA NA NA NA NA NA  9 NA NA NA NA NA  1  0  0
+ [529] NA  3 NA  2  2  9  3 NA NA  2  2 NA  2  2 NA  2 NA NA  0 NA NA  1  0 NA NA  1  2  2 NA NA NA NA NA  0  2  0 NA  0  0  0  0  0  0 NA NA NA NA NA
+ [577] NA NA  2 NA NA NA NA  2 NA  0  3  0  0 NA NA NA NA  0 NA NA  0  3 NA NA NA  0 NA NA NA  9 NA NA NA NA NA NA NA  2  2 NA  2 NA NA NA  0 NA NA  1
+ [625]  1  9  0  2 NA NA NA NA  1 NA NA NA  2 NA  0  0 NA  0  9  2 NA  0  1 NA  0  1 NA  0  0  2 NA  1  9 NA  0  3  3  1  3 NA  2 NA NA  2 NA  0  9  0
+ [673]  1  1 NA  2  0 NA  2  1 NA NA NA NA  3  3 NA NA  3  0 NA  9 NA  3 NA NA  9  2  0  3  2  0  0 NA  0  2  2 NA NA  2  0 NA NA  2 NA  1 NA NA NA NA
+ [721] NA NA  2  2 NA  0 NA  2  0  2  2  2  2  1  0 NA NA NA NA  1 NA  2  0  0 NA NA NA  2  1  1 NA  2  0  1  0 NA  1  2  1  1  9  0 NA NA  0  1 NA NA
+ [769]  1  0  2 NA NA NA NA NA NA NA NA NA  0 NA NA NA  0 NA  1  1  2  1 NA NA NA NA NA NA NA  2 NA  0 NA NA  0 NA NA  0 NA NA NA NA  0 NA  0 NA NA  0
+ [817] NA NA  2  0 NA NA NA NA NA NA NA NA NA NA  1 NA NA NA NA NA  2 NA  1  0 NA  2  2  1  2 NA NA NA NA  0  9 NA NA  2  0 NA NA  3  0  2  2  0  1  0
+ [865]  0 NA  1  9  0  0  0  0  2  0  1  0  1  0 NA  0 NA NA  9 NA NA NA NA NA NA NA NA NA NA  0 NA  3  0 NA NA  2  9 NA NA NA  3 NA  1 NA NA  1  2  0
+ [913] NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA  0  1 NA NA NA NA NA NA  0 NA NA NA NA  2  1 NA NA  1 NA NA  1  0  1 NA  0  9 NA NA  1
+ [961] NA  2 NA NA  0 NA NA  3  0 NA NA  2  0 NA NA NA NA NA NA  3 NA  2 NA NA NA NA  1  2  1  0 NA  0 NA  0 NA NA NA NA NA  0
+ [ reached getOption("max.print") -- omitted 2791 entries ]
+
+Labels:
+ + +
+ +
+ + +
AEDB$indexsymptoms_worst_4g
+ + +
<labelled<double>[3791]>:  symptoms strokefenotype en symptoms.4g .
+   [1]  2  3  2  0  0  2  0  3 NA  0  0  0  2  1  0  0  0  0 NA  0  1  0  0  0  0  2  0  0 NA  0  0 NA  1  0  9  2  0  9  0  1  0  9  0  0  3  2  0 NA
+  [49]  0  0  1  9  2  9  1  0  0  2  2  2  0  9  2  0  0  0  2 NA  0  0  0  0  0  0  2  0  0  2  3  0  1  3  0 NA  0  0  9  2  3  3 NA  2  0  0  3 NA
+  [97] NA  3  1  0  9  1  2  0  0  0  2  0  0 NA NA  0  0  9 NA  2  2  1  1  2  0  0  9  2  0  3 NA  0 NA  2  0  0  0 NA  9  2  2 NA  0  3  2  0  2  0
+ [145]  1  1  0  0  0 NA NA  2 NA NA  3  0  9  0  0 NA  0  9  1  3  2  2  1  0  2 NA  0  1  0 NA  2  2  1  1 NA  0 NA  3  0  3 NA NA  0 NA NA NA NA  2
+ [193]  0  2  0  0  0  3 NA  2  0  0  0  0  0  0 NA  0 NA  3 NA  2  0 NA  2  0  3 NA NA  3 NA NA NA NA NA NA  0 NA  3  9 NA  0 NA  0 NA NA  1  0  2  3
+ [241] NA NA NA  0 NA NA  1 NA  2 NA NA NA NA  0  1  2  0 NA  0 NA  3  0  3  0  0 NA NA  2  3 NA NA NA NA  1 NA  2  2  3  0  0  0 NA NA  0  0  3  1  1
+ [289]  0  9  2  0  2  2 NA NA  1 NA NA NA  0  0 NA NA  3 NA  0 NA NA  1 NA  9 NA  0  3 NA NA NA NA NA  0 NA  1 NA  0  3  2 NA NA  2  1 NA NA NA NA  2
+ [337]  0  0  0  2 NA  1  1 NA  0  0 NA NA  1  3 NA  0 NA  2  1 NA NA  9 NA NA NA NA NA NA  9  0 NA  2  0 NA NA NA NA NA  2 NA NA NA  2  0  1  2  9  9
+ [385]  0 NA  3  0 NA  2 NA  3  9  9  2  0 NA NA  1  2 NA NA  0  3 NA NA NA NA NA NA  2  0 NA NA NA NA NA NA  9  0 NA NA NA NA NA NA  3 NA  0  2  9 NA
+ [433]  0  1 NA  0  2  1 NA NA  1  0  2  0 NA  0  3  3  1  0  3 NA  3  0 NA  2 NA  1  2  0 NA  0 NA NA NA NA  0  9  2  0 NA NA NA NA NA NA  0 NA NA  0
+ [481]  0  2 NA NA  0 NA  1 NA  2  3  0  2  2  0  0  1  2  3  9 NA  9 NA  2  2  1  2  2  1  2  0  1  3 NA NA NA NA NA NA NA  9 NA NA NA NA NA  1  0  0
+ [529] NA  3 NA  2  2  9  3 NA NA  2  2 NA  2  2 NA  2 NA NA  0 NA NA  1  0 NA NA  1  2  2 NA NA NA NA NA  0  2  0 NA  0  0  0  0  0  0 NA NA NA NA NA
+ [577] NA NA  2 NA NA NA NA  2 NA  0  3  0  0 NA NA NA NA  0 NA NA  0  3 NA NA NA  0 NA NA NA  9 NA NA NA NA NA NA NA  2  2 NA  2 NA NA NA  0 NA NA  1
+ [625]  1  9  0  2 NA NA NA NA  1 NA NA NA  2 NA  0  0 NA  0  9  2 NA  0  1 NA  0  1 NA  0  0  2 NA  1  9 NA  0  3  3  1  3 NA  2 NA NA  2 NA  0  9  0
+ [673]  1  1 NA  2  0 NA  2  1 NA NA NA NA  3  3 NA NA  3  0 NA  9 NA  3 NA NA  9  2  0  3  2  0  0 NA  0  2  2 NA NA  2  0 NA NA  2 NA  1 NA NA NA NA
+ [721] NA NA  2  2 NA  0 NA  2  0  2  2  2  2  1  0 NA NA NA NA  1 NA  2  0  0 NA NA NA  2  1  1 NA  2  0  1  0 NA  1  2  1  1  9  0 NA NA  0  1 NA NA
+ [769]  1  0  2 NA NA NA NA NA NA NA NA NA  0 NA NA NA  0 NA  1  1  2  1 NA NA NA NA NA NA NA  2 NA  0 NA NA  0 NA NA  0 NA NA NA NA  0 NA  0 NA NA  0
+ [817] NA NA  2  0 NA NA NA NA NA NA NA NA NA NA  1 NA NA NA NA NA  2 NA  1  0 NA  2  2  1  2 NA NA NA NA  0  9 NA NA  2  0 NA NA  3  0  2  2  0  1  0
+ [865]  0 NA  1  9  0  0  0  0  2  0  1  0  1  0 NA  0 NA NA  9 NA NA NA NA NA NA NA NA NA NA  0 NA  3  0 NA NA  2  9 NA NA NA  3 NA  1 NA NA  1  2  0
+ [913] NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA  0  1 NA NA NA NA NA NA  0 NA NA NA NA  2  1 NA NA  1 NA NA  1  0  1 NA  0  9 NA NA  1
+ [961] NA  2 NA NA  0 NA NA  3  0 NA NA  2  0 NA NA NA NA NA NA  3 NA  2 NA NA NA NA  1  2  1  0 NA  0 NA  0 NA NA NA NA NA  0
+ [ reached getOption("max.print") -- omitted 2791 entries ]
+
+Labels:
+ + +
+ +
+ + +
AEDB$indexsymptoms_latest
+ + +
<labelled<double>[3791]>: Latest cerebrovascular symptoms (indication CEA).
+   [1]  2  3  2  0  0  2  0  3 NA  0  0  0  2  1  0  0  0  0 NA  0  1  0  0  0  0  2  0  0 NA  0  0 NA  1  0  9  2  0  9  0  1  0  9  0  0  3  2  0 NA
+  [49]  0  0  1  9  2  9  1  0  0  2  2  9  0  9  2  0  0  0  2 NA  0  0  0  0  0  0  2  0  0  2  3  0  1  3  0 NA  0  0  9  2  3  3 NA  2  0  0  3 NA
+  [97] NA  3  1  0  9  1  2  0  0  0  2  0  0 NA NA  0  0  9 NA  2  2  1  1  2  0  0  9  2  0  3 NA  0 NA  2  0  0  0 NA  9  2  2 NA  0  3  2  0  2  0
+ [145]  1  1  0  0  0 NA NA  2 NA NA  3  0  9  0  0 NA  0  9  1  3  2  2  1  0  2 NA  0  1  0 NA  2  2  1  1 NA  0 NA  3  0  3 NA NA  0 NA NA NA NA  2
+ [193]  0  2  0  0  0  3 NA  2  0  0  0  0  0  0 NA  0 NA  3 NA  2  0 NA  2  0  3 NA NA  3 NA NA NA NA NA NA  0 NA  3  9 NA  0 NA  0 NA NA  1  0  2  3
+ [241] NA NA NA  0 NA NA  1 NA  2 NA NA NA NA  0  1  2  0 NA  0 NA  3  0  3  0  0 NA NA  2  3 NA NA NA NA  1 NA  2  2  3  0  0  0 NA NA  0  0  3  1  1
+ [289]  0  9  2  0  2  2 NA NA  1 NA NA NA  0  0 NA NA  3 NA  0 NA NA  1 NA  9 NA  0  3 NA NA NA NA NA  0 NA  1 NA  0  3  2 NA NA  2  1 NA NA NA NA  2
+ [337]  0  0  0  2 NA  1  1 NA  0  0 NA NA  1  3 NA  0 NA  2  1 NA NA  9 NA NA NA NA NA NA  9  0 NA  2  0 NA NA NA NA NA  2 NA NA NA  2  0  1  2  9  9
+ [385]  0 NA  3  0 NA  2 NA  3  9  9  2  0 NA NA  1  2 NA NA  0  3 NA NA NA NA NA NA  2  0 NA NA NA NA NA NA  9  0 NA NA NA NA NA NA  3 NA  0  2  9 NA
+ [433]  0  1 NA  0  2  1 NA NA  1  0  2  0 NA  0  3  3  1  0  3 NA  3  0 NA  2 NA  1  2  0 NA  0 NA NA NA NA  0  9  2  0 NA NA NA NA NA NA  0 NA NA  0
+ [481]  0  2 NA NA  0 NA  1 NA  2  3  0  2  2  0  0  1  2  3  9 NA  9 NA  2  2  1  2  2  1  2  0  1  3 NA NA NA NA NA NA NA  9 NA NA NA NA NA  1  0  0
+ [529] NA  3 NA  2  2  9  3 NA NA  2  2 NA  2  2 NA  2 NA NA  0 NA NA  1  0 NA NA  1  2  2 NA NA NA NA NA  0  2  0 NA  0  0  0  0  0  0 NA NA NA NA NA
+ [577] NA NA  2 NA NA NA NA  2 NA  0  3  0  0 NA NA NA NA  0 NA NA  0  3 NA NA NA  0 NA NA NA  9 NA NA NA NA NA NA NA  2  2 NA  2 NA NA NA  0 NA NA  1
+ [625]  1  9  0  2 NA NA NA NA  1 NA NA NA  2 NA  0  0 NA  0  9  2 NA  0  1 NA  0  1 NA  0  0  2 NA  1  9 NA  0  3  3  1  3 NA  2 NA NA  2 NA  0  9  0
+ [673]  1  1 NA  2  0 NA  2  1 NA NA NA NA  3  3 NA NA  3  0 NA  9 NA  3 NA NA  9  2  0  3  2  0  0 NA  0  2  2 NA NA  2  0 NA NA  2 NA  1 NA NA NA NA
+ [721] NA NA  2  2 NA  0 NA  2  0  2  2  2  2  1  0 NA NA NA NA  1 NA  2  0  0 NA NA NA  2  1  1 NA  2  0  1  0 NA  1  2  1  1  9  0 NA NA  0  1 NA NA
+ [769]  1  0  2 NA NA NA NA NA NA NA NA NA  0 NA NA NA  0 NA  1  1  2  1 NA NA NA NA NA NA NA  2 NA  0 NA NA  0 NA NA  0 NA NA NA NA  0 NA  0 NA NA  0
+ [817] NA NA  2  0 NA NA NA NA NA NA NA NA NA NA  1 NA NA NA NA NA  2 NA  1  0 NA  2  2  1  2 NA NA NA NA  0  9 NA NA  2  0 NA NA  3  0  2  2  0  1  0
+ [865]  0 NA  1  9  0  0  0  0  2  0  1  0  1  0 NA  0 NA NA  9 NA NA NA NA NA NA NA NA NA NA  0 NA  3  0 NA NA  2  9 NA NA NA  3 NA  1 NA NA  1  2  0
+ [913] NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA  0  1 NA NA NA NA NA NA  0 NA NA NA NA  2  1 NA NA  1 NA NA  1  0  1 NA  0  9 NA NA  1
+ [961] NA  2 NA NA  0 NA NA  3  0 NA NA  2  0 NA NA NA NA NA NA  3 NA  2 NA NA NA NA  1  2  1  0 NA  0 NA  0 NA NA NA NA NA  0
+ [ reached getOption("max.print") -- omitted 2791 entries ]
+
+Labels:
+ + +
+ +
+ + +
AEDB$indexsymptoms_latest_4g
+ + +
<labelled<double>[3791]>:  symptoms strokefenotype en symptoms.4g .
+   [1]  2  3  2  0  0  2  0  3 NA  0  0  0  2  1  0  0  0  0 NA  0  1  0  0  0  0  2  0  0 NA  0  0 NA  1  0  9  2  0  9  0  1  0  9  0  0  3  2  0 NA
+  [49]  0  0  1  9  2  9  1  0  0  2  2  9  0  9  2  0  0  0  2 NA  0  0  0  0  0  0  2  0  0  2  3  0  1  3  0 NA  0  0  9  2  3  3 NA  2  0  0  3 NA
+  [97] NA  3  1  0  9  1  2  0  0  0  2  0  0 NA NA  0  0  9 NA  2  2  1  1  2  0  0  9  2  0  3 NA  0 NA  2  0  0  0 NA  9  2  2 NA  0  3  2  0  2  0
+ [145]  1  1  0  0  0 NA NA  2 NA NA  3  0  9  0  0 NA  0  9  1  3  2  2  1  0  2 NA  0  1  0 NA  2  2  1  1 NA  0 NA  3  0  3 NA NA  0 NA NA NA NA  2
+ [193]  0  2  0  0  0  3 NA  2  0  0  0  0  0  0 NA  0 NA  3 NA  2  0 NA  2  0  3 NA NA  3 NA NA NA NA NA NA  0 NA  3  9 NA  0 NA  0 NA NA  1  0  2  3
+ [241] NA NA NA  0 NA NA  1 NA  2 NA NA NA NA  0  1  2  0 NA  0 NA  3  0  3  0  0 NA NA  2  3 NA NA NA NA  1 NA  2  2  3  0  0  0 NA NA  0  0  3  1  1
+ [289]  0  9  2  0  2  2 NA NA  1 NA NA NA  0  0 NA NA  3 NA  0 NA NA  1 NA  9 NA  0  3 NA NA NA NA NA  0 NA  1 NA  0  3  2 NA NA  2  1 NA NA NA NA  2
+ [337]  0  0  0  2 NA  1  1 NA  0  0 NA NA  1  3 NA  0 NA  2  1 NA NA  9 NA NA NA NA NA NA  9  0 NA  2  0 NA NA NA NA NA  2 NA NA NA  2  0  1  2  9  9
+ [385]  0 NA  3  0 NA  2 NA  3  9  9  2  0 NA NA  1  2 NA NA  0  3 NA NA NA NA NA NA  2  0 NA NA NA NA NA NA  9  0 NA NA NA NA NA NA  3 NA  0  2  9 NA
+ [433]  0  1 NA  0  2  1 NA NA  1  0  2  0 NA  0  3  3  1  0  3 NA  3  0 NA  2 NA  1  2  0 NA  0 NA NA NA NA  0  9  2  0 NA NA NA NA NA NA  0 NA NA  0
+ [481]  0  2 NA NA  0 NA  1 NA  2  3  0  2  2  0  0  1  2  3  9 NA  9 NA  2  2  1  2  2  1  2  0  1  3 NA NA NA NA NA NA NA  9 NA NA NA NA NA  1  0  0
+ [529] NA  3 NA  2  2  9  3 NA NA  2  2 NA  2  2 NA  2 NA NA  0 NA NA  1  0 NA NA  1  2  2 NA NA NA NA NA  0  2  0 NA  0  0  0  0  0  0 NA NA NA NA NA
+ [577] NA NA  2 NA NA NA NA  2 NA  0  3  0  0 NA NA NA NA  0 NA NA  0  3 NA NA NA  0 NA NA NA  9 NA NA NA NA NA NA NA  2  2 NA  2 NA NA NA  0 NA NA  1
+ [625]  1  9  0  2 NA NA NA NA  1 NA NA NA  2 NA  0  0 NA  0  9  2 NA  0  1 NA  0  1 NA  0  0  2 NA  1  9 NA  0  3  3  1  3 NA  2 NA NA  2 NA  0  9  0
+ [673]  1  1 NA  2  0 NA  2  1 NA NA NA NA  3  3 NA NA  3  0 NA  9 NA  3 NA NA  9  2  0  3  2  0  0 NA  0  2  2 NA NA  2  0 NA NA  2 NA  1 NA NA NA NA
+ [721] NA NA  2  2 NA  0 NA  2  0  2  2  2  2  1  0 NA NA NA NA  1 NA  2  0  0 NA NA NA  2  1  1 NA  2  0  1  0 NA  1  2  1  1  9  0 NA NA  0  1 NA NA
+ [769]  1  0  2 NA NA NA NA NA NA NA NA NA  0 NA NA NA  0 NA  1  1  2  1 NA NA NA NA NA NA NA  2 NA  0 NA NA  0 NA NA  0 NA NA NA NA  0 NA  0 NA NA  0
+ [817] NA NA  2  0 NA NA NA NA NA NA NA NA NA NA  1 NA NA NA NA NA  2 NA  1  0 NA  2  2  1  2 NA NA NA NA  0  9 NA NA  2  0 NA NA  3  0  2  2  0  1  0
+ [865]  0 NA  1  9  0  0  0  0  2  0  1  0  1  0 NA  0 NA NA  9 NA NA NA NA NA NA NA NA NA NA  0 NA  3  0 NA NA  2  9 NA NA NA  3 NA  1 NA NA  1  2  0
+ [913] NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA NA  0  1 NA NA NA NA NA NA  0 NA NA NA NA  2  1 NA NA  1 NA NA  1  0  1 NA  0  9 NA NA  1
+ [961] NA  2 NA NA  0 NA NA  3  0 NA NA  2  0 NA NA NA NA NA NA  3 NA  2 NA NA NA NA  1  2  1  0 NA  0 NA  0 NA NA NA NA NA  0
+ [ reached getOption("max.print") -- omitted 2791 entries ]
+
+Labels:
+ + +
+ +
+ + + +

Getting counts for each of the most important categories.

+ + + +
cat("New 'worst' vs 'latest' symptom categories.\n")
+ + +
New 'worst' vs 'latest' symptom categories.
+ + +
table(as_factor(AEDB$indexsymptoms_worst_4g), as_factor(AEDB$indexsymptoms_latest_4g))
+ + +
         
+          asymp ocular TIA stroke unclear
+  asymp     804     62  84     25      25
+  ocular      0    345   0      0       0
+  TIA         0     19 703      0       1
+  stroke      0      7  18    555       0
+  unclear     0      0   0      0      55
+ + +
cat("\nNew 'worst' symptom categories.\n")
+ + +

+New 'worst' symptom categories.
+ + +
table((AEDB$indexsymptoms_worst_4g))
+ + +

+   0    1    2    3    9 
+1000  345  723  580   55 
+ + +
cat("\nNew 'latest' symptom categories.\n")
+ + +

+New 'latest' symptom categories.
+ + +
table(as_factor(AEDB$indexsymptoms_latest_4g))
+ + +

+  asymp  ocular     TIA  stroke unclear 
+    804     433     805     580      81 
+ + + +

Comparing with the original symptom categories.

+ + + +
cat("New 'latest' vs original symptom 2G categories.\n")
+ + +
New 'latest' vs original symptom 2G categories.
+ + +
table((AEDB$indexsymptoms_latest_4g), AEDB$AsymptSympt2G)
+ + +
   
+    Asymptomatic Symptomatic
+  0          317         479
+  1            2         430
+  2            6         796
+  3            1         576
+  9            7          74
+ + +
cat("\nNew 'latest' vs original symptom 5G categories.\n")
+ + +

+New 'latest' vs original symptom 5G categories.
+ + +
table((AEDB$indexsymptoms_latest_4g), AEDB$Symptoms.5G)
+ + +
   
+    Asymptomatic Ocular Other Retinal infarction Stroke TIA
+  0          317     79    82                  9    128 181
+  1            2    313     4                 32     13  68
+  2            6     11    16                  2     90 677
+  3            1      2     7                  0    488  79
+  9            7     11    10                  0     13  40
+ + +
   
+ + + +

We need to be very strict in defining symptoms. Therefore we +will fix a new variable that groups symptoms at inclusion.

+

Coding of symptoms is as follows:

+
    +
  • asympt 0
    +
  • +
  • ocular 1
    +
  • +
  • TIA 2
    +
  • +
  • stroke 3
    +
  • +
  • unclear 9
  • +
+

We will group as follows:

+
    +
  1. Asymptomatic > 0
  2. +
  3. Symptomatic > 1, 2, 3
  4. +
  5. NA > 9
  6. +
+ + + +

+# Fix symptoms
+attach(AEDB)
+
+# Symptoms.Update2G
+AEDB[,"Symptoms.Update2G"] <- NA
+AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 0] <- "Asymptomatic"
+AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 1 | indexsymptoms_latest_4g == 2 | indexsymptoms_latest_4g == 3] <- "Symptomatic"
+AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 9 ] <- NA
+
+# Symptoms.Update3G
+AEDB[,"Symptoms.Update3G"] <- NA
+AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 0] <- "Asymptomatic"
+AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 1 | indexsymptoms_latest_4g == 2 | indexsymptoms_latest_4g == 3] <- "Symptomatic"
+AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 9 ] <- "Unclear"
+
+detach(AEDB)
+
+table(AEDB$Symptoms.Update2G, AEDB$Symptoms.5G, useNA = "ifany")
+ + +
              
+               Asymptomatic Ocular Other Retinal infarction Stroke  TIA <NA>
+  Asymptomatic          317     79    82                  9    128  181    8
+  Symptomatic             9    326    27                 34    591  824    7
+  <NA>                    7     11    10                  0     13   40 1088
+ + +
table(AEDB$Symptoms.Update3G, AEDB$Symptoms.5G, useNA = "ifany")
+ + +
              
+               Asymptomatic Ocular Other Retinal infarction Stroke  TIA <NA>
+  Asymptomatic          317     79    82                  9    128  181    8
+  Symptomatic             9    326    27                 34    591  824    7
+  Unclear                 7     11    10                  0     13   40    0
+  <NA>                    0      0     0                  0      0    0 1088
+ + + +
+
+

Other clinical characteristics

+

We will also fix the diabetes status variable.

+ + + +

+# Fix diabetes
+attach(AEDB)
+AEDB[,"DiabetesStatus"] <- NA
+AEDB$DiabetesStatus[DM.composite == -999] <- NA
+AEDB$DiabetesStatus[DM.composite == 0] <- "Control (no Diabetes Dx/Med)"
+AEDB$DiabetesStatus[DM.composite == 1] <- "Diabetes"
+detach(AEDB)
+
+table(AEDB$DM.composite, AEDB$DiabetesStatus)
+ + +
   
+    Control (no Diabetes Dx/Med) Diabetes
+  0                         2764        0
+  1                            0      985
+ + +
# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "DM.composite", "DiabetesStatus"))
+# require(labelled)
+# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
+# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
+# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
+# AEDB.temp$DiabetesStatus <- to_factor(AEDB.temp$DiabetesStatus)
+# 
+# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
+# 
+# rm(AEDB.temp)
+ + + +

We will also fix the smoking status variable. We are +interested in whether someone never, ever or is currently (at the time +of inclusion) smoking. This is based on the questionnaire.

+
    +
  • diet801: are you a smoker?
  • +
  • diet802: did you smoke in the past?
  • +
+

We already have some variables indicating smoking status:

+
    +
  • SmokingReported: patient has reported to smoke.
  • +
  • SmokingYearOR: smoking in the year of surgery?
  • +
  • SmokerCurrent: currently smoking?
  • +
+ + + +
require(labelled)
+AEDB$diet801 <- to_factor(AEDB$diet801)
+AEDB$diet802 <- to_factor(AEDB$diet802)
+AEDB$diet805 <- to_factor(AEDB$diet805)
+AEDB$SmokingReported <- to_factor(AEDB$SmokingReported)
+AEDB$SmokerCurrent <- to_factor(AEDB$SmokerCurrent)
+AEDB$SmokingYearOR <- to_factor(AEDB$SmokingYearOR)
+
+# table(AEDB$diet801)
+# table(AEDB$diet802)
+# table(AEDB$SmokingReported)
+# table(AEDB$SmokerCurrent)
+# table(AEDB$SmokingYearOR)
+# table(AEDB$SmokingReported, AEDB$SmokerCurrent, useNA = "ifany", dnn = c("Reported smoking", "Current smoker"))
+# 
+# table(AEDB$diet801, AEDB$diet802, useNA = "ifany", dnn = c("Smoker", "Past smoker"))
+
+cat("\nFixing smoking status.\n")
+ + +

+Fixing smoking status.
+ + +
attach(AEDB)
+AEDB[,"SmokerStatus"] <- NA
+AEDB$SmokerStatus[diet802 == "don't know"] <- "Never smoked"
+AEDB$SmokerStatus[diet802 == "I still smoke"] <- "Current smoker"
+AEDB$SmokerStatus[SmokerCurrent == "no" & diet802 == "no"] <- "Never smoked"
+AEDB$SmokerStatus[SmokerCurrent == "no" & diet802 == "yes"] <- "Ex-smoker"
+AEDB$SmokerStatus[SmokerCurrent == "yes"] <- "Current smoker"
+AEDB$SmokerStatus[SmokerCurrent == "no data available/missing"] <- NA
+# AEDB$SmokerStatus[is.na(SmokerCurrent)] <- "Never smoked"
+detach(AEDB)
+
+cat("\n* Current smoking status.\n")
+ + +

+* Current smoking status.
+ + +
table(AEDB$SmokerCurrent,
+      useNA = "ifany", 
+      dnn = c("Current smoker"))
+ + +
Current smoker
+no data available/missing                        no                       yes                      <NA> 
+                        0                      2364                      1308                       119 
+ + +
cat("\n* Updated smoking status.\n")
+ + +

+* Updated smoking status.
+ + +
table(AEDB$SmokerStatus,
+      useNA = "ifany", 
+      dnn = c("Updated smoking status"))
+ + +
Updated smoking status
+Current smoker      Ex-smoker   Never smoked           <NA> 
+          1308           1814            389            280 
+ + +
cat("\n* Comparing to 'SmokerCurrent'.\n")
+ + +

+* Comparing to 'SmokerCurrent'.
+ + +
table(AEDB$SmokerStatus, AEDB$SmokerCurrent, 
+      useNA = "ifany", 
+      dnn = c("Updated smoking status", "Current smoker"))
+ + +
                      Current smoker
+Updated smoking status no data available/missing   no  yes <NA>
+        Current smoker                         0    0 1308    0
+        Ex-smoker                              0 1814    0    0
+        Never smoked                           0  389    0    0
+        <NA>                                   0  161    0  119
+ + +
# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "DM.composite", "DiabetesStatus"))
+# require(labelled)
+# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
+# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
+# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
+# AEDB.temp$DiabetesStatus <- to_factor(AEDB.temp$DiabetesStatus)
+# 
+# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
+# 
+# rm(AEDB.temp)
+ + + +

We will also fix the alcohol status variable.

+ + + +

+# Fix diabetes
+attach(AEDB)
+AEDB[,"AlcoholUse"] <- NA
+AEDB$AlcoholUse[diet810 == -999] <- NA
+AEDB$AlcoholUse[diet810 == 0] <- "No"
+AEDB$AlcoholUse[diet810 == 1] <- "Yes"
+detach(AEDB)
+
+# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "diet810", "AlcoholUse"))
+# require(labelled)
+# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
+# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
+# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
+# AEDB.temp$AlcoholUse <- to_factor(AEDB.temp$AlcoholUse)
+# 
+# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
+# 
+# rm(AEDB.temp)
+ + + +

We will also fix a history of CAD, stroke or peripheral intervention +status variable. This will be based on CAD_history, +Stroke_history, and Peripheral.interv

+ + + +

+# Fix diabetes
+attach(AEDB)
+AEDB[,"MedHx_CVD"] <- NA
+AEDB$MedHx_CVD[CAD_history == 0 | Stroke_history == 0 | Peripheral.interv == 0] <- "No"
+AEDB$MedHx_CVD[CAD_history == 1 | Stroke_history == 1 | Peripheral.interv == 1] <- "yes"
+detach(AEDB)
+
+table(AEDB$CAD_history)
+ + +

+   0    1 
+2430 1285 
+ + +
table(AEDB$Stroke_history)
+ + +

+   0    1 
+2763  947 
+ + +
table(AEDB$Peripheral.interv)
+ + +

+   0    1 
+2579 1099 
+ + +
table(AEDB$MedHx_CVD)
+ + +

+  No  yes 
+1309 2475 
+ + +
# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "diet810", "AlcoholUse"))
+# require(labelled)
+# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
+# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
+# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
+# AEDB.temp$AlcoholUse <- to_factor(AEDB.temp$AlcoholUse)
+# 
+# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
+# 
+# rm(AEDB.temp)
+ + + +
+
+

Plaque phenotypes

+

We will also fix the plaquephenotypes variable.

+

Coding of symptoms is as follows:

+
    +
  • missing -999
    +
  • +
  • not relevant -888
  • +
  • fibrous 1
    +
  • +
  • fibroatheromatous 2
    +
  • +
  • atheromatous 3
  • +
+ + + +

+# Fix plaquephenotypes
+attach(AEDB)
+AEDB[,"OverallPlaquePhenotype"] <- NA
+AEDB$OverallPlaquePhenotype[plaquephenotype == -999] <- NA
+AEDB$OverallPlaquePhenotype[plaquephenotype == -999] <- NA
+AEDB$OverallPlaquePhenotype[plaquephenotype == 1] <- "fibrous"
+AEDB$OverallPlaquePhenotype[plaquephenotype == 2] <- "fibroatheromatous"
+AEDB$OverallPlaquePhenotype[plaquephenotype == 3] <- "atheromatous"
+detach(AEDB)
+
+# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "plaquephenotype", "OverallPlaquePhenotype"))
+# require(labelled)
+# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
+# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
+# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
+# 
+# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
+# 
+# rm(AEDB.temp)
+ + + +

We will also fix and inverse-rank normal transform the continuous +(manually) scored plaque phenotypes.

+ + + +
AEDB$macmean0 <- as.numeric(AEDB$macmean0)
+AEDB$smcmean0 <- as.numeric(AEDB$smcmean0)
+AEDB$neutrophils <- as.numeric(AEDB$neutrophils)
+AEDB$Mast_cells_plaque <- as.numeric(AEDB$Mast_cells_plaque)
+AEDB$vessel_density_averaged <- as.numeric(AEDB$vessel_density_averaged)
+
+AEDB$MAC_rankNorm <- qnorm((rank(AEDB$macmean0, na.last = "keep") - 0.5) / sum(!is.na(AEDB$macmean0)))
+AEDB$SMC_rankNorm <- qnorm((rank(AEDB$smcmean0, na.last = "keep") - 0.5) / sum(!is.na(AEDB$smcmean0)))
+AEDB$Neutrophils_rankNorm <- qnorm((rank(AEDB$neutrophils, na.last = "keep") - 0.5) / sum(!is.na(AEDB$neutrophils)))
+AEDB$MastCells_rankNorm <- qnorm((rank(AEDB$Mast_cells_plaque, na.last = "keep") - 0.5) / sum(!is.na(AEDB$Mast_cells_plaque)))
+AEDB$VesselDensity_rankNorm <- qnorm((rank(AEDB$vessel_density_averaged, na.last = "keep") - 0.5) / sum(!is.na(AEDB$vessel_density_averaged)))
+ + + + + + +
library(labelled)
+AEDB$Gender <- to_factor(AEDB$Gender)
+library(patchwork)
+
+p1 <- ggpubr::gghistogram(AEDB, "macmean0", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "% of macrophages (CD68)",
+                    xlab = "% per region of interest", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p2 <- ggpubr::gghistogram(AEDB, "MAC_rankNorm", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "% of macrophages (CD68)",
+                   xlab = "% per region of interest\ninverse-rank normalized number", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p1 | p2 
+ + +

+ + +

+p1 <- ggpubr::gghistogram(AEDB, "smcmean0", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "% of smooth muscle cells (SMA)",
+                    xlab = "% per region of interest", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p2 <- ggpubr::gghistogram(AEDB, "SMC_rankNorm", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "% of smooth muscle cells (SMA)",
+                   xlab = "% per region of interest\ninverse-rank normalized number", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p1 | p2 
+ + +

+ + +

+
+p1 <- ggpubr::gghistogram(AEDB, "neutrophils", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "number of neutrophils (CD66b)",
+                    xlab = "counts per plaque", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p2 <- ggpubr::gghistogram(AEDB, "Neutrophils_rankNorm", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "number of neutrophils (CD66b)",
+                   xlab = "counts per plaque\ninverse-rank normalized number", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p1 | p2 
+ + +

+ + +

+
+p1 <- ggpubr::gghistogram(AEDB, "Mast_cells_plaque", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "number of mast cells",
+                    xlab = "counts per plaque", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p2 <- ggpubr::gghistogram(AEDB, "MastCells_rankNorm", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "number of mast cells",
+                   xlab = "counts per plaque\ninverse-rank normalized number", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p1 | p2 
+ + +

+ + +

+
+p1 <- ggpubr::gghistogram(AEDB, "vessel_density_averaged", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "number of intraplaque neovessels",
+                    xlab = "counts per 3-4 hotspots", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p2 <- ggpubr::gghistogram(AEDB, "VesselDensity_rankNorm", 
+                    # y = "..count..", 
+                    color = "white",
+                    fill = "Gender",
+                    palette = c("#1290D9", "#DB003F"), 
+                    add = "median", 
+                    #add_density = TRUE,
+                    rug = TRUE,
+                    #add.params =  list(color = "black", linetype = 2), 
+                    title = "number of intraplaque neovessels",
+                   xlab = "counts per 3-4 hotspots\ninverse-rank normalized number", 
+                    ggtheme = theme_minimal())
+ + +
Warning: Using `bins = 30` by default. Pick better value with the argument `bins`.
+ + +
p1 | p2 
+ + +

+ + +

+rm(p1, p2)
+ + + +

Here we calculate the plaque instability/vulnerability +index

+ + + +
# Plaque vulnerability
+require(labelled)
+AEDB$Macrophages.bin <- to_factor(AEDB$Macrophages.bin)
+AEDB$SMC.bin <- to_factor(AEDB$SMC.bin)
+AEDB$IPH.bin <- to_factor(AEDB$IPH.bin)
+AEDB$Calc.bin <- to_factor(AEDB$Calc.bin)
+AEDB$Collagen.bin <- to_factor(AEDB$Collagen.bin)
+AEDB$Fat.bin_10 <- to_factor(AEDB$Fat.bin_10)
+AEDB$Fat.bin_40 <- to_factor(AEDB$Fat.bin_40)
+
+table(AEDB$Macrophages.bin)
+ + +

+      no/minor moderate/heavy 
+          1602           1215 
+ + +
table(AEDB$Fat.bin_10)
+ + +

+ <10%  >10% 
+ 1226  1628 
+ + +
table(AEDB$Collagen.bin)
+ + +

+      no/minor moderate/heavy 
+           540           2297 
+ + +
table(AEDB$SMC.bin)
+ + +

+      no/minor moderate/heavy 
+           870           1962 
+ + +
table(AEDB$IPH.bin)
+ + +

+  no  yes 
+1223 1628 
+ + +
# SPSS code
+
+# 
+# *** syntax- Plaque vulnerability**.
+# COMPUTE Macro_instab = -999.
+# IF macrophages.bin=2 Macro_instab=1.
+# IF macrophages.bin=1 Macro_instab=0.
+# EXECUTE.
+# 
+# COMPUTE Fat10_instab = -999.
+# IF Fat.bin_10=2 Fat10_instab=1.
+# IF Fat.bin_10=1 Fat10_instab=0.
+# EXECUTE.
+# 
+# COMPUTE coll_instab=-999.
+# IF Collagen.bin=2 coll_instab=0.
+# IF Collagen.bin=1 coll_instab=1.
+# EXECUTE.
+# 
+# 
+# COMPUTE SMC_instab=-999.
+# IF SMC.bin=2 SMC_instab=0.
+# IF SMC.bin=1 SMC_instab=1.
+# EXECUTE.
+# 
+# COMPUTE IPH_instab=-999.
+# IF IPH.bin=0 IPH_instab=0.
+# IF IPH.bin=1 IPH_instab=1.
+# EXECUTE.
+# 
+# COMPUTE Instability=Macro_instab + Fat10_instab +  coll_instab + SMC_instab + IPH_instab.
+# EXECUTE.
+
+# Fix plaquephenotypes
+attach(AEDB)
+# mac instability
+AEDB[,"MAC_Instability"] <- NA
+AEDB$MAC_Instability[Macrophages.bin == -999] <- NA
+AEDB$MAC_Instability[Macrophages.bin == "no/minor"] <- 0
+AEDB$MAC_Instability[Macrophages.bin == "moderate/heavy"] <- 1
+
+# fat instability
+AEDB[,"FAT10_Instability"] <- NA
+AEDB$FAT10_Instability[Fat.bin_10 == -999] <- NA
+AEDB$FAT10_Instability[Fat.bin_10 == " <10%"] <- 0
+AEDB$FAT10_Instability[Fat.bin_10 == " >10%"] <- 1
+
+# col instability 
+AEDB[,"COL_Instability"] <- NA
+AEDB$COL_Instability[Collagen.bin == -999] <- NA
+AEDB$COL_Instability[Collagen.bin == "no/minor"] <- 1
+AEDB$COL_Instability[Collagen.bin == "moderate/heavy"] <- 0
+
+# smc instability
+AEDB[,"SMC_Instability"] <- NA
+AEDB$SMC_Instability[SMC.bin == -999] <- NA
+AEDB$SMC_Instability[SMC.bin == "no/minor"] <- 1
+AEDB$SMC_Instability[SMC.bin == "moderate/heavy"] <- 0
+
+# iph instability
+AEDB[,"IPH_Instability"] <- NA
+AEDB$IPH_Instability[IPH.bin == -999] <- NA
+AEDB$IPH_Instability[IPH.bin == "no"] <- 0
+AEDB$IPH_Instability[IPH.bin == "yes"] <- 1
+
+detach(AEDB)
+
+table(AEDB$MAC_Instability, useNA = "ifany")
+ + +

+   0    1 <NA> 
+1602 1215  974 
+ + +
table(AEDB$FAT10_Instability, useNA = "ifany")
+ + +

+   0    1 <NA> 
+1226 1628  937 
+ + +
table(AEDB$COL_Instability, useNA = "ifany")
+ + +

+   0    1 <NA> 
+2297  540  954 
+ + +
table(AEDB$SMC_Instability, useNA = "ifany")
+ + +

+   0    1 <NA> 
+1962  870  959 
+ + +
table(AEDB$IPH_Instability, useNA = "ifany")
+ + +

+   0    1 <NA> 
+1223 1628  940 
+ + +
# creating vulnerability index
+AEDB <- AEDB %>% mutate(Plaque_Vulnerability_Index = factor(rowSums(.[grep("_Instability", names(.))], na.rm = TRUE)),
+                                )
+
+table(AEDB$Plaque_Vulnerability_Index, useNA = "ifany")
+ + +

+   0    1    2    3    4    5 
+1324  655  728  676  298  110 
+ + +
# str(AEDB$Plaque_Vulnerability_Index)
+ + + +
+
+
+

Prepare baseline summary

+

We are interested in the following variables at baseline in the whole +cohort.

+
    +
  • Age (years)
  • +
  • Female sex (N, %)
  • +
  • Artery type (N, %)
  • +
  • Hospital (N, %) + + + + + + + + + + + + + + + +
  • +
+ + + +
cat("====================================================================================================\n")
+ + +
====================================================================================================
+ + +
cat("SELECTION THE SHIZZLE\n")
+ + +
SELECTION THE SHIZZLE
+ + +
### Artery levels
+# AEdata$Artery_summary: 
+#           value                                                                                   label
+# NOT USE - 0 No artery known (yet), no surgery (patient ill, died, exited study), re-numbered to AAA
+# USE - 1                                                                  carotid (left & right)
+# USE - 2                                               femoral/iliac (left, right or both sides)
+# NOT USE - 3                                               other carotid arteries (common, external)
+# NOT USE - 4                                   carotid bypass and injury (left, right or both sides)
+# NOT USE - 5                                                         aneurysmata (carotid & femoral)
+# NOT USE - 6                                                                                   aorta
+# NOT USE - 7                                            other arteries (renal, popliteal, vertebral)
+# NOT USE - 8                        femoral bypass, angioseal and injury (left, right or both sides)
+
+### AEdata$informedconsent
+#           value                                                                                           label
+# NOT USE - -999                                                                                         missing
+# NOT USE - 0                                                                                        no, died
+# USE - 1                                                                                             yes
+# USE - 2                                                             yes, health treatment when possible
+# USE - 3                                                                        yes, no health treatment
+# USE - 4                                                yes, no health treatment, no commercial business
+# NOT USE - 5                                                          yes, no tissue, no commerical business
+# NOT USE - 6                      yes, no tissue, no questionnaires, no medical info, no commercial business
+# USE - 7                             yes, no questionnaires, no health treatment, no commercial business
+# USE - 8                                          yes, no questionnaires, health treatment when possible
+# NOT USE - 9                  yes, no tissue, no questionnaires, no health treatment, no commerical business
+# USE - 10                               yes, no health treatment, no medical info, no commercial business
+# NOT USE - 11 yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business
+# USE - 12                                                     yes, no questionnaires, no health treatment
+# NOT USE - 13                                                             yes, no tissue, no health treatment
+# NOT USE - 14                                                               yes, no tissue, no questionnaires
+# NOT USE - 15                                                  yes, no tissue, health treatment when possible
+# NOT USE - 16                                                                                  yes, no tissue
+# USE - 17                                                                     yes, no commerical business
+# USE - 18                                     yes, health treatment when possible, no commercial business
+# USE - 19                                                    yes, no medical info, no commercial business
+# USE - 20                                                                          yes, no questionnaires
+# NOT USE - 21                         yes, no tissue, no questionnaires, no health treatment, no medical info
+# NOT USE - 22                  yes, no tissue, no questionnaires, no health treatment, no commercial business
+# USE - 23                                                                            yes, no medical info
+# USE - 24                                                  yes, no questionnaires, no commercial business
+# USE - 25                                    yes, no questionnaires, no health treatment, no medical info
+# USE - 26                  yes, no questionnaires, health treatment when possible, no commercial business
+# USE - 27                                                      yes,  no health treatment, no medical info
+# NOT USE - 28                                                                             no, doesn't want to
+# NOT USE - 29                                                                              no, unable to sign
+# NOT USE - 30                                                                                 no, no reaction
+# NOT USE - 31                                                                                        no, lost
+# NOT USE - 32                                                                                     no, too old
+# NOT USE - 34                                            yes, no medical info, health treatment when possible
+# NOT USE - 35                                             no (never asked for IC because there was no tissue)
+# USE - 36                    yes, no medical info, no commercial business, health treatment when possible
+# NOT USE - 37                                                                                    no, endpoint
+# USE - 38                                                         wil niets invullen, wel alles gebruiken
+# USE - 39                                           second informed concents: yes, no commercial business
+# NOT USE - 40                                                                              nooit geincludeerd
+
+cat("- sanity checking PRIOR to selection")
+ + +
- sanity checking PRIOR to selection
+ + +
library(data.table)
+require(labelled)
+ae.gender <- to_factor(AEDB$Gender)
+ae.hospital <- to_factor(AEDB$Hospital)
+table(ae.gender, ae.hospital, dnn = c("Sex", "Hospital"))
+ + +
        Hospital
+Sex      St. Antonius, Nieuwegein UMC Utrecht
+  female                      524         636
+  male                       1211        1420
+ + +
ae.artery <- to_factor(AEDB$Artery_summary)
+table(ae.artery, ae.gender, dnn = c("Sex", "Artery"))
+ + +
                                                                                         Artery
+Sex                                                                                       female male
+  No artery known (yet), no surgery (patient ill, died, exited study), re-numbered to AAA      0    0
+  carotid (left & right)                                                                     805 1781
+  femoral/iliac (left, right or both sides)                                                  320  796
+  other carotid arteries (common, external)                                                   17   35
+  carotid bypass and injury (left, right or both sides)                                        6    3
+  aneurysmata (carotid & femoral)                                                              1    0
+  aorta                                                                                        3    5
+  other arteries (renal, popliteal, vertebral)                                                 4    9
+  femoral bypass, angioseal and injury (left, right or both sides)                             4    2
+ + +
rm(ae.gender, ae.hospital, ae.artery)
+
+# I change numeric and factors manually because, well, I wouldn't know how to fix it otherwise
+# to have this 'tibble' work with 'tableone'... :-)
+
+AEDB$Age <- as.numeric(AEDB$Age)
+AEDB$diastoli <- as.numeric(AEDB$diastoli)
+AEDB$systolic <- as.numeric(AEDB$systolic)
+
+AEDB$TC_finalCU <- as.numeric(AEDB$TC_finalCU)
+AEDB$LDL_finalCU <- as.numeric(AEDB$LDL_finalCU)
+AEDB$HDL_finalCU <- as.numeric(AEDB$HDL_finalCU)
+AEDB$TG_finalCU <- as.numeric(AEDB$TG_finalCU)
+
+AEDB$TC_final <- as.numeric(AEDB$TC_final)
+AEDB$LDL_final <- as.numeric(AEDB$LDL_final)
+AEDB$HDL_final <- as.numeric(AEDB$HDL_final)
+AEDB$TG_final <- as.numeric(AEDB$TG_final)
+
+AEDB$Age <- as.numeric(AEDB$Age)
+AEDB$GFR_MDRD <- as.numeric(AEDB$GFR_MDRD)
+AEDB$BMI <- as.numeric(AEDB$BMI)
+AEDB$eCigarettes <- as.numeric(AEDB$eCigarettes)
+AEDB$ePackYearsSmoking <- as.numeric(AEDB$ePackYearsSmoking)
+AEDB$EP_composite_time <- as.numeric(AEDB$EP_composite_time)
+AEDB$EP_major_time <- as.numeric(AEDB$EP_major_time)
+
+require(labelled)
+AEDB$Artery_summary <- to_factor(AEDB$Artery_summary)
+AEDB$ORyear <- to_factor(AEDB$ORyear)
+AEDB$Gender <- to_factor(AEDB$Gender)
+AEDB$Hospital <- to_factor(AEDB$Hospital)
+AEDB$KDOQI <- to_factor(AEDB$KDOQI)
+AEDB$BMI_WHO <- to_factor(AEDB$BMI_WHO)
+AEDB$DiabetesStatus <- to_factor(AEDB$DiabetesStatus)
+AEDB$SmokerStatus <- to_factor(AEDB$SmokerStatus)
+AEDB$AlcoholUse <- to_factor(AEDB$AlcoholUse)
+
+AEDB$Hypertension.selfreport <- to_factor(AEDB$Hypertension1)
+AEDB$Hypertension.selfreportdrug <- to_factor(AEDB$Hypertension2)
+AEDB$Hypertension.composite <- to_factor(AEDB$Hypertension.composite)
+AEDB$Hypertension.drugs <- to_factor(AEDB$Hypertension.drugs)
+
+AEDB$Med.anticoagulants <- to_factor(AEDB$Med.anticoagulants)
+AEDB$Med.all.antiplatelet <- to_factor(AEDB$Med.all.antiplatelet)
+AEDB$Med.Statin.LLD <- to_factor(AEDB$Med.Statin.LLD)
+
+AEDB$Stroke_Dx <- to_factor(AEDB$Stroke_Dx)
+AEDB$CAD_history <- to_factor(AEDB$CAD_history)
+AEDB$PAOD <- to_factor(AEDB$PAOD)
+AEDB$Peripheral.interv <- to_factor(AEDB$Peripheral.interv)
+
+AEDB$sympt <- to_factor(AEDB$sympt)
+AEDB$Symptoms.3g <- to_factor(AEDB$Symptoms.3g)
+AEDB$Symptoms.4g <- to_factor(AEDB$Symptoms.4g)
+AEDB$Symptoms.5G <- to_factor(AEDB$Symptoms.5G)
+AEDB$AsymptSympt <- to_factor(AEDB$AsymptSympt)
+AEDB$AsymptSympt2G <- to_factor(AEDB$AsymptSympt2G)
+AEDB$Symptoms.Update2G <- to_factor(AEDB$Symptoms.Update2G)
+AEDB$Symptoms.Update3G <- to_factor(AEDB$Symptoms.Update3G)
+
+AEDB$restenos <- to_factor(AEDB$restenos)
+AEDB$stenose <- to_factor(AEDB$stenose)
+AEDB$EP_composite <- to_factor(AEDB$EP_composite)
+AEDB$EP_major <- to_factor(AEDB$EP_major)
+AEDB$Macrophages.bin <- to_factor(AEDB$Macrophages.bin)
+AEDB$SMC.bin <- to_factor(AEDB$SMC.bin)
+AEDB$IPH.bin <- to_factor(AEDB$IPH.bin)
+AEDB$Calc.bin <- to_factor(AEDB$Calc.bin)
+AEDB$Collagen.bin <- to_factor(AEDB$Collagen.bin)
+AEDB$Fat.bin_10 <- to_factor(AEDB$Fat.bin_10)
+AEDB$Fat.bin_40 <- to_factor(AEDB$Fat.bin_40)
+AEDB$OverallPlaquePhenotype <- to_factor(AEDB$OverallPlaquePhenotype)
+AEDB$Plaque_Vulnerability_Index <- to_factor(AEDB$Plaque_Vulnerability_Index)
+
+AEDB$Artery_summary <- to_factor(AEDB$Artery_summary)
+
+AEDB$informedconsent <- to_factor(AEDB$informedconsent)
+
+AEDB.full <- subset(AEDB,
+                    informedconsent != "missing" & # we are really strict in selecting based on 'informed consent'!
+                       informedconsent != "no, died" & 
+                       informedconsent != "yes, no tissue, no commerical business" &
+                       informedconsent != "yes, no tissue, no questionnaires, no medical info, no commercial business" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commerical business" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business" &
+                       informedconsent != "yes, no tissue, no health treatment" &
+                       informedconsent != "yes, no tissue, no questionnaires" &
+                       informedconsent != "yes, no tissue, health treatment when possible" &
+                       informedconsent != "yes, no tissue" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commercial business" &
+                       informedconsent != "no, doesn't want to" &
+                       informedconsent != "no, unable to sign" & 
+                       informedconsent != "no, no reaction" & 
+                       informedconsent != "no, lost" & 
+                       informedconsent != "no, too old" & 
+                       informedconsent != "yes, no medical info, health treatment when possible" &
+                       informedconsent != "no (never asked for IC because there was no tissue)" &
+                       informedconsent != "no, endpoint" & 
+                       informedconsent != "nooit geincludeerd")
+# AEDB.CEA[1:10, 1:10]
+dim(AEDB.full)
+ + +
[1] 3458 1114
+ + + + + + +
cat("===========================================================================================\n")
+ + +
===========================================================================================
+ + +
cat("CREATE BASELINE TABLE\n")
+ + +
CREATE BASELINE TABLE
+ + +
# Baseline table variables
+basetable_vars = c("Hospital", 
+                   "Artery_summary",
+                   "Age", "Gender")
+                   # "ORyear", 
+                   # "TC_finalCU", "LDL_finalCU", "HDL_finalCU", "TG_finalCU", 
+                   # "TC_final", "LDL_final", "HDL_final", "TG_final", 
+                   # "hsCRP_plasma",
+                   # "systolic", "diastoli", "GFR_MDRD", "BMI", 
+                   # "KDOQI", "BMI_WHO",
+                   # "SmokerStatus", "AlcoholUse",
+                   # "DiabetesStatus", 
+                   # "Hypertension.selfreport", "Hypertension.selfreportdrug", "Hypertension.composite", "Hypertension.drugs", 
+                   # "Med.anticoagulants", "Med.all.antiplatelet", "Med.Statin.LLD", 
+                   # "Stroke_Dx", "sympt", "Symptoms.5G", "AsymptSympt", "AsymptSympt2G",
+                   # "Symptoms.Update2G", 
+                   # "Symptoms.Update3G",
+                   # "restenos", "stenose",
+                   # "CAD_history", "PAOD", "Peripheral.interv", 
+                   # "EP_composite", "EP_composite_time", "EP_major", "EP_major_time",
+                   # "MAC_rankNorm", "SMC_rankNorm", "Macrophages.bin", "SMC.bin",
+                   # "Neutrophils_rankNorm", "MastCells_rankNorm",
+                   # "IPH.bin", "VesselDensity_rankNorm",
+                   # "Calc.bin", "Collagen.bin", 
+                   # "Fat.bin_10", "Fat.bin_40", 
+                   # "OverallPlaquePhenotype", "Plaque_Vulnerability_Index")
+
+basetable_bin = c("Hospital", 
+                  "Artery_summary",
+                  "Gender")
+# basetable_bin
+
+basetable_con = basetable_vars[!basetable_vars %in% basetable_bin]
+# basetable_con
+ + + +
+
+
+

Athero-Express Biobank Study Baseline Characteristics

+

Showing the baseline table of the whole Athero-Express Biobank.

+ + + +
# Create baseline tables
+# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html
+AEDB.tableOne = print(CreateTableOne(vars = basetable_vars, 
+                                         factorVars = basetable_bin,
+                                         # strata = "Symptoms.4g",
+                                         data = AEDB.full, includeNA = TRUE), 
+                          nonnormal = c(), missing = TRUE,
+                          quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, 
+                          format = "pf", 
+                          contDigits = 3)[,1:3]
+ + +
                         
+                          level                                                            Overall        Missing
+  n                                                                                          3458                
+  Hospital % (freq)       St. Antonius, Nieuwegein                                           45.3 (1567)  0.0    
+                          UMC Utrecht                                                        54.7 (1891)         
+  Artery_summary % (freq) carotid (left & right)                                             69.0 (2387)  0.0    
+                          femoral/iliac (left, right or both sides)                          28.8 ( 995)         
+                          other carotid arteries (common, external)                           1.3 (  45)         
+                          carotid bypass and injury (left, right or both sides)               0.2 (   7)         
+                          aneurysmata (carotid & femoral)                                     0.0 (   1)         
+                          aorta                                                               0.2 (   6)         
+                          other arteries (renal, popliteal, vertebral)                        0.3 (  12)         
+                          femoral bypass, angioseal and injury (left, right or both sides)    0.1 (   5)         
+  Age (mean (SD))                                                                          68.733 (9.214) 0.0    
+  Gender % (freq)         female                                                             29.7 (1026)  0.0    
+                          male                                                               70.3 (2432)         
+ + + +
+

Match samples used

+

Here we match the full database with the samples used in +EntropyMasker.

+ + + +
# Remove duplicate rows of the dataframe
+library(dplyr)
+temp <- EM_samples %>% select(., "Studynumber") %>%
+  distinct(.)
+
+AEDB_EM <- merge(temp,
+                 AEDB,
+                 by.x = "Studynumber",
+                 by.y = "STUDY_NUMBER", 
+                 sort = FALSE)
+
+AEDB_EM.full <- subset(AEDB_EM,
+                    informedconsent != "missing" & # we are really strict in selecting based on 'informed consent'!
+                       informedconsent != "no, died" & 
+                       informedconsent != "yes, no tissue, no commerical business" &
+                       informedconsent != "yes, no tissue, no questionnaires, no medical info, no commercial business" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commerical business" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business" &
+                       informedconsent != "yes, no tissue, no health treatment" &
+                       informedconsent != "yes, no tissue, no questionnaires" &
+                       informedconsent != "yes, no tissue, health treatment when possible" &
+                       informedconsent != "yes, no tissue" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info" &
+                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commercial business" &
+                       informedconsent != "no, doesn't want to" &
+                       informedconsent != "no, unable to sign" & 
+                       informedconsent != "no, no reaction" & 
+                       informedconsent != "no, lost" & 
+                       informedconsent != "no, too old" & 
+                       informedconsent != "yes, no medical info, health treatment when possible" &
+                       informedconsent != "no (never asked for IC because there was no tissue)" &
+                       informedconsent != "no, endpoint" & 
+                       informedconsent != "nooit geincludeerd")
+# AEDB_EM.full[1:10, 1:10]
+
+rm(temp)
+ + + + + + +
# Create baseline tables
+# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html
+AEDB_EM.full.tableOne = print(CreateTableOne(vars = basetable_vars, 
+                                         factorVars = basetable_bin,
+                                         # strata = "Symptoms.4g",
+                                         data = AEDB_EM.full, includeNA = TRUE), 
+                          nonnormal = c(), missing = TRUE,
+                          quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, 
+                          format = "pf", 
+                          contDigits = 3)[,1:3]
+ + +
                         
+                          level                                        Overall        Missing
+  n                                                                        56                
+  Hospital % (freq)       St. Antonius, Nieuwegein                       21.4 (12)    0.0    
+                          UMC Utrecht                                    78.6 (44)           
+  Artery_summary % (freq) carotid (left & right)                         85.7 (48)    0.0    
+                          femoral/iliac (left, right or both sides)      12.5 ( 7)           
+                          other arteries (renal, popliteal, vertebral)    1.8 ( 1)           
+  Age (mean (SD))                                                      69.500 (9.260) 0.0    
+  Gender % (freq)         female                                         33.9 (19)    0.0    
+                          male                                           66.1 (37)           
+ + + + + + +

+basetable_vars = c("Hospital", 
+                   "Artery_summary")
+
+basetable_bin = c("Hospital", 
+                  "Artery_summary")
+
+# Create baseline tables
+# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html
+AEDB_EM.tableOne = print(CreateTableOne(vars = basetable_vars, 
+                                         factorVars = basetable_bin,
+                                         # strata = "Symptoms.4g",
+                                         data = AEDB_EM, includeNA = TRUE), 
+                          nonnormal = c(), missing = TRUE,
+                          quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, 
+                          format = "pf", 
+                          contDigits = 3)[,1:3]
+ + +
                         
+                          level                                        Overall    Missing
+  n                                                                      59              
+  Hospital % (freq)       St. Antonius, Nieuwegein                     22.0 (13)  0.0    
+                          UMC Utrecht                                  78.0 (46)         
+  Artery_summary % (freq) carotid (left & right)                       84.7 (50)  0.0    
+                          femoral/iliac (left, right or both sides)    13.6 ( 8)         
+                          other arteries (renal, popliteal, vertebral)  1.7 ( 1)         
+ + + +
+
+

Baseline writing

+

Let’s save the baseline characteristics of the Athero-Express Biobank +Study.

+ + + +
# Write basetable
+
+require(openxlsx)
+
+write.xlsx(as.data.frame(AEDB.tableOne), 
+           file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.BaselineTable.xlsx"), 
+           rowNames = TRUE, 
+           colNames = TRUE, 
+           sheetName = "AE_Base", overwrite = TRUE)
+
+write.xlsx(as.data.frame(AEDB_EM.tableOne), 
+           file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.EM.59.BaselineTable.xlsx"), 
+           rowNames = TRUE, 
+           colNames = TRUE, 
+           sheetName = "AE_Base_EM_59", overwrite = TRUE)
+
+write.xlsx(as.data.frame(AEDB_EM.full.tableOne), 
+           file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.EM.56.BaselineTable.xlsx"), 
+           rowNames = TRUE, 
+           colNames = TRUE, 
+           sheetName = "AE_Base_EM_56", overwrite = TRUE)
+ + + +

We will also write the newly prepared AEDB selected for this study +which we can use in downstream analyses.

+ + + +
saveRDS(AEDB_EM.full, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.EM.FULL.RDS"))
+saveRDS(AEDB.full, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.FULL.RDS"))
+saveRDS(AEDB, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.raw.RDS"))
+ + + +
+
+
+

Session information

+
+
Version:      v1.0.2
+Last update:  2022-07-12
+Written by:   Sander W. van der Laan (s.w.vanderlaan-2[at]umcutrecht.nl).
+Description:  Script to get some Athero-Express Biobank Study baseline characteristics.
+Minimum requirements: R version 3.4.3 (2017-06-30) -- 'Single Candle', Mac OS X El Capitan
+
+**MoSCoW To-Do List**
+The things we Must, Should, Could, and Would have given the time we have.
+_M_
+
+_S_
+
+_C_
+
+_W_
+
+**Changes log**
+* v1.0.2 Simplified the initial script. It now outputs the relevant R-objects (as .RDS).
+* v1.0.1 Update to main AEDB (there is an error in the Age-variable in the new version).
+* v1.0.0 Initial version. Add 'plaque vulnerability index', Fixed baseline table, added codes, and results. Major update to WORCS system.
+
+ + + +
sessionInfo()
+ + +
R version 4.2.1 (2022-06-23)
+Platform: x86_64-apple-darwin21.5.0 (64-bit)
+Running under: macOS Ventura 13.0
+
+Matrix products: default
+LAPACK: /usr/local/Cellar/r/4.2.1/lib/R/lib/libRlapack.dylib
+
+locale:
+[1] en_US.UTF-8/en_US.UTF-8/en_US.UTF-8/C/en_US.UTF-8/en_US.UTF-8
+
+attached base packages:
+[1] grid      tools     stats     graphics  grDevices utils     datasets  methods   base     
+
+other attached packages:
+ [1] openxlsx_4.2.5       patchwork_1.1.0.9000 labelled_2.9.1       sjPlot_2.8.10        UpSetR_1.4.0         ggpubr_0.4.0        
+ [7] forestplot_2.0.1     checkmate_2.1.0      magrittr_2.0.3       pheatmap_1.0.12      devtools_2.4.3       usethis_2.1.6       
+[13] BlandAltmanLeh_0.3.1 tableone_0.13.2      haven_2.5.0          eeptools_1.2.4       DT_0.23              knitr_1.39          
+[19] forcats_0.5.1        stringr_1.4.0        purrr_0.3.4          tibble_3.1.7         ggplot2_3.3.6        tidyverse_1.3.1     
+[25] data.table_1.14.2    naniar_0.6.1         tidyr_1.2.0          dplyr_1.0.9          optparse_1.7.1       readr_2.1.2         
+[31] R.utils_2.11.0       R.oo_1.25.0          R.methodsS3_1.8.2    credentials_1.3.2   
+
+loaded via a namespace (and not attached):
+  [1] readxl_1.4.0       backports_1.4.1    plyr_1.8.7         sp_1.5-0           splines_4.2.1      TH.data_1.1-1      digest_0.6.29     
+  [8] htmltools_0.5.2    fansi_1.0.3        memoise_2.0.1      remotes_2.4.2      tzdb_0.3.0         modelr_0.1.8       sandwich_3.0-2    
+ [15] askpass_1.1        prettyunits_1.1.1  colorspace_2.0-3   rvest_1.0.2        mitools_2.4        xfun_0.31          callr_3.7.0       
+ [22] crayon_1.5.1       jsonlite_1.8.0     lme4_1.1-29        survival_3.3-1     zoo_1.8-10         glue_1.6.2         gtable_0.3.0      
+ [29] emmeans_1.7.5      sjstats_0.18.1     sjmisc_2.8.9       car_3.1-0          pkgbuild_1.3.1     abind_1.4-5        scales_1.2.0      
+ [36] mvtnorm_1.1-3      DBI_1.1.3          rstatix_0.7.0      ggeffects_1.1.2    Rcpp_1.0.8.3       xtable_1.8-4       performance_0.9.1 
+ [43] proxy_0.4-27       foreign_0.8-82     survey_4.1-1       vcd_1.4-10         datawizard_0.4.1   htmlwidgets_1.5.4  httr_1.4.3        
+ [50] getopt_1.20.3      RColorBrewer_1.1-3 ellipsis_0.3.2     farver_2.1.0       pkgconfig_2.0.3    sass_0.4.1         dbplyr_2.2.0      
+ [57] utf8_1.2.2         labeling_0.4.2     tidyselect_1.1.2   rlang_1.0.2        effectsize_0.7.0   munsell_0.5.0      cellranger_1.1.0  
+ [64] cachem_1.0.6       cli_3.3.0          generics_0.1.2     sjlabelled_1.2.0   broom_0.8.0        evaluate_0.15      fastmap_1.1.0     
+ [71] arm_1.12-2         yaml_2.3.5         sys_3.4            processx_3.6.1     fs_1.5.2           zip_2.2.0          pander_0.6.5      
+ [78] visdat_0.5.3       nlme_3.1-157       xml2_1.3.3         brio_1.1.3         compiler_4.2.1     rstudioapi_0.13    curl_4.3.2        
+ [85] e1071_1.7-11       testthat_3.1.4     ggsignif_0.6.3     reprex_2.0.1       bslib_0.3.1        stringi_1.7.6      ps_1.7.1          
+ [92] parameters_0.18.1  desc_1.4.1         lattice_0.20-45    Matrix_1.4-1       nloptr_2.0.3       vctrs_0.4.1        pillar_1.7.0      
+ [99] lifecycle_1.0.1    jquerylib_0.1.4    lmtest_0.9-40      estimability_1.3   maptools_1.1-4     insight_0.17.1     R6_2.5.1          
+[106] gridExtra_2.3      sessioninfo_1.2.2  codetools_0.2-18   boot_1.3-28        MASS_7.3-57        assertthat_0.2.1   pkgload_1.2.4     
+[113] openssl_2.0.2      rprojroot_2.0.3    withr_2.5.0        multcomp_1.4-19    bayestestR_0.12.1  hms_1.1.1          class_7.3-20      
+[120] coda_0.19-4        minqa_1.2.4        rmarkdown_2.14     carData_3.0-5      lubridate_1.8.0   
+ + + +
+
+

Saving environment

+ + + +
save.image(paste0(PROJECT_loc, "/",Today,".",PROJECTNAME,".AEDB.EM.baseline.RData"))
+ + + + +++ + + + + + +
© 1979-2022 Sander W. van der Laan | +s.w.vanderlaan[at]gmail.com | swvanderlaan.github.io.
+ +
+ +
---
title: "Baseline characteristics"
author: "[Sander W. van der Laan, PhD](https://swvanderlaan.github.io) | @swvanderlaan | s.w.vanderlaan@gmail.com"
date: "`r Sys.Date()`"
output:
  html_notebook:
    cache: yes
    code_folding: hide
    collapse: yes
    df_print: paged
    fig.align: center
    fig_caption: yes
    fig_height: 6
    fig_retina: 2
    fig_width: 7
    highlight: tango
    theme: lumen
    toc: yes
    toc_float:
      collapsed: no
      smooth_scroll: yes
mainfont: Arial
subtitle: Accompanying 'EntropyMasker'
editor_options:
  chunk_output_type: inline
# bibliography: references.bib
# knit: worcs::cite_all
---

# General Setup
We will clean the environment, setup the locations, define colors, and create a datestamp.

_Clean the environment._
```{r echo = FALSE}
rm(list = ls())
```

_Set locations and working directories..._
```{r LocalSystem, echo = FALSE}
source("scripts/local.system.R")

```

_... a package-installation function ..._
```{r Function: installations}
source("scripts/functions.R")

```


_... and load those packages._
```{r loading_packages, message=FALSE, warning=FALSE}
source("scripts/pack01.packages.R")


```

_We will create a datestamp and define the Utrecht Science Park Colour Scheme_.
```{r Setting: Colors}

Today = format(as.Date(as.POSIXlt(Sys.time())), "%Y%m%d")
Today.Report = format(as.Date(as.POSIXlt(Sys.time())), "%A, %B %d, %Y")

source("scripts/colors.R")

```

```{r global_options, include = FALSE}
# further define some knitr-options.
knitr::opts_chunk$set(fig.width = 12, fig.height = 8, fig.path = 'Figures/', 
                      wwarning = TRUE, # show warnings during codebook generation
  message = TRUE, # show messages during codebook generation
  error = TRUE, # do not interrupt codebook generation in case of errors,
                # usually better for debugging
  echo = TRUE,  # show R code
                      eval = TRUE)
ggplot2::theme_set(ggplot2::theme_minimal())
pander::panderOptions("table.split.table", Inf)
```

# This notebook 

In this notebook we create a baseline table of the samples used in **`EntropyMasker`**. 

# Athero-Express Biobank Study

The [*Athero-Express Biobank Study (AE)*](https://doi.org/10.1007/s10564-004-2304-6) contains plaque material of patients that underwent endarterectomyat two Dutch tertiary referral centers. Details of the study design were described before. Briefly, blood and plaque material were obtained during endarterectomy and stored at -80 ℃. All patients provided informed consent and the study was approved by the medical ethics committee.

## Load relevant samples

```{r}
EM_samples <- fread(paste0(ANALYSIS_loc, "/dataverse/EntropyMasker_image_files_used.txt"))
```

## Load data

Loading Athero-Express Biobank Study clinical and biobank data.

```{r LoadAEDB}
cat("* get Athero-Express Biobank Study Database...")
# METHOD 1: It seems this method gives loads of errors and warnings, which all are hard to comprehend
#           or debug. We expect 3,527 samples, and 927 variables; we get 927 variables!!!
# AEdata = as.data.table(read.spss(paste0(INP_loc,"/2017-1NEW_AtheroExpressDatabase_ScientificAE_20171306_v1.0.sav"),
#                                  trim.factor.names = TRUE, trim_values = TRUE, # we trim spaces in values
#                                  reencode = TRUE, # we re-encode to the local locale encoding
#                                  add.undeclared.levels = "append", # we do *not* want to convert to R-factors
#                                  use.value.labels = FALSE, # we do *not* convert variables with value labels into R factors
#                                  use.missings = TRUE, sub = "NA", # we will set every missing variable to NA
#                                  duplicated.value.labels = "condense", # we will condense duplicated value labels
#                                  to.data.frame = TRUE))
# AEdata.labels <- as.data.table(attr(AEdata, "variable.labels"))
# names(AEdata.labels) <- "Variable"

# METHOD 2: Using library("haven") importing seems flawless; best argument being:
#           we expect 3,527 samples and 888 variables, which is what you'd get with this method
#           So for now, METHOD 2 is prefered. 
#            
require(haven)

# AEDB <- haven::read_sav(paste0(AEDB_loc, "/2022_1_NEW_AtheroExpressDatabase_ScientificAE_15-02-2022.sav")) # something wrong with Age-variable
# AEDB <- haven::read_sav(paste0(AEDB_loc, "/2020_1_NEW_AtheroExpressDatabase_ScientificAE_30-09-2020.sav")) # duplicate studynumbers in it
AEDB <- haven::read_sav(paste0(AEDB_loc, "/2020_1_NEW_AtheroExpressDatabase_ScientificAE_16-03-2020.sav"))

# writing off the SPSS data to an Excel.
# fwrite(AEdata, file = paste0(INP_loc,"/2017-1NEW_AtheroExpressDatabase_ScientificAE_20171306_v1.0.values.xlsx"), 
#        sep = ";", na = "NA", dec = ".", col.names = TRUE, row.names = FALSE,
#        dateTimeAs = "ISO", showProgress = TRUE, verbose = TRUE)
# warnings()

AEDB[1:10, 1:10]
dim(AEDB)

```



<!-- ## Examine AEDB -->

<!-- We can examine the contents of the Athero-Express Biobank dataset to know what each variable is called, what class -->
<!-- (type) it has, and what the variable description is. -->

<!-- There is an excellent post on this: <https://www.r-bloggers.com/working-with-spss-labels-in-r/>. -->

<!-- ```{r AEDB: describe} -->
<!-- AEDB %>% sjPlot::view_df(show.type = TRUE, -->
<!--                          show.frq = TRUE, -->
<!--                          show.prc = TRUE, -->
<!--                          show.na = TRUE,  -->
<!--                          max.len = TRUE,  -->
<!--                          wrap.labels = 20, -->
<!--                          verbose = FALSE,  -->
<!--                          use.viewer = FALSE, -->
<!--                          file = paste0(OUT_loc, "/", Today, ".AEDB.dictionary.html"))  -->
<!-- ``` -->

## Fixing and creating variables

We have to fix certain clinical parameters:

-   symptoms
-   diabetes
-   alcohol use
-   smoking
-   plaque phenotypes

### Symptoms

We need to be very strict in defining *symptoms.* Therefore we will fix a new
variable that groups *symptoms* at inclusion.

Coding of *symptoms* is as follows:

-   missing -999
-   Asymptomatic 0
-   TIA 1
-   minor stroke 2
-   Major stroke 3
-   Amaurosis fugax 4
-   Four vessel disease 5
-   Vertebrobasilary TIA 7
-   Retinal infarction 8
-   Symptomatic, but aspecific symtoms 9
-   Contralateral symptomatic occlusion 10
-   retinal infarction 11
-   armclaudication due to occlusion subclavian artery, CEA needed for bypass
    12
-   retinal infarction + TIAs 13
-   Ocular ischemic syndrome 14
-   ischemisch glaucoom 15
-   subclavian steal syndrome 16
-   TGA 17

We will group as follows:

1.  Asymptomatic > 0
2.  TIA > 1, 7, 13
3.  Stroke > 2, 3
4.  Ocular > 4, 14, 15
5.  Retinal infarction > 8, 11
6.  Other > 5, 9, 10, 12, 16, 17

```{r FixSymptoms, message=FALSE, warning=FALSE}

# Fix symptoms

attach(AEDB)
AEDB[,"Symptoms.5G"] <- NA
AEDB$Symptoms.5G[sympt == 0] <- "Asymptomatic"
AEDB$Symptoms.5G[sympt == 1 | sympt == 7 | sympt == 13] <- "TIA"
AEDB$Symptoms.5G[sympt == 2 | sympt == 3] <- "Stroke"
AEDB$Symptoms.5G[sympt == 4 | sympt == 14 | sympt == 15 ] <- "Ocular"
AEDB$Symptoms.5G[sympt == 8 | sympt == 11] <- "Retinal infarction"
AEDB$Symptoms.5G[sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Other"


# AsymptSympt
AEDB[,"AsymptSympt"] <- NA
AEDB$AsymptSympt[sympt == -999] <- NA
AEDB$AsymptSympt[sympt == 0] <- "Asymptomatic"
AEDB$AsymptSympt[sympt == 1 | sympt == 7 | sympt == 13 | sympt == 2 | sympt == 3] <- "Symptomatic"
AEDB$AsymptSympt[sympt == 4 | sympt == 14 | sympt == 15 | sympt == 8 | sympt == 11 | sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Ocular and others"

# AsymptSympt
AEDB[,"AsymptSympt2G"] <- NA
AEDB$AsymptSympt2G[sympt == -999] <- NA
AEDB$AsymptSympt2G[sympt == 0] <- "Asymptomatic"
AEDB$AsymptSympt2G[sympt == 1 | sympt == 7 | sympt == 13 | sympt == 2 | sympt == 3 | sympt == 4 | sympt == 14 | sympt == 15 | sympt == 8 | sympt == 11 | sympt == 5 | sympt == 9 | sympt == 10 | sympt == 12 | sympt == 16 | sympt == 17] <- "Symptomatic"

detach(AEDB)

# table(AEDB$sympt, useNA = "ifany")
# table(AEDB$AsymptSympt2G, useNA = "ifany")
# table(AEDB$Symptoms.5G, useNA = "ifany")
# 
# table(AEDB$AsymptSympt2G, AEDB$sympt, useNA = "ifany")
# table(AEDB$Symptoms.5G, AEDB$sympt, useNA = "ifany")
table(AEDB$AsymptSympt2G, AEDB$Symptoms.5G, useNA = "ifany")

# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "sympt", "Symptoms.5G", "AsymptSympt"))
# require(labelled)
# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
# 
# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
# 
# table(AEDB.temp$Symptoms.5G, AEDB.temp$AsymptSympt)
# 
# rm(AEDB.temp)
```

### Re-assessed symptoms

We re-assessed the categorization of symptoms. These are summarized and parsed
in this section.

Labeling of new symptom categories.

```{r message=FALSE, warning=FALSE, paged.print=TRUE}

AEDB$indexsymptoms_worst
AEDB$indexsymptoms_worst_4g
AEDB$indexsymptoms_latest
AEDB$indexsymptoms_latest_4g

```

Getting counts for each of the most important categories.

```{r}
cat("New 'worst' vs 'latest' symptom categories.\n")
table(as_factor(AEDB$indexsymptoms_worst_4g), as_factor(AEDB$indexsymptoms_latest_4g))

cat("\nNew 'worst' symptom categories.\n")
table((AEDB$indexsymptoms_worst_4g))

cat("\nNew 'latest' symptom categories.\n")
table(as_factor(AEDB$indexsymptoms_latest_4g))
```

Comparing with the original symptom categories.

```{r}
cat("New 'latest' vs original symptom 2G categories.\n")
table((AEDB$indexsymptoms_latest_4g), AEDB$AsymptSympt2G)

cat("\nNew 'latest' vs original symptom 5G categories.\n")
table((AEDB$indexsymptoms_latest_4g), AEDB$Symptoms.5G)
   
```

We need to be very strict in defining *symptoms.* Therefore we will fix a new
variable that groups *symptoms* at inclusion.

Coding of *symptoms* is as follows:

-   asympt 0\
-   ocular 1\
-   TIA 2\
-   stroke 3\
-   unclear 9

We will group as follows:

1.  Asymptomatic > 0
2.  Symptomatic > 1, 2, 3
3.  NA > 9

```{r FixNewSymptoms}

# Fix symptoms
attach(AEDB)

# Symptoms.Update2G
AEDB[,"Symptoms.Update2G"] <- NA
AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 0] <- "Asymptomatic"
AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 1 | indexsymptoms_latest_4g == 2 | indexsymptoms_latest_4g == 3] <- "Symptomatic"
AEDB$Symptoms.Update2G[indexsymptoms_latest_4g == 9 ] <- NA

# Symptoms.Update3G
AEDB[,"Symptoms.Update3G"] <- NA
AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 0] <- "Asymptomatic"
AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 1 | indexsymptoms_latest_4g == 2 | indexsymptoms_latest_4g == 3] <- "Symptomatic"
AEDB$Symptoms.Update3G[indexsymptoms_latest_4g == 9 ] <- "Unclear"

detach(AEDB)

table(AEDB$Symptoms.Update2G, AEDB$Symptoms.5G, useNA = "ifany")
table(AEDB$Symptoms.Update3G, AEDB$Symptoms.5G, useNA = "ifany")

```

### Other clinical characteristics

We will also fix the *diabetes* status variable.

```{r FixDiabetes, message=FALSE, warning=FALSE}

# Fix diabetes
attach(AEDB)
AEDB[,"DiabetesStatus"] <- NA
AEDB$DiabetesStatus[DM.composite == -999] <- NA
AEDB$DiabetesStatus[DM.composite == 0] <- "Control (no Diabetes Dx/Med)"
AEDB$DiabetesStatus[DM.composite == 1] <- "Diabetes"
detach(AEDB)

table(AEDB$DM.composite, AEDB$DiabetesStatus)
# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "DM.composite", "DiabetesStatus"))
# require(labelled)
# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
# AEDB.temp$DiabetesStatus <- to_factor(AEDB.temp$DiabetesStatus)
# 
# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
# 
# rm(AEDB.temp)

```

We will also fix the *smoking* status variable. We are interested in whether
someone never, ever or is currently (at the time of inclusion) smoking. This is
based on the questionnaire.

-   `diet801`: are you a smoker?
-   `diet802`: did you smoke in the past?

We already have some variables indicating smoking status:

-   `SmokingReported`: patient has reported to smoke.
-   `SmokingYearOR`: smoking in the year of surgery?
-   `SmokerCurrent`: currently smoking?

```{r FixSmoking, message=FALSE, warning=FALSE}
require(labelled)
AEDB$diet801 <- to_factor(AEDB$diet801)
AEDB$diet802 <- to_factor(AEDB$diet802)
AEDB$diet805 <- to_factor(AEDB$diet805)
AEDB$SmokingReported <- to_factor(AEDB$SmokingReported)
AEDB$SmokerCurrent <- to_factor(AEDB$SmokerCurrent)
AEDB$SmokingYearOR <- to_factor(AEDB$SmokingYearOR)

# table(AEDB$diet801)
# table(AEDB$diet802)
# table(AEDB$SmokingReported)
# table(AEDB$SmokerCurrent)
# table(AEDB$SmokingYearOR)
# table(AEDB$SmokingReported, AEDB$SmokerCurrent, useNA = "ifany", dnn = c("Reported smoking", "Current smoker"))
# 
# table(AEDB$diet801, AEDB$diet802, useNA = "ifany", dnn = c("Smoker", "Past smoker"))

cat("\nFixing smoking status.\n")
attach(AEDB)
AEDB[,"SmokerStatus"] <- NA
AEDB$SmokerStatus[diet802 == "don't know"] <- "Never smoked"
AEDB$SmokerStatus[diet802 == "I still smoke"] <- "Current smoker"
AEDB$SmokerStatus[SmokerCurrent == "no" & diet802 == "no"] <- "Never smoked"
AEDB$SmokerStatus[SmokerCurrent == "no" & diet802 == "yes"] <- "Ex-smoker"
AEDB$SmokerStatus[SmokerCurrent == "yes"] <- "Current smoker"
AEDB$SmokerStatus[SmokerCurrent == "no data available/missing"] <- NA
# AEDB$SmokerStatus[is.na(SmokerCurrent)] <- "Never smoked"
detach(AEDB)

cat("\n* Current smoking status.\n")
table(AEDB$SmokerCurrent,
      useNA = "ifany", 
      dnn = c("Current smoker"))

cat("\n* Updated smoking status.\n")
table(AEDB$SmokerStatus,
      useNA = "ifany", 
      dnn = c("Updated smoking status"))

cat("\n* Comparing to 'SmokerCurrent'.\n")
table(AEDB$SmokerStatus, AEDB$SmokerCurrent, 
      useNA = "ifany", 
      dnn = c("Updated smoking status", "Current smoker"))

# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "DM.composite", "DiabetesStatus"))
# require(labelled)
# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
# AEDB.temp$DiabetesStatus <- to_factor(AEDB.temp$DiabetesStatus)
# 
# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
# 
# rm(AEDB.temp)


```

We will also fix the *alcohol* status variable.

```{r FixAlcohol, message=FALSE, warning=FALSE}

# Fix diabetes
attach(AEDB)
AEDB[,"AlcoholUse"] <- NA
AEDB$AlcoholUse[diet810 == -999] <- NA
AEDB$AlcoholUse[diet810 == 0] <- "No"
AEDB$AlcoholUse[diet810 == 1] <- "Yes"
detach(AEDB)

# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "diet810", "AlcoholUse"))
# require(labelled)
# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
# AEDB.temp$AlcoholUse <- to_factor(AEDB.temp$AlcoholUse)
# 
# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
# 
# rm(AEDB.temp)


```

We will also fix a history of CAD, stroke or peripheral intervention status variable. This will be based on `CAD_history`, `Stroke_history`, and `Peripheral.interv`

```{r FixCAD_History, message=FALSE, warning=FALSE}

# Fix diabetes
attach(AEDB)
AEDB[,"MedHx_CVD"] <- NA
AEDB$MedHx_CVD[CAD_history == 0 | Stroke_history == 0 | Peripheral.interv == 0] <- "No"
AEDB$MedHx_CVD[CAD_history == 1 | Stroke_history == 1 | Peripheral.interv == 1] <- "yes"
detach(AEDB)

table(AEDB$CAD_history)
table(AEDB$Stroke_history)
table(AEDB$Peripheral.interv)
table(AEDB$MedHx_CVD)

# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "diet810", "AlcoholUse"))
# require(labelled)
# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
# AEDB.temp$AlcoholUse <- to_factor(AEDB.temp$AlcoholUse)
# 
# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
# 
# rm(AEDB.temp)


```

### Plaque phenotypes

We will also fix the *plaquephenotypes* variable.

Coding of symptoms is as follows:

-   missing -999\
-   not relevant -888
-   fibrous 1\
-   fibroatheromatous 2\
-   atheromatous 3

```{r FixPlaquePhenotypes, message=FALSE, warning=FALSE}

# Fix plaquephenotypes
attach(AEDB)
AEDB[,"OverallPlaquePhenotype"] <- NA
AEDB$OverallPlaquePhenotype[plaquephenotype == -999] <- NA
AEDB$OverallPlaquePhenotype[plaquephenotype == -999] <- NA
AEDB$OverallPlaquePhenotype[plaquephenotype == 1] <- "fibrous"
AEDB$OverallPlaquePhenotype[plaquephenotype == 2] <- "fibroatheromatous"
AEDB$OverallPlaquePhenotype[plaquephenotype == 3] <- "atheromatous"
detach(AEDB)

# AEDB.temp <- subset(AEDB,  select = c("STUDY_NUMBER", "UPID", "Age", "Gender", "Hospital", "Artery_summary", "plaquephenotype", "OverallPlaquePhenotype"))
# require(labelled)
# AEDB.temp$Gender <- to_factor(AEDB.temp$Gender)
# AEDB.temp$Hospital <- to_factor(AEDB.temp$Hospital)
# AEDB.temp$Artery_summary <- to_factor(AEDB.temp$Artery_summary)
# 
# DT::datatable(AEDB.temp[1:10,], caption = "Excerpt of the whole AEDB.", rownames = FALSE)
# 
# rm(AEDB.temp)

```

We will also fix and inverse-rank normal transform the continuous (manually)
scored plaque phenotypes.

```{r IRNT PlaquePhenotypes}
AEDB$macmean0 <- as.numeric(AEDB$macmean0)
AEDB$smcmean0 <- as.numeric(AEDB$smcmean0)
AEDB$neutrophils <- as.numeric(AEDB$neutrophils)
AEDB$Mast_cells_plaque <- as.numeric(AEDB$Mast_cells_plaque)
AEDB$vessel_density_averaged <- as.numeric(AEDB$vessel_density_averaged)

AEDB$MAC_rankNorm <- qnorm((rank(AEDB$macmean0, na.last = "keep") - 0.5) / sum(!is.na(AEDB$macmean0)))
AEDB$SMC_rankNorm <- qnorm((rank(AEDB$smcmean0, na.last = "keep") - 0.5) / sum(!is.na(AEDB$smcmean0)))
AEDB$Neutrophils_rankNorm <- qnorm((rank(AEDB$neutrophils, na.last = "keep") - 0.5) / sum(!is.na(AEDB$neutrophils)))
AEDB$MastCells_rankNorm <- qnorm((rank(AEDB$Mast_cells_plaque, na.last = "keep") - 0.5) / sum(!is.na(AEDB$Mast_cells_plaque)))
AEDB$VesselDensity_rankNorm <- qnorm((rank(AEDB$vessel_density_averaged, na.last = "keep") - 0.5) / sum(!is.na(AEDB$vessel_density_averaged)))

```

```{r IRNT PlaquePhenotypes: Visualisation}
library(labelled)
AEDB$Gender <- to_factor(AEDB$Gender)
library(patchwork)

p1 <- ggpubr::gghistogram(AEDB, "macmean0", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "% of macrophages (CD68)",
                    xlab = "% per region of interest", 
                    ggtheme = theme_minimal())

p2 <- ggpubr::gghistogram(AEDB, "MAC_rankNorm", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "% of macrophages (CD68)",
                   xlab = "% per region of interest\ninverse-rank normalized number", 
                    ggtheme = theme_minimal())

p1 | p2 

p1 <- ggpubr::gghistogram(AEDB, "smcmean0", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "% of smooth muscle cells (SMA)",
                    xlab = "% per region of interest", 
                    ggtheme = theme_minimal())

p2 <- ggpubr::gghistogram(AEDB, "SMC_rankNorm", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "% of smooth muscle cells (SMA)",
                   xlab = "% per region of interest\ninverse-rank normalized number", 
                    ggtheme = theme_minimal())

p1 | p2 


p1 <- ggpubr::gghistogram(AEDB, "neutrophils", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "number of neutrophils (CD66b)",
                    xlab = "counts per plaque", 
                    ggtheme = theme_minimal())

p2 <- ggpubr::gghistogram(AEDB, "Neutrophils_rankNorm", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "number of neutrophils (CD66b)",
                   xlab = "counts per plaque\ninverse-rank normalized number", 
                    ggtheme = theme_minimal())

p1 | p2 


p1 <- ggpubr::gghistogram(AEDB, "Mast_cells_plaque", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "number of mast cells",
                    xlab = "counts per plaque", 
                    ggtheme = theme_minimal())

p2 <- ggpubr::gghistogram(AEDB, "MastCells_rankNorm", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "number of mast cells",
                   xlab = "counts per plaque\ninverse-rank normalized number", 
                    ggtheme = theme_minimal())

p1 | p2 


p1 <- ggpubr::gghistogram(AEDB, "vessel_density_averaged", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "number of intraplaque neovessels",
                    xlab = "counts per 3-4 hotspots", 
                    ggtheme = theme_minimal())

p2 <- ggpubr::gghistogram(AEDB, "VesselDensity_rankNorm", 
                    # y = "..count..", 
                    color = "white",
                    fill = "Gender",
                    palette = c("#1290D9", "#DB003F"), 
                    add = "median", 
                    #add_density = TRUE,
                    rug = TRUE,
                    #add.params =  list(color = "black", linetype = 2), 
                    title = "number of intraplaque neovessels",
                   xlab = "counts per 3-4 hotspots\ninverse-rank normalized number", 
                    ggtheme = theme_minimal())

p1 | p2 

rm(p1, p2)
```

Here we calculate the *plaque instability/vulnerability* index

```{r Plaque Vulnerability}
# Plaque vulnerability
require(labelled)
AEDB$Macrophages.bin <- to_factor(AEDB$Macrophages.bin)
AEDB$SMC.bin <- to_factor(AEDB$SMC.bin)
AEDB$IPH.bin <- to_factor(AEDB$IPH.bin)
AEDB$Calc.bin <- to_factor(AEDB$Calc.bin)
AEDB$Collagen.bin <- to_factor(AEDB$Collagen.bin)
AEDB$Fat.bin_10 <- to_factor(AEDB$Fat.bin_10)
AEDB$Fat.bin_40 <- to_factor(AEDB$Fat.bin_40)

table(AEDB$Macrophages.bin)
table(AEDB$Fat.bin_10)
table(AEDB$Collagen.bin)
table(AEDB$SMC.bin)
table(AEDB$IPH.bin)

# SPSS code

# 
# *** syntax- Plaque vulnerability**.
# COMPUTE Macro_instab = -999.
# IF macrophages.bin=2 Macro_instab=1.
# IF macrophages.bin=1 Macro_instab=0.
# EXECUTE.
# 
# COMPUTE Fat10_instab = -999.
# IF Fat.bin_10=2 Fat10_instab=1.
# IF Fat.bin_10=1 Fat10_instab=0.
# EXECUTE.
# 
# COMPUTE coll_instab=-999.
# IF Collagen.bin=2 coll_instab=0.
# IF Collagen.bin=1 coll_instab=1.
# EXECUTE.
# 
# 
# COMPUTE SMC_instab=-999.
# IF SMC.bin=2 SMC_instab=0.
# IF SMC.bin=1 SMC_instab=1.
# EXECUTE.
# 
# COMPUTE IPH_instab=-999.
# IF IPH.bin=0 IPH_instab=0.
# IF IPH.bin=1 IPH_instab=1.
# EXECUTE.
# 
# COMPUTE Instability=Macro_instab + Fat10_instab +  coll_instab + SMC_instab + IPH_instab.
# EXECUTE.

# Fix plaquephenotypes
attach(AEDB)
# mac instability
AEDB[,"MAC_Instability"] <- NA
AEDB$MAC_Instability[Macrophages.bin == -999] <- NA
AEDB$MAC_Instability[Macrophages.bin == "no/minor"] <- 0
AEDB$MAC_Instability[Macrophages.bin == "moderate/heavy"] <- 1

# fat instability
AEDB[,"FAT10_Instability"] <- NA
AEDB$FAT10_Instability[Fat.bin_10 == -999] <- NA
AEDB$FAT10_Instability[Fat.bin_10 == " <10%"] <- 0
AEDB$FAT10_Instability[Fat.bin_10 == " >10%"] <- 1

# col instability 
AEDB[,"COL_Instability"] <- NA
AEDB$COL_Instability[Collagen.bin == -999] <- NA
AEDB$COL_Instability[Collagen.bin == "no/minor"] <- 1
AEDB$COL_Instability[Collagen.bin == "moderate/heavy"] <- 0

# smc instability
AEDB[,"SMC_Instability"] <- NA
AEDB$SMC_Instability[SMC.bin == -999] <- NA
AEDB$SMC_Instability[SMC.bin == "no/minor"] <- 1
AEDB$SMC_Instability[SMC.bin == "moderate/heavy"] <- 0

# iph instability
AEDB[,"IPH_Instability"] <- NA
AEDB$IPH_Instability[IPH.bin == -999] <- NA
AEDB$IPH_Instability[IPH.bin == "no"] <- 0
AEDB$IPH_Instability[IPH.bin == "yes"] <- 1

detach(AEDB)

table(AEDB$MAC_Instability, useNA = "ifany")
table(AEDB$FAT10_Instability, useNA = "ifany")
table(AEDB$COL_Instability, useNA = "ifany")
table(AEDB$SMC_Instability, useNA = "ifany")
table(AEDB$IPH_Instability, useNA = "ifany")

# creating vulnerability index
AEDB <- AEDB %>% mutate(Plaque_Vulnerability_Index = factor(rowSums(.[grep("_Instability", names(.))], na.rm = TRUE)),
                                )

table(AEDB$Plaque_Vulnerability_Index, useNA = "ifany")

# str(AEDB$Plaque_Vulnerability_Index)

```

## Prepare baseline summary

We are interested in the following variables at baseline in the whole cohort.

-   Age (years)
-   Female sex (N, %)
-   Artery type (N, %)
-   Hospital (N, %)
<!-- -   Hypertension (N, %) -->
<!-- -   SBP (mmHg) -->
<!-- -   DBP (mmHg) -->
<!-- -   Diabetes mellitus (N, %) -->
<!-- -   Total cholesterol levels (mg/dL) -->
<!-- -   LDL cholesterol levels (mg/dL) -->
<!-- -   HDL cholesterol levels (mg/dL) -->
<!-- -   Triglyceride levels (mg/dL) -->
<!-- -   Use of statins (N, %) -->
<!-- -   Use of antiplatelet drugs (N, %) -->
<!-- -   BMI (kg/m²) -->
<!-- -   Smoking status (N, %) -->
<!--     -   Never smokers -->
<!--     -   Ex-smokers -->
<!--     -   Current smokers -->
<!-- -   History of CAD (N, %) -->
<!-- -   History of PAD (N, %) -->
<!-- -   Clinical manifestations -->
<!--     -   Asymptomatic -->
<!--     -   Amaurosis fugax -->
<!--     -   TIA -->
<!--     -   Stroke -->
<!-- -   eGFR (mL/min/1.73 m²) -->
<!-- -   stenosis -->
<!-- -   year of surgery -->
<!-- -   plaque characteristics -->

```{r Baseline AEDB: preparation}
cat("====================================================================================================\n")
cat("SELECTION THE SHIZZLE\n")

### Artery levels
# AEdata$Artery_summary: 
#           value                                                                                   label
# NOT USE - 0 No artery known (yet), no surgery (patient ill, died, exited study), re-numbered to AAA
# USE - 1                                                                  carotid (left & right)
# USE - 2                                               femoral/iliac (left, right or both sides)
# NOT USE - 3                                               other carotid arteries (common, external)
# NOT USE - 4                                   carotid bypass and injury (left, right or both sides)
# NOT USE - 5                                                         aneurysmata (carotid & femoral)
# NOT USE - 6                                                                                   aorta
# NOT USE - 7                                            other arteries (renal, popliteal, vertebral)
# NOT USE - 8                        femoral bypass, angioseal and injury (left, right or both sides)

### AEdata$informedconsent
#           value                                                                                           label
# NOT USE - -999                                                                                         missing
# NOT USE - 0                                                                                        no, died
# USE - 1                                                                                             yes
# USE - 2                                                             yes, health treatment when possible
# USE - 3                                                                        yes, no health treatment
# USE - 4                                                yes, no health treatment, no commercial business
# NOT USE - 5                                                          yes, no tissue, no commerical business
# NOT USE - 6                      yes, no tissue, no questionnaires, no medical info, no commercial business
# USE - 7                             yes, no questionnaires, no health treatment, no commercial business
# USE - 8                                          yes, no questionnaires, health treatment when possible
# NOT USE - 9                  yes, no tissue, no questionnaires, no health treatment, no commerical business
# USE - 10                               yes, no health treatment, no medical info, no commercial business
# NOT USE - 11 yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business
# USE - 12                                                     yes, no questionnaires, no health treatment
# NOT USE - 13                                                             yes, no tissue, no health treatment
# NOT USE - 14                                                               yes, no tissue, no questionnaires
# NOT USE - 15                                                  yes, no tissue, health treatment when possible
# NOT USE - 16                                                                                  yes, no tissue
# USE - 17                                                                     yes, no commerical business
# USE - 18                                     yes, health treatment when possible, no commercial business
# USE - 19                                                    yes, no medical info, no commercial business
# USE - 20                                                                          yes, no questionnaires
# NOT USE - 21                         yes, no tissue, no questionnaires, no health treatment, no medical info
# NOT USE - 22                  yes, no tissue, no questionnaires, no health treatment, no commercial business
# USE - 23                                                                            yes, no medical info
# USE - 24                                                  yes, no questionnaires, no commercial business
# USE - 25                                    yes, no questionnaires, no health treatment, no medical info
# USE - 26                  yes, no questionnaires, health treatment when possible, no commercial business
# USE - 27                                                      yes,  no health treatment, no medical info
# NOT USE - 28                                                                             no, doesn't want to
# NOT USE - 29                                                                              no, unable to sign
# NOT USE - 30                                                                                 no, no reaction
# NOT USE - 31                                                                                        no, lost
# NOT USE - 32                                                                                     no, too old
# NOT USE - 34                                            yes, no medical info, health treatment when possible
# NOT USE - 35                                             no (never asked for IC because there was no tissue)
# USE - 36                    yes, no medical info, no commercial business, health treatment when possible
# NOT USE - 37                                                                                    no, endpoint
# USE - 38                                                         wil niets invullen, wel alles gebruiken
# USE - 39                                           second informed concents: yes, no commercial business
# NOT USE - 40                                                                              nooit geincludeerd

cat("- sanity checking PRIOR to selection")
library(data.table)
require(labelled)
ae.gender <- to_factor(AEDB$Gender)
ae.hospital <- to_factor(AEDB$Hospital)
table(ae.gender, ae.hospital, dnn = c("Sex", "Hospital"))
ae.artery <- to_factor(AEDB$Artery_summary)
table(ae.artery, ae.gender, dnn = c("Sex", "Artery"))

rm(ae.gender, ae.hospital, ae.artery)

# I change numeric and factors manually because, well, I wouldn't know how to fix it otherwise
# to have this 'tibble' work with 'tableone'... :-)

AEDB$Age <- as.numeric(AEDB$Age)
AEDB$diastoli <- as.numeric(AEDB$diastoli)
AEDB$systolic <- as.numeric(AEDB$systolic)

AEDB$TC_finalCU <- as.numeric(AEDB$TC_finalCU)
AEDB$LDL_finalCU <- as.numeric(AEDB$LDL_finalCU)
AEDB$HDL_finalCU <- as.numeric(AEDB$HDL_finalCU)
AEDB$TG_finalCU <- as.numeric(AEDB$TG_finalCU)

AEDB$TC_final <- as.numeric(AEDB$TC_final)
AEDB$LDL_final <- as.numeric(AEDB$LDL_final)
AEDB$HDL_final <- as.numeric(AEDB$HDL_final)
AEDB$TG_final <- as.numeric(AEDB$TG_final)

AEDB$Age <- as.numeric(AEDB$Age)
AEDB$GFR_MDRD <- as.numeric(AEDB$GFR_MDRD)
AEDB$BMI <- as.numeric(AEDB$BMI)
AEDB$eCigarettes <- as.numeric(AEDB$eCigarettes)
AEDB$ePackYearsSmoking <- as.numeric(AEDB$ePackYearsSmoking)
AEDB$EP_composite_time <- as.numeric(AEDB$EP_composite_time)
AEDB$EP_major_time <- as.numeric(AEDB$EP_major_time)

require(labelled)
AEDB$Artery_summary <- to_factor(AEDB$Artery_summary)
AEDB$ORyear <- to_factor(AEDB$ORyear)
AEDB$Gender <- to_factor(AEDB$Gender)
AEDB$Hospital <- to_factor(AEDB$Hospital)
AEDB$KDOQI <- to_factor(AEDB$KDOQI)
AEDB$BMI_WHO <- to_factor(AEDB$BMI_WHO)
AEDB$DiabetesStatus <- to_factor(AEDB$DiabetesStatus)
AEDB$SmokerStatus <- to_factor(AEDB$SmokerStatus)
AEDB$AlcoholUse <- to_factor(AEDB$AlcoholUse)

AEDB$Hypertension.selfreport <- to_factor(AEDB$Hypertension1)
AEDB$Hypertension.selfreportdrug <- to_factor(AEDB$Hypertension2)
AEDB$Hypertension.composite <- to_factor(AEDB$Hypertension.composite)
AEDB$Hypertension.drugs <- to_factor(AEDB$Hypertension.drugs)

AEDB$Med.anticoagulants <- to_factor(AEDB$Med.anticoagulants)
AEDB$Med.all.antiplatelet <- to_factor(AEDB$Med.all.antiplatelet)
AEDB$Med.Statin.LLD <- to_factor(AEDB$Med.Statin.LLD)

AEDB$Stroke_Dx <- to_factor(AEDB$Stroke_Dx)
AEDB$CAD_history <- to_factor(AEDB$CAD_history)
AEDB$PAOD <- to_factor(AEDB$PAOD)
AEDB$Peripheral.interv <- to_factor(AEDB$Peripheral.interv)

AEDB$sympt <- to_factor(AEDB$sympt)
AEDB$Symptoms.3g <- to_factor(AEDB$Symptoms.3g)
AEDB$Symptoms.4g <- to_factor(AEDB$Symptoms.4g)
AEDB$Symptoms.5G <- to_factor(AEDB$Symptoms.5G)
AEDB$AsymptSympt <- to_factor(AEDB$AsymptSympt)
AEDB$AsymptSympt2G <- to_factor(AEDB$AsymptSympt2G)
AEDB$Symptoms.Update2G <- to_factor(AEDB$Symptoms.Update2G)
AEDB$Symptoms.Update3G <- to_factor(AEDB$Symptoms.Update3G)

AEDB$restenos <- to_factor(AEDB$restenos)
AEDB$stenose <- to_factor(AEDB$stenose)
AEDB$EP_composite <- to_factor(AEDB$EP_composite)
AEDB$EP_major <- to_factor(AEDB$EP_major)
AEDB$Macrophages.bin <- to_factor(AEDB$Macrophages.bin)
AEDB$SMC.bin <- to_factor(AEDB$SMC.bin)
AEDB$IPH.bin <- to_factor(AEDB$IPH.bin)
AEDB$Calc.bin <- to_factor(AEDB$Calc.bin)
AEDB$Collagen.bin <- to_factor(AEDB$Collagen.bin)
AEDB$Fat.bin_10 <- to_factor(AEDB$Fat.bin_10)
AEDB$Fat.bin_40 <- to_factor(AEDB$Fat.bin_40)
AEDB$OverallPlaquePhenotype <- to_factor(AEDB$OverallPlaquePhenotype)
AEDB$Plaque_Vulnerability_Index <- to_factor(AEDB$Plaque_Vulnerability_Index)

AEDB$Artery_summary <- to_factor(AEDB$Artery_summary)

AEDB$informedconsent <- to_factor(AEDB$informedconsent)

AEDB.full <- subset(AEDB,
                    informedconsent != "missing" & # we are really strict in selecting based on 'informed consent'!
                       informedconsent != "no, died" & 
                       informedconsent != "yes, no tissue, no commerical business" &
                       informedconsent != "yes, no tissue, no questionnaires, no medical info, no commercial business" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commerical business" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business" &
                       informedconsent != "yes, no tissue, no health treatment" &
                       informedconsent != "yes, no tissue, no questionnaires" &
                       informedconsent != "yes, no tissue, health treatment when possible" &
                       informedconsent != "yes, no tissue" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commercial business" &
                       informedconsent != "no, doesn't want to" &
                       informedconsent != "no, unable to sign" & 
                       informedconsent != "no, no reaction" & 
                       informedconsent != "no, lost" & 
                       informedconsent != "no, too old" & 
                       informedconsent != "yes, no medical info, health treatment when possible" &
                       informedconsent != "no (never asked for IC because there was no tissue)" &
                       informedconsent != "no, endpoint" & 
                       informedconsent != "nooit geincludeerd")
# AEDB.CEA[1:10, 1:10]
dim(AEDB.full)

```

```{r Baseline AEDB: creation}
cat("===========================================================================================\n")
cat("CREATE BASELINE TABLE\n")

# Baseline table variables
basetable_vars = c("Hospital", 
                   "Artery_summary",
                   "Age", "Gender")
                   # "ORyear", 
                   # "TC_finalCU", "LDL_finalCU", "HDL_finalCU", "TG_finalCU", 
                   # "TC_final", "LDL_final", "HDL_final", "TG_final", 
                   # "hsCRP_plasma",
                   # "systolic", "diastoli", "GFR_MDRD", "BMI", 
                   # "KDOQI", "BMI_WHO",
                   # "SmokerStatus", "AlcoholUse",
                   # "DiabetesStatus", 
                   # "Hypertension.selfreport", "Hypertension.selfreportdrug", "Hypertension.composite", "Hypertension.drugs", 
                   # "Med.anticoagulants", "Med.all.antiplatelet", "Med.Statin.LLD", 
                   # "Stroke_Dx", "sympt", "Symptoms.5G", "AsymptSympt", "AsymptSympt2G",
                   # "Symptoms.Update2G", 
                   # "Symptoms.Update3G",
                   # "restenos", "stenose",
                   # "CAD_history", "PAOD", "Peripheral.interv", 
                   # "EP_composite", "EP_composite_time", "EP_major", "EP_major_time",
                   # "MAC_rankNorm", "SMC_rankNorm", "Macrophages.bin", "SMC.bin",
                   # "Neutrophils_rankNorm", "MastCells_rankNorm",
                   # "IPH.bin", "VesselDensity_rankNorm",
                   # "Calc.bin", "Collagen.bin", 
                   # "Fat.bin_10", "Fat.bin_40", 
                   # "OverallPlaquePhenotype", "Plaque_Vulnerability_Index")

basetable_bin = c("Hospital", 
                  "Artery_summary",
                  "Gender")
# basetable_bin

basetable_con = basetable_vars[!basetable_vars %in% basetable_bin]
# basetable_con
```

# Athero-Express Biobank Study Baseline Characteristics

Showing the baseline table of the whole Athero-Express Biobank.

```{r Baseline AEDB: Visualize AEDB}
# Create baseline tables
# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html
AEDB.tableOne = print(CreateTableOne(vars = basetable_vars, 
                                         factorVars = basetable_bin,
                                         # strata = "Symptoms.4g",
                                         data = AEDB.full, includeNA = TRUE), 
                          nonnormal = c(), missing = TRUE,
                          quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, 
                          format = "pf", 
                          contDigits = 3)[,1:3]
```


## Match samples used

Here we match the full database with the samples used in **`EntropyMasker`**. 

```{r}
# Remove duplicate rows of the dataframe
library(dplyr)
temp <- EM_samples %>% select(., "Studynumber") %>%
  distinct(.)

AEDB_EM <- merge(temp,
                 AEDB,
                 by.x = "Studynumber",
                 by.y = "STUDY_NUMBER", 
                 sort = FALSE)

AEDB_EM.full <- subset(AEDB_EM,
                    informedconsent != "missing" & # we are really strict in selecting based on 'informed consent'!
                       informedconsent != "no, died" & 
                       informedconsent != "yes, no tissue, no commerical business" &
                       informedconsent != "yes, no tissue, no questionnaires, no medical info, no commercial business" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commerical business" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info, no commercial business" &
                       informedconsent != "yes, no tissue, no health treatment" &
                       informedconsent != "yes, no tissue, no questionnaires" &
                       informedconsent != "yes, no tissue, health treatment when possible" &
                       informedconsent != "yes, no tissue" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no medical info" &
                       informedconsent != "yes, no tissue, no questionnaires, no health treatment, no commercial business" &
                       informedconsent != "no, doesn't want to" &
                       informedconsent != "no, unable to sign" & 
                       informedconsent != "no, no reaction" & 
                       informedconsent != "no, lost" & 
                       informedconsent != "no, too old" & 
                       informedconsent != "yes, no medical info, health treatment when possible" &
                       informedconsent != "no (never asked for IC because there was no tissue)" &
                       informedconsent != "no, endpoint" & 
                       informedconsent != "nooit geincludeerd")
# AEDB_EM.full[1:10, 1:10]

rm(temp)
```



```{r Baseline AEDB: Visualize AEDB EM FULL}
# Create baseline tables
# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html
AEDB_EM.full.tableOne = print(CreateTableOne(vars = basetable_vars, 
                                         factorVars = basetable_bin,
                                         # strata = "Symptoms.4g",
                                         data = AEDB_EM.full, includeNA = TRUE), 
                          nonnormal = c(), missing = TRUE,
                          quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, 
                          format = "pf", 
                          contDigits = 3)[,1:3]
```

```{r Baseline AEDB: Visualize AEDB EM}

basetable_vars = c("Hospital", 
                   "Artery_summary")

basetable_bin = c("Hospital", 
                  "Artery_summary")

# Create baseline tables
# http://rstudio-pubs-static.s3.amazonaws.com/13321_da314633db924dc78986a850813a50d5.html
AEDB_EM.tableOne = print(CreateTableOne(vars = basetable_vars, 
                                         factorVars = basetable_bin,
                                         # strata = "Symptoms.4g",
                                         data = AEDB_EM, includeNA = TRUE), 
                          nonnormal = c(), missing = TRUE,
                          quote = FALSE, noSpaces = FALSE, showAllLevels = TRUE, explain = TRUE, 
                          format = "pf", 
                          contDigits = 3)[,1:3]
```

## Baseline writing

Let's save the baseline characteristics of the Athero-Express Biobank Study.

```{r Baseline SampleSelection: write}
# Write basetable

require(openxlsx)

write.xlsx(as.data.frame(AEDB.tableOne), 
           file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.BaselineTable.xlsx"), 
           rowNames = TRUE, 
           colNames = TRUE, 
           sheetName = "AE_Base", overwrite = TRUE)

write.xlsx(as.data.frame(AEDB_EM.tableOne), 
           file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.EM.59.BaselineTable.xlsx"), 
           rowNames = TRUE, 
           colNames = TRUE, 
           sheetName = "AE_Base_EM_59", overwrite = TRUE)

write.xlsx(as.data.frame(AEDB_EM.full.tableOne), 
           file = paste0(BASELINE_loc, "/",Today,".",PROJECTNAME,".AE.EM.56.BaselineTable.xlsx"), 
           rowNames = TRUE, 
           colNames = TRUE, 
           sheetName = "AE_Base_EM_56", overwrite = TRUE)

```

We will also write the newly prepared AEDB selected for this study which we can use in downstream analyses. 

```{r}
saveRDS(AEDB_EM.full, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.EM.FULL.RDS"))
saveRDS(AEDB.full, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.FULL.RDS"))
saveRDS(AEDB, file = paste0(OUT_loc, "/",Today,".",PROJECTNAME,".AEDB.raw.RDS"))

```


# Session information

------------------------------------------------------------------------------------------------------------------------

    Version:      v1.0.2
    Last update:  2022-07-12
    Written by:   Sander W. van der Laan (s.w.vanderlaan-2[at]umcutrecht.nl).
    Description:  Script to get some Athero-Express Biobank Study baseline characteristics.
    Minimum requirements: R version 3.4.3 (2017-06-30) -- 'Single Candle', Mac OS X El Capitan

    **MoSCoW To-Do List**
    The things we Must, Should, Could, and Would have given the time we have.
    _M_

    _S_

    _C_

    _W_

    **Changes log**
    * v1.0.2 Simplified the initial script. It now outputs the relevant R-objects (as .RDS).
    * v1.0.1 Update to main AEDB (there is an error in the Age-variable in the new version).
    * v1.0.0 Initial version. Add 'plaque vulnerability index', Fixed baseline table, added codes, and results. Major update to WORCS system.

------------------------------------------------------------------------------------------------------------------------

```{r eval = TRUE}
sessionInfo()
```

# Saving environment

```{r Saving}
save.image(paste0(PROJECT_loc, "/",Today,".",PROJECTNAME,".AEDB.EM.baseline.RData"))
```

+-----------------------------------------------------------------------------------------------------------------------------------------+
| <sup>© 1979-2022 Sander W. van der Laan | s.w.vanderlaan[at]gmail.com | [swvanderlaan.github.io](https://swvanderlaan.github.io).</sup> |
+-----------------------------------------------------------------------------------------------------------------------------------------+

+ + +
+
+ +
+ + + + + + + + + + + + + + + + + diff --git a/README.html b/README.html index 8756caf..43485f5 100644 --- a/README.html +++ b/README.html @@ -30,7 +30,7 @@ !function(e,t){"use strict";"object"==typeof module&&"object"==typeof module.exports?module.exports=e.document?t(e,!0):function(e){if(!e.document)throw new Error("jQuery requires a window with a document");return t(e)}:t(e)}("undefined"!=typeof window?window:this,function(C,e){"use strict";var t=[],r=Object.getPrototypeOf,s=t.slice,g=t.flat?function(e){return t.flat.call(e)}:function(e){return t.concat.apply([],e)},u=t.push,i=t.indexOf,n={},o=n.toString,v=n.hasOwnProperty,a=v.toString,l=a.call(Object),y={},m=function(e){return"function"==typeof e&&"number"!=typeof e.nodeType&&"function"!=typeof e.item},x=function(e){return null!=e&&e===e.window},E=C.document,c={type:!0,src:!0,nonce:!0,noModule:!0};function b(e,t,n){var r,i,o=(n=n||E).createElement("script");if(o.text=e,t)for(r in c)(i=t[r]||t.getAttribute&&t.getAttribute(r))&&o.setAttribute(r,i);n.head.appendChild(o).parentNode.removeChild(o)}function w(e){return null==e?e+"":"object"==typeof e||"function"==typeof e?n[o.call(e)]||"object":typeof e}var f="3.6.0",S=function(e,t){return new S.fn.init(e,t)};function p(e){var t=!!e&&"length"in e&&e.length,n=w(e);return!m(e)&&!x(e)&&("array"===n||0===t||"number"==typeof t&&0+~]|"+M+")"+M+"*"),U=new RegExp(M+"|>"),X=new RegExp(F),V=new RegExp("^"+I+"$"),G={ID:new RegExp("^#("+I+")"),CLASS:new RegExp("^\\.("+I+")"),TAG:new RegExp("^("+I+"|[*])"),ATTR:new RegExp("^"+W),PSEUDO:new RegExp("^"+F),CHILD:new RegExp("^:(only|first|last|nth|nth-last)-(child|of-type)(?:\\("+M+"*(even|odd|(([+-]|)(\\d*)n|)"+M+"*(?:([+-]|)"+M+"*(\\d+)|))"+M+"*\\)|)","i"),bool:new RegExp("^(?:"+R+")$","i"),needsContext:new RegExp("^"+M+"*[>+~]|:(even|odd|eq|gt|lt|nth|first|last)(?:\\("+M+"*((?:-\\d)?\\d*)"+M+"*\\)|)(?=[^-]|$)","i")},Y=/HTML$/i,Q=/^(?:input|select|textarea|button)$/i,J=/^h\d$/i,K=/^[^{]+\{\s*\[native \w/,Z=/^(?:#([\w-]+)|(\w+)|\.([\w-]+))$/,ee=/[+~]/,te=new RegExp("\\\\[\\da-fA-F]{1,6}"+M+"?|\\\\([^\\r\\n\\f])","g"),ne=function(e,t){var n="0x"+e.slice(1)-65536;return t||(n<0?String.fromCharCode(n+65536):String.fromCharCode(n>>10|55296,1023&n|56320))},re=/([\0-\x1f\x7f]|^-?\d)|^-$|[^\0-\x1f\x7f-\uFFFF\w-]/g,ie=function(e,t){return t?"\0"===e?"\ufffd":e.slice(0,-1)+"\\"+e.charCodeAt(e.length-1).toString(16)+" ":"\\"+e},oe=function(){T()},ae=be(function(e){return!0===e.disabled&&"fieldset"===e.nodeName.toLowerCase()},{dir:"parentNode",next:"legend"});try{H.apply(t=O.call(p.childNodes),p.childNodes),t[p.childNodes.length].nodeType}catch(e){H={apply:t.length?function(e,t){L.apply(e,O.call(t))}:function(e,t){var n=e.length,r=0;while(e[n++]=t[r++]);e.length=n-1}}}function se(t,e,n,r){var i,o,a,s,u,l,c,f=e&&e.ownerDocument,p=e?e.nodeType:9;if(n=n||[],"string"!=typeof t||!t||1!==p&&9!==p&&11!==p)return n;if(!r&&(T(e),e=e||C,E)){if(11!==p&&(u=Z.exec(t)))if(i=u[1]){if(9===p){if(!(a=e.getElementById(i)))return n;if(a.id===i)return n.push(a),n}else if(f&&(a=f.getElementById(i))&&y(e,a)&&a.id===i)return n.push(a),n}else{if(u[2])return H.apply(n,e.getElementsByTagName(t)),n;if((i=u[3])&&d.getElementsByClassName&&e.getElementsByClassName)return H.apply(n,e.getElementsByClassName(i)),n}if(d.qsa&&!N[t+" "]&&(!v||!v.test(t))&&(1!==p||"object"!==e.nodeName.toLowerCase())){if(c=t,f=e,1===p&&(U.test(t)||z.test(t))){(f=ee.test(t)&&ye(e.parentNode)||e)===e&&d.scope||((s=e.getAttribute("id"))?s=s.replace(re,ie):e.setAttribute("id",s=S)),o=(l=h(t)).length;while(o--)l[o]=(s?"#"+s:":scope")+" "+xe(l[o]);c=l.join(",")}try{return H.apply(n,f.querySelectorAll(c)),n}catch(e){N(t,!0)}finally{s===S&&e.removeAttribute("id")}}}return g(t.replace($,"$1"),e,n,r)}function ue(){var r=[];return function e(t,n){return r.push(t+" ")>b.cacheLength&&delete e[r.shift()],e[t+" "]=n}}function le(e){return e[S]=!0,e}function ce(e){var t=C.createElement("fieldset");try{return!!e(t)}catch(e){return!1}finally{t.parentNode&&t.parentNode.removeChild(t),t=null}}function fe(e,t){var n=e.split("|"),r=n.length;while(r--)b.attrHandle[n[r]]=t}function pe(e,t){var n=t&&e,r=n&&1===e.nodeType&&1===t.nodeType&&e.sourceIndex-t.sourceIndex;if(r)return r;if(n)while(n=n.nextSibling)if(n===t)return-1;return e?1:-1}function de(t){return function(e){return"input"===e.nodeName.toLowerCase()&&e.type===t}}function he(n){return function(e){var t=e.nodeName.toLowerCase();return("input"===t||"button"===t)&&e.type===n}}function ge(t){return function(e){return"form"in e?e.parentNode&&!1===e.disabled?"label"in e?"label"in e.parentNode?e.parentNode.disabled===t:e.disabled===t:e.isDisabled===t||e.isDisabled!==!t&&ae(e)===t:e.disabled===t:"label"in e&&e.disabled===t}}function ve(a){return le(function(o){return o=+o,le(function(e,t){var n,r=a([],e.length,o),i=r.length;while(i--)e[n=r[i]]&&(e[n]=!(t[n]=e[n]))})})}function ye(e){return e&&"undefined"!=typeof e.getElementsByTagName&&e}for(e in d=se.support={},i=se.isXML=function(e){var t=e&&e.namespaceURI,n=e&&(e.ownerDocument||e).documentElement;return!Y.test(t||n&&n.nodeName||"HTML")},T=se.setDocument=function(e){var t,n,r=e?e.ownerDocument||e:p;return r!=C&&9===r.nodeType&&r.documentElement&&(a=(C=r).documentElement,E=!i(C),p!=C&&(n=C.defaultView)&&n.top!==n&&(n.addEventListener?n.addEventListener("unload",oe,!1):n.attachEvent&&n.attachEvent("onunload",oe)),d.scope=ce(function(e){return a.appendChild(e).appendChild(C.createElement("div")),"undefined"!=typeof e.querySelectorAll&&!e.querySelectorAll(":scope fieldset div").length}),d.attributes=ce(function(e){return e.className="i",!e.getAttribute("className")}),d.getElementsByTagName=ce(function(e){return e.appendChild(C.createComment("")),!e.getElementsByTagName("*").length}),d.getElementsByClassName=K.test(C.getElementsByClassName),d.getById=ce(function(e){return a.appendChild(e).id=S,!C.getElementsByName||!C.getElementsByName(S).length}),d.getById?(b.filter.ID=function(e){var t=e.replace(te,ne);return function(e){return e.getAttribute("id")===t}},b.find.ID=function(e,t){if("undefined"!=typeof t.getElementById&&E){var n=t.getElementById(e);return n?[n]:[]}}):(b.filter.ID=function(e){var n=e.replace(te,ne);return function(e){var t="undefined"!=typeof e.getAttributeNode&&e.getAttributeNode("id");return t&&t.value===n}},b.find.ID=function(e,t){if("undefined"!=typeof t.getElementById&&E){var n,r,i,o=t.getElementById(e);if(o){if((n=o.getAttributeNode("id"))&&n.value===e)return[o];i=t.getElementsByName(e),r=0;while(o=i[r++])if((n=o.getAttributeNode("id"))&&n.value===e)return[o]}return[]}}),b.find.TAG=d.getElementsByTagName?function(e,t){return"undefined"!=typeof t.getElementsByTagName?t.getElementsByTagName(e):d.qsa?t.querySelectorAll(e):void 0}:function(e,t){var n,r=[],i=0,o=t.getElementsByTagName(e);if("*"===e){while(n=o[i++])1===n.nodeType&&r.push(n);return r}return o},b.find.CLASS=d.getElementsByClassName&&function(e,t){if("undefined"!=typeof t.getElementsByClassName&&E)return t.getElementsByClassName(e)},s=[],v=[],(d.qsa=K.test(C.querySelectorAll))&&(ce(function(e){var t;a.appendChild(e).innerHTML="",e.querySelectorAll("[msallowcapture^='']").length&&v.push("[*^$]="+M+"*(?:''|\"\")"),e.querySelectorAll("[selected]").length||v.push("\\["+M+"*(?:value|"+R+")"),e.querySelectorAll("[id~="+S+"-]").length||v.push("~="),(t=C.createElement("input")).setAttribute("name",""),e.appendChild(t),e.querySelectorAll("[name='']").length||v.push("\\["+M+"*name"+M+"*="+M+"*(?:''|\"\")"),e.querySelectorAll(":checked").length||v.push(":checked"),e.querySelectorAll("a#"+S+"+*").length||v.push(".#.+[+~]"),e.querySelectorAll("\\\f"),v.push("[\\r\\n\\f]")}),ce(function(e){e.innerHTML="";var t=C.createElement("input");t.setAttribute("type","hidden"),e.appendChild(t).setAttribute("name","D"),e.querySelectorAll("[name=d]").length&&v.push("name"+M+"*[*^$|!~]?="),2!==e.querySelectorAll(":enabled").length&&v.push(":enabled",":disabled"),a.appendChild(e).disabled=!0,2!==e.querySelectorAll(":disabled").length&&v.push(":enabled",":disabled"),e.querySelectorAll("*,:x"),v.push(",.*:")})),(d.matchesSelector=K.test(c=a.matches||a.webkitMatchesSelector||a.mozMatchesSelector||a.oMatchesSelector||a.msMatchesSelector))&&ce(function(e){d.disconnectedMatch=c.call(e,"*"),c.call(e,"[s!='']:x"),s.push("!=",F)}),v=v.length&&new RegExp(v.join("|")),s=s.length&&new RegExp(s.join("|")),t=K.test(a.compareDocumentPosition),y=t||K.test(a.contains)?function(e,t){var n=9===e.nodeType?e.documentElement:e,r=t&&t.parentNode;return e===r||!(!r||1!==r.nodeType||!(n.contains?n.contains(r):e.compareDocumentPosition&&16&e.compareDocumentPosition(r)))}:function(e,t){if(t)while(t=t.parentNode)if(t===e)return!0;return!1},j=t?function(e,t){if(e===t)return l=!0,0;var n=!e.compareDocumentPosition-!t.compareDocumentPosition;return n||(1&(n=(e.ownerDocument||e)==(t.ownerDocument||t)?e.compareDocumentPosition(t):1)||!d.sortDetached&&t.compareDocumentPosition(e)===n?e==C||e.ownerDocument==p&&y(p,e)?-1:t==C||t.ownerDocument==p&&y(p,t)?1:u?P(u,e)-P(u,t):0:4&n?-1:1)}:function(e,t){if(e===t)return l=!0,0;var n,r=0,i=e.parentNode,o=t.parentNode,a=[e],s=[t];if(!i||!o)return e==C?-1:t==C?1:i?-1:o?1:u?P(u,e)-P(u,t):0;if(i===o)return pe(e,t);n=e;while(n=n.parentNode)a.unshift(n);n=t;while(n=n.parentNode)s.unshift(n);while(a[r]===s[r])r++;return r?pe(a[r],s[r]):a[r]==p?-1:s[r]==p?1:0}),C},se.matches=function(e,t){return se(e,null,null,t)},se.matchesSelector=function(e,t){if(T(e),d.matchesSelector&&E&&!N[t+" "]&&(!s||!s.test(t))&&(!v||!v.test(t)))try{var n=c.call(e,t);if(n||d.disconnectedMatch||e.document&&11!==e.document.nodeType)return n}catch(e){N(t,!0)}return 0":{dir:"parentNode",first:!0}," ":{dir:"parentNode"},"+":{dir:"previousSibling",first:!0},"~":{dir:"previousSibling"}},preFilter:{ATTR:function(e){return e[1]=e[1].replace(te,ne),e[3]=(e[3]||e[4]||e[5]||"").replace(te,ne),"~="===e[2]&&(e[3]=" "+e[3]+" "),e.slice(0,4)},CHILD:function(e){return e[1]=e[1].toLowerCase(),"nth"===e[1].slice(0,3)?(e[3]||se.error(e[0]),e[4]=+(e[4]?e[5]+(e[6]||1):2*("even"===e[3]||"odd"===e[3])),e[5]=+(e[7]+e[8]||"odd"===e[3])):e[3]&&se.error(e[0]),e},PSEUDO:function(e){var t,n=!e[6]&&e[2];return G.CHILD.test(e[0])?null:(e[3]?e[2]=e[4]||e[5]||"":n&&X.test(n)&&(t=h(n,!0))&&(t=n.indexOf(")",n.length-t)-n.length)&&(e[0]=e[0].slice(0,t),e[2]=n.slice(0,t)),e.slice(0,3))}},filter:{TAG:function(e){var t=e.replace(te,ne).toLowerCase();return"*"===e?function(){return!0}:function(e){return e.nodeName&&e.nodeName.toLowerCase()===t}},CLASS:function(e){var t=m[e+" "];return t||(t=new RegExp("(^|"+M+")"+e+"("+M+"|$)"))&&m(e,function(e){return t.test("string"==typeof e.className&&e.className||"undefined"!=typeof e.getAttribute&&e.getAttribute("class")||"")})},ATTR:function(n,r,i){return function(e){var t=se.attr(e,n);return null==t?"!="===r:!r||(t+="","="===r?t===i:"!="===r?t!==i:"^="===r?i&&0===t.indexOf(i):"*="===r?i&&-1:\x20\t\r\n\f]*)[\x20\t\r\n\f]*\/?>(?:<\/\1>|)$/i;function j(e,n,r){return m(n)?S.grep(e,function(e,t){return!!n.call(e,t,e)!==r}):n.nodeType?S.grep(e,function(e){return e===n!==r}):"string"!=typeof n?S.grep(e,function(e){return-1)[^>]*|#([\w-]+))$/;(S.fn.init=function(e,t,n){var r,i;if(!e)return this;if(n=n||D,"string"==typeof e){if(!(r="<"===e[0]&&">"===e[e.length-1]&&3<=e.length?[null,e,null]:q.exec(e))||!r[1]&&t)return!t||t.jquery?(t||n).find(e):this.constructor(t).find(e);if(r[1]){if(t=t instanceof S?t[0]:t,S.merge(this,S.parseHTML(r[1],t&&t.nodeType?t.ownerDocument||t:E,!0)),N.test(r[1])&&S.isPlainObject(t))for(r in t)m(this[r])?this[r](t[r]):this.attr(r,t[r]);return this}return(i=E.getElementById(r[2]))&&(this[0]=i,this.length=1),this}return e.nodeType?(this[0]=e,this.length=1,this):m(e)?void 0!==n.ready?n.ready(e):e(S):S.makeArray(e,this)}).prototype=S.fn,D=S(E);var L=/^(?:parents|prev(?:Until|All))/,H={children:!0,contents:!0,next:!0,prev:!0};function O(e,t){while((e=e[t])&&1!==e.nodeType);return e}S.fn.extend({has:function(e){var t=S(e,this),n=t.length;return this.filter(function(){for(var e=0;e\x20\t\r\n\f]*)/i,he=/^$|^module$|\/(?:java|ecma)script/i;ce=E.createDocumentFragment().appendChild(E.createElement("div")),(fe=E.createElement("input")).setAttribute("type","radio"),fe.setAttribute("checked","checked"),fe.setAttribute("name","t"),ce.appendChild(fe),y.checkClone=ce.cloneNode(!0).cloneNode(!0).lastChild.checked,ce.innerHTML="",y.noCloneChecked=!!ce.cloneNode(!0).lastChild.defaultValue,ce.innerHTML="",y.option=!!ce.lastChild;var ge={thead:[1,"","
"],col:[2,"","
"],tr:[2,"","
"],td:[3,"","
"],_default:[0,"",""]};function ve(e,t){var n;return n="undefined"!=typeof e.getElementsByTagName?e.getElementsByTagName(t||"*"):"undefined"!=typeof e.querySelectorAll?e.querySelectorAll(t||"*"):[],void 0===t||t&&A(e,t)?S.merge([e],n):n}function ye(e,t){for(var n=0,r=e.length;n",""]);var me=/<|&#?\w+;/;function xe(e,t,n,r,i){for(var o,a,s,u,l,c,f=t.createDocumentFragment(),p=[],d=0,h=e.length;d\s*$/g;function je(e,t){return A(e,"table")&&A(11!==t.nodeType?t:t.firstChild,"tr")&&S(e).children("tbody")[0]||e}function De(e){return e.type=(null!==e.getAttribute("type"))+"/"+e.type,e}function qe(e){return"true/"===(e.type||"").slice(0,5)?e.type=e.type.slice(5):e.removeAttribute("type"),e}function Le(e,t){var n,r,i,o,a,s;if(1===t.nodeType){if(Y.hasData(e)&&(s=Y.get(e).events))for(i in Y.remove(t,"handle events"),s)for(n=0,r=s[i].length;n").attr(n.scriptAttrs||{}).prop({charset:n.scriptCharset,src:n.url}).on("load error",i=function(e){r.remove(),i=null,e&&t("error"===e.type?404:200,e.type)}),E.head.appendChild(r[0])},abort:function(){i&&i()}}});var _t,zt=[],Ut=/(=)\?(?=&|$)|\?\?/;S.ajaxSetup({jsonp:"callback",jsonpCallback:function(){var e=zt.pop()||S.expando+"_"+wt.guid++;return this[e]=!0,e}}),S.ajaxPrefilter("json jsonp",function(e,t,n){var r,i,o,a=!1!==e.jsonp&&(Ut.test(e.url)?"url":"string"==typeof e.data&&0===(e.contentType||"").indexOf("application/x-www-form-urlencoded")&&Ut.test(e.data)&&"data");if(a||"jsonp"===e.dataTypes[0])return r=e.jsonpCallback=m(e.jsonpCallback)?e.jsonpCallback():e.jsonpCallback,a?e[a]=e[a].replace(Ut,"$1"+r):!1!==e.jsonp&&(e.url+=(Tt.test(e.url)?"&":"?")+e.jsonp+"="+r),e.converters["script json"]=function(){return o||S.error(r+" was not called"),o[0]},e.dataTypes[0]="json",i=C[r],C[r]=function(){o=arguments},n.always(function(){void 0===i?S(C).removeProp(r):C[r]=i,e[r]&&(e.jsonpCallback=t.jsonpCallback,zt.push(r)),o&&m(i)&&i(o[0]),o=i=void 0}),"script"}),y.createHTMLDocument=((_t=E.implementation.createHTMLDocument("").body).innerHTML="
",2===_t.childNodes.length),S.parseHTML=function(e,t,n){return"string"!=typeof e?[]:("boolean"==typeof t&&(n=t,t=!1),t||(y.createHTMLDocument?((r=(t=E.implementation.createHTMLDocument("")).createElement("base")).href=E.location.href,t.head.appendChild(r)):t=E),o=!n&&[],(i=N.exec(e))?[t.createElement(i[1])]:(i=xe([e],t,o),o&&o.length&&S(o).remove(),S.merge([],i.childNodes)));var r,i,o},S.fn.load=function(e,t,n){var r,i,o,a=this,s=e.indexOf(" ");return-1").append(S.parseHTML(e)).find(r):e)}).always(n&&function(e,t){a.each(function(){n.apply(this,o||[e.responseText,t,e])})}),this},S.expr.pseudos.animated=function(t){return S.grep(S.timers,function(e){return t===e.elem}).length},S.offset={setOffset:function(e,t,n){var r,i,o,a,s,u,l=S.css(e,"position"),c=S(e),f={};"static"===l&&(e.style.position="relative"),s=c.offset(),o=S.css(e,"top"),u=S.css(e,"left"),("absolute"===l||"fixed"===l)&&-1<(o+u).indexOf("auto")?(a=(r=c.position()).top,i=r.left):(a=parseFloat(o)||0,i=parseFloat(u)||0),m(t)&&(t=t.call(e,n,S.extend({},s))),null!=t.top&&(f.top=t.top-s.top+a),null!=t.left&&(f.left=t.left-s.left+i),"using"in t?t.using.call(e,f):c.css(f)}},S.fn.extend({offset:function(t){if(arguments.length)return void 0===t?this:this.each(function(e){S.offset.setOffset(this,t,e)});var e,n,r=this[0];return r?r.getClientRects().length?(e=r.getBoundingClientRect(),n=r.ownerDocument.defaultView,{top:e.top+n.pageYOffset,left:e.left+n.pageXOffset}):{top:0,left:0}:void 0},position:function(){if(this[0]){var e,t,n,r=this[0],i={top:0,left:0};if("fixed"===S.css(r,"position"))t=r.getBoundingClientRect();else{t=this.offset(),n=r.ownerDocument,e=r.offsetParent||n.documentElement;while(e&&(e===n.body||e===n.documentElement)&&"static"===S.css(e,"position"))e=e.parentNode;e&&e!==r&&1===e.nodeType&&((i=S(e).offset()).top+=S.css(e,"borderTopWidth",!0),i.left+=S.css(e,"borderLeftWidth",!0))}return{top:t.top-i.top-S.css(r,"marginTop",!0),left:t.left-i.left-S.css(r,"marginLeft",!0)}}},offsetParent:function(){return this.map(function(){var e=this.offsetParent;while(e&&"static"===S.css(e,"position"))e=e.offsetParent;return e||re})}}),S.each({scrollLeft:"pageXOffset",scrollTop:"pageYOffset"},function(t,i){var o="pageYOffset"===i;S.fn[t]=function(e){return $(this,function(e,t,n){var r;if(x(e)?r=e:9===e.nodeType&&(r=e.defaultView),void 0===n)return r?r[i]:e[t];r?r.scrollTo(o?r.pageXOffset:n,o?n:r.pageYOffset):e[t]=n},t,e,arguments.length)}}),S.each(["top","left"],function(e,n){S.cssHooks[n]=Fe(y.pixelPosition,function(e,t){if(t)return t=We(e,n),Pe.test(t)?S(e).position()[n]+"px":t})}),S.each({Height:"height",Width:"width"},function(a,s){S.each({padding:"inner"+a,content:s,"":"outer"+a},function(r,o){S.fn[o]=function(e,t){var n=arguments.length&&(r||"boolean"!=typeof e),i=r||(!0===e||!0===t?"margin":"border");return $(this,function(e,t,n){var r;return x(e)?0===o.indexOf("outer")?e["inner"+a]:e.document.documentElement["client"+a]:9===e.nodeType?(r=e.documentElement,Math.max(e.body["scroll"+a],r["scroll"+a],e.body["offset"+a],r["offset"+a],r["client"+a])):void 0===n?S.css(e,t,i):S.style(e,t,n,i)},s,n?e:void 0,n)}})}),S.each(["ajaxStart","ajaxStop","ajaxComplete","ajaxError","ajaxSuccess","ajaxSend"],function(e,t){S.fn[t]=function(e){return this.on(t,e)}}),S.fn.extend({bind:function(e,t,n){return this.on(e,null,t,n)},unbind:function(e,t){return this.off(e,null,t)},delegate:function(e,t,n,r){return this.on(t,e,n,r)},undelegate:function(e,t,n){return 1===arguments.length?this.off(e,"**"):this.off(t,e||"**",n)},hover:function(e,t){return this.mouseenter(e).mouseleave(t||e)}}),S.each("blur focus focusin focusout resize scroll click dblclick mousedown mouseup mousemove mouseover mouseout mouseenter mouseleave change select submit keydown keypress keyup contextmenu".split(" "),function(e,n){S.fn[n]=function(e,t){return 0 - +h1.title {font-size: 38px;} +h2 {font-size: 30px;} +h3 {font-size: 24px;} +h4 {font-size: 18px;} +h5 {font-size: 16px;} +h6 {font-size: 12px;} +code {color: inherit; background-color: rgba(0, 0, 0, 0.04);} +pre:not([class]) { background-color: white } +code{white-space: pre-wrap;} +span.smallcaps{font-variant: small-caps;} +span.underline{text-decoration: underline;} +div.column{display: inline-block; vertical-align: top; width: 50%;} +div.hanging-indent{margin-left: 1.5em; text-indent: -1.5em;} +ul.task-list{list-style: none;} +