diff --git a/CohortDiagnosticsBreastCancer/DiagnosticsExplorer.Rproj b/CohortDiagnosticsBreastCancer/DiagnosticsExplorer.Rproj
new file mode 100644
index 00000000..8e3c2ebc
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/DiagnosticsExplorer.Rproj
@@ -0,0 +1,13 @@
+Version: 1.0
+
+RestoreWorkspace: Default
+SaveWorkspace: Default
+AlwaysSaveHistory: Default
+
+EnableCodeIndexing: Yes
+UseSpacesForTab: Yes
+NumSpacesForTab: 2
+Encoding: UTF-8
+
+RnwWeave: Sweave
+LaTeX: pdfLaTeX
diff --git a/CohortDiagnosticsBreastCancer/R/DisplayFunctions.R b/CohortDiagnosticsBreastCancer/R/DisplayFunctions.R
new file mode 100644
index 00000000..d3cf2fb7
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/R/DisplayFunctions.R
@@ -0,0 +1,73 @@
+camelCaseToSnakeCase <- function(string) {
+  # Prefix capitals with "_", lower-case, then split each letter-digit pair with "_".
+  underscored <- gsub("([A-Z])", "_\\1", string)
+  lowered <- tolower(underscored)
+  gsub("([a-z])([0-9])", "\\1_\\2", lowered)
+}
+
+
+camelCaseToTitleCase <- function(string) {
+  # Insert a space before capitals and before a digit that follows a lower-case letter.
+  titled <- gsub("([a-z])([0-9])", "\\1 \\2", gsub("([A-Z])", " \\1", string))
+  substr(titled, 1, 1) <- toupper(substr(titled, 1, 1))
+  titled
+}
+
+
+truncateStringDef <- function(columns, maxChars) {
+  # Column definition: display text longer than maxChars is cut, full text goes in the title.
+  jsTemplate <- "function(data, type, row, meta) {\n
+      return type === 'display' && data != null && data.length > %s ?\n
+        '<span title=\"' + data + '\">' + data.substr(0, %s) + '...</span>' : data;\n
+     }"
+  renderer <- DT::JS(sprintf(jsTemplate, maxChars, maxChars))
+  list(targets = columns, render = renderer)
+}
+
+minCellCountDef <- function(columns) {
+  # Column definition for counts: adds thousands separators for display;
+  # negative values are shown as '<' followed by their absolute value.
+  renderer <- DT::JS("function(data, type) {
+    if (type !== 'display' || isNaN(parseFloat(data))) return data;
+    if (data >= 0) return data.toString().replace(/(\\d)(?=(\\d{3})+(?!\\d))/g, '$1,');
+    return '<' + Math.abs(data).toString().replace(/(\\d)(?=(\\d{3})+(?!\\d))/g, '$1,');
+  }")
+  list(targets = columns, render = renderer)
+}
+
+minCellPercentDef <- function(columns) {
+  # Column definition for fractions: shown as a percentage with one decimal;
+  # negative values are shown as '<' followed by their absolute percentage.
+  renderer <- DT::JS("function(data, type) {
+    if (type !== 'display' || isNaN(parseFloat(data))) return data;
+    if (data >= 0) return (100 * data).toFixed(1).replace(/(\\d)(?=(\\d{3})+(?!\\d))/g, '$1,') + '%';
+    return '<' + Math.abs(100 * data).toFixed(1).replace(/(\\d)(?=(\\d{3})+(?!\\d))/g, '$1,') + '%';
+  }")
+  list(targets = columns, render = renderer)
+}
+
+minCellRealDef <- function(columns, digits = 1) {
+  # Column definition for real numbers: fixed `digits` decimals with thousands
+  # separators; negative values are shown as '<' followed by their absolute value.
+  jsTemplate <- "function(data, type) {
+    if (type !== 'display' || isNaN(parseFloat(data))) return data;
+    if (data >= 0) return data.toFixed(%s).replace(/(\\d)(?=(\\d{3})+(?!\\d))/g, '$1,');
+    return '<' + Math.abs(data).toFixed(%s).replace(/(\\d)(?=(\\d{3})+(?!\\d))/g, '$1,');
+  }"
+  list(targets = columns, render = DT::JS(sprintf(jsTemplate, digits, digits)))
+}
+
+styleAbsColorBar <- function(maxValue, colorPositive, colorNegative, angle = 90) {  # JS for a gradient bar; colorPositive when value > 0, else colorNegative
+  gradientJs <- "isNaN(parseFloat(value))? '' : 'linear-gradient(%fdeg, transparent ' + (%f - Math.abs(value))/%f * 100 + '%%, ' + (value > 0 ? '%s ' : '%s ') + (%f - Math.abs(value))/%f * 100 + '%%)'"
+  DT::JS(sprintf(gradientJs, angle, maxValue, maxValue, colorPositive, colorNegative, maxValue, maxValue))
+}
+
+sumCounts <- function(counts) {
+  # Sum of the absolute counts. A negative input marks the result as negative:
+  # if any count is below zero the total is returned with a minus sign.
+  total <- sum(abs(counts))
+  if (any(counts < 0)) {
+    total <- -total
+  }
+  total
+}
diff --git a/CohortDiagnosticsBreastCancer/R/FacetNested.R b/CohortDiagnosticsBreastCancer/R/FacetNested.R
new file mode 100644
index 00000000..e02ca2d1
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/R/FacetNested.R
@@ -0,0 +1,602 @@
+# Code borrowed from https://github.com/teunbrand/ggh4x and gtable, just to merge the labels of grouped facets.
+# May need to simplify a bit.
+library(ggplot2)
+
+.grab_ggplot_internals <- function() {
+  internal_names <- c(
+    ".all_aesthetics",
+    "as_facets_list",
+    "as_gg_data_frame",
+    "axis_label_element_overrides",
+    "check_aesthetics",
+    "check_labeller",
+    "check_subclass",
+    "compact",
+    "continuous_range",
+    "convertInd",
+    "df.grid",
+    "draw_axis_labels",
+    "reshape_add_margins",
+    "new_data_frame",
+    "defaults", "id",
+    "empty",
+    "eval_facets",
+    "ggname",
+    "rename_aes",
+    "mapped_aesthetics",
+    "make_labels",
+    "grid_as_facets_list",
+    "is.zero",
+    "rbind_dfs",
+    "sanitise_dim",
+    "set_draw_key",
+    "snake_class",
+    "ulevels",
+    "unique_combs",
+    "var_list",
+    "validate_mapping",
+    "warn_for_guide_position",
+    "weave_tables_col",
+    "weave_tables_row",
+    "wrap_as_facets_list",
+    ".pt"
+  )
+  # Name every entry after itself so the result can be indexed by object name.
+  names(internal_names) <- internal_names
+  # Look each object up in the ggplot2 namespace; the list is returned invisibly.
+  invisible(lapply(internal_names, getFromNamespace, ns = "ggplot2"))
+}
+
+# Store the needed ggplot internals here
+.int <- .grab_ggplot_internals()
+
+# From gtable:
+neg_to_pos <- function (x, max) {
+  ifelse(x < 0, max + 1 + x, x)  # a negative position counts back from max
+}
+
+new_data_frame <- function (x, n = NULL) 
+{
+  # Row count defaults to the length of the first column (0 for an empty list).
+  if (is.null(n)) {
+    n <- if (length(x) > 0) length(x[[1]]) else 0
+  }
+  # Turn the list into a data.frame by setting class and row names directly.
+  class(x) <- "data.frame"
+  attr(x, "row.names") <- .set_row_names(n)
+  x
+}
+
+gtable_add_grob <- function(x, grobs, t, l, b = t, r = l, z = Inf, clip = "on", 
+                            name = x$name) 
+{
+  # Local variant of gtable's gtable_add_grob(): appends `grobs` to gtable `x` at the
+  # cell extents t/l/b/r (negative = counted from the end); z/clip/name are recycled.
+  if (!gtable::is.gtable(x)) 
+    stop("x must be a gtable", call. = FALSE)
+  # A bare grob is itself a list: wrap it so its fields are not appended one by one.
+  if (grid::is.grob(grobs)) 
+    grobs <- list(grobs)
+  if (!is.list(grobs)) 
+    stop("grobs must either be a single grob or a list of grobs", call. = FALSE)
+  n_grobs <- length(grobs)
+  if (is.logical(clip)) clip <- ifelse(clip, "on", "off")
+  layout <- unclass(x$layout)
+  # if (!all(vapply(list(t, r, b, l, z, clip, name), len_same_or_1, 
+  #                 logical(1), n_grobs))) {
+  #   stop("Not all inputs have either length 1 or same length same as 'grobs'")
+  # }
+  z <- rep(z, length.out = n_grobs)
+  zval <- c(layout$z, z[!is.infinite(z)])
+  if (length(zval) == 0) {
+    zmin <- 1
+    zmax <- 0
+  }
+  else {
+    zmin <- min(zval)
+    zmax <- max(zval)
+  }
+  z[z == -Inf] <- zmin - rev(seq_len(sum(z == -Inf)))  # -Inf: below every finite z
+  z[z == Inf] <- zmax + seq_len(sum(z == Inf))  # Inf: above every finite z
+  x_row <- length(x$heights)
+  x_col <- length(x$widths)
+  t <- rep(neg_to_pos(t, x_row), length.out = n_grobs)
+  b <- rep(neg_to_pos(b, x_row), length.out = n_grobs)
+  l <- rep(neg_to_pos(l, x_col), length.out = n_grobs)
+  r <- rep(neg_to_pos(r, x_col), length.out = n_grobs)
+  clip <- rep(clip, length.out = n_grobs)
+  name <- rep(name, length.out = n_grobs)
+  x$grobs <- c(x$grobs, grobs)
+  x$layout <- new_data_frame(list(
+    t = c(layout$t, t), l = c(layout$l, l), b = c(layout$b, b), r = c(layout$r, r),
+    z = c(layout$z, z), clip = c(layout$clip, clip), name = c(layout$name, name)
+  ))
+  x
+}
+
+# Main function -----------------------------------------------------------
+
+#' @title Layout panels in a grid with nested strips
+#'
+#' @description \code{facet_nested()} forms a matrix of panels defined by row
+#'   and column faceting variables and nests grouped facets.
+#'
+#' @inheritParams ggplot2::facet_grid
+#' @param nest_line a \code{logical} vector of length 1, indicating whether to
+#'   draw a nesting line to indicate the nesting of variables. Control the look
+#'   of the nesting line by setting the \code{ggh4x.facet.nestline} theme
+#'   element.
+#' @param resect  a \code{unit} vector of length 1, indicating how much the
+#'   nesting line should be shortened.
+#' @param bleed a \code{logical} vector of length 1, indicating whether merging
+#'   of lower-level variables is allowed when the higher-level variables are
+#'   separate. See details.
+#'
+#' @details Unlike \code{facet_grid()}, this function only automatically expands
+#'   missing variables when they have no variables in that direction, to allow
+#'   for unnested variables. It still requires at least one layer to have all
+#'   faceting variables.
+#'
+#'   Hierarchies are inferred from the order of variables supplied to
+#'   \code{rows} or \code{cols}. The first variable is interpreted to be the
+#'   outermost variable, while the last variable is interpreted to be the
+#'   innermost variable. The display order is always such that the outermost
+#'   variable is placed the furthest away from the panels. Strips are
+#'   automatically grouped when they span a nested variable.
+#'
+#'   The \code{bleed} argument controls whether lower-level variables are allowed
+#'   to be merged when higher-level are different, i.e. they can bleed over
+#'   hierarchies. Suppose the \code{facet_grid()} behaviour would be the
+#'   following:
+#'
+#'   \code{[_1_][_2_][_2_]} \cr \code{[_3_][_3_][_4_]}
+#'
+#'   In such case, the default \code{bleed = FALSE} argument would result in the
+#'   following:
+#'
+#'   \code{[_1_][___2____]} \cr \code{[_3_][_3_][_4_]}
+#'
+#'   Whereas \code{bleed = TRUE} would allow the following:
+#'
+#'   \code{[_1_][___2____]} \cr \code{[___3____][_4_]}
+#'
+#' @export
+#'
+#' @return A \emph{FacetNested} ggproto object.
+#' @family facetting functions
+#'
+#' @seealso See \code{\link[ggplot2]{facet_grid}} for descriptions of the
+#'   original arguments. See \code{\link[grid]{unit}} for the construction of a
+#'   \code{unit} vector.
+#'
+#' @examples
+#' df <- iris
+#' df$nester <- ifelse(df$Species == "setosa",
+#'                     "Short Leaves",
+#'                     "Long Leaves")
+#'
+#' ggplot(df, aes(Sepal.Length, Petal.Length)) +
+#'   geom_point() +
+#'   facet_nested(~ nester + Species)
+#'
+#' # Controlling the nest line
+#' ggplot(df, aes(Sepal.Length, Petal.Length)) +
+#'   geom_point() +
+#'   facet_nested(~ nester + Species, nest_line = TRUE) +
+#'   theme(ggh4x.facet.nestline = element_line(linetype = 3))
+facet_nested <- function(
+  rows = NULL, cols = NULL, scales = "fixed", space = "fixed",
+  shrink = TRUE, labeller = "label_value", as.table = TRUE,
+  switch = NULL, drop = TRUE, margins = FALSE, facets = NULL,
+  nest_line = FALSE, resect = unit(0, "mm"), bleed = FALSE
+) {
+  if (!is.null(facets)) {  # a non-NULL `facets` replaces `rows`
+    rows <- facets
+  }
+  if (is.logical(cols)) {  # a logical `cols` is taken as the `margins` setting
+    margins <- cols
+    cols <- NULL
+  }
+  scales <- match.arg(scales, c("fixed", "free_x", "free_y", "free"))
+  free <- list(x = any(scales %in% c("free_x", "free")),
+               y = any(scales %in% c("free_y", "free")))
+  
+  space <- match.arg(space, c("fixed", "free_x", "free_y", "free"))
+  space_free <- list(x = any(space %in% c("free_x", "free")),
+                     y = any(space %in% c("free_y", "free")))
+  
+  if (!is.null(switch) && !switch %in% c("both", "x", "y")) {
+    stop("switch must be either 'both', 'x', or 'y'", call. = FALSE)
+  }
+  # Normalise rows/cols into a list of facet specifications (at most rows + cols)
+  facets_list <- .int$grid_as_facets_list(rows, cols)
+  n <- length(facets_list)
+  if (n > 2L) {
+    stop("A grid facet specification can't have more than two dimensions",
+         call. = FALSE)
+  }
+  if (n == 1L) {
+    rows <- quos()
+    cols <- facets_list[[1]]
+  } else {
+    rows <- facets_list[[1]]
+    cols <- facets_list[[2]]
+  }
+  labeller <- .int$check_labeller(labeller)
+  ggplot2::ggproto(NULL, FacetNested, shrink = shrink,
+                   params = list(
+                     rows = rows,
+                     cols = cols,
+                     margins = margins,
+                     free = free,
+                     space_free = space_free,
+                     labeller = labeller,
+                     as.table = as.table,
+                     switch = switch,
+                     drop = drop,
+                     nest_line = nest_line,
+                     resect = resect,
+                     bleed = bleed
+                   ))
+}
+
+# ggproto -----------------------------------------------------------------
+
+#' @usage NULL
+#' @format NULL
+#' @export
+#' @rdname ggh4x_extensions
+FacetNested <- ggplot2::ggproto(
+  "FacetNested", FacetGrid,  # inherits from FacetGrid; overrides the three methods below
+  map_data = function(data, layout, params) {
+    # Assigns a PANEL to every row of `data`. Empty data only gains an empty PANEL column.
+    if (.int$empty(data)) {
+      return(cbind(data, PANEL = integer(0)))
+    }
+    # Setup variables
+    rows <- params$rows
+    cols <- params$cols
+    # Without any facet variables the layout's PANEL column is used as is
+    vars <- c(names(rows), names(cols))
+    if (length(vars) == 0) {
+      data$PANEL <- layout$PANEL
+      return(data)
+    }
+    # Facet variable names that exist as columns of `data`, per direction
+    margin_vars <- list(intersect(names(rows), names(data)),
+                        intersect(names(cols), names(data)))
+    
+    # Add margins via the ggplot2 helper, then evaluate the facet variables on the data
+    data <- .int$reshape_add_margins(data, margin_vars, params$margins)
+    facet_vals <- .int$eval_facets(c(rows, cols), data, params$.possible_columns)
+    
+    # Only set as missing if it has no variable in that direction
+    missing_facets <- character(0)
+    if (!any(names(rows) %in% names(facet_vals))){
+      missing_facets <- c(missing_facets,
+                          setdiff(names(rows), names(facet_vals)))
+    }
+    if (!any(names(cols) %in% names(facet_vals))){
+      missing_facets <- c(missing_facets,
+                          setdiff(names(cols), names(facet_vals)))
+    }
+    
+    # Fill in missing values: repeat the data once per combination of the missing facets
+    if (length(missing_facets) > 0) {
+      to_add <- unique(layout[missing_facets])
+      data_rep <- rep.int(1:nrow(data), nrow(to_add))
+      facet_rep <- rep(1:nrow(to_add), each = nrow(data))
+      data <- data[data_rep, , drop = FALSE]
+      rownames(data) <- NULL
+      facet_vals <- cbind(facet_vals[data_rep, , drop = FALSE],
+                          to_add[facet_rep, , drop = FALSE])
+      rownames(facet_vals) <- NULL
+    }
+    
+    # Match columns to facets
+    if (nrow(facet_vals) == 0) {
+      data$PANEL <- -1  # presumably a "no panel" marker -- TODO confirm
+    } else {
+      facet_vals[] <- lapply(facet_vals[], as.factor)
+      facet_vals[] <- lapply(facet_vals[], addNA, ifany = TRUE)  # NA becomes a level when present
+      keys <- plyr::join.keys(facet_vals, layout,
+                              by = vars[vars %in% names(facet_vals)])
+      data$PANEL <- layout$PANEL[match(keys$x, keys$y)]
+    }
+    data
+  },
+  compute_layout = function(data, params) {  # builds the PANEL/ROW/COL/SCALE_X/SCALE_Y table
+    rows <- params$rows
+    cols <- params$cols
+    dups <- intersect(names(rows), names(cols))
+    # A variable may be used for rows or for columns, never for both
+    if (length(dups) > 0) {
+      stop("Facetting variables can only appear in row or cols, not both.\n",
+           "Problems: ", paste0(dups, collapse = "'"), call. = FALSE)
+    }
+    # Value combinations of the row variables, as produced by combine_nested_vars()
+    base_rows <- combine_nested_vars(data, params$plot_env,
+                                     rows, drop = params$drop)
+    if (!params$as.table) {  # NOTE(review): rev_order is defined but not used in this method
+      rev_order <- function(x) factor(x, levels = rev(.int$ulevels(x)))
+    }
+    base_cols <- combine_nested_vars(data, params$plot_env, cols,
+                                     drop = params$drop)
+    base <- .int$df.grid(base_rows, base_cols)
+    # No combinations at all: fall back to a single panel
+    if (nrow(base) == 0) {
+      return(.int$new_data_frame(list(PANEL = 1L, ROW = 1L, COL = 1L,
+                                      SCALE_X = 1L, SCALE_Y = 1L)))
+    }
+    
+    base <- .int$reshape_add_margins(
+      base, list(names(rows), names(cols)), params$margins
+    )
+    base <- unique(base)
+    # One panel id per remaining row of `base`; ROW / COL ids from their own variables
+    panel <- .int$id(base, drop = TRUE)
+    panel <- factor(panel, levels = seq_len(attr(panel, "n")))
+    
+    rows <- if (!length(names(rows))) {
+      rep(1L, length(panel))
+    } else {
+      .int$id(base[names(rows)], drop = TRUE)
+    }
+    cols <- if (!length(names(cols))) {
+      rep(1L, length(panel))
+    } else {
+      .int$id(base[names(cols)], drop = TRUE)
+    }
+    
+    panels <- .int$new_data_frame(
+      c(list(PANEL = panel, ROW = rows, COL = cols), base)
+    )
+    panels <- panels[order(panels$PANEL), , drop = FALSE]
+    rownames(panels) <- NULL
+    panels$SCALE_X <- if (params$free$x) {  # free x: one x scale per column
+      panels$COL
+    } else {
+      1L
+    }
+    panels$SCALE_Y <- if (params$free$y) {  # free y: one y scale per row
+      panels$ROW
+    } else {
+      1L
+    }
+    panels
+  },
+  draw_panels = function(panels, layout, x_scales, y_scales, ranges, coord,
+                         data, theme, params) {  # FacetGrid's panel table, then merged strips
+    panel_table <- FacetGrid$draw_panels(panels, layout, x_scales, y_scales,
+                                         ranges, coord, data, theme, params)
+    
+    # Setup strips: unique value combinations per direction, with type/facet attributes
+    col_vars  <- unique(layout[names(params$cols)])
+    row_vars  <- unique(layout[names(params$rows)])
+    attr(col_vars, "type")  <- "cols"
+    attr(col_vars, "facet") <- "grid"
+    attr(row_vars, "type")  <- "rows"
+    attr(row_vars, "facet") <- "grid"
+    
+    # Whether the strips of each direction are switched to the opposite side
+    switch_x <- !is.null(params$switch) && params$switch %in% c("both", "x")
+    switch_y <- !is.null(params$switch) && params$switch %in% c("both", "y")
+    
+    # Merging strips: needed when any variable has a run of repeated consecutive values
+    merge_cols <- apply(col_vars, 2, function(x) any(rle(x)$lengths > 1))
+    merge_rows <- apply(row_vars, 2, function(x) any(rle(x)$lengths > 1))
+    
+    if (any(merge_cols)) {
+      if (switch_x) {
+        panel_table <- merge_strips(panel_table,
+                                    col_vars, switch_x, params, theme, "b")
+      } else {
+        panel_table <- merge_strips(panel_table,
+                                    col_vars, switch_x, params, theme, "t")
+      }
+    }
+    
+    if (any(merge_rows)) {
+      if (switch_y) {
+        panel_table <- merge_strips(panel_table,
+                                    row_vars, switch_y, params, theme, "l")
+      } else {
+        panel_table <- merge_strips(panel_table,
+                                    row_vars, switch_y, params, theme, "r")
+      }
+    }
+    panel_table
+  }
+)
+
+# Helper functions -----------------------------------------------
+
+combine_nested_vars <- function(
+  data, env = emptyenv(), vars = NULL, drop = TRUE
+) {
+  # No facet variables in this direction: nothing to combine.
+  if (length(vars) == 0) {
+    return(.int$new_data_frame())
+  }
+  # Evaluate the facet variables against every element of `data`.
+  all_columns <- unique(unlist(lapply(data, names)))
+  per_layer <- lapply(data, .int$eval_facets, facets = vars,
+                      possible_columns = all_columns)
+  per_layer <- .int$compact(per_layer)
+  complete <- lengths(per_layer) == length(vars)
+  if (!any(complete)) {
+    absent <- lapply(per_layer, function(x) setdiff(names(vars), names(x)))
+    absent_txt <- vapply(absent, .int$var_list, character(1))
+    layer_label <- c("Plot", paste0("Layer ", seq_len(length(data) - 1)))
+    stop("At least one layer must contain all faceting variables: ",
+         .int$var_list(names(vars)), ".\n",
+         paste0("* ", layer_label, " is missing ", absent_txt, collapse = "\n"),
+         call. = FALSE)
+  }
+  # Start from the entries holding every variable, then append the partial ones.
+  base <- unique(.int$rbind_dfs(per_layer[complete]))
+  if (!drop) {
+    base <- .int$unique_combs(base)
+  }
+  for (partial in per_layer[!complete]) {
+    if (.int$empty(partial)) next
+    absent_cols <- setdiff(names(base), names(partial))
+    old <- base[absent_cols]
+    new <- unique(partial[intersect(names(base), names(partial))])
+    if (drop) new <- .int$unique_combs(new)
+    old[absent_cols] <- rep("", nrow(old))  # variables the entry lacks are set to ""
+    base <- rbind(base, .int$df.grid(old, new))
+  }
+  if (.int$empty(base)) {
+    stop("Facetting variables must have at least one value",
+         call. = FALSE)
+  }
+  base
+}
+
+# New merge strips --------------------------------------------------------
+
+merge_strips <- function(
+  panel_table, vars, switch, params, theme, where = "t"
+) {  # rebuilds the "strip-<where>" strips of panel_table, merging runs of equal labels
+  orient <- if (where %in% c("t", "b")) "x" else "y"  # t/b strips run along x, others along y
+  nlevels <- ncol(vars)
+  # Cut the block of cells holding the "strip-<where>" grobs out of panel_table
+  these_strips <- grep(paste0("strip-", where), panel_table$layout$name)
+  strp_rows <- range(panel_table$layout$t[these_strips])
+  strp_cols <- range(panel_table$layout$l[these_strips])
+  strp_rows <- seq(strp_rows[1], strp_rows[2])
+  strp_cols <- seq(strp_cols[1], strp_cols[2])
+  strp <- panel_table[strp_rows, strp_cols]
+  
+  # Make empty template
+  template <- strp
+  template$grobs <- list()
+  template$layout <- template$layout[0,]
+  
+  # Inflate strips: split every strip into one single-grob entry per contained grob
+  for (i in seq_along(strp$grobs)) {
+    sub <- strp$grobs[[i]]
+    if (where == "b") {
+      sub$layout$t <- rev(sub$layout$t)
+      sub$layout$b <- rev(sub$layout$b)
+    }
+    n <- length(sub$grobs)
+    lay <- strp$layout[i,]
+    lay <- lay[rep(1, n),]
+    rownames(lay) <- NULL
+    sub <- lapply(seq_len(n), function(j) {
+      x <- sub
+      x$grobs <- x$grobs[j]
+      x$layout <- x$layout[j,]
+      x
+    })
+    template <- gtable_add_grob(
+      template,
+      sub, t = lay$t, l = lay$l, b = lay$b, r = lay$r,
+      z = lay$z, clip = lay$clip, name = paste0(lay$name, "-", seq_len(n))
+    )
+  }
+  # Without bleed, each level is keyed by the pasted values of itself and all earlier levels
+  if (!params$bleed) {
+    vars[] <- lapply(seq_len(ncol(vars)), function(i) {
+      do.call(paste0, vars[, seq(i), drop = FALSE])
+    })
+  }
+  merge <- apply(vars, 2, function(x) any(rle(x)$lengths > 1))
+  
+  if (where == "r") {
+    vars <- rev(vars)
+    merge <- rev(merge)
+  }
+  
+  # Abstract away strips: keep the "-"-separated name fields from the third one on, as integers
+  strip_ids <- strsplit(template$layout$name, "-", fixed = TRUE)
+  strip_ids <- do.call(rbind, strip_ids)
+  strip_ids <- strip_ids[,3:ncol(strip_ids)]  # assumes names like strip-<where>-<i>-<j> -- TODO confirm
+  mode(strip_ids) <- "integer"
+  
+  template$layout$delete <- rep(FALSE, nrow(strip_ids))
+  template$layout$aquire <- seq_along(template$grobs)
+  
+  for (i in seq_len(nlevels)) {
+    if (!merge[i]) {
+      next()
+    }
+    ii <- strip_ids[, 2] == i
+    
+    # Figure out what to merge
+    j <- as.numeric(as.factor(vars[, i]))
+    # Start and end positions of every run of equal consecutive values
+    ends <- cumsum(rle(j)$lengths)
+    starts <- c(1, which(diff(j) != 0) + 1)
+    
+    # Figure out what strip to remove
+    seqs <- unlist(Map(seq, from = starts, to = ends))
+    delete_this <- seqs[!(seqs %in% starts)]
+    delete_this <- which(strip_ids[, 1] %in% delete_this & ii)
+    template$layout$delete[delete_this] <- TRUE
+    
+    # Figure out what cells to expand
+    expand <- seqs[seqs %in% starts]
+    expand <- which(strip_ids[, 1] %in% expand & ii)
+    expand_where <- seqs[seqs %in% ends]
+    expand_where <- which(strip_ids[, 1] %in% expand_where & ii)
+    template$layout$aquire[expand] <- template$layout$aquire[expand_where]
+  }
+  
+  # Do expansion: the first strip of a run takes the right/bottom edge of the run's last strip
+  if (orient == "x") {
+    template$layout$r <- template$layout$r[template$layout$aquire]
+  } else {
+    template$layout$b <- template$layout$b[template$layout$aquire]
+  }
+  
+  # Do deletion
+  template$grobs  <- template$grobs[!template$layout$delete]
+  strip_ids <- strip_ids[!template$layout$delete,]
+  template$layout <- template$layout[!template$layout$delete,]
+  
+  # Add nesting indicator
+  if (params$nest_line) {
+    active <- unit(c(0, 1), "npc") + c(1, -1) * params$resect
+    passive <- if (switch) c(1, 1) else c(0, 0)
+    nindi <- element_render(
+      theme, "ggh4x.facet.nestline",
+      x = switch(orient, x = active,  y = passive),
+      y = switch(orient, x = passive, y = active)
+    )
+    i <- which(with(template$layout, t != b | l != r))  # only strips spanning more than one cell
+    offset <- switch(
+      orient,
+      x = vapply(template$grobs, function(grob){grob$layout$t}, numeric(1)),
+      y = vapply(template$grobs, function(grob){grob$layout$l}, numeric(1))
+    )
+    offset <- if (where %in% c("r", "b")) offset else nlevels - offset
+    template$grobs[i] <- lapply(template$grobs[i], function(grb) {
+      grb <- with(grb$layout, gtable_add_grob(
+        grb, nindi, t = t, l = l, r = r, b = b,
+        z = z,
+        name = "nester",
+        clip = "off"
+      ))
+    })
+    template$layout$z <- template$layout$z + offset
+  }
+  
+  # Delete old strips
+  panel_table <- gtable::gtable_filter(panel_table, paste0("strip-", where),
+                                       fixed = TRUE, trim = FALSE, invert = TRUE)
+  
+  # Place back new strips, shifting template positions back to panel_table coordinates
+  panel_table <- with(template$layout, gtable::gtable_add_grob(
+    panel_table,
+    template$grobs,
+    t = t - 1 + strp_rows[1],
+    l = l - 1 + strp_cols[1],
+    b = b - 1 + strp_rows[1],
+    r = r - 1 + strp_cols[1],
+    z = z, clip = clip, name = name
+  ))
+  panel_table
+}
\ No newline at end of file
diff --git a/CohortDiagnosticsBreastCancer/R/Plots.R b/CohortDiagnosticsBreastCancer/R/Plots.R
new file mode 100644
index 00000000..551b2d15
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/R/Plots.R
@@ -0,0 +1,553 @@
+plotTimeDistribution <- function(data, 
+                                 cohortIds = NULL,
+                                 databaseIds = NULL,
+                                 xAxis = "database") {
+  # Draws box plots from pre-computed summary columns (Min, P25, Median, P75, Max),
+  # faceted by Database + shortName (rows) and TimeMeasure (columns), and returns
+  # them wrapped by ggiraph::girafe(). Anything other than xAxis = "database"
+  # with non-NULL cohortIds and databaseIds warns and returns NULL.
+  unsupported <- is.null(cohortIds) || xAxis != "database" || is.null(databaseIds)
+  if (unsupported) {
+    warning("Not yet supported. Upcoming feature.")
+    return(NULL)
+  }
+  
+  # Collect every input problem first, then report them together
+  checks <- checkmate::makeAssertCollection()
+  checkmate::assertTibble(x = data, 
+                          any.missing = FALSE, min.rows = 1, min.cols = 5,
+                          null.ok = FALSE, add = checks)
+  checkmate::assertDouble(x = cohortIds,
+                          lower = 1, upper = 2^53,
+                          any.missing = FALSE, null.ok = TRUE, min.len = 1,
+                          add = checks)
+  checkmate::assertCharacter(x = databaseIds,
+                             any.missing = FALSE, null.ok = TRUE, min.len = 1, unique = TRUE,
+                             add = checks)
+  checkmate::assertChoice(x = xAxis, choices = c("database", "cohortId"),
+                          add = checks)
+  checkmate::assertNames(x = colnames(data), 
+                         must.include = c("Min", "P25", "Median", "P75", "Max"),
+                         add = checks)
+  checkmate::reportAssertions(collection = checks)
+  
+  # cohortIds and databaseIds are never NULL past the guard, so both filters apply
+  boxData <- data %>% 
+    dplyr::filter(.data$cohortId %in% !!cohortIds) %>% 
+    dplyr::filter(.data$Database %in% !!databaseIds)
+  
+  # Text passed to the boxes through the `tooltip` aesthetic
+  boxData$tooltip <- paste0(boxData$shortName, " : ", boxData$cohortName,
+                            "\nDatabase = ", boxData$Database, 
+                            "\nMin = ", boxData$Min,
+                            "\nMax = ", boxData$Max,
+                            "\nP25 = ", boxData$P25,
+                            "\nMedian = ", boxData$Median,
+                            "\nP75 = ", boxData$P75,
+                            "\nTime Measure = ", boxData$TimeMeasure,
+                            "\nAverage = ", boxData$Average)
+  
+  # Plot-level aesthetics, added to the plot before the layers
+  boxMapping <- ggplot2::aes(x = .data$Database,
+                             ymin = .data$Min,
+                             lower = .data$P25,
+                             middle = .data$Median,
+                             upper = .data$P75,
+                             ymax = .data$Max,
+                             group = .data$TimeMeasure,
+                             average = .data$Average)
+  whiskers <- ggplot2::geom_errorbar(mapping = ggplot2::aes(ymin = .data$Min, 
+                                                            ymax = .data$Max),
+                                     size = 0.5)
+  # stat = "identity": box statistics are taken from the mapped columns as they are
+  boxes <- ggiraph::geom_boxplot_interactive(ggplot2::aes(tooltip = tooltip),
+                                             stat = "identity", 
+                                             fill = rgb(0, 0, 0.8, alpha = 0.25), 
+                                             size = 0.2)
+  # Theme: blank y grid lines and y-axis title/ticks/text; right strip text at angle 0
+  flatTheme <- ggplot2::theme(panel.grid.major.y = ggplot2::element_blank(),
+                              panel.grid.minor.y = ggplot2::element_blank(),
+                              axis.title.y = ggplot2::element_blank(),
+                              axis.ticks.y = ggplot2::element_blank(),
+                              axis.text.y = ggplot2::element_blank(),
+                              strip.text.y.right = ggplot2::element_text(angle = 0))
+  
+  staticPlot <- ggplot2::ggplot(data = boxData) +
+    boxMapping +
+    whiskers +
+    boxes +
+    ggplot2::facet_grid(Database+shortName~TimeMeasure, scales = "free") +
+    ggplot2::coord_flip() +
+    flatTheme
+  
+  # SVG height grows with the number of requested databases
+  ggiraph::girafe(ggobj = staticPlot,
+                  options = list(
+                    ggiraph::opts_sizing(width = .7),
+                    ggiraph::opts_zoom(max = 5)),
+                  width_svg = 12,
+                  height_svg = 0.7 + 0.5 * length(databaseIds))
+}  
+# How to render using pure plotly. Plotly does not prefer precomputed data.
+# TO DO: color and plot positions are not consistent yet.
+# plot <- plotly::plot_ly(data = plotData,
+#                         type = "box",
+#                         median = plotData$P25,
+#                         #Mean = plotData$Average,
+#                         upperfence = plotData$Max,
+#                         lowerfence = plotData$Min,
+#                         split = plotData$TimeMeasure)
+# loop thru database or cohorts as needed
+# then subplot
+# plot <- plotly::subplot(plots,nrows = length(input$databases),margin = 0.05)
+
+
+plotIncidenceRate <- function(data,
+                              cohortIds = NULL,
+                              databaseIds = NULL,
+                              stratifyByAgeGroup = TRUE,
+                              stratifyByGender = TRUE,
+                              stratifyByCalendarYear = TRUE,
+                              yscaleFixed = FALSE) {
+  if (nrow(data) == 0) {
+    ParallelLogger::logWarn("Record counts are too low to plot.")
+  }
+  errorMessage <- checkmate::makeAssertCollection()
+  checkmate::assertTibble(x = data, 
+                          any.missing = TRUE,
+                          min.rows = 1,
+                          min.cols = 5,
+                          null.ok = FALSE,
+                          add = errorMessage)
+  checkmate::assertDouble(x = cohortIds,
+                          lower = 1,
+                          upper = 2^53,
+                          any.missing = FALSE,
+                          null.ok = TRUE, 
+                          min.len = 1,
+                          add = errorMessage)
+  checkmate::assertCharacter(x = databaseIds,
+                             any.missing = FALSE,
+                             null.ok = TRUE, 
+                             min.len = 1, 
+                             unique = TRUE,
+                             add = errorMessage)
+  checkmate::assertLogical(x = stratifyByAgeGroup, 
+                           any.missing = FALSE, 
+                           min.len = 1, 
+                           max.len = 1,
+                           null.ok = FALSE,
+                           add = errorMessage)
+  checkmate::assertLogical(x = stratifyByGender, 
+                           any.missing = FALSE, 
+                           min.len = 1,  
+                           max.len = 1,
+                           null.ok = FALSE,
+                           add = errorMessage)
+  checkmate::assertLogical(x = stratifyByCalendarYear, 
+                           any.missing = FALSE, 
+                           min.len = 1,  
+                           max.len = 1,
+                           null.ok = FALSE,
+                           add = errorMessage)
+  checkmate::assertLogical(x = yscaleFixed, 
+                           any.missing = FALSE, 
+                           min.len = 1,  
+                           max.len = 1,
+                           null.ok = FALSE,
+                           add = errorMessage)
+  checkmate::assertDouble(x = data$incidenceRate,
+                          lower = 0,
+                          any.missing = FALSE,
+                          null.ok = FALSE, 
+                          min.len = 1,
+                          add = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  checkmate::assertDouble(x = data$incidenceRate,
+                          lower = 0,
+                          any.missing = FALSE,
+                          null.ok = FALSE, 
+                          min.len = 1,
+                          add = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  
+  plotData <- data %>% 
+    dplyr::mutate(incidenceRate = round(.data$incidenceRate, digits = 3))
+  if (!is.null(cohortIds)) {
+    plotData <- plotData %>% 
+      dplyr::filter(.data$cohortId %in% !!cohortIds)
+  }
+  if (!is.null(databaseIds)) {
+    plotData <- plotData %>% 
+      dplyr::filter(.data$databaseId %in% !!databaseIds)
+  }
+  plotData <- plotData %>% 
+    dplyr::mutate(strataGender = !is.na(.data$gender),
+                  strataAgeGroup = !is.na(.data$ageGroup),
+                  strataCalendarYear = !is.na(.data$calendarYear)) %>% 
+    dplyr::filter(.data$strataGender %in% !!stratifyByGender &
+                    .data$strataAgeGroup %in% !!stratifyByAgeGroup &
+                    .data$strataCalendarYear %in% !!stratifyByCalendarYear) %>% 
+    dplyr::select(-dplyr::starts_with("strata"))
+  
+  aesthetics <- list(y = "incidenceRate")
+  if (stratifyByCalendarYear) {
+    aesthetics$x <- "calendarYear"
+    xLabel <- "Calender year"
+    showX <- TRUE
+    if (stratifyByGender) {
+      aesthetics$group <- "gender"
+      aesthetics$color <- "gender"
+    }
+    plotType <- "line"
+  } else {
+    xLabel <- ""
+    if (stratifyByGender) {
+      aesthetics$x <- "gender"
+      aesthetics$color <- "gender"
+      aesthetics$fill <- "gender"
+      showX <- TRUE
+    } else if (stratifyByAgeGroup) {
+      aesthetics$x <- "ageGroup"
+      showX <- TRUE
+    }
+    else{
+      aesthetics$x <- "cohortId"
+      showX <- FALSE
+    }
+    plotType <- "bar"
+  }
+  
+  newSort <- plotData %>% 
+    dplyr::select(.data$ageGroup) %>% 
+    dplyr::distinct() %>% 
+    dplyr::arrange(as.integer(sub(pattern = '-.+$','',x = .data$ageGroup)))
+  
+  plotData <- plotData %>% 
+    dplyr::arrange(ageGroup = factor(.data$ageGroup, levels = newSort$ageGroup), .data$ageGroup)
+  
+  plotData$ageGroup <- factor(plotData$ageGroup,
+                              levels = newSort$ageGroup)
+  plotData$tooltip <- c(paste0(plotData$shortName, ":", plotData$cohortName,"\n","Incidence Rate = ", scales::comma(plotData$incidenceRate, accuracy = 0.01), 
+                               "\nDatabase = ", plotData$databaseId, 
+                               "\nPerson years = ", scales::comma(plotData$personYears, accuracy = 0.1), 
+                               "\nCohort count = ", scales::comma(plotData$cohortCount)))
+  
+  if (stratifyByAgeGroup) {
+    plotData$tooltip <- c(paste0(plotData$tooltip, "\nAge Group = ", plotData$ageGroup))
+  }
+  
+  if (stratifyByGender) {
+    plotData$tooltip <- c(paste0(plotData$tooltip, "\nGender = ", plotData$gender))
+  }
+  
+  if (stratifyByCalendarYear) {
+    plotData$tooltip <- c(paste0(plotData$tooltip, "\nYear = ", plotData$calendarYear))
+  }
+  
+  
+  plot <- ggplot2::ggplot(data = plotData, 
+                          do.call(ggplot2::aes_string, aesthetics)) +
+    ggplot2::xlab(xLabel) +
+    ggplot2::ylab("Incidence Rate (/1,000 person years)") +
+    ggplot2::theme(legend.position = "top",
+                   legend.title = ggplot2::element_blank(),
+                   axis.text.x = if (showX) ggplot2::element_text(angle = 90, vjust = 0.5) else ggplot2::element_blank() )
+  
+  if (plotType == "line") {
+    plot <- plot + 
+      ggiraph::geom_line_interactive(ggplot2::aes(), size = 1, alpha = 0.6) +
+      ggiraph::geom_point_interactive(ggplot2::aes(tooltip = tooltip), size = 2, alpha = 0.6)
+  } else {
+    plot <- plot + ggplot2::geom_bar(stat = "identity") +
+      ggiraph::geom_col_interactive( ggplot2::aes(tooltip = tooltip), size = 1)
+  }
+  
+  # databaseId field only present when called in Shiny app:
+  if (!is.null(data$databaseId) && length(data$databaseId) > 1) {
+    if (yscaleFixed) {
+      scales <- "fixed"
+    } else {
+      scales <- "free_y"
+    }
+    if (stratifyByGender | stratifyByCalendarYear) {
+      if (stratifyByAgeGroup) {
+        plot <- plot + facet_nested(databaseId + shortName ~ plotData$ageGroup, scales = scales)
+      } else {
+        plot <- plot + facet_nested(databaseId + shortName ~ ., scales = scales) 
+      }
+    } else {
+      plot <- plot + facet_nested(databaseId + shortName ~., scales = scales) 
+    }
+    spacing <- rep(c(1, rep(0.5, length(unique(plotData$shortName)) - 1)), length(unique(plotData$databaseId)))[-1]
+    plot <- plot + ggplot2::theme(panel.spacing.y = ggplot2::unit(spacing, "lines"),
+                                  strip.background = ggplot2::element_blank())
+  } else {
+    if (stratifyByAgeGroup) {
+      plot <- plot + ggplot2::facet_grid(~ageGroup) 
+    }
+  }
+  plot <- ggiraph::girafe(ggobj = plot,
+                          options = list(
+                            ggiraph::opts_sizing(width = .7),
+                            ggiraph::opts_zoom(max = 5)),
+                          width_svg = 15,
+                          height_svg = 1.5 + 2*length(unique(data$databaseId)))
+  return(plot)
+}
+
+# Build an interactive (ggiraph) scatter plot of covariate means: mean1 on the
+# x axis, mean2 on the y axis, one point per covariate, coloured by a domain
+# derived from the covariate name. Panels are laid out by target cohort (rows)
+# and database + comparator cohort (columns).
+#
+# balance:         data frame providing the columns referenced below
+#                  (covariateName, mean1, mean2, stdDiff, databaseId,
+#                  targetCohortShortName, comparatorCohortShortName).
+# domain:          "all", or a single domain name to restrict the plot to.
+# targetLabel,
+# comparatorLabel: accepted but not referenced in the body.
+#
+# Returns the girafe widget.
+plotCohortComparisonStandardizedDifference <- function(balance, 
+                                                       domain = "all",
+                                                       targetLabel = "Mean Target",
+                                                       comparatorLabel = "Mean Comparator") {
+  knownDomains <- c("condition", "device", "drug", "measurement", "observation", "procedure")
+  domainLevels <- c(knownDomains, "other")
+  
+  # The domain is the first run of lower-case letters in the covariate name;
+  # anything outside the known list (including no match) is pooled as "other".
+  covariateDomain <- tolower(stringr::str_extract(balance$covariateName, "[a-z]+"))
+  covariateDomain[!covariateDomain %in% knownDomains] <- "other"
+  balance$domain <- covariateDomain
+  
+  if (domain != "all") {
+    balance <- dplyr::filter(balance, .data$domain == !!domain)
+  }
+  
+  # More than 1000 dots cannot be read anyway, so drop covariates whose mean is
+  # small in both the target and the comparator.
+  if (nrow(balance) > 1000) {
+    balance <- dplyr::filter(balance, .data$mean1 > 0.01 | .data$mean2 > 0.01)
+  }
+  
+  balance$tooltip <- paste("Covariate Name:", balance$covariateName,
+                           "\nDomain: ", balance$domain,
+                           "\nMean Target: ", scales::comma(balance$mean1, accuracy = 0.1),
+                           "\nMean Comparator:", scales::comma(balance$mean2, accuracy = 0.1),
+                           "\nStd diff.:", scales::comma(balance$stdDiff, accuracy = 0.1))
+  
+  # Fixed palette, one entry per level (originally generated with
+  # RColorBrewer "Dark2", plus grey for "other"). It is subset to the domains
+  # actually present so a domain keeps its colour whichever others are shown.
+  palette <- c("#1B9E77", "#D95F02", "#7570B3", "#E7298A", "#66A61E", "#E6AB02", "#444444")
+  palette <- palette[domainLevels %in% balance$domain]
+  balance$domain <- factor(balance$domain, levels = domainLevels)
+  
+  pointMapping <- ggplot2::aes(x = .data$mean1, y = .data$mean2, color = .data$domain)
+  scatter <- ggplot2::ggplot(balance, pointMapping) +
+    ggiraph::geom_point_interactive(ggplot2::aes(tooltip = .data$tooltip), size = 3,shape = 16, alpha = 0.5) +
+    ggplot2::geom_abline(slope = 1, intercept = 0, linetype = "dashed") +
+    ggplot2::geom_hline(yintercept = 0) +
+    ggplot2::geom_vline(xintercept = 0) +
+    ggplot2::scale_x_continuous("MEAN") +
+    ggplot2::scale_y_continuous("MEAN") +
+    ggplot2::scale_color_manual("Domain", values = palette) +
+    ggplot2::facet_grid(targetCohortShortName ~ databaseId + comparatorCohortShortName)
+  
+  widgetOptions <- list(ggiraph::opts_sizing(width = .7),
+                        ggiraph::opts_zoom(max = 5))
+  return(ggiraph::girafe(ggobj = scatter,
+                         options = widgetOptions,
+                         width_svg = 12,
+                         height_svg = 5))
+}
+
+
+# Draw a pairwise Venn diagram of the overlap between a target and a
+# comparator cohort and return the grob list produced by VennDiagram.
+#
+# data:                tibble with at least 5 columns and no missing values;
+#                      eitherSubjects, tOnlySubjects, cOnlySubjects and
+#                      bothSubjects are read (absolute values are used).
+# targetCohortIds,
+# comparatorCohortIds: doubles in [1, 2^53]; validated only.
+# databaseIds:         character vector or NULL; validated only.
+#
+# Side effect: the diagram is drawn on the current graphics device.
+# All validation failures are collected and reported together.
+plotCohortOverlapVennDiagram <- function(data,
+                                         targetCohortIds, 
+                                         comparatorCohortIds,
+                                         databaseIds) {
+  
+  # Perform error checks for input variables
+  errorMessage <- checkmate::makeAssertCollection()
+  checkmate::assertTibble(x = data, 
+                          any.missing = FALSE,
+                          min.rows = 1,
+                          min.cols = 5,
+                          null.ok = FALSE,
+                          add = errorMessage)
+  checkmate::assertDouble(x = targetCohortIds,
+                          lower = 1,
+                          upper = 2^53, 
+                          any.missing = FALSE,
+                          null.ok = FALSE,
+                          add = errorMessage)
+  checkmate::assertDouble(x = comparatorCohortIds,
+                          lower = 1,
+                          upper = 2^53, 
+                          any.missing = FALSE,
+                          null.ok = FALSE,
+                          add = errorMessage)
+  checkmate::assertCharacter(x = databaseIds,
+                             any.missing = FALSE,
+                             min.len = 1,
+                             null.ok = TRUE,
+                             add = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  
+  # Set sizes are derived from the union: |A| = either - (B only).
+  plot <- VennDiagram::draw.pairwise.venn(area1 = abs(data$eitherSubjects) - abs(data$cOnlySubjects),
+                                          area2 = abs(data$eitherSubjects) - abs(data$tOnlySubjects),
+                                          cross.area = abs(data$bothSubjects),
+                                          category = c("Target", "Comparator"),
+                                          col = c(rgb(0.8, 0, 0), rgb(0, 0, 0.8)),
+                                          fill = c(rgb(0.8, 0, 0), rgb(0, 0, 0.8)),
+                                          alpha = 0.2,
+                                          fontfamily = rep("sans", 3),
+                                          cat.fontfamily = rep("sans", 2),
+                                          margin = 0.01,
+                                          ind = FALSE)
+  # Borrowed from https://stackoverflow.com/questions/37239128/how-to-put-comma-in-large-number-of-venndiagram
+  # Re-format the first three text grobs (the counts) with thousands separators.
+  idx <- vapply(plot, function(grob) grepl("text", grob$name), logical(1))
+  for (i in seq_len(min(3L, sum(idx)))) {
+    plot[idx][[i]]$label <- format(as.numeric(plot[idx][[i]]$label),
+                                   big.mark = ",",
+                                   scientific = FALSE)
+  }
+  grid::grid.draw(plot)
+  
+  return(plot)
+}
+
+# Interactive stacked bar chart of cohort overlap.
+#
+# For every database / target / comparator combination the subjects are split
+# into "target only", "both" and "comparator only". Bars are drawn per
+# comparator, faceted by database (rows) and target (columns).
+#
+# data:  tibble without missing values holding the columns listed in the
+#        name check below. Negative counts are shown as "<" followed by the
+#        absolute value.
+# yAxis: "Percentages" stacks to 100% (position "fill"); any other value
+#        stacks raw counts.
+#
+# Returns the girafe widget. Fails with a checkmate error if `data` is not a
+# suitable tibble or lacks a column the plot needs.
+plotCohortOverlap <- function(data,
+                              yAxis = "Percentages") {
+  
+  # Perform error checks for input variables
+  errorMessage <- checkmate::makeAssertCollection()
+  checkmate::assertTibble(x = data, 
+                          any.missing = FALSE,
+                          min.rows = 1,
+                          min.cols = 6,
+                          null.ok = FALSE,
+                          add = errorMessage)
+  # Report immediately so the column check only runs on a valid tibble.
+  checkmate::reportAssertions(collection = errorMessage)
+  # Every column read further down is listed, so a missing one fails here
+  # with a clear message instead of inside the dplyr pipeline.
+  checkmate::assertNames(x = colnames(data), 
+                         must.include = c("databaseId",
+                                          "targetCohortId",
+                                          "comparatorCohortId",
+                                          "tOnlySubjects",
+                                          "cOnlySubjects",
+                                          "bothSubjects",
+                                          "eitherSubjects",
+                                          "targetShortName",
+                                          "comparatorShortName",
+                                          "targetCohortName",
+                                          "comparatorCohortName"),
+                         add = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  
+  # Format a count as "<n> (<p>%)" where p is its share of the union; both
+  # parts get a "<" prefix when the stored count is negative.
+  describeCount <- function(count, total) {
+    prefix <- dplyr::case_when(count < 0 ~ '<', TRUE ~ '')
+    paste0(prefix,
+           scales::comma(abs(count)),
+           " (",
+           prefix,
+           scales::percent(abs(count) / abs(total), accuracy = 1),
+           ")")
+  }
+  
+  plotData <- data %>% 
+    dplyr::mutate(absTOnlySubjects = abs(.data$tOnlySubjects), 
+                  absCOnlySubjects = abs(.data$cOnlySubjects),
+                  absBothSubjects = abs(.data$bothSubjects),
+                  tOnlyString = describeCount(.data$tOnlySubjects, .data$eitherSubjects),
+                  cOnlyString = describeCount(.data$cOnlySubjects, .data$eitherSubjects),
+                  bothString = describeCount(.data$bothSubjects, .data$eitherSubjects)) %>% 
+    dplyr::mutate(tooltip = paste0("Database: ", .data$databaseId,
+                                   "\n", .data$targetShortName, ": ", .data$targetCohortName,
+                                   "\n", .data$comparatorShortName, ": ", .data$comparatorCohortName,
+                                   "\n", .data$targetShortName, " only: ", .data$tOnlyString,
+                                   "\n", .data$comparatorShortName, " only: ", .data$cOnlyString,
+                                   "\nBoth: ", .data$bothString)) %>%
+    dplyr::select("targetShortName",
+                  "comparatorShortName",
+                  "databaseId",
+                  "absTOnlySubjects",
+                  "absCOnlySubjects",
+                  "absBothSubjects",
+                  "tooltip") %>% 
+    tidyr::pivot_longer(cols = c("absTOnlySubjects", 
+                                 "absCOnlySubjects",
+                                 "absBothSubjects"),
+                        names_to = "subjectsIn",
+                        values_to = "value") %>%
+    dplyr::mutate(subjectsIn = camelCaseToTitleCase(stringr::str_replace_all(string = .data$subjectsIn,
+                                                                             pattern = "abs|Subjects",
+                                                                             replacement = "")))
+  
+  # The leading blank in each level comes from camelCaseToTitleCase, which puts
+  # a space in front of every capital letter.
+  plotData$subjectsIn <- factor(plotData$subjectsIn, levels = c(" T Only", " Both", " C Only"))
+  showPercentages <- yAxis == "Percentages"
+  position <- if (showPercentages) "fill" else "stack"
+  
+  plot <- ggplot2::ggplot(data = plotData) +
+    ggplot2::aes(fill = .data$subjectsIn, 
+                 y = .data$value,
+                 x = .data$comparatorShortName,
+                 tooltip = .data$tooltip,
+                 group = .data$subjectsIn) +
+    ggplot2::ylab(label = "") +
+    ggplot2::xlab(label = "") +
+    ggplot2::scale_fill_manual("Subjects in", values = c(rgb(0.8, 0.2, 0.2), rgb(0.3, 0.2, 0.4), rgb(0.4, 0.4, 0.9))) +
+    ggplot2::facet_grid(.data$databaseId ~ .data$targetShortName, drop = FALSE) +
+    ggiraph::geom_bar_interactive(position = position, alpha = 0.6, stat = "identity") 
+  if (showPercentages) {
+    plot <- plot + ggplot2::scale_y_continuous(labels = scales::percent)
+  } else {
+    plot <- plot + ggplot2::scale_y_continuous(labels = scales::comma)
+  }
+  # NOTE(review): databases are facet rows and targets facet columns, yet the
+  # width grows with the database count and the height with the target count.
+  # Kept as is; confirm this is the intended aspect ratio.
+  width <- 1.5 + 1*length(unique(plotData$databaseId))
+  height <- 1.5 + 1*length(unique(plotData$targetShortName))
+  aspectRatio <- width / height
+  plot <- ggiraph::girafe(ggobj = plot,
+                          options = list(
+                            ggiraph::opts_sizing(width = .7),
+                            ggiraph::opts_zoom(max = 5)), 
+                          width_svg = 6 * aspectRatio,
+                          height_svg = 6)
+  
+  return(plot)
+}
+# Future function getCohortOverlapHistogram:
+# 1. https://stackoverflow.com/questions/20184096/how-to-plot-multiple-stacked-histograms-together-in-r
+# 2. https://stackoverflow.com/questions/43415709/how-to-use-facet-grid-with-geom-histogram
+# 3. https://www.datacamp.com/community/tutorials/facets-ggplot-r?utm_source=adwords_ppc&utm_campaignid=1455363063&utm_adgroupid=65083631748&utm_device=c&utm_keyword=&utm_matchtype=b&utm_network=g&utm_adpostion=&utm_creative=332602034361&utm_targetid=dsa-429603003980&utm_loc_interest_ms=&utm_loc_physical_ms=1007768&gclid=CjwKCAjw19z6BRAYEiwAmo64LQMUJwf1i0V-Zgc5hYhpDOFQeZU05reAJmQvo2-mClFWWM4_sJiSmBoC-YkQAvD_BwE
+# 4. https://stackoverflow.com/questions/24123499/frequency-histograms-with-facets-calculating-percent-by-groups-used-in-facet-i
+# 5. https://stackoverflow.com/questions/62821480/add-a-trace-to-every-facet-of-a-plotly-figure
+
+# ComparatorOnlySubjs <- generateHistogramValues(len = seq(1:nrow(data)), val = data$cOnlySubjects)
+# bothSubjs <- generateHistogramValues(seq(1:nrow(data)), data$bothSubjects)
+# cohortOnlySubjs <- generateHistogramValues(seq(1:nrow(data)), data$tOnlySubjects)
+# bucket <- list(ComparatorOnlySubjs = ComparatorOnlySubjs, bothSubjs = bothSubjs, cohortOnlySubjs = cohortOnlySubjs)
+# 
+# 
+# p <- ggplot2::ggplot(reshape::melt(bucket), ggplot2::aes(value, fill = L1)) +
+#   ggplot2::xlab(label = "Comparators") +
+#   ggplot2::geom_histogram(position = "stack", binwidth = 1) +
+#   ggplot2::xlim(c(0,max(length(comparatorCohortIds()),10))) +
+#   ggplot2::facet_grid(rows = ggplot2::vars(data$targetCohortId), 
+#   cols = ggplot2::vars(data$databaseId), scales = "free_y")
+# plot <- plotly::ggplotly(p)
+# GENERATE HISTOGRAM FUNCTION
+# generateHistogramValues <- function(len,val)
+# {
+#   fillVal <- c()
+#   
+#   inc <- 1
+#   for (i in len)
+#   {
+#     fillVal <- c(fillVal,rep(i,val[[i]]))
+#   }
+#   return(fillVal);
+# }
+
diff --git a/CohortDiagnosticsBreastCancer/R/Results.R b/CohortDiagnosticsBreastCancer/R/Results.R
new file mode 100644
index 00000000..a93a425f
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/R/Results.R
@@ -0,0 +1,645 @@
+# Bundle a database connection and schema names into a data-source list.
+#
+# connection:               connection (or pool) stored as `connection`.
+# resultsDatabaseSchema:    schema holding the results tables.
+# vocabularyDatabaseSchema: schema holding the vocabulary tables; defaults to
+#                           the results schema.
+#
+# Returns list(connection, resultsDatabaseSchema, vocabularyDatabaseSchema).
+createDatabaseDataSource <- function(connection, resultsDatabaseSchema, vocabularyDatabaseSchema = resultsDatabaseSchema) {
+  # Store the argument itself; the previous code read a global `connectionPool`
+  # and silently ignored whatever the caller passed in.
+  return(list(connection = connection,
+              resultsDatabaseSchema = resultsDatabaseSchema,
+              vocabularyDatabaseSchema = vocabularyDatabaseSchema))
+}
+
+# Load the objects saved in `premergedDataFile` into `envir` (a fresh
+# environment unless one is supplied) and return that environment.
+createFileDataSource <- function(premergedDataFile, envir = new.env()) {
+  targetEnvironment <- envir
+  load(file = premergedDataFile, envir = targetEnvironment)
+  targetEnvironment
+}
+
+
+# Render parameterised SQL, translate it and run it as a query.
+#
+# For a "Pool" connection the SQL is rendered with SqlRender, translated to
+# PostgreSQL and executed with dbGetQuery; on failure the translated SQL is
+# printed before the error is re-raised. Any other connection is delegated to
+# DatabaseConnector::renderTranslateQuerySql.
+#
+# ...:                  parameter values substituted into `sql`.
+# snakeCaseToCamelCase: if TRUE, result column names are converted.
+renderTranslateQuerySql <- function(connection, sql, ..., snakeCaseToCamelCase = FALSE) {
+  if (!is(connection, "Pool")) {
+    return(DatabaseConnector::renderTranslateQuerySql(connection = connection,
+                                                      sql = sql,
+                                                      ...,
+                                                      snakeCaseToCamelCase = snakeCaseToCamelCase))
+  }
+  
+  # Connection pool is used by Shiny app, which always uses PostgreSQL:
+  renderedSql <- SqlRender::render(sql, ...)
+  translatedSql <- SqlRender::translate(renderedSql, targetDialect = "postgresql")
+  
+  queryResult <- tryCatch(
+    DatabaseConnector::dbGetQuery(connection, translatedSql),
+    error = function(err) {
+      writeLines(translatedSql)
+      stop(err)
+    })
+  if (snakeCaseToCamelCase) {
+    colnames(queryResult) <- SqlRender::snakeCaseToCamelCase(colnames(queryResult))
+  }
+  return(queryResult)
+}
+
+# Turn a vector into a comma-separated list of single-quoted SQL literals,
+# e.g. c("a", "b") -> "'a', 'b'". NULL yields the empty string.
+# Single quotes inside a value are doubled so the literal stays well-formed
+# (and cannot terminate the string early) once spliced into a query.
+quoteLiterals <- function(x) {
+  if (is.null(x)) {
+    return("")
+  }
+  escaped <- gsub("'", "''", x, fixed = TRUE)
+  return(paste0("'", paste(escaped, collapse = "', '"), "'"))
+}
+
+# Return cohort-count rows for the given databases, optionally limited to
+# `cohortIds` (NULL means no cohort restriction in the environment branch).
+#
+# dataSource is either an environment containing a `cohortCount` table or a
+# list with `connection` and `resultsDatabaseSchema`, in which case the
+# cohort_count table is queried and returned as a tibble.
+getCohortCountResult <- function(dataSource = .GlobalEnv,
+                                 cohortIds = NULL,
+                                 databaseIds) {
+  if (!is(dataSource, "environment")) {
+    query <- "SELECT *
+            FROM  @results_database_schema.cohort_count
+            WHERE database_id in (@database_id)
+            {@cohort_ids != ''} ? {  AND cohort_id in (@cohort_ids)}
+            ;"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = query,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           cohort_ids = cohortIds,
+                                           database_id = quoteLiterals(databaseIds), 
+                                           snakeCaseToCamelCase = TRUE)
+    return(tidyr::tibble(queryResult))
+  }
+  
+  counts <- dplyr::filter(get("cohortCount", envir = dataSource),
+                          .data$databaseId %in% !!databaseIds)
+  if (!is.null(cohortIds)) {
+    counts <- dplyr::filter(counts, .data$cohortId %in% !!cohortIds)
+  }
+  return(counts)
+}
+
+# Return time-distribution rows for the given cohorts and databases, with
+# display-friendly column names.
+#
+# dataSource is either an environment containing a `timeDistribution` table or
+# a list with `connection` and `resultsDatabaseSchema`. Rows are joined with
+# the `cohort` table found in the enclosing scope to attach the cohort name and
+# a short name ("C1", "C2", ... numbered in cohort-name order). The statistic
+# columns are renamed (Database, TimeMeasure, Average, SD, Min, P10, P25,
+# Median, P75, P90, Max) and the result is ordered by cohortId, Database and
+# TimeMeasure, with those three columns first.
+getTimeDistributionResult <- function(dataSource = .GlobalEnv,
+                                      cohortIds,
+                                      databaseIds) {
+  if (!is(dataSource, "environment")) {
+    query <-   "SELECT *
+              FROM  @results_database_schema.time_distribution
+              WHERE cohort_id in (@cohort_ids)
+            	AND database_id in (@database_ids);"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = query,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           cohort_ids = cohortIds,
+                                           database_ids = quoteLiterals(databaseIds), 
+                                           snakeCaseToCamelCase = TRUE)
+    distribution <- tidyr::tibble(queryResult)
+  } else {
+    distribution <- dplyr::filter(get("timeDistribution", envir = dataSource),
+                                  .data$cohortId %in% !!cohortIds &
+                                    .data$databaseId %in% !!databaseIds)
+  }
+  
+  # One short label per cohort present in the result.
+  cohortLabels <- dplyr::inner_join(distribution, cohort)
+  cohortLabels <- dplyr::distinct(cohortLabels, .data$cohortId, .data$cohortName)
+  cohortLabels <- dplyr::arrange(cohortLabels, .data$cohortName)
+  cohortLabels <- dplyr::mutate(cohortLabels, shortName = paste0('C', dplyr::row_number()))
+  
+  labelled <- dplyr::inner_join(distribution, cohortLabels, by = "cohortId")
+  
+  renamed <- dplyr::rename(labelled,
+                           Database = "databaseId",
+                           TimeMeasure = "timeMetric", 
+                           Average = "averageValue", 
+                           SD = "standardDeviation", 
+                           Min = "minValue", 
+                           P10 = "p10Value", 
+                           P25 = "p25Value", 
+                           Median = "medianValue", 
+                           P75 = "p75Value", 
+                           P90 = "p90Value", 
+                           Max = "maxValue")
+  renamed <- dplyr::relocate(renamed, .data$cohortId, .data$Database, .data$TimeMeasure)
+  return(dplyr::arrange(renamed, .data$cohortId, .data$Database, .data$TimeMeasure))
+}
+
+
+# Retrieve incidence-rate rows for the requested cohorts and databases.
+#
+# dataSource is either an environment containing an `incidenceRate` table or a
+# list with `connection` and `resultsDatabaseSchema` (queried through
+# renderTranslateQuerySql).
+#
+# Each stratifyBy* argument is a logical vector of length 1 or 2:
+#   TRUE           keep only rows stratified by that variable,
+#   FALSE          keep only rows not stratified by it,
+#   c(TRUE, FALSE) keep both (the default).
+# Both branches now honour this; the SQL branch used to treat the two-element
+# form as FALSE.
+#
+# Only rows with more than `minPersonYears` person-years are returned. Rows
+# are joined with the `cohort` table found in the enclosing scope to attach
+# the cohort name and a short name ("C1", "C2", ... in cohort-name order).
+# `calendarYear` is converted to integer and the result is ordered by cohortId
+# and databaseId.
+getIncidenceRateResult <- function(dataSource = .GlobalEnv,
+                                   cohortIds,
+                                   databaseIds,
+                                   stratifyByGender = c(TRUE,FALSE),
+                                   stratifyByAgeGroup = c(TRUE,FALSE),
+                                   stratifyByCalendarYear = c(TRUE,FALSE),
+                                   minPersonYears = 1000) {
+  # Perform error checks for input variables
+  errorMessage <- checkmate::makeAssertCollection()
+  errorMessage <- checkErrorCohortIdsDatabaseIds(cohortIds = cohortIds,
+                                                 databaseIds = databaseIds,
+                                                 errorMessage = errorMessage)
+  checkmate::assertLogical(x = stratifyByGender,
+                           add = errorMessage,
+                           min.len = 1,
+                           max.len = 2,
+                           unique = TRUE)
+  checkmate::assertLogical(x = stratifyByAgeGroup,
+                           add = errorMessage,
+                           min.len = 1,
+                           max.len = 2,
+                           unique = TRUE)
+  checkmate::assertLogical(x = stratifyByCalendarYear,
+                           add = errorMessage,
+                           min.len = 1,
+                           max.len = 2,
+                           unique = TRUE)
+  checkmate::reportAssertions(collection = errorMessage)
+  
+  if (is(dataSource, "environment")) {
+    # A row counts as stratified by a variable when that column is not NA.
+    data <- get("incidenceRate", envir = dataSource) %>% 
+      dplyr::mutate(strataGender = !is.na(.data$gender),
+                    strataAgeGroup = !is.na(.data$ageGroup),
+                    strataCalendarYear = !is.na(.data$calendarYear)) %>% 
+      dplyr::filter(.data$cohortId %in% !!cohortIds &
+                      .data$databaseId %in% !!databaseIds &
+                      .data$strataGender %in% !!stratifyByGender &
+                      .data$strataAgeGroup %in% !!stratifyByAgeGroup &
+                      .data$strataCalendarYear %in% !!stratifyByCalendarYear &
+                      .data$personYears > !!minPersonYears) %>% 
+      dplyr::select(-tidyselect::starts_with('strata'))
+  } else {
+    # Collapse a stratification request to the token tested in the SQL
+    # template: "TRUE"/"FALSE" add a filter, "BOTH" adds none. This mirrors
+    # `%in%` in the environment branch, where c(TRUE, FALSE) matches every row.
+    strataToken <- function(flag) {
+      if (all(c(TRUE, FALSE) %in% flag)) {
+        "BOTH"
+      } else if (isTRUE(flag)) {
+        "TRUE"
+      } else {
+        "FALSE"
+      }
+    }
+    # In the database an unstratified row stores '' in the strata column.
+    sql <- "SELECT *
+            FROM  @results_database_schema.incidence_rate
+            WHERE cohort_id in (@cohort_ids)
+              AND database_id in (@database_ids)
+            {@gender == TRUE} ? {  AND gender != ''}
+            {@gender == FALSE} ? {  AND gender = ''}
+            {@age_group == TRUE} ? {  AND age_group != ''}
+            {@age_group == FALSE} ? {  AND age_group = ''}
+            {@calendar_year == TRUE} ? {  AND calendar_year != ''}
+            {@calendar_year == FALSE} ? {  AND calendar_year = ''}
+              AND person_years > @personYears;"
+    data <- renderTranslateQuerySql(connection = dataSource$connection,
+                                    sql = sql,
+                                    results_database_schema = dataSource$resultsDatabaseSchema,
+                                    cohort_ids = cohortIds,
+                                    database_ids = quoteLiterals(databaseIds),
+                                    gender = strataToken(stratifyByGender),
+                                    age_group = strataToken(stratifyByAgeGroup),
+                                    calendar_year = strataToken(stratifyByCalendarYear),
+                                    personYears = minPersonYears,
+                                    snakeCaseToCamelCase = TRUE) %>% 
+      tidyr::tibble()
+    # Align with the environment branch, which marks "not stratified" with NA.
+    data <- data %>%
+      dplyr::mutate(gender = dplyr::na_if(.data$gender, ""),
+                    ageGroup = dplyr::na_if(.data$ageGroup, ""),
+                    calendarYear = dplyr::na_if(.data$calendarYear, ""))
+  }
+  shortNames <- data %>%
+    dplyr::inner_join(cohort) %>% 
+    dplyr::distinct(.data$cohortId, .data$cohortName) %>%
+    dplyr::arrange(.data$cohortName) %>%
+    dplyr::mutate(shortName = paste0('C', dplyr::row_number()))
+  
+  data <- data %>% 
+    dplyr::inner_join(shortNames, by = "cohortId")
+  
+  return(data %>% 
+           dplyr::mutate(calendarYear = as.integer(.data$calendarYear)) %>%
+           dplyr::arrange(.data$cohortId, .data$databaseId))
+}
+
+# Return inclusion-rule statistics for the given databases, optionally
+# limited to `cohortIds` (NULL means no cohort restriction in the environment
+# branch).
+#
+# dataSource is either an environment containing an `inclusionRuleStats` table
+# or a list with `connection` and `resultsDatabaseSchema`. The result keeps
+# ruleSequenceId, ruleName, meetSubjects, gainSubjects, remainSubjects,
+# totalSubjects and databaseId, ordered by ruleSequenceId.
+getInclusionRuleStats <- function(dataSource = .GlobalEnv,
+                                  cohortIds = NULL,
+                                  databaseIds) {
+  if (!is(dataSource, "environment")) {
+    query <- "SELECT *
+    FROM  @resultsDatabaseSchema.inclusion_rule_stats
+    WHERE database_id in (@database_id)
+    {@cohort_ids != ''} ? {  AND cohort_id in (@cohort_ids)}
+    ;"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = query,
+                                           resultsDatabaseSchema = dataSource$resultsDatabaseSchema,
+                                           cohort_ids = cohortIds,
+                                           database_id = quoteLiterals(databaseIds), 
+                                           snakeCaseToCamelCase = TRUE)
+    ruleStats <- tidyr::tibble(queryResult)
+  } else {
+    ruleStats <- dplyr::filter(get("inclusionRuleStats", envir = dataSource),
+                               .data$databaseId %in% !!databaseIds)
+    if (!is.null(cohortIds)) {
+      ruleStats <- dplyr::filter(ruleStats, .data$cohortId %in% !!cohortIds)
+    }
+  }
+  
+  ruleStats <- dplyr::select(ruleStats,
+                             .data$ruleSequenceId, .data$ruleName, 
+                             .data$meetSubjects, .data$gainSubjects, 
+                             .data$remainSubjects, .data$totalSubjects, .data$databaseId)
+  return(dplyr::arrange(ruleStats, .data$ruleSequenceId))
+}
+
+
+# Return index-event-breakdown rows for the given cohorts and databases, each
+# with the name of its concept attached.
+#
+# Inputs are first validated with checkErrorCohortIdsDatabaseIds. dataSource is
+# either an environment containing `indexEventBreakdown` and `concept` tables
+# or a list with `connection`, `resultsDatabaseSchema` and
+# `vocabularyDatabaseSchema`. Rows without a matching concept are dropped
+# (inner join) in both branches.
+getIndexEventBreakdown <- function(dataSource = .GlobalEnv,
+                                   cohortIds,
+                                   databaseIds) {
+  errorMessage <- checkmate::makeAssertCollection()
+  errorMessage <- checkErrorCohortIdsDatabaseIds(cohortIds = cohortIds,
+                                                 databaseIds = databaseIds,
+                                                 errorMessage = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  
+  if (!is(dataSource, "environment")) {
+    query <- "SELECT index_event_breakdown.*,
+              standard_concept.concept_name AS concept_name
+            FROM  @results_database_schema.index_event_breakdown
+            INNER JOIN  @vocabulary_database_schema.concept standard_concept
+              ON index_event_breakdown.concept_id = standard_concept.concept_id
+            WHERE database_id in (@database_id)
+              AND cohort_id in (@cohort_ids);"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = query,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           vocabulary_database_schema = dataSource$vocabularyDatabaseSchema,
+                                           cohort_ids = cohortIds,
+                                           database_id = quoteLiterals(databaseIds), 
+                                           snakeCaseToCamelCase = TRUE)
+    return(tidyr::tibble(queryResult))
+  }
+  
+  breakdown <- dplyr::filter(get("indexEventBreakdown", envir = dataSource),
+                             .data$databaseId %in% !!databaseIds)
+  if (!is.null(cohortIds)) {
+    breakdown <- dplyr::filter(breakdown, .data$cohortId %in% !!cohortIds)
+  }
+  conceptNames <- dplyr::select(get("concept", envir = dataSource),
+                                .data$conceptId,
+                                .data$conceptName)
+  return(dplyr::inner_join(breakdown, conceptNames, by = c("conceptId")))
+}
+
+# Return visit-context rows for the given cohorts and databases, each with the
+# name of its visit concept attached as visitConceptName.
+#
+# Inputs are first validated with checkErrorCohortIdsDatabaseIds. dataSource is
+# either an environment containing `visitContext` and `concept` tables or a
+# list with `connection`, `resultsDatabaseSchema` and
+# `vocabularyDatabaseSchema`. Rows without a matching concept are dropped
+# (inner join) in both branches.
+getVisitContextResults <- function(dataSource = .GlobalEnv,
+                                   cohortIds,
+                                   databaseIds) {
+  errorMessage <- checkmate::makeAssertCollection()
+  errorMessage <- checkErrorCohortIdsDatabaseIds(cohortIds = cohortIds,
+                                                 databaseIds = databaseIds,
+                                                 errorMessage = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  
+  if (!is(dataSource, "environment")) {
+    query <- "SELECT visit_context.*,
+              standard_concept.concept_name AS visit_concept_name
+            FROM  @results_database_schema.visit_context
+            INNER JOIN  @vocabulary_database_schema.concept standard_concept
+              ON visit_context.visit_concept_id = standard_concept.concept_id
+            WHERE database_id in (@database_id)
+              AND cohort_id in (@cohort_ids);"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = query,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           vocabulary_database_schema = dataSource$vocabularyDatabaseSchema,
+                                           cohort_ids = cohortIds,
+                                           database_id = quoteLiterals(databaseIds), 
+                                           snakeCaseToCamelCase = TRUE)
+    return(tidyr::tibble(queryResult))
+  }
+  
+  visits <- dplyr::filter(get("visitContext", envir = dataSource),
+                          .data$databaseId %in% !!databaseIds)
+  if (!is.null(cohortIds)) {
+    visits <- dplyr::filter(visits, .data$cohortId %in% !!cohortIds)
+  }
+  # Rename the concept columns so the join key matches visitConceptId.
+  visitConcepts <- dplyr::select(get("concept", envir = dataSource),
+                                 visitConceptId = .data$conceptId,
+                                 visitConceptName = .data$conceptName)
+  return(dplyr::inner_join(visits, visitConcepts, by = c("visitConceptId")))
+}
+
+# Retrieve the included source concepts of one cohort for the given databases,
+# annotated with the concept set name and with the names/vocabularies of both
+# the source concept and the standard concept.
+#
+# Args:
+#   dataSource:  Either an environment that holds the result tables
+#                ("includedSourceConcept", "conceptSets", "concept") or a
+#                database data source with `connection`,
+#                `resultsDatabaseSchema` and `vocabularyDatabaseSchema`.
+#   cohortId:    The single cohort id to report on.
+#   databaseIds: Database ids to keep.
+#
+# Returns:
+#   The matching included-source-concept rows with the lookup columns added.
+getIncludedConceptResult <- function(dataSource = .GlobalEnv,
+                                     cohortId,
+                                     databaseIds) {
+  if (!is(dataSource, "environment")) {
+    # Database-backed source: all joins are done in SQL.
+    sql <- "SELECT included_source_concept.*,
+              concept_set_name,
+              source_concept.concept_name AS source_concept_name,
+              source_concept.vocabulary_id AS source_vocabulary_id,
+              source_concept.concept_code AS source_concept_code,
+              standard_concept.concept_name AS concept_name,
+              standard_concept.vocabulary_id AS vocabulary_id
+            FROM  @results_database_schema.included_source_concept
+            INNER JOIN  @results_database_schema.concept_sets
+              ON included_source_concept.cohort_id = concept_sets.cohort_id
+                AND included_source_concept.concept_set_id = concept_sets.concept_set_id
+            INNER JOIN  @vocabulary_database_schema.concept source_concept
+              ON included_source_concept.source_concept_id = source_concept.concept_id
+            INNER JOIN  @vocabulary_database_schema.concept standard_concept
+              ON included_source_concept.concept_id = standard_concept.concept_id
+            WHERE included_source_concept.cohort_id = @cohort_id
+             AND database_id in (@database_ids);"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = sql,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           vocabulary_database_schema = dataSource$vocabularyDatabaseSchema,
+                                           cohort_id = cohortId,
+                                           database_ids = quoteLiterals(databaseIds),
+                                           snakeCaseToCamelCase = TRUE)
+    return(tidyr::tibble(queryResult))
+  }
+
+  # In-memory source: filter first, then attach the three lookups in turn.
+  included <- dplyr::filter(get("includedSourceConcept", envir = dataSource),
+                            .data$cohortId == !!cohortId &
+                              .data$databaseId %in% !!databaseIds)
+
+  conceptSetNames <- dplyr::select(get("conceptSets", envir = dataSource),
+                                   .data$cohortId,
+                                   .data$conceptSetId,
+                                   .data$conceptSetName)
+  included <- dplyr::inner_join(included,
+                                conceptSetNames,
+                                by = c("cohortId", "conceptSetId"))
+
+  conceptTable <- get("concept", envir = dataSource)
+  sourceConcepts <- dplyr::select(conceptTable,
+                                  sourceConceptId = .data$conceptId,
+                                  sourceConceptName = .data$conceptName,
+                                  sourceVocabularyId = .data$vocabularyId,
+                                  sourceConceptCode = .data$conceptCode)
+  included <- dplyr::inner_join(included, sourceConcepts, by = c("sourceConceptId"))
+
+  standardConcepts <- dplyr::select(conceptTable,
+                                    .data$conceptId,
+                                    .data$conceptName,
+                                    .data$vocabularyId)
+  return(dplyr::inner_join(included, standardConcepts, by = c("conceptId")))
+}
+
+# Retrieve the orphan concepts of one cohort for the given databases,
+# annotated with the concept set name and the concept's name, vocabulary and
+# code.
+#
+# Args:
+#   dataSource:  Either an environment that holds the result tables
+#                ("orphanConcept", "conceptSets", "concept") or a database
+#                data source with `connection`, `resultsDatabaseSchema` and
+#                `vocabularyDatabaseSchema`.
+#   cohortId:    The single cohort id to report on.
+#   databaseIds: Database ids to keep.
+#
+# Returns:
+#   The matching orphan-concept rows with the lookup columns added.
+getOrphanConceptResult <- function(dataSource = .GlobalEnv,
+                                   cohortId,
+                                   databaseIds) {
+  if (!is(dataSource, "environment")) {
+    # Database-backed source: all joins are done in SQL.
+    sql <- "SELECT orphan_concept.*,
+              concept_set_name,
+              standard_concept.concept_name AS concept_name,
+              standard_concept.vocabulary_id AS vocabulary_id,
+              standard_concept.concept_code AS concept_code
+            FROM  @results_database_schema.orphan_concept
+            INNER JOIN  @results_database_schema.concept_sets
+              ON orphan_concept.cohort_id = concept_sets.cohort_id
+                AND orphan_concept.concept_set_id = concept_sets.concept_set_id
+            INNER JOIN  @vocabulary_database_schema.concept standard_concept
+              ON orphan_concept.concept_id = standard_concept.concept_id
+            WHERE orphan_concept.cohort_id = @cohort_id
+             AND database_id in (@database_ids);"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = sql,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           vocabulary_database_schema = dataSource$vocabularyDatabaseSchema,
+                                           cohort_id = cohortId,
+                                           database_ids = quoteLiterals(databaseIds),
+                                           snakeCaseToCamelCase = TRUE)
+    return(tidyr::tibble(queryResult))
+  }
+
+  # In-memory source: filter first, then attach the two lookups in turn.
+  orphans <- dplyr::filter(get("orphanConcept", envir = dataSource),
+                           .data$cohortId == !!cohortId &
+                             .data$databaseId %in% !!databaseIds)
+
+  conceptSetNames <- dplyr::select(get("conceptSets", envir = dataSource),
+                                   .data$cohortId,
+                                   .data$conceptSetId,
+                                   .data$conceptSetName)
+  orphans <- dplyr::inner_join(orphans,
+                               conceptSetNames,
+                               by = c("cohortId", "conceptSetId"))
+
+  conceptDetails <- dplyr::select(get("concept", envir = dataSource),
+                                  .data$conceptId,
+                                  .data$conceptName,
+                                  .data$vocabularyId,
+                                  .data$conceptCode)
+  return(dplyr::inner_join(orphans, conceptDetails, by = c("conceptId")))
+}
+
+
+# Retrieve cohort-overlap results for every requested target/comparator pair
+# in the given databases, with cohort names and short display labels added.
+#
+# Args:
+#   dataSource:          Either an environment that holds the result tables
+#                        ("cohortOverlap", "cohort") or a database data source
+#                        with `connection` and `resultsDatabaseSchema`.
+#   targetCohortIds:     Cohort ids to keep on the target side.
+#   comparatorCohortIds: Cohort ids to keep on the comparator side.
+#   databaseIds:         Character vector of database ids to keep.
+#
+# Returns:
+#   The overlap rows with targetCohortName, comparatorCohortName,
+#   targetShortName and comparatorShortName added. Short names are 'C1',
+#   'C2', ... numbered by alphabetical cohort name, independently for the
+#   target and the comparator side. An empty tibble when nothing matches.
+getCohortOverlapResult <- function(dataSource = .GlobalEnv,
+                                   targetCohortIds,
+                                   comparatorCohortIds,
+                                   databaseIds) {
+  # Both id vectors go through the same validator, sharing one collection.
+  assertions <- checkmate::makeAssertCollection()
+  assertions <- checkErrorCohortIdsDatabaseIds(errorMessage = assertions,
+                                               cohortIds = targetCohortIds,
+                                               databaseIds = databaseIds)
+  assertions <- checkErrorCohortIdsDatabaseIds(errorMessage = assertions,
+                                               cohortIds = comparatorCohortIds,
+                                               databaseIds = databaseIds)
+
+  if (!is(dataSource, "environment")) {
+    sql <-   "SELECT cohort_overlap.*,
+                target_cohort.cohort_name AS target_cohort_name,
+                comparator_cohort.cohort_name AS comparator_cohort_name
+              FROM  @results_database_schema.cohort_overlap
+              INNER JOIN @results_database_schema.cohort target_cohort
+                ON cohort_overlap.target_cohort_id = target_cohort.cohort_id
+              INNER JOIN @results_database_schema.cohort comparator_cohort
+                ON cohort_overlap.comparator_cohort_id = comparator_cohort.cohort_id
+              WHERE target_cohort_id in (@targetCohortId)
+              AND comparator_cohort_id in (@comparatorCohortId)
+            	AND database_id in (@databaseId);"
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = sql,
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           targetCohortId = targetCohortIds,
+                                           comparatorCohortId = comparatorCohortIds,
+                                           databaseId = quoteLiterals(databaseIds),
+                                           snakeCaseToCamelCase = TRUE)
+    data <- tidyr::tibble(queryResult)
+  } else {
+    data <- dplyr::filter(get("cohortOverlap", envir = dataSource),
+                          .data$targetCohortId %in% !!targetCohortIds &
+                            .data$comparatorCohortId %in% !!comparatorCohortIds &
+                            .data$databaseId %in% !!databaseIds)
+    targetNames <- dplyr::select(get("cohort", envir = dataSource),
+                                 targetCohortId = .data$cohortId,
+                                 targetCohortName = .data$cohortName)
+    data <- dplyr::inner_join(data, targetNames, by = "targetCohortId")
+    comparatorNames <- dplyr::select(get("cohort", envir = dataSource),
+                                     comparatorCohortId = .data$cohortId,
+                                     comparatorCohortName = .data$cohortName)
+    data <- dplyr::inner_join(data, comparatorNames, by = "comparatorCohortId")
+  }
+
+  if (nrow(data) == 0) {
+    return(tidyr::tibble())
+  }
+
+  # Short labels: one per distinct cohort, numbered in cohort-name order.
+  targetShortNames <- dplyr::distinct(data, .data$targetCohortId, .data$targetCohortName)
+  targetShortNames <- dplyr::arrange(targetShortNames, .data$targetCohortName)
+  targetShortNames <- dplyr::select(targetShortNames, -.data$targetCohortName)
+  targetShortNames <- dplyr::mutate(targetShortNames,
+                                    targetShortName = paste0('C', dplyr::row_number()))
+
+  comparatorShortNames <- dplyr::distinct(data, .data$comparatorCohortId, .data$comparatorCohortName)
+  comparatorShortNames <- dplyr::arrange(comparatorShortNames, .data$comparatorCohortName)
+  comparatorShortNames <- dplyr::select(comparatorShortNames, -.data$comparatorCohortName)
+  comparatorShortNames <- dplyr::mutate(comparatorShortNames,
+                                        comparatorShortName = paste0('C', dplyr::row_number()))
+
+  data <- dplyr::inner_join(data, targetShortNames, by = "targetCohortId")
+  data <- dplyr::inner_join(data, comparatorShortNames, by = "comparatorCohortId")
+  return(data)
+}
+
+# Retrieve covariate values for the given cohorts and databases, joined to the
+# covariate reference and, for temporal results, to the time reference.
+#
+# Args:
+#   dataSource:  Either an environment that holds the result tables or a
+#                database data source with `connection` and
+#                `resultsDatabaseSchema`.
+#   cohortIds:   Cohort ids to keep.
+#   analysisIds: Optional analysis ids to keep; NULL keeps all analyses.
+#   databaseIds: Character vector of database ids to keep.
+#   timeIds:     Optional time ids to keep (only used when isTemporal is
+#                TRUE); NULL keeps all time windows.
+#   isTemporal:  Single logical; TRUE reads the temporal covariate tables.
+#
+# Returns:
+#   The matching rows with the identifying columns moved to the front, sorted
+#   by cohort, database, (time,) and covariate.
+getCovariateValueResult <- function(dataSource = .GlobalEnv,
+                                    cohortIds,
+                                    analysisIds = NULL,
+                                    databaseIds,
+                                    timeIds = NULL,
+                                    isTemporal = FALSE) {
+
+  # Validate the inputs
+  assertions <- checkmate::makeAssertCollection()
+  checkmate::assertLogical(x = isTemporal,
+                           any.missing = FALSE,
+                           min.len = 1,
+                           max.len = 1,
+                           add = assertions)
+  assertions <- checkErrorCohortIdsDatabaseIds(errorMessage = assertions,
+                                               cohortIds = cohortIds,
+                                               databaseIds = databaseIds)
+  if (isTemporal) {
+    checkmate::assertIntegerish(x = timeIds,
+                                lower = 0,
+                                any.missing = FALSE,
+                                unique = TRUE,
+                                null.ok = TRUE,
+                                add = assertions)
+  }
+  checkmate::reportAssertions(collection = assertions)
+
+  # Temporal and non-temporal results live in differently named tables. An
+  # empty time-reference name switches off the time-related SQL fragments.
+  table <- if (isTemporal) "temporalCovariateValue" else "covariateValue"
+  refTable <- if (isTemporal) "temporalCovariateRef" else "covariateRef"
+  timeRefTable <- if (isTemporal) "temporalTimeRef" else ""
+
+  if (is(dataSource, "environment")) {
+    data <- dplyr::filter(get(table, envir = dataSource),
+                          .data$cohortId %in% !!cohortIds,
+                          .data$databaseId %in% !!databaseIds)
+    data <- dplyr::inner_join(data, get(refTable, envir = dataSource), by = "covariateId")
+    if (!is.null(analysisIds)) {
+      data <- dplyr::filter(data, .data$analysisId %in% analysisIds)
+    }
+    if (isTemporal) {
+      data <- dplyr::inner_join(data, get(timeRefTable, envir = dataSource), by = "timeId")
+      if (!is.null(timeIds)) {
+        data <- dplyr::filter(data, .data$timeId %in% timeIds)
+      }
+    }
+  } else {
+    sql <- "SELECT covariate.*,
+              covariate_name,
+            {@time_ref_table != \"\"} ? {
+              start_day,
+              end_day,
+            }
+              concept_id,
+              analysis_id
+            FROM  @results_database_schema.@table covariate
+            INNER JOIN @results_database_schema.@ref_table covariate_ref
+              ON covariate.covariate_id = covariate_ref.covariate_id
+            {@time_ref_table != \"\"} ? {
+            INNER JOIN @results_database_schema.@time_ref_table time_ref
+              ON covariate.time_id = time_ref.time_id
+            }
+            WHERE cohort_id in (@cohort_ids)
+            {@time_ref_table != \"\" & @time_ids != \"\"} ? {  AND covariate.time_id IN (@time_ids)}
+            {@analysis_ids != \"\"} ? {  AND analysis_id IN (@analysis_ids)}
+            	AND database_id in (@databaseIds);"
+    # The template compares these parameters against "", so a missing filter
+    # is passed as an empty string rather than NULL.
+    timeIdsParameter <- if (is.null(timeIds)) "" else timeIds
+    analysisIdsParameter <- if (is.null(analysisIds)) "" else analysisIds
+    queryResult <- renderTranslateQuerySql(connection = dataSource$connection,
+                                           sql = sql,
+                                           table = SqlRender::camelCaseToSnakeCase(table),
+                                           ref_table = SqlRender::camelCaseToSnakeCase(refTable),
+                                           time_ref_table = SqlRender::camelCaseToSnakeCase(timeRefTable),
+                                           results_database_schema = dataSource$resultsDatabaseSchema,
+                                           cohort_ids = cohortIds,
+                                           analysis_ids = analysisIdsParameter,
+                                           databaseIds = quoteLiterals(databaseIds),
+                                           time_ids = timeIdsParameter,
+                                           snakeCaseToCamelCase = TRUE)
+    data <- tidyr::tibble(queryResult)
+  }
+
+  # Put the identifying columns first and return the rows in a stable order.
+  if (isTemporal) {
+    data <- dplyr::relocate(data,
+                            .data$cohortId,
+                            .data$databaseId,
+                            .data$timeId,
+                            .data$startDay,
+                            .data$endDay,
+                            .data$analysisId,
+                            .data$covariateId,
+                            .data$covariateName)
+    data <- dplyr::arrange(data,
+                           .data$cohortId,
+                           .data$databaseId,
+                           .data$timeId,
+                           .data$covariateId,
+                           .data$covariateName)
+  } else {
+    data <- dplyr::relocate(data,
+                            .data$cohortId,
+                            .data$databaseId,
+                            .data$analysisId,
+                            .data$covariateId,
+                            .data$covariateName)
+    data <- dplyr::arrange(data,
+                           .data$cohortId,
+                           .data$databaseId,
+                           .data$covariateId)
+  }
+  return(data)
+}
+
+# Retrieve valid (non-invalidated) concepts, optionally restricted to a set of
+# concept ids.
+#
+# Args:
+#   dataSource: Either an environment that holds a "concept" table or a
+#               database data source with `connection` and
+#               `resultsDatabaseSchema`.
+#   conceptIds: Integer-like vector of concept ids to keep, or NULL to keep
+#               every valid concept.
+#
+# Returns:
+#   The matching concept rows ordered by conceptId.
+getConceptReference <- function(dataSource = .GlobalEnv,
+                                conceptIds) {
+  # Perform error checks for input variables
+  errorMessage <- checkmate::makeAssertCollection()
+  checkmate::assertIntegerish(x = conceptIds,
+                              min.len = 1,
+                              null.ok = TRUE,
+                              add = errorMessage)
+  checkmate::reportAssertions(collection = errorMessage)
+  if (is(dataSource, "environment")) {
+    # Read the concept table (previously the cohort table, which has no
+    # conceptId column) and keep rows WITHOUT an invalid reason, mirroring
+    # the `invalid_reason IS NULL` condition of the SQL branch.
+    data <- get("concept", envir = dataSource) %>%
+      dplyr::filter(is.na(.data$invalidReason))
+    # NULL means "no restriction", as in the SQL template below.
+    if (!is.null(conceptIds)) {
+      data <- data %>%
+        dplyr::filter(.data$conceptId %in% !!conceptIds)
+    }
+  } else {
+    # NOTE(review): sibling functions read concept from the vocabulary schema;
+    # this query uses the results schema - confirm that is intended.
+    sql <- "SELECT *
+              FROM  @results_database_schema.concept
+              WHERE invalid_reason IS NULL 
+              {@conceptIds == } ? {}:{AND concept_id IN (@conceptIds)};"
+    data <- renderTranslateQuerySql(connection = dataSource$connection,
+                                    sql = sql,
+                                    results_database_schema = dataSource$resultsDatabaseSchema,
+                                    conceptIds = conceptIds,
+                                    snakeCaseToCamelCase = TRUE) %>%
+      tidyr::tibble()
+  }
+  return(data %>% dplyr::arrange(.data$conceptId))
+}
+
+# Shared input validation for the result getters.
+#
+# Args:
+#   errorMessage: A checkmate assert collection to which failures are added.
+#   cohortIds:    Must be a non-NULL double vector without missing values,
+#                 each value between 1 and 2^53.
+#   databaseIds:  Must be a character vector of at least one element, without
+#                 missing values or duplicates.
+#
+# Returns:
+#   The assert collection. Collected failures are reported (raised) here
+#   before returning.
+checkErrorCohortIdsDatabaseIds <- function(errorMessage,
+                                           cohortIds,
+                                           databaseIds) {
+  checkmate::assertDouble(
+    x = cohortIds,
+    lower = 1,
+    upper = 2^53,
+    any.missing = FALSE,
+    null.ok = FALSE,
+    add = errorMessage
+  )
+  checkmate::assertCharacter(
+    x = databaseIds,
+    any.missing = FALSE,
+    min.len = 1,
+    unique = TRUE,
+    add = errorMessage
+  )
+  checkmate::reportAssertions(collection = errorMessage)
+  errorMessage
+}
diff --git a/CohortDiagnosticsBreastCancer/R/Tables.R b/CohortDiagnosticsBreastCancer/R/Tables.R
new file mode 100644
index 00000000..e0b6edb6
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/R/Tables.R
@@ -0,0 +1,141 @@
+library(magrittr)
+
+# Build the "pretty" characteristics table (Table 1) for a single cohort.
+#
+# Args:
+#   covariates: Data frame of covariate values; the columns used here are
+#               covariateName, analysisId, covariateId and mean.
+#   pathToCsv:  Path to the table specification CSV with columns label,
+#               analysisId and covariateIds (a ';'-separated list, or empty
+#               to take every covariate of the analysis).
+#
+# Returns:
+#   A tibble with columns characteristic, value, header, position and
+#   sortOrder: one bold header row per specification that matched at least one
+#   covariate, followed by its indented covariate rows. An empty tibble when
+#   the specification file has no rows or nothing matches.
+prepareTable1 <- function(covariates,
+                          pathToCsv = "Table1Specs.csv") {
+  # Drop everything up to the last ": " and show the rest in sentence case.
+  covariates <- covariates %>%
+    dplyr::mutate(covariateName = stringr::str_to_sentence(stringr::str_replace_all(string = .data$covariateName,
+                                                                                    pattern = "^.*: ",
+                                                                                    replacement = "")))
+  space <- "&nbsp;"
+  # Columns are converted to character before NAs are blanked out: tidyr
+  # >= 1.2.0 casts `replace` to the column type, so replacing NA with '' in a
+  # numeric column such as analysisId would otherwise raise an error.
+  specifications <- readr::read_csv(file = pathToCsv,
+                                    col_types = readr::cols(),
+                                    guess_max = min(1e7)) %>%
+    dplyr::mutate(dplyr::across(tidyr::everything(),
+                                ~tidyr::replace_na(data = as.character(.x), replace = '')))
+
+  resultsTable <- tidyr::tibble()
+
+  if (nrow(specifications) == 0) {
+    return(resultsTable)
+  }
+
+  for (i in seq_len(nrow(specifications))) {
+    specification <- specifications[i,]
+    covariateIdList <- specification %>% dplyr::pull(.data$covariateIds)
+    covariatesSubset <- covariates %>%
+      dplyr::filter(.data$analysisId %in% specification$analysisId)
+    if (covariateIdList != "") {
+      # as.is = TRUE is what type.convert() falls back to anyway; passing it
+      # explicitly avoids the "'as.is' should be specified" warning.
+      selectedIds <- stringr::str_split(string = covariateIdList,
+                                        pattern = ";")[[1]] %>%
+        utils::type.convert(as.is = TRUE)
+      covariatesSubset <- covariatesSubset %>%
+        dplyr::filter(.data$covariateId %in% !!selectedIds)
+    }
+    covariatesSubset <- covariatesSubset %>%
+      dplyr::arrange(.data$covariateId)
+
+    if (nrow(covariatesSubset) > 0) {
+      # Header row (value left empty) followed by the indented covariate rows.
+      resultsTable <- dplyr::bind_rows(resultsTable,
+                                       tidyr::tibble(characteristic = paste0('<strong>',
+                                                                             specification %>% dplyr::pull(.data$label),
+                                                                             '</strong>'),
+                                                     value = NA,
+                                                     header = 1,
+                                                     position = i),
+                                       tidyr::tibble(characteristic = paste0(space,
+                                                                             space,
+                                                                             space,
+                                                                             space,
+                                                                             covariatesSubset$covariateName),
+                                                     value = covariatesSubset$mean,
+                                                     header = 0,
+                                                     position = i)) %>%
+        dplyr::distinct() %>%
+        dplyr::mutate(sortOrder = dplyr::row_number())
+    }
+  }
+  if (nrow(resultsTable) > 0) {
+    # Within each specification the header row comes first.
+    resultsTable <- resultsTable %>%
+      dplyr::arrange(.data$position, dplyr::desc(.data$header), .data$sortOrder)
+  }
+  return(resultsTable)
+}
+
+
+# Build the "pretty" comparison table (Table 1) for two cohorts.
+#
+# Args:
+#   balance:   Data frame comparing two cohorts; the columns used here are
+#              covariateName, analysisId, covariateId, mean1, mean2 and
+#              stdDiff.
+#   pathToCsv: Path to the table specification CSV with columns label,
+#              analysisId and covariateIds (a ';'-separated list, or empty to
+#              take every covariate of the analysis).
+#
+# Returns:
+#   A tibble with columns characteristic, MeanT, MeanC, StdDiff and sortOrder:
+#   one bold header row per specification that matched at least one covariate,
+#   followed by its indented covariate rows. A one-column tibble holding a
+#   note when the specification file has no rows; an empty tibble when no
+#   specification matches.
+prepareTable1Comp <- function(balance,
+                              pathToCsv = "Table1Specs.csv") {
+  # Drop everything up to the last ": " and show the rest in sentence case.
+  balance <- balance %>%
+    dplyr::mutate(covariateName = stringr::str_to_sentence(stringr::str_replace_all(string = .data$covariateName,
+                                                                                    pattern = "^.*: ",
+                                                                                    replacement = "")))
+  space <- "&nbsp;"
+  # Columns are converted to character before NAs are blanked out: tidyr
+  # >= 1.2.0 casts `replace` to the column type, so replacing NA with '' in a
+  # numeric column such as analysisId would otherwise raise an error.
+  specifications <- readr::read_csv(file = pathToCsv,
+                                    col_types = readr::cols(),
+                                    guess_max = min(1e7)) %>%
+    dplyr::mutate(dplyr::across(tidyr::everything(),
+                                ~tidyr::replace_na(data = as.character(.x), replace = '')))
+
+  resultsTable <- tidyr::tibble()
+
+  if (nrow(specifications) == 0) {
+    return(dplyr::tibble(Note = 'There are no covariate records for the cohorts being compared.'))
+  }
+
+  for (i in seq_len(nrow(specifications))) {
+    specification <- specifications[i,]
+    covariateIdList <- specification %>% dplyr::pull(.data$covariateIds)
+    balanceSubset <- balance %>%
+      dplyr::filter(.data$analysisId %in% specification$analysisId)
+    if (covariateIdList != "") {
+      # as.is = TRUE is what type.convert() falls back to anyway; passing it
+      # explicitly avoids the "'as.is' should be specified" warning.
+      selectedIds <- stringr::str_split(string = covariateIdList,
+                                        pattern = ";")[[1]] %>%
+        utils::type.convert(as.is = TRUE)
+      balanceSubset <- balanceSubset %>%
+        dplyr::filter(.data$covariateId %in% !!selectedIds)
+    }
+    balanceSubset <- balanceSubset %>%
+      dplyr::arrange(.data$covariateId)
+
+    if (nrow(balanceSubset) > 0) {
+      # Header row (values left empty) followed by the indented covariate rows.
+      resultsTable <- dplyr::bind_rows(resultsTable,
+                                       tidyr::tibble(characteristic = paste0('<strong>',
+                                                                             specification %>% dplyr::pull(.data$label),
+                                                                             '</strong>'),
+                                                     MeanT = NA,
+                                                     MeanC = NA,
+                                                     StdDiff = NA,
+                                                     header = 1,
+                                                     position = i),
+                                       tidyr::tibble(characteristic = paste0(space,
+                                                                             space,
+                                                                             space,
+                                                                             space,
+                                                                             balanceSubset$covariateName),
+                                                     MeanT = balanceSubset$mean1,
+                                                     MeanC = balanceSubset$mean2,
+                                                     StdDiff = balanceSubset$stdDiff,
+                                                     header = 0,
+                                                     position = i)) %>%
+        dplyr::distinct() %>%
+        dplyr::mutate(sortOrder = dplyr::row_number())
+    }
+  }
+  if (nrow(resultsTable) > 0 ) {
+    # Header row first within each specification; sortOrder is then renumbered
+    # to the final row order and the helper columns are dropped.
+    resultsTable <- resultsTable %>%
+      dplyr::arrange(.data$position, dplyr::desc(.data$header), .data$sortOrder) %>%
+      dplyr::mutate(sortOrder = dplyr::row_number()) %>%
+      dplyr::select(-.data$header, -.data$position)
+  }
+  return(resultsTable)
+}
+
+
+# Combine the characteristics of two cohorts and compute, per covariate, the
+# difference in means divided by sqrt(sd1^2 + sd2^2).
+#
+# Args:
+#   characteristics1, characteristics2: Covariate tables sharing the key
+#     columns covariateId, conceptId, databaseId, covariateName and
+#     analysisId, each with `mean` and `sd` columns.
+#
+# Returns:
+#   The full join of both (de-duplicated) inputs, with non-key columns
+#   suffixed "1"/"2", plus `sd` and `stdDiff`, sorted by decreasing absolute
+#   stdDiff.
+compareCohortCharacteristics <- function(characteristics1, characteristics2) {
+  keyColumns <- c("covariateId", "conceptId", "databaseId", "covariateName", "analysisId")
+  combined <- dplyr::full_join(x = dplyr::distinct(characteristics1),
+                               y = dplyr::distinct(characteristics2),
+                               by = keyColumns,
+                               suffix = c("1", "2"))
+  combined <- dplyr::mutate(combined,
+                            sd = sqrt(.data$sd1^2 + .data$sd2^2),
+                            stdDiff = (.data$mean2 - .data$mean1)/.data$sd)
+  return(dplyr::arrange(combined, -abs(.data$stdDiff)))
+}
diff --git a/CohortDiagnosticsBreastCancer/Table1Specs.csv b/CohortDiagnosticsBreastCancer/Table1Specs.csv
new file mode 100644
index 00000000..6389f2be
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/Table1Specs.csv
@@ -0,0 +1,9 @@
+label,analysisId,covariateIds
+Age group,3,
+Gender: female,1,8532001
+Race,4,
+Ethnicity,5,
+Medical history: General,210,4006969210;438409210;4212540210;255573210;201606210;4182210210;440383210;201820210;318800210;192671210;439727210;432867210;316866210;4104000210;433736210;80180210;255848210;140168210;4030518210;80809210;435783210;4279309210;81893210;81902210;197494210;4134440210
+Medical history: Cardiovascular disease,210,313217210;381591210;317576210;321588210;316139210;4185932210;321052210;440417210;444247210
+Medical history: Neoplasms,210,4044013210;432571210;40481902210;443392210;4112853210;4180790210;443388210;197508210;200962210
+Medication use,410,21601782410;21602796410;21604686410;21604389410;21603932410;21601387410;21602028410;21600960410;21601664410;21601744410;21601461410;21600046410;21603248410;21600712410;21603890410;21601853410;21604254410;21604489410;21604752410
diff --git a/CohortDiagnosticsBreastCancer/data/PreMerged.RData b/CohortDiagnosticsBreastCancer/data/PreMerged.RData
new file mode 100644
index 00000000..31eaeb62
Binary files /dev/null and b/CohortDiagnosticsBreastCancer/data/PreMerged.RData differ
diff --git a/CohortDiagnosticsBreastCancer/global.R b/CohortDiagnosticsBreastCancer/global.R
new file mode 100644
index 00000000..bc66cfca
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/global.R
@@ -0,0 +1,163 @@
+library(magrittr)
+
+source("R/Tables.R")
+source("R/Plots.R")
+source("R/Results.R")
+
+# shinySettings <- list(connectionDetails = DatabaseConnector::createConnectionDetails(dbms = "postgresql",
+#                                              server = "localhost/ohdsi",
+#                                              user = "postgres",
+#                                              password = Sys.getenv("pwPostgres")),
+#                       resultsDatabaseSchema =  "phenotype_library",
+#                       vocabularyDatabaseSchema =  "phenotype_library")
+# shinySettings <- list(dataFolder = "s:/examplePackageOutput")
+
+# Settings when running on server:
+
+# Location of the pre-merged results file used in file-system mode.
+defaultLocalDataFolder <- "data"
+defaultLocalDataFile <- "PreMerged.RData"
+
+# Database defaults are taken from environment variables; Sys.getenv()
+# yields "" for any variable that is not set.
+connectionPool <- NULL
+defaultServer <- Sys.getenv("phenotypeLibraryDbServer")
+defaultDatabase <- Sys.getenv("phenotypeLibraryDbDatabase")
+defaultPort <- Sys.getenv("phenotypeLibraryDbPort")
+defaultUser <- Sys.getenv("phenotypeLibraryDbUser")
+defaultPassword <- Sys.getenv("phenotypeLibraryDbPassword")
+defaultResultsSchema <- Sys.getenv("phenotypeLibraryDbResultsSchema")
+defaultVocabularySchema <- Sys.getenv("phenotypeLibraryDbVocabularySchema")
+
+defaultDatabaseMode <- FALSE # Use file system if FALSE
+
+defaultCohortBaseUrl <- "https://atlas.ohdsi.org/#/cohortdefinition/"
+defaultConceptBaseUrl <- "https://athena.ohdsi.org/search-terms/terms/"
+
+cohortDiagnosticModeDefaultTitle <- "Cohort Diagnostics"
+phenotypeLibraryModeDefaultTitle <- "Phenotype Library"
+
+# Resolve the effective settings: the defaults above, unless the caller has
+# defined a `shinySettings` list before this script runs.
+if (!exists("shinySettings")) {
+  writeLines("Using default settings")
+  # Database mode needs both the switch and a configured server. Both operands
+  # are scalars, so the short-circuiting && is used.
+  databaseMode <- defaultDatabaseMode && defaultServer != ""
+  if (databaseMode) {
+    connectionPool <- pool::dbPool(
+      drv = DatabaseConnector::DatabaseConnectorDriver(),
+      dbms = "postgresql",
+      server = paste(defaultServer, defaultDatabase, sep = "/"),
+      port = defaultPort,
+      user = defaultUser,
+      password = defaultPassword
+    )
+    resultsDatabaseSchema <- defaultResultsSchema
+    vocabularyDatabaseSchema <- defaultVocabularySchema
+  } else {
+    dataFolder <- defaultLocalDataFolder
+  }
+  cohortBaseUrl <- defaultCohortBaseUrl
+  # Fixed: this used to be set to the cohort base URL.
+  conceptBaseUrl <- defaultConceptBaseUrl
+} else {
+  writeLines("Using settings provided by user")
+  # Supplying connection details selects database mode.
+  databaseMode <- !is.null(shinySettings$connectionDetails)
+  if (databaseMode) {
+    connectionDetails <- shinySettings$connectionDetails
+    if (is(connectionDetails$server, "function")) {
+      # Here the connection details fields are functions and must be called.
+      connectionPool <- pool::dbPool(drv = DatabaseConnector::DatabaseConnectorDriver(),
+                                     dbms = "postgresql",
+                                     server = connectionDetails$server(),
+                                     port = connectionDetails$port(),
+                                     user = connectionDetails$user(),
+                                     password = connectionDetails$password(),
+                                     connectionString = connectionDetails$connectionString())
+    } else {
+      # For backwards compatibility with older versions of DatabaseConnector:
+      connectionPool <- pool::dbPool(drv = DatabaseConnector::DatabaseConnectorDriver(),
+                                     dbms = "postgresql",
+                                     server = connectionDetails$server,
+                                     port = connectionDetails$port,
+                                     user = connectionDetails$user,
+                                     password = connectionDetails$password,
+                                     connectionString = connectionDetails$connectionString)
+    }
+    resultsDatabaseSchema <- shinySettings$resultsDatabaseSchema
+    vocabularyDatabaseSchema <- shinySettings$vocabularyDatabaseSchema
+  } else {
+    dataFolder <- shinySettings$dataFolder
+  }
+  cohortBaseUrl <- shinySettings$cohortBaseUrl
+  # Fixed: this used to copy the cohort base URL. The default concept URL is
+  # used when the caller gives none.
+  # NOTE(review): assumes callers pass the concept URL as
+  # shinySettings$conceptBaseUrl - confirm against the launcher.
+  conceptBaseUrl <- shinySettings$conceptBaseUrl
+  if (is.null(conceptBaseUrl)) {
+    conceptBaseUrl <- defaultConceptBaseUrl
+  }
+}
+
+# Load the results data, either from the database or from the pre-merged
+# local file, and derive the objects that depend on it.
+
+# The data model specification lists every results table by (snake_case) name.
+dataModelSpecifications <- read.csv("resultsDataModelSpecification.csv")
+# Cleaning up any tables in memory:
+# (rm() warns about names that do not exist, hence the suppressWarnings)
+suppressWarnings(rm(list = SqlRender::snakeCaseToCamelCase(dataModelSpecifications$tableName)))
+
+if (databaseMode) {
+  
+  # Close the connection pool on shutdown.
+  # NOTE(review): onStop is presumably shiny::onStop - confirm shiny is
+  # attached when this script runs.
+  onStop(function() {
+    if (DBI::dbIsValid(connectionPool)) {
+      writeLines("Closing database pool")
+      pool::poolClose(connectionPool)
+    }
+  })
+  
+  # Lower-cased names of the tables present in the results schema.
+  resultsTablesOnServer <- tolower(DatabaseConnector::dbListTables(connectionPool, schema = resultsDatabaseSchema))
+  
+  # Read one results table completely and, when it has rows, store it in the
+  # global environment as a tibble under its camelCase name.
+  #   tableName: snake_case table name in the results schema.
+  #   required:  when TRUE the read is attempted even if the table was not
+  #              listed on the server, so a missing table raises an error.
+  loadResultsTable <- function(tableName, required = FALSE) {
+    if (required || tableName %in% resultsTablesOnServer) {
+      tryCatch({
+        table <- DatabaseConnector::dbReadTable(connectionPool, 
+                                                paste(resultsDatabaseSchema, tableName, sep = "."))
+      }, error = function(err) {
+        stop("Error reading from ", paste(resultsDatabaseSchema, tableName, sep = "."), ": ", err$message)
+      })
+      colnames(table) <- SqlRender::snakeCaseToCamelCase(colnames(table))
+      if (nrow(table) > 0) {
+        assign(SqlRender::snakeCaseToCamelCase(tableName), dplyr::as_tibble(table), envir = .GlobalEnv)
+      }
+    }
+  }
+  
+  # These tables are loaded into memory in full.
+  loadResultsTable("database", required = TRUE)
+  loadResultsTable("cohort", required = TRUE)
+  loadResultsTable("phenotype_description")
+  loadResultsTable("temporal_time_ref")
+  loadResultsTable("concept_sets")
+  
+  # Create empty objects in memory for all other tables. This is used by the Shiny app to decide what tabs to show:
+  # isEmpty() returns TRUE when the given results table has no rows.
+  isEmpty <- function(tableName) {
+    sql <- sprintf("SELECT 1 FROM %s.%s LIMIT 1;", resultsDatabaseSchema, tableName)
+    oneRow <- DatabaseConnector::dbGetQuery(connectionPool, sql)
+    return(nrow(oneRow) == 0)
+  }
+  
+  # A placeholder (empty tibble) is created only for tables that exist on the
+  # server, were not loaded above, and contain at least one row.
+  for (table in dataModelSpecifications$tableName) {
+    if (table %in% resultsTablesOnServer && 
+        !exists(SqlRender::snakeCaseToCamelCase(table)) &&
+        !isEmpty(table)) {
+      assign(SqlRender::snakeCaseToCamelCase(table), dplyr::tibble())
+    }
+  }
+
+  dataSource <- createDatabaseDataSource(connection = connectionPool,
+                                         resultsDatabaseSchema = resultsDatabaseSchema,
+                                         vocabularyDatabaseSchema = vocabularyDatabaseSchema)
+} else {
+  # File-system mode: the pre-merged results file must exist.
+  localDataPath <- file.path(dataFolder, defaultLocalDataFile)
+  if (!file.exists(localDataPath)) {
+    stop(sprintf("Local data file %s does not exist.", localDataPath))
+  }
+  dataSource <- createFileDataSource(localDataPath, envir = .GlobalEnv)
+} 
+
+# Labels for the temporal time windows, limited to the five lowest time ids.
+if (exists("temporalTimeRef")) {
+  temporalCovariateChoices <- temporalTimeRef %>%
+    dplyr::mutate(choices = paste0("Start ", .data$startDay, " to end ", .data$endDay)) %>%
+    dplyr::select(.data$timeId, .data$choices) %>% 
+    dplyr::arrange(.data$timeId) %>% 
+    dplyr::slice_head(n = 5)
+}
+
+# Analysis ids listed in the Table 1 specification file.
+if (exists("covariateRef")) {
+  specifications <- readr::read_csv(file = "Table1Specs.csv", 
+                                    col_types = readr::cols(),
+                                    guess_max = min(1e7))
+  prettyAnalysisIds <- specifications$analysisId
+}
diff --git a/CohortDiagnosticsBreastCancer/html/cohortCharacterization.html b/CohortDiagnosticsBreastCancer/html/cohortCharacterization.html
new file mode 100644
index 00000000..9f6ef077
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/cohortCharacterization.html
@@ -0,0 +1,16 @@
+<h3>Description</h3>
+<p>A table showing cohort characteristics (covariates). These characteristics are captured on or before the cohort start date. There is a Pretty and a Raw version of this table.</p>
+<p>The Pretty table shows the standard OHDSI characteristics table, which includes only covariates that were manually selected to provide a general overview of the comorbidities and medications of the cohort. These are all binary covariates, and the table shows the proportion (%) of the cohort entries having the covariate.</p>
+<p>The Raw table shows all captured covariates. These include binary and continuous covariates (e.g. the Charlson comorbidity index). For each covariate the table lists the mean, which for binary covariates is equal to the proportion, and the standard deviation (SD).</p>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see cohort characteristics from different databases side-by-side in the same table.</p>
+<p>Select the cohort to explore in the side bar.</p>
+<p>Select either the Pretty or the Raw table at the top of the table.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are the characteristics of the cohort as expected? For example, do people have the expected comorbidities?</li>
+<li>Do the characteristics of the cohort differ much per database?</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/cohortCounts.html b/CohortDiagnosticsBreastCancer/html/cohortCounts.html
new file mode 100644
index 00000000..684a6dd6
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/cohortCounts.html
@@ -0,0 +1,12 @@
+<h3>Description</h3>
+<p>A table showing the number of cohort entries and unique persons per cohort per database. Because one person can have more than one cohort entry, the number of entries can be higher than the number of persons.</p>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see counts from different databases side-by-side.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are there cohorts that are empty in some databases?</li>
+<li>Are the relative counts (relative to the other cohorts in the same database) comparable across databases? Note that the color bars show the relative counts.</li>
+<li>Are the cohorts of expected and sufficient size? For example, if we want to study the effect of an exposure, a rule-of-thumb is that we require at least 2,500 in the exposure cohort.</li>
+</ul>
\ No newline at end of file
diff --git a/CohortDiagnosticsBreastCancer/html/cohortOverlap.html b/CohortDiagnosticsBreastCancer/html/cohortOverlap.html
new file mode 100644
index 00000000..419eaa62
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/cohortOverlap.html
@@ -0,0 +1,27 @@
+<h3>Description</h3>
+<p>Stacked bar graph showing the overlap between two cohorts, and a table listing several overlap statistics.</p>
+
+<p>The stacked bar shows the overlap in terms of subjects. It shows the number of subjects that belong to each cohort and to both. The diagram does <em>not</em> consider whether the subjects were in the different cohorts at the same time.</p>
+<p>The table shows the same information and more:
+<ul>
+<li>Subject in either cohort: The number of subjects that enter one or both cohorts. (The union)</li>
+<li>Subject in both cohort: The number of subjects that enter both cohorts, although not necessarily at the same time. (The intersection)</li>
+<li>Subject in target not in comparator: The number of subjects that enter the target cohort, but not the comparator cohort. (Subtracting the comparator from the target)</li>
+<li>Subject in comparator not in target: The number of subjects that enter the comparator cohort, but not the target cohort. (Subtracting the target from the comparator)</li>
+<li>Subject in target before comparator: The number of subjects that enter both cohorts, but enter the target cohort before entering the comparator cohort. This number considers only the first entry per cohort per person.</li>
+<li>Subject in comparator before target: The number of subjects that enter both cohorts, but enter the comparator cohort before entering the target cohort. This number considers only the first entry per cohort per person.</li>
+<li>Subject in target and comparator on same day: The number of subjects that enter both cohorts on the same date. This number considers only the first entry per cohort per person.</li>
+<li>Subject having target start during comparator: The number of subjects that enter the target cohort during the comparator cohort, meaning comparator cohort start date &lt;= target cohort start date &lt;= comparator cohort end date. This number considers only the first entry per cohort per person.</li>
+<li>Subject having comparator start during target: The number of subjects that enter the comparator cohort during the target cohort, meaning target cohort start date &lt;= comparator cohort start date &lt;= target cohort end date. This number considers only the first entry per cohort per person.</li>
+</ul></p>
+
+<h3>Options</h3>
+<p>You can select one or more databases in the side bar.</p>
+<p>You can select the (target) cohort(s) and comparator cohort(s) in the side bar.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are there many people in both cohorts? For example, if we want to compare two exposures, are there many people that receive both?</li>
+<li>Is the overlap of sufficient size for a specific research question? For example, if we wish to study the effect of an exposure on an outcome, we may require a minimum number of outcomes during exposure.</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/compareCohortCharacterization.html b/CohortDiagnosticsBreastCancer/html/compareCohortCharacterization.html
new file mode 100644
index 00000000..04cd56e7
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/compareCohortCharacterization.html
@@ -0,0 +1,18 @@
+<h3>Description</h3>
+<p>A table or plot showing cohort characteristics (covariates) for two cohorts side-by-side. These characteristics are captured on or before the cohort start date. There is a Pretty and a Raw version of the table.</p>
+<p>The Pretty table shows the standard OHDSI characteristics table, which includes only covariates that were manually selected to provide a general overview of the comorbidities and medications of the cohort. These are all binary covariates, and the table shows the proportion (%) of the cohort entries having the covariate, as well as the standardized difference of the mean (StdDiff).</p>
+<p>The Raw table shows all captured covariates. These include binary and continuous covariates (e.g. the Charlson comorbidity index). For each covariate the table lists the mean, which for binary covariates is equal to the proportion, the standard deviation (SD), and the standardized difference of the mean (StdDiff).</p>
+<p>The plot shows all covariates, including binary and continuous covariates. The x-axis represents the mean value in the target cohort, the y-axis the mean value in the comparator cohort. Each dot represents a covariate, and the color indicates the absolute value of the standardized difference of the mean.</p>
+
+<h3>Options</h3>
+<p>You can select a database in the side bar.</p>
+<p>Select the cohort to explore in the side bar.</p>
+<p>Select either the Pretty, the Raw table, or the plot at the top of the screen.</p>
+<p>In the plot, you can move the mouse pointer over a dot to see information on that covariate.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are there major differences between the two cohorts? For example, if we wish to compute a propensity score between two cohorts, concepts that have very high proportion in one cohort and a very low proportion in the other may lead to a perfectly predictive model.</li>
+<li>In general, how comparable are two cohorts? If we wish to compare two exposures, but the cohorts differ over many characteristics, we may be able to fit a propensity model and compute an estimate, but we may have concerns over the generalizability of the results.</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/incidenceRate.html b/CohortDiagnosticsBreastCancer/html/incidenceRate.html
new file mode 100644
index 00000000..8fa811e8
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/incidenceRate.html
@@ -0,0 +1,23 @@
+<h3>Description</h3>
+<p>A graph showing the incidence rate, optionally stratified by age (in 10-year bins), gender, and calendar year.</p>
+
+<p>The incidence rate is computed as 1000 * the number of people <em>first</em> entering the cohort / the number of years people were eligible to enter the cohort for the first time. The eligible person time is defined as the time when
+<ul>
+  <li>A person was observed in the database (based on the observation_period table).</li>
+  <li>Had the required amount of prior observation time as specified in the cohort entry event criteria. For example, if the cohort definition requires 365 days of observation prior to cohort entry, patients are not eligible to enter the cohort in the first 365 days of their observation period, and this time is not counted in the eligible time.</li>
+  <li>If the person enters the cohort, then only the time up to cohort entry. Because we only consider the first cohort entry, persons are no longer eligible to enter the cohort after their first entry.</li>
+</ul>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see graphs from different databases in the same plot.</p>
+<p>Select the cohort to explore in the side bar.</p>
+<p>At the top left of the plot, you can choose whether to stratify the data by age, gender, or calendar year.</p>
+<p>At the top right of the plot, you can choose whether to use the same y-axis for all databases.</p>
+<p>If you move the mouse over the plot, you can see the precise value.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are the observed incidence rates in line with expectations? For example, if we have an estimate of the population incidence based on an external source, is the incidence rate comparable to that estimate?</li>
+<li>Are the age and gender distributions in line with expectations? For example, are contraceptives only prescribed in women?</li>
+<li>Is the incidence rate stable over time? If there are sudden peaks or drops, this may indicate coding issues.</li>
+</ul>
\ No newline at end of file
diff --git a/CohortDiagnosticsBreastCancer/html/includedConcepts.html b/CohortDiagnosticsBreastCancer/html/includedConcepts.html
new file mode 100644
index 00000000..a53139eb
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/includedConcepts.html
@@ -0,0 +1,14 @@
+<h3>Description</h3>
+<p>A table showing the (source) concepts observed in the database that are included in a concept set of a cohort. The Subjects column contains the number of subjects in the entire database that have the specific concept. This count is <em>not</em> restricted to only those people in the cohort. Source concepts are identified in the _source_concept_id fields of the Common Data Model, (e.g. drug_source_concept_id) and are used to identify the specific source codes used in a database. Standard concepts are found using the _concept_id fields (e.g. drug_concept_id), and use the same coding system across all databases.</p>
+
+<h3>Options</h3>
+<p>You can select a database in the side bar to see the concepts and counts observed in that database.</p>
+<p>Select the cohort and the specific concept set within that cohort to explore in the side bar.</p>
+<p>You can switch between Source Concepts and Standard Concepts at the top of the table.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are there source codes included that should not be? For example, in a concept set for hypertensive disorder, are hypotension codes included by accident?</li>
+<li>Are all expected codes present? For example, if we have a list of ICD-10 codes that have been used in literature to identify a cohort, are all those codes present?</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/inclusionRuleStats.html b/CohortDiagnosticsBreastCancer/html/inclusionRuleStats.html
new file mode 100644
index 00000000..ca7f4626
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/inclusionRuleStats.html
@@ -0,0 +1,25 @@
+<h3>Description</h3>
+<p>A table showing the number of subjects that match specific inclusion rules in the cohort definition. Note that this table will be empty if no inclusion rules have been specified.</p>
+
+<p>The table contains the following columns:
+<ul>
+<li>Sequence: The order in which the inclusion rules are applied to the cohort.</li>
+<li>Name: The name of the inclusion rule.</li>
+<li>Meet: The number of cohort entries that meet the entry event definition and the specific inclusion rule indicated in the row.</li>
+<li>Gain: The number of cohort entries that would be gained if this inclusion rule was dropped.</li>
+<li>Total: The number of cohort entries meeting the entry event definition. In other words, the number of cohort entries before applying any of the inclusion rules.</li>
+<li>Remain: The number of cohort entries remaining after applying the specific inclusion rule, and all preceding rules.</li>
+</ul>
+</p>
+
+<h3>Options</h3>
+<p>You can select a database in the side bar to see the inclusion rule statistics observed in that database.</p>
+<p>Select the cohort to explore in the side bar.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are there inclusion rules that nobody meets in a database? For example, requiring a specialist visit that is not recorded in a specific database.</li>
+<li>Are there inclusion rules that have no effect in a database? For example, requiring no occurrence of a prior disease code that is not recorded in a database.</li>
+<li>Are there inclusion rules that drastically reduce the population? In this case we might worry about generalizability. For example, if we require a diagnostic procedure, and only a small fraction meets this criterion, we may wonder if this identifies a special population that differs from the overall population in significant ways.</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/indexEventBreakdown.html b/CohortDiagnosticsBreastCancer/html/indexEventBreakdown.html
new file mode 100644
index 00000000..8c23125b
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/indexEventBreakdown.html
@@ -0,0 +1,13 @@
+<h3>Description</h3>
+<p>A table showing the concepts belonging to the concept sets in the entry event definition that are observed on the index date. In other words, the table lists the concepts that likely triggered the cohort entry. The counts indicate the number of cohort entries where the concept was observed on the index date. Note that multiple concepts can be present on the index date, so the sum of counts might be greater than the cohort entry count.</p>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see counts from different databases side-by-side.</p>
+<p>Select the cohort to explore in the side bar.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Is one concept unexpectedly dominating? For example, if our cohort identifies exposure to drugs in a class, but we notice almost everyone enters the cohort based on a single drug, we may wonder whether our results will generalize to the class.</li>
+<li>Are the highest ranking concepts different across databases? For example, is everyone in one database initiating high-dose prescriptions, and everyone in another database low-dose prescriptions?</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/orphanConcepts.html b/CohortDiagnosticsBreastCancer/html/orphanConcepts.html
new file mode 100644
index 00000000..b6eac27d
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/orphanConcepts.html
@@ -0,0 +1,21 @@
+<h3>Description</h3>
+<p>A table showing the (source) concepts observed in the database that are <em>not</em> included in a concept set of a cohort, but maybe should be. The following logic is used to identify concepts that might be relevant:</p>
+<ol>
+<li>Given a concept set expression, find all included concepts.</li>
+<li>Find all names of those concepts, including synonyms, and the names of source concepts that map to them.</li>
+<li>Search for concepts (standard and source) that contain any of those names as substring.</li>
+<li>Filter those concepts to those that are not in the original set of concepts (i.e. orphans).</li>
+<li>Restrict the set of orphan concepts to those that appear in the CDM database as either source concept or standard concept.</li>
+</ol>
+
+<p>The Subjects column contains the number of subjects in the entire database that have the specific concept. This count is <em>not</em> restricted to only those people in the cohort. Source concepts are identified in the _source_concept_id fields of the Common Data Model, (e.g. drug_source_concept_id) and are used to identify the specific source codes used in a database. Standard concepts are found using the _concept_id fields (e.g. drug_concept_id), and use the same coding system across all databases.</p>
+
+<h3>Options</h3>
+<p>You can select a database in the side bar to see the concepts and counts observed in that database.</p>
+<p>Select the cohort and the specific concept set within that cohort to explore in the side bar.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are there concepts that are not included in the concept set but should be? Note that the provided list likely contains many false positives.</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/temporalCharacterization.html b/CohortDiagnosticsBreastCancer/html/temporalCharacterization.html
new file mode 100644
index 00000000..cfb588df
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/temporalCharacterization.html
@@ -0,0 +1,16 @@
+<h3>Description</h3>
+<p>A table showing temporal cohort characteristics (covariates). These characteristics are captured at specific time intervals before or after cohort start date. There is a Pretty and a Raw version of this table.</p>
+<p>The Pretty table includes a pre-selected subset of covariates manually selected to provide a general overview of the comorbidities and medications of the cohort. These are all binary covariates, and the table shows the proportion (%) of the cohort entries having the covariate.</p>
+<p>The Raw table shows all captured covariates. These include binary and continuous covariates (e.g. the Charlson comorbidity index). For each covariate the table lists the mean, which for binary covariates is equal to the proportion, and the standard deviation (SD).</p>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see temporal cohort characteristics from different databases side-by-side in the same table.</p>
+<p>Select the cohort to explore in the side bar.</p>
+<p>Select either the Pretty or the Raw table at the top of the table.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are the characteristics of the cohort different at different intervals relative to index date? For example, if we are evaluating the characteristics of a cohort of patients with hypertension, we expect the use of anti-hypertensive drugs to be very little or none prior to index date of hypertension, and the rates to go up significantly after the index date. </li>
+<li>Do the characteristics of the cohort differ much per database?</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/timeDistribution.html b/CohortDiagnosticsBreastCancer/html/timeDistribution.html
new file mode 100644
index 00000000..e504480b
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/timeDistribution.html
@@ -0,0 +1,36 @@
+<h3>Description</h3>
+<p>Boxplot and a table showing the distribution of time (in days) before and after the cohort index date (cohort start date), and the time between cohort start and end date. The information is shown for <em>all</em> cohort entries, so not limiting to the first per person.</p>
+
+<p>The boxplot shows:
+<ul>
+<li>Whiskers: The minimum and maximum observed number of days.</li>
+<li>Box: The 25th to 75th percentile.</li>
+<li>Line: The median</li>
+</ul>
+</p>
+
+<p>The table shows the same information and more:
+<ul>
+<li>Average: the mean of the distribution</li>
+<li>SD: Standard Deviation</li>
+<li>Min: The minimum</li>
+<li>P10: The 10th percentile</li>
+<li>P25: The 25th percentile</li>
+<li>Median: The median (50th percentile)</li>
+<li>P75: The 75th percentile</li>
+<li>P90: The 90th percentile</li>
+<li>Max: The maximum</li>
+</ul>
+</p>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see time distributions from different databases in the same plot and table.</p>
+<p>Select the cohort to explore in the side bar.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>For exposure cohorts: is there sufficient time after index (either within the cohort for on-treatment analyses, or until the end of observation for intent-to-treat type analyses) to observe the outcome of interest?</li>
+<li>Are there many cohorts with length = 0 when this is not expected?</li>
+<li>Are the distributions comparable across databases?</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/html/visitContext.html b/CohortDiagnosticsBreastCancer/html/visitContext.html
new file mode 100644
index 00000000..e7cc460f
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/html/visitContext.html
@@ -0,0 +1,18 @@
+<h3>Description</h3>
+<p>A table showing the relationship between the cohort start date and visits recorded in the database. For each database, the table shows:</p>
+<ul>
+<li><strong>Visits Before</strong>: the number of visits recorded before the cohort start date. Note that if a person is in the same cohort twice, visits may be counted twice.</li>
+<li><strong>Visits Ongoing</strong>: the number of visits that were ongoing (excluding the visit start date) when the cohort started. Note that if a person is in the same cohort twice, visits may be counted twice.</li>
+<li><strong>Starting Simultaneous</strong>: the number of visits that started on the same day the cohort started.</li>
+<li><strong>Visits After</strong>: the number of visits recorded after the cohort start date. Note that if a person is in the same cohort twice, visits may be counted twice.</li>
+</ul>
+
+<h3>Options</h3>
+<p>You can select multiple databases in the side bar to see counts from different databases side-by-side.</p>
+<p>Select the cohort to explore in the side bar.</p>
+
+<h3>What to look for</h3>
+<ul>
+<li>Are cohorts starting in the right context? E.g. some cohorts may be expected to start predominantly in an inpatient setting.</li>
+</ul>
+
diff --git a/CohortDiagnosticsBreastCancer/resultsDataModelSpecification.csv b/CohortDiagnosticsBreastCancer/resultsDataModelSpecification.csv
new file mode 100644
index 00000000..c5314658
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/resultsDataModelSpecification.csv
@@ -0,0 +1,161 @@
+tableName,fieldName,type,isRequired,primaryKey,optional,emptyIsNa
+analysis_ref,analysis_id,bigint,Yes,Yes,No,Yes
+analysis_ref,analysis_name,varchar(50),Yes,No,No,Yes
+analysis_ref,domain_id,varchar(20),No,No,No,Yes
+analysis_ref,start_day,float,No,No,No,Yes
+analysis_ref,end_day,float,No,No,No,Yes
+analysis_ref,is_binary,varchar(1),Yes,No,No,Yes
+analysis_ref,missing_means_zero,varchar(1),No,No,No,Yes
+cohort,phenotype_id,bigint,No,No,Yes,Yes
+cohort,cohort_id,bigint,Yes,Yes,No,Yes
+cohort,web_api_cohort_id,bigint,Yes,No,No,Yes
+cohort,cohort_name,varchar(255),Yes,No,No,Yes
+cohort,logic_description,varchar,No,No,Yes,Yes
+cohort,sql,varchar,Yes,No,No,Yes
+cohort,json,varchar,Yes,No,No,Yes
+cohort_count,cohort_id,bigint,Yes,Yes,No,Yes
+cohort_count,cohort_entries,float,Yes,No,No,Yes
+cohort_count,cohort_subjects,float,Yes,No,No,Yes
+cohort_count,database_id,varchar(20),Yes,Yes,No,Yes
+cohort_overlap,either_subjects,float,Yes,No,No,Yes
+cohort_overlap,both_subjects,float,Yes,No,No,Yes
+cohort_overlap,t_only_subjects,float,Yes,No,No,Yes
+cohort_overlap,c_only_subjects,float,Yes,No,No,Yes
+cohort_overlap,t_before_c_subjects,float,Yes,No,No,Yes
+cohort_overlap,c_before_t_subjects,float,Yes,No,No,Yes
+cohort_overlap,same_day_subjects,float,Yes,No,No,Yes
+cohort_overlap,t_in_c_subjects,float,Yes,No,No,Yes
+cohort_overlap,c_in_t_subjects,float,Yes,No,No,Yes
+cohort_overlap,target_cohort_id,bigint,Yes,Yes,No,Yes
+cohort_overlap,comparator_cohort_id,bigint,Yes,Yes,No,Yes
+cohort_overlap,database_id,varchar(20),Yes,Yes,No,Yes
+concept,concept_id,int,Yes,Yes,No,Yes
+concept,concept_name,varchar(255),Yes,No,No,Yes
+concept,domain_id,varchar(20),Yes,Yes,No,Yes
+concept,vocabulary_id,varchar(20),Yes,Yes,No,Yes
+concept,concept_class_id,varchar(20),Yes,No,No,Yes
+concept,standard_concept,varchar(1),No,No,No,Yes
+concept,concept_code,varchar(20),Yes,No,No,Yes
+concept,valid_start_date,Date,Yes,No,No,Yes
+concept,valid_end_date,Date,Yes,No,No,Yes
+concept,invalid_reason,varchar,No,No,No,Yes
+concept_ancestor,ancestor_concept_id,bigint,Yes,Yes,No,Yes
+concept_ancestor,descendant_concept_id,bigint,Yes,Yes,No,Yes
+concept_ancestor,min_levels_of_separation,int,Yes,No,No,Yes
+concept_ancestor,max_levels_of_separation,int,Yes,No,No,Yes
+concept_relationship,concept_id_1,int,Yes,Yes,No,Yes
+concept_relationship,concept_id_2,int,Yes,Yes,No,Yes
+concept_relationship,relationship_id,varchar(20),Yes,Yes,No,Yes
+concept_relationship,valid_start_date,Date,Yes,No,No,Yes
+concept_relationship,valid_end_date,Date,Yes,No,No,Yes
+concept_relationship,invalid_reason,varchar(1),No,No,No,Yes
+concept_sets,cohort_id,bigint,Yes,Yes,No,Yes
+concept_sets,concept_set_id,int,Yes,Yes,No,Yes
+concept_sets,concept_set_sql,varchar,Yes,No,No,Yes
+concept_sets,concept_set_name,varchar(255),Yes,No,No,Yes
+concept_sets,concept_set_expression,varchar,Yes,No,No,Yes
+concept_synonym,concept_id,int,Yes,Yes,No,Yes
+concept_synonym,concept_synonym_name,varchar,Yes,Yes,No,Yes
+concept_synonym,language_concept_id,int,Yes,Yes,No,Yes
+covariate_ref,covariate_id,bigint,Yes,Yes,No,Yes
+covariate_ref,covariate_name,varchar,Yes,No,No,Yes
+covariate_ref,analysis_id,int,Yes,No,No,Yes
+covariate_ref,concept_id,int,Yes,No,No,Yes
+covariate_value,cohort_id,bigint,Yes,Yes,No,Yes
+covariate_value,covariate_id,bigint,Yes,Yes,No,Yes
+covariate_value,mean,float,Yes,No,No,Yes
+covariate_value,sd,float,No,No,No,Yes
+covariate_value,database_id,varchar(20),Yes,Yes,No,Yes
+database,database_id,varchar(20),Yes,Yes,No,Yes
+database,database_name,varchar,No,No,No,Yes
+database,description,varchar,No,No,No,Yes
+database,is_meta_analysis,varchar(1),Yes,No,No,Yes
+domain,domain_id,varchar(20),Yes,Yes,No,Yes
+domain,domain_name,varchar(255),Yes,No,No,Yes
+domain,domain_concept_id,int,Yes,No,No,Yes
+incidence_rate,cohort_count,float,Yes,No,No,Yes
+incidence_rate,person_years,float,Yes,No,No,Yes
+incidence_rate,gender,varchar,No,Yes,No,No
+incidence_rate,age_group,varchar,No,Yes,No,No
+incidence_rate,calendar_year,varchar(4),No,Yes,No,No
+incidence_rate,incidence_rate,float,Yes,No,No,Yes
+incidence_rate,cohort_id,bigint,Yes,Yes,No,Yes
+incidence_rate,database_id,varchar(20),Yes,Yes,No,Yes
+included_source_concept,database_id,varchar(20),Yes,Yes,No,Yes
+included_source_concept,cohort_id,bigint,Yes,Yes,No,Yes
+included_source_concept,concept_set_id,int,Yes,Yes,No,Yes
+included_source_concept,concept_id,int,Yes,Yes,No,Yes
+included_source_concept,source_concept_id,int,Yes,Yes,No,Yes
+included_source_concept,concept_subjects,float,Yes,No,No,Yes
+included_source_concept,concept_count,float,Yes,No,No,Yes
+inclusion_rule_stats,rule_sequence_id,int,Yes,Yes,No,Yes
+inclusion_rule_stats,rule_name,varchar(255),Yes,No,No,Yes
+inclusion_rule_stats,meet_subjects,float,Yes,No,No,Yes
+inclusion_rule_stats,gain_subjects,float,Yes,No,No,Yes
+inclusion_rule_stats,total_subjects,float,Yes,No,No,Yes
+inclusion_rule_stats,remain_subjects,float,Yes,No,No,Yes
+inclusion_rule_stats,cohort_id,bigint,Yes,Yes,No,Yes
+inclusion_rule_stats,database_id,varchar(20),Yes,Yes,No,Yes
+index_event_breakdown,concept_id,int,Yes,Yes,No,Yes
+index_event_breakdown,concept_count,float,Yes,No,No,Yes
+index_event_breakdown,cohort_id,bigint,Yes,Yes,No,Yes
+index_event_breakdown,database_id,varchar(20),Yes,Yes,No,Yes
+orphan_concept,cohort_id,bigint,Yes,Yes,No,Yes
+orphan_concept,concept_set_id,int,Yes,Yes,No,Yes
+orphan_concept,database_id,varchar(20),Yes,Yes,No,Yes
+orphan_concept,concept_id,int,Yes,Yes,No,Yes
+orphan_concept,concept_count,float,Yes,No,No,Yes
+orphan_concept,concept_subjects,float,Yes,No,No,Yes
+phenotype_description,phenotype_id,bigint,Yes,Yes,No,Yes
+phenotype_description,phenotype_name,varchar(255),Yes,No,No,Yes
+phenotype_description,referent_concept_id,int,Yes,No,No,Yes
+phenotype_description,clinical_description,varchar,Yes,No,No,Yes
+phenotype_description,literature_review,varchar,No,No,No,Yes
+phenotype_description,phenotype_notes,varchar,No,No,No,Yes
+relationship,relationship_id,varchar(20),Yes,Yes,No,Yes
+relationship,relationship_name,varchar(255),Yes,No,No,Yes
+relationship,is_hierarchical,varchar(1),Yes,No,No,Yes
+relationship,defines_ancestry,varchar(1),Yes,No,No,Yes
+relationship,reverse_relationship_id,varchar(20),Yes,Yes,No,Yes
+relationship,relationship_concept_id,int,Yes,Yes,No,Yes
+temporal_analysis_ref,analysis_id,int,Yes,Yes,No,Yes
+temporal_analysis_ref,analysis_name,varchar(20),Yes,No,No,Yes
+temporal_analysis_ref,domain_id,varchar(20),Yes,Yes,No,Yes
+temporal_analysis_ref,is_binary,varchar(1),Yes,No,No,Yes
+temporal_analysis_ref,missing_means_zero,varchar(1),No,No,No,Yes
+temporal_covariate_ref,covariate_id,bigint,Yes,Yes,No,Yes
+temporal_covariate_ref,covariate_name,varchar,Yes,No,No,Yes
+temporal_covariate_ref,analysis_id,int,Yes,No,No,Yes
+temporal_covariate_ref,concept_id,int,Yes,No,No,Yes
+temporal_covariate_value,cohort_id,bigint,Yes,Yes,No,Yes
+temporal_covariate_value,time_id,int,Yes,Yes,No,Yes
+temporal_covariate_value,covariate_id,bigint,Yes,Yes,No,Yes
+temporal_covariate_value,mean,float,Yes,No,No,Yes
+temporal_covariate_value,sd,float,No,No,No,Yes
+temporal_covariate_value,database_id,varchar(20),Yes,Yes,No,Yes
+temporal_time_ref,time_id,int,Yes,Yes,No,Yes
+temporal_time_ref,start_day,float,Yes,No,No,Yes
+temporal_time_ref,end_day,float,Yes,No,No,Yes
+time_distribution,cohort_id,bigint,Yes,Yes,No,Yes
+time_distribution,count_value,float,Yes,No,No,Yes
+time_distribution,min_value,float,Yes,No,No,Yes
+time_distribution,max_value,float,Yes,No,No,Yes
+time_distribution,average_value,float,Yes,No,No,Yes
+time_distribution,standard_deviation,float,Yes,No,No,Yes
+time_distribution,median_value,float,Yes,No,No,Yes
+time_distribution,p_10_value,float,Yes,No,No,Yes
+time_distribution,p_25_value,float,Yes,No,No,Yes
+time_distribution,p_75_value,float,Yes,No,No,Yes
+time_distribution,p_90_value,float,Yes,No,No,Yes
+time_distribution,time_metric,varchar(50),Yes,Yes,No,Yes
+time_distribution,database_id,varchar(20),Yes,Yes,No,Yes
+visit_context,cohort_id,bigint,Yes,Yes,No,Yes
+visit_context,visit_concept_id,int,Yes,Yes,No,Yes
+visit_context,visit_context,varchar(20),Yes,Yes,No,Yes
+visit_context,subjects,float,Yes,No,No,Yes
+visit_context,database_id,varchar(20),Yes,Yes,No,Yes
+vocabulary,vocabulary_id,varchar(20),Yes,Yes,No,Yes
+vocabulary,vocabulary_name,varchar(255),Yes,No,No,Yes
+vocabulary,vocabulary_reference,varchar,No,No,No,Yes
+vocabulary,vocabulary_version,varchar,No,No,No,Yes
+vocabulary,vocabulary_concept_id,int,Yes,Yes,No,Yes
diff --git a/CohortDiagnosticsBreastCancer/server.R b/CohortDiagnosticsBreastCancer/server.R
new file mode 100644
index 00000000..b2c0fe89
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/server.R
@@ -0,0 +1,1430 @@
+library(magrittr)
+
+source("R/DisplayFunctions.R")
+source("R/Tables.R")
+source("R/Plots.R")
+source("R/Results.R")
+
+shiny::shinyServer(function(input, output, session) {
+  
+  # Id of the cohort whose name matches the single-cohort picker (`input$cohort`).
+  cohortId <- shiny::reactive({
+    isChosen <- cohort$cohortName == input$cohort
+    cohort$cohortId[isChosen]
+  })
+  
+  # Id of the cohort whose name matches the comparator picker (`input$comparator`).
+  comparatorCohortId <- shiny::reactive({
+    isComparator <- cohort$cohortName == input$comparator
+    cohort$cohortId[isComparator]
+  })
+  
+  # Ids of all cohorts whose names are selected in the multi-cohort picker (`input$cohorts`).
+  cohortIds <- shiny::reactive({
+    isChosen <- cohort$cohortName %in% input$cohorts
+    cohort$cohortId[isChosen]
+  })
+  
+
+  
+  # Time ids of the rows of `temporalCovariateChoices` whose `choices` label is
+  # selected in `input$timeIdChoices`.
+  timeId <- shiny::reactive({
+    chosenWindows <- dplyr::filter(temporalCovariateChoices,
+                                   choices %in% input$timeIdChoices)
+    dplyr::pull(chosenWindows, timeId)
+  })
+  
+  # Ids of the phenotypes whose names are selected in `input$phenotypes`.
+  phenotypeId <- shiny::reactive({
+    isChosen <- phenotypeDescription$phenotypeName %in% input$phenotypes
+    phenotypeDescription$phenotypeId[isChosen]
+  })
+  
+  # Keep the "conceptSet" picker in sync with the selected cohort: its choices are
+  # the sorted, de-duplicated concept set names belonging to that cohort.
+  shiny::observe({
+    belongsToCohort <- conceptSets$cohortId == cohortId()
+    conceptSetNames <- sort(unique(conceptSets$conceptSetName[belongsToCohort]))
+    shinyWidgets::updatePickerInput(session = session,
+                                    inputId = "conceptSet",
+                                    choicesOpt = list(style = rep_len("color: black;", 999)),
+                                    choices = conceptSetNames)
+  })
+  
+  # Keep the "cohort" picker in sync with the selected phenotype(s): its choices are
+  # the sorted, de-duplicated names of the cohorts belonging to them.
+  shiny::observe({
+    # phenotypeId() may hold zero or several ids, so match with %in% rather than
+    # ==, which would recycle the ids against the cohort rows.
+    belongsToPhenotype <- cohort$phenotypeId %in% phenotypeId()
+    cohortNames <- sort(unique(cohort$cohortName[belongsToPhenotype]))
+    shinyWidgets::updatePickerInput(session = session,
+                                    inputId = "cohort",
+                                    choicesOpt = list(style = rep_len("color: black;", 999)),
+                                    choices = cohortNames)
+  })
+  
+  # Keep the multi-select "cohorts" picker in sync with the selected phenotype(s)
+  # and pre-select (at most) the first two cohorts.
+  shiny::observe({
+    # phenotypeId() may hold zero or several ids, so match with %in% rather than
+    # ==, which would recycle the ids against the cohort rows.
+    belongsToPhenotype <- cohort$phenotypeId %in% phenotypeId()
+    cohortNames <- sort(unique(cohort$cohortName[belongsToPhenotype]))
+    shinyWidgets::updatePickerInput(session = session,
+                                    inputId = "cohorts",
+                                    choicesOpt = list(style = rep_len("color: black;", 999)),
+                                    choices = cohortNames,
+                                    # head() never pads with NA when fewer than two cohorts exist
+                                    selected = utils::head(cohortNames, 2))
+  })
+  
+  # Phenotype overview table: every row of `phenotypeDescription`, with the
+  # literature review and the phenotype id rendered as links and the section
+  # headings inside the clinical description wrapped in <strong> tags.
+  output$phenoTypeDescriptionTable <- DT::renderDataTable(expr = {
+    # Replace every occurrence of one section heading with its HTML markup.
+    markHeading <- function(text, heading, html) {
+      stringr::str_replace_all(string = text, pattern = heading, replacement = html)
+    }
+    
+    data <- phenotypeDescription %>% 
+      dplyr::mutate(dplyr::across(.cols = dplyr::everything(), tidyr::replace_na, "")) %>% 
+      dplyr::mutate(
+        literatureReview = dplyr::case_when(
+          !.data$literatureReview %in% c("","0") ~ 
+            paste0("<a href='", .data$literatureReview, "' target='_blank'>", "Link", "</a>"),
+          TRUE ~ "Ongoing"),
+        phenotypeId = paste0("<a href='", 
+                             paste0(conceptBaseUrl, .data$referentConceptId), 
+                             "' target='_blank'>", 
+                             .data$phenotypeId, 
+                             "</a>"),
+        clinicalDescription = .data$clinicalDescription %>% 
+          markHeading("Overview:", "<strong>Overview:</strong>") %>% 
+          markHeading("Assessment:", "<br/> <strong>Assessment:</strong>") %>% 
+          markHeading("Presentation:", "<br/> <strong>Presentation: </strong>") %>% 
+          markHeading("Plan:", "<br/> <strong>Plan: </strong>")) %>% 
+      dplyr::select(-.data$referentConceptId)
+    
+    tableOptions <- list(pageLength = 10,
+                         searching = TRUE,
+                         ordering = TRUE,
+                         paging = TRUE,
+                         info = TRUE,
+                         searchHighlight = TRUE)
+    
+    # escape = FALSE so the generated links and <strong> tags render as HTML
+    DT::datatable(data,
+                  options = tableOptions,
+                  rownames = FALSE,
+                  colnames = camelCaseToTitleCase(colnames(data)),
+                  escape = FALSE,
+                  filter = c("bottom"),
+                  class = "stripe compact")
+  }, server = TRUE)
+  
+  # Cohort description table: the cohorts of the selected phenotype(s), with the
+  # cohort name rendered as a link built from `cohortBaseUrl` and the WebAPI cohort id.
+  output$cohortDescriptionTable <- DT::renderDataTable(expr = {
+    data <- cohort %>%
+      # %in% keeps the filter valid when zero or several phenotypes are selected;
+      # == would error on an empty selection and recycle on a multiple one.
+      dplyr::filter(.data$phenotypeId %in% phenotypeId()) %>% 
+      dplyr::left_join(y = phenotypeDescription) %>% 
+      dplyr::mutate(cohortName = paste0("<a href='", 
+                                        paste0(cohortBaseUrl, 
+                                               .data$webApiCohortId),
+                                        "' target='_blank'>", 
+                                        paste0(.data$cohortName), "</a>")) %>% 
+      dplyr::select(.data$phenotypeId, .data$cohortId, 
+                    .data$cohortName, .data$logicDescription) %>% 
+      dplyr::arrange(.data$phenotypeId, .data$cohortId, 
+                     .data$cohortName)
+    
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    info = TRUE,
+                    searchHighlight = TRUE)
+    
+    # escape = FALSE so the cohort links render as HTML
+    dataTable <- DT::datatable(data,
+                               options = options,
+                               rownames = FALSE,
+                               colnames = colnames(data) %>% camelCaseToTitleCase(),
+                               escape = FALSE,
+                               filter = c("bottom"),
+                               class = "stripe compact")
+    return(dataTable)
+  }, server = TRUE)
+  
+  # Cohort counts table: one row per cohort of the selected phenotype(s) and, for
+  # every selected database, an "Entries" and a "Subjects" column with colour bars.
+  output$cohortCountsTable <- DT::renderDataTable(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    
+    data <- getCohortCountResult(dataSource = dataSource,
+                                 databaseIds = input$databases) %>%
+      dplyr::left_join(cohort, by = "cohortId") %>% 
+      # %in% keeps the filter valid when zero or several phenotypes are selected
+      dplyr::filter(.data$phenotypeId %in% phenotypeId()) %>% 
+      dplyr::select(.data$cohortId, 
+                    .data$cohortName, 
+                    .data$databaseId, 
+                    .data$webApiCohortId,
+                    .data$cohortSubjects, 
+                    .data$cohortEntries)
+    
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = "There is no data on any cohort"))
+    }
+    
+    # One sorted vector drives both the header and the column order below, so
+    # the two can never disagree.
+    databaseIds <- sort(unique(data$databaseId))
+    
+    if (!setequal(databaseIds, input$databases)) {
+      return(dplyr::tibble(Note = paste0("There is no data for the databases:\n",
+                                         paste0(setdiff(input$databases, databaseIds), 
+                                                collapse = ",\n "), 
+                                         ".\n Please unselect them.")))
+    }
+    
+    # Wide layout: a "<databaseId>_subjects" and a "<databaseId>_entries" column
+    # per database.
+    subjectCounts <- data %>% 
+      dplyr::select(.data$cohortId, .data$databaseId, 
+                    .data$cohortSubjects, .data$cohortName) %>% 
+      dplyr::mutate(columnName = paste0(.data$databaseId, "_subjects")) %>% 
+      tidyr::pivot_wider(id_cols = c(.data$cohortId, .data$cohortName),
+                         names_from = columnName,
+                         values_from = .data$cohortSubjects)
+    entryCounts <- data %>% 
+      dplyr::select(.data$cohortId, .data$databaseId, 
+                    .data$cohortEntries, .data$cohortName) %>% 
+      dplyr::mutate(columnName = paste0(.data$databaseId, "_entries")) %>% 
+      tidyr::pivot_wider(id_cols = c(.data$cohortId, .data$cohortName),
+                         names_from = columnName,
+                         values_from = .data$cohortEntries)
+    countsTable <- dplyr::full_join(subjectCounts, 
+                                    entryCounts, 
+                                    by = c("cohortId", "cohortName"))
+    
+    countsTable <- data %>% 
+      dplyr::select(.data$cohortId, .data$cohortName, .data$webApiCohortId) %>% 
+      dplyr::distinct() %>% 
+      dplyr::inner_join(countsTable, by = c("cohortId", "cohortName")) %>%
+      dplyr::arrange(.data$cohortName)
+    
+    if (!is.null(cohortBaseUrl)) {
+      countsTable <- countsTable %>%
+        dplyr::mutate(url = paste0(cohortBaseUrl, .data$webApiCohortId),
+                      cohortName = paste0("<a href='", 
+                                          .data$url, 
+                                          "' target='_blank'>", 
+                                          .data$cohortName, 
+                                          "</a>")) %>%
+        dplyr::select(-.data$url)
+    }
+    
+    # Keep the cohort name plus, per database in header order, entries then
+    # subjects; this also drops cohortId and webApiCohortId.
+    countColumns <- paste0(rep(databaseIds, each = 2), c("_entries", "_subjects"))
+    countsTable <- countsTable %>%
+      dplyr::select(dplyr::all_of(c("cohortName", countColumns)))
+    
+    sketch <- htmltools::withTags(table(
+      class = "display",
+      thead(
+        tr(
+          th(rowspan = 2, "Cohort"),
+          lapply(databaseIds, th, colspan = 2, class = "dt-center")
+        ),
+        tr(
+          lapply(rep(c("Entries", "Subjects"), length(databaseIds)), th)
+        )
+      )
+    ))
+    
+    # columnDefs targets are 0-based: column 0 is the cohort name, 1..2n the counts
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    info = TRUE,
+                    searchHighlight = TRUE,
+                    scrollX = TRUE,
+                    columnDefs = list(minCellCountDef(1:(2*length(databaseIds)))))
+    
+    dataTable <- DT::datatable(countsTable,
+                               options = options,
+                               rownames = FALSE,
+                               container = sketch, 
+                               escape = FALSE,
+                               filter = c("bottom"),
+                               class = "stripe nowrap compact")
+    
+    # formatStyle columns are 1-based: for database i, column 2i holds entries
+    # and column 2i + 1 holds subjects. Each bar is scaled to its own column maximum.
+    for (i in seq_along(databaseIds)) {
+      entriesColumn <- i * 2
+      subjectsColumn <- i * 2 + 1
+      dataTable <- DT::formatStyle(table = dataTable,
+                                   columns = entriesColumn,
+                                   background = DT::styleColorBar(c(0, max(countsTable[[entriesColumn]], na.rm = TRUE)), "lightblue"),
+                                   backgroundSize = "98% 88%",
+                                   backgroundRepeat = "no-repeat",
+                                   backgroundPosition = "center")
+      dataTable <- DT::formatStyle(table = dataTable,
+                                   columns = subjectsColumn,
+                                   background = DT::styleColorBar(c(0, max(countsTable[[subjectsColumn]], na.rm = TRUE)), "#ffd699"),
+                                   backgroundSize = "98% 88%",
+                                   backgroundRepeat = "no-repeat",
+                                   backgroundPosition = "center")
+    }
+    return(dataTable)
+  }, server = TRUE)
+  
+  # Incidence rate results for the selected cohorts and databases, stratified as
+  # requested in `input$irStratification`; negative rates are replaced by zero.
+  incidenceRate <- reactive({
+    strata <- input$irStratification
+    rates <- getIncidenceRateResult(dataSource = dataSource,
+                                    cohortIds = cohortIds(), 
+                                    databaseIds = input$databases, 
+                                    stratifyByGender = "Gender" %in% strata,
+                                    stratifyByAgeGroup = "Age" %in% strata,
+                                    stratifyByCalendarYear = "Calendar Year" %in% strata,
+                                    minPersonYears = 1000)
+    dplyr::mutate(rates,
+                  incidenceRate = dplyr::case_when(.data$incidenceRate < 0 ~ 0, 
+                                                   TRUE ~ .data$incidenceRate))
+  })
+  
+  # Incidence rate plot built from the `incidenceRate()` reactive, using the same
+  # stratification switches and the y-axis setting from `input$irYscaleFixed`.
+  output$incidenceRatePlot <- ggiraph::renderggiraph(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    
+    strata <- input$irStratification
+    rates <- incidenceRate()
+    
+    validate(need(!is.null(rates), paste0("No data for this combination")),
+             need(nrow(rates) > 0, paste0("No data for this combination")))
+    
+    plotIncidenceRate(data = rates,
+                      cohortIds = NULL,
+                      databaseIds = NULL,
+                      stratifyByAgeGroup = "Age" %in% strata,
+                      stratifyByGender = "Gender" %in% strata,
+                      stratifyByCalendarYear = "Calendar Year" %in% strata,
+                      yscaleFixed = input$irYscaleFixed)
+  })
+  
+  # Time distribution results for the selected cohorts and databases.
+  timeDist <- reactive({
+    getTimeDistributionResult(dataSource = dataSource,
+                              cohortIds = cohortIds(), 
+                              databaseIds = input$databases)
+  })
+  
+  # Time distribution plot for the selected cohorts and databases, drawn from
+  # the `timeDist()` reactive.
+  output$timeDisPlot <- ggiraph::renderggiraph(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    
+    distribution <- timeDist()
+    validate(need(!is.null(distribution), paste0('No data for this combination')),
+             need(nrow(distribution) > 0, paste0('No data for this combination')))
+    
+    plotTimeDistribution(data = distribution,
+                         cohortIds = cohortIds(),
+                         databaseIds = input$databases)
+  })
+  
+  # Time distribution table for the single selected cohort (`cohortId()`) across
+  # the selected databases.
+  output$timeDistTable <- DT::renderDataTable(expr = {
+    # Same guard as the other outputs: do not query when no database is selected.
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    
+    table <- getTimeDistributionResult(dataSource = dataSource,
+                                       cohortIds = cohortId(), 
+                                       databaseIds = input$databases)
+    
+    if (is.null(table)) {
+      return(dplyr::tibble(Note = paste0("No data available for selected databases and cohorts")))
+    }
+    
+    options <- list(pageLength = 9,
+                    searching = TRUE,
+                    searchHighlight = TRUE,
+                    scrollX = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    info = TRUE,
+                    columnDefs = list(minCellCountDef(3)))
+    table <- DT::datatable(table,
+                           options = options,
+                           rownames = FALSE,
+                           colnames = colnames(table) %>% 
+                             camelCaseToTitleCase(),
+                           filter = c("bottom"),
+                           class = "stripe nowrap compact")
+    # NOTE(review): these names must match the columns returned by
+    # getTimeDistributionResult(), which is defined outside this file section.
+    table <- DT::formatRound(table, c("Average", "SD"), digits = 2)
+    table <- DT::formatRound(table, c("Min", "P10", "P25", "Median", "P75", "P90", "Max"), digits = 0)
+    return(table)
+  }, server = TRUE)
+  
+  
+  # Included concepts table for the selected cohort and concept set: one row per
+  # (source) concept and, for every selected database, a subjects and a count
+  # column. `input$includedType` switches between source and standard concepts.
+  output$includedConceptsTable <- DT::renderDataTable(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    
+    data <- getIncludedConceptResult(dataSource = dataSource,
+                                     cohortId = cohortId(),
+                                     databaseIds = input$databases)
+    data <- data %>%
+      dplyr::filter(.data$conceptSetName == input$conceptSet)
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = "No data available for selected databases and cohorts"))
+    }
+    
+    # One sorted vector drives both the header and the column order below, so
+    # the two can never disagree.
+    databaseIds <- sort(unique(data$databaseId))
+    
+    if (!all(input$databases %in% databaseIds)) {
+      return(dplyr::tibble(Note = paste0("There is no data for the databases:\n",
+                                         paste0(setdiff(input$databases, databaseIds), 
+                                                collapse = ",\n "), 
+                                         ".\n Please unselect them.")))
+    }
+    
+    maxCount <- max(data$conceptCount, na.rm = TRUE)
+    
+    # Names of the pivoted count columns, in header order: per database
+    # "<databaseId>_Subjects" followed by "<databaseId>_Count".
+    countColumns <- paste0(rep(databaseIds, each = 2), c("_Subjects", "_Count"))
+    
+    if (input$includedType == "Source Concepts") {
+      table <- data %>%
+        dplyr::select(.data$databaseId, 
+                      .data$sourceConceptId,
+                      .data$conceptSubjects,
+                      .data$conceptCount) %>%
+        dplyr::arrange(.data$databaseId) %>% 
+        tidyr::pivot_longer(cols = c(.data$conceptSubjects, .data$conceptCount)) %>% 
+        dplyr::mutate(name = paste0(databaseId, "_",
+                                    stringr::str_replace(string = .data$name, 
+                                                         pattern = 'concept', 
+                                                         replacement = ''))) %>% 
+        tidyr::pivot_wider(id_cols = c(.data$sourceConceptId),
+                           names_from = .data$name,
+                           values_from = .data$value) %>%
+        dplyr::inner_join(data %>%
+                            dplyr::select(.data$sourceConceptId,
+                                          .data$sourceConceptName,
+                                          .data$sourceVocabularyId,
+                                          .data$sourceConceptCode) %>%
+                            dplyr::distinct(),
+                          by = "sourceConceptId") %>%
+        # descriptive columns first, then the count columns in header order
+        dplyr::select(dplyr::all_of(c("sourceConceptId", 
+                                      "sourceConceptName", 
+                                      "sourceVocabularyId",
+                                      "sourceConceptCode",
+                                      countColumns)))
+      
+      if (nrow(table) == 0) {
+        return(dplyr::tibble(Note = paste0("No data available for selected databases and cohorts")))
+      }
+      # Sort by the first count column, descending; [[ ]] hands order() a plain
+      # vector rather than a one-column data frame.
+      table <- table[order(-table[[5]]), ]
+      
+      sketch <- htmltools::withTags(table(
+        class = "display",
+        thead(
+          tr(
+            th(rowspan = 2, 'Concept ID'),
+            th(rowspan = 2, 'Concept Name'),
+            th(rowspan = 2, 'Vocabulary ID'),
+            th(rowspan = 2, 'Concept Code'),
+            lapply(databaseIds, th, colspan = 2, class = "dt-center")
+          ),
+          tr(
+            lapply(rep(c("Subjects", "Count"), length(databaseIds)), th)
+          )
+        )
+      ))
+      
+      # columnDefs targets are 0-based: 0-3 are descriptive, counts start at 4
+      options <- list(pageLength = 10,
+                      searching = TRUE,
+                      scrollX = TRUE,
+                      lengthChange = TRUE,
+                      searchHighlight = TRUE,
+                      ordering = TRUE,
+                      paging = TRUE,
+                      columnDefs = list(truncateStringDef(1, 100),
+                                        minCellCountDef(3 + (1:(length(databaseIds) * 2)))))
+      
+      dataTable <- DT::datatable(table,
+                                 colnames = colnames(table),
+                                 options = options,
+                                 rownames = FALSE, 
+                                 container = sketch,
+                                 escape = FALSE,
+                                 filter = c("bottom"),
+                                 class = "stripe nowrap compact")
+      
+      # formatStyle columns are 1-based: counts start at column 5
+      dataTable <- DT::formatStyle(table = dataTable,
+                                   columns =  4 + (1:(length(databaseIds) * 2)),
+                                   background = DT::styleColorBar(c(0, maxCount), "lightblue"),
+                                   backgroundSize = "98% 88%",
+                                   backgroundRepeat = "no-repeat",
+                                   backgroundPosition = "center")
+    } else {
+      table <- data %>%
+        dplyr::select(.data$databaseId, 
+                      .data$conceptId,
+                      .data$conceptSubjects,
+                      .data$conceptCount) %>%
+        dplyr::group_by(.data$databaseId, 
+                        .data$conceptId) %>%
+        dplyr::summarise(conceptSubjects = sum(.data$conceptSubjects),
+                         conceptCount = sum(.data$conceptCount)) %>%
+        dplyr::ungroup() %>%
+        dplyr::arrange(.data$databaseId) %>% 
+        tidyr::pivot_longer(cols = c(.data$conceptSubjects, .data$conceptCount)) %>% 
+        dplyr::mutate(name = paste0(databaseId, "_",
+                                    stringr::str_replace(string = .data$name, 
+                                                         pattern = "concept", 
+                                                         replacement = ""))) %>% 
+        tidyr::pivot_wider(id_cols = c(.data$conceptId),
+                           names_from = .data$name,
+                           values_from = .data$value) %>%
+        dplyr::inner_join(data %>%
+                            dplyr::select(.data$conceptId,
+                                          .data$conceptName,
+                                          .data$vocabularyId) %>%
+                            dplyr::distinct(),
+                          by = "conceptId") %>%
+        # descriptive columns first, then the count columns in header order
+        dplyr::select(dplyr::all_of(c("conceptId", 
+                                      "conceptName", 
+                                      "vocabularyId",
+                                      countColumns)))
+      
+      if (nrow(table) == 0) {
+        return(dplyr::tibble(Note = paste0('No data available for selected databases and cohorts')))
+      }
+      
+      # Sort by the first count column, descending (see the source branch).
+      table <- table[order(-table[[4]]), ]
+      
+      sketch <- htmltools::withTags(table(
+        class = "display",
+        thead(
+          tr(
+            th(rowspan = 2, "Concept ID"),
+            th(rowspan = 2, "Concept Name"),
+            th(rowspan = 2, "Vocabulary ID"),
+            lapply(databaseIds, th, colspan = 2, class = "dt-center")
+          ),
+          tr(
+            lapply(rep(c("Subjects", "Counts"), length(databaseIds)), th)
+          )
+        )
+      ))
+      
+      # columnDefs targets are 0-based: 0-2 are descriptive, counts start at 3
+      options <- list(pageLength = 10,
+                      searching = TRUE,
+                      scrollX = TRUE,
+                      lengthChange = TRUE,
+                      ordering = TRUE,
+                      paging = TRUE,
+                      columnDefs = list(truncateStringDef(1, 100),
+                                        minCellCountDef(2 + (1:(length(databaseIds) * 2)))))
+      
+      dataTable <- DT::datatable(table,
+                                 options = options,
+                                 colnames = colnames(table),
+                                 rownames = FALSE,
+                                 container = sketch,
+                                 escape = FALSE,
+                                 filter = c("bottom"),
+                                 class = "stripe nowrap compact")
+      
+      # formatStyle columns are 1-based: counts start at column 4
+      dataTable <- DT::formatStyle(table = dataTable,
+                                   columns =  3 + (1:(length(databaseIds)*2)),
+                                   background = DT::styleColorBar(c(0, maxCount), "lightblue"),
+                                   backgroundSize = "98% 88%",
+                                   backgroundRepeat = "no-repeat",
+                                   backgroundPosition = "center")
+    }
+    return(dataTable)
+  }, server = TRUE)
+  
+  # Orphan concepts table for the selected cohort and concept set: one row per
+  # concept and, for every selected database, a subjects and a count column.
+  output$orphanConceptsTable <- DT::renderDataTable(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    
+    data <- getOrphanConceptResult(dataSource = dataSource,
+                                   cohortId = cohortId(),
+                                   databaseIds = input$databases)
+    data <- data %>%
+      dplyr::filter(.data$conceptSetName == input$conceptSet)
+    
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = paste0("There is no data for the selected combination.")))
+    }
+    
+    # One sorted vector drives both the header and the column order below, so
+    # the two can never disagree.
+    databaseIds <- sort(unique(data$databaseId))
+    
+    if (!all(input$databases %in% databaseIds)) {
+      return(dplyr::tibble(Note = paste0("There is no data for the databases:\n",
+                                         paste0(setdiff(input$databases, databaseIds), 
+                                                collapse = ",\n "), 
+                                         ".\n Please unselect them.")))
+    }
+    
+    maxCount <- max(data$conceptCount, na.rm = TRUE)
+    
+    # Names of the pivoted count columns, in header order: per database
+    # "<databaseId>_Subjects" followed by "<databaseId>_Count".
+    countColumns <- paste0(rep(databaseIds, each = 2), c("_Subjects", "_Count"))
+    
+    table <- data %>%
+      dplyr::select(.data$databaseId, 
+                    .data$conceptId,
+                    .data$conceptSubjects,
+                    .data$conceptCount) %>%
+      dplyr::group_by(.data$databaseId, 
+                      .data$conceptId) %>%
+      dplyr::summarise(conceptSubjects = sum(.data$conceptSubjects),
+                       conceptCount = sum(.data$conceptCount)) %>%
+      dplyr::ungroup() %>%
+      dplyr::arrange(.data$databaseId) %>% 
+      tidyr::pivot_longer(cols = c(.data$conceptSubjects, .data$conceptCount)) %>% 
+      dplyr::mutate(name = paste0(databaseId, "_",
+                                  stringr::str_replace(string = .data$name, 
+                                                       pattern = "concept", 
+                                                       replacement = ""))) %>% 
+      tidyr::pivot_wider(id_cols = c(.data$conceptId),
+                         names_from = .data$name,
+                         values_from = .data$value) %>%
+      dplyr::inner_join(data %>%
+                          dplyr::select(.data$conceptId,
+                                        .data$conceptName,
+                                        .data$vocabularyId,
+                                        .data$conceptCode) %>%
+                          dplyr::distinct(),
+                        by = "conceptId") %>%
+      # descriptive columns first, then the count columns in header order
+      dplyr::select(dplyr::all_of(c("conceptId", 
+                                    "conceptName", 
+                                    "vocabularyId", 
+                                    "conceptCode",
+                                    countColumns)))
+    
+    if (nrow(table) == 0) {
+      return(dplyr::tibble(Note = paste0('No data available for selected databases and cohorts')))
+    }
+    
+    # Sort by the first count column, descending; [[ ]] hands order() a plain
+    # vector rather than a one-column data frame.
+    table <- table[order(-table[[5]]), ]
+    
+    sketch <- htmltools::withTags(table(
+      class = "display",
+      thead(
+        tr(
+          th(rowspan = 2, "Concept ID"),
+          th(rowspan = 2, "Concept Name"),
+          th(rowspan = 2, "Vocabulary ID"),
+          th(rowspan = 2, "Concept Code"),
+          lapply(databaseIds, th, colspan = 2, class = "dt-center")
+        ),
+        tr(
+          lapply(rep(c("Subjects", "Counts"), length(databaseIds)), th)
+        )
+      )
+    ))
+    
+    # columnDefs targets are 0-based: 0-3 are descriptive, counts start at 4
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    scrollX = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    columnDefs = list(truncateStringDef(1, 100),
+                                      minCellCountDef(3 + (1:(length(databaseIds) * 2)))))
+    
+    table <- DT::datatable(table,
+                           options = options,
+                           colnames = colnames(table),
+                           rownames = FALSE,
+                           container = sketch,
+                           escape = FALSE,
+                           filter = c("bottom"),
+                           class = "stripe nowrap compact")
+    
+    # formatStyle columns are 1-based: counts start at column 5
+    table <- DT::formatStyle(table = table,
+                             columns =  4 + (1:(length(databaseIds)*2)),
+                             background = DT::styleColorBar(c(0, maxCount), "lightblue"),
+                             backgroundSize = "98% 88%",
+                             backgroundRepeat = "no-repeat",
+                             backgroundPosition = "center")
+    return(table)
+  }, server = TRUE)
+  
+  # Inclusion rule table for the selected cohort: one row per rule and, for every
+  # selected database, the Meet / Gain / Remain / Total subject counts.
+  output$inclusionRuleTable <- DT::renderDataTable(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    table <- getInclusionRuleStats(dataSource = dataSource,
+                                   cohortIds = cohortId(),
+                                   databaseIds = input$databases) 
+    if (nrow(table) == 0) {
+      return(dplyr::tibble(Note = paste0("No data available for selected databases and cohorts")))
+    }
+    
+    databaseIds <- sort(unique(table$databaseId))
+    
+    if (!all(input$databases %in% databaseIds)) {
+      return(dplyr::tibble(Note = paste0("There is no data for the databases:\n",
+                                         paste0(setdiff(input$databases, databaseIds), 
+                                                collapse = ",\n "), 
+                                         ".\n Please unselect them.")))
+    }
+    
+    # Measures in the order of the second header row (Meet, Gain, Remain, Total),
+    # and the matching "<databaseId>_<measure>" column names per database.
+    measures <- c("meetSubjects", "gainSubjects", "remainSubjects", "totalSubjects")
+    countColumns <- paste0(rep(databaseIds, each = length(measures)), "_", measures)
+    
+    table <- table %>% 
+      tidyr::pivot_longer(cols = dplyr::all_of(measures)) %>% 
+      dplyr::group_by(.data$ruleSequenceId, .data$databaseId, .data$name, .data$ruleName) %>% 
+      # Drop the grouping: `name` is rewritten next, and mutate() refuses to
+      # modify a column that is still a grouping variable.
+      dplyr::summarise(value = sum(.data$value), .groups = "drop") %>% 
+      dplyr::mutate(name = paste0(.data$databaseId, "_", .data$name)) %>% 
+      tidyr::pivot_wider(id_cols = c(.data$ruleSequenceId, .data$ruleName),
+                         names_from = .data$name,
+                         values_from = .data$value) %>% 
+      # The grouped summary comes back in alphabetical measure order, so put
+      # the columns explicitly in the order the header announces.
+      dplyr::select(dplyr::all_of(c("ruleSequenceId", "ruleName", countColumns)))
+    
+    sketch <- htmltools::withTags(table(
+      class = "display",
+      thead(
+        tr(
+          th(rowspan = 2, "Rule Sequence ID"),
+          th(rowspan = 2, "Rule Name"),
+          lapply(databaseIds, th, colspan = 4, class = "dt-center")
+        ),
+        tr(
+          lapply(rep(c("Meet", "Gain", "Remain", "Total"), length(databaseIds)), th)
+        )
+      )
+    ))
+    
+    # columnDefs targets are 0-based: 0-1 are descriptive, counts start at 2
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    searchHighlight = TRUE,
+                    scrollX = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    columnDefs = list(minCellCountDef(1 + (1:(length(databaseIds) * 4)))))
+    
+    table <- DT::datatable(table,
+                           options = options,
+                           colnames = colnames(table) %>% camelCaseToTitleCase(),
+                           rownames = FALSE,
+                           container = sketch,
+                           escape = FALSE,
+                           filter = c("bottom"),
+                           class = "stripe nowrap compact")
+    
+    # table <- DT::formatStyle(table = table,
+    #                          columns = 2 + (1:(length(databaseIds) * 4)),
+    #                          background = DT::styleColorBar(lims, "lightblue"),
+    #                          backgroundSize = "98% 88%",
+    #                          backgroundRepeat = "no-repeat",
+    #                          backgroundPosition = "center")
+    return(table)
+  }, server = TRUE)
+  
+  # Index event breakdown table for the selected cohort: one row per concept and
+  # one concept-count column per database, sorted by the first database's count.
+  output$breakdownTable <- DT::renderDataTable(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    data <- getIndexEventBreakdown(dataSource = dataSource,
+                                   cohortIds = cohortId(),
+                                   databaseIds = input$databases)
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = paste0("No data available for selected databases and cohorts")))
+    }
+    maxCount <- max(data$conceptCount, na.rm = TRUE)
+    databaseIds <- unique(data$databaseId) %>% sort()
+    data <- data %>%
+      dplyr::select(.data$conceptId, .data$conceptName, .data$databaseId, .data$conceptCount)
+    
+    # Start from the first database; its count column is renamed to the database id.
+    table <- data[data$databaseId == databaseIds[1], ]
+    table$databaseId <- NULL
+    colnames(table)[3] <- databaseIds[1]
+    
+    # Outer-merge each further database on the shared concept id and name columns.
+    for (otherDatabaseId in databaseIds[-1]) {
+      temp <- data[data$databaseId == otherDatabaseId, ]
+      temp$databaseId <- NULL
+      colnames(temp)[3] <- otherDatabaseId
+      table <- merge(table, temp, all = TRUE)
+    }
+    
+    # Sort by the first database's count, descending. [[ ]] hands order() a plain
+    # vector even when `table` is still a tibble (single-database case).
+    table <- table[order(-table[[3]]), ]
+    colnames(table)[1:2] <- c("Concept ID", "Name")
+    
+    # columnDefs targets are 0-based: 0-1 are descriptive, counts are 2..(ncol - 1)
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    searchHighlight = TRUE,
+                    scrollX = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    columnDefs = list(minCellCountDef(2:(ncol(table) - 1))))
+    dataTable <- DT::datatable(table,
+                               options = options,
+                               rownames = FALSE,
+                               escape = FALSE,
+                               filter = c("bottom"),
+                               class = "stripe nowrap compact")
+    # formatStyle columns are 1-based: counts are columns 3..ncol
+    dataTable <- DT::formatStyle(table = dataTable,
+                                 columns = 3:ncol(table),
+                                 background = DT::styleColorBar(c(0, maxCount), "lightblue"),
+                                 backgroundSize = "98% 88%",
+                                 backgroundRepeat = "no-repeat",
+                                 backgroundPosition = "center")
+    return(dataTable)
+  }, server = TRUE)
+  
+  # Visit context table: for each visit concept, the subject counts for the
+  # four visit contexts ("Before", "During visit", "On visit start", "After"),
+  # shown as one group of four columns per database.
+  #
+  # Reads input$databases and cohortId(). Yields a DT widget, or a one-cell
+  # "Note" tibble when there is no data or a selected database has none.
+  output$visitContextTable <- DT::renderDataTable(expr = {
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    data <- getVisitContextResults(dataSource = dataSource,
+                                   cohortIds = cohortId(),
+                                   databaseIds = input$databases)
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = paste0("No data available for selected databases and cohort")))
+    }
+
+    databaseIds <- sort(unique(data$databaseId))
+
+    # The header below is laid out per database, so every selected database
+    # must actually be present in the result.
+    if (!all(input$databases %in% databaseIds)) {
+      return(dplyr::tibble(Note = paste0("There is no data for the databases:\n",
+                                         paste0(setdiff(input$databases, databaseIds),
+                                                collapse = ",\n "),
+                                         ".\n Please unselect them.")))
+    }
+
+    # Upper bound for the colour bars; ignore missing counts.
+    maxSubjects <- max(data$subjects, na.rm = TRUE)
+    # Full grid of context x visit x database so that every database gets all
+    # four context columns, in this fixed order, even where no rows exist.
+    visitContextReference <- expand.grid(visitContext = c("Before", "During visit", "On visit start", "After"),
+                                         visitConceptName = unique(data$visitConceptName),
+                                         databaseId = databaseIds)
+
+    table <- visitContextReference %>%
+      dplyr::left_join(data, by = c("visitConceptName", "visitContext", "databaseId")) %>%
+      dplyr::select(.data$visitConceptName, .data$visitContext, .data$subjects, .data$databaseId) %>%
+      dplyr::mutate(visitContext = paste0(.data$databaseId, "_", .data$visitContext)) %>%
+      dplyr::select(-.data$databaseId) %>%
+      tidyr::pivot_wider(id_cols = c(.data$visitConceptName),
+                         names_from = .data$visitContext,
+                         values_from = .data$subjects)
+
+    # Two-row header: database ids on top, the four contexts underneath.
+    sketch <- htmltools::withTags(table(
+      class = "display",
+      thead(
+        tr(
+          th(rowspan = 2, "Visit"),
+          lapply(databaseIds, th, colspan = 4, class = "dt-center")
+        ),
+        tr(
+          lapply(rep(c("Visits Before", "Visits Ongoing", "Starting Simultaneous", "Visits After"), length(databaseIds)), th)
+        )
+      )
+    ))
+
+    # columnDefs targets are 0-based: column 0 is the visit name.
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    searchHighlight = TRUE,
+                    scrollX = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    columnDefs = list(truncateStringDef(0, 30),
+                                      minCellCountDef(1:(length(databaseIds) * 4))))
+
+    table <- DT::datatable(table,
+                           options = options,
+                           colnames = colnames(table) %>% camelCaseToTitleCase(),
+                           rownames = FALSE,
+                           container = sketch,
+                           escape = TRUE,
+                           filter = c("bottom"))
+
+    # formatStyle columns are 1-based: skip the visit-name column.
+    table <- DT::formatStyle(table = table,
+                             columns = 1:(length(databaseIds) * 4) + 1,
+                             background = DT::styleColorBar(c(0, maxSubjects), "lightblue"),
+                             backgroundSize = "98% 88%",
+                             backgroundRepeat = "no-repeat",
+                             backgroundPosition = "center")
+    return(table)
+  }, server = TRUE)
+  
+  # Cohort characterization table.
+  #
+  # When input$charType is "Pretty": the prepareTable1() rows with one
+  # proportion column per database and the cohort size in the header.
+  # Otherwise: every covariate with a mean and an SD column per database,
+  # sorted by the first database's mean (largest first).
+  #
+  # Yields a DT widget, or a one-cell "Note" tibble when data is missing.
+  output$characterizationTable <- DT::renderDataTable({
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    if (input$charType == "Pretty") {
+      analysisIds <- prettyAnalysisIds
+    } else {
+      analysisIds <- NULL
+    }
+    data <- getCovariateValueResult(dataSource = dataSource,
+                                    analysisIds = analysisIds,
+                                    cohortIds = cohortId(),
+                                    databaseIds = input$databases,
+                                    isTemporal = FALSE)
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = paste0("No data available for selected databases and cohorts")))
+    }
+
+    databaseIds <- sort(unique(data$databaseId))
+
+    # The headers below are laid out per database, so every selected database
+    # must actually be present in the result.
+    if (!all(input$databases %in% databaseIds)) {
+      return(dplyr::tibble(Note = paste0("There is no data for the databases:\n",
+                                         paste0(setdiff(input$databases, databaseIds),
+                                                collapse = ",\n "),
+                                         ".\n Please unselect them.")))
+    }
+
+    if (input$charType == "Pretty") {
+      # Cohort sizes for the "(n = ...)" header row, in database-id order.
+      countData <- getCohortCountResult(dataSource = dataSource,
+                                        databaseIds = input$databases,
+                                        cohortIds = cohortId()) %>%
+        dplyr::arrange(.data$databaseId)
+
+      table <- list()
+      characteristics <- list()
+      for (i in seq_along(databaseIds)) {
+        temp <- data %>%
+          dplyr::filter(.data$databaseId == databaseIds[i]) %>%
+          prepareTable1()
+        if (nrow(temp) > 0) {
+          table[[i]] <- temp %>%
+            dplyr::mutate(databaseId = databaseIds[i])
+          characteristics[[i]] <- table[[i]] %>%
+            dplyr::select(.data$characteristic, .data$position,
+                          .data$header, .data$sortOrder)
+        } else {
+          return(dplyr::tibble(Note = paste0(databaseIds[i], " does not have covariates that are part of pretty table. Please unselect.")))
+        }
+      }
+      # One shared row order across databases: union of all characteristics,
+      # renumbered after sorting by position, then crossed with the databases.
+      characteristics <- dplyr::bind_rows(characteristics) %>%
+        dplyr::distinct() %>%
+        dplyr::group_by(.data$characteristic, .data$position, .data$header) %>%
+        dplyr::summarise(sortOrder = max(.data$sortOrder)) %>%
+        dplyr::ungroup() %>%
+        dplyr::arrange(.data$position, desc(.data$header)) %>%
+        dplyr::mutate(sortOrder = dplyr::row_number()) %>%
+        dplyr::distinct() %>%
+        tidyr::crossing(dplyr::tibble(databaseId = input$databases)) %>%
+        dplyr::arrange(.data$databaseId, .data$sortOrder)
+
+      table <- characteristics %>%
+        dplyr::left_join(dplyr::bind_rows(table) %>%
+                           dplyr::select(-.data$sortOrder),
+                         by = c("characteristic", "position", "header", "databaseId")) %>%
+        dplyr::arrange(.data$sortOrder) %>%
+        tidyr::pivot_wider(id_cols = "characteristic",
+                           names_from = "databaseId",
+                           values_from = "value",
+                           names_sep = "_",
+                           names_prefix = "Value_")
+
+      # columnDefs targets are 0-based: column 0 is the characteristic name.
+      options <- list(pageLength = 100,
+                      searching = TRUE,
+                      scrollX = TRUE,
+                      scrollY = TRUE,
+                      lengthChange = TRUE,
+                      ordering = FALSE,
+                      paging = TRUE,
+                      columnDefs = list(
+                        truncateStringDef(0, 150),
+                        minCellPercentDef(seq_along(databaseIds))
+                      ))
+      # Three-row header: database id, cohort size, value type.
+      sketch <- htmltools::withTags(table(
+        class = "display",
+        thead(
+          tr(
+            th(rowspan = 3, "Covariate Name"),
+            lapply(databaseIds, th, colspan = 1, class = "dt-center")
+          ),
+          tr(
+            lapply(paste0("(n = ",
+                          format(countData$cohortSubjects, big.mark = ","), ")"),
+                   th,
+                   colspan = 1,
+                   class = "dt-center no-padding")
+          ),
+          tr(
+            lapply(rep(c("Proportion"),
+                       length(databaseIds)), th)
+          )
+        )
+      ))
+      table <- DT::datatable(table,
+                             options = options,
+                             rownames = FALSE,
+                             container = sketch,
+                             escape = FALSE,
+                             filter = c("bottom"),
+                             class = "stripe nowrap compact")
+
+      # formatStyle columns are 1-based: skip the characteristic column.
+      table <- DT::formatStyle(table = table,
+                               columns = 1 + seq_along(databaseIds),
+                               background = DT::styleColorBar(c(0, 1), "lightblue"),
+                               backgroundSize = "98% 88%",
+                               backgroundRepeat = "no-repeat",
+                               backgroundPosition = "center")
+    } else {
+      # Long -> wide: "<databaseId>_mean" and "<databaseId>_sd" per covariate,
+      # then re-attach the covariate name and concept id.
+      data <- data %>%
+        dplyr::arrange(.data$databaseId) %>%
+        tidyr::pivot_longer(cols = c(.data$mean, .data$sd)) %>%
+        dplyr::mutate(name = paste0(.data$databaseId, "_", .data$name)) %>%
+        tidyr::pivot_wider(id_cols = c(.data$covariateId),
+                           names_from = .data$name,
+                           values_from = .data$value) %>%
+        dplyr::inner_join(data %>% dplyr::select(.data$covariateId,
+                                                 .data$covariateName,
+                                                 .data$conceptId) %>%
+                            dplyr::distinct(),
+                          by = "covariateId") %>%
+        dplyr::select(-.data$covariateId) %>%
+        dplyr::relocate("covariateName", "conceptId") %>%
+        dplyr::distinct()
+
+      # Column 3 is the first database's mean. [[3]] hands order() a plain
+      # vector; data[3] would be a one-column tibble.
+      data <- data[order(-data[[3]]), ]
+
+      # columnDefs targets are 0-based: 0 = name, 1 = concept id, 2.. = values.
+      options <- list(pageLength = 100,
+                      searching = TRUE,
+                      searchHighlight = TRUE,
+                      scrollX = TRUE,
+                      scrollY = TRUE,
+                      lengthChange = TRUE,
+                      ordering = TRUE,
+                      paging = TRUE,
+                      columnDefs = list(
+                        truncateStringDef(0, 150),
+                        minCellRealDef(2:(1 + length(databaseIds) * 2), digits = 3)))
+      # Two-row header: database ids on top, Mean / SD underneath.
+      sketch <- htmltools::withTags(table(
+        class = "display",
+        thead(
+          tr(
+            th(rowspan = 2, "Covariate Name"),
+            th(rowspan = 2, "Concept Id"),
+            lapply(databaseIds, th, colspan = 2, class = "dt-center")
+          ),
+          tr(
+            lapply(rep(c("Mean", "SD"), length(databaseIds)), th)
+          )
+        )
+      ))
+      table <- DT::datatable(data,
+                             options = options,
+                             rownames = FALSE,
+                             container = sketch,
+                             escape = FALSE,
+                             filter = c("bottom"),
+                             class = "stripe nowrap compact")
+      # 1-based columns 3, 5, 7, ...: the mean column of each database.
+      table <- DT::formatStyle(table = table,
+                               columns = (1 + 2 * seq_along(databaseIds)),
+                               background = DT::styleColorBar(c(0, 1), "lightblue"),
+                               backgroundSize = "98% 88%",
+                               backgroundRepeat = "no-repeat",
+                               backgroundPosition = "center")
+    }
+    return(table)
+  })
+  
+  # Toggle set driven by input$rows: the second element of each published
+  # value is added when absent and removed when already present.
+  # NOTE(review): presumably that element is the covariate id of the clicked
+  # row of the temporal characterization table - confirm against the click
+  # callback that publishes 'rows'.
+  covariateIdArray <- reactiveVal(c())
+  observeEvent(input$rows, {
+    clickedValue <- input$rows[[2]]
+    currentValues <- covariateIdArray()
+    if (clickedValue %in% currentValues) {
+      covariateIdArray(currentValues[!(currentValues %in% clickedValue)])
+    } else {
+      covariateIdArray(c(currentValues, clickedValue))
+    }
+  })
+  
+  # Temporal characterization table: one row per covariate and one column per
+  # time window (the "choices" label from temporalCovariateChoices), holding
+  # the covariate mean, sorted by the first window (largest first).
+  #
+  # Clicking a cell publishes that row's data to Shiny as input$rows.
+  # Yields a DT widget, or a one-cell "Note" tibble when no rows come back.
+  output$temporalCharacterizationTable <- DT::renderDataTable(expr = {
+    # NOTE(review): the guard checks input$databases while the query below
+    # uses input$database - confirm this mismatch is intentional.
+    validate(need(length(input$databases) > 0, "No data sources chosen"))
+    validate(need(length(timeId()) > 0, "No time periods selected"))
+
+    data <- getCovariateValueResult(dataSource = dataSource,
+                                    cohortIds = cohortId(),
+                                    databaseIds = input$database,
+                                    timeIds = timeId(),
+                                    isTemporal = TRUE)
+    if (nrow(data) == 0) {
+      return(dplyr::tibble(Note = paste0("No data available for selected databases and cohorts")))
+    }
+
+    table <- data %>%
+      dplyr::inner_join(temporalCovariateChoices, by = "timeId") %>%
+      dplyr::arrange(.data$timeId) %>%
+      tidyr::pivot_wider(id_cols = c("covariateId", "covariateName", "conceptId"),
+                         names_from = "choices",
+                         values_from = "mean",
+                         names_sep = "_"
+      ) %>%
+      dplyr::select(-.data$conceptId) %>%
+      dplyr::relocate(.data$covariateName, .data$covariateId)
+
+    # Column 3 is the first time window. [[3]] hands order() a plain vector;
+    # table[3] would be a one-column tibble.
+    table <- table[order(-table[[3]]), ]
+
+    temporalCovariateChoicesSelected <- temporalCovariateChoices %>%
+      dplyr::filter(.data$timeId %in% c(timeId())) %>%
+      dplyr::arrange(.data$timeId)
+
+    # columnDefs targets are 0-based: 0 = name, 1 = covariate id, 2.. = windows.
+    options <- list(pageLength = 10,
+                    searching = TRUE,
+                    searchHighlight = TRUE,
+                    scrollX = TRUE,
+                    lengthChange = TRUE,
+                    ordering = TRUE,
+                    paging = TRUE,
+                    columnDefs = list(
+                      truncateStringDef(0, 150),
+                      minCellPercentDef(1:(length(temporalCovariateChoicesSelected$choices)) + 1)))
+
+    table <- DT::datatable(table,
+                           options = options,
+                           rownames = FALSE,
+                           colnames = colnames(table) %>%
+                             camelCaseToTitleCase(),
+                           escape = FALSE,
+                           filter = c("bottom"),
+                           class = "stripe nowrap compact",
+                           callback =  DT::JS("table.on('click.dt', 'td', function() {
+                                            var row_=table.row(this).data();
+                                            var data = [row_];
+                                            Shiny.onInputChange('rows',data );});"))
+    # formatStyle columns are 1-based: 3.. are the time-window columns.
+    table <- DT::formatStyle(table = table,
+                             columns = (2 + (1:length(temporalCovariateChoicesSelected$choices))),
+                             background = DT::styleColorBar(c(0, 1), "lightblue"),
+                             backgroundSize = "98% 88%",
+                             backgroundRepeat = "no-repeat",
+                             backgroundPosition = "center")
+    return(table)
+  }, server = TRUE)
+  
+  # Overlap results for every ordered pair of distinct selected cohorts,
+  # restricted to the databases in input$databases.
+  cohortOverlap <- reactive({
+    selectedCohortIds <- cohortIds()
+    cohortPairs <- tidyr::crossing(targetCohortId = selectedCohortIds,
+                                   comparatorCohortId = selectedCohortIds)
+    cohortPairs <- dplyr::filter(cohortPairs,
+                                 .data$targetCohortId != .data$comparatorCohortId)
+    cohortPairs <- dplyr::distinct(cohortPairs)
+    validate(need(nrow(cohortPairs) > 0, "Please select atleast two cohorts."))
+
+    getCohortOverlapResult(dataSource = dataSource,
+                           targetCohortIds = cohortPairs$targetCohortId,
+                           comparatorCohortIds = cohortPairs$comparatorCohortId,
+                           databaseIds = input$databases)
+  })
+  
+  # Cohort overlap plot; the y axis is chosen by input$overlapPlotType.
+  output$overlapPlot <- ggiraph::renderggiraph(expr = {
+    validate(need(length(cohortIds()) > 0, "Please select Target Cohort(s)"))
+
+    overlapData <- cohortOverlap()
+    validate(need(!is.null(overlapData), "No cohort overlap data for this combination"))
+
+    plotCohortOverlap(data = overlapData, yAxis = input$overlapPlotType)
+  })
+  
+  # Covariate balance between the selected cohorts: the output of
+  # compareCohortCharacteristics() plus an absStdDiff column, abs(stdDiff).
+  computeBalance <- shiny::reactive({
+    # Both sides of the comparison come from the same query (same cohorts,
+    # same databases), so fetch it once and pass it as both arguments.
+    covariates <- getCovariateValueResult(dataSource = dataSource,
+                                          cohortIds = cohortIds(),
+                                          databaseIds = input$databases,
+                                          isTemporal = FALSE)
+    balance <- compareCohortCharacteristics(covariates, covariates) %>%
+      dplyr::mutate(absStdDiff = abs(.data$stdDiff))
+    return(balance)
+  })
+  
+  # Cohort comparison table built from computeBalance().
+  #
+  # When input$charCompareType is "Pretty table": the prepareTable1Comp()
+  # rows with Target, Comparator and StdDiff columns. Otherwise: every
+  # covariate with mean/SD for both cohorts, sorted by |StdDiff| descending.
+  #
+  # Yields a DT widget, or a one-cell "Note" tibble when there is no data.
+  output$charCompareTable <- DT::renderDataTable(expr = {
+    balance <- computeBalance()
+    if (nrow(balance) == 0) {
+      return(dplyr::tibble(Note = "No data for the selected combination."))
+    }
+
+    if (input$charCompareType == "Pretty table") {
+      table <- prepareTable1Comp(balance)
+      if (nrow(table) > 0) {
+        table <- table %>%
+          dplyr::arrange(.data$sortOrder) %>%
+          dplyr::select(-.data$sortOrder)
+      } else {
+        return(dplyr::tibble(Note = "No data for covariates that are part of pretty table."))
+      }
+
+      # columnDefs targets are 0-based: 1 = Target, 2 = Comparator.
+      options <- list(pageLength = 100,
+                      searching = TRUE,
+                      scrollX = TRUE,
+                      searchHighlight = TRUE,
+                      lengthChange = TRUE,
+                      ordering = FALSE,
+                      paging = TRUE,
+                      columnDefs = list(minCellPercentDef(1:2)))
+
+      table <- DT::datatable(table,
+                             options = options,
+                             rownames = FALSE,
+                             colnames = c("Characteristic", "Target", "Comparator", "StdDiff"),
+                             escape = FALSE,
+                             filter = c("bottom"),
+                             class = "stripe nowrap compact")
+      # formatStyle / formatRound columns are 1-based.
+      table <- DT::formatStyle(table = table,
+                               columns = 2:3,
+                               background = DT::styleColorBar(c(0, 1), "lightblue"),
+                               backgroundSize = "98% 88%",
+                               backgroundRepeat = "no-repeat",
+                               backgroundPosition = "center")
+      table <- DT::formatStyle(table = table,
+                               columns = 4,
+                               background = styleAbsColorBar(1, "lightblue", "pink"),
+                               backgroundSize = "98% 88%",
+                               backgroundRepeat = "no-repeat",
+                               backgroundPosition = "center")
+      table <- DT::formatRound(table, 4, digits = 2)
+    } else {
+      table <- balance %>%
+        dplyr::select(.data$covariateName, .data$conceptId, .data$mean1, .data$sd1, .data$mean2, .data$sd2, .data$stdDiff)
+
+      # Largest absolute standardized difference first. Ordering on the
+      # column vector avoids handing order() a one-column data frame.
+      table <- table[order(-abs(table$stdDiff)), ]
+
+      # columnDefs targets are 0-based: 2..6 are the numeric columns.
+      options <- list(pageLength = 100,
+                      searching = TRUE,
+                      searchHighlight = TRUE,
+                      scrollX = TRUE,
+                      lengthChange = TRUE,
+                      ordering = TRUE,
+                      paging = TRUE,
+                      columnDefs = list(
+                        truncateStringDef(0, 150),
+                        minCellRealDef(2:6, digits = 2)))
+
+      table <- DT::datatable(table,
+                             options = options,
+                             rownames = FALSE,
+                             colnames = c("Covariate Name", "Concept ID", "Mean Target", "SD Target", "Mean Comparator", "SD Comparator", "StdDiff"),
+                             escape = FALSE,
+                             filter = c("bottom"),
+                             class = "stripe nowrap compact")
+      # 1-based columns 3 and 5: the two mean columns.
+      table <- DT::formatStyle(table = table,
+                               columns = c(3, 5),
+                               background = DT::styleColorBar(c(0, 1), "lightblue"),
+                               backgroundSize = "98% 88%",
+                               backgroundRepeat = "no-repeat",
+                               backgroundPosition = "center")
+      table <- DT::formatStyle(table = table,
+                               columns = 7,
+                               background = styleAbsColorBar(1, "lightblue", "pink"),
+                               backgroundSize = "98% 88%",
+                               backgroundRepeat = "no-repeat",
+                               backgroundPosition = "center")
+    }
+    return(table)
+  }, server = TRUE)
+  
+  # Balance data prepared for plotting: NAs replaced by 0, rows with a zero
+  # cohort id dropped, a comparisonGroup number per (cohortId1, cohortId2)
+  # pair, and name / short-name columns for both the target (cohortId1) and
+  # the comparator (cohortId2).
+  cohortCompare <- shiny::reactive({
+    balance <- computeBalance()
+
+    # NAs (in any column) become 0; a cohort id of 0 then marks an unusable row.
+    balance <- balance %>%
+      replace(is.na(.), 0) %>%
+      dplyr::filter(.data$cohortId1 != 0) %>%
+      dplyr::filter(.data$cohortId2 != 0)
+
+    # Number each distinct cohort pair.
+    balance <- balance %>%
+      dplyr::inner_join(
+        balance %>%
+          dplyr::select(.data$cohortId1,
+                        .data$cohortId2) %>%
+          dplyr::distinct() %>%
+          dplyr::arrange(.data$cohortId1,
+                         .data$cohortId2) %>%
+          dplyr::mutate(comparisonGroup = dplyr::row_number()),
+        by = c("cohortId1", "cohortId2")) %>%
+      dplyr::relocate(.data$comparisonGroup)
+
+    # Short names "C1", "C2", ... are numbered separately over the target ids
+    # and over the comparator ids. A cohort on both sides with the same
+    # number yields two identical rows; distinct() removes them so the joins
+    # below do not multiply balance rows.
+    # NOTE(review): if a cohort gets different numbers on the two sides it
+    # still appears twice with conflicting short names - confirm whether a
+    # single numbering over all cohort ids is intended.
+    combis <- dplyr::bind_rows(balance %>%
+                                 dplyr::select(.data$cohortId1) %>%
+                                 dplyr::distinct() %>%
+                                 dplyr::arrange(.data$cohortId1) %>%
+                                 dplyr::mutate(shortName = paste0('C', dplyr::row_number())) %>%
+                                 dplyr::rename(cohortId = .data$cohortId1),
+                               balance %>%
+                                 dplyr::select(.data$cohortId2) %>%
+                                 dplyr::distinct() %>%
+                                 dplyr::arrange(.data$cohortId2) %>%
+                                 dplyr::mutate(shortName = paste0('C', dplyr::row_number())) %>%
+                                 dplyr::rename(cohortId = .data$cohortId2)) %>%
+      dplyr::distinct() %>%
+      dplyr::inner_join(y = cohort %>%
+                          dplyr::select(.data$cohortId, .data$cohortName),
+                        by = "cohortId")
+
+    # Every short name starts with 'C', so the str_detect filters keep all rows.
+    balance <- balance %>%
+      dplyr::inner_join(y = combis %>%
+                          dplyr::filter(stringr::str_detect(string = .data$shortName,
+                                                            pattern = 'C')) %>%
+                          dplyr::rename(targetCohortId = .data$cohortId,
+                                        targetCohortName = .data$cohortName,
+                                        targetCohortShortName = .data$shortName),
+                        by = c("cohortId1" = "targetCohortId")) %>%
+      dplyr::inner_join(y = combis %>%
+                          dplyr::filter(stringr::str_detect(string = .data$shortName,
+                                                            pattern = 'C')) %>%
+                          dplyr::rename(comparatorCohortId = .data$cohortId,
+                                        comparatorCohortName = .data$cohortName,
+                                        comparatorCohortShortName = .data$shortName),
+                        by = c("cohortId2" = "comparatorCohortId"))
+
+    return(balance)
+  })
+  
+  # Standardized-difference scatter plot for the selected cohorts, limited to
+  # the covariate domain in input$domainId.
+  output$charComparePlot <- ggiraph::renderggiraph(expr = {
+    # A comparison needs two or more cohorts; the previous "!= 1" test let an
+    # empty selection through.
+    validate(need(length(cohortIds()) > 1, paste0("Please select atleast two different cohorts.")))
+    balance <- cohortCompare()
+    # Show the message through validate(): this renderer expects a plot, so
+    # returning a tibble here cannot be rendered.
+    validate(need(nrow(balance) > 0, "No data for the selected combination."))
+    # NOTE(review): labels use input$cohort / input$comparator while the data
+    # comes from cohortIds() - confirm these inputs exist in this UI.
+    plot <- plotCohortComparisonStandardizedDifference(balance = balance,
+                                                       domain = input$domainId,
+                                                       targetLabel = paste0("Mean in Target (", input$cohort, ")"),
+                                                       comparatorLabel = paste0("Mean in Comparator (", input$comparator, ")"))
+    return(plot)
+  })
+  
+  # output$databaseInformationPanel <- renderUI({
+  #   row <- database[database$databaseId == input$database, ]
+  #   text <- div(tags$p(tags$h3("ID"), wellPanel(row$databaseId)),
+  #               tags$p(tags$h3("Name"), wellPanel(row$databaseName)),
+  #               tags$p(tags$h3("Description"), wellPanel(row$description)))
+  #   return(text)
+  # })
+  
+  # Static table with the id, name and description of every database.
+  output$databaseInformationTable <- DT::renderDataTable(expr = {
+    databaseInfo <- database[, c("databaseId", "databaseName", "description")]
+    # 0-based targets: name takes 30% of the width, description 60%.
+    columnWidths <- list(list(width = "30%", targets = 1),
+                         list(width = "60%", targets = 2))
+    tableOptions <- list(pageLength = 20,
+                         searching = TRUE,
+                         lengthChange = TRUE,
+                         ordering = TRUE,
+                         paging = TRUE,
+                         searchHighlight = TRUE,
+                         columnDefs = columnWidths)
+    DT::datatable(databaseInfo,
+                  options = tableOptions,
+                  colnames = c("ID", "Name", "Description"),
+                  rownames = FALSE,
+                  class = "stripe compact")
+  }, server = TRUE)
+  
+  # Show a large, click-away-to-close modal whose body is the raw HTML read
+  # from `htmlFileName` and whose heading is `title`.
+  showInfoBox <- function(title, htmlFileName) {
+    # readChar needs a length; the file size covers the whole file.
+    fileSize <- file.info(htmlFileName)$size
+    body <- HTML(readChar(htmlFileName, fileSize))
+    dialog <- shiny::modalDialog(body,
+                                 title = title,
+                                 easyClose = TRUE,
+                                 footer = NULL,
+                                 size = "l")
+    shiny::showModal(dialog)
+  }
+  
+  # One observer per info input: input id -> c(modal title, help page path).
+  infoBoxPages <- list(
+    cohortCountsInfo = c("Cohort Counts", "html/cohortCounts.html"),
+    incidenceRateInfo = c("Incidence Rate", "html/incidenceRate.html"),
+    timeDistributionInfo = c("Time Distributions", "html/timeDistribution.html"),
+    includedConceptsInfo = c("Included (Source) Concepts", "html/includedConcepts.html"),
+    orphanConceptsInfo = c("Orphan (Source) Concepts", "html/orphanConcepts.html"),
+    inclusionRuleStatsInfo = c("Inclusion Rule Statistics", "html/inclusionRuleStats.html"),
+    indexEventBreakdownInfo = c("Index Event Breakdown", "html/indexEventBreakdown.html"),
+    visitContextInfo = c("Visit Context", "html/visitContext.html"),
+    cohortCharacterizationInfo = c("Cohort Characterization", "html/cohortCharacterization.html"),
+    temporalCharacterizationInfo = c("Temporal Characterization", "html/temporalCharacterization.html"),
+    cohortOverlapInfo = c("Cohort Overlap", "html/cohortOverlap.html"),
+    compareCohortCharacterizationInfo = c("Compare Cohort Characteristics", "html/compareCohortCharacterization.html")
+  )
+  # lapply (not a for loop) so each observer closes over its own infoId.
+  lapply(names(infoBoxPages), function(infoId) {
+    page <- infoBoxPages[[infoId]]
+    shiny::observeEvent(input[[infoId]], {
+      showInfoBox(page[[1]], page[[2]])
+    })
+  })
+  
+  # Echo the current value of input$database as text.
+  output$temporalCharacterizationSelectedDataBase <- shiny::renderText({
+    input$database
+  })
+  
+  # Cohort counts for cohortId() in input$database, joined to the `cohort`
+  # table and ordered by cohort name.
+  targetCohortCount <- shiny::reactive({
+    counts <- getCohortCountResult(dataSource = dataSource,
+                                   cohortIds = cohortId(),
+                                   databaseIds = input$database)
+    counts <- dplyr::left_join(counts, y = cohort, by = "cohortId")
+    dplyr::arrange(counts, .data$cohortName)
+  })
+  
+  # "Target: <cohort name> ( n = <subjects> )" heading for the target cohort.
+  targetCohortCountHtml <- shiny::reactive({
+    counts <- targetCohortCount()
+    subjectCount <- scales::comma(x = counts$cohortSubjects)
+
+    htmltools::tags$div(
+      htmltools::tags$h5("Target: ", counts$cohortName, " ( n = ", subjectCount, " )")
+    )
+  })
+  
+  # Target cohort heading shown on the temporal characterization output.
+  output$temporalCharacterizationSelectedCohort <- shiny::renderUI({
+    targetCohortCountHtml()
+  })
+  
+  # Target cohort heading shown on the inclusion rule statistics output.
+  output$inclusionRuleStatSelectedCohort <- shiny::renderUI({
+    targetCohortCountHtml()
+  })
+  
+  # Legend mapping each target short name to its cohort name, one per line,
+  # taken from cohortCompare().
+  output$compareCohortCharacterizationSelectedCohort <- shiny::renderUI({
+    cohorts <- cohortCompare() %>%
+      dplyr::distinct(.data$targetCohortShortName, .data$targetCohortName) %>%
+      dplyr::arrange(.data$targetCohortShortName)
+
+    entries <- paste(cohorts$targetCohortShortName, cohorts$targetCohortName, sep = ": ")
+    legend <- HTML(paste(entries, collapse = "</br>"))
+
+    htmltools::tags$div(
+      htmltools::tags$table(
+        htmltools::tags$tr(
+          htmltools::tags$td(legend)
+        )
+      )
+    )
+  })
+  
+  # Legend mapping each target short name to its cohort name, one per line,
+  # taken from cohortOverlap().
+  output$cohortOverlapSelectedCohort <- shiny::renderUI({
+    targetCohorts <- cohortOverlap() %>%
+      dplyr::distinct(.data$targetShortName, .data$targetCohortName) %>%
+      dplyr::arrange(.data$targetShortName)
+
+    entries <- paste(targetCohorts$targetShortName, targetCohorts$targetCohortName, sep = ": ")
+    legend <- HTML(paste(entries, collapse = "</br>"))
+
+    htmltools::tags$div(
+      htmltools::tags$table(
+        htmltools::tags$tr(
+          htmltools::tags$td(legend)
+        )
+      )
+    )
+  })
+  
+  # Legend mapping each short name to its cohort name, one per line, taken
+  # from incidenceRate().
+  output$incidenceRateSelectedCohort <- shiny::renderUI({
+    targetCohorts <- incidenceRate() %>%
+      dplyr::distinct(.data$shortName, .data$cohortName) %>%
+      dplyr::arrange(.data$shortName)
+
+    entries <- paste(targetCohorts$shortName, targetCohorts$cohortName, sep = ": ")
+    legend <- HTML(paste(entries, collapse = "</br>"))
+
+    htmltools::tags$div(
+      htmltools::tags$table(
+        htmltools::tags$tr(
+          htmltools::tags$td(legend)
+        )
+      )
+    )
+  })
+  
+  # Legend mapping each short name to its cohort name, one per line, taken
+  # from timeDist().
+  output$timeDistSelectedCohort <- shiny::renderUI({
+    targetCohorts <- timeDist() %>%
+      dplyr::distinct(.data$shortName, .data$cohortName) %>%
+      dplyr::arrange(.data$shortName)
+
+    entries <- paste(targetCohorts$shortName, targetCohorts$cohortName, sep = ": ")
+    legend <- HTML(paste(entries, collapse = "</br>"))
+
+    htmltools::tags$div(
+      htmltools::tags$table(
+        htmltools::tags$tr(
+          htmltools::tags$td(legend)
+        )
+      )
+    )
+  })
+  
+  #Download
+  # download_box <- function(exportname, plot){
+  #   downloadHandler(
+  #     filename = function() {
+  #       paste(exportname, Sys.Date(), ".png", sep = "")
+  #     },
+  #     content = function(file) {
+  #       ggplot2::ggsave(file, plot = plot, device = "png", width = 9, height = 7, dpi = 400)
+  #     }
+  #   )
+  # }
+  
+})
diff --git a/CohortDiagnosticsBreastCancer/ui.R b/CohortDiagnosticsBreastCancer/ui.R
new file mode 100644
index 00000000..d50211ec
--- /dev/null
+++ b/CohortDiagnosticsBreastCancer/ui.R
@@ -0,0 +1,467 @@
+library(magrittr)
+
+source("R/DisplayFunctions.R")
+source("R/Tables.R")
+source("R/Plots.R")
+source("R/Results.R")
+
+# Appends an "i" badge (a <small> tag with id `infoId` and the action-button
+# class) to the children of the first child of `item`; returns the changed item.
+addInfo <- function(item, infoId) {
+  badge <- tags$small(
+    "i",
+    class = "badge pull-right action-button",
+    style = "padding: 1px 6px 2px 6px; background-color: steelblue;",
+    type = "button", id = infoId
+  )
+  item$children[[1]]$children <- c(item$children[[1]]$children, list(badge))
+  item
+}
+
+appTitle <- if (exists("phenotypeDescription")) {
+  phenotypeLibraryModeDefaultTitle  # a phenotypeDescription object is present
+} else {
+  cohortDiagnosticModeDefaultTitle  # no phenotypeDescription object
+}
+
+# Header: the app title plus a "Phenotype ID" label and phenotype picker. The
+# two dropdown items are passed through `.list` and only built when
+# `phenotypeDescription` exists, so the UI can be built when it is absent.
+header <- shinydashboard::dashboardHeader(
+  title = appTitle,
+  .list = if (exists("phenotypeDescription")) list(
+    tags$li(
+      class = "dropdown",
+      tags$div(
+        tags$strong("Phenotype ID:"),
+        style = "color: white; margin-top: 14px; margin-right: 10px;"
+      )
+    ),
+    tags$li(
+      class = "dropdown",
+      tags$div(
+        style = "margin-top: 8px; margin-right: 10px; margin-bottom: -8px;",
+        shinyWidgets::pickerInput(
+          inputId = "phenotypes",
+          choices = phenotypeDescription$phenotypeName,
+          selected = phenotypeDescription$phenotypeName[1],
+          multiple = FALSE,
+          choicesOpt = list(style = rep_len("color: black;", 999)),
+          options = shinyWidgets::pickerOptions(
+            actionsBox = FALSE, liveSearch = TRUE, size = 20,
+            liveSearchStyle = "contains", virtualScroll = 50,
+            liveSearchPlaceholder = "Type here to search", dropdownAlignRight = TRUE
+          )
+        )
+      )
+    )
+  )
+)
+# Sidebar menu. A menu entry is added only when the object holding its data
+# exists (checked with exists()); all entries except "Description" and
+# "Database information" also get an info badge via addInfo(). The pickers
+# below the entries are wrapped in conditionalPanels keyed on the selected tab
+# (input.tabs), so each tab shows only the filters that apply to it.
+sidebarMenu <-
+  shinydashboard::sidebarMenu(
+    id = "tabs",
+    if (exists("phenotypeDescription") && exists("cohort"))
+      shinydashboard::menuItem(text = "Description", tabName = "description"),
+    if (exists("cohortCount"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Cohort Counts", tabName = "cohortCounts"),
+        infoId = "cohortCountsInfo"
+      ),
+    if (exists("incidenceRate"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Incidence Rate", tabName = "incidenceRate"),
+        infoId = "incidenceRateInfo"
+      ),
+    if (exists("timeDistribution"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Time Distributions", tabName = "timeDistribution"),
+        infoId = "timeDistributionInfo"
+      ),
+    if (exists("includedSourceConcept"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Included (Source) Concepts", tabName = "includedConcepts"),
+        infoId = "includedConceptsInfo"
+      ),
+    if (exists("orphanConcept"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Orphan (Source) Concepts", tabName = "orphanConcepts"),
+        infoId = "orphanConceptsInfo"
+      ),
+    if (exists("inclusionRuleStats"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Inclusion Rule Statistics", tabName = "inclusionRuleStats"),
+        infoId = "inclusionRuleStatsInfo"
+      ),
+    if (exists("indexEventBreakdown"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Index Event Breakdown", tabName = "indexEventBreakdown"),
+        infoId = "indexEventBreakdownInfo"
+      ),
+    if (exists("visitContext"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Visit Context", tabName = "visitContext"),
+        infoId = "visitContextInfo"
+      ),
+    if (exists("covariateValue"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Cohort Characterization", tabName = "cohortCharacterization"),
+        infoId = "cohortCharacterizationInfo"
+      ),
+    if (exists("temporalCovariateValue"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Temporal Characterization", tabName = "temporalCharacterization"),
+        infoId = "temporalCharacterizationInfo"
+      ),
+    if (exists("cohortOverlap"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Cohort Overlap", tabName = "cohortOverlap"),
+        infoId = "cohortOverlapInfo"
+      ),
+    if (exists("covariateValue"))
+      addInfo(
+        item = shinydashboard::menuItem(text = "Compare Cohort Char.", tabName = "compareCohortCharacterization"),
+        infoId = "compareCohortCharacterizationInfo"
+      ),
+    shinydashboard::menuItem(text = "Database information", tabName = "databaseInformation"),
+    shiny::conditionalPanel(
+      condition = "input.tabs!='incidenceRate' & input.tabs!='timeDistribution' & input.tabs!='cohortCharacterization' & input.tabs!='cohortCounts' & input.tabs!='indexEventBreakdown' & input.tabs!='databaseInformation' & input.tabs != 'description' & input.tabs != 'includedConcepts' & input.tabs != 'orphanConcepts' & input.tabs != 'inclusionRuleStats' & input.tabs != 'visitContext' & input.tabs != 'cohortOverlap' & input.tabs != 'compareCohortCharacterization'",
+      shinyWidgets::pickerInput(
+        inputId = "database",
+        label = "Database",
+        choices = database$databaseId,
+        selected = database$databaseId[1],
+        multiple = FALSE,
+        choicesOpt = list(style = rep_len("color: black;", 999)),
+        options = shinyWidgets::pickerOptions(
+          actionsBox = TRUE,
+          liveSearch = TRUE,
+          size = 10,
+          liveSearchStyle = "contains",
+          liveSearchPlaceholder = "Type here to search",
+          virtualScroll = 50
+        )
+      )
+    ),
+    shiny::conditionalPanel(
+      condition = "input.tabs=='incidenceRate' | input.tabs=='timeDistribution' | input.tabs=='cohortCharacterization' | input.tabs=='cohortCounts' | input.tabs=='indexEventBreakdown' | input.tabs == 'includedConcepts' | input.tabs == 'orphanConcepts' | input.tabs == 'inclusionRuleStats' | input.tabs == 'visitContext' | input.tabs == 'cohortOverlap' | input.tabs == 'compareCohortCharacterization'",
+      shinyWidgets::pickerInput(
+        inputId = "databases",
+        label = "Database",
+        choices = database$databaseId,
+        selected = database$databaseId[1],
+        multiple = TRUE,
+        choicesOpt = list(style = rep_len("color: black;", 999)),
+        options = shinyWidgets::pickerOptions(
+          actionsBox = TRUE,
+          liveSearch = TRUE,
+          size = 10,
+          liveSearchStyle = "contains",
+          liveSearchPlaceholder = "Type here to search",
+          virtualScroll = 50)
+      )
+    ),
+    if (exists("temporalCovariateValue")) {
+      shiny::conditionalPanel(
+        condition = "input.tabs=='temporalCharacterization'",
+        shinyWidgets::pickerInput(
+          inputId = "timeIdChoices",
+          label = "Temporal Choice",
+          choices = temporalCovariateChoices$choices,
+          multiple = TRUE,
+          choicesOpt = list(style = rep_len("color: black;", 999)),
+          # Preselect the choice with the smallest timeId plus any with timeId
+          # 1-5 (%in% ignores order and duplicates, so no unique()/sort()).
+          selected = temporalCovariateChoices %>%
+            dplyr::filter(
+              .data$timeId %in%
+                c(min(temporalCovariateChoices$timeId), 1:5)
+            ) %>%
+            dplyr::pull("choices"),
+          options = shinyWidgets::pickerOptions(
+            actionsBox = TRUE,
+            liveSearch = TRUE,
+            size = 10,
+            liveSearchStyle = "contains",
+            liveSearchPlaceholder = "Type here to search",
+            virtualScroll = 50)
+        )
+      )
+    },
+    shiny::conditionalPanel(
+      condition = "input.tabs!='cohortCounts' & 
+      input.tabs!='databaseInformation' & 
+      input.tabs != 'description' & 
+      input.tabs != 'cohortOverlap'&
+      input.tabs != 'compareCohortCharacterization' &
+      input.tabs != 'incidenceRate' &
+      input.tabs != 'timeDistribution'",
+      shinyWidgets::pickerInput(
+        inputId = "cohort",
+        label = "Cohorts",
+        choices = c(""),
+        multiple = FALSE,
+        choicesOpt = list(style = rep_len("color: black;", 999)),
+        options = shinyWidgets::pickerOptions(
+          actionsBox = TRUE,
+          liveSearch = TRUE,
+          liveSearchStyle = "contains",
+          size = 10,
+          liveSearchPlaceholder = "Type here to search",
+          virtualScroll = 50)
+      )
+    ),
+    shiny::conditionalPanel(
+      condition = "input.tabs=='includedConcepts' | input.tabs=='orphanConcepts'",
+      shinyWidgets::pickerInput(
+        inputId = "conceptSet",
+        label = "Concept Set",
+        choices = c(""),
+        multiple = FALSE,
+        choicesOpt = list(style = rep_len("color: black;", 999)),
+        options = shinyWidgets::pickerOptions(
+          actionsBox = TRUE,
+          liveSearch = TRUE,
+          size = 10,
+          liveSearchStyle = "contains",
+          liveSearchPlaceholder = "Type here to search",
+          virtualScroll = 50)
+      )
+    ),
+    shiny::conditionalPanel(
+      condition = "input.tabs == 'cohortOverlap' | input.tabs=='compareCohortCharacterization' | input.tabs=='incidenceRate' | input.tabs=='timeDistribution'" ,
+      shinyWidgets::pickerInput(
+        inputId = "cohorts",
+        label = "Cohorts",
+        choices = c(""),
+        selected = c(""),
+        multiple = TRUE,
+        choicesOpt = list(style = rep_len("color: black;", 999)),
+        options = shinyWidgets::pickerOptions(
+          actionsBox = TRUE,
+          liveSearch = TRUE,
+          liveSearchStyle = "contains",
+          size = 10,
+          liveSearchPlaceholder = "Type here to search",
+          virtualScroll = 50)
+      )
+    )
+  )
+
+# Sidebar container wrapping the menu object (width = NULL, not collapsed).
+sidebar <- shinydashboard::dashboardSidebar(
+  sidebarMenu, collapsed = FALSE, width = NULL)
+
+# Tab contents: one tabItem per sidebar tabName, holding the table/plot output
+# placeholders and the per-tab controls (radio buttons, checkboxes, pickers).
+bodyTabItems <- shinydashboard::tabItems(
+  shinydashboard::tabItem(
+    tabName = "description",
+    shinydashboard::box(
+      title = "Description",
+      width = NULL,
+      status = "primary",
+      shiny::tabsetPanel(type = "tabs",  # spelled out; no partial matching
+                         shiny::tabPanel(
+                           tags$br(),
+                           title = "Cohort",
+                           DT::dataTableOutput(outputId = "cohortDescriptionTable")),
+                         shiny::tabPanel(
+                           tags$br(),
+                           title = "Phenotype",
+                           DT::dataTableOutput(outputId = "phenoTypeDescriptionTable"))
+      )
+    )
+  ),
+  shinydashboard::tabItem(tabName = "cohortCounts",
+                          DT::dataTableOutput("cohortCountsTable")),
+  shinydashboard::tabItem(
+    tabName = "incidenceRate",
+    shiny::uiOutput(outputId = "incidenceRateSelectedCohort"),
+    shinydashboard::box(
+      title = "Incidence Rate",
+      width = NULL,
+      status = "primary",
+      tags$table(style = "width: 100%",
+                 tags$tr(
+                   tags$td(
+                     valign = "bottom",
+                     shiny::checkboxGroupInput(
+                       inputId = "irStratification",
+                       label = "Stratify by",
+                       choices = c("Age", "Gender", "Calendar Year"),
+                       selected = c("Age", "Gender", "Calendar Year"),
+                       inline = TRUE
+                     )
+                   ),
+                   tags$td(HTML("&nbsp;&nbsp;&nbsp;&nbsp;")),
+                   tags$td(
+                     valign = "bottom",
+                     style = "text-align: right",
+                     shiny::checkboxInput("irYscaleFixed", "Use same y-scale across databases")
+                   )
+                 )),
+      shiny::htmlOutput(outputId = "hoverInfoIr"),
+      ggiraph::ggiraphOutput(outputId = "incidenceRatePlot", width = "100%", height = "100%")
+    )
+  ),
+  shinydashboard::tabItem(
+    tabName = "timeDistribution",
+    shiny::uiOutput(outputId = "timeDistSelectedCohort"),
+    shinydashboard::box(
+      title = "Time Distributions",
+      width = NULL,
+      status = "primary",
+      tags$br(),
+      ggiraph::ggiraphOutput("timeDisPlot", width = "100%", height = "100%")
+    ),
+    shinydashboard::box(
+      title = "Time Distributions Table",
+      width = NULL,
+      status = "primary",
+      DT::dataTableOutput("timeDistTable")
+    )
+  ),
+  shinydashboard::tabItem(
+    tabName = "includedConcepts",
+    shiny::radioButtons(
+      inputId = "includedType",
+      label = "",
+      choices = c("Source Concepts", "Standard Concepts"),
+      selected = "Source Concepts",
+      inline = TRUE
+    ),
+    DT::dataTableOutput("includedConceptsTable")
+  ),
+  shinydashboard::tabItem(tabName = "orphanConcepts",
+                          DT::dataTableOutput("orphanConceptsTable")),
+  shinydashboard::tabItem(tabName = "inclusionRuleStats",
+                          div(style = "font-size:15px;font-weight: bold", "Target cohort:"),
+                          shiny::htmlOutput(outputId = "inclusionRuleStatSelectedCohort"),
+                          tags$br(),
+                          DT::dataTableOutput("inclusionRuleTable")),
+  shinydashboard::tabItem(tabName = "indexEventBreakdown",
+                          DT::dataTableOutput("breakdownTable")),
+  shinydashboard::tabItem(tabName = "visitContext",
+                          DT::dataTableOutput("visitContextTable")),
+  shinydashboard::tabItem(
+    tabName = "cohortCharacterization",
+    shiny::radioButtons(
+      inputId = "charType",
+      label = "",
+      choices = c("Pretty", "Raw"),
+      selected = "Pretty",
+      inline = TRUE
+    ),
+    div(style = "font-size:15px;font-weight: bold", "Target cohort:"),
+    shiny::textOutput(outputId = "cohortCharacterizationSelectedCohort"),
+    tags$br(),
+    DT::dataTableOutput("characterizationTable")
+  ),
+  shinydashboard::tabItem(
+    tabName = "temporalCharacterization",
+    tags$table(style = "width: 100%",
+               tags$tr(
+                 tags$td(
+                   shiny::htmlOutput(outputId = "temporalCharacterizationSelectedCohort")
+                 ),
+                 tags$td(
+                   style = "text-align: right",
+                   div("Selected database:"),
+                   shiny::textOutput(outputId = "temporalCharacterizationSelectedDataBase")
+                 ),
+                 tags$td(HTML("&nbsp;&nbsp;&nbsp;&nbsp;"))
+               )
+    ),
+    shinydashboard::box(
+      title = "Temporal Characterization Table",
+      width = NULL,
+      status = "primary",
+      DT::dataTableOutput("temporalCharacterizationTable")
+    )
+    # ,
+    # shinydashboard::box(
+    #   title = "Temporal Characterization Plot",
+    #   width = NULL,
+    #   status = "primary",
+    #   ggiraph::ggiraphOutput(
+    #     outputId = "covariateTimeSeriesPlot")
+    # )
+  ),
+  shinydashboard::tabItem(
+    tabName = "cohortOverlap",
+    shiny::uiOutput(outputId = "cohortOverlapSelectedCohort"),
+    shinydashboard::box(
+      title = "Cohort Overlap (Subjects)",
+      width = NULL,
+      status = "primary",
+      shiny::radioButtons(
+        inputId = "overlapPlotType",
+        label = "",
+        choices = c("Percentages", "Counts"),
+        selected = "Percentages",
+        inline = TRUE
+      ),
+      ggiraph::ggiraphOutput("overlapPlot", width = "100%", height = 600)
+    )
+    # shinydashboard::box(
+    #   title = "Cohort Overlap Statistics",
+    #   width = NULL,
+    #   status = "primary",
+    #   DT::dataTableOutput("overlapTable")
+    # )
+  ),
+  shinydashboard::tabItem(
+    tabName = "compareCohortCharacterization",
+    shiny::radioButtons(
+      inputId = "charCompareType",
+      label = "",
+      choices = c("Pretty table", "Raw table", "Plot"),
+      selected = "Pretty table",
+      inline = TRUE
+    ),
+    shiny::conditionalPanel(condition = "input.charCompareType=='Pretty table' | input.charCompareType=='Raw table'",
+                            DT::dataTableOutput("charCompareTable")),
+    shiny::conditionalPanel(
+      condition = "input.charCompareType=='Plot'",
+      shinydashboard::box(
+        title = "Compare Cohort Characterization",
+        width = NULL,
+        status = "primary",
+        shiny::htmlOutput("compareCohortCharacterizationSelectedCohort"),
+        shinyWidgets::pickerInput(
+          inputId = "domainId",
+          label = "Filter By Domain",
+          choices = c("all","condition", "device", "drug", "measurement", "observation", "procedure", "other"),
+          multiple = FALSE,
+          choicesOpt = list(style = rep_len("color: black;", 999)),
+          options = shinyWidgets::pickerOptions(
+            actionsBox = TRUE,
+            liveSearch = TRUE,
+            size = 10,
+            liveSearchStyle = 'contains',
+            liveSearchPlaceholder = "Type here to search",
+            virtualScroll = 50)
+        ),
+        ggiraph::ggiraphOutput(outputId = "charComparePlot", width = "100%", height = "100%")
+      )
+    )
+  ),
+  shinydashboard::tabItem(tabName = "databaseInformation",
+                          # uiOutput("databaseInformationPanel")
+                          DT::dataTableOutput("databaseInformationTable"))
+)
+
+
+# Dashboard body wrapping the tab items.
+body <- shinydashboard::dashboardBody(bodyTabItems)
+# Assemble the page; this call is the final expression of the script.
+shinydashboard::dashboardPage(
+  header = header,
+  sidebar = sidebar,
+  body = body
+)