## Modified version of mapscape. Cannot be put into the same package as some
## of the components conflict
library(xcrmapscape)
library(htmlwidgets)

library(ithi.utils)
load_base_libs()
library(ithi.meta)
library(ithi.ihc)
library(ithi.xcr)
library(ithi.figures)
library(ithi.clones)

Parameters

db_path <- snakemake@params$db

mapscape_input_directories = snakemake@input$mapscape_inputs
xcr_table_path <- snakemake@input$xcr_table
show_full_track <- (snakemake@params$track_option == "full")
full_page_mode <- (snakemake@params$page_mode == "full")
segment_type <- snakemake@params$segment_type

clone_tree_file <- snakemake@input$clone_tree_file
clone_prevalence_file <- snakemake@input$clone_prevalence_file
clone_branch_length_file <- snakemake@input$clone_branch_length_file
db <- src_sqlite(db_path, create = FALSE)
andrew_map <- collect(tbl(db, "andrew_map"))
distance_method <- "horn"

tree_branch_data <- read_clone_tree_data(clone_tree_file, clone_branch_length_file, 
    clone_prevalence_file, db_path)
xcr_table <- read_clonotypes(xcr_table_path, duplicates = FALSE, db_path)

Read 36.1% of 304822 rows
Read 85.3% of 304822 rows
Read 304822 rows and 18 (of 18) columns from 0.070 GB file in 00:00:05
annotation_colours <- ithi.figures::get_annotation_colours()
tcr_segment_type <- "TRB"
bcr_segment_type <- "IGH"

patients <- unique(xcr_table$patient_id)

id_type <- "condensed_id"

dists <- lapply(patients, function(patient) {
    tcr_clonotypes <- subset(xcr_table, type == tcr_segment_type & patient_id == 
        patient)
    bcr_clonotypes <- subset(xcr_table, type == bcr_segment_type & patient_id == 
        patient)
    tcr_cross_table <- ithi.xcr::cross_tabulate(tcr_clonotypes, id_type = id_type)
    bcr_cross_table <- ithi.xcr::cross_tabulate(bcr_clonotypes, id_type = id_type)
    
    cross_tables <- list(tcr = tcr_cross_table, bcr = bcr_cross_table)
    
    distance_matrices <- lapply(cross_tables, function(cross_table) {
        distmat <- ithi.xcr::compute_immune_distance_matrix(cross_table, method = distance_method)
        mat <- as.matrix(distmat)
        return(mat)
    })
    return(distance_matrices)
})
tcr_dists <- lapply(dists, function(x) x$tcr)
bcr_dists <- lapply(dists, function(x) x$bcr)

xcr_dists <- tibble::tibble(patient_id = patients, tcr = tcr_dists, bcr = bcr_dists)
xcr_dists$patient_id <- factor(xcr_dists$patient_id)
xcr_dists <- xcr_dists[order(xcr_dists$patient_id), ]


trees <- lapply(tree_branch_data, function(x) x$tree)
prevalences <- plyr::rbind.fill(lapply(tree_branch_data, function(x) x$prevalence_dat))
branch_lengths <- plyr::rbind.fill(lapply(tree_branch_data, function(x) x$branch_dat))

ccfs <- ithi.clones::compute_ccf(prevalences, trees, id_type = id_type)
ccfs_labeled <- merge(ccfs, branch_lengths, by = c("label", "node", "patient_id"))

## Need non-normalized distances
clone_dists <- ithi.clones::clone_distances(ccfs_labeled, normalize = FALSE, 
    id_type = "condensed_id")

clone_dists$patient_id <- factor(clone_dists$patient_id)

total_dists <- inner_join(clone_dists, xcr_dists)


pairwise_similarities <- plyr::rbind.fill(lapply(1:nrow(total_dists), function(i) {
    clone_distmat <- total_dists[i, ]$dist_clones_weighted[[1]]
    tcr_distmat <- total_dists[i, ]$tcr[[1]]
    bcr_distmat <- total_dists[i, ]$bcr[[1]]
    
    inputs <- list(clone_distmat, tcr_distmat, bcr_distmat)
    names(inputs) <- c("clones", "tcr", "bcr")
    
    patient_id <- total_dists[i, ]$patient_id
    
    pairwise_sims <- cbind(patient_id = patient_id, ithi.supp:::compute_overlap_similarities(inputs))
    return(pairwise_sims)
}))
pairwise_similarities$patient_id <- factor(pairwise_similarities$patient_id)

dissimilarity_matrices <- dplyr::bind_rows(lapply(1:nrow(total_dists), function(i) {
    clone_distmat <- total_dists[i, ]$dist_clones_weighted[[1]]
    tcr_distmat <- total_dists[i, ]$tcr[[1]]
    bcr_distmat <- total_dists[i, ]$bcr[[1]]
    patient_id <- total_dists[i, ]$patient_id
    
    inputs <- list(clone_distmat, tcr_distmat, bcr_distmat)
    names(inputs) <- c("clones", "tcr", "bcr")
    
    matrices_subset <- ithi.supp:::compute_overlap_matrices(inputs)
    names(matrices_subset) <- names(inputs)
    
    tibble(patient_id = patient_id, clones = list(matrices_subset$clones), tcr = list(matrices_subset$tcr), 
        bcr = list(matrices_subset$bcr))
}))

segment_name <- plyr::mapvalues(segment_type, from = c("TRB", "IGH"), to = c("tcr", 
    "bcr"))

stats <- plyr::rbind.fill(lapply(1:nrow(dissimilarity_matrices), function(i) {
    row <- dissimilarity_matrices[i, ]
    xcrmat <- dissimilarity_matrices[, segment_name][[1]][[i]]
    clonemat <- dissimilarity_matrices$clones[[i]]
    
    manttest <- vegan::mantel(xcrmat, clonemat, method = "pearson")
    data.frame(patient_id = row$patient_id, p.value = manttest$signif, stat = manttest$statistic)
}))
plot_xcrmapscape <- function(clonal_prev, sample_locations, tree_edges, chord_data, 
    track_data, resize_factor, plot_title, full_page_mode, pvalue) {
    img_ref = "/shahlab/alzhang/projects/ITH_Immune/paper/miscellaneous/FF4D00-0.8.png"
    # img_ref =
    # '~/shahlab/projects/ITH_Immune/paper/miscellaneous/FF4D00-0.8.png'
    
    if (!full_page_mode) {
        xcrmapscape::xcrmapscape(clonal_prev = clonal_prev, tree_edges = tree_edges, 
            sample_locations = sample_locations, img_ref = img_ref, show_warnings = FALSE, 
            chord_data = chord_data, track_data = track_data, resize_factor = resize_factor, 
            plot_title = plot_title, phylo_stroke_width = "5px", phylo_stroke_color = "#000000", 
            legendTitleHeight = 26, centerSize = 0.6, treeRelativeSize = 0, 
            titleScaleFactor = 28, pvalue = pvalue)
    } else {
        xcrmapscape::xcrmapscape(clonal_prev = clonal_prev, tree_edges = tree_edges, 
            sample_locations = sample_locations, img_ref = img_ref, show_warnings = FALSE, 
            chord_data = chord_data, track_data = track_data, resize_factor = resize_factor, 
            plot_title = plot_title, phylo_stroke_width = "1px", phylo_stroke_color = "#9E9A9A", 
            legendTitleHeight = 16, centerSize = 0.5, treeRelativeSize = 0.33, 
            titleScaleFactor = 40, pvalue = pvalue)
    }
}
intersect_table <- compute_overlap_table(xcr_table, segment_type = segment_type, 
    prevalence_option = "clones", id_type = "condensed_id")
intersect_table$patient1 <- ithi.meta::map_id(intersect_table$sample1, from = "condensed_id", 
    to = "patient_id", db_path)
intersect_table$patient2 <- ithi.meta::map_id(intersect_table$sample2, from = "condensed_id", 
    to = "patient_id", db_path)

intersect_table <- subset(intersect_table, patient1 == patient2)

clonotype_table <- subset(xcr_table, type == segment_type)
clonotype_counts <- clonotype_table %>% group_by(condensed_id, patient_id) %>% 
    summarise(n = n()) %>% plyr::rename(c(condensed_id = "label", n = "len"))
reformat_andrew_table <- function(dat, db_path, patient_id) {
    dat$patient_id <- patient_id
    dat <- subset(dat, !sample_id %in% c("Pv2", "Rec2", "Rec3"))
    dat <- dat %>% plyr::rename(c(sample_id = "plot_id", long_sample_id = "sample_id"))
    dat_remapped <- ithi.meta::remap_sample_ids(dat, db_path)
    dat_remapped$abbrev_id <- stringr::str_extract(dat_remapped$condensed_id, 
        "[A-Za-z0-9]+$")
    dat_remapped <- dat_remapped %>% plyr::rename(c(sample_id = "old_sample_id", 
        sample_key = "long_sample_id", plot_id = "old_plot_id", abbrev_id = "sample_id"))
    if ("location_id" %in% colnames(dat_remapped)) {
        dat_remapped$location_id <- dat_remapped$sample_id
    }
    return(dat_remapped)
}

export_cydney_inputs <- function(xcr_table, patient_id, mapscape_base_dir = "/Users/alzhang/shahlab/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC", 
    outdir) {
    patient_tmp <- patient_id
    clonotypes_sub <- xcr_table[(xcr_table$type == segment_type) & (xcr_table$patient_id == 
        as.numeric(patient_tmp)), ]
    clonotypes_sub$condensed_id <- factor(clonotypes_sub$condensed_id)
    cross_table <- ithi.xcr::cross_tabulate(clonotypes_sub, id_type = "condensed_id")
    colnames(cross_table) <- str_replace(colnames(cross_table), "^[0-9]+_", 
        "")
    
    bin_cross_table <- cross_table
    bin_cross_table[bin_cross_table > 0] <- 1
    coln <- colnames(cross_table)
    
    cross_summary <- bin_cross_table %>% group_by_(.dots = coln) %>% summarise(n_shared_clonotypes = n())
    
    dir <- file.path(mapscape_base_dir, patient_id)
    
    clonal_prev = read.table(file.path(dir, "clonal_prevalence_table.tsv"), 
        sep = "\t", header = T)
    tree_edges = read.table(file.path(dir, "tree_edges.tsv"), sep = "\t", header = T)
    
    root <- tree_edges$source[!(tree_edges$source %in% tree_edges$target)]
    tree_edges <- subset(tree_edges, source != root)
    clonal_prev <- reformat_andrew_table(clonal_prev, db_path, patient_id)
    # clonal_prev <- subset(clonal_prev, long_sample_id %in% sample_ids)
    
    clonal_prev_short <- subset(clonal_prev, !duplicate, select = c(patient_id, 
        clone_id, clone_idx, condensed_id, site_id, clonal_prev))
    
    if (!dir.exists(outdir)) {
        dir.create(outdir)
        
        clone_file_output <- file.path(outdir, "clone_prevalences.tsv")
        tree_edges_output <- file.path(outdir, "tree_edges.tsv")
        intersect_output <- file.path(outdir, "intersect.tsv")
        
        write.table(clonal_prev_short, file = clone_file_output, sep = "\t", 
            quote = FALSE, row.names = FALSE, col.names = TRUE)
        write.table(tree_edges, file = tree_edges_output, sep = "\t", quote = FALSE, 
            row.names = FALSE, col.names = TRUE)
        write.table(cross_summary, file = intersect_output, sep = "\t", quote = FALSE, 
            row.names = FALSE, col.names = TRUE)
    }
}

Plots

htmltools::tagList(lapply(mapscape_input_directories, function(dir) {
    patient_id <- stringr::str_extract(dir, "[0-9]+$")
    df <- subset(intersect_table, patient1 == patient_id)
    clonal_prev = read.table(file.path(dir, "clonal_prevalence_table.tsv"), 
        sep = "\t", header = T)
    tree_edges = read.table(file.path(dir, "tree_edges.tsv"), sep = "\t", header = T)
    
    root <- tree_edges$source[!(tree_edges$source %in% tree_edges$target)]
    tree_edges <- subset(tree_edges, source != root)
    
    sample_locations = read.table(file.path(dir, "sample_locations.tsv"), sep = "\t", 
        header = T)
    sample_locations$long_sample_id <- df_as_map(clonal_prev, sample_locations$sample_id, 
        from = "sample_id", to = "long_sample_id")
    
    clonal_prev <- reformat_andrew_table(clonal_prev, db_path, patient_id)
    sample_locations <- reformat_andrew_table(sample_locations, db_path, patient_id)
    
    # df <- merge(df, subset(andrew_map, select=c(sample_key, sample_id)),
    # by.x=c('sample1'), by.y=c('sample_key')) %>%
    # plyr::rename(c('sample_id'='sample_id1')) df <- merge(df,
    # subset(andrew_map, select=c(sample_key, sample_id)), by.x=c('sample2'),
    # by.y=c('sample_key')) %>% plyr::rename(c('sample_id'='sample_id2'))
    
    clonotype_counts_sub <- clonotype_counts[as.character(clonotype_counts$patient_id) == 
        patient_id, ]
    
    patient_tmp <- patient_id
    
    clonotypes_sub <- xcr_table[(xcr_table$type == segment_type) & (xcr_table$patient_id == 
        as.numeric(patient_tmp)), ]
    clonotypes_sub$condensed_id <- factor(clonotypes_sub$condensed_id)
    cross_table <- ithi.xcr::cross_tabulate(clonotypes_sub, id_type = "condensed_id")
    
    # df$sample1 <- df$sample_id1 df$sample2 <- df$sample_id2
    
    sample_ids <- intersect(clonal_prev$long_sample_id, unique(df$sample1))
    
    if (length(sample_ids) == 0) {
        return(NULL)
    }
    
    df <- subset(df, (sample1 %in% sample_ids) & (sample2 %in% sample_ids))
    df$sample1 <- factor(df$sample1, levels = sample_ids)
    df$sample2 <- factor(df$sample2, levels = sample_ids)
    df <- df[order(df$sample1), ]
    
    ## IF YOU ONLY WANT THE INTERSECTION TO BE SHOWN, JUST SET CLONOTYPE TABLE TO
    ## NULL Otherwise set it to clonotype_counts_sub
    if (show_full_track) {
        res <- ithi.figures::format_xcrcircos_data(df, clonotype_counts = clonotype_counts_sub, 
            cross_table = cross_table)
    } else {
        res <- ithi.figures::format_xcrcircos_data(df, clonotype_counts = NULL)
    }
    chord_data <- res$chords
    track_data <- as.data.frame(res$tracks)
    
    resize_factor <- min(sum(track_data$len)/max(track_data$len) * 1/nrow(track_data), 
        0.9)
    
    clonal_prev <- subset(clonal_prev, long_sample_id %in% sample_ids)
    sample_locations <- subset(sample_locations, sample_id %in% clonal_prev$sample_id)
    
    if (!full_page_mode) {
        plot_title <- paste0("Patient ", patient_id)
    } else {
        plot_title <- ""
    }
    
    pvalue <- subset(stats, patient_id == patient_tmp)$p.value
    
    ## TODO: Extract pvalues from XCR-clone correlation
    
    print(patient_id)
    plot_xcrmapscape(clonal_prev, sample_locations, tree_edges, chord_data = chord_data, 
        track_data = track_data, resize_factor = resize_factor, plot_title = plot_title, 
        full_page_mode = full_page_mode, pvalue = round(pvalue, 3))
}))
[1] "1"
[1] "2"
[1] "3"
[1] "4"
[1] "7"
[1] "9"
[1] "10"
[1] "11"
[1] "12"
[1] "13"
[1] "14"
[1] "15"
[1] "16"
[1] "17"
---
title: "XCR-Mapscape plots"
output: 
  html_notebook:
    toc: true
    toc_depth: 5
    toc_float: true
params:
  rmd: "xcrmapscape.Rmd"
---
                        ```{r, echo=FALSE, message=FALSE, warning=FALSE}

######## Snakemake header ########
library(methods)
Snakemake <- setClass(
    "Snakemake",
    slots = c(
        input = "list",
        output = "list",
        params = "list",
        wildcards = "list",
        threads = "numeric",
        log = "list",
        resources = "list",
        config = "list",
        rule = "character"
    )
)
snakemake <- Snakemake(
    input = list('/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/1', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/2', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/3', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/4', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/7', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/9', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/10', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/11', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/12', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/13', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/14', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/15', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/16', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/17', '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/xcr_table.tsv', '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/clones/tree_data.tsv', 'Rmd/xcrmapscape.Rmd', '/shahlab/alzhang/projects/ITH_Immune/paper/analysis/Rmd/_site.yml', '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/clones/branch_data.tsv', '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/clones/clone_data.tsv', "mapscape_inputs" = c('/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/1', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/2', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/3', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/4', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/7', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/9', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/10', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/11', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/12', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/13', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/14', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/15', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/16', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC/17'), "xcr_table" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/xcr_table.tsv', "clone_tree_file" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/clones/tree_data.tsv', "notebook" = 'Rmd/xcrmapscape.Rmd', "site_file" = '/shahlab/alzhang/projects/ITH_Immune/paper/analysis/Rmd/_site.yml', "clone_branch_length_file" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/clones/branch_data.tsv', "clone_prevalence_file" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2/clones/clone_data.tsv'),
    output = list('/shahlab/alzhang/projects/ITH_Immune/paper/results/web/xcrmapscape_full.nb.html'),
    params = list('/shahlab/alzhang/projects/ITH_Immune/metadata/db/immune_project.sqlite3', 'ithi-analysis-plot_xcrmapscapes-full', 'full', 'TRB', 'shrink', "db" = '/shahlab/alzhang/projects/ITH_Immune/metadata/db/immune_project.sqlite3', "name" = 'ithi-analysis-plot_xcrmapscapes-full', "page_mode" = 'shrink', "segment_type" = 'TRB', "track_option" = 'full'),
    wildcards = list(),
    threads = 1,
    log = list('/shahlab/alzhang/clusttmp/paperanalysis2/plot_xcrmapscape_full.log'),
    resources = list(),
    config = list("tilmapscape_files" = c('/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/1.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/2.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/3.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/4.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/7.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/9.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/10.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/11.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/12.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/13.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/14.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/15.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/16.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/tilmapscape/17.svg'), "immune_variability_notebook" = 'Rmd/immune_variability.Rmd', "bcr_diversity" = '/shahlab/alzhang/pipeline_outputs/ith_immune/mixcr/mixcr_runs/ith_1_2_3/mixcr5/postprocess/IGH/postfilter_diversity_stats/diversity.strict.resampled.txt', "driver_map" = '/shahlab/alzhang/projects/ITH_Immune/subprojects/drivers/data/gene_list_mapped.bed', "xcr_qc_notebook" = 'Rmd/replicates.Rmd', "nanostring_data" = '/shahlab/alzhang/projects/ITH_Immune/results/nanostring_results/ith_full/qc/limma_quantile/normalized_expression_voa_labels_filtered.tsv', "benchmarkdir" = '/shahlab/alzhang/benchmarks/paperanalysis2', "icgc_expr_melted" = '/shahlab/alzhang/data/ICGC/OVAU_expr_melted.tsv', "logdir" = '/shahlab/alzhang/clusttmp/paperanalysis2', "xcrmapscape_bcr_patient_order" = c(9, 4, 12, 1, 15, 14, 11, 10, 2, 17, 13, 3, 16, 7), "driver_analysis_notebook" = 'Rmd/driver_analysis.Rmd', "known_subtype_file" = '/shahlab/alzhang/projects/ITH_Immune/data/expression/array/subtypes/known_subtypes.tsv', "example_annotations" = '/shahlab/alzhang/pipeline_outputs/ith_immune/igpartition/run13/final_partitions/ith2_2/clust9/annotations_flagged.tsv', "xcr_mapping_notebook" = 'Rmd/xcr_mapping.Rmd', "j_dictionary" = '/shahlab/alzhang/projects/ITH_Immune/subprojects/immtyper/metadata/imgt/Homo_sapiens_TRBJ.fasta', "nanostring_signature_notebook" = 'Rmd/nanostring_signatures.Rmd', "nanostring_annotations" = '/shahlab/alzhang/projects/ITH_Immune/data/expression/nanostring/pancancer_annotations.tsv', "thumbnail2" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/extra_plots/15_ROv2/thumbnail_image.tiff', "known_subtypes_merged" = '/shahlab/alzhang/projects/ITH_Immune/data/expression/known_subtypes_merged.tsv', "notebook_dir" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/web', "bcrphylo_examples_notebook" = 'Rmd/bcr_phylo_examples.Rmd', "clonal_samplers" = c('HMC', 'NUTS'), "proportion_subclonal_file" = '/shahlab/alzhang/projects/ITH_Immune/data/ith/complete/old_proportion_subclonal.tsv', "tils_for_variability" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density'), "master_breakpoint_file" = '/shahlab/amcpherson/projects/ith3/ith3/notebooks/bespoke/ith_breakpoints.tsv', "mmctm_sample_result_dir" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-sample/output', "mmctm_patient_ad_sigplot" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-patient-ancestry/plots/ith-by-patient-ancestry_snv-sv_sigs_multipanel.pdf', "immtyper_models" = '/shahlab/alzhang/projects/ITH_Immune/results/immtyper_results/klarenbeek/aa_vj/gradboost', "v_dictionary" = '/shahlab/alzhang/projects/ITH_Immune/subprojects/immtyper/metadata/imgt/Homo_sapiens_TRBV.fasta', "image_summary_file2" = '/shahlab/alzhang/data/ithi/yuan_hecr_image_results_2.csv', "patients_for_clonal" = c(1, 2, 3, 4, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17), "mmctm_sample_sigplot" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-sample/plots/ith-by-sample_snv-sv_sigs_multipanel.pdf', "nscatters" = 1, "phenotype_threshold" = 0.85, "yinyin_image_summary" = '/shahlab/alzhang/data/ithi/yuan_hecr_image_results.csv', "library_sizes" = '/shahlab/alzhang/pipeline_outputs/ith_immune/mixcr/mixcr_runs/ith_1_2_3/mixcr5/library_sizes.tsv', "ihc_xcr_stats_notebook" = 'Rmd/ihc_xcr_stats.Rmd', "ith_til_notebook" = 'Rmd/ith_til_densities.Rmd', "mutsig_tiltypes" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density', 'T_CD8_density', 'T_CD4_density', 'T_CD20_density', 'T_Plasma_density'), "mapscape_notebook" = 'Rmd/mapscape.Rmd', "ov133_fbi_status" = '/shahlab/alzhang/data/OV133/ov133_hgsc_fbi_class.tsv', "multiviewclustering_notebook" = 'Rmd/multiviewclustering.Rmd', "table_dir" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/tables/run2', "mmctm_ov_combined_sigplot" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/combined_ov_mmctm/plots/ov_snv-sv_sigs_multipanel.pdf', "image_analysis_notebook" = 'Rmd/image_analysis.Rmd', "bcrphylo_tiltypes" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density', 'T_CD8_density', 'T_CD4_density', 'T_CD20_density', 'T_Plasma_density'), "PNG_DENSITY" = 300, "clone_branch_length_file" = '/shahlab/alzhang/projects/ITH_Immune/data/ith/complete/branch_data.tsv', "clone_prevalence_file" = '/shahlab/alzhang/projects/ITH_Immune/data/ith/complete/clone_data.tsv', "mmctm_ancestral_descendant_result_dir" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-ancestry-sample/output', "xcr_distance_method" = 'horn', "mutation_signature_notebook" = 'Rmd/mutation_signatures.Rmd', "ccsri_mapscape_notebook" = 'Rmd/mapscape_ccsri.Rmd', "ithi_neutrality_samples" = c('1_Om1', '1_ROv1', '1_ROv2', '1_ROv3', '1_ROv4', '1_SBwl1', '10_ROv1', '10_ROv2', '10_ROv3', '10_ROv4', '11_LOv1', '11_LOv3', '11_Pv1', '11_Rct1', '11_Rct2', '12_LOv1', '12_LOv2', '12_Om1', '12_Om2', '12_ROv1', '13_Om1', '13_RGrn1', '13_ROv1', '13_ROv2', '13_ROv3', '14_Bld1', '14_CDS1', '14_LOv1', '14_Om1', '14_ROv1', '15_CDS1', '15_LOv1', '15_ROv1', '15_ROv2', '15_SBwl1', '16_LOv1', '16_LOvSfc1', '16_Om1', '16_Ptn1', '16_ROv1', '17_Om1', '17_Om2', '17_Om3', '17_Ov1', '17_Ov2', '2_Om1', '2_Om2', '2_ROv1', '2_ROv2', '3_Adnx1', '3_Om1', '3_ROv1', '3_ROv2', '4_LPvSw1', '4_ROv1', '4_ROv2', '4_ROv3', '4_ROv4', '7_BrnM', '7_LOv1', '7_RPvM', '9_LOv1', '9_LOv2', '9_Om1', '9_Om2', '9_ROv1'), "variability_type" = 'stabilize', "figure_gallery_notebook" = 'Rmd/figures.Rmd', "neoediting_outdir" = '/shahlab/alzhang/pipeline_outputs/ith_immune/neoediting/run4', "xcrmapscape_tcr_patient_order" = c(9, 15, 17, 1, 14, 2, 12, 3, 4, 13, 11, 16, 10, 7), "xcr_clones_notebook" = 'Rmd/xcr_clones_analysis.Rmd', "db" = '/shahlab/alzhang/projects/ITH_Immune/metadata/db/immune_project.sqlite3', "tils_for_cluster" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density'), "tcga_clinical" = '/shahlab/alzhang/data/TCGA/synapse_clinAll_data.tsv', "PNG_QUALITY" = 300, "prevalence_threshold" = 0.01, "til_classifier_notebook" = 'Rmd/til_classifier.Rmd', "smooth_type" = 'glm', "driver_patients" = c(1, 2, 3, 4, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17), "example_msa_plot" = '/shahlab/alzhang/pipeline_outputs/ith_immune/igpartition/run13/old/alignment_plots/msa/ith2_2/clust9/indel_reversed.html', "spatial_notebook" = 'Rmd/spatial_analysis.Rmd', "clone_tree_file" = '/shahlab/alzhang/projects/ITH_Immune/data/ith/complete/tree_data.tsv', "tcga_expr_matrix" = '/shahlab/alzhang/data/TCGA/expr_matrix_normalize_standardize_noduplicates.tsv', "default_sampler" = 'HMC', "ith_stats_file" = '/shahlab/alzhang/projects/ITH_Immune/data/ith/complete/clonal_measures.tsv', "thumbnail1" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/extra_plots/11_Rct2/thumbnail_image.tiff', "sad_notebook" = 'Rmd/species_abundance_distributions.Rmd', "icgc_normalized_reads_matrix" = '/shahlab/alzhang/data/ICGC/OVAU_expr_matrix.tsv', "xcrmapscape_notebook" = 'Rmd/xcrmapscape.Rmd', "mmctm_ov_combined_result_dir" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/combined_ov_mmctm/output', "tex_resource_dir" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/tex_resources/run2', "icgc_specimen_file" = '/shahlab/alzhang/data/ICGC/specimen.tsv', "intermediate_dir" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2', "image_summary_file1" = '/shahlab/alzhang/data/ithi/yuan_hecr_image_results.csv', "zoom2" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/extra_plots/17_Om1/zoomed_image.tiff', "thumbnail3" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/extra_plots/17_Om1/thumbnail_image.tiff', "wang_fbi_status" = '/shahlab/alzhang/data/ICGC/ng.3849-S12.txt', "neutral_options" = c('restrict', 'free'), "ith_statistics_notebook" = 'Rmd/ith_statistics.Rmd', "classifier_type" = 'knn', "index_notebook" = 'Rmd/index.Rmd', "neoantigen_editing_notebook" = 'Rmd/immunoediting.Rmd', "ithi_clinical_file" = '/shahlab/alzhang/data/ithi/clinical_table_20170816_2.txt', "igpartition_outdir" = '/shahlab/alzhang/pipeline_outputs/ith_immune/igpartition/run22', "site_file" = '/shahlab/alzhang/projects/ITH_Immune/paper/analysis/Rmd/_site.yml', "zoom1" = '/shahlab/alzhang/projects/ITH_Immune/paper/results/extra_plots/11_Rct2/zoomed_image.tiff', "xcrmapscape_files" = c('/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/1.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/2.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/3.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/4.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/7.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/9.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/10.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/11.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/12.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/13.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/14.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/15.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/16.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/xcrmapscape/17.svg'), "tcr_diversity" = '/shahlab/alzhang/pipeline_outputs/ith_immune/mixcr/mixcr_runs/ith_1_2_3/mixcr5/postprocess/TRB/postfilter_diversity_stats/diversity.strict.resampled.txt', "master_copynumber_file" = '/shahlab/alzhang/data/ithi/master_copynumber_file.tsv', "bcr_clonotypes" = '/shahlab/alzhang/pipeline_outputs/ith_immune/mixcr/mixcr_runs/ith_1_2_3/mixcr5/clonotypes/IGH_clonotypes_filtered.txt', "mmctm_patient_ancestral_descendant_result_dir" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-patient-ancestry/output', "master_variant_file" = '/shahlab/amcpherson/projects/ith3/ith3/notebooks/bespoke/ith_snvs.tsv', "clonal_figure_template" = '/shahlab/alzhang/projects/ITH_Immune/paper/analysis/templates/clonal_figure_4by4.svg', "immtyper_lengths" = '11 12 13 14 15 16 17 18', "image_analysis_dir" = '/shahlab/alzhang/pipeline_outputs/ith_immune/icr_spatial/run5/hotspots', "ith_project_results" = '/shahlab/alzhang/projects/ith3/data/results', "tcga_ov_annotations" = '/shahlab/alzhang/data/TCGA/tcga_ov_annotation_sup13.txt', "ihc_run2" = '/shahlab/alzhang/projects/ITH_Immune/data/ihc/cd79cd138cd68/validated_stats_weighted.rdata', "bcr_clonal_figure_template" = '/shahlab/alzhang/projects/ITH_Immune/paper/analysis/templates/clonal_figure_4by4_nobottom.svg', "icgc_molecular_subtypes" = '/shahlab/alzhang/data/ICGC/icgc_primary_tumour_subtypes.tsv', "molsubtype_notebook" = 'Rmd/molecular_subtypes.Rmd', "molsubtype_tiltypes" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density'), "mmctm_final_patient_sigplot" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-patient_with-ov/plots/ith-by-patient_snv-sv_sigs_multipanel.pdf', "mmctm_sample_ad_sigplot" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-ancestry-sample/plots/ith-by-ancestral-sample_snv-sv_sigs_multipanel.pdf', "ihc_xcr_tiltypes" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density', 'T_CD8_density', 'T_CD4_density', 'T_CD20_density', 'T_Plasma_density'), "mapscape_template" = '/shahlab/alzhang/projects/ITH_Immune/paper/analysis/templates/clonal_figure_4by4_nobottom_tilcluster.svg', "mmctm_final_patient_dir" = '/shahlab/alzhang/projects/ITH_Immune/results/mmctm_results/ith_by-patient_with-ov', "ith_stat_types" = c('entropy', 'postprocessed_divergence', 'combined_ith_normalized', 'proportion_subclonal'), "spatial_result_dirs" = list("epithelial" = '/shahlab/alzhang/pipeline_outputs/ith_immune/spatsim/ith3/abc', "stromal" = '/shahlab/alzhang/pipeline_outputs/ith_immune/spatsim/ith5/abc'), "mvclust_tiltypes" = c('E_CD8_density', 'E_CD4_density', 'E_CD20_density', 'E_Plasma_density', 'S_CD8_density', 'S_CD4_density', 'S_CD20_density', 'S_Plasma_density'), "icgc_clinical" = '/shahlab/alzhang/data/ICGC/donor.OV-AU.tsv', "tcr_clonotypes" = '/shahlab/alzhang/pipeline_outputs/ith_immune/mixcr/mixcr_runs/ith_1_2_3/mixcr5/clonotypes/TRB_clonotypes_filtered.txt', "mapscape_patient_order" = c(1, 2, 3, 4, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17), "ihc_run1" = '/shahlab/alzhang/projects/ITH_Immune/data/ihc/cd8cd3cd20/validated_stats_weighted_new.rdata', "bcrmapscape_files" = c('/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/1.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/2.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/3.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/4.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/7.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/9.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/10.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/11.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/12.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/13.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/14.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/15.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/16.svg', '/shahlab/alzhang/projects/ITH_Immune/paper/results/intermediates/run2/bcrmapscape/17.svg'), "nclusts" = 3, "subtype_marker_file" = '/shahlab/alzhang/projects/ITH_Immune/data/expression/nanostring/subtype_markers.tsv', "mvclust_nclust" = 3, "bcrphylo_correlations_notebook" = 'Rmd/bcr_phylo_correlations.Rmd'),
    rule = 'plot_xcrmapscape_full'
)
######## Original script #########

                        ```


```{r global_chunk_options, include=FALSE}
knitr::opts_chunk$set(echo = TRUE, tidy=TRUE, warning=FALSE, message=FALSE)
```

```{r}
## Modified version of mapscape. Cannot be put into the same package as some of the components conflict
library(xcrmapscape)
library(htmlwidgets)

library(ithi.utils)
load_base_libs()
library(ithi.meta)
library(ithi.ihc)
library(ithi.xcr)
library(ithi.figures)
library(ithi.clones)
```

## Parameters

```{r}
db_path <- snakemake@params$db

mapscape_input_directories = snakemake@input$mapscape_inputs
xcr_table_path <- snakemake@input$xcr_table
show_full_track <- (snakemake@params$track_option == "full")
full_page_mode <- (snakemake@params$page_mode == "full")
segment_type <- snakemake@params$segment_type

clone_tree_file <- snakemake@input$clone_tree_file
clone_prevalence_file <- snakemake@input$clone_prevalence_file
clone_branch_length_file <- snakemake@input$clone_branch_length_file
```

```{r}
db <- src_sqlite(db_path, create=FALSE)
andrew_map <- collect(tbl(db, "andrew_map"))
```

```{r}
distance_method <- "horn"

tree_branch_data <- read_clone_tree_data(clone_tree_file, clone_branch_length_file, clone_prevalence_file, db_path)
xcr_table <- read_clonotypes(xcr_table_path, duplicates = FALSE, db_path)
```


```{r}
annotation_colours <- ithi.figures::get_annotation_colours()
tcr_segment_type <- "TRB"
bcr_segment_type <- "IGH"

patients <- unique(xcr_table$patient_id)

id_type <- "condensed_id"

dists <- lapply(patients, function(patient) {
  tcr_clonotypes <- subset(xcr_table, type == tcr_segment_type & patient_id == patient)
  bcr_clonotypes <- subset(xcr_table, type == bcr_segment_type & patient_id == patient)
  tcr_cross_table <- ithi.xcr::cross_tabulate(tcr_clonotypes, id_type = id_type)
  bcr_cross_table <- ithi.xcr::cross_tabulate(bcr_clonotypes, id_type = id_type)
  
  cross_tables <- list(tcr=tcr_cross_table, bcr=bcr_cross_table)
  
  distance_matrices <- lapply(cross_tables, function(cross_table) {
    distmat <- ithi.xcr::compute_immune_distance_matrix(cross_table, method = distance_method)
    mat <- as.matrix(distmat)
    return(mat)
  })
  return(distance_matrices)
})
tcr_dists <- lapply(dists, function(x) x$tcr)
bcr_dists <- lapply(dists, function(x) x$bcr)

xcr_dists <- tibble::tibble(patient_id = patients, tcr=tcr_dists, bcr=bcr_dists)
xcr_dists$patient_id <- factor(xcr_dists$patient_id)
xcr_dists <- xcr_dists[order(xcr_dists$patient_id),]


trees <- lapply(tree_branch_data, function(x) x$tree)
prevalences <- plyr::rbind.fill(lapply(tree_branch_data, function(x) x$prevalence_dat))
branch_lengths <- plyr::rbind.fill(lapply(tree_branch_data, function(x) x$branch_dat))

ccfs <- ithi.clones::compute_ccf(prevalences, trees, id_type = id_type)
ccfs_labeled <- merge(ccfs, branch_lengths, by=c("label", "node", "patient_id"))

## Need non-normalized distances
clone_dists <- ithi.clones::clone_distances(ccfs_labeled, normalize = FALSE, id_type = "condensed_id")

clone_dists$patient_id <- factor(clone_dists$patient_id)

total_dists <- inner_join(clone_dists, xcr_dists)


pairwise_similarities <- plyr::rbind.fill(lapply(1:nrow(total_dists), function(i) {
  clone_distmat <- total_dists[i,]$dist_clones_weighted[[1]]
  tcr_distmat <- total_dists[i,]$tcr[[1]]
  bcr_distmat <- total_dists[i,]$bcr[[1]]
  
  inputs <- list(clone_distmat, tcr_distmat, bcr_distmat)
  names(inputs) <- c("clones", "tcr", "bcr")
  
  patient_id <- total_dists[i,]$patient_id
  
  pairwise_sims <- cbind(patient_id=patient_id, ithi.supp:::compute_overlap_similarities(inputs))
  return(pairwise_sims)
}))
pairwise_similarities$patient_id <- factor(pairwise_similarities$patient_id)

dissimilarity_matrices <- dplyr::bind_rows(lapply(1:nrow(total_dists), function(i) {
  clone_distmat <- total_dists[i,]$dist_clones_weighted[[1]]
  tcr_distmat <- total_dists[i,]$tcr[[1]]
  bcr_distmat <- total_dists[i,]$bcr[[1]]
  patient_id <- total_dists[i,]$patient_id
  
  inputs <- list(clone_distmat, tcr_distmat, bcr_distmat)
  names(inputs) <- c("clones", "tcr", "bcr")
  
  matrices_subset <- ithi.supp:::compute_overlap_matrices(inputs)
  names(matrices_subset) <- names(inputs)
  
  tibble(patient_id=patient_id, clones=list(matrices_subset$clones), tcr=list(matrices_subset$tcr), bcr=list(matrices_subset$bcr))
}))

segment_name <- plyr::mapvalues(segment_type, from = c("TRB", "IGH"),
                                to = c("tcr", "bcr"))

stats <- plyr::rbind.fill(lapply(1:nrow(dissimilarity_matrices), function(i) {
  row <- dissimilarity_matrices[i,]
  xcrmat <- dissimilarity_matrices[,segment_name][[1]][[i]]
  clonemat <- dissimilarity_matrices$clones[[i]]
  
  manttest <- vegan::mantel(xcrmat, clonemat,method = "pearson")
  data.frame(patient_id=row$patient_id, p.value=manttest$signif, stat=manttest$statistic)
}))
```

```{r}
plot_xcrmapscape <- function(clonal_prev, sample_locations, tree_edges, chord_data, track_data, resize_factor, plot_title, full_page_mode, pvalue) {
  img_ref = '/shahlab/alzhang/projects/ITH_Immune/paper/miscellaneous/FF4D00-0.8.png'
  #img_ref = '~/shahlab/projects/ITH_Immune/paper/miscellaneous/FF4D00-0.8.png'
  
  if (!full_page_mode) {
    xcrmapscape::xcrmapscape(
      clonal_prev = clonal_prev,
      tree_edges = tree_edges,
      sample_locations = sample_locations,
      img_ref = img_ref,
      show_warnings = FALSE,
      chord_data = chord_data,
      track_data = track_data,
      resize_factor = resize_factor,
      plot_title = plot_title,
      phylo_stroke_width = '5px',
      phylo_stroke_color = '#000000',
      legendTitleHeight = 26,
      centerSize = 0.6,
      treeRelativeSize = 0,
      titleScaleFactor = 28,
      pvalue = pvalue)
  } else {
    xcrmapscape::xcrmapscape(
      clonal_prev = clonal_prev,
      tree_edges = tree_edges,
      sample_locations = sample_locations,
      img_ref = img_ref,
      show_warnings = FALSE,
      chord_data = chord_data,
      track_data = track_data,
      resize_factor = resize_factor,
      plot_title = plot_title,
      phylo_stroke_width = '1px',
      phylo_stroke_color = '#9E9A9A',
      legendTitleHeight = 16,
      centerSize = 0.5,
      treeRelativeSize = 0.33,
      titleScaleFactor = 40, 
      pvalue = pvalue)
  }
}
```

```{r}
intersect_table <- compute_overlap_table(xcr_table, segment_type = segment_type, prevalence_option = "clones", id_type = "condensed_id")
intersect_table$patient1 <- ithi.meta::map_id(intersect_table$sample1, from = "condensed_id", to="patient_id", db_path)
intersect_table$patient2 <- ithi.meta::map_id(intersect_table$sample2, from = "condensed_id", to="patient_id", db_path)

intersect_table <- subset(intersect_table, patient1 == patient2)

clonotype_table <- subset(xcr_table, type == segment_type)
clonotype_counts <- clonotype_table %>% group_by(condensed_id, patient_id) %>% summarise(n=n()) %>% plyr::rename(c("condensed_id"="label", "n"="len"))
```

```{r}
reformat_andrew_table <- function(dat, db_path, patient_id) {
  dat$patient_id <- patient_id
  dat <- subset(dat, !sample_id %in% c("Pv2", "Rec2", "Rec3"))
  dat <- dat %>% plyr::rename(c("sample_id"="plot_id", "long_sample_id"="sample_id"))
  dat_remapped <- ithi.meta::remap_sample_ids(dat, db_path)
  dat_remapped$abbrev_id <- stringr::str_extract(dat_remapped$condensed_id, "[A-Za-z0-9]+$")
  dat_remapped <- dat_remapped %>% plyr::rename(c("sample_id"="old_sample_id", "sample_key"="long_sample_id", "plot_id"="old_plot_id", "abbrev_id"="sample_id"))
  if ("location_id" %in% colnames(dat_remapped)) {
    dat_remapped$location_id <- dat_remapped$sample_id
  }
  return(dat_remapped)
}

export_cydney_inputs <- function(xcr_table, patient_id, mapscape_base_dir = "/Users/alzhang/shahlab/projects/ITH_Immune/paper/results/intermediates/run2/mapscape_postprocessed_HMC", outdir) {
  patient_tmp <- patient_id
  clonotypes_sub <- xcr_table[(xcr_table$type == segment_type) & (xcr_table$patient_id == as.numeric(patient_tmp)),]
  clonotypes_sub$condensed_id <- factor(clonotypes_sub$condensed_id)
  cross_table <- ithi.xcr::cross_tabulate(clonotypes_sub, id_type = "condensed_id")
  colnames(cross_table) <- str_replace(colnames(cross_table), "^[0-9]+_", "")
  
  bin_cross_table <- cross_table
  bin_cross_table[bin_cross_table > 0] <- 1
  coln <- colnames(cross_table)
  
  cross_summary <- bin_cross_table %>% group_by_(.dots = coln) %>% summarise(n_shared_clonotypes=n())
  
  dir <- file.path(mapscape_base_dir, patient_id)
  
  clonal_prev = read.table(file.path(dir, "clonal_prevalence_table.tsv"), sep='\t', header=T)
  tree_edges = read.table(file.path(dir, "tree_edges.tsv"), sep='\t', header=T)
  
  root <- tree_edges$source[!(tree_edges$source %in% tree_edges$target)]
  tree_edges <- subset(tree_edges, source != root)
  clonal_prev <- reformat_andrew_table(clonal_prev, db_path, patient_id)
  #clonal_prev <- subset(clonal_prev, long_sample_id %in% sample_ids)
  
  clonal_prev_short <- subset(clonal_prev, !duplicate, select=c(patient_id, clone_id, clone_idx, condensed_id, site_id, clonal_prev))
  
  if (!dir.exists(outdir)) {
    dir.create(outdir)
    
    clone_file_output <- file.path(outdir, "clone_prevalences.tsv")
    tree_edges_output <- file.path(outdir, "tree_edges.tsv")
    intersect_output <- file.path(outdir, "intersect.tsv")
    
    write.table(clonal_prev_short, file = clone_file_output, sep="\t", quote=FALSE, row.names = FALSE, col.names = TRUE)
    write.table(tree_edges, file = tree_edges_output, sep="\t", quote=FALSE, row.names = FALSE, col.names = TRUE)
    write.table(cross_summary, file = intersect_output, sep="\t", quote=FALSE, row.names = FALSE, col.names = TRUE)
  }
}
```

## Plots

```{r}
htmltools::tagList(lapply(mapscape_input_directories, function(dir) {
  patient_id <- stringr::str_extract(dir, "[0-9]+$")
  df <- subset(intersect_table, patient1 == patient_id)
  clonal_prev = read.table(file.path(dir, "clonal_prevalence_table.tsv"), sep='\t', header=T)
  tree_edges = read.table(file.path(dir, "tree_edges.tsv"), sep='\t', header=T)
  
  root <- tree_edges$source[!(tree_edges$source %in% tree_edges$target)]
  tree_edges <- subset(tree_edges, source != root)
  
  sample_locations = read.table(file.path(dir, "sample_locations.tsv"), sep='\t', header=T)
  sample_locations$long_sample_id <- df_as_map(clonal_prev, sample_locations$sample_id, from = "sample_id", to = "long_sample_id")
  
  clonal_prev <- reformat_andrew_table(clonal_prev, db_path, patient_id)
  sample_locations <- reformat_andrew_table(sample_locations, db_path, patient_id)
  
  #df <- merge(df, subset(andrew_map, select=c(sample_key, sample_id)), by.x=c("sample1"), by.y=c("sample_key")) %>% plyr::rename(c("sample_id"="sample_id1"))
  #df <- merge(df, subset(andrew_map, select=c(sample_key, sample_id)), by.x=c("sample2"), by.y=c("sample_key")) %>% plyr::rename(c("sample_id"="sample_id2"))
  
  clonotype_counts_sub <- clonotype_counts[as.character(clonotype_counts$patient_id) == patient_id,]
  
  patient_tmp <- patient_id
  
  clonotypes_sub <- xcr_table[(xcr_table$type == segment_type) & (xcr_table$patient_id == as.numeric(patient_tmp)),]
  clonotypes_sub$condensed_id <- factor(clonotypes_sub$condensed_id)
  cross_table <- ithi.xcr::cross_tabulate(clonotypes_sub, id_type = "condensed_id")
  
  #df$sample1 <- df$sample_id1
  #df$sample2 <- df$sample_id2
  
  sample_ids <- intersect(clonal_prev$long_sample_id, unique(df$sample1))
  
  if (length(sample_ids) == 0) {
    return(NULL)
  }
  
  df <- subset(df, (sample1 %in% sample_ids) & (sample2 %in% sample_ids))
  df$sample1 <- factor(df$sample1, levels = sample_ids)
  df$sample2 <- factor(df$sample2, levels = sample_ids)
  df <- df[order(df$sample1),]
  
  ## IF YOU ONLY WANT THE INTERSECTION TO BE SHOWN, JUST SET CLONOTYPE TABLE TO NULL
  ## Otherwise set it to clonotype_counts_sub
  if (show_full_track) {
    res <- ithi.figures::format_xcrcircos_data(df, clonotype_counts = clonotype_counts_sub, cross_table = cross_table)
  } else {
    res <- ithi.figures::format_xcrcircos_data(df, clonotype_counts = NULL)
  }
  chord_data <- res$chords
  track_data <- as.data.frame(res$tracks)
  
  resize_factor <- min(sum(track_data$len)/max(track_data$len) * 1/nrow(track_data), 0.9)
  
  clonal_prev <- subset(clonal_prev, long_sample_id %in% sample_ids)
  sample_locations <- subset(sample_locations, sample_id %in% clonal_prev$sample_id)
  
  if (!full_page_mode) {
    plot_title <- paste0("Patient ", patient_id)
  } else {
    plot_title <- ""
  }
  
  pvalue <- subset(stats, patient_id == patient_tmp)$p.value
  
  ## TODO: Extract pvalues from XCR-clone correlation
  
  print(patient_id)
  plot_xcrmapscape(clonal_prev, sample_locations, tree_edges, chord_data = chord_data, track_data = track_data, resize_factor = resize_factor, plot_title = plot_title, full_page_mode = full_page_mode, pvalue = round(pvalue, 3))
}))
```
