cola_examples

Golub leukemia dataset

The Golub leukemia dataset is a Bioconductor dataset.

RDS files generated by cola (use readRDS() to load into R (>= 3.6.0)):

HTML reports for cola analysis:

The following code performs the analysis.

Prepare the input matrix:

# Attach cola and the data package that provides the Golub_Merge object.
library(cola)
library(golubEsets)

data(Golub_Merge)

# Sample annotation table taken from the same object as the expression values.
anno <- pData(Golub_Merge)

# Expression matrix; every column name gets a "sample_" prefix.
m <- exprs(Golub_Merge)
colnames(m) <- paste0("sample_", colnames(m))

# Entries <= 1 are turned into NA first, then the matrix is log10-transformed.
m <- log10(replace(m, m <= 1, NA))

# Matrix pre-processing step applied to the NA-containing matrix
# (presumably cola's adjust_matrix(); see ?adjust_matrix for what it does).
m <- adjust_matrix(m)

library(preprocessCore)

# Remember the row and column names, quantile-normalize the matrix, then
# put the names back on the normalized result.
saved_dimnames <- list(rownames(m), colnames(m))
m <- normalize.quantiles(m)
dimnames(m) <- saved_dimnames

Perform the consensus partitioning:

# Presumably registers NMF as an additional cola partitioning method
# (see ?register_NMF) before the methods are run.
register_NMF()

# Fix the random seed before the partitioning run.
set.seed(123)

# Run the consensus partitioning on the prepared matrix with 4 cores.
# Only the "ALL.AML" annotation column is passed along (kept as a
# one-column data frame via drop = FALSE), with one color per level.
rl <- run_all_consensus_partition_methods(
    m,
    mc.cores = 4,
    anno = anno[, "ALL.AML", drop = FALSE],
    anno_col = c("ALL" = "red", "AML" = "blue")
)

# Save the result object. The file name is a constant, so it is passed
# directly; the former qq() wrapper did no interpolation and relied on
# GetoptLong being attached, which this script never does.
saveRDS(rl, file = "Golub_leukemia_subgroup.rds")

# Generate the HTML report for the result into its own directory.
cola_report(rl, output_dir = "Golub_leukemia_subgroup_cola_report", mc.cores = 4)