#!/usr/bin/env Rscript
############################################################################
#
############################################################################
library("aroma.seq");
dataSet <- "AlbertsonD_2012-Bladder_VUMC";
organism <- "Homo_sapiens";
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Setup
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
by <- 50e3;
byTag <- sprintf("%dkb", by/1e3);
ugp <- AromaUgpFile$byChipType("GenericHuman", tags=byTag);
print(ugp);
unc <- getAromaUncFile(ugp);
print(unc);
# Data set
path <- file.path("bamData", dataSet, organism);
bs <- BamDataSet$byPath(path);
setFullNamesTranslator(bs, function(names, ...) {
names <- gsub(".bowtie.sorted", "", names, fixed=TRUE);
names <- gsub("([TN])$", ",\\1", names);
names;
});
print(bs);
chrLabels <- names(getTargets(bs[[1]]));
chrMap <- c(1:25);
labels <- sprintf("chr%d", chrMap);
labels[23:25] <- sprintf("chr%s", c("X", "Y", "M"));
names(chrMap) <- labels;
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Bin reads chromosome by chromosome
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
bc <- TotalCnBinnedCounting(bs, targetUgp=ugp);
print(bc);
ds <- process(bc, verbose=verbose);
verbose && print(verbose, ds);
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
# Normalize GC content
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
bgn <- BinnedGcNormalization(ds);
verbose && print(verbose, bgn);
dsN <- process(bgn, verbose=verbose);
verbose && print(verbose, dsN);
# DEBUG...
if (FALSE) {
muN <- median(yN, na.rm=TRUE);
rho <- muN / median(y, na.rm=TRUE);
xlab <- "GC content fraction";
ylab <- "Signals";
gcLim <- c(0.25,0.75);
Clim <- c(0,6);
plot(gc, rho*y, pch=".", col="#999999", xlim=gcLim, ylim=c(0,6), xlab=xlab, ylab=ylab);
points(gc, yN, pch=".");
abline(h=muN, col="#cccccc");
stext(side=3, pos=1, line=-1, cex=0.8, sprintf("n=%d", sum(is.finite(yN))));
}
############################################################################
# HISTORY:
# 2012-10-21
# o Now we can do CbsModel(dsT, ref="constant(2)").
# 2012-10-11
# o Now generating a Chromosome Explorer report.
# o Added TotalCnBinnedCounting() which calculates bin counts centered
# at target loci specified by an UGP annotation file and outputs an
# AromaUnitTotalCnBinarySet data set of DNAseq bin counts.
# 2012-10-10
# o Now plotting whole-genome TCN tracks, where data is loaded chromosome
# by chromosome. Also utilizing generic UGP files.
# 2012-10-02
# o Created.
############################################################################
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.