tests/testthat/test_3_peaks_per_gene.R

context('Test peaks per gene functions')

################################################################################
# Test human locus definitions

# Load the required data for the test
hg19_ldefs = grep('locusdef.hg19', data(package = 'chipenrich.data')$results[,3], value=T)
data(list = hg19_ldefs, package = 'chipenrich.data')
tss = get(data('tss.hg19', package = 'chipenrich.data'))

file = system.file('extdata', 'test_assign.bed', package = 'chipenrich')
peaks = suppressMessages(read_bed(file))

# Expected values for peak assignments
expected_numpeaks = list(
	'locusdef.hg19.10kb' = c(3),
	'locusdef.hg19.10kb_outside' = c(1),
	'locusdef.hg19.10kb_outside_upstream' = c(1),
	'locusdef.hg19.1kb' = c(2),
	'locusdef.hg19.1kb_outside' = c(1,1),
	'locusdef.hg19.1kb_outside_upstream' = c(1,1),
	'locusdef.hg19.5kb' = c(3),
	'locusdef.hg19.5kb_outside' = c(1),
	'locusdef.hg19.5kb_outside_upstream' = c(1),
	'locusdef.hg19.exon' = c(1),
	'locusdef.hg19.intron' = c(1),
	'locusdef.hg19.nearest_gene' = c(3, 1),
	'locusdef.hg19.nearest_tss' = c(3, 1)
)

# Do the tests in a loop for each locus definition of hg19
for(ldef in hg19_ldefs) {
	test_assign = assign_peaks(peaks = peaks, locusdef = get(ldef), tss = tss)

	test_ppg = num_peaks_per_gene(assigned_peaks = test_assign, locusdef = get(ldef), mappa = NULL)

	expect_true(all(subset(test_ppg, num_peaks != 0)$num_peaks == expected_numpeaks[[ldef]]),
		info = sprintf('Test num_peaks_per_gene(): %s', ldef))
}

expected_overlaps = list(
	'locusdef.hg19.10kb' = c(700,80),
	'locusdef.hg19.10kb_outside' = c(921),
	'locusdef.hg19.10kb_outside_upstream' = c(921),
	'locusdef.hg19.1kb' = c(327),
	'locusdef.hg19.1kb_outside' = c(1000,374),
	'locusdef.hg19.1kb_outside_upstream' = c(1000,374),
	'locusdef.hg19.5kb' = c(700),
	'locusdef.hg19.5kb_outside' = c(1000),
	'locusdef.hg19.5kb_outside_upstream' = c(1000),
	'locusdef.hg19.exon' = c(100),
	'locusdef.hg19.intron' = c(100),
	'locusdef.hg19.nearest_gene' = c(700,1000),
	'locusdef.hg19.nearest_tss' = c(700,1000)
)

# Do the tests in a loop for each locus definition of hg19
for(ldef in hg19_ldefs) {
	test_assign = assign_peak_segments(peaks = peaks, locusdef = get(ldef))

	test_ppg = num_peaks_per_gene(assigned_peaks = test_assign, locusdef = get(ldef), mappa = NULL)
	test_ppg = calc_peak_gene_overlap(assigned_peaks = test_assign, ppg = test_ppg)

	expect_true(all(subset(test_ppg, peak_overlap != 0)$peak_overlap == expected_overlaps[[ldef]]),
		info = sprintf('Test num_peaks_per_gene(): %s', ldef))
}

Try the chipenrich package in your browser

Any scripts or data that you put into this service are public.

chipenrich documentation built on Nov. 8, 2020, 8:11 p.m.