~ubuntu-branches/ubuntu/wily/r-bioc-genomicranges/wily-proposed

« back to all changes in this revision

Viewing changes to inst/doc/summarizeOverlaps.R

Committer: Package Import Robot
Author(s): Andreas Tille
Date: 2014-06-13 15:04:19 UTC
mfrom: (1.1.2)
Revision ID: package-import@ubuntu.com-20140613150419-v49mxnlg42rnuks5

Tags: 1.16.3-1

* New upstream version
* New (Build-)Depends: r-bioc-genomeinfodb
* cme fix dpkg-control
* add autopkgtest

files added:
R/map-methods.R

R/range-squeezers.R

R/tile-methods.R

debian/tests

debian/tests/control

debian/tests/run-unit-test

inst/CITATION

man/deprecated.Rd

man/range-squeezers.Rd

vignettes

vignettes/GenomicRanges.bib

vignettes/GenomicRangesHOWTOs.Rnw

vignettes/GenomicRangesIntroduction.Rnw

files removed:
R/GAlignmentPairs-class.R

R/GAlignments-class.R

R/GAlignmentsList-class.R

R/cigar-utils.R

R/encodeOverlaps-methods.R

R/findSpliceOverlaps-methods.R

R/findSpliceOverlaps-utils.R

R/summarizeOverlaps.R

inst/doc/GenomicRanges.bib

inst/doc/OverlapEncodings.R

inst/doc/OverlapEncodings.Rnw

inst/doc/OverlapEncodings.pdf

inst/doc/precomputed_results

inst/doc/precomputed_results/U1.sbcompHITSa.rda

inst/doc/precomputed_results/U1.sbcompHITSb.rda

inst/doc/precomputed_results/exbytx.rda

inst/doc/summarizeOverlaps-modes.pdf

inst/doc/summarizeOverlaps.R

inst/doc/summarizeOverlaps.Rnw

inst/doc/summarizeOverlaps.pdf

inst/extdata/sm_treated1.bam

inst/extdata/sm_untreated1.bam

inst/scripts

inst/unitTests/test_GAlignments-class.R

inst/unitTests/test_GAlignmentsList-class.R

inst/unitTests/test_cigar-utils.R

inst/unitTests/test_findSpliceOverlaps-methods.R

inst/unitTests/test_summarizeOverlaps-methods.R

man/GAlignmentPairs-class.Rd

man/GAlignments-class.Rd

man/GAlignmentsList-class.Rd

man/cigar-utils.Rd

man/encodeOverlaps-methods.Rd

man/findSpliceOverlaps-methods.Rd

man/makeSeqnameIds.Rd

man/summarizeOverlaps.Rd

src/cigar_utils.c

files modified:
DESCRIPTION

NAMESPACE

NEWS

R/GRanges-class.R

R/GRangesList-class.R

R/GenomicRanges-class.R

R/GenomicRanges-comparison.R

R/RangesMapping-methods.R

R/Seqinfo-class.R

R/SummarizedExperiment-class.R

R/SummarizedExperiment-rowData-methods.R

R/coverage-methods.R

R/findOverlaps-methods.R

R/inter-range-methods.R

R/intra-range-methods.R

R/makeSeqnameIds.R

R/resolveHits-methods.R

R/seqinfo.R

R/seqlevels-utils.R

R/setops-methods.R

R/strand-utils.R

R/utils.R

build/vignette.rds

debian/README.test

debian/changelog

debian/control

inst/doc/GenomicRangesHOWTOs.R

inst/doc/GenomicRangesHOWTOs.Rnw

inst/doc/GenomicRangesHOWTOs.pdf

inst/doc/GenomicRangesIntroduction.R

inst/doc/GenomicRangesIntroduction.Rnw

inst/doc/GenomicRangesIntroduction.pdf

inst/unitTests/test_GRangesList-class.R

inst/unitTests/test_Seqinfo-class.R

inst/unitTests/test_SummarizedExperiment-class.R

inst/unitTests/test_findOverlaps-methods.R

inst/unitTests/test_intra-range-methods.R

inst/unitTests/test_utils.R

man/GIntervalTree-class.Rd

man/GRanges-class.Rd

man/GRangesList-class.Rd

man/GenomicRanges-comparison.Rd

man/Seqinfo-class.Rd

man/SummarizedExperiment-class.Rd

man/coverage-methods.Rd

man/findOverlaps-methods.Rd

man/inter-range-methods.Rd

man/intra-range-methods.Rd

man/map-methods.Rd

man/seqinfo.Rd

man/seqlevels-utils.Rd

man/setops-methods.Rd

man/strand-utils.Rd

src/GenomicRanges.h

src/R_init_GenomicRanges.c

src/transcript_utils.c

Show diffs side-by-side

added added

removed removed

inst/doc/summarizeOverlaps.R

### R code from vignette source 'summarizeOverlaps.Rnw'

###################################################

### code chunk number 1: style

###################################################

# Calls the latex() helper from the BiocStyle namespace without attaching the
# package. NOTE(review): presumably this emits the vignette's LaTeX style
# preamble -- confirm against the BiocStyle documentation.
BiocStyle::latex()

###################################################
### code chunk number 2: options
###################################################
# Set all three session options in a single call: the console width plus the
# head/tail line counts (the latter two are presumably consulted by the
# Bioconductor show methods when printing long objects -- confirm).
options(
  width = 72,
  showHeadLines = 3,
  showTailLines = 3
)

###################################################
### code chunk number 3: firstExample
###################################################
library(Rsamtools)
library(DESeq)
library(edgeR)

# Collect the BAM files found under the package's "extdata" directory.
# `pattern` is a regular expression, not a shell glob, so match a literal
# ".bam" suffix; `full.names` is spelled out instead of relying on partial
# argument matching of `full`.
fls <- list.files(system.file("extdata", package = "GenomicRanges"),
                  recursive = TRUE, pattern = "\\.bam$", full.names = TRUE)
bfl <- BamFileList(fls, index = character())

# Eleven features on chr2L/chr2R/chr3L, all on the minus strand, each carrying
# a `group_id` metadata value. The strand is passed by name rather than
# positionally so the call does not depend on argument order.
features <- GRanges(
  seqnames = c(rep("chr2L", 4), rep("chr2R", 5), rep("chr3L", 2)),
  ranges = IRanges(
    c(1000, 3000, 4000, 7000, 2000, 3000, 3600, 4000, 7500, 5000, 5400),
    width = c(rep(500, 3), 600, 900, 500, 300, 900, 300, 500, 500)
  ),
  strand = "-",
  group_id = c(rep("A", 4), rep("B", 5), rep("C", 2))
)

# Summarize the overlaps between the features and the BAM files, then pass the
# resulting count matrix to the DESeq and edgeR constructors, using the row
# names of the column data as the condition/group labels.
olap <- summarizeOverlaps(features, bfl)
deseq <- newCountDataSet(assays(olap)$counts, rownames(colData(olap)))
edger <- DGEList(assays(olap)$counts, group = rownames(colData(olap)))

###################################################
### code chunk number 4: simple
###################################################
# A single alignment on the plus strand of chr1, starting at position 100 with
# CIGAR "300M". "a" stays positional exactly as in the original call
# (presumably it is the read name -- confirm against the GAlignments signature).
rd <- GAlignments("a",
                  strand = strand("+"),
                  cigar = "300M",
                  pos = 100L,
                  seqnames = Rle("chr1"))

# Two plus-strand ranges on chr1, each 150 wide: 50-199 and 350-499.
gr1 <- GRanges("chr1", IRanges(start = 50, end = 199), strand = "+")
gr2 <- GRanges("chr1", IRanges(start = 350, end = 499), strand = "+")

###################################################
### code chunk number 5: simpleGRanges
###################################################
# Combine the two ranges into one GRanges, so each range is its own feature.
gr <- c(gr1, gr2)

# One column of counts per counting mode; the first call uses the function's
# default mode.
data.frame(
  union = assays(summarizeOverlaps(gr, rd))[["counts"]],
  intStrict = assays(
    summarizeOverlaps(gr, rd, mode = "IntersectionStrict")
  )[["counts"]],
  intNotEmpty = assays(
    summarizeOverlaps(gr, rd, mode = "IntersectionNotEmpty")
  )[["counts"]]
)

###################################################
### code chunk number 6: simpleGRangesList
###################################################
# Wrap both ranges in a single GRangesList element, so they are counted
# together as one feature.
grl <- GRangesList(c(gr1, gr2))

# One column of counts per counting mode; the first call uses the function's
# default mode.
data.frame(
  union = assays(summarizeOverlaps(grl, rd))[["counts"]],
  intStrict = assays(
    summarizeOverlaps(grl, rd, mode = "IntersectionStrict")
  )[["counts"]],
  intNotEmpty = assays(
    summarizeOverlaps(grl, rd, mode = "IntersectionNotEmpty")
  )[["counts"]]
)

###################################################
### code chunk number 7: data
###################################################
# Group label for each of the twelve features defined below.
group_id <- c("A", "B", "C", "C", "D", "D", "E", "F", "G", "G", "H", "H")

# Twelve plus-strand features on chr1/chr2; the group labels are attached via
# an unnamed DataFrame argument, exactly as in the original call.
features <- GRanges(
  seqnames = Rle(c("chr1", "chr2", "chr1", "chr1", "chr2", "chr2",
                   "chr1", "chr1", "chr2", "chr2", "chr1", "chr1")),
  ranges = IRanges(
    start = c(1000, 2000, 3000, 3600, 7000, 7500,
              4000, 4000, 3000, 3350, 5000, 5400),
    width = c(500, 900, 500, 300, 600, 300,
              500, 900, 150, 200, 500, 500)
  ),
  strand = strand(rep("+", length(group_id))),
  DataFrame(group_id)
)

# Seven plus-strand reads named "a".."g", alternating chr1/chr2 and starting
# on chr1; the last two CIGAR strings contain an N operation.
reads <- GAlignments(
  names = c("a", "b", "c", "d", "e", "f", "g"),
  seqnames = Rle(rep(c("chr1", "chr2"), length.out = 7L)),
  pos = c(1400L, 2700L, 3400L, 7100L, 4000L, 3100L, 5200L),
  cigar = c("500M", "100M", "300M", "500M", "300M",
            "50M200N50M", "50M150N50M"),
  strand = strand(rep.int("+", 7L))
)

###################################################
### code chunk number 8: GRanges
###################################################
# Count `reads` against each individual range in `features` under the three
# counting modes (the first call uses the function's default mode) and show
# the results side by side. The stray diff-viewer line numbers that had been
# interleaved with this call, making it unparsable, are removed.
data.frame(
  union = assays(summarizeOverlaps(features, reads))$counts,
  intStrict = assays(summarizeOverlaps(features, reads,
                                       mode = "IntersectionStrict"))$counts,
  intNotEmpty = assays(summarizeOverlaps(features, reads,
                                         mode = "IntersectionNotEmpty"))$counts
)

###################################################
### code chunk number 9: lst
###################################################
# Split the features by their `group_id` metadata column, giving one list
# element per group, and report how many groups there are. The stray
# diff-viewer line numbers that were interleaved here are removed.
lst <- split(features, mcols(features)[["group_id"]])
length(lst)

###################################################
### code chunk number 10: GRangesList
###################################################
# Count `reads` against the grouped features in `lst` under the three counting
# modes (the first call uses the function's default mode). The stray
# diff-viewer line numbers that had been interleaved with this call, making it
# unparsable, are removed.
data.frame(
  union = assays(summarizeOverlaps(lst, reads))$counts,
  intStrict = assays(summarizeOverlaps(lst, reads,
                                       mode = "IntersectionStrict"))$counts,
  intNotEmpty = assays(summarizeOverlaps(lst, reads,
                                         mode = "IntersectionNotEmpty"))$counts
)

###################################################
### code chunk number 11: gff (eval = FALSE)
###################################################
## Not evaluated: download the Ensembl release-62 Drosophila GTF file into the
## session's temporary directory and import it.
## library(rtracklayer)
## fl <- paste0("ftp://ftp.ensembl.org/pub/release-62/",
##              "gtf/drosophila_melanogaster/",
##              "Drosophila_melanogaster.BDGP5.25.62.gtf.gz")
## gffFile <- file.path(tempdir(), basename(fl))
## download.file(fl, gffFile)
## gff0 <- import(gffFile, asRangedData=FALSE)

###################################################
### code chunk number 12: gff_parse (eval = FALSE)
###################################################
## Not evaluated: keep the protein-coding exons on chromosome "4", rename the
## sequence levels with a "chr" prefix, and group the exons by gene id.
## idx <- mcols(gff0)$source == "protein_coding" &
##            mcols(gff0)$type == "exon" &
##            seqnames(gff0) == "4"
## gff <- gff0[idx]
## ## adjust seqnames to match Bam files
## seqlevels(gff) <- paste0("chr", seqlevels(gff))
## chr4genes <- split(gff, mcols(gff)$gene_id)

###################################################
### code chunk number 13: pasilla_param
###################################################
# BAM scanning parameters: request the 'qual' field and the "NH" tag, restrict
# to positions 1..1e6 of chr4, and set the flag filter with
# isUnmappedQuery=FALSE and isPaired=NA. The stray diff-viewer line numbers
# that had been interleaved with this call, making it unparsable, are removed.
param <- ScanBamParam(
  what = "qual",
  which = GRanges("chr4", IRanges(1, 1e6)),
  flag = scanBamFlag(isUnmappedQuery = FALSE, isPaired = NA),
  tag = "NH"
)

###################################################
### code chunk number 14: pasilla_count (eval = FALSE)
###################################################
## Not evaluated: count reads per chromosome-4 gene across three BAM files.
## `path` is a placeholder for the directory holding the BAM files; it is
## joined to the file names so the placeholder is actually used.
## fls <- c("treated1.bam", "untreated1.bam", "untreated2.bam")
## path <- "pathToBAMFiles"
## bamlst <- BamFileList(file.path(path, fls), index=character())
## genehits <- summarizeOverlaps(chr4genes, bamlst, mode="Union")

###################################################
### code chunk number 15: pasilla_exoncountset (eval = FALSE)
###################################################
## Not evaluated: describe the experiment as a MIAME object, build the sample
## design table, and construct a count data set from the gene-level counts.
## expdata <- new("MIAME",
##                name="pasilla knockdown",
##                lab="Genetics and Developmental Biology, University of
##                Connecticut Health Center",
##                contact="Dr. Brenton Graveley",
##                title="modENCODE Drosophila pasilla RNA Binding Protein RNAi
##                knockdown RNA-Seq Studies",
##                url="http://www.ncbi.nlm.nih.gov/projects/geo/query/acc.cgi?acc=GSE18508",
##                abstract="RNA-seq of 3 biological replicates from the Drosophila
##                melanogaster S2-DRSC cells that have been RNAi depleted of mRNAs
##                encoding pasilla, a mRNA binding protein and 4 biological replicates
##                of the untreated cell line.")
## pubMedIds(expdata) <- "20921232"
##
## design <- data.frame(
##               condition=c("treated", "untreated", "untreated"),
##               replicate=c(1,1,2),
##               type=rep("single-read", 3),
##               countfiles=path(colData(genehits)[,1]), stringsAsFactors=TRUE)
##
## geneCDS <- newCountDataSet(
##                countData=assays(genehits)$counts,
##                conditions=design)
##
## experimentData(geneCDS) <- expdata
## sampleNames(geneCDS) <- colnames(genehits)

###################################################
### code chunk number 16: pasilla_genes (eval = FALSE)
###################################################
## Not evaluated: repeat the counting at transcript level by grouping the
## exons by transcript id, then build a count data set with the same design
## and experiment description.
## chr4tx <- split(gff, mcols(gff)$transcript_id)
## txhits <- summarizeOverlaps(chr4tx, bamlst)
## txCDS <- newCountDataSet(assays(txhits)$counts, design)
## experimentData(txCDS) <- expdata

Older »