Last data update: 2014.03.03
R: Alignment statistics
alignStats R Documentation
Alignment statistics
Description
Generate data frame containing important read alignment statistics such as the
total number of reads in the FASTQ files, the number of total alignments, as
well as the number of primary alignments in the corresponding BAM files.
Usage
alignStats(args)
Arguments
args
Object of class SYSargs
.
Value
data.frame
with alignment statistics.
Author(s)
Thomas Girke
Examples
## Construct SYSargs object from param and targets files
param <- system.file("extdata", "tophat.param", package="systemPipeR")
targets <- system.file("extdata", "targets.txt", package="systemPipeR")
args <- systemArgs(sysma=param, mytargets=targets)
args
names(args); modules(args); cores(args); outpaths(args); sysargs(args)
## Not run:
## Execute SYSargs on single machine
runCommandline(args=args)
## Execute SYSargs on multiple machines
qsubargs <- getQsubargs(queue="batch", Nnodes="nodes=1", cores=cores(tophat), memory="mem=10gb", time="walltime=20:00:00")
qsubRun(args=args, qsubargs=qsubargs, Nqsubs=1, package="systemPipeR")
## Alignment stats
read_statsDF <- alignStats(args)
read_statsDF <- cbind(read_statsDF[targets$FileName,], targets)
write.table(read_statsDF, "results/alignStats.xls", row.names=FALSE, quote=FALSE, sep="\t")
## End(Not run)
Results
R version 3.3.1 (2016-06-21) -- "Bug in Your Hair"
Copyright (C) 2016 The R Foundation for Statistical Computing
Platform: x86_64-pc-linux-gnu (64-bit)
R is free software and comes with ABSOLUTELY NO WARRANTY.
You are welcome to redistribute it under certain conditions.
Type 'license()' or 'licence()' for distribution details.
R is a collaborative project with many contributors.
Type 'contributors()' for more information and
'citation()' on how to cite R or R packages in publications.
Type 'demo()' for some demos, 'help()' for on-line help, or
'help.start()' for an HTML browser interface to help.
Type 'q()' to quit R.
> library(systemPipeR)
Loading required package: Rsamtools
Loading required package: GenomeInfoDb
Loading required package: stats4
Loading required package: BiocGenerics
Loading required package: parallel
Attaching package: 'BiocGenerics'
The following objects are masked from 'package:parallel':
clusterApply, clusterApplyLB, clusterCall, clusterEvalQ,
clusterExport, clusterMap, parApply, parCapply, parLapply,
parLapplyLB, parRapply, parSapply, parSapplyLB
The following objects are masked from 'package:stats':
IQR, mad, xtabs
The following objects are masked from 'package:base':
Filter, Find, Map, Position, Reduce, anyDuplicated, append,
as.data.frame, cbind, colnames, do.call, duplicated, eval, evalq,
get, grep, grepl, intersect, is.unsorted, lapply, lengths, mapply,
match, mget, order, paste, pmax, pmax.int, pmin, pmin.int, rank,
rbind, rownames, sapply, setdiff, sort, table, tapply, union,
unique, unsplit
Loading required package: S4Vectors
Attaching package: 'S4Vectors'
The following objects are masked from 'package:base':
colMeans, colSums, expand.grid, rowMeans, rowSums
Loading required package: IRanges
Loading required package: GenomicRanges
Loading required package: Biostrings
Loading required package: XVector
Loading required package: ShortRead
Loading required package: BiocParallel
Loading required package: GenomicAlignments
Loading required package: SummarizedExperiment
Loading required package: Biobase
Welcome to Bioconductor
Vignettes contain introductory material; view with
'browseVignettes()'. To cite Bioconductor, see
'citation("Biobase")', and for packages 'citation("pkgname")'.
> png(filename="/home/ddbj/snapshot/RGM3/R_BC/result/systemPipeR/alignStats.Rd_%03d_medium.png", width=480, height=480)
> ### Name: alignStats
> ### Title: Alignment statistics
> ### Aliases: alignStats
> ### Keywords: utilities
>
> ### ** Examples
>
> ## Construct SYSargs object from param and targets files
> param <- system.file("extdata", "tophat.param", package="systemPipeR")
> targets <- system.file("extdata", "targets.txt", package="systemPipeR")
> args <- systemArgs(sysma=param, mytargets=targets)
There were 18 warnings (use warnings() to see them)
> args
An instance of 'SYSargs' for running 'tophat' on 18 samples
> names(args); modules(args); cores(args); outpaths(args); sysargs(args)
[1] "targetsin" "targetsout" "targetsheader" "modules"
[5] "software" "cores" "other" "reference"
[9] "results" "infile1" "infile2" "outfile1"
[13] "sysargs" "outpaths"
[1] "bowtie2/2.2.5" "tophat/2.0.14"
[1] 4
M1A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446027_1.fastq.tophat/accepted_hits.bam"
M1B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446028_1.fastq.tophat/accepted_hits.bam"
A1A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446029_1.fastq.tophat/accepted_hits.bam"
A1B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446030_1.fastq.tophat/accepted_hits.bam"
V1A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446031_1.fastq.tophat/accepted_hits.bam"
V1B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446032_1.fastq.tophat/accepted_hits.bam"
M6A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446033_1.fastq.tophat/accepted_hits.bam"
M6B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446034_1.fastq.tophat/accepted_hits.bam"
A6A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446035_1.fastq.tophat/accepted_hits.bam"
A6B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446036_1.fastq.tophat/accepted_hits.bam"
V6A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446037_1.fastq.tophat/accepted_hits.bam"
V6B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446038_1.fastq.tophat/accepted_hits.bam"
M12A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446039_1.fastq.tophat/accepted_hits.bam"
M12B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446040_1.fastq.tophat/accepted_hits.bam"
A12A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446041_1.fastq.tophat/accepted_hits.bam"
A12B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446042_1.fastq.tophat/accepted_hits.bam"
V12A
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446043_1.fastq.tophat/accepted_hits.bam"
V12B
"/home/ddbj/DataUpdator-rgm3/target/results/SRR446044_1.fastq.tophat/accepted_hits.bam"
M1A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446027_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446027_1.fastq "
M1B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446028_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446028_1.fastq "
A1A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446029_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446029_1.fastq "
A1B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446030_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446030_1.fastq "
V1A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446031_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446031_1.fastq "
V1B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446032_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446032_1.fastq "
M6A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446033_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446033_1.fastq "
M6B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446034_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446034_1.fastq "
A6A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446035_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446035_1.fastq "
A6B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446036_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446036_1.fastq "
V6A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446037_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446037_1.fastq "
V6B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446038_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446038_1.fastq "
M12A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446039_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446039_1.fastq "
M12B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446040_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446040_1.fastq "
A12A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446041_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446041_1.fastq "
A12B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446042_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446042_1.fastq "
V12A
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446043_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446043_1.fastq "
V12B
"tophat -p 4 -g 1 --segment-length 25 -i 30 -I 3000 -o /home/ddbj/DataUpdator-rgm3/target/results/SRR446044_1.fastq.tophat /home/ddbj/DataUpdator-rgm3/target/data/tair10.fasta ./data/SRR446044_1.fastq "
>
> ## Not run:
> ##D ## Execute SYSargs on single machine
> ##D runCommandline(args=args)
> ##D
> ##D ## Execute SYSargs on multiple machines
> ##D qsubargs <- getQsubargs(queue="batch", Nnodes="nodes=1", cores=cores(tophat), memory="mem=10gb", time="walltime=20:00:00")
> ##D qsubRun(args=args, qsubargs=qsubargs, Nqsubs=1, package="systemPipeR")
> ##D ## Alignment stats
> ##D read_statsDF <- alignStats(args)
> ##D read_statsDF <- cbind(read_statsDF[targets$FileName,], targets)
> ##D write.table(read_statsDF, "results/alignStats.xls", row.names=FALSE, quote=FALSE, sep="\t")
> ## End(Not run)
>
>
>
>
>
> dev.off()
null device
1
>