Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
157 commits
Select commit Hold shift + click to select a range
5f75c2c
Adjust white space
Feb 28, 2013
1739e48
Rewrite NEWS and CIATION files in inst directory
Feb 28, 2013
ed96081
Adjust white space
Feb 28, 2013
ddcb331
Split out .normByXxx methods from main list of TCC methods field
Feb 28, 2013
1c5d614
Add row.names automatically if the data doesnt have row name at TCC c…
Feb 28, 2013
5e7bf21
The elements of DEGES.potentialDEG only use '1' to indicate DEG. Fixe…
Feb 28, 2013
1e46655
Add col.tag for plotting MA plot
Feb 28, 2013
3a8f45d
change the order of returned value of plotMA
Feb 28, 2013
29d0de1
round the decimal to integer before analysis
Feb 28, 2013
712c0d6
changed version to v1.0.1
Feb 28, 2013
bf03895
reWrite test script
Feb 28, 2013
28ad5ca
Add 'show' method for TCC class.
Mar 4, 2013
5070fc0
Add 'names' method for TCC class.
Mar 4, 2013
58c352d
Add more information to show TCC class object. Because the previous o…
Mar 4, 2013
17daac0
Add 'dispersion' argument for 'exactTest' in edgeR. This argument all…
Mar 5, 2013
30bc7d2
Add 'TCC' method for constructing TCC class object. Because the conve…
Mar 5, 2013
88e1235
It occurs error if the journal field is not exist. Add the journal fi…
Mar 5, 2013
31255c2
Add 'length', '[' function for TCC class. And modify the 'names' func…
Mar 5, 2013
4dfcf62
Add '[' and 'length' method for TCC class. And modify 'names' method …
Mar 5, 2013
26c88fd
Add depending package of 'snow'.
Mar 7, 2013
07cdc7a
Attach the 'man' of names, length, [ and show together on the 'man' o…
Mar 7, 2013
d38bbe7
Attach the 'man' of names, length, [ and show method together on the …
Mar 7, 2013
cd8e3ed
removed unnecessary files. and add show, length, names method test sc…
Mar 7, 2013
d2e27e6
remove unnecessary files with 'git rm' command
Mar 7, 2013
262d34d
Add vignette to TCC package.
Mar 8, 2013
938f30c
Extend for multiple group and multiple factor analysis
Mar 19, 2013
e829df9
Modify the codition for generating hypoData_mt. The before one is the…
Mar 19, 2013
30bc638
Change the expression labels of 'show' function.
Mar 21, 2013
9806311
some minor changes. 1) remove replicates argument from 'new' and 'gen…
Mar 22, 2013
91072f7
Change the warnings message in TCC.
Mar 22, 2013
1337c85
change missed description of hypoData, hypoData_mg. Because hypoData …
Mar 22, 2013
5621c89
the file which has forgetten to commit. (?)
Mar 24, 2013
6cce920
add citation (about GLM of edgeR).
Mar 24, 2013
eb5f369
Modify the wrong method of p.adjust in DEGES/DESeq(GLM).
Mar 25, 2013
e44484c
minor change
Mar 25, 2013
1fae538
Re moved 'processors' argument in TCC. The 'cl' argument is used for …
Mar 27, 2013
2c6a74d
modify the test scripts.
Mar 27, 2013
fb39520
add GLM (multi-group, multi-factor) test scripts.
Mar 27, 2013
8910577
change depended packages.
Mar 27, 2013
0fd2856
separate genSim function from TCC_public. removed 'group' argument an…
Mar 28, 2013
33ceb11
The hypoData of multple grouip.
Mar 28, 2013
9a5ca7d
change the default paramaters in 'estimateDispersions' when the data …
Mar 28, 2013
311e77b
Change 'DEG.foldchange' argument.
Mar 29, 2013
96d5667
i mistake the conditional judgement in 'testByDeseq'
Mar 29, 2013
f474c24
Some inconvenience was happend when execute vignette code, move the p…
Mar 29, 2013
9f370c2
Change 'names' field in TCC class to 'gene_id'.
Mar 29, 2013
783039c
Change 'length' function. Return the count object if it was called.
Apr 1, 2013
1358060
Fix the bug. It occurs error when use DEG.model='gamma' model
Apr 2, 2013
fdc2dcf
change default value for 'DEG.model'. Check the 'DEG.foldchange' clas…
Apr 2, 2013
d135ece
Missed object name.
Apr 2, 2013
8366f02
remove gamma model
Apr 11, 2013
4d8def3
vignette for TCC package
Apr 14, 2013
2bd8d07
Rewrite 'subset' and '[' functions
Apr 16, 2013
40f812b
spell miss
Apr 16, 2013
f24383a
change generateSimulationData to simulateReadCounts.
Apr 17, 2013
26290ac
change generateSimulationData to simulateReadCounts.
Apr 17, 2013
11804b1
Add iterator function for iDEGES normalization. If iDEGES(n=k) has be…
Apr 17, 2013
f0f8ee4
Minor changed for adjusting the position of figures. Add pdf file.
Apr 21, 2013
c8abb50
delete geometry.sty in Rnw.
Apr 21, 2013
bd1dab2
bug fix. when calcNormFactors execute with 'test.method=bayseq' and '…
Apr 22, 2013
bc03200
Add 'cite' in vignette.
Apr 22, 2013
da2c8cd
change figure format to PNG from EPS of vignette.
Apr 23, 2013
db270da
bug fix. forgot to add 'try' function to execute 'estimateDispersion'…
Apr 26, 2013
d529dca
bug fix. forgot to add 'try' function to execute 'estimateDispersion'…
Apr 26, 2013
ede5347
Add 'floorPDEG' options for kadota's TbT.
Apr 26, 2013
82c8282
Remove the code which contains the unsed argument ('processors').
Apr 29, 2013
86c2c28
bug fix
May 3, 2013
ad78b52
bug fix
May 3, 2013
59fcbae
Add .getRank method code, but unsed.
May 10, 2013
cef8925
Fix Rd files for avoding CMD check warnings.
May 10, 2013
ad643db
Add pre-PDEG value in private field.
May 11, 2013
bc0d150
delete debug code
May 12, 2013
bd436e4
comment the 'increment' argument function.
May 12, 2013
adf8a77
minor change the citations.
May 12, 2013
5b0612d
modify the vignette.
May 12, 2013
b54b0e0
modify the vignette.
May 13, 2013
408c6d3
add if sentence for avoding check
May 14, 2013
25f97db
modify the Rd files
May 14, 2013
5c28bbd
modify TCC vignette
May 14, 2013
77afc6f
change the version number
May 14, 2013
55f7ac5
add package tar
May 15, 2013
cf0a11e
rename the test script.
May 18, 2013
fd726c0
bug fix. the col.tag argument doesnt work correctly.
May 22, 2013
f584b82
modify manuals
May 23, 2013
0882a17
delete package
May 24, 2013
8d357b2
bug fix. the col option does not work correctly
May 29, 2013
e914888
modify manuals
May 30, 2013
1b26551
fix bug.
Jun 4, 2013
aedee8e
use 4 spaces per indentation level and shorten the lines less than 80…
Jun 5, 2013
46a34b8
add unit test
Jun 6, 2013
bf5812d
delete test scripts
Jun 6, 2013
35a1f48
modify vignette
Jun 7, 2013
8729543
change to correctly format
Jun 7, 2013
845918f
modify author name
Jun 7, 2013
ecf4d8f
move NEWS to correctly directory
Jun 7, 2013
b227001
add twad method
Jun 16, 2013
9654366
add wad test
Jun 17, 2013
b163dc1
bug fix for twad method
Jun 17, 2013
0bb6e2f
bug fix for .testByWad method
Jun 17, 2013
2157b37
bug fix for twad method
Jun 18, 2013
e55b86f
bug fix for TWAD normalization
Jun 27, 2013
e78babb
add parameters for TWAD nromalization
Jun 27, 2013
f11746b
add increment argument for caclNormFactors.
Jun 27, 2013
afda686
Add AD argument for TWAD normalization.
Jul 9, 2013
59152ce
the submitted article has been published
Jul 9, 2013
35912ae
the article has been published.
Jul 11, 2013
b778aa3
add arguments for TWAD method
Jul 14, 2013
7842fb6
split file
Jul 18, 2013
360a769
change WAD algorithm
Jul 21, 2013
9f9b812
add ROKU function
Jul 21, 2013
5982349
change namespace
Jul 21, 2013
65af528
add others
Jul 21, 2013
851fb73
remvoed depended package
Jul 22, 2013
b4c69d5
add new test method
Jul 22, 2013
12fd4ea
split file
Jul 22, 2013
12b8ea8
change writting style
Jul 27, 2013
3d28c02
change meta files
Jul 27, 2013
340ffcf
delete AD argument in WAD
Jul 27, 2013
9b4c5e1
add unit tests
Jul 27, 2013
b7f08e3
remove
Jul 27, 2013
092d8ca
delete AD argument in WAD
Jul 27, 2013
c4bfcb0
change function used in ROKU
Jul 27, 2013
0087aed
bug fix
Jul 27, 2013
9eb3237
delete AD argument of WAD
Jul 27, 2013
863b11e
adjust arguments
Jul 30, 2013
2b39018
let function can generate multiple factor simulation data
Jul 30, 2013
a575b08
change meta files
Jul 31, 2013
39b43ac
fix code
Jul 31, 2013
2ef6c71
adjust document files
Jul 31, 2013
b3d3a78
add microarray data
Jul 31, 2013
2a151c5
add ... argument
Aug 6, 2013
09c1aca
bug fix and add paried strategy
Aug 7, 2013
80aac59
man file
Aug 7, 2013
ad0dc17
add unittest
Aug 7, 2013
1535f0f
simulation data
Aug 8, 2013
33351b7
bug fix plotFC
Aug 9, 2013
bb9644e
delete command
Aug 9, 2013
d6abcf4
adjust
Aug 9, 2013
18d2bdd
meta file, delete NOISeq
Aug 26, 2013
26729bf
bug fix
Aug 26, 2013
51b08bf
delete duplicated files
Aug 26, 2013
9a5c209
bug fix test script
Aug 26, 2013
b5b0727
change man files
Aug 26, 2013
10f97d1
fix code
Aug 28, 2013
3d27c0a
vignette change
Aug 28, 2013
0c3cd3c
delete paired strategy
Aug 28, 2013
4ef3da6
change README
Aug 28, 2013
f9bb2fd
change README
Aug 28, 2013
0f976b8
fix
Aug 28, 2013
a417ddd
add hypo data
Aug 28, 2013
9ca37fe
change data
Aug 28, 2013
445a24d
fix data
Aug 29, 2013
2548a8b
delete space
Aug 29, 2013
34425d0
fix comment in TCC.Rnw
Sep 10, 2013
9ad921c
change unit test threhold
Sep 10, 2013
19934a9
change released url
Sep 10, 2013
8a42bd6
delete vignette
Sep 30, 2013
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
39 changes: 24 additions & 15 deletions README.md
Original file line number Diff line number Diff line change
@@ -1,20 +1,28 @@
TCC
===

R package for tag count comparison

Title
-----

Differential expression analysis for tag count data with robust normalization strategies
----------------------------------------------------------------------------------------
TCC: Differential expression analysis for tag count data with robust normalization strategies

This package provides functions for performing differential expression
analysis using differentially expressed gene elimination strategy.
A simple unified interface is provided which encapsulates functions
to calculate normalization factors and estimate differentially
expressed genes defined in edgeR, baySeq, and DESeq packages.
The appropriate combination provided by TCC allows a more robust
and accurate estimation performed easily than directly using original packages.
Functions to produce simulation data under various conditions and to plot the data are also provided.
Description
-----------

This package provides a series of functions for performing
differential expression analysis from RNA-seq count data using robust
normalization strategy (called DEGES). The basic idea of DEGES is that
potential differentially expressed genes or transcripts (DEGs) among
compared samples should be removed before data normalization to obtain
a well-ranked gene list where true DEGs are top-ranked and non-DEGs are
bottom ranked. This can be done by performing a multi-step normalization
strategy (called DEGES for DEG elimination strategy). A major
characteristic of TCC is to provide the robust normalization methods for
several kinds of count data (two-group with or without replicates,
multi-group/multi-factor, and so on) by virtue of the use of combinations
of functions in other sophisticated packages (especially edgeR, DESeq,
and baySeq).

Documentation
-------------
Expand All @@ -26,13 +34,14 @@ in addition to the documents included in the software package.
Development versions
--------------------

The development version is now on the github repository at https://github.com/tomoakin/TCC
The development version is now on the github repository
at https://github.com/kohijiri/huaying.asagao

Releases
--------

Release of this software is made through CRAN at http://cran.r-project.org/web/packages/TCC/

Release of this software is made through CRAN at
http://www.bioconductor.org/packages/release/bioc/html/TCC.html

No warranty
-----------
Expand All @@ -53,4 +62,4 @@ A copy of GPL-2 is accompanied in this directory in a file named COPYING.
Authors
-------

Sun Jianqiang, Tomoaki Nishiyama, Kentaro Shimizu, and Koji Kadota
Jianqiang Sun, Tomoaki Nishiyama, Kentaro Shimizu, and Koji Kadota
37 changes: 23 additions & 14 deletions TCC/DESCRIPTION
Original file line number Diff line number Diff line change
@@ -1,19 +1,28 @@
Package: TCC
Type: Package
Title: TCC: Differential expression analysis for tag count data with
robust normalization strategies
Version: 1.0.0
Date: 2013-01-10
Author: Sun Jianqiang, Tomoaki Nishiyama, Kentaro Shimizu, and Koji Kadota
Maintainer: Tomoaki Nishiyama <tomoakin@staff.kanazawa-u.ac.jp>
Description: This package provides functions for performing differential expression analysis
using differentially expressed gene elimination strategy. A simple unified interface is
provided which encapsulates functions to calculate normalization factors and estimate
differentially expressed genes defined in edgeR, baySeq, and DESeq packages.
The appropriate combination provided by TCC allows a more robust and accurate estimation
performed easily than directly using original packages.
Functions to produce simulation data under various conditions and to plot the data are also provided.
Depends: R (>= 2.15), edgeR, baySeq, DESeq, ROC, methods
robust normalization strategies
Version: 1.1.99
Author: Jianqiang Sun, Tomoaki Nishiyama, Kentaro Shimizu, and Koji Kadota
Maintainer: Jianqiang Sun <wukong@bi.a.u-tokyo.ac.jp>,
Tomoaki Nishiyama <tomoakin@staff.kanazawa-u.ac.jp>
Description: This package provides a series of functions for performing
differential expression analysis from RNA-seq count data using robust
normalization strategy (called DEGES). The basic idea of DEGES is that
potential differentially expressed genes or transcripts (DEGs) among
compared samples should be removed before data normalization to obtain
a well-ranked gene list where true DEGs are top-ranked and non-DEGs are
bottom ranked. This can be done by performing a multi-step normalization
strategy (called DEGES for DEG elimination strategy). A major
characteristic of TCC is to provide the robust normalization methods for
several kinds of count data (two-group with or without replicates,
multi-group/multi-factor, and so on) by virtue of the use of combinations
of functions in other sophisticated packages (especially edgeR, DESeq,
and baySeq).
Depends: R (>= 2.15), methods, DESeq, edgeR, baySeq, ROC
Imports: EBSeq, samr
Suggests: RUnit, BiocGenerics
Enhances: snow
biocViews: HighThroughputSequencing, DifferentialExpression, RNAseq
License: GPL-2
Copyright: Authors listed above
URL: http://www.iu.a.u-tokyo.ac.jp/~kadota/TCC
16 changes: 12 additions & 4 deletions TCC/NAMESPACE
Original file line number Diff line number Diff line change
Expand Up @@ -2,25 +2,33 @@ import(ROC)
import(DESeq)
import(baySeq)
import(edgeR)
import(EBSeq)
import(samr)

# Export TCC class.
exportClasses(
"TCC"
)

# Export the public methods in TCC package.
export(
show,
names,
length,
"[",
TCC,
calcAUCValue,
calcNormFactors,
do_TbT,
estimateDE,
exactTestafterTbT,
filterLowCountGenes,
generateSimulationData,
simulateReadCounts,
getNormalizedData,
getResult,
MAplot,
NBsample,
plotFCPseudocolor,
plot.TCC
plot.TCC,
WAD,
ROKU
)

43 changes: 43 additions & 0 deletions TCC/NEWS
Original file line number Diff line number Diff line change
@@ -0,0 +1,43 @@
CHANGES IN VERSION 1.2.0
------------------------

NEW FEATURES

o This package was released as a Bioconductor package (previously CRAN).
o WAD method for identifying DEGs was added.
o ROKU method for identifying tissue-specific genes was added.
o 'increment' argument of 'calcNormFactor' function was added.


SIGNIFICANT USER-VISIBLE CHANGES

o 'replicates' field of TCC class was deleted.




CHANGES IN VERSION 1.1.3
------------------------

SIGNIFICANT USER-VISIBLE CHANGES

o 'generateSimulationData' function was renamed to 'simulateReadCount'.

o 'names' field of TCC class was changed to 'gene_id'.

o 'hypoData' was reduced to a smaller data set.

o 'hypoData_mg' was created. This is the simulation dataset which consists
of 1,000 genes and 9 samples.




CHANGES IN VERSION 1.0.0
------------------------

SIGNIFICANT USER-VISIBLE CHANGES

o 'TCC' class was implemented as a R5 reference class. Wrapper functions
with functional programming semantics were proviede.

123 changes: 123 additions & 0 deletions TCC/R/ROKU.R
Original file line number Diff line number Diff line change
@@ -0,0 +1,123 @@
.outval <- function(y, upper.limit) {
if (all(is.na(y)))
y <- rep(0, length = length(y))
z <- y[!is.na(y)]

N <- length(z)
fN <- floor(N * upper.limit) + 1

z.sorted <- sort(z)
z.ordered <- order(z)

df <- matrix(c(rep(1:fN, times = c(fN:1)), j = sequence(fN:1)),
ncol = 2, byrow = FALSE)
n <- N - df[, 2] - df[, 1] + 2
s <- N - n
f <- rep(0, length = N)

if (sd(z) != 0) {
ssd <- apply(df, 1, function(d, w = z.sorted, N = N) {
return(sd(w[d[1]:(N + 1 - d[2])]))
}, z.sorted, N)
u <- n * log(ssd * sqrt((n - 1) / n)) +
sqrt(2) * s * lfactorial(n) / n
min.u <- min(u)
d <- t(df[u == min.u, ])[1:2]
if (d[1] > 1)
f[z.ordered[1:(d[1] - 1)]] <- -1
if (d[2] > 1)
f[z.ordered[(N + 1 - d[2] + 1):N]] <- 1
}
return(replace(y, !is.na(y), f))
}


.tbw <- function(y) {
y <- y[!is.na(y)]
y.m <- median(y)
y.u <- (y - y.m) / (5 * median(abs(y - y.m)) + 1e-04)
y.w <- rep(0, length(y))
y.i <- abs(y.u) <= 1
y.w[y.i] <- ((1 - y.u^2)^2)[y.i]
y.b <- sum(y.w * y) / sum(y.w)
}

.entvalmod <- function(y) {
y <- y[!is.na(y)]
l <- length(y)
y <- y[y != 0]
if (is.na(sd(y))) {
return (0)
} else if (sum(y) <= 0 || sd(y) == 0) {
return (log2(l))
} else {
y.m <- median(y)
y.u <- (y - y.m) / (5 * median(abs(y - y.m)) + 1e-04)
y.w <- rep(0, length(y))
y.i <- abs(y.u) <= 1
y.w[y.i] <- ((1 - y.u^2)^2)[y.i]
y.b <- sum(y.w * y) / sum(y.w)
p <- abs(y - y.b)
p <- p / sum(p)
e <- - sum(p * log2(p))
if (is.na(e))
e <- 0
return (e)
}
}

.entval <- function(y) {
y <- y[!is.na(y)]
l <- length(y)
y <- y[y != 0]
if (is.na(sd(y))) {
return (0)
} else if (sum(y) <= 0 || sd(y) == 0) {
return (log2(l))
} else {
p <- y / sum(y)
e <- - sum(p * log2(p))
if (is.na(e))
e <- 0
return (e)
}
}

ROKU <- function(data, upper.limit = 0.25, sort = FALSE) {
rs <- NULL
if (is.vector(data)) {
data <- t(matrix(data))
} else {
data <- as.matrix(data)
}
rs$outliers <- t(apply(t(scale(t(data))), 1,
function (y, upper.limit = upper.limit) {
.outval(y, upper.limit = upper.limit)
}, upper.limit))
rs$H <- apply(data, 1, .entval)
rs$modH <- apply(data, 1, .entvalmod)
rs$rank <- rank(rs$modH)
rs$Tbw <- apply(data, 1, .tbw)
if (!is.null(colnames(data))) {
l <- colnames(data)
} else {
l <- paste("tissue", 1:ncol(data), sep = "_")
}
if (!is.null(rownames(data))) {
r <- rownames(data)
} else {
r <- 1:nrow(data)
}
colnames(rs$outliers) <- l
rownames(rs$outliers) <- r
if (sort) {
reindex <- order(rs$rank)
rs$outliers <- rs$outliers[reindex, ]
rs$H <- rs$H[reindex]
rs$modH <- rs$modH[reindex]
rs$rank <- rs$rank[reindex]
rs$Tbw <- rs$Tbw[reindex]
}
return (rs)
}

Loading