[Robast-commits] r279 - pkg/RobLoxBioC/inst/scripts

noreply at r-forge.r-project.org noreply at r-forge.r-project.org
Thu Apr 9 12:57:25 CEST 2009


Author: stamats
Date: 2009-04-09 12:57:25 +0200 (Thu, 09 Apr 2009)
New Revision: 279

Modified:
   pkg/RobLoxBioC/inst/scripts/AffymetrixExample.R
   pkg/RobLoxBioC/inst/scripts/IlluminaExample.R
Log:
small modifications

Modified: pkg/RobLoxBioC/inst/scripts/AffymetrixExample.R
===================================================================
--- pkg/RobLoxBioC/inst/scripts/AffymetrixExample.R	2009-04-09 06:41:59 UTC (rev 278)
+++ pkg/RobLoxBioC/inst/scripts/AffymetrixExample.R	2009-04-09 10:57:25 UTC (rev 279)
@@ -27,7 +27,7 @@
 ## and
 ## http://www.genelogic.com/media/studies/dilution.cfm        (not found)
 ## seem not to lead to the data any longer.
-## An email to the support of genelogic is still unanswered ...
+## An email to the support of genelogic remained unanswered ...
 ###############################################################################
 
 
@@ -70,10 +70,10 @@
 ###########################################################
 library(RobLoxBioC)
 
-## takes more than 90 min on Intel P9500 (64bit Linux, 4 GByte RAM)
-#system.time(minKD.hgu95a <- KolmogorovMinDist(spikein.hgu95a, Norm()))
+## takes more than 100 min on Intel P9500 (64bit Linux, 4 GByte RAM)
+system.time(minKD.hgu95a <- KolmogorovMinDist(spikein.hgu95a, Norm()))
 ## takes more than 130 min on Intel P9500 (64bit Linux, 4 GByte RAM)
-#system.time(minKD.hgu133a <- KolmogorovMinDist(spikein.hgu133a, Norm()))
+system.time(minKD.hgu133a <- KolmogorovMinDist(spikein.hgu133a, Norm()))
 
 ## load the results from R-forge ...
 con <- url("http://robast.r-forge.r-project.org/data/minKD_hgu95a.RData")
@@ -85,8 +85,51 @@
 
 boxplot(as.data.frame(minKD.hgu95a$dist), main = "HGU95a")
 boxplot(as.data.frame(minKD.hgu133a$dist), main = "HGU133a")
+table(minKD.hgu95a$n)
+table(minKD.hgu133a$n)
 
+###########################################################
+## Comparison with normal samples
+###########################################################
 
+## takes more than 90 min on Intel P9500 (64bit Linux, 4 GByte RAM)
+ns <- 5:20
+M <- length(ns)
+minKD.norm <- matrix(NA, nrow = 50000, ncol = M)
+for(i in seq_len(M)){
+    print(i)
+    temp <- matrix(rnorm(50000*ns[i]), ncol = ns[i])
+    minKD.norm[,i] <- KolmogorovMinDist(temp, Norm())$dist
+}
+colnames(minKD.norm) <- ns
+
+## load the results from R-forge
+con <- url("http://robast.r-forge.r-project.org/data/minKD_norm.RData")
+load(file = con)
+close(con)
+
+x11(width = 14)
+par(mfrow = c(1, 3))
+res <- split(as.vector(minKD.hgu95a$dist), as.vector(minKD.hgu95a$n))
+uni.n <- sort(unique(as.vector(minKD.hgu95a$n)))
+boxplot(res, main = "HGU95a", ylim = c(0, 0.45), 
+        ylab = "minimum Kolmogorov distance", xlab = "sample size")
+lines(1:length(uni.n), 1/(2*uni.n), col = "orange", lwd = 2)
+legend("topright", legend = "minimal possible distance", fill = "orange")
+
+res <- split(as.vector(minKD.hgu133a$dist), as.vector(minKD.hgu133a$n))
+uni.n <- sort(unique(as.vector(minKD.hgu133a$n)))
+boxplot(res, main = "HGU133a", ylim = c(0, 0.45), 
+        ylab = "minimum Kolmogorov distance", xlab = "sample size")
+lines(1:length(uni.n), 1/(2*uni.n), col = "orange", lwd = 2)
+legend("topright", legend = "minimal possible distance", fill = "orange")
+
+boxplot(as.data.frame(minKD.norm), main = "Normal samples", ylim = c(0, 0.45), 
+        ylab = "minimum Kolmogorov distance", xlab = "sample size")
+lines(1:length(ns), 1/(2*ns), col = "orange", lwd = 2)
+legend("topright", legend = "minimal possible distance", fill = "orange")
+
+
 ###########################################################
 ## assessments for MAS 5.0 and RMA including dilution data from package affycomp
 ###########################################################

Modified: pkg/RobLoxBioC/inst/scripts/IlluminaExample.R
===================================================================
--- pkg/RobLoxBioC/inst/scripts/IlluminaExample.R	2009-04-09 06:41:59 UTC (rev 278)
+++ pkg/RobLoxBioC/inst/scripts/IlluminaExample.R	2009-04-09 10:57:25 UTC (rev 279)
@@ -91,9 +91,6 @@
 rm(bld.sharpen.normexp); gc()
 
 
-
-
-
 ## no sharpening, no local background subtraction
 bld.nosharpen.nobgc <- readIllumina(path = "./SpikeInData", textType=".csv", 
                                     arrayNames=targets$ArrayNo,
@@ -302,6 +299,7 @@
 #            simdataarray2 at beadData[[arraynms[i]]]$G[ind] <- 2^16
         ## problem: there are bead types where more than 50% of the values are contaminated
         ## => there is no meaningful estimator which can handle this!
+        ## Hence, we contiminate bead-type wise
             sel <- which(simdataarray2 at beadData[[arraynms[i]]]$ProbeID != 0)
             pr <- simdataarray2 at beadData[[arraynms[i]]]$ProbeID[sel]
             probes <- sort(unique(pr))



More information about the Robast-commits mailing list