13、几类控制探针组

  Affymetrix阵列包含一些控制探针组,用“AFFX”、“INTRON”、“EXON”注释。

 

一、一些芯片的控制探针组是用“AFFX”开头的,没有“INTRON”和“EXON”探针组,如“HG-U133A_2”。获取“HG-U133A_2”的“AFFX”探针组名:

 

# Collect the names of the "AFFX" control probe sets defined in a chip's CDF.
library(affy)

# CDF name of the chip to inspect.
cdfname <- "HG-U133A_2"

# Lookup strategies stored under the "BioC" option; each entry is read below
# through its `what` (strategy kind) and `where` (location) fields.
how <- getOption("BioC")$affy$probesloc
verbose <- FALSE

if (length(how) == 0) {
  stop("No available method to obtain the CDF environment", call. = FALSE)
}

# Try each strategy in turn and keep the first one that yields an environment.
# Without the early exit, the result of a later (possibly failing) strategy
# would overwrite a good environment and `ls(envir)` would break.
envir <- NULL
badOut <- list()
for (i in seq_along(how)) {
  cur <- how[[i]]
  out <- switch(cur$what,
    environment = cdfFromEnvironment(cdfname, cur$where, verbose),
    libPath = cdfFromLibPath(cdfname, cur$where, verbose = verbose),
    bioC = cdfFromBioC(cdfname, cur$where, verbose)
  )
  if (is.environment(out)) {
    envir <- out
    break
  }
  # Anything that is not an environment is kept as a failure report.
  badOut <- c(badOut, out)
}

if (is.null(envir)) {
  stop(
    "Could not obtain CDF environment, problems encountered:\n",
    paste(unlist(badOut), collapse = "\n"),
    call. = FALSE
  )
}

# Every object name in the CDF environment is a probe set name.
genenames <- ls(envir)

# Probe sets whose name contains the literal string "AFFX".
affxnames <- unique(grep("AFFX", genenames, fixed = TRUE, value = TRUE))

> affxnames

 [1] "AFFX-BioB-3_at"              "AFFX-BioB-5_at"             

 [3] "AFFX-BioB-M_at"              "AFFX-BioC-3_at"             

 [5] "AFFX-BioC-5_at"              "AFFX-BioDn-3_at"            

 [7] "AFFX-BioDn-5_at"             "AFFX-CreX-3_at"             

 [9] "AFFX-CreX-5_at"              "AFFX-DapX-3_at"             

[11] "AFFX-DapX-5_at"              "AFFX-DapX-M_at"             

[13] "AFFX-HSAC07/X00351_3_at"     "AFFX-HSAC07/X00351_5_at"    

[15] "AFFX-HSAC07/X00351_M_at"     "AFFX-hum_alu_at"            

[17] "AFFX-HUMGAPDH/M33197_3_at"   "AFFX-HUMGAPDH/M33197_5_at"  

[19] "AFFX-HUMGAPDH/M33197_M_at"   "AFFX-HUMISGF3A/M97935_3_at" 

[21] "AFFX-HUMISGF3A/M97935_5_at"  "AFFX-HUMISGF3A/M97935_MA_at"

[23] "AFFX-HUMISGF3A/M97935_MB_at" "AFFX-HUMRGE/M10098_3_at"    

[25] "AFFX-HUMRGE/M10098_5_at"     "AFFX-HUMRGE/M10098_M_at"    

[27] "AFFX-LysX-3_at"              "AFFX-LysX-5_at"             

[29] "AFFX-LysX-M_at"              "AFFX-M27830_3_at"           

[31] "AFFX-M27830_5_at"            "AFFX-M27830_M_at"           

[33] "AFFX-PheX-3_at"              "AFFX-PheX-5_at"             

[35] "AFFX-PheX-M_at"              "AFFX-r2-Bs-dap-3_at"        

[37] "AFFX-r2-Bs-dap-5_at"         "AFFX-r2-Bs-dap-M_at"        

[39] "AFFX-r2-Bs-lys-3_at"         "AFFX-r2-Bs-lys-5_at"        

[41] "AFFX-r2-Bs-lys-M_at"         "AFFX-r2-Bs-phe-3_at"        

[43] "AFFX-r2-Bs-phe-5_at"         "AFFX-r2-Bs-phe-M_at"        

[45] "AFFX-r2-Bs-thr-3_s_at"       "AFFX-r2-Bs-thr-5_s_at"      

[47] "AFFX-r2-Bs-thr-M_s_at"       "AFFX-r2-Ec-bioB-3_at"       

[49] "AFFX-r2-Ec-bioB-5_at"        "AFFX-r2-Ec-bioB-M_at"       

[51] "AFFX-r2-Ec-bioC-3_at"        "AFFX-r2-Ec-bioC-5_at"       

[53] "AFFX-r2-Ec-bioD-3_at"        "AFFX-r2-Ec-bioD-5_at"       

[55] "AFFX-r2-P1-cre-3_at"         "AFFX-r2-P1-cre-5_at"        

[57] "AFFX-ThrX-3_at"              "AFFX-ThrX-5_at"             

[59] "AFFX-ThrX-M_at"              "AFFX-TrpnX-3_at"            

[61] "AFFX-TrpnX-5_at"             "AFFX-TrpnX-M_at"

 

affxnames的输出结果中可以看到AFFX-r2-Bs-lys-3_at、AFFX-r2-Bs-dap-3_at、AFFX-r2-Bs-phe-3_at、AFFX-r2-Bs-thr-3_s_at、AFFX-r2-Ec-bioB-3_at、AFFX-r2-Ec-bioC-3_at、AFFX-r2-Ec-bioD-3_at、AFFX-r2-P1-cre-3_at、AFFX-HSAC07/X00351_3_at、AFFX-HUMGAPDH/M33197_3_at这类探针组,它们是一些嵌入(spike-in)探针组或beta-actin、GAPDH基因的探针组。

 

二、一些芯片包含了“AFFX”、“INTRON”和“EXON”探针组,不过这些探针组也并没有用“AFFX”、“INTRON”、“EXON”显式地表示,如“HuGene-1_0-st-v1”。获取“HuGene-1_0-st-v1”的控制探针组名:

 

# Split the control probe sets of a chip into "affx", "exon" and "intron"
# groups using the control table shipped with the ArrayTools package.
library(affy)
# library() fails loudly when ArrayTools is missing; require() would only
# return FALSE and let the script fail later with an unrelated error.
library(ArrayTools)

# CDF name of the chip to inspect.
cdfname <- "HuGene-1_0-st-v1"

# Lookup strategies stored under the "BioC" option; each entry is read below
# through its `what` (strategy kind) and `where` (location) fields.
how <- getOption("BioC")$affy$probesloc
verbose <- FALSE

if (length(how) == 0) {
  stop("No available method to obtain the CDF environment", call. = FALSE)
}

# Try each strategy in turn and keep the first one that yields an environment.
# Without the early exit, the result of a later (possibly failing) strategy
# would overwrite a good environment and `ls(envir)` would break.
envir <- NULL
badOut <- list()
for (i in seq_along(how)) {
  cur <- how[[i]]
  out <- switch(cur$what,
    environment = cdfFromEnvironment(cdfname, cur$where, verbose),
    libPath = cdfFromLibPath(cdfname, cur$where, verbose = verbose),
    bioC = cdfFromBioC(cdfname, cur$where, verbose)
  )
  if (is.environment(out)) {
    envir <- out
    break
  }
  # Anything that is not an environment is kept as a failure report.
  badOut <- c(badOut, out)
}

if (is.null(envir)) {
  stop(
    "Could not obtain CDF environment, problems encountered:\n",
    paste(unlist(badOut), collapse = "\n"),
    call. = FALSE
  )
}

# Probe set names defined in the CDF environment.
genenames <- ls(envir)

# Name of the control data set: the cleaned CDF name with its last two
# characters dropped and "CONTROL" appended.
# NOTE(review): the two dropped characters are presumably the "v1" version
# suffix, giving "hugene10stCONTROL" -- confirm against ArrayTools' data sets.
annotation <- cleancdfname(cdfname, addcdf = FALSE)
dataTable <- paste0(substr(annotation, 1, nchar(annotation) - 2), "CONTROL")

# Load the data set by name; data(list = ) avoids building and evaluating
# source text with eval(parse()).
data(list = dataTable, package = "ArrayTools")
if (!exists(dataTable)) {
  stop("Control data set '", dataTable, "' was not found", call. = FALSE)
}
cntrl <- get(dataTable)

# Column 2 is matched against the control type and column 1 is what gets
# compared with the probe set names.
# NOTE(review): presumably column 1 = probe set ID, column 2 = control type.
affx <- cntrl[grep("affx", cntrl[, 2]), 1]
exon <- cntrl[grep("exon", cntrl[, 2]), 1]
intron <- cntrl[grep("intron", cntrl[, 2]), 1]

# All control probe sets listed in the table.
controlnames <- cntrl[, 1]

# Keep only the control probe sets that are actually present in the CDF.
affxnames <- affx[affx %in% genenames] # "AFFX" probe sets
exonnames <- exon[exon %in% genenames] # "EXON" probe sets
intronnames <- intron[intron %in% genenames] # "INTRON" probe sets

 

> affxnames

 [1] 7892796 7892925 7893130 7893306 7893613 7893939 7894584 7894611 7894970

[10] 7895139 7895220 7896160 7896366

 

posted @ 2015-05-22 14:58  洗浄  阅读(1305)  评论(0编辑  收藏  举报