加载地理曲线包裹。

图书馆(地理码)
##加载所需包:加载所需的包:生物根系文件##加载所需的包:并行## ##附加包:'生物根系术'## ##以下对象从“包:并行”屏蔽:####clusterapply,clusterapplylb,clustercall,clusterevalq,## clusterexport,clustermap,parapply,parcapply,parlapply,## parlapplylb,parrapply,parsapply,parsapplylb ## ##以下对象屏蔽了“包:统计”:## ##IQR,MAD,XTABS ## ##以下对象从“包:基础”屏蔽:## ## AnyDupleated,Append,As.Data.frame,As.vector,Cbind,## Colnames,Do.call,重复,eval,evalq,filter,find,get,## grep,grepl,相交,是.unsorted,lapply,长度,地图,## makply,match,mget,订单,粘贴,pmax,pmax.int,pmin,##pmin.int,位置,等级,rbind,减少,rownames,sapply,## setdiff,sort,表,tappety,Union,unique,dil,undplit ###欢迎来到Biocumon ## Vignettes包含介绍性材料;与##'BrowSevignettes()'查看。为了引用生物导体,请参阅##'引文(“Biobase”)',以及包装的引文(“PKGNAME”)'。## ##设置选项('download.file.method.geoquery'='auto')

获取数据

x = getGeOSuppfiles(“GSE20986”)
## ftp://ftp.ncbi.nlm.nih.gov/geo/series/gse20nnn/gse20986/suppl/
X
##尺寸ISDir模式## /tmp/houtan/gse20986/gse20986_raw.tar 56360960 false 644 ## /tmp/houtan/gse20986/filelist.txt 740 false 644 ## mtime ## /tmp/houtan/gse20986/gse20986_raw.tar2015-10-14 05:16:54 ## /tmp/houtan/gse20986/filelist.txt 2015-10-14 05:16:57 ## Ctime ## /tmp/houtan/gse20986/gse20986_raw.tar 2015-10-14 05:16:54 ## /tmp/houtan/gse20986/filelist.txt 2015-10-14 05:16:57 ## atime uid gid ## /tmp/houtan/gse20986/gse20986_raw.tar 2015-10-14 05:14:50 37962 37962 ## /tmp/houtan/gse20986/filelist.txt 2015-10-14 05:08:01 37962 37962 ## uname grname ## /tmp/houtan/gse20986/gse20986_raw.tar mtmorgan g_mtmorgan## /tmp/houtan/gse20986/filelist.txt mtmorgan g_mtmorgan

无阵阵数据

Untar(“GSE20986 / GSE20986_RAW.tar”,EXDIR =“数据”)

枪支数据

cels = list.files(“数据/”,模式=“[gz]”)Sapply(粘贴(“数据”,CELS,SEP =“/”),GUNZ​​IP)
##数据/ GSM524662.COCE.GZ数据/ GSM524663.COCE.GZ数据/ GSM524664.COCE.GZ ## 13555726 13555639 ##数据/ GSM524665.COR.GZ数据/ GSM524666.COR.GZ数据/ GSM524667.CEL。GZ ## 13560122 13555663 13555663 1355763 13557614 ##数据/ GSM524668.COCE.GZ数据/ GSM524669.CEL.GZ数据/ GSM524670.COCE.GZ ## 13556090 13560054 13555090 13560054 13555090 13560054 1355971 ##数据/ GSM524671.COR.GZ数据/ GSM524672.COR.GZ数据/ GSM524673.CEL.GZ ## 13554926 13555042 13555290

创建你的penodata.

penodata =矩阵(rep(list.files(“数据”),2),ncol = 2)类(phenodata)
## [1]“矩阵”
Phenodata < -  As.Data.Frame(Phenodata)Colnames(Phenodata)< -  C(“名称”,“文件名”)Penodata $ Targets < -  C(“Iris”,“Retina”,“Retina”,“Iris”,“视网膜”,“虹膜”,“脉络膜”,“脉络膜”,“脉络膜”,“HUVEC”,“HUVEC”,“HUVEC”)写道。(Phenodata,“数据/ Phenodata.txt”,Quote = F,SEP =“\ T”,Row.names = F)
图书馆(Simpleaffy)
##加载所需包:yify ##加载所需包:Genefilter ## ##附加包必填包:GCRMA
celfiles < -  read.affy(covdesc =“penodata.txt”,path =“data”)boxplot(celfiles)
##警告:加载##'HGU133PLUS2CDF'时替换以前的“utils ::尾部”
##警告:加载##'HGU133PLUS2CDF'时替换以前的“utils :: head”
##

库(RColorBrewer)Cols = Brewer.pal(8,Set1“)ESET < -  exprs(Celfiles)样本< -  Celfiles $ targets Colnames(ESET)
## [1]“GSM524663.CEL”“GSM524664.CEL”“GSM524665.CEL”GSM524666.CEL“GSM524668.CEL”“GSM524669.CEL”“GSM524669.CEL”## [9]“GSM524670.CEL”“GSM524671.CEL”“GSM524672.CEL”“GSM524673.CER”
Colnames(ESET)< -  Samples Boxplot(Celfille,Col = Cols,LAS = 2)

距离< -  dist(t(eSET),方法=“最大”)群集< -  hclust(距离)绘图(群集)

要求(simpleaffy)要求(affyplm)
##加载所需包:AFFYPLM ##加载所需包:预处理核
celfiles.gcrma = gcrma(celfiles)
##调整光学效果............完成。##计算亲和力
##加载所需包:加载所需包:Stats4 ##加载所需包:绞喉##加载所需的包:S4Vectors ## ##附加包:'Iranges' ## ##以下对象从'包屏蔽以下对象:SimpleAffy':## ##成员
## 。完毕。##调整非特异性绑定............完成。##归一化##计算表达式
par(mfrow = c(1,2))boxplot(celfiles.gcrma,col = col,las = 2,main =“后标准化”);Boxplot(Celfiles,Col = Cols,LAS = 2,Main =“预归一化”)

dev.off()
## null device ## 1
距离< -  dist(t(exprs(celfiles.gcrma)),方法=“最大”)簇< -  hclust(距离)绘图(群集)
图书馆(Limma)
## ##附加包:'limma' ## ##从“包裹:生物根系中”屏蔽以下对象:## ## plotma
phenodata.
##名称文件名目标## 1 GSM524662.COL GSM524662.CEL IRIS ## 2 GSM524663.COR RETINA ## 3 GSM524664.COR GSM524664.COR RETINA ## 4 GSM524665.COR GSM524665.COR IRIS ## 5 GSM524666。cel gsm524666.Cel retina ## 6 GSM524667.CEL IRIS ## 7 GSM524668.COR GSM524668.COR GSM524668.COR GSM524669.CEL GSM524669.CEL CHSM524669.CEL CHOROID ## 9 GSM524670.COR GSM524670.CEL CHOROID ## 10 GSM524671。Cel GSM524671.CEL HUVEC ## GSM524672.COR GSM524672.CEL HUVEC ## 12 GSM524673.CEL GSM524673.CEL HUVEC
样本< -  as.factor(样本)设计< -  model.matrix(〜0 +样本)colnames(设计)
## [1]“SamplesChoroid”“Sampleshuvec”“Samplesiris”“SamplesRetina”
Colnames(设计)< -  C(“Choroid”,“Huvec”,“Iris”,“Retina”)设计
## Choroid Huvec虹膜Retina ## 1 0 0 1 0 ## 2 0 0 0 1 ## 3 0 0 0 1 ## 4 0 0 1 0 ## 5 0 0 0 1 ## 6 0 0 1 0 ##7 1 0 0 0 0 0#8 1 0 0 0 0#9 1 0 0 0 ## 10 0 1 0 0 0 ## 11 0 1 0 0 ## 12 0 1 0 0 ## attr(,“分配”)##[1] 1 1 1 1 1 1 ## attr(,对比“)## attr(,”对比度“)$ samples ## [1]”contr.treatment“
Contrast.matrix = MakeContrasts(Huvec_Choroid = Huvec  -  Choroid,Huvec_Retina = Huvec-Retina,Huvec_Iris < -  Huvec  -  Iris,Levels = Design)Fit = Lmfit(C​​elfiles.gcrma,Design)Huvec_fit < -  Formast.fit(适合,对比度。矩阵)HUVEC_EBAY < -  eBayes(HUVEC_FIT)库(HGU133PLUS2.DB)
##加载所需包:org.hs.eg.db ##加载所需包:DBI
图书馆(注释)
##加载所需包:XML
probenames.list < -  rownames(toptable(huvec_ebay,number = 100000))getsymbols < -  getsymbol(probenames.list,“hgu133plus2”)结果< -  toptable(huvec_ebay,number = 100000,cof =“huvec_choroid”)结果< -  cbind(结果,getsymbols)

制作门槛

摘要(结果)
## logfc aveexpr t p.value ## min。:-9.19111分钟。:2.279分钟。:-39.77473分钟。:0.0000 ## 1ST Qu.:-0.05967 1st qu。:-0.70649 1st qu。:0.70649 1st qu.:0.1523 ##中位数:0.00000中位数:2.480中位数:0.00000中位数:0.05079 ##均值:-0.02353意思:4.375平均值:0.07441意思是:0.5346 ## 3rd qu。:0.03986 3rd qu。:6.241 3rd qu。:0.67455 3rd qu.:1.0000 ## max。:最多8.67086。:最多15.541。:296.84201 Max。:1.0000 ####JAG.VAL B Getsymbols ## min。 :0.0000 Min. :-7.710 YME1L1 : 22 ## 1st Qu.:0.6036 1st Qu.:-7.710 HFE : 15 ## Median :1.0000 Median :-7.451 CFLAR : 14 ## Mean :0.7436 Mean :-6.582 NRP2 : 14 ## 3rd Qu.:1.0000 3rd Qu.:-6.498 ARHGEF12: 13 ## Max. :1.0000 Max. :21.290 (Other) :42280 ## NA's :12317
结果$阈值< - “1”A < - 子集(结果,adj.p.val <0.05和logfc> 5)结果[Rownames(A),“阈值”] < - “2”B < - 子集(结果,adj.p.val <0.05和logfc <-5)结果[Rownames(b),“阈值”] < - “3”表(结果$阈值)
## ## 1 2 3 ## 54587 33 55

制作GGPLOT.

库(GGPlot2)Volcano < -  Ggplot(数据=结果,AES(x = logfc,y = -1 * log10(adj.p.val),color = throupold,label = getsymbols))Volcano < -  Volano + GeoM_Point()+ scale_color_manual(值= c(“黑色”,“红色”,“绿色”),标签= c(“不显着”,“上调”,“下调”),name =“键/图例”)Volcano + GeoM_Text(数据=子集(结果,logfc> 5&-1 * log10(adj.p.val)> 5),aes(x = logfc,y = -1 * log10(adj.p.val),color =阈值,标签= getsymbols))
##警告:删除了包含缺失值(GeoM_Text)的4行。

Geo Link.