> source("http://bioconductor.org/biocLite.R")
> biocLite()
> biocLite(c("GenomicFeatures", "AnnotationDbi"))
> biocLite
function (pkgs = c("Biobase", "IRanges", "AnnotationDbi"), suppressUpdates = FALSE,
suppressAutoUpdate = FALSE, siteRepos = character(), ask = TRUE,
if (missing(pkgs))
pkgs <- pkgs[!pkgs %in% rownames(installed.packages())]
if (!suppressAutoUpdate && !.isCurrentBiocInstaller()) {
on.exit(.updateBiocInstaller(pkgs, ask = ask, suppressUpdates = suppressUpdates,
siteRepos = siteRepos, ...))
else if ("BiocUpgrade" %in% pkgs) {
else {
.biocLiteInstall(pkgs, ask = ask, siteRepos = siteRepos,
suppressUpdates = suppressUpdates, ...)
<environment: namespace:BiocInstaller>
> chooseBioCmirror()
HTTPS BioC mirror
1: 0-Bioconductor (World-wide) [https]
2: Germany (Dortmund) [https]
3: United Kingdom (Hinxton) [https]
4: Japan (Wako) [https]
5: China (Anhui) [https]
6: (HTTP mirrors)
Selection: 4
> chooseCRANmirror()
1: 0-Cloud [https] 2: Austria [https]
3: Chile [https] 4: China (Beijing 4) [https]
5: China (Hefei) [https] 6: Colombia (Cali) [https]
7: France (Lyon 2) [https] 8: Germany (Munster) [https]
9: Iceland [https] 10: Russia (Moscow) [https]
11: Spain (A Coruna) [https] 12: Switzerland [https]
13: UK (Bristol) [https] 14: UK (Cambridge) [https]
15: USA (CA 1) [https] 16: USA (KS) [https]
17: USA (MI 1) [https] 18: USA (TN) [https]
19: USA (TX) [https] 20: USA (WA) [https]
21: (HTTP mirrors)
メニューから項目を入力するか、0 を入力して終了して下さい
Selection: 0
BioconductorのAnnotation Data Packageを試す。
対象は、AffymetrixのHuman RNA解析Chip
3' IVT Expression Analysis | Gene Regulation Analysis | miRNA Analysis | Whole-Transcript Expression Analysis & Profiling
3' IVT Expression Analysis → Human Genome U133A Arrayのデータパッケージ「hgu133a.db」

> ?hgu133a.db  # ヘルプで確認
> biocLite("hgu133a.db")
> library("hgu133a.db")
> ls("package:hgu133a.db")
[1] "hgu133a" "hgu133a.db" "hgu133a_dbconn"
[4] "hgu133a_dbfile" "hgu133a_dbInfo" "hgu133a_dbschema"
[7] "hgu133aACCNUM" "hgu133aALIAS2PROBE" "hgu133aCHR"
[10] "hgu133aCHRLENGTHS" "hgu133aCHRLOC" "hgu133aCHRLOCEND"
[13] "hgu133aENSEMBL" "hgu133aENSEMBL2PROBE" "hgu133aENTREZID"
[16] "hgu133aENZYME" "hgu133aENZYME2PROBE" "hgu133aGENENAME"
[19] "hgu133aGO" "hgu133aGO2ALLPROBES" "hgu133aGO2PROBE"
[22] "hgu133aMAP" "hgu133aMAPCOUNTS" "hgu133aOMIM"
[25] "hgu133aORGANISM" "hgu133aORGPKG" "hgu133aPATH"
[28] "hgu133aPATH2PROBE" "hgu133aPFAM" "hgu133aPMID"
[31] "hgu133aPMID2PROBE" "hgu133aPROSITE" "hgu133aREFSEQ"
[34] "hgu133aSYMBOL" "hgu133aUNIGENE" "hgu133aUNIPROT"
> myMap<-hgu133aENTREZID  # myMap変数に抽出
> myMap
ENTREZID map for chip hgu133a (object of class "ProbeAnnDbBimap")
> summary(myMap)
ENTREZID map for chip hgu133a (object of class "ProbeAnnDbBimap")
| Lkeyname: probe_id (Ltablename: probes)
| Lkeys: "1007_s_at", "1053_at", ... (total=22283/mapped=19846)
| Rkeyname: gene_id (Rtablename: genes)
| Rkeys: "1", "2", ... (total=56340/mapped=12434)
| direction: L --> R
> mapped_probes<-mappedkeys(myMap)
> summary(mapped_probes)
Length Class Mode
19846 character character
> MyEntrez <- as.list(myMap[mapped_probes[1:5]])
> MyEntrez  # EntrezID番号
[1] "5982"
[1] "3310"
[1] "7849"
[1] "2978"
[1] "7067"
> MyEntrez[1]  # listエントリ1番目データへのアクセス
[1] "5982"
> MyEntrez[[1]]  # listエントリ1番目データの中身へアクセス
[1] "5982"
> d1 <- c()  # 空の変数作成
> for (i in 1:3){ d1<- append(d1, MyEntrez[[i]]) }
> d1
[1] "5982" "3310" "7849"
> biocLite("org.Hs.eg.db")
> library(org.Hs.eg.db)

> myEIDs<-c("1","10","100","1000","37690")
> myEIDs
[1] "1" "10" "100" "1000" "37690"
> ls("package:org.Hs.eg.db")
[1] "org.Hs.eg" "org.Hs.eg.db"
[3] "org.Hs.eg_dbconn" "org.Hs.eg_dbfile"
[5] "org.Hs.eg_dbInfo" "org.Hs.eg_dbschema"
[7] "org.Hs.egACCNUM" "org.Hs.egACCNUM2EG"
[9] "org.Hs.egALIAS2EG" "org.Hs.egCHR"
[11] "org.Hs.egCHRLENGTHS" "org.Hs.egCHRLOC"
[13] "org.Hs.egCHRLOCEND" "org.Hs.egENSEMBL"
[15] "org.Hs.egENSEMBL2EG" "org.Hs.egENSEMBLPROT"
[17] "org.Hs.egENSEMBLPROT2EG" "org.Hs.egENSEMBLTRANS"
[19] "org.Hs.egENSEMBLTRANS2EG" "org.Hs.egENZYME"
[21] "org.Hs.egENZYME2EG" "org.Hs.egGENENAME"
[23] "org.Hs.egGO" "org.Hs.egGO2ALLEGS"
[25] "org.Hs.egGO2EG" "org.Hs.egMAP"
[27] "org.Hs.egMAP2EG" "org.Hs.egMAPCOUNTS"
[29] "org.Hs.egOMIM" "org.Hs.egOMIM2EG"
[31] "org.Hs.egORGANISM" "org.Hs.egPATH"
[33] "org.Hs.egPATH2EG" "org.Hs.egPFAM"
[35] "org.Hs.egPMID" "org.Hs.egPMID2EG"
[37] "org.Hs.egPROSITE" "org.Hs.egREFSEQ"
[39] "org.Hs.egREFSEQ2EG" "org.Hs.egSYMBOL"
[41] "org.Hs.egSYMBOL2EG" "org.Hs.egUCSCKG"
[43] "org.Hs.egUNIGENE" "org.Hs.egUNIGENE2EG"
[45] "org.Hs.egUNIPROT"
> mySymbols<-mget(myEIDs,org.Hs.egSYMBOL,ifnotfound=NA)
> mySymbols
[1] "A1BG"
[1] "NAT2"
[1] "ADA"
[1] "CDH2"
[1] NA
> y<-mySymbols[!is.na(mySymbols)]
> y
1 10 100 1000
"A1BG" "NAT2" "ADA" "CDH2"
> myEIDs<-mget(y,org.Hs.egSYMBOL2EG,ifnotfound=NA)  # ※本と違うので注意
> myEIDs
[1] "1"
[1] "10"
[1] "100"
[1] "1000"
KEGG API: パスウェイで見たい生物種の遺伝子(EC番号)のみ表示できる
https://www.google.co.jp/search?q=KEGG+API&hl=ja&source=lnms&tbm=isch&sa=X&ved=0CAgQ_AUoAWoVChMIz-fmgOusyAIVYeKmCh0u_AlN&biw=1008&bih=632
> biocLite("KEGG.db")
> library(KEGG.db)
KEGG.db contains mappings based on older data because the original
resource was removed from the the public domain before the most recent
update was produced. This package should now be considered deprecated
and future versions of Bioconductor may not have it available. Users
who want more current data are encouraged to look at the KEGGREST or
reactome.db packages
> ?KEGG.db
> ls("package:KEGG.db")
[1] "KEGG" "KEGG_dbconn" "KEGG_dbfile" "KEGG_dbInfo"
> myEID <- unlist(mget(y, org.Hs.egSYMBOL2EG, ifnotfound=NA))
> myEID<-as.character(myEID)
> myEID
[1] "1" "10" "100" "1000"
> kegg<-mget(myEID,KEGGEXTID2PATHID,ifnotfound=list(NA))
=>Entrez(Gene)IDからKEGG PathwayIDにマップするオブジェクト
> kegg
[1] NA
[1] "hsa00232" "hsa00983" "hsa01100"
[1] "hsa00230" "hsa01100" "hsa05340"
[1] "hsa04514" "hsa05412"
> kegg[[2]]
[1] "hsa00232" "hsa00983" "hsa01100"
> kegg[[2]][1]
[1] "hsa00232"
> tmp1<-substr(kegg[[2]][1],4,8)  # 番号だけを抽出
> tmp1
[1] "00232"
> mypath1<-unlist(mget(tmp1,KEGGPATHID2NAME,ifnotfound=list(NA)))
=>KEGG PathwayIDからKEGG Pathway Nameにマップするオブジェクト
> mypath1
"Caffeine metabolism"
> biocLite("KEGGREST")
> library(KEGGREST)
> genes<-keggGet("hsa:1045")
> genes
[1] "CDX2, CDX-3, CDX2/AS, CDX3"
[1] "(RefSeq) caudal type homeobox 2"
"homeobox protein CDX"
"Homo sapiens (human)"
[1] "Transcription factors [BR:hsa03000]" " Eukaryotic Type"
[3] " Helix-turn-helix" " Homeo domain only, Cad"
[5] " 1045 (CDX2)"
[1] "13q12.3"
[1] "Pfam: Caudal_act Homeobox Homeobox_KN"
[1] "NCBI-ProteinID: NP_001256" "NCBI-GeneID: 1045"
[3] "OMIM: 600297" "HGNC: 1806"
[5] "HPRD: 02622" "UniProt: Q99626"
A AAStringSet instance of length 1
width seq
A DNAStringSet instance of length 1
width seq