#以下为安装TCGAbiolinks的R包
#1)第一种
if (!requireNamespace("BiocManager", quietly=TRUE))
install.packages("BiocManager")
BiocManager::install("TCGAbiolinks")
#2)第二种
#可以先下载到本地安装比较快
#Tools > install.packages
#3) 第三种
devtools::install_github(repo = "BioinformaticsFMRP/TCGAbiolinks")
#################################
# TCGA-12-4567-01-blah-blah --> 这是Normal
# TCGA-12-4567-11-blah-blah --> 这是tumor
# 注意黑体的部分。01-09是tumor;10-19是Normal;20-29是Control
####加载程序包
library(TCGAbiolinks)
library(dplyr)
library(DT)
library(SummarizedExperiment)
#################################
#下面填入要下载的癌症种类
request_cancer=c("PRAD","BLCA","KICH","KIRC","KIRP")
for (i in request_cancer) {
cancer_type=paste("TCGA",i,sep="-")
print(cancer_type)
#下载临床数据
clinical <- GDCquery_clinic(project = cancer_type, type = "clinical")
write.csv(clinical,file = paste(cancer_type,"clinical.csv",sep = "-"))
#下载rna-seq的counts数据
query <- GDCquery(project = cancer_type,
data.category = "Transcriptome Profiling",
data.type = "Gene Expression Quantification",
workflow.type = "HTSeq - Counts")
GDCdownload(query, method = "api", files.per.chunk = 100)
expdat <- GDCprepare(query = query)
count_matrix=assay(expdat)
write.csv(count_matrix,file = paste(cancer_type,"Counts.csv",sep = "-"))
#下载miRNA数据
query <- GDCquery(project = cancer_type,
data.category = "Transcriptome Profiling",
data.type = "miRNA Expression Quantification",
workflow.type = "BCGSC miRNA Profiling")
GDCdownload(query, method = "api", files.per.chunk = 50)
expdat <- GDCprepare(query = query)
count_matrix=assay(expdat)
write.csv(count_matrix,file = paste(cancer_type,"miRNA.csv",sep = "-"))
#下载Copy Number Variation数据
query <- GDCquery(project = cancer_type,
data.category = "Copy Number Variation",
data.type = "Copy Number Segment")
GDCdownload(query, method = "api", files.per.chunk = 50)
expdat <- GDCprepare(query = query)
count_matrix=assay(expdat)
write.csv(count_matrix,file = paste(cancer_type,"Copy-Number-Variation.csv",sep = "-"))
#下载甲基化数据
query.met <- GDCquery(project =cancer_type,
legacy = TRUE,
data.category = "DNA methylation")
GDCdownload(query.met, method = "api", files.per.chunk = 300)
expdat <- GDCprepare(query = query)
count_matrix=assay(expdat)
write.csv(count_matrix,file = paste(cancer_type,"methylation.csv",sep = "-"))
}
TCGAbiolinks下载TCGA数据
最后编辑于 :
©著作权归作者所有,转载或内容合作请联系作者
【社区内容提示】社区部分内容疑似由AI辅助生成,浏览时请结合常识与多方信息审慎甄别。
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。
【社区内容提示】社区部分内容疑似由AI辅助生成,浏览时请结合常识与多方信息审慎甄别。
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。
相关阅读更多精彩内容
- The data retrieval is handled by the three main TCGAbioli...
- 1. 什么是TCGA?TCGA中有哪些数据? TCGA的全称是The Cancer Genome Atlas, 这...
- 参考学习资料:还是小洁老师的TCGA-3.R包TCGA-biolinks下载数据下载安装包 这个包有点大,安装需要...
- 首先到官网下载需要的包:http://www.keepalived.org/download.html [root...