HTSeq counts
# Select the GDC projects to check for "HTSeq - Counts" data.
# TCGA and TARGET projects are excluded by the pattern below, together with
# the following projects, which do not have RNA-seq data:
# - VAREPOP-APOLLO
# - FM-AD
# - BEATAML1.0-CRENOLANIB
project <- grep(
    "TCGA|TARGET|VAREPOP|FM-AD|CRENO",
    sort(getGDCprojects()$project_id),
    invert = TRUE,
    value = TRUE
)

for (proj in project) {
    # One markdown sub-heading per project.
    cat("\n\n## ", proj, "\n\n")
    tryCatch({
        # First query: list every HTSeq count file available for the project.
        query <- GDCquery(
            project = proj,
            data.category = "Transcriptome Profiling",
            data.type = "Gene Expression Quantification",
            workflow.type = "HTSeq - Counts"
        )
        # Second query: restrict to at most 10 cases to keep the download
        # small. head() is used instead of `[1:10]` because the latter pads
        # the barcode vector with NA when fewer than 10 cases exist.
        query <- GDCquery(
            project = proj,
            data.category = "Transcriptome Profiling",
            data.type = "Gene Expression Quantification",
            workflow.type = "HTSeq - Counts",
            barcode = head(getResults(query)$cases, 10)
        )
        GDCdownload(query)
        # Silence whatever GDCprepare() prints; only the object is wanted.
        # NOTE: the variable must be called `data` -- the chunk generated by
        # kexpand.df() appears to reference it by that name (confirm against
        # the setup chunk).
        invisible(capture.output(
            data <- GDCprepare(query)
        ))
        # Knit a child chunk, labelled with the project id, that prints `data`.
        kexpand.df(proj)
    }, error = function(e) {
        # Best effort: report the failure and continue with the next project
        # (e.g. projects that have no matching files).
        message(e)
    })
    cat("\n\n")
}
BEATAML1.0-COHORT
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): BA2611R BA3038R ... BA2842R BA2450R
## colData names(30): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
CGCI-BLGSP
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): BLGSP-71-06-00162-01A BLGSP-71-06-00159-01A ...
## BLGSP-71-08-00029-01A BLGSP-71-08-00508-01B
## colData names(55): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
CPTAC-2
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): ad5c848c-ae26-42c8-874e-387a09
## 2ddefa4f-77aa-416f-93f3-904e07 ... a2f03d85-5f1a-4b3e-9dbf-74e67e
## 4798bb9d-7100-43aa-b615-85897d
## colData names(35): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
CPTAC-3
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): C3L-00448-01 C3L-00096-01 ... C3N-00491-02 C3N-00390-06
## colData names(69): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
CTSP-DLBCL1
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): DLBCL11280-sample DLBCL11295-sample ... DLBCL11319-sample
## DLBCL11284-sample
## colData names(42): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
GENIE-DFCI
14232 |
14232 |
Simple Nucleotide Variation |
14232 |
14232 |
Copy Number Variation |
GENIE-GRCC
1038 |
1038 |
Simple Nucleotide Variation |
GENIE-JHU
3320 |
3320 |
Simple Nucleotide Variation |
GENIE-MDA
3857 |
3857 |
Simple Nucleotide Variation |
GENIE-MSK
16823 |
16823 |
Simple Nucleotide Variation |
16823 |
16823 |
Copy Number Variation |
2824 |
2824 |
Somatic Structural Variation |
GENIE-NKI
801 |
801 |
Simple Nucleotide Variation |
GENIE-UHN
2632 |
2632 |
Simple Nucleotide Variation |
GENIE-VICC
2052 |
2052 |
Simple Nucleotide Variation |
1473 |
1473 |
Copy Number Variation |
308 |
308 |
Somatic Structural Variation |
HCMI-CMDC
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): HCM-CSHL-0063-C18-85A HCM-CSHL-0065-C20-06A ...
## HCM-BROD-0011-C71-01A HCM-BROD-0012-C71-01A
## colData names(58): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
MMRF-COMMPASS
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): MMRF_2475_1_BM_CD138pos MMRF_2836_1_BM_CD138pos ...
## MMRF_2597_1_BM_CD138pos MMRF_2807_1_BM_CD138pos
## colData names(41): barcode sample ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
NCICCR-DLBCL
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): DLBCL11676-sample DLBCL10991-sample ... DLBCL10951-sample
## DLBCL10995-sample
## colData names(32): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
OHSU-CNL
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): 3784R 2474R ... 4191R 2648R
## colData names(31): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
ORGANOID-PANCREATIC
## class: RangedSummarizedExperiment
## dim: 56512 10
## metadata(1): data_release
## assays(1): HTSeq - Counts
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(10): S158 S181 ... S194 S211
## colData names(31): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
STAR counts
# Projects checked for "STAR - Counts" data (hard-coded subset).
project <- c("CPTAC-3", "MMRF-COMMPASS", "TARGET-OS", "CGCI-BLGSP")

for (proj in project) {
    # One markdown sub-heading per project.
    cat("\n\n## ", proj, "\n\n")
    tryCatch({
        # First query: list every STAR count file available for the project.
        query <- GDCquery(
            project = proj,
            data.category = "Transcriptome Profiling",
            data.type = "Gene Expression Quantification",
            workflow.type = "STAR - Counts"
        )
        # Second query: restrict to at most 4 cases to keep the download
        # small. head() is used instead of `[1:4]` because the latter pads
        # the barcode vector with NA when fewer than 4 cases exist.
        query <- GDCquery(
            project = proj,
            data.category = "Transcriptome Profiling",
            data.type = "Gene Expression Quantification",
            workflow.type = "STAR - Counts",
            barcode = head(getResults(query)$cases, 4)
        )
        GDCdownload(query)
        # Silence whatever GDCprepare() prints; only the object is wanted.
        # NOTE: the variable must be called `data` -- the chunk generated by
        # kexpand.df() appears to reference it by that name (confirm against
        # the setup chunk).
        invisible(capture.output(
            data <- GDCprepare(query)
        ))
        # The label is prefixed so it cannot clash with a child chunk that is
        # labelled with the bare project id (label typo "START" fixed).
        kexpand.df(paste0("STAR counts - ", proj))
    }, error = function(e) {
        # Best effort: report the failure and continue with the next project.
        message(e)
    })
    cat("\n\n")
}
CPTAC-3
## class: RangedSummarizedExperiment
## dim: 56512 4
## metadata(1): data_release
## assays(3): unstranded stranded_first stranded_second
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(4): C3N-00383-04 C3N-00847-01 C3L-02365-01 C3L-01248-01
## colData names(65): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
MMRF-COMMPASS
## class: RangedSummarizedExperiment
## dim: 56512 4
## metadata(1): data_release
## assays(3): unstranded stranded_first stranded_second
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(4): MMRF_2091_1_BM_CD138pos MMRF_2422_1_BM_CD138pos
## MMRF_1048_1_BM_CD138pos MMRF_2608_1_BM_CD138pos
## colData names(39): barcode sample ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
TARGET-OS
## class: RangedSummarizedExperiment
## dim: 56512 4
## metadata(1): data_release
## assays(3): unstranded stranded_first stranded_second
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(4): TARGET-40-PANMIG-01A-01R TARGET-40-PATMXR-01A-01R
## TARGET-40-PAKXLD-01A-01R TARGET-40-0A4HXS-01A-01R
## colData names(46): nucleic.acid.code tumor.code ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
CGCI-BLGSP
## class: RangedSummarizedExperiment
## dim: 56512 4
## metadata(1): data_release
## assays(3): unstranded stranded_first stranded_second
## rownames(56512): ENSG00000000003 ENSG00000000005 ... ENSG00000281912
## ENSG00000281920
## rowData names(3): ensembl_gene_id external_gene_name
## original_ensembl_gene_id
## colnames(4): BLGSP-71-08-00194-01A BLGSP-71-06-00155-01A
## BLGSP-71-19-00113-01A BLGSP-71-08-00036-01A
## colData names(52): sample sample_submitter_id ... project_id name
## GRanges object with 56512 ranges and 3 metadata columns:
## seqnames ranges strand | ensembl_gene_id
## <Rle> <IRanges> <Rle> | <character>
## ENSG00000000003 chrX 100627108-100639991 - | ENSG00000000003
## ENSG00000000005 chrX 100584936-100599885 + | ENSG00000000005
## ENSG00000000419 chr20 50934867-50958555 - | ENSG00000000419
## ENSG00000000457 chr1 169849631-169894267 - | ENSG00000000457
## ENSG00000000460 chr1 169662007-169854080 + | ENSG00000000460
## ... ... ... ... . ...
## ENSG00000281904 chr2 90365737-90367699 + | ENSG00000281904
## ENSG00000281909 chr15 22480439-22484840 - | ENSG00000281909
## ENSG00000281910 chr16 58559796-58559931 - | ENSG00000281910
## ENSG00000281912 chr1 45303910-45305619 + | ENSG00000281912
## ENSG00000281920 chr2 65623272-65628424 + | ENSG00000281920
## external_gene_name original_ensembl_gene_id
## <character> <character>
## ENSG00000000003 TSPAN6 ENSG00000000003.13
## ENSG00000000005 TNMD ENSG00000000005.5
## ENSG00000000419 DPM1 ENSG00000000419.11
## ENSG00000000457 SCYL3 ENSG00000000457.12
## ENSG00000000460 C1orf112 ENSG00000000460.15
## ... ... ...
## ENSG00000281904 AC233263.6 ENSG00000281904.1
## ENSG00000281909 HERC2P7 ENSG00000281909.1
## ENSG00000281910 SNORA50A ENSG00000281910.1
## ENSG00000281912 LINC01144 ENSG00000281912.1
## ENSG00000281920 AC007389.5 ENSG00000281920.1
## -------
## seqinfo: 24 sequences from an unspecified genome; no seqlengths
LS0tCnRpdGxlOiAiUk5BLXNlcSBkYXRhIC0gY2hlY2tpbmcgbm9uIFRDR0EvVEFSR0VUIHByb2plY3RzIgpkYXRlOiAiYHIgU3lzLkRhdGUoKWAiCm91dHB1dDoKICBybWFya2Rvd246Omh0bWxfZG9jdW1lbnQ6CiAgICB0aGVtZTogbHVtZW4KICAgIGhpZ2hsaWdodDogemVuYnVybgogICAgdG9jOiB0cnVlCiAgICBudW1iZXJfc2VjdGlvbnM6IHRydWUKICAgIGRmX3ByaW50OiBwYWdlZAogICAgY29kZV9kb3dubG9hZDogdHJ1ZQogICAgdG9jX2Zsb2F0OgogICAgICBjb2xsYXBzZWQ6IHllcwogICAgdG9jX2RlcHRoOiAzCmVkaXRvcl9vcHRpb25zOgogIGNodW5rX291dHB1dF90eXBlOiBpbmxpbmUgICAgCi0tLQoKYGBge3IsIGluY2x1ZGU9RkFMU0V9CmxpYnJhcnkoa25pdHIpCmRldnRvb2xzOjpsb2FkX2FsbCgifi9Eb2N1bWVudHMvcGFja2FnZXMvVENHQWJpb2xpbmtzLyIpCmxpYnJhcnkoZHBseXIpCm9wdHNfa25pdCRzZXQocHJvZ3Jlc3MgPSBGQUxTRSwgdmVyYm9zZSA9IEZBTFNFLCBmaWcuYWxpZ24gPSAnY2VudGVyJykKb3B0c19jaHVuayRzZXQod2FybmluZyA9IEZBTFNFLCBtZXNzYWdlID0gRkFMU0UsIGVjaG8gPSBGQUxTRSkKCmtleHBhbmQuZGYgPC0gZnVuY3Rpb24oY2FwKSB7CiAgICBjYXQoCiAgICAgICAga25pdCh0ZXh0ID0ga25pdF9leHBhbmQodGV4dCA9ICBzcHJpbnRmKCJgYGB7ciAlc31cbiBkYXRhIFxuIGFzLmRhdGEuZnJhbWUoY29sRGF0YShkYXRhKSkgIFxuIGFzLmRhdGEuZnJhbWUoYXNzYXkoZGF0YSlbMTozLF0pIFxuIHJvd1JhbmdlcyhkYXRhKVxuIGBgYCIsY2FwKQogICAgICAgICkpCiAgICApCn0KYGBgCgojIEdEQyBwcm9qZWN0cwpgYGB7ciBjYXJzfQpwcm9qZWN0cyA8LSBnZXRHRENwcm9qZWN0cygpWyxjKDcsOSldCnByb2plY3RzW29yZGVyKHByb2plY3RzJHByb2plY3RfaWQpLF0KYGBgCgoKIyBIVFNlcSBjb3VudHMKCmBgYHtyLCBlY2hvPVRSVUUsIG1lc3NhZ2U9RkFMU0UsIHdhcm5pbmc9RkFMU0UscmVzdWx0cyA9ICJhc2lzIixmaWcuaGVpZ2h0PTEwfQojIHRoZSBmb2xsb3dpbmdwcm9qZWN0cyBkbyBub3QgaGF2ZSBSTkEtc2VxIGRhdGEgCiMgLSBWQVJFUE9QLUFQT0xMTwojIC0gRk0tQUQKIyAtIEJFQVRBTUwxLjAtQ1JFTk9MQU5JQgpwcm9qZWN0IDwtIGdyZXAoIlRDR0F8VEFSR0VUfFZBUkVQT1B8Rk0tQUR8Q1JFTk8iLHNvcnQoZ2V0R0RDcHJvamVjdHMoKSRwcm9qZWN0X2lkKSwKICAgICAgICAgICAgICAgIGludmVydCA9IFRSVUUsCiAgICAgICAgICAgICAgICB2YWx1ZSA9IFRSVUUpCmZvcihwcm9qIGluIHByb2plY3QpewogICAgY2F0KCJcblxuIyMgIiwgcHJvaiwiXG5cbiIpCiAgICB0cnlDYXRjaCh7CiAgICAgICAgcXVlcnkgPC0gR0RDcXVlcnkoCiAgICAgICAgICAgIHByb2plY3QgPSBwcm9qLAogICAgICAgICAgICBkYXRhLmNhdGVnb3J5ID0gIlRyYW5zY3JpcHRvbWUgUHJvZmlsaW5nIiwgCiAgICAgICAgICAgIGRhdGEudHlwZSA9ICJHZW5lIEV4cHJlc3Npb24g
UXVhbnRpZmljYXRpb24iLAogICAgICAgICAgICB3b3JrZmxvdy50eXBlID0gIkhUU2VxIC0gQ291bnRzIgogICAgICAgICkKICAgICAgICBxdWVyeSA8LSBHRENxdWVyeSgKICAgICAgICAgICAgcHJvamVjdCA9IHByb2osCiAgICAgICAgICAgIGRhdGEuY2F0ZWdvcnkgPSAiVHJhbnNjcmlwdG9tZSBQcm9maWxpbmciLCAKICAgICAgICAgICAgZGF0YS50eXBlID0gIkdlbmUgRXhwcmVzc2lvbiBRdWFudGlmaWNhdGlvbiIsCiAgICAgICAgICAgIHdvcmtmbG93LnR5cGUgPSAiSFRTZXEgLSBDb3VudHMiLAogICAgICAgICAgICBiYXJjb2RlID0gZ2V0UmVzdWx0cyhxdWVyeSkkY2FzZXNbMToxMF0gCiAgICAgICAgKQogICAgICAgIEdEQ2Rvd25sb2FkKHF1ZXJ5KQogICAgICAgIGludmlzaWJsZShjYXB0dXJlLm91dHB1dCgKICAgICAgICAgICAgZGF0YSA8LSBHRENwcmVwYXJlKHF1ZXJ5KQogICAgICAgICkpCiAgICAgICAga2V4cGFuZC5kZihwcm9qKQogICAgfSwgZXJyb3IgPSBmdW5jdGlvbihlKXsKICAgICAgICBtZXNzYWdlKGUpCiAgICB9KQogICAgY2F0KCJcblxuIikKfQpgYGAKCiMgU1RBUiBjb3VudHMKCmBgYHtyLCBlY2hvPVRSVUUsIG1lc3NhZ2U9RkFMU0UsIHdhcm5pbmc9RkFMU0UscmVzdWx0cyA9ICJhc2lzIixmaWcuaGVpZ2h0PTEwfQojIHRoZSBmb2xsb3dpbmdwcm9qZWN0cyBkbyBub3QgaGF2ZSBSTkEtc2VxIGRhdGEgCiMgLSBWQVJFUE9QLUFQT0xMTwojIC0gRk0tQUQKIyAtIEJFQVRBTUwxLjAtQ1JFTk9MQU5JQgpwcm9qZWN0IDwtIGMoIkNQVEFDLTMiLCJNTVJGLUNPTU1QQVNTIiwiVEFSR0VULU9TIiwiQ0dDSS1CTEdTUCIpCmZvcihwcm9qIGluIHByb2plY3QpewogICAgY2F0KCJcblxuIyMgIiwgcHJvaiwiXG5cbiIpCiAgICB0cnlDYXRjaCh7CiAgICAgICAgcXVlcnkgPC0gR0RDcXVlcnkoCiAgICAgICAgICAgIHByb2plY3QgPSBwcm9qLAogICAgICAgICAgICBkYXRhLmNhdGVnb3J5ID0gIlRyYW5zY3JpcHRvbWUgUHJvZmlsaW5nIiwgCiAgICAgICAgICAgIGRhdGEudHlwZSA9ICJHZW5lIEV4cHJlc3Npb24gUXVhbnRpZmljYXRpb24iLAogICAgICAgICAgICAgIHdvcmtmbG93LnR5cGUgPSAiU1RBUiAtIENvdW50cyIKICAgICAgICApCiAgICAgICAgcXVlcnkgPC0gR0RDcXVlcnkoCiAgICAgICAgICAgIHByb2plY3QgPSBwcm9qLAogICAgICAgICAgICBkYXRhLmNhdGVnb3J5ID0gIlRyYW5zY3JpcHRvbWUgUHJvZmlsaW5nIiwgCiAgICAgICAgICAgIGRhdGEudHlwZSA9ICJHZW5lIEV4cHJlc3Npb24gUXVhbnRpZmljYXRpb24iLAogICAgICAgICAgICAgIHdvcmtmbG93LnR5cGUgPSAiU1RBUiAtIENvdW50cyIsCiAgICAgICAgICAgIGJhcmNvZGUgPSBnZXRSZXN1bHRzKHF1ZXJ5KSRjYXNlc1sxOjRdIAogICAgICAgICkKICAgICAgICBHRENkb3dubG9hZChxdWVyeSkKICAgICAgICBpbnZpc2libGUoY2FwdHVyZS5vdXRwdXQoCiAgICAgICAgICAgIGRhdGEgPC0gR0RDcHJlcGFyZShxdWVyeSkKICAg
ICAgICApKQogICAgICAgIGtleHBhbmQuZGYocGFzdGUwKCJTVEFSVCBjb3VudHMgLSAiLCBwcm9qKSkKICAgIH0sIGVycm9yID0gZnVuY3Rpb24oZSl7CiAgICAgICAgbWVzc2FnZShlKQogICAgfSkKICAgIGNhdCgiXG5cbiIpCn0KYGBgCg==