Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Download TCGA-GBM gene-expression counts from GDC and preview them.
# Requires TCGAbiolinks (GDCquery/GDCdownload/GDCprepare),
# SummarizedExperiment (assay) and DT (datatable) to be attached.

# Describe the files to fetch. No trailing comma after the last argument:
# a dangling comma passes an extra, empty argument to the call.
# NOTE(review): newer GDC data releases appear to serve "STAR - Counts"
# instead of "HTSeq - Counts" -- confirm this workflow is still available.
query <- GDCquery(
  project = "TCGA-GBM",
  data.category = "Transcriptome Profiling",
  data.type = "Gene Expression Quantification",
  workflow.type = "HTSeq - Counts"
)

# Fetch the files matched by the query using the GDC client transfer method.
GDCdownload(query, method = "client")

# Assemble the downloaded files into a single object.
data <- GDCprepare(query)

# Show up to the first 100 rows of the assay matrix in an interactive table.
# head() is used instead of [1:100, ] so that a matrix with fewer than 100
# rows does not raise "subscript out of bounds".
datatable(
  head(assay(data), 100),
  options = list(scrollX = TRUE, keys = TRUE, pageLength = 5),
  rownames = TRUE
)
- ENSG00000000003 TSPAN6 ENSG00000000003.13
- ENSG00000000005 TNMD ENSG00000000005.5
- ENSG00000000419 DPM1 ENSG00000000419.11
- ENSG00000000457 SCYL3 ENSG00000000457.12
- ENSG00000000460 C1orf112 ENSG00000000460.15
import gseapy

# Read the gene list, one entry per line. readlines() would keep the trailing
# newline on every entry (and keep blank lines), so strip each line and drop
# the empty ones before submitting.
with open('Genelist.txt', 'r') as f:
    reflist = [line.strip() for line in f if line.strip()]

# NOTE(review): Enrichr matches on gene symbols. If Genelist.txt holds several
# columns per line (e.g. Ensembl ID, symbol, versioned ID), only the symbol
# column should be passed here -- TODO confirm the file layout.
gseapy.enrichr(gene_list=reflist, description='pathway',
               gene_sets='KEGG_2016', outdir='test', cutoff=0.05)
- Term Overlap P-value AdjustedP value Z-score Combined Score Genes
- Cyanoamino acid metabolism_Homo sapiens_hsa00460 7/7 0.58570 0.66370 56.420294 -23.12773 GGT5 GGT7 GGT6 SHMT2 SHMT1 GGT1 GBA3
- Caffeine metabolism_Homo sapiens_hsa00232 5/5 0.60707 0.66370 58.0237 -23.7850 CYP2A6 NAT1 NAT2 CYP1A2 XDH
- Butirosin and neomycin biosynthesis_Homo sapiens_hsa00524 5/5 0.60707 0.6637 79.4520 -32.5688 HK3 HKDC1 GCK HK2 HK1
Add Comment
Please, Sign In to add comment