# Identifying which gene sets are enriched in TCGA samples where FZD7 is overexpressed

<div class="alert alert-info">
<p class="lead"> Instructions <i class="fa fa-info-circle"></i></p>
Run all cells (in order) in this notebook if you want to create the GSEA figure from "A FZD7-specific antibody-drug conjugate induces tumor regression in preclinical models" / "Targeting solid tumors with a FZD7-specific antibody-drug conjugate" / "Targeting FZD7".
</div>

<div class="well well-sm">
The GenePattern jobs have been pre-run, and their results should be available after you log in.
</div>

In [8]:
# Requires GenePattern Notebook: pip install genepattern-notebook
import gp
import genepattern

# Register a session against the public GenePattern cloud server and show the
# login widget. The username and password arguments are deliberately left as
# empty strings (credentials removed for security reasons).
gp_cloud_session = genepattern.session.register(
    "https://cloud.genepattern.org/gp",
    "",
    "",
)
genepattern.display(gp_cloud_session)

GPAuthWidget()

# OV

In [9]:
# OV, step 1: sample-selection task for FZD7 in the TCGA "OV" collection.
# The job spec is populated here but not submitted in this cell; the job
# displayed at the end (347659) is a previously completed run.
tcga_sampleselection_task = gp.GPTask(
    genepattern.session.get(0),
    'urn:lsid:genepattern.org:module.analysis:00417',
)
tcga_sampleselection_job_spec = tcga_sampleselection_task.make_job_spec()

# Parameters are applied in the order listed.
ov_selection_params = (
    ("TCGA.Collection", "OV"),
    ("Gene.Symbol", "FZD7"),
    ("High.Expression", "1"),
    ("Low.Expression", "-1"),
    ("Output.Type", "scaled_estimate"),
    ("MSigDB.Version", "7.2"),
    ("job.memory", "4 Gb"),
    ("job.queue", "gp-cloud-default"),
    ("job.cpuCount", "1"),
    ("job.walltime", "02:00:00"),
)
for param_name, param_value in ov_selection_params:
    tcga_sampleselection_job_spec.set_parameter(param_name, param_value)
genepattern.display(tcga_sampleselection_task)

# Attach to the existing job by number and render its widget.
job347659 = gp.GPJob(genepattern.session.get(0), 347659)
genepattern.display(job347659)

GPTaskWidget(lsid='urn:lsid:genepattern.org:module.analysis:00417')

GPJobWidget(job_number=347659)

In [10]:
# OV, step 2: ssGSEA task. Its input GCT is read from the results of job
# 347659, and it uses the v7.4 "h.all" and "c6.all" gene set files.
ssgsea_task = gp.GPTask(
    genepattern.session.get(0),
    'urn:lsid:broad.mit.edu:cancer.software.genepattern.module.analysis:00270',
)
ssgsea_job_spec = ssgsea_task.make_job_spec()

# Parameters are applied in the order listed.
ov_ssgsea_params = (
    ("input.gct.file", "https://cloud.genepattern.org/gp/jobResults/347659/TCGA_OV_FZD7_HIGH_stdev_greater_than_1_vs_LOW_stdev_less_than_neg_1.TPM.gct"),
    ("output.file.prefix", ""),
    ("gene.sets.database.files", [
        "ftp://gpftp.broadinstitute.org/module_support_files/msigdb/gmt/h.all.v7.4.symbols.gmt",
        "ftp://gpftp.broadinstitute.org/module_support_files/msigdb/gmt/c6.all.v7.4.symbols.gmt",
    ]),
    ("gene.symbol.column", "Name"),
    ("gene.set.selection", "ALL"),
    ("sample.normalization.method", "none"),
    ("weighting.exponent", "0.75"),
    ("min.gene.set.size", "10"),
    ("combine.mode", "combine.add"),
    ("job.memory", "2 Gb"),
    ("job.queue", "gp-new-beta"),
    ("job.cpuCount", "1"),
    ("job.walltime", "02:00:00"),
)
for param_name, param_value in ov_ssgsea_params:
    ssgsea_job_spec.set_parameter(param_name, param_value)
genepattern.display(ssgsea_task)

# Attach to the existing job by number and render its widget.
job347663 = gp.GPJob(genepattern.session.get(0), 347663)
genepattern.display(job347663)

GPTaskWidget(lsid='urn:lsid:broad.mit.edu:cancer.software.genepattern.module.analysis:00270')

GPJobWidget(job_number=347663)

In [11]:
# OV, step 3: ROC task on the ssGSEA projection. PROJ.gct is read from the
# results of job 347663 and the CLS file from the results of job 347659.
ssgsea_roc_task = gp.GPTask(
    genepattern.session.get(0),
    'urn:lsid:8080.gpserver.ip-172-31-26-71.ip-172-31-26-71.ec2.internal:genepatternmodules:177',
)
ssgsea_roc_job_spec = ssgsea_roc_task.make_job_spec()

# Parameters are applied in the order listed.
ov_roc_params = (
    ("PROJ.gct", "https://cloud.genepattern.org/gp/jobResults/347663/TCGA_OV_FZD7_HIGH_stdev_greater_than_1_vs_LOW_stdev_less_than_neg_1.TPM.PROJ.gct"),
    ("CLS", "https://cloud.genepattern.org/gp/jobResults/347659/TCGA_OV_FZD7_HIGH_stdev_greater_than_1_vs_LOW_stdev_less_than_neg_1.cls"),
    ("Reverse", "FALSE"),
    ("Plot.Top.Results", "20"),
    ("job.memory", "2 Gb"),
    ("job.queue", "gp-new-beta"),
    ("job.cpuCount", "1"),
    ("job.walltime", "02:00:00"),
)
for param_name, param_value in ov_roc_params:
    ssgsea_roc_job_spec.set_parameter(param_name, param_value)
genepattern.display(ssgsea_roc_task)

# Attach to the existing job by number and render its widget.
job347667 = gp.GPJob(genepattern.session.get(0), 347667)
genepattern.display(job347667)

GPTaskWidget(lsid='urn:lsid:8080.gpserver.ip-172-31-26-71.ip-172-31-26-71.ec2.internal:genepatternmodules:177'…

GPJobWidget(job_number=347667)

# BRCA

In [12]:
# BRCA, step 1: sample-selection task for FZD7 in the TCGA "BRCA" collection.
# The job spec is populated here but not submitted in this cell; the job
# displayed at the end (347660) is a previously completed run.
tcga_sampleselection_task = gp.GPTask(
    genepattern.session.get(0),
    'urn:lsid:genepattern.org:module.analysis:00417',
)
tcga_sampleselection_job_spec = tcga_sampleselection_task.make_job_spec()

# Parameters are applied in the order listed.
brca_selection_params = (
    ("TCGA.Collection", "BRCA"),
    ("Gene.Symbol", "FZD7"),
    ("High.Expression", "1"),
    ("Low.Expression", "-1"),
    ("Output.Type", "scaled_estimate"),
    ("MSigDB.Version", "latest"),
    ("job.memory", "8Gb"),
    ("job.queue", "gp-cloud-default"),
    ("job.cpuCount", "1"),
    ("job.walltime", "02:00:00"),
)
for param_name, param_value in brca_selection_params:
    tcga_sampleselection_job_spec.set_parameter(param_name, param_value)
genepattern.display(tcga_sampleselection_task)

# Attach to the existing job by number and render its widget.
job347660 = gp.GPJob(genepattern.session.get(0), 347660)
genepattern.display(job347660)

GPTaskWidget(lsid='urn:lsid:genepattern.org:module.analysis:00417')

GPJobWidget(job_number=347660)

In [13]:
# BRCA, step 2: ssGSEA task. Its input GCT is read from the results of job
# 347660, and it uses the v7.4 "h.all" and "c6.all" gene set files.
ssgsea_task = gp.GPTask(
    genepattern.session.get(0),
    'urn:lsid:broad.mit.edu:cancer.software.genepattern.module.analysis:00270',
)
ssgsea_job_spec = ssgsea_task.make_job_spec()

# Parameters are applied in the order listed.
brca_ssgsea_params = (
    ("input.gct.file", "https://cloud.genepattern.org/gp/jobResults/347660/TCGA_BRCA_FZD7_HIGH_stdev_greater_than_1_vs_LOW_stdev_less_than_neg_1.TPM.gct"),
    ("output.file.prefix", ""),
    ("gene.sets.database.files", [
        "ftp://gpftp.broadinstitute.org/module_support_files/msigdb/gmt/h.all.v7.4.symbols.gmt",
        "ftp://gpftp.broadinstitute.org/module_support_files/msigdb/gmt/c6.all.v7.4.symbols.gmt",
    ]),
    ("gene.symbol.column", "Name"),
    ("gene.set.selection", "ALL"),
    ("sample.normalization.method", "none"),
    ("weighting.exponent", "0.75"),
    ("min.gene.set.size", "10"),
    ("combine.mode", "combine.add"),
    ("job.memory", "2 Gb"),
    ("job.queue", "gp-new-beta"),
    ("job.cpuCount", "1"),
    ("job.walltime", "02:00:00"),
)
for param_name, param_value in brca_ssgsea_params:
    ssgsea_job_spec.set_parameter(param_name, param_value)
genepattern.display(ssgsea_task)

# Attach to the existing job by number and render its widget.
job347666 = gp.GPJob(genepattern.session.get(0), 347666)
genepattern.display(job347666)

GPTaskWidget(lsid='urn:lsid:broad.mit.edu:cancer.software.genepattern.module.analysis:00270')

GPJobWidget(job_number=347666)

In [14]:
# BRCA, step 3: ROC task on the ssGSEA projection. PROJ.gct is read from the
# results of job 347666 and the CLS file from the results of job 347660.
ssgsea_roc_task = gp.GPTask(
    genepattern.session.get(0),
    'urn:lsid:8080.gpserver.ip-172-31-26-71.ip-172-31-26-71.ec2.internal:genepatternmodules:177',
)
ssgsea_roc_job_spec = ssgsea_roc_task.make_job_spec()

# Parameters are applied in the order listed.
brca_roc_params = (
    ("PROJ.gct", "https://cloud.genepattern.org/gp/jobResults/347666/TCGA_BRCA_FZD7_HIGH_stdev_greater_than_1_vs_LOW_stdev_less_than_neg_1.TPM.PROJ.gct"),
    ("CLS", "https://cloud.genepattern.org/gp/jobResults/347660/TCGA_BRCA_FZD7_HIGH_stdev_greater_than_1_vs_LOW_stdev_less_than_neg_1.cls"),
    ("Reverse", "FALSE"),
    ("Plot.Top.Results", "20"),
    ("job.memory", "4Gb"),
    ("job.queue", "gp-new-beta"),
    ("job.cpuCount", "1"),
    ("job.walltime", "02:00:00"),
)
for param_name, param_value in brca_roc_params:
    ssgsea_roc_job_spec.set_parameter(param_name, param_value)
genepattern.display(ssgsea_roc_task)

# Attach to the existing job by number and render its widget.
job347669 = gp.GPJob(genepattern.session.get(0), 347669)
genepattern.display(job347669)

GPTaskWidget(lsid='urn:lsid:8080.gpserver.ip-172-31-26-71.ip-172-31-26-71.ec2.internal:genepatternmodules:177'…

GPJobWidget(job_number=347669)