Skip to content

Commit

Permalink
Added a test case for the new abs_max collapse mode
Browse files Browse the repository at this point in the history
  • Loading branch information
davideby committed Dec 2, 2021
1 parent 60b948c commit 12665cf
Show file tree
Hide file tree
Showing 2 changed files with 51 additions and 1 deletion.
Original file line number Diff line number Diff line change
@@ -0,0 +1,50 @@
# Copyright (c) 2003-2021 Broad Institute, Inc., Massachusetts Institute of Technology, and Regents of the University of California. All rights reserved.
#module: urn:lsid:broad.mit.edu:cancer.software.genepattern.module.analysis:00072:20
module: GSEA
name: GSEA collapse_NaN_Missing_abs_max_test
description: Test the GSEA 'collapse dataset' function handling Infinite, NaN and Missing values, collapse to absolute max of probes. Tests are centered on HTR4, HTR6, FLJ22639, HTR7, NPAL2, NPAL3, GSTK1, BCR.
params:
expression.dataset: "<%gpunit.testData%>gpunit/GSEA/v20/input/Diabetes_hgu133a_NaN_missing_vals.gct"
gene.sets.database: [ "<%gpunit.testData%>gpunit/GSEA/v20/input/c1.symbols.reduced.gmt" ]
number.of.permutations: "10"
# Uses P53_6samples.cls because it happens to have a reasonable class template for this use
phenotype.labels: "<%gpunit.testData%>gpunit/GSEA/v20/input/P53_6samples.cls"
target.profile: ""
permutation.type: "phenotype"
collapse.dataset: "Collapse"
chip.platform.file: "<%gpunit.testData%>gpunit/GSEA/v20/input/HG_U133A.chip"
# Modifying the ZIP name here so that the diffCmd can find the RNK inside. We could modify the diffCmd
# to be able to find it, but that makes the code somewhat complicated.
output.file.name: "Diabetes_hgu133a_NaN_missing_vals_collapsed_to_symbols.zip"
scoring.scheme: "weighted"
metric.for.ranking.genes: "Signal2Noise"
gene.list.sorting.mode: "real"
gene.list.ordering.mode: "descending"
max.gene.set.size: "500"
min.gene.set.size: "15"
collapsing.mode.for.probe.sets.with.more.than.one.match: "Abs_max_of_probes"
normalization.mode: "meandiv"
randomization.mode: "no_balance"
omit.features.with.no.symbol.match: "true"
median.for.class.metrics: "false"
number.of.markers: "100"
# Note that we use a fixed random seed rather than the 'timestamp' default so that we'll have reproducible test results
random.seed: "149"
create.svgs: "false"
create.gcts: "true"
save.random.ranked.lists: "false"
plot.graphs.for.the.top.sets.of.each.phenotype: "20"
make.detailed.gene.set.report: "false"
selected.gene.sets: ""
dev.mode: "true"
alt.delim: ""
create.zip: "true"
assertions:
jobStatus: success
files:
"Diabetes_hgu133a_NaN_missing_vals_collapsed_to_symbols.zip":
diffCmd: ../diffGseaResults.sh
diff: "<%gpunit.resultData%>gpunit/GSEA/v20/output/collapse/collapse_NaN_Missing_abs_max_test/Diabetes_hgu133a_NaN_missing_vals_collapsed_to_symbols.zip"
"stdout.txt":
diffCmd: ../grepMessages.sh
diff: "<%gpunit.resultData%>gpunit/GSEA/v20/output/collapse/collapse_NaN_Missing_abs_max_test/stdoutMatches.txt"
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
#module: urn:lsid:broad.mit.edu:cancer.software.genepattern.module.analysis:00072:20
module: GSEA
name: GSEA collapse_NaN_Missing_max_test
description: Test the GSEA 'collapse dataset' function handling NaN and Missing values, collapse to max of probes. Tests are centered on HTR4, HTR7, NPAL2, NPAL3, GSTK1.
description: Test the GSEA 'collapse dataset' function handling Infinite, NaN and Missing values, collapse to max of probes. Tests are centered on HTR4, HTR6, FLJ22639, HTR7, NPAL2, NPAL3, GSTK1, BCR.
params:
expression.dataset: "<%gpunit.testData%>gpunit/GSEA/v20/input/Diabetes_hgu133a_NaN_missing_vals.gct"
gene.sets.database: [ "<%gpunit.testData%>gpunit/GSEA/v20/input/c1.symbols.reduced.gmt" ]
Expand Down

0 comments on commit 12665cf

Please sign in to comment.