Mercurial > repos > vijay > pancancer_targene_cell_line_predictions
comparison targene_cell_line_predictions.xml @ 0:872aab514d37 draft default tip
"planemo upload for repository http://github.com/nvk747/papaa/galaxy/ commit 954b283ef7f82f59f55476a4b3a230d655187ac1"
author | vijay |
---|---|
date | Wed, 16 Dec 2020 23:30:22 +0000 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:872aab514d37 |
---|---|
1 <tool id="pancancer_targene_cell_line_predictions" name="PAPAA: PanCancer targene cell line predictions" version="@VERSION@"> | |
2 <description>targene status in ccle cell lines </description> | |
3 <macros> | |
4 <import>macros.xml</import> | |
5 </macros> | |
6 <expand macro="requirements"/> | |
7 <expand macro="stdio"/> | |
8 <version_command><![CDATA['papaa_targene_cell_line_predictions.py' --version]]></version_command> | |
9 <command><![CDATA[ | |
10 mkdir 'classifier' && | |
11 mkdir -p 'classifier/figures' && | |
12 mkdir -p 'classifier/figures/cell_line' && | |
13 mkdir -p 'classifier/tables' && | |
14 mkdir -p 'classifier/results' && | |
15 ln -s '${classifier_summary}' 'classifier/classifier_summary.txt' && | |
16 ln -s '${pancan_classifier_coefficients}' 'classifier/classifier_coefficients.tsv' && | |
17 ln -s '${nucleotide_mutation_scores}' 'classifier/tables/nucleotide_mutation_scores.tsv' && | |
18 ln -s '${amino_acid_mutation_scores}' 'classifier/tables/amino_acid_mutation_scores.tsv' && | |
19 papaa_targene_cell_line_predictions.py | |
20 --classifier_summary 'classifier' | |
21 #if $targenes and str($targenes): | |
22 --targenes '$targenes' | |
23 #end if | |
24 #if $path_genes and str($path_genes): | |
25 --path_genes '$path_genes' | |
26 #end if | |
27 #if $ccle_rnaseq and $ccle_rnaseq is not None: | |
28 --ccle_rnaseq '$ccle_rnaseq' | |
29 #end if | |
30 #if $ccle_mut and $ccle_mut is not None: | |
31 --ccle_mut '$ccle_mut' | |
32 #end if | |
33 #if $ccle_maf and $ccle_maf is not None: | |
34 --ccle_maf '$ccle_maf' | |
35 #end if | |
36 #if $gdsc_rnaseq and $gdsc_rnaseq is not None: | |
37 --gdsc_rnaseq '$gdsc_rnaseq' | |
38 #end if | |
39 #if $gdsc_mut and $gdsc_mut is not None: | |
40 --gdsc_mut '$gdsc_mut' | |
41 #end if | |
42 #if $gdsc1_phar and $gdsc1_phar is not None: | |
43 --gdsc1_phar '$gdsc1_phar' | |
44 #end if | |
45 #if $gdsc2_phar and $gdsc2_phar is not None: | |
46 --gdsc2_phar '$gdsc2_phar' | |
47 #end if | |
48 > '${log}' | |
49 ]]> | |
50 </command> | |
51 <inputs> | |
52 <param argument="--classifier_summary" label="Classifier data" name="classifier_summary" optional="false" type="data" format="txt" help="classifer_summary.txt"/> | |
53 <param label="pancancer classifier coefficients" name="pancan_classifier_coefficients" optional="false" type="data" format="tabular" help="classifier_coefficients.tsv"/> | |
54 <param label="nucleotide mutation scores" name="nucleotide_mutation_scores" optional="false" type="data" format="tabular" help="nucleotide_mutation_scores.tsv"/> | |
55 <param label="amino acid mutation scores" name="amino_acid_mutation_scores" optional="false" type="data" format="tabular" help="amino_acid_mutation_scores.tsv"/> | |
56 <param argument="--targenes" label="Comma separated string of HUGO targene symbols" name="targenes" optional="False" type="text" value="ERBB2_MUT,PIK3CA_MUT,KRAS_MUT,AKT1_MUT"/> | |
57 <param argument="--path_genes" label="string of the genes to extract or genelist file" name="path_genes" optional="true" type= "data" format="txt"/> | |
58 <param argument="--ccle_rnaseq" label="Filename ccle rnaseq data" name="ccle_rnaseq" optional="false" type="data" format="tabular" help="data/ccle_rnaseq_genes_rpkm_20180929_mod.tsv"/> | |
59 <param argument="--ccle_mut" label="Filename ccle mutational data" name="ccle_mut" optional="true" type="data" format="txt" help="data/CCLE_MUT_CNA_AMP_DEL_binary_Revealer.gct"/> | |
60 <param argument="--ccle_maf" label="Filename ccle variant data" name="ccle_maf" optional="true" type="data" format="txt" help="data/CCLE_DepMap_18Q1_maf_20180207.txt" /> | |
61 <param argument="--gdsc_rnaseq" label="Filename gdsc rnaseq data" name="gdsc_rnaseq" optional="false" type="data" format="tabular" help="data/GDSC_EXP_CCLE_converted_name.tsv"/> | |
62 <param argument="--gdsc_mut" label="Filename gdsc mutational data" name="gdsc_mut" optional="true" type="data" format="tabular" help="data/GDSC_CCLE_common_mut_cnv_binary.tsv"/> | |
63 <param argument="--gdsc1_phar" label="Filename for gdsc1 pharmacological data file" name="gdsc1_phar" optional="false" type="data" format="txt" help="data/gdsc1_ccle_pharm_fitted_dose_data.txt"/> | |
64 <param argument="--gdsc2_phar" label="Filename for gdsc2 pharmacological data file" name="gdsc2_phar" optional="false" type="data" format="txt" help="data/gdsc2_ccle_pharm_fitted_dose_data.txt"/> | |
65 </inputs> | |
66 <outputs> | |
67 <data format="txt" name="log" label="${tool.name} on ${on_string} (Log)"/> | |
68 <data format="png" name="ccle_histogram" label="${tool.name} on ${on_string} (ccle_histogram.png)" from_work_dir="classifier/figures/ccle_histogram.png"/> | |
69 <data format="tabular" name="ccle_targene_classifier_scores" label="${tool.name} on ${on_string} (ccle_targene_classifier_scores.tsv)" from_work_dir="classifier/tables/ccle_targene_classifier_scores.tsv"/> | |
70 <data format="pdf" name="ccle_targene_WT_MUT_predictions" label="${tool.name} on ${on_string} (ccle_targene_WT_MUT_predictions.pdf)" from_work_dir="classifier/figures/cell_line/ccle_targene_WT_MUT_predictions.pdf"/> | |
71 <data format="csv" name="updated_data_nucleotide_scores" label="${tool.name} on ${on_string} (updated_data_nucleotide_scores.csv)" from_work_dir="classifier/tables/updated_data_nucleotide_scores.csv"/> | |
72 <data format="csv" name="updated_data_aminoacid_scores" label="${tool.name} on ${on_string} (updated_data_aminoacid_scores.csv)" from_work_dir="classifier/tables/updated_data_aminoacid_scores.csv"/> | |
73 <data format="png" name="gdsc_scores_histogram" label="${tool.name} on ${on_string} (gdsc_scores_histogram.png)" from_work_dir="classifier/figures/gdsc_scores_histogram.png"/> | |
74 <data format="tabular" name="gdsc_targene_classifier_scores" label="${tool.name} on ${on_string} (gdsc_targene_classifier_scores.tsv)" from_work_dir="classifier/tables/gdsc_targene_classifier_scores.tsv"/> | |
75 <data format="pdf" name="gdsc_targene_WT_MUT_predictions" label="${tool.name} on ${on_string} (gdsc_targene_WT_MUT_predictions.pdf)" from_work_dir="classifier/figures/cell_line/gdsc_targene_WT_MUT_predictions.pdf"/> | |
76 <data format="tabular" name="gdsc1_targene_pharmacology_predictions" label="${tool.name} on ${on_string} (gdsc1_targene_pharmacology_predictions.tsv)" from_work_dir="classifier/tables/gdsc1_targene_pharmacology_predictions.tsv"/> | |
77 <data format="tabular" name="gdsc2_targene_pharmacology_predictions" label="${tool.name} on ${on_string} (gdsc2_targene_pharmacology_predictions.tsv)" from_work_dir="classifier/tables/gdsc2_targene_pharmacology_predictions.tsv"/> | |
78 <data format="tabular" name="gdsc1_ccle_targene_pharmacology_predictions" label="${tool.name} on ${on_string} (gdsc1_ccle_targene_pharmacology_predictions.tsv)" from_work_dir="classifier/tables/gdsc1_ccle_targene_pharmacology_predictions.tsv"/> | |
79 <data format="tabular" name="gdsc2_ccle_targene_pharmacology_predictions" label="${tool.name} on ${on_string} (gdsc2_ccle_targene_pharmacology_predictions.tsv)" from_work_dir="classifier/tables/gdsc2_ccle_targene_pharmacology_predictions.tsv"/> | |
80 </outputs> | |
81 <tests> | |
82 <test> | |
83 <param name="classifier_summary" value="classifier_summary.txt" ftype="txt"/> | |
84 <param name="pancan_classifier_coefficients" value="classifier_coefficients.tsv" ftype="tabular"/> | |
85 <param name="nucleotide_mutation_scores" value="nucleotide_mutation_scores.tsv" ftype="tabular"/> | |
86 <param name="amino_acid_mutation_scores" value="amino_acid_mutation_scores.tsv" ftype="tabular"/> | |
87 <param name="targenes" value="ERBB2_MUT,PIK3CA_MUT,KRAS_MUT,AKT1_MUT"/> | |
88 <param name="path_genes" value="path_genes.txt" ftype="txt"/> | |
89 <param name="ccle_rnaseq" value="ccle_rnaseq_genes_rpkm_20180929_mod_t5p.tsv.gz" ftype="tabular"/> | |
90 <param name="ccle_mut" value="CCLE_MUT_CNA_AMP_DEL_binary_Revealer.gct.gz" ftype="tabular"/> | |
91 <param name="ccle_maf" value="CCLE_DepMap_18Q1_maf_20180207_t1p.txt.gz" ftype="txt"/> | |
92 <param name="gdsc_rnaseq" value="GDSC_EXP_CCLE_converted_name_t10p.tsv.gz" ftype="tabular"/> | |
93 <param name="gdsc_mut" value="GDSC_CCLE_common_mut_cnv_binary.tsv.gz" ftype="tabular"/> | |
94 <param name="gdsc1_phar" value="gdsc1_ccle_pharm_fitted_dose_data_t10p.txt.gz" ftype="txt"/> | |
95 <param name="gdsc2_phar" value="gdsc2_ccle_pharm_fitted_dose_data_t10p.txt.gz" ftype="txt"/> | |
96 <output name="log" file="targene_cell_line_predictions_Log.txt" lines_diff="2"/> | |
97 <output name="ccle_histogram" file="ccle_histogram.png" compare="sim_size" delta="50"/> | |
98 <output name="ccle_targene_classifier_scores" file="ccle_targene_classifier_scores.tsv" /> | |
99 <output name="ccle_targene_WT_MUT_predictions" file="ccle_targene_WT_MUT_predictions.pdf" compare="sim_size" delta="100"/> | |
100 <output name="updated_data_nucleotide_scores" file="updated_data_nucleotide_scores.csv" /> | |
101 <output name="updated_data_aminoacid_scores" file="updated_data_aminoacid_scores.csv" /> | |
102 <output name="gdsc_scores_histogram" file="gdsc_scores_histogram.png" /> | |
103 <output name="gdsc_targene_classifier_scores" file="gdsc_targene_classifier_scores.tsv" /> | |
104 <output name="gdsc_targene_WT_MUT_predictions" file="gdsc_targene_WT_MUT_predictions.pdf" compare="sim_size" delta="50"/> | |
105 <output name="gdsc1_targene_pharmacology_predictions"> | |
106 <assert_contents> | |
107 <has_line line="	GDSC1_cell_line	NLME_CURVE_ID	COSMIC_ID	SANGER_MODEL_ID	TCGA_DESC	DRUG_ID	Compound	PUTATIVE_TARGET	PATHWAY_NAME	MIN_CONC	MAX_CONC	LN_IC50	AUC	RMSE	Z_SCORE	tissue	ERBB2_MUT	PIK3CA_MUT	KRAS_MUT	AKT1_MUT	targene_status	weight	sample_name	predictions" /> | |
108 <has_n_columns n="25" /> | |
109 <has_n_lines n="10281" /> | |
110 </assert_contents> | |
111 </output> | |
112 <output name="gdsc2_targene_pharmacology_predictions"> | |
113 <assert_contents> | |
114 <has_line line="	GDSC1_cell_line	NLME_CURVE_ID	COSMIC_ID	SANGER_MODEL_ID	TCGA_DESC	DRUG_ID	Compound	PUTATIVE_TARGET	PATHWAY_NAME	MIN_CONC	MAX_CONC	LN_IC50	AUC	RMSE	Z_SCORE	tissue	ERBB2_MUT	PIK3CA_MUT	KRAS_MUT	AKT1_MUT	targene_status	weight	sample_name	predictions" /> | |
115 <has_n_columns n="25" /> | |
116 <has_n_lines n="10281" /> | |
117 </assert_contents> | |
118 </output> | |
119 <output name="gdsc1_ccle_targene_pharmacology_predictions" file="gdsc1_ccle_targene_pharmacology_predictions.tsv" /> | |
120 <output name="gdsc2_ccle_targene_pharmacology_predictions" file="gdsc2_ccle_targene_pharmacology_predictions.tsv" /> | |
121 </test> | |
122 </tests> | |
123 <help><![CDATA[ | |
124 | |
125 **Pancancer_Aberrant_Pathway_Activity_Analysis scripts/viz/papaa_targene_cell_line_predictions_mod.py:** | |
126 | |
127 **Inputs:** | |
128 --targenes comma separated string of HUGO symbols for target genes or targenes_list.csv file | |
129 --path_genes comma separated string of HUGO symbols for all genes in the target pathway or path_genes.txt file | |
130 --classifier_summary String of the location of classifier_summary file | |
131 --ccle_rnaseq Filename of CCLE gene expression data file | |
132 --ccle_mut Filename of CCLE cell lines/gene mutations data file | |
133 --ccle_maf Filename of CCLE mutational variant level data file | |
134 --gdsc_rnaseq Filename of GDSC gene expression data file | |
135 --gdsc_mut Filename of GDSC cell lines/gene mutations data file | |
136 --gdsc1_phar Filename of GDSC1 pharmacological response data | |
137 --gdsc2_phar Filename of GDSC2 pharmacological response data | |
138 | |
139 **Outputs:** | |
140 Generate predictions for CCLE data using targene classifier(ccle_histogram.png) | |
141 | |
142 Generate classifier scores for CCLE cell lines and combines CCLE mutational data and variant data with classifier scores (ccle_targene_classifier_scores.tsv) | |
143 | |
144 Performs t-test on classifier weights across targene mutant vs targene wildtype cell-line groups(ccle_targene_WT_MUT_predictions.pdf) | |
145 | |
146 Add CCLE nucleotide scores at variant level and update nucleotide_mutation_scores.tsv (updated_data_nucleotide_scores.csv) | |
147 | |
148 Add CCLE protein scores at variant level and update aminoacid_mutation_scores.tsv (updated_data_aminoacid_scores.csv) | |
149 | |
150 Generate predictions for GDSC data using targene classifier(gdsc_scores_histogram.png) | |
151 | |
152 Generate classifier scores for GDSC cell lines and combines CCLE mutational data and variant data with classifier scores (gdsc_targene_classifier_scores.tsv) | |
153 | |
154 Performs t-test on classifier weights across targene mutant vs targene wildtype cell-line groups(gdsc_targene_WT_MUT_predictions.pdf) | |
155 | |
156 Apply GDSC classifier scores to evaluate GDSC1 pharmacological data response(gdsc1_targene_pharmacology_predictions.tsv) | |
157 | |
158 Apply GDSC classifier scores to evaluate GDSC2 pharmacological data response(gdsc2_targene_pharmacology_predictions.tsv) | |
159 | |
160 Apply CCLE classifier scores to evaluate GDSC1 pharmacological data response(gdsc1_ccle_targene_pharmacology_predictions.tsv) | |
161 | |
162 Apply CCLE classifier scores to evaluate GDSC2 pharmacological data response(gdsc2_ccle_targene_pharmacology_predictions.tsv) ]]> | |
163 </help> | |
164 <expand macro="citations" /> | |
165 </tool> |