# HG changeset patch # User galaxyp # Date 1536353585 14400 # Node ID a018c44dc18bf90e95a3daa8b979e8c16e410977 # Parent f3027b8f28bd0ecfb1c6fd96cf3525ef301f5497 planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/cravatp_score_and_annotate commit d80e60ce74aabe64e131d560085af099d52b81cf-dirty diff -r f3027b8f28bd -r a018c44dc18b cravatp_submit.py --- a/cravatp_submit.py Thu Aug 16 12:28:29 2018 -0400 +++ b/cravatp_submit.py Fri Sep 07 16:53:05 2018 -0400 @@ -24,15 +24,12 @@ # initializes blank parameters chasm_classifier = '' probed_filename = None -intersected_only = False +all_intersect = False vcf_output = None analysis_type = None # # Testing Command -# python cravatp_submit.py test-data/Freebayes_two-variants.vcf GRCh38 -# test-data/variant.tsv test-data/gene.tsv test-data/noncoding.tsv -# test-data/error.tsv CHASM -—classifier Breast -—proBED -# test-data/MCF7_proBed.bed +# python cravatp_submit.py test-data/Freebayes_two-variants.vcf GRCh38 test-data/variant.tsv test-data/gene.tsv test-data/noncoding.tsv test-data/error.tsv CHASM -—classifier Breast -—proBED test-data/MCF7_proBed.bed parser = argparse.ArgumentParser() parser.add_argument('cravatInput',help='The filename of the input ' 'CRAVAT-formatted tabular file ' @@ -56,11 +53,8 @@ parser.add_argument('--proBED', help='The filename of the proBED file ' 'containing peptides with genomic ' 'coordinates') -parser.add_argument('--intersectOnly', help='Specifies whether to ' - 'analyze only variants ' - 'intersected between the ' - 'CRAVAT input and proBED ' - 'file') +parser.add_argument('--allIntersect', help='Specifies whether to ' + 'analyze all variants') parser.add_argument('--vcfOutput', help='The output filename of the ' 'intersected VCF file') @@ -78,8 +72,8 @@ chasm_classifier = args.classifier if args.proBED: probed_filename = args.proBED -if args.intersectOnly: - intersected_only = args.intersectOnly +if args.allIntersect: + all_intersect = args.allIntersect if args.vcfOutput: vcf_output = args.vcfOutput @@ -118,7 +112,7 @@ # proteogenomic input (proBED) file if the user specifies that they want # to only include intersected variants or if they want to receive the # intersected VCF as well. -if probed_filename and (vcf_output or intersected_only == 'true'): +if probed_filename and (vcf_output or all_intersect == 'false'): proBED = loadProBED() if not vcf_output: vcf_output = 'intersected_input.vcf' @@ -143,7 +137,7 @@ genpos <= pepposB): tsvout.writerow(row) break -if intersected_only == 'true': +if all_intersect == 'false': input_filename = vcf_output # sets up the parameters for submission to the CRAVAT API diff -r f3027b8f28bd -r a018c44dc18b cravatp_submit.xml --- a/cravatp_submit.xml Thu Aug 16 12:28:29 2018 -0400 +++ b/cravatp_submit.xml Fri Sep 07 16:53:05 2018 -0400 @@ -1,12 +1,12 @@ - + | Submits, intersects, checks for, and retrieves data for cancer annotation. - + - + - + @@ -110,8 +110,8 @@ - - + + @@ -121,6 +121,28 @@ + + + + + + + + + + + + + + + + + + + + + + @@ -202,29 +224,7 @@ - - - - - - - - - - - - - - - - - - - - - - - + @@ -240,6 +240,29 @@ + + + + + + + + + + + + + + + + + + + + + + + @@ -256,9 +279,10 @@ + - + @@ -290,6 +314,7 @@ ]]> + 10.1021/acs.jproteome.8b00404 10.1158/0008-5472.CAN-17-0338 10.1186/s13059-017-1377-x diff -r f3027b8f28bd -r a018c44dc18b test-data/error.tsv --- a/test-data/error.tsv Thu Aug 16 12:28:29 2018 -0400 +++ b/test-data/error.tsv Fri Sep 07 16:53:05 2018 -0400 @@ -1,9 +1,9 @@ #Input Errors Report -#2018-08-13 15:36:32.358464 +#2018-09-07 16:42:38.414856 #CRAVAT version: hybrid #Analysis done at http://www.cravat.us. -#Job Id: rsajulga_20180813_113614 -#Input file: Freebayes_two_variants.vcf +#Job Id: rsajulga_20180907_124216 +#Input file: Freebayes_one_variant.vcf #This report shows errors that occurred in the input. #Input coordinate: hg38 genomic. #CHASM classifier: Breast diff -r f3027b8f28bd -r a018c44dc18b test-data/gene.tsv --- a/test-data/gene.tsv Thu Aug 16 12:28:29 2018 -0400 +++ b/test-data/gene.tsv Fri Sep 07 16:53:05 2018 -0400 @@ -1,9 +1,9 @@ #Gene Level Annotation Report -#2018-08-13 15:36:32.359533 +#2018-09-07 16:42:38.415811 #CRAVAT version: hybrid #Analysis done at http://www.cravat.us. -#Job Id: rsajulga_20180813_113614 -#Input file: Freebayes_two_variants.vcf +#Job Id: rsajulga_20180907_124216 +#Input file: Freebayes_one_variant.vcf #This report shows analysis results at gene level. #The composite p-value (Stouffer's combined p-value) and composite FDR of a gene show how probable it is to get the same p-value distribution for the gene as that obtained from the input variants by chance. #hg38 genomic. @@ -11,5 +11,4 @@ #For more information on CRAVAT, visit http://www.cravat.us. HUGO symbol Number of variants Sequence ontology CGC driver class CGC inheritance CGC tumor types somatic CGC tumor types germline ClinVar disease identifier ClinVar XRef Occurrences in COSMIC COSMIC gene count (tissue) Number of samples with gene mutated CHASM gene score CHASM gene p-value CHASM gene FDR VEST gene score (non-silent) VEST gene p-value VEST gene FDR Protein 3D gene Has a mutation in a TCGA Mutation Cluster NCI pathway hits NCI pathway IDs NCI pathway names TARGET CGL driver class -CRABP2 1 MS 37 upper_aerodigestive_tract(3);large_intestine(9);stomach(4);soft_tissue(3);endometrium(4);lung(3);liver(2);skin(4);NS(1);prostate(1);bone(1);kidney(1);breast(1) 1 0.358 0.4176 1 ../MuPIT_Interactive?gm=chr1:156701052 0 -UPF1 1 MS 267 large_intestine(57);endometrium(18);lung(13);skin(45);meninges(1);kidney(9);thyroid(3);cervix(4);central_nervous_system(7);oesophagus(5);NS(4);upper_aerodigestive_tract(10);biliary_tract(2);stomach(15);soft_tissue(6);urinary_tract(12);breast(11);prostate(7);pancreas(7);haematopoietic_and_lymphoid_tissue(10);ovary(4);bone(2);liver(15) 1 0.63 0.0394 0.1 ../MuPIT_Interactive?gm=chr19:18856059 0 +UPF1 1 MS 267 large_intestine(57);endometrium(18);lung(13);skin(45);meninges(1);kidney(9);thyroid(3);cervix(4);central_nervous_system(7);oesophagus(5);NS(4);upper_aerodigestive_tract(10);biliary_tract(2);stomach(15);soft_tissue(6);urinary_tract(12);breast(11);prostate(7);pancreas(7);haematopoietic_and_lymphoid_tissue(10);ovary(4);bone(2);liver(15) 1 0.63 0.0394 1 ../MuPIT_Interactive?gm=chr19:18856059 0 diff -r f3027b8f28bd -r a018c44dc18b test-data/noncoding.tsv --- a/test-data/noncoding.tsv Thu Aug 16 12:28:29 2018 -0400 +++ b/test-data/noncoding.tsv Fri Sep 07 16:53:05 2018 -0400 @@ -1,9 +1,9 @@ #Non-coding Variant Report -#2018-08-13 15:36:32.354693 +#2018-09-07 16:42:38.411675 #CRAVAT version: hybrid #Analysis done at http://www.cravat.us. -#Job Id: rsajulga_20180813_113614 -#Input file: Freebayes_two_variants.vcf +#Job Id: rsajulga_20180907_124216 +#Input file: Freebayes_one_variant.vcf #This report shows analysis results at variant level. #hg38 genomic. #Breast diff -r f3027b8f28bd -r a018c44dc18b test-data/variant.tsv --- a/test-data/variant.tsv Thu Aug 16 12:28:29 2018 -0400 +++ b/test-data/variant.tsv Fri Sep 07 16:53:05 2018 -0400 @@ -1,13 +1,12 @@ #Variant Report -#2018-08-13 15:36:32.354483 +#2018-09-07 16:42:38.411479 #CRAVAT version: hybrid #Analysis done at http://www.cravat.us. -#Job Id: rsajulga_20180813_113614 -#Input file: Freebayes_two_variants.vcf +#Job Id: rsajulga_20180907_124216 +#Input file: Freebayes_one_variant.vcf #This report shows analysis results at variant level. #hg38 genomic. #Breast #For more information on CRAVAT, visit http://www.cravat.us. Input line ID Chromosome Position Strand Reference base(s) Alternate base(s) Sample ID HUGO symbol Sequence ontology Protein sequence change Reference peptide Variant peptide CHASM p-value CHASM FDR ClinVar COSMIC ID COSMIC variant count (tissue) Number of samples with variant dbSNP ESP6500 AF (average) gnomAD AF Total gnomAD AF African gnomAD AF American gnomAD AF Ashkenazi Jewish gnomAD AF East Asian gnomAD AF Finnish gnomAD AF Non-Finnish European gnomAD AF Other gnomAD AF South Asian GWAS NHLBI Key (GRASP) GWAS PMID (GRASP) GWAS Phenotype (GRASP) Protein 3D variant In TCGA Mutation Cluster ncRNA Class ncRNA Name Pseudogene Pseudogene Transcript Repeat Class Repeat Family Repeat Name TARGET 1000 Genomes AF UTR/Intron UTR/Intron Gene UTR/Intron All Transcript Phred VCF filters Zygosity Alternate reads Total reads Variant allele frequency CGL driver class S.O. transcript S.O. transcript strand S.O. all transcripts CGC driver class CGC inheritance CGC tumor types somatic CGC tumor types germline CHASM transcript CHASM score All transcripts CHASM results ClinVar disease identifier ClinVar XRef COSMIC transcript COSMIC protein change COSMIC variant count ESP6500 AF (European American) ESP6500 AF (African American) HGVS Genomic HGVS Protein HGVS Protein All NCI pathway hits NCI pathway IDs NCI pathway names -1 VAR516_unknown chr1 156701052 + C T unknown CRABP2 MS G24E 0.4176 1 0.0 4.07800406169e-06 2.98044825942e-05 ../MuPIT_Interactive?gm=chr1:156701052 0 122.853 . het 8 20 0.4 ENST00000368221.1 - *ENST00000368221.1:G24E(MS),ENST00000621784.4:G24E(MS),ENST00000368222.7:G24E(MS) ENST00000368221.1 0.358 *ENST00000368221.1:G24E(0.358:0.4176),ENST00000368222.7:G24E(0.358:0.4176),ENST00000621784.4:G24E(0.358:0.4176) 0 0 NC_000001.10:g.156701052C>T ENST00000368221.1:p.Gly24Glu *ENST00000368221.1:p.Gly24Glu,ENST00000621784.4:p.Gly24Glu,ENST00000368222.7:p.Gly24Glu 0 -2 VAR517_unknown chr19 18856059 + C T unknown UPF1 MS A571V EAIDSPVSFLALHNQIR EAIDSPVSFLVLHNQIR 0.0394 COSM3100527 large_intestine(1) 1 0.0 ../MuPIT_Interactive?gm=chr19:18856059 0 10269.5 . het 592 2379 0.248844052123 ENST00000599848.5 + ENST00000262803.9:A560V(MS),*ENST00000599848.5:A571V(MS) ENST00000262803.9 0.63 *ENST00000599848.5:A571V(0.61:0.0530),ENST00000262803.9:A560V(0.63:0.0394) ENST00000262803 p.A560V (large_intestine 1) 1 0 0 NC_000019.10:g.18856059C>T ENST00000599848.5:p.Ala571Val ENST00000262803.9:p.Ala560Val,*ENST00000599848.5:p.Ala571Val 0 +1 VAR516_unknown chr19 18856059 + C T unknown UPF1 MS A571V EAIDSPVSFLALHNQIR EAIDSPVSFLVLHNQIR 0.0394 COSM3100527 large_intestine(1) 1 0.0 ../MuPIT_Interactive?gm=chr19:18856059 0 10269.5 . het 592 2379 0.248844052123 ENST00000599848.5 + ENST00000262803.9:A560V(MS),*ENST00000599848.5:A571V(MS) ENST00000262803.9 0.63 *ENST00000599848.5:A571V(0.61:0.0530),ENST00000262803.9:A560V(0.63:0.0394) ENST00000262803 p.A560V (large_intestine 1) 1 0 0 NC_000019.10:g.18856059C>T ENST00000599848.5:p.Ala571Val ENST00000262803.9:p.Ala560Val,*ENST00000599848.5:p.Ala571Val 0