Mercurial > repos > saharlcc > isoem2_isode2
diff isoDE2.sh @ 14:007e2dd3fe8b draft
Bug fix in output files headers
author | saharlcc |
---|---|
date | Mon, 03 Apr 2017 17:55:22 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/isoDE2.sh Mon Apr 03 17:55:22 2017 -0400 @@ -0,0 +1,218 @@ +#!/bin/bash + +isoEMDir=/galaxy/galaxy/tools-dependencies/bin/isoem2/ +toolpath=${isoEMDir}/bin +isoDEPath=${isoEMDir}/bin +supportCalcPath=${isoEMDir}/src/calc +fpkmGeneCommand="" +fpkmIsoformCommand="" +tpmGeneCommand="" +tpmIsoformCommand="" + +numberOfBootstrapIterationsPerSample=199 + +arg=($*) +i=0 +while [ $i -lt $# ] +do + a=${arg[i]} + if [ "$a" == "-c1" ]; then + fpkmGeneCommand="$fpkmGeneCommand -c1" + fpkmIsoformCommand="$fpkmIsoformCommand -c1" + tpmGeneCommand="$tpmGeneCommand -c1" + tpmIsoformCommand="$tpmIsoformCommand -c1" + + ((i++)) + a=${arg[i]} + rep=1 + while [[ `expr index "$a" "/"` -ne 0 && $i -lt $# ]] + do + condition1File=$a + ${toolpath}/convertToisoDEFormatWithIsoforms $condition1File c1_rep${rep} + + fpkmGeneCommand="$fpkmGeneCommand c1_rep${rep}_fpkm_G" + fpkmIsoformCommand="$fpkmIsoformCommand c1_rep${rep}_fpkm_I" + tpmGeneCommand="$tpmGeneCommand c1_rep${rep}_tpm_G" + tpmIsoformCommand="$tpmIsoformCommand c1_rep${rep}_tpm_I" + ((rep++)) + + ((i++)) + a=${arg[i]} + done + elif [ "$a" == "-c2" ]; then + fpkmGeneCommand="$fpkmGeneCommand -c2" + fpkmIsoformCommand="$fpkmIsoformCommand -c2" + tpmGeneCommand="$tpmGeneCommand -c2" + tpmIsoformCommand="$tpmIsoformCommand -c2" + + ((i++)) + a=${arg[i]} + rep=1 + while [[ `expr index "$a" "/"` -ne 0 && $i -lt $# ]] + do + condition1File=$a + #echo $condition1File + ${toolpath}/convertToisoDEFormatWithIsoforms $condition1File c2_rep${rep} + + fpkmGeneCommand="$fpkmGeneCommand c2_rep${rep}_fpkm_G" + fpkmIsoformCommand="$fpkmIsoformCommand c2_rep${rep}_fpkm_I" + tpmGeneCommand="$tpmGeneCommand c2_rep${rep}_tpm_G" + tpmIsoformCommand="$tpmIsoformCommand c2_rep${rep}_tpm_I" + ((rep++)) + + ((i++)) + a=${arg[i]} + done + elif [ "$a" == "-pval" ]; then + ((i++)) + pval=${arg[i]} + ((i++)) + + + elif [ "$a" == "-geneFPKMout" ]; then + ((i++)) + geneFPKMout_file=${arg[i]} + ((i++)) + + + elif [ "$a" == "-geneTPMout" ]; then + ((i++)) + geneTPMout_file=${arg[i]} + ((i++)) + + elif [ "$a" == "-isoFPKMout" ]; then + ((i++)) + isoFPKMout_file=${arg[i]} + ((i++)) + + elif [ "$a" == "-isoTPMout" ]; then + ((i++)) + isoTPMout_file=${arg[i]} + ((i++)) + else + + ((i++)) + fi + +done +((rep--)) +bootstrap=$(($rep*$numberOfBootstrapIterationsPerSample)) +echo boostrap iterations $bootstrap +#support=`java -cp ${supportCalcPath} support 200 200 $pval` +#support=`java -cp ${supportCalcPath} support $bootstrap $bootstrap $pval` +#Calculator assumes IsoDE does all pairs when calculation the number of ratios. It multiplies the number of bootstrap samples per condition +# changed the second parameter to make the number of ratios equal to the number of bootstrap samples (match, not all pairs) +echo calculate support based on p-value and number or replicates +support=`java -cp ${supportCalcPath} support $bootstrap 1 $pval` +fpkmGeneCommand="$fpkmGeneCommand -b $support" +fpkmIsoformCommand="$fpkmIsoformCommand -b $support" +tpmGeneCommand="$tpmGeneCommand -b $support" +tpmIsoformCommand="$tpmIsoformCommand -b $support" + +fpkmGeneCommand="$fpkmGeneCommand -dfc 2" +fpkmIsoformCommand="$fpkmIsoformCommand -dfc 2" +tpmGeneCommand="$tpmGeneCommand -dfc 2" +tpmIsoformCommand="$tpmIsoformCommand -dfc 2" + + +#if [ "${out_prefix}" == "$(basename ${out_prefix} )" ]; then +# pth=`pwd` +# out_prefix=${pth}/${out_prefix} +#fi + + +echo GENE FPKM +echo moving start +date + +mkdir fpkm_G +cd fpkm_G +mv ../c*_fpkm_G . + + +echo isoDE start +date + + +${isoDEPath}/isodecalls $fpkmGeneCommand -out "output.txt" +#awk '{for (f=1; f<=NF; f++) {if (f == NF) printf "%s",$f; else printf "%s\t", $f }; print ""}' Bootstrap_Merge1_DIR/output.txt | sed 1,1d > ${geneFPKMout_file} + +echo awk command +date + + +awk '{if (NR == 1) {print "Gene ID\tConfident log2 FC\t Single run log2 FC\t c1 average FPKM\tc2 average FPKM";} else {if ($6 == 0 && $7 == 0) {two="0";} else {two=$2;} print $1 "\t" two "\t" $5 "\t" $6 "\t" $7}}' Bootstrap_Merge1_DIR/output.txt > ${geneFPKMout_file} + +cd .. + + +echo ISOFORM FPKM + +echo moving start +date + +mkdir fpkm_I +cd fpkm_I +mv ../c*_fpkm_I . + + +echo isoDE start +date + +${isoDEPath}/isodecalls $fpkmIsoformCommand -out "output.txt" + +echo awk command +date +pwd +awk '{if (NR == 1) {print "Isoform ID\tConfident log2 FC\t Single run log2 FC\t c1 average FPKM\tc2 average FPKM";} else {if ($6 == 0 && $7 == 0) {two="0";} else {two=$2;} print $1 "\t" two "\t" $5 "\t" $6 "\t" $7}}' Bootstrap_Merge1_DIR/output.txt > ${isoFPKMout_file} +cd .. + + +echo ISOFORM TPM +echo moving start +date + +mkdir tpm_G +cd tpm_G +mv ../c*_tpm_G . + +echo isoDE start +date + +${isoDEPath}/isodecalls $tpmGeneCommand -out "output.txt" + +echo awk command +date +pwd +awk '{if (NR == 1) {print "Gene ID\tConfident log2 FC\t Single run log2 FC\t c1 average TPM\tc2 average TPM";} else {if ($6 == 0 && $7 == 0) {two="0";} else {two=$2;} print $1 "\t" two "\t" $5 "\t" $6 "\t" $7}}' Bootstrap_Merge1_DIR/output.txt > ${geneTPMout_file} +cd .. + + +echo ISOFORM TPM +echo moving start +date + +mkdir tpm_I +cd tpm_I +mv ../c*_tpm_I . + +echo isoDE start +date + +${isoDEPath}/isodecalls $tpmIsoformCommand -out "output.txt" + +echo awk command +date + +awk '{if (NR == 1) {print "Isoform ID\tConfident log2 FC\t Single run log2 FC\t c1 average TPM\tc2 average TPM";} else {if ($6 == 0 && $7 == 0) {two="0";} else {two=$2;} print $1 "\t" two "\t" $5 "\t" $6 "\t" $7}}' Bootstrap_Merge1_DIR/output.txt > ${isoTPMout_file} + +cd .. + + +echo final cleanup +date +rm -fr fpkm_G fpkm_I tpm_G cd tpm_I +echo done +date + +