0
|
1 #!/bin/bash
|
|
2
|
|
3 if [ "$#" -ne 1 ]; then
|
|
4 echo "[usage:] ICGC_pipeline.sh fastq_in_tar.gz"
|
|
5 exit 1;
|
|
6 fi
|
|
7
|
|
8 #FASTQ_1=$1
|
|
9 #FASTQ_2=$2
|
|
10 #SAMPLE_ID=$3
|
|
11 #TAR_FILE=$SAMPLE_ID".tar"
|
|
12 TAR_FILE=$1
|
|
13
|
|
14 export PATH=/storage/data/program/GDC_TGCA-Harmonized/RNA-Seq/bin/ICGC-STAR_ALIGNMENT_PIPELINE:$PATH
|
|
15
|
|
16 #tar cvfh $TAR_FILE $FASTQ_2 $FASTQ_1
|
|
17
|
|
18 STAD_ALIGN=~/package/DAUMSOFT/RNA-seq/ICGC_STAR_ALIGNMENT_PIPELINE/star_align.py
|
|
19 STAR_INDEX_PATH=~/refs/hg38/gdc/Index_Files/GDC.h38.d1.vd1_STAR2_Index_Files/star_genome_d1_vd1_gtfv22
|
|
20 WORK_DIR=./wrk
|
|
21 OUTPUT_BAM=./out
|
|
22 REFERENCE=~/refs/hg38/gdc/GRCh38.d1.vd1_Reference_Sequence/GRCh38.d1.vd1.fa
|
|
23 RUN_THREAD_NUM=8
|
|
24 rm -rf $WORK_DIR
|
|
25 rm -rf $OUTPUT_BAM
|
|
26 mkdir $WORK_DIR
|
|
27 mkdir $OUTPUT_BAM
|
|
28
|
|
29 python $STAD_ALIGN \
|
|
30 --genomeDir $STAR_INDEX_PATH \
|
|
31 --tarFileIn $TAR_FILE \
|
|
32 --workDir $WORK_DIR \
|
|
33 --out $OUTPUT_BAM \
|
|
34 --genomeFastaFiles $REFERENCE \
|
|
35 --runThreadN $RUN_THREAD_NUM \
|
|
36 --outFilterMultimapScoreRange 1 \
|
|
37 --outFilterMultimapNmax 20 \
|
|
38 --outFilterMismatchNmax 10 \
|
|
39 --alignIntronMax 500000 \
|
|
40 --alignMatesGapMax 1000000 \
|
|
41 --sjdbScore 2 \
|
|
42 --limitBAMsortRAM 0 \
|
|
43 --alignSJDBoverhangMin 1 \
|
|
44 --genomeLoad NoSharedMemory \
|
|
45 --outFilterMatchNminOverLread 0.33 \
|
|
46 --outFilterScoreMinOverLread 0.33 \
|
|
47 --twopass1readsN -1 \
|
|
48 --sjdbOverhang 100 \
|
|
49 --outSAMstrandField intronMotif \
|
|
50 --outSAMunmapped Within
|
|
51
|