Mercurial > repos > portiahollyoak > fastuniq
view source/fastq_pair.c @ 0:816cb55b5a2d draft default tip
planemo upload for repository https://github.com/portiahollyoak/Tools commit c4769fd68ad9583d4b9dbdf212e4ecb5968cef1c-dirty
author | portiahollyoak |
---|---|
date | Thu, 02 Jun 2016 11:34:51 -0400 |
parents | |
children |
line wrap: on
line source
/****************************************************************************
 * The 'FASTQ_PAIR' structure group was used to store paired reads and
 * qualities, including basic operation function as well.
 *
 * This file was written by Haibin Xu, December 2011.
 ****************************************************************************/

#include "fastq_pair.h"

FASTQ_PAIR *fastq_pair_create(void)
{
	/* Allocate a new, empty FASTQ pair (both reads set to NULL).
	 * Returns a pointer to the pair, or NULL if the allocation fails.
	 * The caller owns the result and releases it with fastq_pair_remove().
	 */
	FASTQ_PAIR *fq_pair;

	fq_pair = malloc(sizeof *fq_pair);
	if (fq_pair == NULL)
		return NULL;

	fq_pair->seq_left = NULL;
	fq_pair->seq_right = NULL;

	return fq_pair;
}

int fastq_pair_remove(FASTQ_PAIR *fq_pair)
{
	/* Release the FASTQ pair: its reads are cleared first, then the pair
	 * itself is freed. Returns 0 on success, 1 if fq_pair is NULL.
	 */
	if (fq_pair == NULL)
		return 1;

	fastq_pair_clear(fq_pair);
	free(fq_pair);

	return 0;
}

int fastq_pair_clear(FASTQ_PAIR *fq_pair)
{
	/* Detach both reads from the pair, handing each non-NULL read to
	 * fastq_remove() and resetting the member to NULL so the pair can be
	 * reused. Returns 0 on success, 1 if fq_pair is NULL.
	 */
	if (fq_pair == NULL)
		return 1;

	if (fq_pair->seq_left != NULL) {
		fastq_remove(fq_pair->seq_left);
		fq_pair->seq_left = NULL;
	}

	if (fq_pair->seq_right != NULL) {
		fastq_remove(fq_pair->seq_right);
		fq_pair->seq_right = NULL;
	}

	return 0;
}

int fastq_pair_scanf(FASTQ_PAIR *fq_pair, FILE *fp_left_in, FILE *fp_right_in,
                     int whether_append_description, int whether_append_quality)
{
	/* Load the left and right reads for the FASTQ pair from the two input
	 * files. Both flags are forwarded unchanged to fastq_scanf():
	 *   whether_append_description: 1 to include the description, 0 not to;
	 *   whether_append_quality:     1 to include the quality, 0 not to.
	 *
	 * Returns 0 on success. Returns 1 if any pointer argument is NULL (the
	 * pair is left untouched in that case), or if creating or reading
	 * either read fails (the pair has already been cleared and stays
	 * empty).
	 */
	FASTQ_ALL *fq_left, *fq_right;

	if (fq_pair == NULL || fp_left_in == NULL || fp_right_in == NULL)
		return 1;

	/* drop whatever the pair held before */
	fastq_pair_clear(fq_pair);

	/* create the two FASTQ_ALL structures */
	fq_left = fastq_create();
	if (fq_left == NULL)
		return 1;

	fq_right = fastq_create();
	if (fq_right == NULL) {
		fastq_remove(fq_left);
		return 1;
	}

	/* The right file is only read when the left read succeeded
	 * (short-circuit evaluation), exactly one record from each on success. */
	if (fastq_scanf(fq_left, fp_left_in, whether_append_description,
	                whether_append_quality) != 0 ||
	    fastq_scanf(fq_right, fp_right_in, whether_append_description,
	                whether_append_quality) != 0) {
		fastq_remove(fq_left);
		fastq_remove(fq_right);
		return 1;
	}

	/* the pair takes ownership of both reads */
	fq_pair->seq_left = fq_left;
	fq_pair->seq_right = fq_right;

	return 0;
}

int fastq_pair_printf(FASTQ_PAIR *fq_pair, FILE *fp_out1, FILE *fp_out2,
                      char *format, long serial)
{
	/* Write the pair-end reads:
	 *   - format "fq" or "fa" with fp_out2 != NULL: left read to fp_out1,
	 *     right read to fp_out2;
	 *   - format "fa" with fp_out2 == NULL: both reads to fp_out1.
	 * 'serial' is forwarded to fastq_printf() (per the original notes,
	 * serial=-1 keeps the original description, otherwise the new serial
	 * is used).
	 *
	 * Returns 0 if the arguments describe a supported combination,
	 * otherwise 1 (NULL fq_pair, fp_out1 or format; unknown format; "fq"
	 * with a single output file).
	 * NOTE(review): the results of fastq_printf() are not inspected here,
	 * so a write failure is not reported to the caller.
	 */
	FILE *fp_right;
	int is_fq, is_fa;

	/* format must be checked before strcmp(): passing NULL is undefined */
	if (fq_pair == NULL || fp_out1 == NULL || format == NULL)
		return 1;

	is_fq = (strcmp(format, "fq") == 0);
	is_fa = (strcmp(format, "fa") == 0);

	if (fp_out2 != NULL) {
		/* two output files: either format is accepted */
		if (!is_fq && !is_fa)
			return 1;
		fp_right = fp_out2;
	} else {
		/* single output file: only FASTA is accepted */
		if (!is_fa)
			return 1;
		fp_right = fp_out1;
	}

	fastq_printf(fq_pair->seq_left, fp_out1, format, serial);
	fastq_printf(fq_pair->seq_right, fp_right, format, serial);

	return 0;
}

/* Return non-zero when the pair and both of its sequence strings exist. */
static int pair_has_sequences(const FASTQ_PAIR *fq_pair)
{
	return fq_pair != NULL &&
	       fq_pair->seq_left != NULL &&
	       fq_pair->seq_left->sequence != NULL &&
	       fq_pair->seq_right != NULL &&
	       fq_pair->seq_right->sequence != NULL;
}

/* Tight comparison of two strings: -1, 0 or 1; a proper prefix sorts first. */
static int pair_seq_cmp_tight(const char *a, const char *b)
{
	/* skip the common prefix */
	while (*a != '\0' && *a == *b) {
		a++;
		b++;
	}

	if (*a == *b)
		return 0;   /* both strings ended together */
	if (*a == '\0')
		return -1;  /* a is a proper prefix of b */
	if (*b == '\0')
		return 1;   /* b is a proper prefix of a */

	return (*a > *b) ? 1 : -1;
}

/* Loose comparison: like the tight one, but a prefix counts as equal. */
static int pair_seq_cmp_loose(const char *a, const char *b)
{
	/* skip the common prefix */
	while (*a != '\0' && *a == *b) {
		a++;
		b++;
	}

	/* either string exhausted: no difference within the shared length */
	if (*a == '\0' || *b == '\0')
		return 0;

	return (*a > *b) ? 1 : -1;
}

int fastq_pair_compare_tight(FASTQ_PAIR *fq_pair_a, FASTQ_PAIR *fq_pair_b)
{
	/* Compare the two FASTQ pairs tightly: the left sequences are compared
	 * first and the right sequences only break a tie. A sequence that is a
	 * proper prefix of the other is considered smaller.
	 * Returns 0 if identical, 1 if a>b, -1 if a<b.
	 * NOTE: 1 is also returned when either pair, read or sequence is
	 * missing, so that error is indistinguishable from "a>b".
	 */
	int flag;

	/* check whether the sequence reads exist */
	if (!pair_has_sequences(fq_pair_a) || !pair_has_sequences(fq_pair_b))
		return 1;

	flag = pair_seq_cmp_tight(fq_pair_a->seq_left->sequence,
	                          fq_pair_b->seq_left->sequence);
	if (flag == 0)
		flag = pair_seq_cmp_tight(fq_pair_a->seq_right->sequence,
		                          fq_pair_b->seq_right->sequence);

	return flag;
}

int fastq_pair_compare_loose(FASTQ_PAIR *fq_pair_a, FASTQ_PAIR *fq_pair_b)
{
	/* Compare the two FASTQ pairs loosely: the left sequences are compared
	 * first and the right sequences only break a tie. Only the characters
	 * up to the end of the shorter sequence are compared, so a sequence
	 * that is a prefix of the other counts as equal to it.
	 * Returns 0 if identical, 1 if a>b, -1 if a<b.
	 * NOTE: 1 is also returned when either pair, read or sequence is
	 * missing, so that error is indistinguishable from "a>b".
	 */
	int flag;

	/* check whether the sequence reads exist */
	if (!pair_has_sequences(fq_pair_a) || !pair_has_sequences(fq_pair_b))
		return 1;

	flag = pair_seq_cmp_loose(fq_pair_a->seq_left->sequence,
	                          fq_pair_b->seq_left->sequence);
	if (flag == 0)
		flag = pair_seq_cmp_loose(fq_pair_a->seq_right->sequence,
		                          fq_pair_b->seq_right->sequence);

	return flag;
}

long fastq_pair_get_left_length(FASTQ_PAIR *fq_pair)
{
	/* Return the result of fastq_get_length() for the left read of the
	 * pair, or -1 if fq_pair is NULL.
	 */
	if (fq_pair == NULL)
		return -1;

	return fastq_get_length(fq_pair->seq_left);
}

long fastq_pair_get_right_length(FASTQ_PAIR *fq_pair)
{
	/* Return the result of fastq_get_length() for the right read of the
	 * pair, or -1 if fq_pair is NULL.
	 */
	if (fq_pair == NULL)
		return -1;

	return fastq_get_length(fq_pair->seq_right);
}

long fastq_pair_get_total_length(FASTQ_PAIR *fq_pair)
{
	/* Return the sum of the left and right read lengths of the pair.
	 * Returns -1 if fq_pair is NULL or if either individual length is
	 * reported as -1.
	 */
	long left_length, right_length;

	if (fq_pair == NULL)
		return -1;

	left_length = fastq_pair_get_left_length(fq_pair);
	right_length = fastq_pair_get_right_length(fq_pair);

	if (left_length == -1 || right_length == -1)
		return -1;

	return left_length + right_length;
}