annotate SNV/SNVMix2_source/SNVMix2-v0.12.1-rc1/samtools-0.1.6/bgzip.c @ 0:74f5ea818cea

Uploaded
author ryanmorin
date Wed, 12 Oct 2011 19:50:38 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
1 /* The MIT License
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
2
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
3 Copyright (c) 2008 Broad Institute / Massachusetts Institute of Technology
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
4
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
5 Permission is hereby granted, free of charge, to any person obtaining a copy
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
6 of this software and associated documentation files (the "Software"), to deal
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
7 in the Software without restriction, including without limitation the rights
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
8 to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
9 copies of the Software, and to permit persons to whom the Software is
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
10 furnished to do so, subject to the following conditions:
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
11
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
12 The above copyright notice and this permission notice shall be included in
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
13 all copies or substantial portions of the Software.
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
14
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
15 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
16 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
17 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
18 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
19 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
20 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
21 THE SOFTWARE.
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
22 */
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
23
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
24 #include <stdlib.h>
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
25 #include <string.h>
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
26 #include <stdio.h>
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
27 #include <fcntl.h>
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
28 #include <unistd.h>
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
29 #include <errno.h>
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
30 #include "bgzf.h"
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
31
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
/* Size in bytes of the buffer used for each read/write pass (64 KiB). */
enum { WINDOW_SIZE = 64 * 1024 };
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
33
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
/*
 * Print the command-line help text on standard output.
 *
 * Always returns 0, so callers can use it directly as the process
 * exit status.
 */
static int bgzip_main_usage()
{
    /* The "-l" (list contents) option is intentionally not advertised. */
    static const char *const help_lines[] = {
        "\n",
        "Usage: bgzip [options] [file] ...\n\n",
        "Options: -c write on standard output, keep original files unchanged\n",
        " -d decompress\n",
        " -b INT decompress at virtual file pointer INT\n",
        " -s INT decompress INT bytes in the uncompressed file\n",
        " -h give this help\n",
        "\n",
    };
    size_t i;

    for (i = 0; i < sizeof help_lines / sizeof help_lines[0]; ++i) {
        fputs(help_lines[i], stdout);
    }
    return 0;
}
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
47
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
/*
 * Open `fn` for writing (created with mode 0644, truncated) and return
 * its file descriptor.
 *
 * fn        path of the output file
 * is_forced non-zero: overwrite an existing file without asking;
 *           zero: if the file already exists, ask on the terminal and
 *           only overwrite when the answer starts with 'y' or 'Y'
 *
 * Never returns a negative descriptor: the process exits with status 1
 * when the user declines to overwrite or when the file cannot be opened.
 */
static int write_open(const char *fn, int is_forced)
{
    int fd = -1;

    if (!is_forced) {
        /* O_EXCL makes the open fail with EEXIST instead of clobbering. */
        fd = open(fn, O_WRONLY | O_CREAT | O_TRUNC | O_EXCL, 0644);
        if (fd < 0 && errno == EEXIST) {
            char answer = 'n';

            printf("bgzip: %s already exists; do you wish to overwrite (y or n)? ", fn);
            /* Make sure the prompt is visible before blocking on input. */
            fflush(stdout);
            /* No input (EOF / read error) is treated as "no". */
            if (scanf("%c", &answer) != 1) {
                answer = 'n';
            }
            if (answer != 'Y' && answer != 'y') {
                printf("bgzip: not overwritten\n");
                exit(1);
            }
        }
    }
    if (fd < 0) {
        /* Forced, confirmed, or the exclusive open failed for another reason. */
        fd = open(fn, O_WRONLY | O_CREAT | O_TRUNC, 0644);
        if (fd < 0) {
            fprintf(stderr, "bgzip: %s: Fail to write\n", fn);
            exit(1);
        }
    }
    return fd;
}
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
70
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
71 static
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
72 void
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
73 fail(BGZF* fp)
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
74 {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
75 printf("Error: %s\n", fp->error);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
76 exit(1);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
77 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
78
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
79 int main(int argc, char **argv)
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
80 {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
81 int c, compress, pstdout, is_forced;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
82 BGZF *rz;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
83 void *buffer;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
84 long start, end, size;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
85
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
86 compress = 1; pstdout = 0; start = 0; size = -1; end = -1; is_forced = 0;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
87 while((c = getopt(argc, argv, "cdlhfb:s:")) >= 0){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
88 switch(c){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
89 case 'h': return bgzip_main_usage();
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
90 case 'd': compress = 0; break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
91 case 'c': pstdout = 1; break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
92 // case 'l': compress = 2; break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
93 case 'b': start = atol(optarg); break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
94 case 's': size = atol(optarg); break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
95 case 'f': is_forced = 1; break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
96 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
97 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
98 if (size >= 0) end = start + size;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
99 if(end >= 0 && end < start){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
100 fprintf(stderr, " -- Illegal region: [%ld, %ld] --\n", start, end);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
101 return 1;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
102 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
103 if(compress == 1){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
104 int f_src, f_dst = -1;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
105 if(argc > optind){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
106 if((f_src = open(argv[optind], O_RDONLY)) < 0){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
107 fprintf(stderr, " -- Cannot open file: %s --\n", argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
108 return 1;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
109 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
110 if(pstdout){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
111 f_dst = fileno(stdout);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
112 } else {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
113 char *name = malloc(sizeof(strlen(argv[optind]) + 5));
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
114 strcpy(name, argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
115 strcat(name, ".gz");
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
116 f_dst = write_open(name, is_forced);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
117 if (f_dst < 0) return 1;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
118 free(name);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
119 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
120 } else if(pstdout){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
121 f_src = fileno(stdin);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
122 f_dst = fileno(stdout);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
123 } else return bgzip_main_usage();
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
124 rz = bgzf_fdopen(f_dst, "w");
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
125 buffer = malloc(WINDOW_SIZE);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
126 while((c = read(f_src, buffer, WINDOW_SIZE)) > 0) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
127 if (bgzf_write(rz, buffer, c) < 0) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
128 fail(rz);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
129 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
130 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
131 // f_dst will be closed here
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
132 if (bgzf_close(rz) < 0) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
133 fail(rz);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
134 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
135 if (argc > optind) unlink(argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
136 free(buffer);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
137 close(f_src);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
138 return 0;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
139 } else {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
140 if(argc <= optind) return bgzip_main_usage();
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
141 int f_dst;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
142 if (argc > optind && !pstdout) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
143 char *name;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
144 if (strstr(argv[optind], ".gz") - argv[optind] != strlen(argv[optind]) - 3) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
145 printf("bgzip: %s: unknown suffix -- ignored\n", argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
146 return 1;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
147 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
148 name = strdup(argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
149 name[strlen(name) - 3] = '\0';
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
150 f_dst = write_open(name, is_forced);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
151 free(name);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
152 } else f_dst = fileno(stdout);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
153 rz = bgzf_open(argv[optind], "r");
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
154 if (rz == NULL) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
155 printf("Could not open file: %s\n", argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
156 return 1;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
157 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
158 buffer = malloc(WINDOW_SIZE);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
159 if (bgzf_seek(rz, start, SEEK_SET) < 0) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
160 fail(rz);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
161 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
162 while(1){
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
163 if(end < 0) c = bgzf_read(rz, buffer, WINDOW_SIZE);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
164 else c = bgzf_read(rz, buffer, (end - start > WINDOW_SIZE)? WINDOW_SIZE:(end - start));
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
165 if(c == 0) break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
166 if (c < 0) fail(rz);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
167 start += c;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
168 write(f_dst, buffer, c);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
169 if(end >= 0 && start >= end) break;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
170 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
171 free(buffer);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
172 if (bgzf_close(rz) < 0) {
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
173 fail(rz);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
174 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
175 if (!pstdout) unlink(argv[optind]);
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
176 return 0;
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
177 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
178 }
74f5ea818cea Uploaded
ryanmorin
parents:
diff changeset
179