annotate tools/rdock/bin/sdsplit @ 3:279ba0732f87 draft default tip

planemo upload
author marpiech
date Mon, 29 Aug 2016 09:07:58 -0400
parents 30e2440b2173
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
1 #!/usr/bin/perl
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
2 # Splits SD records into multiple files of equal no. of records
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
3 use lib "$ENV{'RBT_ROOT'}/lib";
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
4
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
5 use FileHandle;
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
6 use SDRecord;
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
7
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
# Number of records written to each output file (override with -<RecSize>).
my $recSize = 1000;

# Root name for output files; files are named <root><n>.sd
# (override with -o<OutputRoot>).
my $outRoot = "tmp";

# Print help if no command line arguments
printHelpAndExit() if (scalar(@ARGV) == 0);

# Parse command line arguments:
#   -h              print help and exit
#   -o<OutputRoot>  set the output root name
#   -<RecSize>      set the number of records per output file
#   anything else   is collected as an input filename
my @files;
while (scalar(@ARGV)) {
    my $arg = shift @ARGV;
    printHelpAndExit() if ($arg eq '-h');
    if (index($arg, '-o') == 0) {
        $outRoot = substr($arg, 2);
    }
    elsif (index($arg, '-') == 0) {
        my $size = substr($arg, 1);
        # The record size is used as a modulus when splitting, so a value
        # that is not a positive integer (e.g. "-0", "-x" or a bare "-")
        # would otherwise abort later with "Illegal modulus zero".
        unless ($size =~ /\A[0-9]+\z/ && $size > 0) {
            die "Invalid option '$arg': expected -<RecSize> with a positive integer record size\n";
        }
        $recSize = $size;
    }
    else {
        push @files, $arg;    # must be a filename
    }
}
# Put the filenames back in the arg list. The help text states that input
# comes from standard input when no files are given; presumably the record
# reader consumes @ARGV via <> -- confirm against SDRecord.
push @ARGV, @files;
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
33
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
# State for the splitting loop.
my $sdRec = SDRecord->new;    # record object, reused for every record
my $nRec  = 0;                # number of records written so far
my $nFile = 0;                # number of output files opened so far
my $sdfh;                     # handle of the output file currently open
my $outFile;                  # name of the output file currently open

# Read records one at a time and write each to the current output file,
# starting a new file (<outRoot><n>.sd) every $recSize records.
while ($sdRec->readRec('LINES' => 1)) {
    # check if we need to start a new output file
    if ($nRec % $recSize == 0) {
        # Finish the previous file first so that a failed close is
        # reported against the right filename instead of being lost.
        if (defined $sdfh) {
            select(STDOUT);
            $sdfh->close or die "Can't close $outFile: $!";
        }
        $nFile++;
        $outFile = $outRoot . $nFile . ".sd";
        # Pass the mode separately so the filename is taken literally and
        # cannot be interpreted as part of the open mode.
        $sdfh = FileHandle->new($outFile, '>');
        if (!defined $sdfh) {
            die "Can't open $outFile: $!";
        }
        print STDOUT "Opening $outFile\n";
        $sdfh->autoflush(1);
        # writeRec() is called without a handle below; presumably it prints
        # to the currently selected handle, hence the select() -- confirm
        # against SDRecord.
        select($sdfh);
    }
    $nRec++;
    $sdRec->writeRec();
}

# Reselect STDOUT as default, then close the last output file (if any
# records were read at all) and report a failed close.
select(STDOUT);
if (defined $sdfh) {
    $sdfh->close or die "Can't close $outFile: $!";
    undef $sdfh;
}
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
63
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
64 #######################################################################
30e2440b2173 planemo upload
marpiech
parents:
diff changeset
# Print the usage summary to the default output handle and terminate the
# program via exit (no explicit status is passed). Takes no arguments and
# never returns to the caller.
sub printHelpAndExit {
    # The original string began with "\S", which is not a string escape;
    # the stray backslash is dropped and the printed text is unchanged.
    print "Splits SD records into multiple files of equal size\n";
    print "\nUsage:\tsdsplit [-<RecSize>] [-o<OutputRoot>] [sdFiles]\n\n";
    print "\t-<RecSize>\trecord size to split into (default = 1000 records)\n";
    print "\t-o<OutputRoot>\tRoot name for output files (default = tmp)\n";
    print "\n\tIf SD file list not given, reads from standard input\n";
    exit;
}