annotate Tools/CREF/Extract_motif_codes_galaxy.pl @ 0:229d36377838 draft

Uploaded
author amadeo
date Mon, 05 Sep 2016 05:53:08 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
229d36377838 Uploaded
amadeo
parents:
diff changeset
1 #!/usr/bin/perl -w
229d36377838 Uploaded
amadeo
parents:
diff changeset
2
229d36377838 Uploaded
amadeo
parents:
diff changeset
3 # The lines that start with # are comment lines that are not executed
229d36377838 Uploaded
amadeo
parents:
diff changeset
4
229d36377838 Uploaded
amadeo
parents:
diff changeset
5
229d36377838 Uploaded
amadeo
parents:
diff changeset
6 $|=1;
229d36377838 Uploaded
amadeo
parents:
diff changeset
7 use strict;
229d36377838 Uploaded
amadeo
parents:
diff changeset
8 use warnings;
229d36377838 Uploaded
amadeo
parents:
diff changeset
9
229d36377838 Uploaded
amadeo
parents:
diff changeset
10
229d36377838 Uploaded
amadeo
parents:
diff changeset
11 #Script to take output from AME (part of the MEME Suite, meme-suite.org) and extract a
229d36377838 Uploaded
amadeo
parents:
diff changeset
12 #list of the overrepresented motifs and print them to a new file
229d36377838 Uploaded
amadeo
parents:
diff changeset
13 #called ame-motif-id.list
229d36377838 Uploaded
amadeo
parents:
diff changeset
14
229d36377838 Uploaded
amadeo
parents:
diff changeset
15
229d36377838 Uploaded
amadeo
parents:
diff changeset
16 #Checking to see if the user has provided 2 arguments - which are the
229d36377838 Uploaded
amadeo
parents:
diff changeset
17 #names of the AME results file and of the output file
229d36377838 Uploaded
amadeo
parents:
diff changeset
18
229d36377838 Uploaded
amadeo
parents:
diff changeset
19 if(@ARGV < 2){
229d36377838 Uploaded
amadeo
parents:
diff changeset
20 print "\nUsage: Extract_motif_codes.pl ame.txt ame-shorted.txt\n\n";
229d36377838 Uploaded
amadeo
parents:
diff changeset
21 exit(0);
229d36377838 Uploaded
amadeo
parents:
diff changeset
22 }
229d36377838 Uploaded
amadeo
parents:
diff changeset
23
229d36377838 Uploaded
amadeo
parents:
diff changeset
24 #Declaring variables
229d36377838 Uploaded
amadeo
parents:
diff changeset
25 my @cols; #an array variable
229d36377838 Uploaded
amadeo
parents:
diff changeset
26 my $line; # a scalar variable
229d36377838 Uploaded
amadeo
parents:
diff changeset
27
229d36377838 Uploaded
amadeo
parents:
diff changeset
28 #Using a FILEHANDLE to open the input file
229d36377838 Uploaded
amadeo
parents:
diff changeset
29 open (INPUT, "<$ARGV[0]") ||
229d36377838 Uploaded
amadeo
parents:
diff changeset
30 die "File '$ARGV[0]' not found\n" ;
229d36377838 Uploaded
amadeo
parents:
diff changeset
31
229d36377838 Uploaded
amadeo
parents:
diff changeset
32 open (OUTPUT, ">$ARGV[1]") ||
229d36377838 Uploaded
amadeo
parents:
diff changeset
33 die "File '>$ARGV[1]' not found\n" ;
229d36377838 Uploaded
amadeo
parents:
diff changeset
34
229d36377838 Uploaded
amadeo
parents:
diff changeset
35 #looping through each line of the file
229d36377838 Uploaded
amadeo
parents:
diff changeset
36 while (<INPUT>){
229d36377838 Uploaded
amadeo
parents:
diff changeset
37 #assigning line to variable $line
229d36377838 Uploaded
amadeo
parents:
diff changeset
38 #$_ is a special default variable that here holds the line contents
229d36377838 Uploaded
amadeo
parents:
diff changeset
39 $line = $_;
229d36377838 Uploaded
amadeo
parents:
diff changeset
40 #match lines that have Ranksum
229d36377838 Uploaded
amadeo
parents:
diff changeset
41 if ($line =~ /Ranksum/){
229d36377838 Uploaded
amadeo
parents:
diff changeset
42 printf OUTPUT "%s\n", $line;
229d36377838 Uploaded
amadeo
parents:
diff changeset
43 #split the lines on white space, so each part of the line gets
229d36377838 Uploaded
amadeo
parents:
diff changeset
44 #stored as an array element
229d36377838 Uploaded
amadeo
parents:
diff changeset
45 @cols=split;
229d36377838 Uploaded
amadeo
parents:
diff changeset
46 #Testing to see what line elements are stored in the array
229d36377838 Uploaded
amadeo
parents:
diff changeset
47 #print "cols [0] is $cols[0] \n";
229d36377838 Uploaded
amadeo
parents:
diff changeset
48 #print "cols [2] is $cols[2] \n\n";
229d36377838 Uploaded
amadeo
parents:
diff changeset
49
229d36377838 Uploaded
amadeo
parents:
diff changeset
50 #Now see if you can print out the array element that stores the
229d36377838 Uploaded
amadeo
parents:
diff changeset
51 #motif ID to a new file called ame-motif-id.list.
229d36377838 Uploaded
amadeo
parents:
diff changeset
52 }
229d36377838 Uploaded
amadeo
parents:
diff changeset
53 }
229d36377838 Uploaded
amadeo
parents:
diff changeset
54