# HG changeset patch # User bgruening # Date 1387311890 18000 # Node ID ad6a989924ac35f81e350abbc8e852ca4806637e Uploaded diff -r 000000000000 -r ad6a989924ac split_file_on_column.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/split_file_on_column.xml Tue Dec 17 15:24:50 2013 -0500 @@ -0,0 +1,55 @@ + + according to the values of a column + + gnu_awk + + + awk '{print > "primary_${outfile.id}_" \$$column "_visible_${infile.ext}" }' $infile; + echo 'Created' `ls -1 --hide="*_stdout" --hide="*_stderr" | wc -l` 'files:' > $outfile; + ls -1 --hide="*_stdout" --hide="*_stderr" >> $outfile; + + + + + + + + + + + + + + + + +**What it does** + +This tool splits a file into several smaller files, one for each distinct value found in the chosen column. +It works like the group tool, but every group is saved to its own file. + +----- + +**Example** + +Splitting on column 5 from this:: + + chr7 56632 56652 cluster 1 + chr7 56736 56756 cluster 1 + chr7 56761 56781 cluster 2 + chr7 56772 56792 cluster 2 + chr7 56775 56795 cluster 2 + +will produce 2 files, one per cluster:: + + chr7 56632 56652 cluster 1 + chr7 56736 56756 cluster 1 + + + chr7 56761 56781 cluster 2 + chr7 56772 56792 cluster 2 + chr7 56775 56795 cluster 2 + + + + diff -r 000000000000 -r ad6a989924ac tool_dependencies.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_dependencies.xml Tue Dec 17 15:24:50 2013 -0500 @@ -0,0 +1,6 @@ + + + + + +