# HG changeset patch
# User iuc
# Date 1714478549 0
# Node ID 55a53b5e308d842c887b0bb87e3acf6884b405d7
# Parent 5412142130adefb5fe8125331abd049e03492ad0
planemo upload for repository https://github.com/open2c/pairtools commit 162c595b19e442f40be4c2f5434b20b56ade52d4
diff -r 5412142130ad -r 55a53b5e308d dedup.xml
--- a/dedup.xml Tue Apr 16 12:51:21 2024 +0000
+++ b/dedup.xml Tue Apr 30 12:02:29 2024 +0000
@@ -20,7 +20,7 @@
]]>
-
+
diff -r 5412142130ad -r 55a53b5e308d macros.xml
--- a/macros.xml Tue Apr 16 12:51:21 2024 +0000
+++ b/macros.xml Tue Apr 30 12:02:29 2024 +0000
@@ -1,5 +1,5 @@
- 1.0.3
+ 1.1.0
0
diff -r 5412142130ad -r 55a53b5e308d test-data/output_dedup_pairs.pairsam
--- a/test-data/output_dedup_pairs.pairsam Tue Apr 16 12:51:21 2024 +0000
+++ b/test-data/output_dedup_pairs.pairsam Tue Apr 30 12:02:29 2024 +0000
@@ -39,20 +39,20 @@
#samheader: @PG ID:bwa PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane1.00.1.fastq.gz MATalpha_R1.lane1.00.2.fastq.gz
#samheader: @PG ID:pairtools_parse-1.2 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:bwa VN:1.0.2
#samheader: @PG ID:pairtools_sort-1.3 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-1.2 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-1.4 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs.pairsam output_sorted_pairs.pairsam PP:pairtools_sort-1.3 VN:1.0.2
+#samheader: @PG ID:pairtools_dedup-1.4 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/2/1/3/dataset_21372a8a-66a4-4ab8-8a38-a1e4d87d5048.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/2/outputs/dataset_b7034ba7-f57e-4752-a341-425fdb4da81e.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-1.3 VN:1.1.0
#samheader: @PG ID:bwa-2CCE5976 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane1.01.1.fastq.gz MATalpha_R1.lane1.01.2.fastq.gz
#samheader: @PG ID:pairtools_parse-2.2 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:bwa-2CCE5976 VN:1.0.2
#samheader: @PG ID:pairtools_sort-2.3 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-2.2 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-2.4 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs.pairsam output_sorted_pairs.pairsam PP:pairtools_sort-2.3 VN:1.0.2
+#samheader: @PG ID:pairtools_dedup-2.4 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/2/1/3/dataset_21372a8a-66a4-4ab8-8a38-a1e4d87d5048.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/2/outputs/dataset_b7034ba7-f57e-4752-a341-425fdb4da81e.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-2.3 VN:1.1.0
#samheader: @PG ID:bwa-3CAFD9D9 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane2.00.1.fastq.gz MATalpha_R1.lane2.00.2.fastq.gz
#samheader: @PG ID:pairtools_parse-3.2 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:bwa-3CAFD9D9 VN:1.0.2
#samheader: @PG ID:pairtools_sort-3.3 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-3.2 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-3.4 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs.pairsam output_sorted_pairs.pairsam PP:pairtools_sort-3.3 VN:1.0.2
+#samheader: @PG ID:pairtools_dedup-3.4 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/2/1/3/dataset_21372a8a-66a4-4ab8-8a38-a1e4d87d5048.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/2/outputs/dataset_b7034ba7-f57e-4752-a341-425fdb4da81e.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-3.3 VN:1.1.0
#samheader: @PG ID:bwa-4548A671 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane2.01.1.fastq.gz MATalpha_R1.lane2.01.2.fastq.gz
#samheader: @PG ID:samtools PN:samtools PP:bwa-4548A671 VN:1.19.2 CL:samtools view -s 0.1 -b -@ 4 -o subset.bam test.bam
#samheader: @PG ID:pairtools_parse-4.3 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:samtools VN:1.0.2
#samheader: @PG ID:pairtools_sort-4.4 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-4.3 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-4.5 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs.pairsam output_sorted_pairs.pairsam PP:pairtools_sort-4.4 VN:1.0.2
+#samheader: @PG ID:pairtools_dedup-4.5 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/2/1/3/dataset_21372a8a-66a4-4ab8-8a38-a1e4d87d5048.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/2/outputs/dataset_b7034ba7-f57e-4752-a341-425fdb4da81e.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-4.4 VN:1.1.0
#columns: readID chrom1 pos1 chrom2 pos2 strand1 strand2 pair_type sam1 sam2
HWI-ST560:29:B0A7LABXX:2:1101:15566:24141 chrI 3199 chrI 3399 + - UU HWI-ST560:29:B0A7LABXX:2:1101:15566:2414197chrI31996015S35M=3350201CTTAGACAATAAGCTAGCTTTCAAGATATAAGATACGAAATAGGGGTTGA111442422223232232EGDD?BFIIIIGBHCJIJIHFIHFHGHGGC<2GHGHFDEGDD?BFIIIIGBHCJIJIHFIHFHGHGGC<2GHGHFDEGDD?BFIIIIGBHCJIJIHFIHFHGHGGC<2GHGHFD332224D=:1NM:i:0MD:Z:50AS:i:50XS:i:0Yt:Z:UU
HWUSI-EAS1533_0033_FC:1:1:2403:20808 chrIV 497939 chrIV 498215 + - DD HWUSI-EAS1533_0033_FC:1:1:2403:2080897chrIV4979396036M=498180277CGCTTTCATTACTCGAATCCGTCAAAGACGCTTCTT4544588888C@@CC@CCC@@@C@@@C@CCC@C@CCNM:i:1MD:Z:0A35AS:i:35XS:i:0Yt:Z:UU HWUSI-EAS1533_0033_FC:1:1:2403:20808145chrIV4981806036M=497939-277GGCTGGTGAAGGAGTATTATTTACAATTCTAAAGCN@@C@@@@CC@CC@CC22C@@@CCCCC888886666)NM:i:1MD:Z:35T0AS:i:35XS:i:0Yt:Z:UU
diff -r 5412142130ad -r 55a53b5e308d test-data/output_pairs_split.bam
Binary file test-data/output_pairs_split.bam has changed
diff -r 5412142130ad -r 55a53b5e308d test-data/output_pairs_split.pairs
--- a/test-data/output_pairs_split.pairs Tue Apr 16 12:51:21 2024 +0000
+++ b/test-data/output_pairs_split.pairs Tue Apr 30 12:02:29 2024 +0000
@@ -39,24 +39,24 @@
#samheader: @PG ID:bwa PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane1.00.1.fastq.gz MATalpha_R1.lane1.00.2.fastq.gz
#samheader: @PG ID:pairtools_parse-1.2 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:bwa VN:1.0.2
#samheader: @PG ID:pairtools_sort-1.3 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-1.2 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-1.4 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs_markdups.pairsam --mark-dups --output-stats output_dedup_pairs.stats output_sorted_pairs.pairsam PP:pairtools_sort-1.3 VN:1.0.2
-#samheader: @PG ID:pairtools_split-1.5 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpnt_hb134/files/7/4/2/dataset_7420fb9f-e3dd-4326-8cef-1e023c2b5e85.dat --output-pairs /tmp/tmpnt_hb134/job_working_directory/000/2/outputs/dataset_ba891b58-22e9-49f5-83f9-063b56eda346.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-1.4 VN:1.0.3
+#samheader: @PG ID:pairtools_dedup-1.4 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/3/7/9/dataset_379f0c04-3329-4201-9b3c-3c3a66e7eec4.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_6f9ee270-56fb-4c2e-92f4-509340f9eb58.dat --mark-dups --output-stats /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_653a5918-ae05-4cfe-8fc9-4ecc516aeaf1.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-1.3 VN:1.1.0
+#samheader: @PG ID:pairtools_split-1.5 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpms_dxt0a/files/8/b/9/dataset_8b97afbd-6770-4cb4-8bf1-fdc78bbce0af.dat --output-pairs /tmp/tmpms_dxt0a/job_working_directory/000/2/outputs/dataset_da90611d-b0d1-447c-ae61-f9ac7147d51d.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-1.4 VN:1.1.0
#samheader: @PG ID:bwa-2CCE5976 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane1.01.1.fastq.gz MATalpha_R1.lane1.01.2.fastq.gz
#samheader: @PG ID:pairtools_parse-2.2 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:bwa-2CCE5976 VN:1.0.2
#samheader: @PG ID:pairtools_sort-2.3 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-2.2 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-2.4 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs_markdups.pairsam --mark-dups --output-stats output_dedup_pairs.stats output_sorted_pairs.pairsam PP:pairtools_sort-2.3 VN:1.0.2
-#samheader: @PG ID:pairtools_split-2.5 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpnt_hb134/files/7/4/2/dataset_7420fb9f-e3dd-4326-8cef-1e023c2b5e85.dat --output-pairs /tmp/tmpnt_hb134/job_working_directory/000/2/outputs/dataset_ba891b58-22e9-49f5-83f9-063b56eda346.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-2.4 VN:1.0.3
+#samheader: @PG ID:pairtools_dedup-2.4 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/3/7/9/dataset_379f0c04-3329-4201-9b3c-3c3a66e7eec4.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_6f9ee270-56fb-4c2e-92f4-509340f9eb58.dat --mark-dups --output-stats /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_653a5918-ae05-4cfe-8fc9-4ecc516aeaf1.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-2.3 VN:1.1.0
+#samheader: @PG ID:pairtools_split-2.5 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpms_dxt0a/files/8/b/9/dataset_8b97afbd-6770-4cb4-8bf1-fdc78bbce0af.dat --output-pairs /tmp/tmpms_dxt0a/job_working_directory/000/2/outputs/dataset_da90611d-b0d1-447c-ae61-f9ac7147d51d.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-2.4 VN:1.1.0
#samheader: @PG ID:bwa-3CAFD9D9 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane2.00.1.fastq.gz MATalpha_R1.lane2.00.2.fastq.gz
#samheader: @PG ID:pairtools_parse-3.2 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:bwa-3CAFD9D9 VN:1.0.2
#samheader: @PG ID:pairtools_sort-3.3 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-3.2 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-3.4 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs_markdups.pairsam --mark-dups --output-stats output_dedup_pairs.stats output_sorted_pairs.pairsam PP:pairtools_sort-3.3 VN:1.0.2
-#samheader: @PG ID:pairtools_split-3.5 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpnt_hb134/files/7/4/2/dataset_7420fb9f-e3dd-4326-8cef-1e023c2b5e85.dat --output-pairs /tmp/tmpnt_hb134/job_working_directory/000/2/outputs/dataset_ba891b58-22e9-49f5-83f9-063b56eda346.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-3.4 VN:1.0.3
+#samheader: @PG ID:pairtools_dedup-3.4 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/3/7/9/dataset_379f0c04-3329-4201-9b3c-3c3a66e7eec4.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_6f9ee270-56fb-4c2e-92f4-509340f9eb58.dat --mark-dups --output-stats /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_653a5918-ae05-4cfe-8fc9-4ecc516aeaf1.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-3.3 VN:1.1.0
+#samheader: @PG ID:pairtools_split-3.5 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpms_dxt0a/files/8/b/9/dataset_8b97afbd-6770-4cb4-8bf1-fdc78bbce0af.dat --output-pairs /tmp/tmpms_dxt0a/job_working_directory/000/2/outputs/dataset_da90611d-b0d1-447c-ae61-f9ac7147d51d.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-3.4 VN:1.1.0
#samheader: @PG ID:bwa-4548A671 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane2.01.1.fastq.gz MATalpha_R1.lane2.01.2.fastq.gz
#samheader: @PG ID:samtools PN:samtools PP:bwa-4548A671 VN:1.19.2 CL:samtools view -s 0.1 -b -@ 4 -o subset.bam test.bam
#samheader: @PG ID:pairtools_parse-4.3 PN:pairtools_parse CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools parse -o output_parsed_pairs_bam.pairs --output-stats output_parsed_pairs.stats --min-mapq 40 --walks-policy 5unique --max-inter-align-gap 30 --chroms-path test.reduced.chrom.sizes test.bam PP:samtools VN:1.0.2
#samheader: @PG ID:pairtools_sort-4.4 PN:pairtools_sort CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools sort -o output_sorted_pairs.pairsam output_parsed_pairs_bam.pairs PP:pairtools_parse-4.3 VN:1.0.2
-#samheader: @PG ID:pairtools_dedup-4.5 PN:pairtools_dedup CL:/scratch/ddepanis/Software/anaconda3/envs/MAP_env/bin/pairtools dedup -o output_dedup_pairs_markdups.pairsam --mark-dups --output-stats output_dedup_pairs.stats output_sorted_pairs.pairsam PP:pairtools_sort-4.4 VN:1.0.2
-#samheader: @PG ID:pairtools_split-4.6 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpnt_hb134/files/7/4/2/dataset_7420fb9f-e3dd-4326-8cef-1e023c2b5e85.dat --output-pairs /tmp/tmpnt_hb134/job_working_directory/000/2/outputs/dataset_ba891b58-22e9-49f5-83f9-063b56eda346.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-4.5 VN:1.0.3
+#samheader: @PG ID:pairtools_dedup-4.5 PN:pairtools_dedup CL:/usr/local/bin/pairtools dedup /tmp/tmpp1v7bap4/files/3/7/9/dataset_379f0c04-3329-4201-9b3c-3c3a66e7eec4.dat -o /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_6f9ee270-56fb-4c2e-92f4-509340f9eb58.dat --mark-dups --output-stats /tmp/tmpp1v7bap4/job_working_directory/000/6/outputs/dataset_653a5918-ae05-4cfe-8fc9-4ecc516aeaf1.dat --nproc-in 1 --nproc-out 1 PP:pairtools_sort-4.4 VN:1.1.0
+#samheader: @PG ID:pairtools_split-4.6 PN:pairtools_split CL:/usr/local/bin/pairtools split /tmp/tmpms_dxt0a/files/8/b/9/dataset_8b97afbd-6770-4cb4-8bf1-fdc78bbce0af.dat --output-pairs /tmp/tmpms_dxt0a/job_working_directory/000/2/outputs/dataset_da90611d-b0d1-447c-ae61-f9ac7147d51d.dat --output-sam ./output.bam --nproc-in 1 --nproc-out 1 PP:pairtools_dedup-4.5 VN:1.1.0
#columns: readID chrom1 pos1 chrom2 pos2 strand1 strand2 pair_type
HWI-ST560:29:B0A7LABXX:2:1101:15566:24141 chrI 3199 chrI 3399 + - UU
HWI-ST560:29:B0A7LABXX:2:1101:18861:21891 chrI 35431 chrI 35703 + - UU
diff -r 5412142130ad -r 55a53b5e308d test-data/output_parsed_pairs.stats
--- a/test-data/output_parsed_pairs.stats Tue Apr 16 12:51:21 2024 +0000
+++ b/test-data/output_parsed_pairs.stats Tue Apr 30 12:02:29 2024 +0000
@@ -6,16 +6,14 @@
total_nodups 308
cis 308
trans 0
-pair_types/MU 88
+pair_types/MU 95
pair_types/UU 293
pair_types/MM 49
pair_types/UR 8
pair_types/MR 26
pair_types/NR 110
pair_types/RU 7
-pair_types/nM 3
-pair_types/Mu 7
-pair_types/NM 1
+pair_types/NM 4
cis_1kb+ 15
cis_2kb+ 14
cis_4kb+ 14
@@ -31,6 +29,33 @@
summary/frac_cis_40kb+ 0.02922077922077922
summary/frac_dups 0.0
summary/complexity_naive nan
+summary/dist_freq_convergence/convergence_dist 177828
+summary/dist_freq_convergence/strands_w_max_convergence_dist ++
+summary/dist_freq_convergence/convergence_rel_diff_threshold 0.05
+summary/dist_freq_convergence/n_cis_pairs_below_convergence_dist/++ 4
+summary/dist_freq_convergence/n_cis_pairs_below_convergence_dist/-- 2
+summary/dist_freq_convergence/n_cis_pairs_below_convergence_dist/-+ 1
+summary/dist_freq_convergence/n_cis_pairs_below_convergence_dist/+- 301
+summary/dist_freq_convergence/n_cis_pairs_below_convergence_dist_all_strands 308
+summary/dist_freq_convergence/n_cis_pairs_above_convergence_dist_all_strands 0
+summary/dist_freq_convergence/frac_cis_in_cis_below_convergence_dist/++ 0.012987012987012988
+summary/dist_freq_convergence/frac_cis_in_cis_below_convergence_dist/-- 0.006493506493506494
+summary/dist_freq_convergence/frac_cis_in_cis_below_convergence_dist/-+ 0.003246753246753247
+summary/dist_freq_convergence/frac_cis_in_cis_below_convergence_dist/+- 0.9772727272727273
+summary/dist_freq_convergence/frac_cis_in_cis_below_convergence_dist_all_strands 1.0
+summary/dist_freq_convergence/frac_cis_in_cis_above_convergence_dist_all_strands 0.0
+summary/dist_freq_convergence/frac_total_mapped_in_cis_below_convergence_dist/++ 0.012987012987012988
+summary/dist_freq_convergence/frac_total_mapped_in_cis_below_convergence_dist/-- 0.006493506493506494
+summary/dist_freq_convergence/frac_total_mapped_in_cis_below_convergence_dist/-+ 0.003246753246753247
+summary/dist_freq_convergence/frac_total_mapped_in_cis_below_convergence_dist/+- 0.9772727272727273
+summary/dist_freq_convergence/frac_total_mapped_in_cis_below_convergence_dist_all_strands 1.0
+summary/dist_freq_convergence/frac_total_mapped_in_cis_above_convergence_dist_all_strands 0.0
+summary/dist_freq_convergence/frac_total_nodups_in_cis_below_convergence_dist/++ 0.012987012987012988
+summary/dist_freq_convergence/frac_total_nodups_in_cis_below_convergence_dist/-- 0.006493506493506494
+summary/dist_freq_convergence/frac_total_nodups_in_cis_below_convergence_dist/-+ 0.003246753246753247
+summary/dist_freq_convergence/frac_total_nodups_in_cis_below_convergence_dist/+- 0.9772727272727273
+summary/dist_freq_convergence/frac_total_nodups_in_cis_below_convergence_dist_all_strands 1.0
+summary/dist_freq_convergence/frac_total_nodups_in_cis_above_convergence_dist_all_strands 0.0
chrom_freq/Test_seq/Test_seq 308
dist_freq/0-1/+- 0
dist_freq/0-1/-+ 0
@@ -44,143 +69,279 @@
dist_freq/2-3/-+ 0
dist_freq/2-3/-- 0
dist_freq/2-3/++ 0
-dist_freq/3-6/+- 0
-dist_freq/3-6/-+ 0
-dist_freq/3-6/-- 0
-dist_freq/3-6/++ 0
-dist_freq/6-10/+- 0
-dist_freq/6-10/-+ 0
-dist_freq/6-10/-- 0
-dist_freq/6-10/++ 0
-dist_freq/10-18/+- 0
-dist_freq/10-18/-+ 0
-dist_freq/10-18/-- 0
-dist_freq/10-18/++ 0
-dist_freq/18-32/+- 0
-dist_freq/18-32/-+ 0
-dist_freq/18-32/-- 0
-dist_freq/18-32/++ 0
-dist_freq/32-56/+- 0
-dist_freq/32-56/-+ 0
-dist_freq/32-56/-- 0
-dist_freq/32-56/++ 0
-dist_freq/56-100/+- 1
-dist_freq/56-100/-+ 0
-dist_freq/56-100/-- 0
-dist_freq/56-100/++ 0
-dist_freq/100-178/+- 3
-dist_freq/100-178/-+ 0
-dist_freq/100-178/-- 0
-dist_freq/100-178/++ 0
-dist_freq/178-316/+- 53
-dist_freq/178-316/-+ 0
-dist_freq/178-316/-- 0
-dist_freq/178-316/++ 0
-dist_freq/316-562/+- 236
-dist_freq/316-562/-+ 0
-dist_freq/316-562/-- 0
-dist_freq/316-562/++ 0
-dist_freq/562-1000/+- 0
-dist_freq/562-1000/-+ 0
-dist_freq/562-1000/-- 0
-dist_freq/562-1000/++ 0
-dist_freq/1000-1778/+- 1
-dist_freq/1000-1778/-+ 0
-dist_freq/1000-1778/-- 0
-dist_freq/1000-1778/++ 0
-dist_freq/1778-3162/+- 0
-dist_freq/1778-3162/-+ 0
-dist_freq/1778-3162/-- 0
-dist_freq/1778-3162/++ 0
-dist_freq/3162-5623/+- 0
-dist_freq/3162-5623/-+ 0
-dist_freq/3162-5623/-- 0
-dist_freq/3162-5623/++ 0
-dist_freq/5623-10000/+- 2
-dist_freq/5623-10000/-+ 0
-dist_freq/5623-10000/-- 0
-dist_freq/5623-10000/++ 0
-dist_freq/10000-17783/+- 1
-dist_freq/10000-17783/-+ 1
-dist_freq/10000-17783/-- 0
-dist_freq/10000-17783/++ 0
-dist_freq/17783-31623/+- 1
-dist_freq/17783-31623/-+ 0
-dist_freq/17783-31623/-- 0
-dist_freq/17783-31623/++ 0
-dist_freq/31623-56234/+- 0
-dist_freq/31623-56234/-+ 0
-dist_freq/31623-56234/-- 0
-dist_freq/31623-56234/++ 1
-dist_freq/56234-100000/+- 2
-dist_freq/56234-100000/-+ 0
-dist_freq/56234-100000/-- 1
-dist_freq/56234-100000/++ 1
-dist_freq/100000-177828/+- 1
-dist_freq/100000-177828/-+ 0
-dist_freq/100000-177828/-- 1
-dist_freq/100000-177828/++ 2
-dist_freq/177828-316228/+- 0
-dist_freq/177828-316228/-+ 0
-dist_freq/177828-316228/-- 0
-dist_freq/177828-316228/++ 0
-dist_freq/316228-562341/+- 0
-dist_freq/316228-562341/-+ 0
-dist_freq/316228-562341/-- 0
-dist_freq/316228-562341/++ 0
-dist_freq/562341-1000000/+- 0
-dist_freq/562341-1000000/-+ 0
-dist_freq/562341-1000000/-- 0
-dist_freq/562341-1000000/++ 0
-dist_freq/1000000-1778279/+- 0
-dist_freq/1000000-1778279/-+ 0
-dist_freq/1000000-1778279/-- 0
-dist_freq/1000000-1778279/++ 0
-dist_freq/1778279-3162278/+- 0
-dist_freq/1778279-3162278/-+ 0
-dist_freq/1778279-3162278/-- 0
-dist_freq/1778279-3162278/++ 0
-dist_freq/3162278-5623413/+- 0
-dist_freq/3162278-5623413/-+ 0
-dist_freq/3162278-5623413/-- 0
-dist_freq/3162278-5623413/++ 0
-dist_freq/5623413-10000000/+- 0
-dist_freq/5623413-10000000/-+ 0
-dist_freq/5623413-10000000/-- 0
-dist_freq/5623413-10000000/++ 0
-dist_freq/10000000-17782794/+- 0
-dist_freq/10000000-17782794/-+ 0
-dist_freq/10000000-17782794/-- 0
-dist_freq/10000000-17782794/++ 0
-dist_freq/17782794-31622777/+- 0
-dist_freq/17782794-31622777/-+ 0
-dist_freq/17782794-31622777/-- 0
-dist_freq/17782794-31622777/++ 0
-dist_freq/31622777-56234133/+- 0
-dist_freq/31622777-56234133/-+ 0
-dist_freq/31622777-56234133/-- 0
-dist_freq/31622777-56234133/++ 0
-dist_freq/56234133-100000000/+- 0
-dist_freq/56234133-100000000/-+ 0
-dist_freq/56234133-100000000/-- 0
-dist_freq/56234133-100000000/++ 0
-dist_freq/100000000-177827941/+- 0
-dist_freq/100000000-177827941/-+ 0
-dist_freq/100000000-177827941/-- 0
-dist_freq/100000000-177827941/++ 0
-dist_freq/177827941-316227766/+- 0
-dist_freq/177827941-316227766/-+ 0
-dist_freq/177827941-316227766/-- 0
-dist_freq/177827941-316227766/++ 0
-dist_freq/316227766-562341325/+- 0
-dist_freq/316227766-562341325/-+ 0
-dist_freq/316227766-562341325/-- 0
-dist_freq/316227766-562341325/++ 0
-dist_freq/562341325-1000000000/+- 0
-dist_freq/562341325-1000000000/-+ 0
-dist_freq/562341325-1000000000/-- 0
-dist_freq/562341325-1000000000/++ 0
-dist_freq/562341325+/+- 0
-dist_freq/562341325+/-+ 0
-dist_freq/562341325+/-- 0
-dist_freq/562341325+/++ 0
+dist_freq/3-4/+- 0
+dist_freq/3-4/-+ 0
+dist_freq/3-4/-- 0
+dist_freq/3-4/++ 0
+dist_freq/4-6/+- 0
+dist_freq/4-6/-+ 0
+dist_freq/4-6/-- 0
+dist_freq/4-6/++ 0
+dist_freq/6-7/+- 0
+dist_freq/6-7/-+ 0
+dist_freq/6-7/-- 0
+dist_freq/6-7/++ 0
+dist_freq/7-10/+- 0
+dist_freq/7-10/-+ 0
+dist_freq/7-10/-- 0
+dist_freq/7-10/++ 0
+dist_freq/10-13/+- 0
+dist_freq/10-13/-+ 0
+dist_freq/10-13/-- 0
+dist_freq/10-13/++ 0
+dist_freq/13-18/+- 0
+dist_freq/13-18/-+ 0
+dist_freq/13-18/-- 0
+dist_freq/13-18/++ 0
+dist_freq/18-24/+- 0
+dist_freq/18-24/-+ 0
+dist_freq/18-24/-- 0
+dist_freq/18-24/++ 0
+dist_freq/24-32/+- 0
+dist_freq/24-32/-+ 0
+dist_freq/24-32/-- 0
+dist_freq/24-32/++ 0
+dist_freq/32-42/+- 0
+dist_freq/32-42/-+ 0
+dist_freq/32-42/-- 0
+dist_freq/32-42/++ 0
+dist_freq/42-56/+- 0
+dist_freq/42-56/-+ 0
+dist_freq/42-56/-- 0
+dist_freq/42-56/++ 0
+dist_freq/56-75/+- 0
+dist_freq/56-75/-+ 0
+dist_freq/56-75/-- 0
+dist_freq/56-75/++ 0
+dist_freq/75-100/+- 1
+dist_freq/75-100/-+ 0
+dist_freq/75-100/-- 0
+dist_freq/75-100/++ 0
+dist_freq/100-133/+- 1
+dist_freq/100-133/-+ 0
+dist_freq/100-133/-- 0
+dist_freq/100-133/++ 0
+dist_freq/133-178/+- 2
+dist_freq/133-178/-+ 0
+dist_freq/133-178/-- 0
+dist_freq/133-178/++ 0
+dist_freq/178-237/+- 3
+dist_freq/178-237/-+ 0
+dist_freq/178-237/-- 0
+dist_freq/178-237/++ 0
+dist_freq/237-316/+- 50
+dist_freq/237-316/-+ 0
+dist_freq/237-316/-- 0
+dist_freq/237-316/++ 0
+dist_freq/316-422/+- 135
+dist_freq/316-422/-+ 0
+dist_freq/316-422/-- 0
+dist_freq/316-422/++ 0
+dist_freq/422-562/+- 101
+dist_freq/422-562/-+ 0
+dist_freq/422-562/-- 0
+dist_freq/422-562/++ 0
+dist_freq/562-750/+- 0
+dist_freq/562-750/-+ 0
+dist_freq/562-750/-- 0
+dist_freq/562-750/++ 0
+dist_freq/750-1000/+- 0
+dist_freq/750-1000/-+ 0
+dist_freq/750-1000/-- 0
+dist_freq/750-1000/++ 0
+dist_freq/1000-1334/+- 0
+dist_freq/1000-1334/-+ 0
+dist_freq/1000-1334/-- 0
+dist_freq/1000-1334/++ 0
+dist_freq/1334-1778/+- 1
+dist_freq/1334-1778/-+ 0
+dist_freq/1334-1778/-- 0
+dist_freq/1334-1778/++ 0
+dist_freq/1778-2371/+- 0
+dist_freq/1778-2371/-+ 0
+dist_freq/1778-2371/-- 0
+dist_freq/1778-2371/++ 0
+dist_freq/2371-3162/+- 0
+dist_freq/2371-3162/-+ 0
+dist_freq/2371-3162/-- 0
+dist_freq/2371-3162/++ 0
+dist_freq/3162-4217/+- 0
+dist_freq/3162-4217/-+ 0
+dist_freq/3162-4217/-- 0
+dist_freq/3162-4217/++ 0
+dist_freq/4217-5623/+- 0
+dist_freq/4217-5623/-+ 0
+dist_freq/4217-5623/-- 0
+dist_freq/4217-5623/++ 0
+dist_freq/5623-7499/+- 0
+dist_freq/5623-7499/-+ 0
+dist_freq/5623-7499/-- 0
+dist_freq/5623-7499/++ 0
+dist_freq/7499-10000/+- 2
+dist_freq/7499-10000/-+ 0
+dist_freq/7499-10000/-- 0
+dist_freq/7499-10000/++ 0
+dist_freq/10000-13335/+- 1
+dist_freq/10000-13335/-+ 1
+dist_freq/10000-13335/-- 0
+dist_freq/10000-13335/++ 0
+dist_freq/13335-17783/+- 0
+dist_freq/13335-17783/-+ 0
+dist_freq/13335-17783/-- 0
+dist_freq/13335-17783/++ 0
+dist_freq/17783-23714/+- 1
+dist_freq/17783-23714/-+ 0
+dist_freq/17783-23714/-- 0
+dist_freq/17783-23714/++ 0
+dist_freq/23714-31623/+- 0
+dist_freq/23714-31623/-+ 0
+dist_freq/23714-31623/-- 0
+dist_freq/23714-31623/++ 0
+dist_freq/31623-42170/+- 0
+dist_freq/31623-42170/-+ 0
+dist_freq/31623-42170/-- 0
+dist_freq/31623-42170/++ 0
+dist_freq/42170-56234/+- 0
+dist_freq/42170-56234/-+ 0
+dist_freq/42170-56234/-- 0
+dist_freq/42170-56234/++ 1
+dist_freq/56234-74989/+- 2
+dist_freq/56234-74989/-+ 0
+dist_freq/56234-74989/-- 1
+dist_freq/56234-74989/++ 0
+dist_freq/74989-100000/+- 0
+dist_freq/74989-100000/-+ 0
+dist_freq/74989-100000/-- 0
+dist_freq/74989-100000/++ 1
+dist_freq/100000-133352/+- 1
+dist_freq/100000-133352/-+ 0
+dist_freq/100000-133352/-- 1
+dist_freq/100000-133352/++ 1
+dist_freq/133352-177828/+- 0
+dist_freq/133352-177828/-+ 0
+dist_freq/133352-177828/-- 0
+dist_freq/133352-177828/++ 1
+dist_freq/177828-237137/+- 0
+dist_freq/177828-237137/-+ 0
+dist_freq/177828-237137/-- 0
+dist_freq/177828-237137/++ 0
+dist_freq/237137-316228/+- 0
+dist_freq/237137-316228/-+ 0
+dist_freq/237137-316228/-- 0
+dist_freq/237137-316228/++ 0
+dist_freq/316228-421697/+- 0
+dist_freq/316228-421697/-+ 0
+dist_freq/316228-421697/-- 0
+dist_freq/316228-421697/++ 0
+dist_freq/421697-562341/+- 0
+dist_freq/421697-562341/-+ 0
+dist_freq/421697-562341/-- 0
+dist_freq/421697-562341/++ 0
+dist_freq/562341-749894/+- 0
+dist_freq/562341-749894/-+ 0
+dist_freq/562341-749894/-- 0
+dist_freq/562341-749894/++ 0
+dist_freq/749894-1000000/+- 0
+dist_freq/749894-1000000/-+ 0
+dist_freq/749894-1000000/-- 0
+dist_freq/749894-1000000/++ 0
+dist_freq/1000000-1333521/+- 0
+dist_freq/1000000-1333521/-+ 0
+dist_freq/1000000-1333521/-- 0
+dist_freq/1000000-1333521/++ 0
+dist_freq/1333521-1778279/+- 0
+dist_freq/1333521-1778279/-+ 0
+dist_freq/1333521-1778279/-- 0
+dist_freq/1333521-1778279/++ 0
+dist_freq/1778279-2371374/+- 0
+dist_freq/1778279-2371374/-+ 0
+dist_freq/1778279-2371374/-- 0
+dist_freq/1778279-2371374/++ 0
+dist_freq/2371374-3162278/+- 0
+dist_freq/2371374-3162278/-+ 0
+dist_freq/2371374-3162278/-- 0
+dist_freq/2371374-3162278/++ 0
+dist_freq/3162278-4216965/+- 0
+dist_freq/3162278-4216965/-+ 0
+dist_freq/3162278-4216965/-- 0
+dist_freq/3162278-4216965/++ 0
+dist_freq/4216965-5623413/+- 0
+dist_freq/4216965-5623413/-+ 0
+dist_freq/4216965-5623413/-- 0
+dist_freq/4216965-5623413/++ 0
+dist_freq/5623413-7498942/+- 0
+dist_freq/5623413-7498942/-+ 0
+dist_freq/5623413-7498942/-- 0
+dist_freq/5623413-7498942/++ 0
+dist_freq/7498942-10000000/+- 0
+dist_freq/7498942-10000000/-+ 0
+dist_freq/7498942-10000000/-- 0
+dist_freq/7498942-10000000/++ 0
+dist_freq/10000000-13335214/+- 0
+dist_freq/10000000-13335214/-+ 0
+dist_freq/10000000-13335214/-- 0
+dist_freq/10000000-13335214/++ 0
+dist_freq/13335214-17782794/+- 0
+dist_freq/13335214-17782794/-+ 0
+dist_freq/13335214-17782794/-- 0
+dist_freq/13335214-17782794/++ 0
+dist_freq/17782794-23713737/+- 0
+dist_freq/17782794-23713737/-+ 0
+dist_freq/17782794-23713737/-- 0
+dist_freq/17782794-23713737/++ 0
+dist_freq/23713737-31622777/+- 0
+dist_freq/23713737-31622777/-+ 0
+dist_freq/23713737-31622777/-- 0
+dist_freq/23713737-31622777/++ 0
+dist_freq/31622777-42169650/+- 0
+dist_freq/31622777-42169650/-+ 0
+dist_freq/31622777-42169650/-- 0
+dist_freq/31622777-42169650/++ 0
+dist_freq/42169650-56234133/+- 0
+dist_freq/42169650-56234133/-+ 0
+dist_freq/42169650-56234133/-- 0
+dist_freq/42169650-56234133/++ 0
+dist_freq/56234133-74989421/+- 0
+dist_freq/56234133-74989421/-+ 0
+dist_freq/56234133-74989421/-- 0
+dist_freq/56234133-74989421/++ 0
+dist_freq/74989421-100000000/+- 0
+dist_freq/74989421-100000000/-+ 0
+dist_freq/74989421-100000000/-- 0
+dist_freq/74989421-100000000/++ 0
+dist_freq/100000000-133352143/+- 0
+dist_freq/100000000-133352143/-+ 0
+dist_freq/100000000-133352143/-- 0
+dist_freq/100000000-133352143/++ 0
+dist_freq/133352143-177827941/+- 0
+dist_freq/133352143-177827941/-+ 0
+dist_freq/133352143-177827941/-- 0
+dist_freq/133352143-177827941/++ 0
+dist_freq/177827941-237137371/+- 0
+dist_freq/177827941-237137371/-+ 0
+dist_freq/177827941-237137371/-- 0
+dist_freq/177827941-237137371/++ 0
+dist_freq/237137371-316227766/+- 0
+dist_freq/237137371-316227766/-+ 0
+dist_freq/237137371-316227766/-- 0
+dist_freq/237137371-316227766/++ 0
+dist_freq/316227766-421696503/+- 0
+dist_freq/316227766-421696503/-+ 0
+dist_freq/316227766-421696503/-- 0
+dist_freq/316227766-421696503/++ 0
+dist_freq/421696503-562341325/+- 0
+dist_freq/421696503-562341325/-+ 0
+dist_freq/421696503-562341325/-- 0
+dist_freq/421696503-562341325/++ 0
+dist_freq/562341325-749894209/+- 0
+dist_freq/562341325-749894209/-+ 0
+dist_freq/562341325-749894209/-- 0
+dist_freq/562341325-749894209/++ 0
+dist_freq/749894209-1000000000/+- 0
+dist_freq/749894209-1000000000/-+ 0
+dist_freq/749894209-1000000000/-- 0
+dist_freq/749894209-1000000000/++ 0
+dist_freq/1000000000+/+- 0
+dist_freq/1000000000+/-+ 0
+dist_freq/1000000000+/-- 0
+dist_freq/1000000000+/++ 0
diff -r 5412142130ad -r 55a53b5e308d test-data/output_parsed_pairs_bam.pairs
--- a/test-data/output_parsed_pairs_bam.pairs Tue Apr 16 12:51:21 2024 +0000
+++ b/test-data/output_parsed_pairs_bam.pairs Tue Apr 30 12:02:29 2024 +0000
@@ -37,14 +37,14 @@
#samheader: @SQ SN:chrXV LN:1091291
#samheader: @SQ SN:chrXVI LN:948066
#samheader: @PG ID:bwa PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane1.00.1.fastq.gz MATalpha_R1.lane1.00.2.fastq.gz
-#samheader: @PG ID:pairtools_parse-1.2 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpvtvmbj0m/files/5/c/9/dataset_5c90f563-7928-4455-84af-6129feb92ffc.dat -c /tmp/tmpvtvmbj0m/files/4/9/a/dataset_49af402e-cee9-4737-bf5e-15a04f62c1d8.dat -o /tmp/tmpvtvmbj0m/job_working_directory/000/7/outputs/dataset_461ac430-f019-4ae5-9b37-796f7c45fa35.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:bwa VN:1.0.3
+#samheader: @PG ID:pairtools_parse-1.2 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpchj83off/files/b/e/9/dataset_be9fce34-5096-400c-9efd-1f189da7f40a.dat -c /tmp/tmpchj83off/files/1/4/3/dataset_143017f3-646f-4cc1-b3d6-fc5d73287981.dat -o /tmp/tmpchj83off/job_working_directory/000/7/outputs/dataset_3348ea1d-0460-452f-aafb-dbde21a7b812.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:bwa VN:1.1.0
#samheader: @PG ID:bwa-2CCE5976 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane1.01.1.fastq.gz MATalpha_R1.lane1.01.2.fastq.gz
-#samheader: @PG ID:pairtools_parse-2.2 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpvtvmbj0m/files/5/c/9/dataset_5c90f563-7928-4455-84af-6129feb92ffc.dat -c /tmp/tmpvtvmbj0m/files/4/9/a/dataset_49af402e-cee9-4737-bf5e-15a04f62c1d8.dat -o /tmp/tmpvtvmbj0m/job_working_directory/000/7/outputs/dataset_461ac430-f019-4ae5-9b37-796f7c45fa35.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:bwa-2CCE5976 VN:1.0.3
+#samheader: @PG ID:pairtools_parse-2.2 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpchj83off/files/b/e/9/dataset_be9fce34-5096-400c-9efd-1f189da7f40a.dat -c /tmp/tmpchj83off/files/1/4/3/dataset_143017f3-646f-4cc1-b3d6-fc5d73287981.dat -o /tmp/tmpchj83off/job_working_directory/000/7/outputs/dataset_3348ea1d-0460-452f-aafb-dbde21a7b812.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:bwa-2CCE5976 VN:1.1.0
#samheader: @PG ID:bwa-3CAFD9D9 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane2.00.1.fastq.gz MATalpha_R1.lane2.00.2.fastq.gz
-#samheader: @PG ID:pairtools_parse-3.2 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpvtvmbj0m/files/5/c/9/dataset_5c90f563-7928-4455-84af-6129feb92ffc.dat -c /tmp/tmpvtvmbj0m/files/4/9/a/dataset_49af402e-cee9-4737-bf5e-15a04f62c1d8.dat -o /tmp/tmpvtvmbj0m/job_working_directory/000/7/outputs/dataset_461ac430-f019-4ae5-9b37-796f7c45fa35.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:bwa-3CAFD9D9 VN:1.0.3
+#samheader: @PG ID:pairtools_parse-3.2 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpchj83off/files/b/e/9/dataset_be9fce34-5096-400c-9efd-1f189da7f40a.dat -c /tmp/tmpchj83off/files/1/4/3/dataset_143017f3-646f-4cc1-b3d6-fc5d73287981.dat -o /tmp/tmpchj83off/job_working_directory/000/7/outputs/dataset_3348ea1d-0460-452f-aafb-dbde21a7b812.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:bwa-3CAFD9D9 VN:1.1.0
#samheader: @PG ID:bwa-4548A671 PN:bwa VN:0.7.15-r1140 CL:bwa mem -t 8 -v 3 -SP sacCer3.fa.gz MATalpha_R1.lane2.01.1.fastq.gz MATalpha_R1.lane2.01.2.fastq.gz
#samheader: @PG ID:samtools PN:samtools PP:bwa-4548A671 VN:1.19.2 CL:samtools view -s 0.1 -b -@ 4 -o subset.bam test.bam
-#samheader: @PG ID:pairtools_parse-4.3 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpvtvmbj0m/files/5/c/9/dataset_5c90f563-7928-4455-84af-6129feb92ffc.dat -c /tmp/tmpvtvmbj0m/files/4/9/a/dataset_49af402e-cee9-4737-bf5e-15a04f62c1d8.dat -o /tmp/tmpvtvmbj0m/job_working_directory/000/7/outputs/dataset_461ac430-f019-4ae5-9b37-796f7c45fa35.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:samtools VN:1.0.3
+#samheader: @PG ID:pairtools_parse-4.3 PN:pairtools_parse CL:/usr/local/bin/pairtools parse /tmp/tmpchj83off/files/b/e/9/dataset_be9fce34-5096-400c-9efd-1f189da7f40a.dat -c /tmp/tmpchj83off/files/1/4/3/dataset_143017f3-646f-4cc1-b3d6-fc5d73287981.dat -o /tmp/tmpchj83off/job_working_directory/000/7/outputs/dataset_3348ea1d-0460-452f-aafb-dbde21a7b812.dat --min-mapq 1 --max-molecule-size 750 --walks-policy mask --max-inter-align-gap 20 --nproc-in 1 --nproc-out 1 PP:samtools VN:1.1.0
#columns: readID chrom1 pos1 chrom2 pos2 strand1 strand2 pair_type sam1 sam2
HWI-ST560:29:B0A7LABXX:2:1101:5084:4188 ! 0 ! 0 - - NM HWI-ST560:29:B0A7LABXX:2:1101:5084:4188133chrI24200*=24200GGAACCGTAAAGGTTTATCGCGGTAGTAGTTTTTCACACGATTCGATAAA?<@DFDFD=FBHHCBHGGIJIIG:C@DGD??DDH?FHGHIJJDGCGEGG;AS:i:0XS:i:0Yt:Z:NM HWI-ST560:29:B0A7LABXX:2:1101:5084:418873chrI242009S41M=24200TTGATAGACTTCGTATGTGGAGTACTGTTTTATGGCGCTTATGTGTATTC11144222222322<