cpt_intersect_adj: intersect_and_adjacent.py comparison

comparison intersect_and_adjacent.py @ 4:3e3b5ba626b9 draft

planemo upload commit c3db49ef44729e27fa7ca5ade2ea27d7074072ca

author	cpt
date	Mon, 12 Aug 2024 04:33:20 +0000
parents	10000414e916
children	00aab5199327

comparison

Legend: equal, deleted, inserted, replaced

-:10000414e916
+:3e3b5ba626b9
 a_pos = []
 b_neg = []
 b_pos = []
 tree_a = []
 tree_b = []
-if stranding == True:
 for feat in rec_a_i.features:
 if feat.type == "remark" or feat.type == "annotation":
 continue
+interval = Interval(
+int(feat.location.start) - int(window),
+int(feat.location.end) + int(window),
+feat.id,
+)
+if stranding:
 if feat.strand > 0:
-a_pos.append(
+a_pos.append(interval)
-Interval(
+else:
-int(feat.location.start) - int(window),
+a_neg.append(interval)
-int(feat.location.end) + int(window),
+else:
-feat.id,
+tree_a.append(interval)
-)
-)
+for feat in rec_b_i.features:
-else:
+if feat.type == "remark" or feat.type == "annotation":
-a_neg.append(
+continue
-Interval(
+interval = Interval(
 int(feat.location.start) - int(window),
 int(feat.location.end) + int(window),
 feat.id,
 )
-)
+if stranding:
-for feat in rec_b_i.features:
-if feat.type == "remark" or feat.type == "annotation":
-continue
 if feat.strand > 0:
-b_pos.append(
+b_pos.append(interval)
-Interval(
+else:
-int(feat.location.start) - int(window),
+b_neg.append(interval)
-int(feat.location.end) + int(window),
+else:
-feat.id,
+tree_b.append(interval)
-)
-)
-else:
-b_neg.append(
-Interval(
-int(feat.location.start) - int(window),
-int(feat.location.end) + int(window),
-feat.id,
-)
-)
-else:
-for feat in rec_a_i.features:
-if feat.type == "remark" or feat.type == "annotation":
-continue
-tree_a.append(
-Interval(
-int(feat.location.start) - int(window),
-int(feat.location.end) + int(window),
-feat.id,
-)
-)
-for feat in rec_b_i.features:
-if feat.type == "remark" or feat.type == "annotation":
-continue
-tree_b.append(
-Interval(
-int(feat.location.start) - int(window),
-int(feat.location.end) + int(window),
-feat.id,
-)
-)
 if stranding:
-# builds interval tree from Interval objects of form (start, end, id) for each feature
-# tree_a = IntervalTree(list(treeFeatures_noRem(rec_a_i.features, window)))
-# tree_b = IntervalTree(list(treeFeatures_noRem(rec_b_i.features, window)))
-# else:
 tree_a_pos = IntervalTree(a_pos)
 tree_a_neg = IntervalTree(a_neg)
 tree_b_pos = IntervalTree(b_pos)
 tree_b_neg = IntervalTree(b_neg)
 else:
 rec_a_hits_in_b = []
 rec_b_hits_in_a = []
 for feature in rec_a_i.features:
-# Save each feature in rec_a that overlaps a feature in rec_b
-# hits = tree_b.find_range((int(feature.location.start), int(feature.location.end)))
 if feature.type == "remark" or feature.type == "annotation":
 continue
-if stranding == False:
+if not stranding:
 hits = tree_b[
 int(feature.location.start) : int(feature.location.end)
 ]
-# feature id is saved in interval result.data, use map to get full feature
 for hit in hits:
 rec_a_hits_in_b.append(rec_b_map[hit.data])
 else:
 if feature.strand > 0:
-hits_pos = tree_b_pos[
+hits = tree_b_pos[
 int(feature.location.start) : int(feature.location.end)
 ]
-for hit in hits_pos:
+else:
-rec_a_hits_in_b.append(rec_b_map[hit.data])
+hits = tree_b_neg[
-else:
+int(feature.location.start) : int(feature.location.end)
-hits_neg = tree_b_neg[
+]
-int(feature.location.start) : int(feature.location.end)
+for hit in hits:
-]
+rec_a_hits_in_b.append(rec_b_map[hit.data])
-for hit in hits_neg:
-rec_a_hits_in_b.append(rec_b_map[hit.data])
 for feature in rec_b_i.features:
 if feature.type == "remark" or feature.type == "annotation":
 continue
-if stranding == False:
+if not stranding:
 hits = tree_a[
 int(feature.location.start) : int(feature.location.end)
 ]
-# feature id is saved in interval result.data, use map to get full feature
 for hit in hits:
 rec_b_hits_in_a.append(rec_a_map[hit.data])
 else:
 if feature.strand > 0:
-hits_pos = tree_a_pos[
+hits = tree_a_pos[
 int(feature.location.start) : int(feature.location.end)
 ]
-for hit in hits_pos:
+else:
-rec_b_hits_in_a.append(rec_a_map[hit.data])
+hits = tree_a_neg[
-else:
+int(feature.location.start) : int(feature.location.end)
-hits_neg = tree_a_neg[
+]
-int(feature.location.start) : int(feature.location.end)
+for hit in hits:
-]
+rec_b_hits_in_a.append(rec_a_map[hit.data])
-for hit in hits_neg:
-rec_b_hits_in_a.append(rec_a_map[hit.data])
 # Remove duplicate features using sets
 rec_a_out.append(
 SeqRecord(
 rec_a[iterate].seq,
 type=int,
 default=50,
 help="Allows features this far away to still be considered 'adjacent'",
 )
 parser.add_argument(
-"stranding",
+"-stranding",
-nargs="?",
+action="store_true",
-default="",
+help="Only allow adjacency for same-strand features",
-help="Only allow adjacency for same-strand features if set to '-stranding'",
 )
 parser.add_argument("--oa", type=str, default="a_hits_near_b.gff")
 parser.add_argument("--ob", type=str, default="b_hits_near_a.gff")
 args = parser.parse_args()
-stranding = args.stranding == "-stranding"
 b, a = intersect(args.a, args.b, args.window, args.stranding)
 with open(args.oa, "w") as handle:
 for rec in a:
 gffWrite([rec], handle)

Mercurial > repos > cpt > cpt_intersect_adj

comparison intersect_and_adjacent.py @ 4:3e3b5ba626b9 draft