annotate mutational_patterns.R @ 19:69f09dff98f9 draft

"planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
author artbio
date Sun, 17 Oct 2021 23:05:01 +0000
parents 8d9f31389f33
children a2cb7dc9250a
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
1 # load packages that are provided in the conda env
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
# Install a script-wide error handler: R's own error printing is switched off
# and, on any error, the message is written to stderr before the session quits
# with exit status 1 (workspace not saved, exit hooks not run).
# TRUE/FALSE are spelled out because the T/F shorthands can be reassigned.
options(
  show.error.messages = FALSE,
  error = function() {
    cat(geterrmessage(), file = stderr())
    q("no", 1, FALSE)
  }
)
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
# Request the en_US.UTF-8 locale for the LC_MESSAGES category; the value
# returned by Sys.setlocale() is kept in `loc`.
loc <- Sys.setlocale(category = "LC_MESSAGES", locale = "en_US.UTF-8")
# NOTE(review): presumably meant to surface a warning raised by the locale
# change above - confirm it is still needed.
warnings()
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
9 library(optparse)
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
10 library(rjson)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
11 library(grid)
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
12 library(gridExtra)
4
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
13 library(scales)
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
14 library(RColorBrewer)
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
15
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
16 # Arguments
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
# Command-line interface of the script. The two helpers exist only inside
# local() so that no extra names are left in the global environment.
option_list <- local({
  # Character-valued option; the default is NA unless overridden.
  chr_opt <- function(flags, help, default = NA) {
    make_option(flags, default = default, type = "character", help = help)
  }
  # Integer-valued option with a default of 2.
  int_opt <- function(flags, help) {
    make_option(flags, default = 2, type = "integer", help = help)
  }

  list(
    # ---- inputs ----
    chr_opt(
      "--inputs",
      "json formatted dictionary of datasets and their paths"
    ),
    chr_opt(
      "--genome",
      "genome name in the BSgenome bioconductor package"
    ),
    chr_opt(
      "--levels",
      "path to the tab separated file describing the levels in function of datasets"
    ),
    chr_opt(
      "--cosmic_version",
      "Version of the Cosmic Signature set to be used to express mutational profiles"
    ),
    chr_opt(
      "--own_signatures",
      "Path to the user-defined signature matrix"
    ),
    # ---- numeric parameters ----
    int_opt(
      "--signum",
      "selects the N most significant signatures in samples to express mutational profiles"
    ),
    int_opt(
      "--nrun",
      "Number of runs to fit signatures"
    ),
    int_opt(
      "--rank",
      "number of ranks to display for parameter optimization"
    ),
    int_opt(
      "--newsignum",
      "Number of new signatures to be captured"
    ),
    # ---- outputs ----
    chr_opt("--output_spectrum", "path to output dataset"),
    chr_opt("--output_denovo", "path to output dataset"),
    chr_opt("--sigmatrix", "path to signature matrix"),
    chr_opt("--output_sigpattern", "path to output dataset"),
    chr_opt(
      "--sig_contrib_matrix",
      "path to signature contribution matrix"
    ),
    # These two options default to NULL rather than NA.
    chr_opt(
      c("-r", "--rdata"),
      "Path to RData output file",
      default = NULL
    ),
    chr_opt(
      c("-t", "--tooldir"),
      "Path to tool directory, where tool data are stored",
      default = NULL
    )
  )
})
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
115
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
# Parse the trailing command-line arguments against option_list; the parsed
# values are then available as opt$<option name>.
opt <- parse_args(
  object = OptionParser(option_list = option_list),
  args = commandArgs(trailingOnly = TRUE)
)
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
118
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
119 ################ Manage input data ####################
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
# Name of the reference genome package, as given on the command line.
ref_genome <- opt$genome

# Decode the --inputs JSON string with an rjson parser object.
json_dict <- opt$inputs
parser <- newJSONParser()
parser$addData(json_dict)
fileslist <- parser$getObject()

# The names of the decoded object are used as VCF paths and its values as
# the matching element identifiers.
vcf_paths <- names(fileslist)
element_identifiers <- unlist(fileslist, use.names = FALSE)

# One row per input: element identifier (as character) and path.
vcf_table <- data.frame(
  element_identifier = as.character(element_identifiers),
  path = vcf_paths
)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
128
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
129 library(MutationalPatterns)
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
130 library(ref_genome, character.only = TRUE)
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
131 library(ggplot2)
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
132
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
# Read all VCF files into a GRangesList, using the element identifiers as
# sample names and ref_genome as the genome:
vcfs <- read_vcfs_as_granges(
  vcf_files = vcf_paths,
  sample_names = element_identifiers,
  genome = ref_genome
)
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
# Associate a level with every input dataset.
# When --levels is supplied it is read as a headerless tab-separated file
# whose two columns are named element_identifier and level; otherwise every
# dataset receives the placeholder level "nolabels".
if (!is.na(opt$levels[1])) {
  levels_table <- read.delim(
    opt$levels,
    header = FALSE,
    col.names = c("element_identifier", "level")
  )
} else {
  levels_table <- data.frame(
    element_identifier = vcf_table$element_identifier,
    level = rep("nolabels", nrow(vcf_table))
  )
}

# join() is called through the plyr namespace instead of attaching plyr with
# library() and detaching it afterwards, so the search path is never modified
# and no plyr function can mask another package's function.
metadata_table <- plyr::join(
  vcf_table,
  levels_table,
  by = "element_identifier"
)
# Levels as a plain vector, in the row order of metadata_table.
tissue <- as.vector(metadata_table$level)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
146
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
147 ##### This is done for any section ######
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
148 mut_mat <- mut_matrix(vcf_list = vcfs, ref_genome = ref_genome)
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
149 qual_col_pals <- brewer.pal.info[brewer.pal.info$category == "qual", ]
0
924c527fb379 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e1f3ca871f13569401f41a5af9d0e281bf372540"
artbio
parents:
diff changeset
150
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
151 ###### Section 1 Mutation characteristics and spectrums #############
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
152 if (!is.na(opt$output_spectrum)[1]) {
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
153 pdf(opt$output_spectrum, paper = "special", width = 11.69, height = 11.69)
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
154 type_occurrences <- mut_type_occurrences(vcfs, ref_genome)
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
155
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
156 # mutation spectrum, total or by sample
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
157
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
158 if (length(levels(factor(levels_table$level))) == 1) {
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
159 p1 <- plot_spectrum(type_occurrences, CT = TRUE, legend = TRUE)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
160 plot(p1)
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
161 } else {
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
162 p2 <- plot_spectrum(type_occurrences, by = tissue, CT = TRUE) # by levels
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
163 p3 <- plot_spectrum(type_occurrences, CT = TRUE, legend = TRUE) # total
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
164 grid.arrange(p2, p3, ncol = 2, widths = c(4, 2.3), heights = c(4, 1))
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
165 }
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
166 plot_96_profile(mut_mat, condensed = TRUE)
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
167 dev.off()
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
168 }
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
169
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
170 ###### Section 2: De novo mutational signature extraction using NMF #######
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
171 # opt$rank cannot be higher than the number of samples and
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
172 # likewise, opt$signum cannot be higher than the number of samples
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
173 if (!is.na(opt$output_denovo)[1]) {
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
174
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
175 if (opt$rank > length(element_identifiers)) {
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
176 opt$rank <- length(element_identifiers)
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
177 }
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
178 if (opt$signum > length(element_identifiers)) {
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
179 opt$signum <- length(element_identifiers)
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
180 }
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
181 pseudo_mut_mat <- mut_mat + 0.0001 # First add a small pseudocount to the mutation count matrix
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
182 # Use the NMF package to generate an estimate rank plot
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
183 library("NMF")
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
184 estimate <- nmf(pseudo_mut_mat, rank = 1:opt$rank, method = "brunet", nrun = opt$nrun, seed = 123456)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
185 # And plot it
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
186 pdf(opt$output_denovo, paper = "special", width = 11.69, height = 11.69)
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
187 p4 <- plot(estimate)
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
188 grid.arrange(p4)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
189 # Extract opt$newsignum mutational signatures from the mutation count matrix with extract_signatures
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
190 # (For larger datasets it is wise to perform more iterations by changing the nrun parameter
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
191 # to achieve stability and avoid local minima)
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
192 nmf_res <- extract_signatures(pseudo_mut_mat, rank = opt$newsignum, nrun = opt$nrun)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
193 # Assign signature names
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
194 colnames(nmf_res$signatures) <- paste0("NewSig_", 1:opt$newsignum)
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
195 rownames(nmf_res$contribution) <- paste0("NewSig_", 1:opt$newsignum)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
196 # Plot the 96-profile of the signatures:
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
197 p5 <- plot_96_profile(nmf_res$signatures, condensed = TRUE)
15
8182d1625433 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 6ca5597637439c87b61af2dbd6c38089b29eca37"
artbio
parents: 14
diff changeset
198 new_sig_matrix <- reshape2::dcast(p5$data, substitution + context ~ sample, value.var = "freq")
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
199 new_sig_matrix <- format(new_sig_matrix, scientific = TRUE)
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
200 write.table(new_sig_matrix, file = opt$sigmatrix, quote = FALSE, row.names = FALSE, sep = "\t")
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
201 grid.arrange(p5)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
202 # Visualize the contribution of the signatures in a barplot
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
203 pc1 <- plot_contribution(nmf_res$contribution, nmf_res$signatures, mode = "relative", coord_flip = TRUE)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
204 # Visualize the contribution of the signatures in absolute number of mutations
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
205 pc2 <- plot_contribution(nmf_res$contribution, nmf_res$signatures, mode = "absolute", coord_flip = TRUE)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
206 # Combine the two plots:
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
207 grid.arrange(pc1, pc2)
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
208
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
209 # The relative contribution of each signature for each sample can also be plotted as a heatmap with
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
210 # plot_contribution_heatmap, which might be easier to interpret and compare than stacked barplots.
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
211 # The samples can be hierarchically clustered based on their Euclidean distance. The signatures
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
212 # can be plotted in a user-specified order.
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
213 # Plot signature contribution as a heatmap with sample clustering dendrogram and a specified signature order:
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
214 pch1 <- plot_contribution_heatmap(nmf_res$contribution,
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
215 sig_order = paste0("NewSig_", 1:opt$newsignum))
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
216 # Plot signature contribution as a heatmap without sample clustering:
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
217 pch2 <- plot_contribution_heatmap(nmf_res$contribution, cluster_samples = FALSE)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
218 # Combine the plots into one figure:
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
219 grid.arrange(pch1, pch2, ncol = 2, widths = c(2, 1.6))
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
220
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
221 # Compare the reconstructed mutational profile with the original mutational profile:
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
222 plot_compare_profiles(pseudo_mut_mat[, 1],
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
223 nmf_res$reconstructed[, 1],
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
224 profile_names = c("Original", "Reconstructed"),
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
225 condensed = TRUE)
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
226 dev.off()
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
227 }
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
228
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
229 ##### Section 3: Find optimal contribution of known signatures: COSMIC or OWN mutational signatures ####
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
230
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
231 if (!is.na(opt$output_sigpattern)[1]) {
17
8c6ee1c2248f "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e5d498dfc5a6a9aaea3d09037dea5d15c2d85dd2"
artbio
parents: 16
diff changeset
232 # Prepare cosmic signatures
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
233 if (!is.na(opt$cosmic_version)) {
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
234 cosmic_urls <- read.delim(paste0(opt$tooldir, "cosmic_urls.tsv"), sep = "\t", header = TRUE)
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
235 cosmic_sbs_file <- cosmic_urls$url[cosmic_urls$genome == opt$genome &
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
236 cosmic_urls$cosmic_version == opt$cosmic_version]
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
237 sbs_signatures <- read.table(paste0(opt$tooldir, cosmic_sbs_file),
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
238 sep = "\t", header = TRUE)
19
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
239 tag <- paste(gsub("BSgenome.Hsapiens.UCSC.", "", opt$genome, fixed = TRUE), "COSMIC", opt$cosmic_version, sep = " ")
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
240 }
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
241 # Prepare user-defined signatures
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
242 if (!is.na(opt$own_signatures)) {
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
243 sbs_signatures <- read.table(opt$own_signatures, sep = "\t", header = TRUE)
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
244 tag <- paste(opt$genome, "User-Defined Signatures", sep = " ")
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
245 }
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
246 row.names(sbs_signatures) <- sbs_signatures$Type
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
247 # drop column Type of sbs_signatures
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
248 sbs_signatures <- subset(sbs_signatures, select = -c(Type))
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
249 # reorder substitutions of sbs_signatures to match mut_mat
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
250 sbs_signatures <- sbs_signatures[match(row.names(mut_mat), row.names(sbs_signatures)), ]
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
251 colnames(sbs_signatures) <- gsub("SBS", "", colnames(sbs_signatures))
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
252 # arrange signature colors
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
253 signature_colors <- c("#3f4100", "#6f53ff", "#6dc400", "#9d1fd7", "#009c06", "#001fae", "#8adb4d", "#5a67ff", "#d8c938", "#024bc3", "#d2ab00",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
254 "#e36eff", "#00ac44", "#d000b0", "#01b071", "#ff64e2", "#006b21", "#b70090", "#60dc9f", "#5f0083", "#c0ce67", "#002981",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
255 "#ffb53e", "#44005f", "#b59600", "#7d95ff", "#f47600", "#017bc4", "#ff2722", "#02cfec", "#ff233f", "#01b7b4", "#fd005c",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
256 "#019560", "#ff57a9", "#88d896", "#b80067", "#abd27f", "#dc8eff", "#667b00", "#fba3ff", "#093f00", "#ff6494", "#009791",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
257 "#c93200", "#4ac8ff", "#a60005", "#8fd4b6", "#ce0036", "#00634d", "#ff6035", "#2d1956", "#f0be6d", "#6a0058", "#957a00",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
258 "#e4b4ff", "#4a5500", "#abc7fe", "#c95900", "#003d27", "#b10043", "#d5c68e", "#3e163e", "#b36b00", "#debaeb", "#605400",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
259 "#7a0044", "#ffa06d", "#4c0d21", "#ff9cb5", "#3f1d02", "#ff958f", "#634a66", "#775500", "#6e0028", "#717653",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
260 "#6c1000", "#693600")
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
261 signature_colors <- signature_colors[seq_len(ncol(sbs_signatures))]
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
262 names(signature_colors) <- colnames(sbs_signatures)
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
263 # To drop signature_colors <- signature_colors[colnames(sbs_signatures)]
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
264 # This is IMPORTANT since in Galaxy we do not use the embedded function get_known_signatures()
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
265 sbs_signatures <- as.matrix(sbs_signatures)
17
8c6ee1c2248f "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e5d498dfc5a6a9aaea3d09037dea5d15c2d85dd2"
artbio
parents: 16
diff changeset
266
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
267
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
268 # Plot mutational profiles of the COSMIC signatures
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
269
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
270 pdf(opt$output_sigpattern, paper = "special", width = 11.69, height = 11.69)
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
271 for (i in head(seq(1, ncol(sbs_signatures), by = 20), -1)) { # every page of 20 signatures except the last page
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
272 p6 <- plot_96_profile(sbs_signatures[, i:(i + 19)], condensed = TRUE, ymax = 0.3)
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
273 grid.arrange(p6, top = textGrob(paste0(tag, " profiles (", trunc((i + 1) / 20) + 1, " of ",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
274 ceiling(ncol(sbs_signatures) / 20), " pages)"), # ceiling() gives the true page count, also for multiples of 20
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
275 gp = gpar(fontsize = 12, font = 3)))
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
276 }
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
277 p6 <- plot_96_profile(sbs_signatures[, (((ncol(sbs_signatures) - 1) %/% 20) * 20 + 1):ncol(sbs_signatures), drop = FALSE], # last page starts right after the last page drawn by the loop; drop = FALSE keeps a matrix for a single column
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
278 condensed = TRUE, ymax = 0.3)
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
279 grid.arrange(p6, top = textGrob(paste0(tag, " profiles (", ceiling(ncol(sbs_signatures) / 20), " of ",
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
280 ceiling(ncol(sbs_signatures) / 20), " pages)"),
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
281 gp = gpar(fontsize = 12, font = 3)))
19
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
282
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
283
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
284 # Find optimal contribution of COSMIC signatures to reconstruct 96 mutational profiles
17
8c6ee1c2248f "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e5d498dfc5a6a9aaea3d09037dea5d15c2d85dd2"
artbio
parents: 16
diff changeset
285 pseudo_mut_mat <- mut_mat + 0.0001 # First add a small pseudocount to the mutation count matrix
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
286 fit_res <- fit_to_signatures(pseudo_mut_mat, sbs_signatures)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
287
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
288 # Plot contribution barplots
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
289 pc3 <- plot_contribution(fit_res$contribution, sbs_signatures, coord_flip = TRUE, mode = "absolute") # absolute mode; TRUE spelled out because T can be reassigned
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
290 pc4 <- plot_contribution(fit_res$contribution, sbs_signatures, coord_flip = TRUE, mode = "relative") # relative mode of the same fit
15
8182d1625433 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 6ca5597637439c87b61af2dbd6c38089b29eca37"
artbio
parents: 14
diff changeset
291 if (is.na(opt$levels)[1]) { # if there are NO levels to display in graphs
4
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
292 pc3_data <- pc3$data
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
293 pc3 <- ggplot(pc3_data, aes(x = Sample, y = Contribution, fill = as.factor(Signature))) +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
294 geom_bar(stat = "identity", position = "stack") +
4
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
295 coord_flip() +
19
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
296 scale_fill_manual(name = tag, values = signature_colors[]) +
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
297 labs(x = "Samples", y = "Absolute contribution") + theme_bw() +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
298 theme(panel.grid.minor.x = element_blank(),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
299 panel.grid.major.x = element_blank(),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
300 legend.position = "right",
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
301 text = element_text(size = 8),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
302 axis.text.x = element_text(angle = 90, hjust = 1))
4
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
303 pc4_data <- pc4$data
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
304 pc4 <- ggplot(pc4_data, aes(x = Sample, y = Contribution, fill = as.factor(Signature))) +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
305 geom_bar(stat = "identity", position = "fill") +
4
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
306 coord_flip() +
19
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
307 scale_fill_manual(name = tag, values = signature_colors) +
4
7ba08c826888 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit e2d6ed12516e1bd24071962a0dfe0220cc348f3c"
artbio
parents: 3
diff changeset
308 scale_y_continuous(labels = scales::percent_format(accuracy = 1)) +
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
309 labs(x = "Samples", y = "Relative contribution") + theme_bw() +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
310 theme(panel.grid.minor.x = element_blank(), panel.grid.major.x = element_blank(), legend.position = "right",
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
311 text = element_text(size = 8),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
312 axis.text.x = element_text(angle = 90, hjust = 1))
15
8182d1625433 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 6ca5597637439c87b61af2dbd6c38089b29eca37"
artbio
parents: 14
diff changeset
313 }
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
314 #####
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
315 # ggplot2 alternative
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
316 if (!is.na(opt$levels)[1]) { # if there are levels to display in graphs
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
317 pc3_data <- pc3$data
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
318 pc3_data <- merge(pc3_data, metadata_table[, c(1, 3)], by.x = "Sample", by.y = "element_identifier")
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
319 pc3 <- ggplot(pc3_data, aes(x = Sample, y = Contribution, fill = as.factor(Signature))) +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
320 geom_bar(stat = "identity", position = "stack") +
19
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
321 scale_fill_manual(name = tag, values = signature_colors) +
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
322 labs(x = "Samples", y = "Absolute contribution") + theme_bw() +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
323 theme(panel.grid.minor.x = element_blank(),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
324 panel.grid.major.x = element_blank(),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
325 legend.position = "right",
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
326 text = element_text(size = 8),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
327 axis.text.x = element_text(angle = 90, hjust = 1)) +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
328 facet_grid(~level, scales = "free_x", space = "free")
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
329 pc4_data <- pc4$data
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
330 pc4_data <- merge(pc4_data, metadata_table[, c(1, 3)], by.x = "Sample", by.y = "element_identifier")
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
331 pc4 <- ggplot(pc4_data, aes(x = Sample, y = Contribution, fill = as.factor(Signature))) +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
332 geom_bar(stat = "identity", position = "fill") +
19
69f09dff98f9 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit db5fd077ec6c840b7b6eda331820999f85fd7c26"
artbio
parents: 18
diff changeset
333 scale_fill_manual(name = tag, values = signature_colors) +
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
334 scale_y_continuous(labels = scales::percent_format(accuracy = 1)) +
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
335 labs(x = "Samples", y = "Relative contribution") + theme_bw() +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
336 theme(panel.grid.minor.x = element_blank(),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
337 panel.grid.major.x = element_blank(),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
338 legend.position = "right",
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
339 text = element_text(size = 8),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
340 axis.text.x = element_text(angle = 90, hjust = 1)) +
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
341 facet_grid(~level, scales = "free_x", space = "free")
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
342 }
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
343 # Combine the two plots:
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
344 grid.arrange(pc3, pc4,
18
8d9f31389f33 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 1cb9c8fd0c74943a8e6de4c63ac5e4a84ef27430"
artbio
parents: 17
diff changeset
345 top = textGrob("Absolute and Relative Contributions of elementary signatures to mutational profiles",
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
346 gp = gpar(fontsize = 12, font = 3)))
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
347
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
348 #### pie charts of COSMIC signatures contributions in samples ###
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
349 library(reshape2)
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
350 library(dplyr)
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
351 if (length(levels(factor(levels_table$level))) < 2) { # fewer than two levels: rank signatures over all samples together
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
352 fit_res_contrib <- as.data.frame(fit_res$contribution)
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
353 worklist <- cbind(signature = rownames(fit_res$contribution),
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
354 level = rep("nolabels", length(fit_res_contrib[, 1])),
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
355 fit_res_contrib,
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
356 sum = rowSums(fit_res_contrib))
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
357 worklist <- worklist[order(worklist[, "sum"], decreasing = TRUE), ]
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
358 worklist <- head(worklist, opt$signum) # head() clamps to the available rows, so no NA rows when signum exceeds the number of signatures
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
359 worklist <- worklist[, -length(worklist[1, ])] # remove the helper "sum" column (last column)
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
360 worklist <- melt(worklist)
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
361 worklist <- worklist[, c(1, 3, 4, 2)] # reorder the melted columns so "level" comes last
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
362 } else {
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
363 worklist <- list()
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
364 for (i in levels(factor(levels_table$level))) { # rank signatures separately within each level
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
365 worklist[[i]] <- fit_res$contribution[, levels_table$element_identifier[levels_table$level == i], drop = FALSE] # drop = FALSE keeps a matrix when a level has a single sample
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
366 sum <- rowSums(as.data.frame(worklist[[i]]))
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
367 worklist[[i]] <- cbind(worklist[[i]], sum) # the appended column is named "sum" after the variable
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
368 worklist[[i]] <- worklist[[i]][order(worklist[[i]][, "sum"], decreasing = TRUE), , drop = FALSE]
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
369 worklist[[i]] <- head(worklist[[i]], opt$signum) # clamps to the available rows and keeps the matrix shape
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
370 worklist[[i]] <- worklist[[i]][, -ncol(worklist[[i]]), drop = FALSE] # remove the helper "sum" column (last column)
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
371 }
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
372 worklist <- as.data.frame(melt(worklist))
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
373 worklist[, 2] <- paste0(worklist[, 4], " - ", worklist[, 2]) # prefix the second column with the fourth (list element name, i.e. the level)
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
374 }
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
375
8
e0dad46148bf "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 75fd87e806f9bee2f6ff7fcd3834e55eb21d8710"
artbio
parents: 7
diff changeset
376 colnames(worklist) <- c("signature", "sample", "value", "level")
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
377 worklist <- as.data.frame(worklist %>% group_by(sample) %>% mutate(value = value / sum(value) * 100))
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
# Pie charts of the most contributing signatures, one facet per sample.
# `pos` is the midpoint of each row's slice on the running total of `value`
# over all rows of worklist; the plot layers below do not reference it.
worklist[["pos"]] <- cumsum(worklist[["value"]]) - worklist[["value"]] / 2
# `label` is the text printed on each slice. `signature` is turned into a
# factor so that its levels can be used to index `signature_colors`.
worklist[["label"]] <- factor(worklist[["signature"]])
worklist[["signature"]] <- factor(worklist[["signature"]])
p7 <- ggplot(
  data = worklist,
  mapping = aes(x = "", y = value, group = signature, fill = signature)
) +
  geom_bar(stat = "identity", width = 1) +
  geom_text(
    mapping = aes(label = label),
    position = position_stack(vjust = 0.5),
    color = "black",
    size = 3
  ) +
  # the polar transform of the stacked bar turns each facet into a pie
  coord_polar(theta = "y", start = 0) +
  facet_wrap(. ~ sample) +
  labs(x = "", y = "Samples", fill = tag) +
  scale_fill_manual(
    name = paste0(opt$signum, " most contributing\nsignatures\n(in each label/tissue)"),
    values = signature_colors[levels(worklist[["signature"]])],
    labels = names(signature_colors[levels(worklist[["signature"]])])
  ) +
  # a pie needs no axis text, ticks or grid
  theme(
    axis.text = element_blank(),
    axis.ticks = element_blank(),
    panel.grid = element_blank()
  )
grid.arrange(p7)
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
393
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
# Heatmap of the contribution of the cancer signatures in each sample, with
# the samples clustered (method = "complete"). It is only drawn when
# vcf_paths holds more than one element.
if (length(vcf_paths) > 1) {
  p8 <- plot_contribution_heatmap(
    fit_res$contribution,
    cluster_samples = TRUE,
    method = "complete"
  )
  grid.arrange(p8)
}
14
56c8869a231e "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 518fb067e8206ecafbf673a5e4cf375ccead11e3"
artbio
parents: 13
diff changeset
399
11
7995a949189f "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 94919d0f442fe7059afa2e07898c149b126a5460"
artbio
parents: 10
diff changeset
# Export the relative contribution matrix as a tab-separated file: samples in
# rows, signatures in columns, each row scaled to sum to 1.
# The guard also accepts an unset (NULL) option; is.na() alone would hand `if`
# a zero-length condition in that case.
if (!is.null(opt$sig_contrib_matrix) && !is.na(opt$sig_contrib_matrix)) {
  output_table <- t(fit_res$contribution) / rowSums(t(fit_res$contribution))
  if (nlevels(factor(levels_table$level)) > 1) {
    # Several levels: prefix every sample name with its level.
    # match() returns, for each sample, the row of metadata_table that carries
    # its identifier, whatever the row order or row count of metadata_table.
    # An element-wise `==` is only right when both vectors are aligned;
    # otherwise rows are dropped and paste0() silently recycles the rest.
    # NOTE(review): column 3 of metadata_table is presumably the level/tissue
    # label - confirm against the code that builds metadata_table.
    output_table <- data.frame(
      sample = paste0(
        metadata_table[
          match(colnames(fit_res$contribution), metadata_table$element_identifier),
          3
        ],
        "-",
        colnames(fit_res$contribution)
      ),
      output_table
    )
  } else {
    # Single level: the sample names alone identify the rows.
    output_table <- data.frame(sample = rownames(output_table), output_table)
  }
  # data.frame() prefixes syntactically invalid column names (e.g. "1") with
  # "X". Only that leading "X" is replaced, so an "X" elsewhere in a signature
  # name is left alone.
  colnames(output_table) <- sub("^X", "SBS", colnames(output_table))
  write.table(
    output_table,
    file = opt$sig_contrib_matrix,
    sep = "\t",
    quote = FALSE,
    row.names = FALSE
  )
}
7995a949189f "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 94919d0f442fe7059afa2e07898c149b126a5460"
artbio
parents: 10
diff changeset
414
2
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
# calculate all pairwise cosine similarities between the original profiles
# (pseudo_mut_mat) and the reconstructed ones
cos_sim_ori_rec <- cos_sim_matrix(pseudo_mut_mat, fit_res$reconstructed)
# extract cosine similarities per sample between original and reconstructed:
# the diagonal pairs each sample with its own reconstruction
cos_sim_ori_rec <- as.data.frame(diag(cos_sim_ori_rec))

# We can use ggplot to make a barplot of the cosine similarities between the
# original and reconstructed mutational profile of each sample. This clearly
# shows how well each mutational profile can be reconstructed with the COSMIC
# mutational signatures. Two identical profiles have a cosine similarity of 1.
# The lower the cosine similarity between original and reconstructed, the less
# well the original mutational profile can be reconstructed with the COSMIC
# signatures. You could use, for example, cosine similarity of 0.95 as a cutoff.

# Adjust data frame for plotting with ggplot: one `cos_sim` column plus a
# `sample` column copied from the row names
colnames(cos_sim_ori_rec) <- "cos_sim"
cos_sim_ori_rec$sample <- row.names(cos_sim_ori_rec)
# Make barplot
p9 <- ggplot(cos_sim_ori_rec, aes(y = cos_sim, x = sample)) +
  geom_bar(stat = "identity", fill = "skyblue4") +
  # zoom the y axis on the 0.8-1 range
  coord_cartesian(ylim = c(0.8, 1)) +
  # coord_flip(ylim=c(0.8,1)) +
  ylab("Cosine similarity\n original VS reconstructed") +
  xlab("") +
  # Reverse order of the samples such that first is up
  # xlim(rev(levels(factor(cos_sim_ori_rec$sample)))) +
  theme_bw() +
  theme(
    panel.grid.minor.y = element_blank(),
    panel.grid.major.y = element_blank()
  ) +
  # Add cut-off line. The constant is passed as an argument, not through
  # aes(), so a single line is drawn instead of one per data row.
  geom_hline(yintercept = 0.95)
grid.arrange(
  p9,
  top = textGrob(
    "Similarity between true profiles and profiles reconstructed with elementary signatures",
    gp = gpar(fontsize = 12, font = 3)
  )
)
# close the current graphics device (presumably opened earlier in the script)
dev.off()
aea952be68cb "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit cd8f633245d53cf47eaf860a4e0ae8d806c34419"
artbio
parents: 0
diff changeset
446 }
3
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
447
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
448
e332cf9dfa06 "planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/mutational_patterns commit 0f7593f703ba0dfd12aea1c0460e371f08b57d2f"
artbio
parents: 2
diff changeset
# Output RData file: when opt$rdata is set, dump the whole workspace
# (save.image) to that path
if (!is.null(opt$rdata)) {
  save.image(file = opt$rdata)
}