Mercurial > repos > prog > lcmsmatching
comparison ChemspiderConn.R @ 2:20d69a062da3 draft
planemo upload for repository https://github.com/workflow4metabolomics/lcmsmatching.git commit d4048accde6bdfd5b3e14f5394902d38991854f8
author | prog |
---|---|
date | Thu, 02 Mar 2017 08:55:00 -0500 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
1:253d531a0193 | 2:20d69a062da3 |
---|---|
1 ##################### | |
2 # CLASS DECLARATION # | |
3 ##################### | |
4 | |
5 ChemspiderConn <- methods::setRefClass("ChemspiderConn", contains = "RemotedbConn") | |
6 | |
7 ########################## | |
8 # GET ENTRY CONTENT TYPE # | |
9 ########################## | |
10 | |
11 ChemspiderConn$methods( getEntryContentType = function() { | |
12 return(BIODB.XML) | |
13 }) | |
14 | |
15 ##################### | |
16 # GET ENTRY CONTENT # | |
17 ##################### | |
18 | |
19 ChemspiderConn$methods( getEntryContent = function(ids) { | |
20 | |
21 # Debug | |
22 .self$.print.debug.msg(paste0("Get entry content(s) for ", length(ids)," id(s)...")) | |
23 | |
24 URL.MAX.LENGTH <- 2083 | |
25 | |
26 # Initialize return values | |
27 content <- rep(NA_character_, length(ids)) | |
28 | |
29 # Loop on all | |
30 n <- 0 | |
31 inc <- NA_integer_ | |
32 while (n < length(ids)) { | |
33 | |
34 # Get list of accession ids to retrieve | |
35 accessions <- ids[(n + 1):(if (is.na(inc)) length(ids) else (min(n + inc, length(ids))))] | |
36 | |
37 # Create URL request | |
38 x <- get.entry.url(class = BIODB.CHEMSPIDER, accession = accessions, content.type = BIODB.XML, max.length = URL.MAX.LENGTH, base.url = .self$.url, token = .self$.token) | |
39 | |
40 # Debug | |
41 .self$.print.debug.msg(paste0("Send URL request for ", x$n," id(s)...")) | |
42 | |
43 # Send request | |
44 xmlstr <- .self$.get.url(x$url) | |
45 | |
46 # Error : "Cannot convert WRONG to System.Int32.\r\nParameter name: type ---> Input string was not in a correct format.\r\n" | |
47 if (grepl('^Cannot convert .* to System\\.Int32\\.', xmlstr)) { | |
48 # One of the ids is incorrect | |
49 if (is.na(inc)) { | |
50 inc <- 1 | |
51 next | |
52 } | |
53 else | |
54 xmlstr <- NA_character_ | |
55 } | |
56 | |
57 # Increase number of entries retrieved | |
58 n <- n + x$n | |
59 | |
60 # Parse XML and get included XML | |
61 if ( ! is.na(xmlstr)) { | |
62 xml <- xmlInternalTreeParse(xmlstr, asText = TRUE) | |
63 ns <- c(csns = "http://www.chemspider.com/") | |
64 returned.ids <- xpathSApply(xml, "//csns:ExtendedCompoundInfo/csns:CSID", xmlValue, namespaces = ns) | |
65 content[match(returned.ids, ids)] <- vapply(getNodeSet(xml, "//csns:ExtendedCompoundInfo", namespaces = ns), saveXML, FUN.VALUE = '') | |
66 } | |
67 | |
68 # Debug | |
69 .self$.print.debug.msg(paste0("Now ", length(ids) - n," id(s) left to be retrieved...")) | |
70 } | |
71 | |
72 return(content) | |
73 }) | |
74 | |
75 ################ | |
76 # CREATE ENTRY # | |
77 ################ | |
78 | |
79 ChemspiderConn$methods( createEntry = function(content, drop = TRUE) { | |
80 return(createChemspiderEntryFromXml(content, drop = drop)) | |
81 }) | |
82 | |
83 ############################ | |
84 # GET CHEMSPIDER IMAGE URL # | |
85 ############################ | |
86 | |
87 get.chemspider.image.url <- function(id) { | |
88 | |
89 url <- paste0('http://www.chemspider.com/ImagesHandler.ashx?w=300&h=300&id=', id) | |
90 | |
91 return(url) | |
92 } |