# HG changeset patch # User ecology # Date 1729024428 0 # Node ID cfe884e5360030f42c0173a204ad24846eb73eee planemo upload for repository https://github.com/galaxyecology/tools-ecology/tree/main/tools-ecology/tools/make_data_paper_sketches commit 34f4e0604adc2a2ba4902ce6b8e6df2460eda292 diff -r 000000000000 -r cfe884e53600 draft_data_paper.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/draft_data_paper.xml Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,71 @@ + + from EML + + r-base + libxslt + pandoc + r-dplyr + r-mapview + r-xslt + r-xml2 + phantomjs + + + + + + + + + + + + + + + + + + + + is made to produce draft of data paper from Ecological Metadata Language (EML) based metadata documents. + +**How to use it?** +-------------------- + +You need to input an EML (Ecological Metadata Language) metadata file (xml format) and run the tool that will produce a draft of data paper in docx format that you can edit. + + + ]]> + + + @misc{githubsurvey2023, + author = {Tanguy Genthon}, + title = {{Metadata Shiny for Retroactive Information Management and Production of data paper Sketches}}, + publisher = {Github}, + url = {https://github.com/TanguyGen/metaCure}, + year = {2023} + } + } + @misc{githubsurvey2023b, + author = {Tanguy Genthon}, + title = {{Produce beautifull website from EML}}, + publisher = {Github}, + url = {https://github.com/TanguyGen/emldown}, + year = {2023} + } + } + + diff -r 000000000000 -r cfe884e53600 emldown_templates/addmap2.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/addmap2.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,14 @@ + + + + + +
+ +
+
+
+
+
+ diff -r 000000000000 -r cfe884e53600 emldown_templates/bootstrap2.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/bootstrap2.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,77 @@ + + + + + + + + + + + + + + + + + + + + + + +
+
+ +
+
+
+ +
+ +
+ +
+ +
+ + +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ +
+ + + + + + + +
+
diff -r 000000000000 -r cfe884e53600 emldown_templates/dataset2.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/dataset2.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,88 @@ + + + + + + +

Publication date

+ +
+
+ + + +

Abstract

+
+
+

+
+
+
+
+ + + +

Metadata Provider

+

+   + +

+
+
+

Author list

+

Creators

+ + + + +

Associated parties

+
    + +
  • +   +   + +
  • +
    +
+
+
+ + +

Keywords

+

+ +

    +
  • +
+ +

+
+
+ + + +

Annotations

+

+ +

    +
  • +  + +
  • +
+ +

+
+
+
+
diff -r 000000000000 -r cfe884e53600 emldown_templates/datatable2.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/datatable2.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,38 @@ + + + + + + +

Data tables

+ +
+

+
+ + Physical:  + +
+ + + + + + + + + + + + + +
attribute namedefinitionformat, unit or codes
 =   
+
+
+
+
+
+
+ + diff -r 000000000000 -r cfe884e53600 emldown_templates/footer.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/footer.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,15 @@ + + + + + + + diff -r 000000000000 -r cfe884e53600 emldown_templates/geographic_coverage.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/geographic_coverage.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,33 @@ + + + + + + +

Geographic coverage

+
+ +
+ +

+ +

+ West:
+ East:
+ North:
+ South: +

+ +
+ +
+ +
+
+
+
+
+ + + diff -r 000000000000 -r cfe884e53600 emldown_templates/head.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/head.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,11 @@ + + + + + + + <xsl:value-of select="//dataset/title" /> + + + diff -r 000000000000 -r cfe884e53600 emldown_templates/method.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/method.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,34 @@ + + + + +

Method

+ +
+ + + +

Method step

+

+
+
+ + + +

Sampling

+

+
+
+ + + +

Quality control

+

+
+
+ +
+
+
+
diff -r 000000000000 -r cfe884e53600 emldown_templates/otherentity.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/otherentity.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,19 @@ + + + + + + +

Other entities

+ +
+ +
+
+
+
+
+
+ + diff -r 000000000000 -r cfe884e53600 emldown_templates/rights.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/rights.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,16 @@ + + + + + + +

Intellectual Rights

+

+ +

+
+
+
+
+ diff -r 000000000000 -r cfe884e53600 emldown_templates/spatraster2.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/spatraster2.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,39 @@ + + + + + + +

Spatial Rasters

+ +
+

+

+
+ + Physical:  + +
+ + + + + + + + + + + + + +
attribute namedefinitionformat, unit or codes
 =   
+
+
+
+
+
+
+ + diff -r 000000000000 -r cfe884e53600 emldown_templates/spatvector2.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/spatvector2.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,38 @@ + + + + + + +

Spatial Vectors

+ +
+

+
+ + Physical:  + +
+ + + + + + + + + + + + + +
attribute namedefinitionformat, unit or codes
 =   
+
+
+
+
+
+
+ + diff -r 000000000000 -r cfe884e53600 emldown_templates/taxonomic_coverage.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/taxonomic_coverage.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,42 @@ + + + + + + +

Taxonomic coverage

+
+ + + + + + + + +
RankValue
+
+
+
+
+ + + + + + + + + + + + + + + +
+ + + + diff -r 000000000000 -r cfe884e53600 emldown_templates/temporal_coverage.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/temporal_coverage.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,43 @@ + + + + + + +

Temporal coverage

+ + + + + + + + + + + + + + +
Start dateEnd date
+
+ + + + + + + + + + + + +
Date
+
+
+
+
+
+ diff -r 000000000000 -r cfe884e53600 emldown_templates/units.xsl --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/emldown_templates/units.xsl Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,30 @@ + + + + + + +

Custom units

+ + + + + + + + + + + + + + + +
unit nameparent SI unitunit typedescription
+
+
+
+
+ + diff -r 000000000000 -r cfe884e53600 map_geographical_coverage.R --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/map_geographical_coverage.R Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,74 @@
+#From https://github.com/TanguyGen/metaCure/blob/main/R/eml_down.R
+#Modified by Seguineau Pauline (2024-10-15)
+library(dplyr)
+library(xslt)
+library(xml2)
+library(mapview)
+library(leaflet)
+
+#The EML file to map is the first command-line argument
+args <- commandArgs(trailingOnly = TRUE)
+if (length(args) == 0) {
+  stop("This tool needs at least one argument")
+}
+data <- args[1]
+
+#' map_geographical_coverage
+#' Draw the bounding coordinates of every geographic coverage of an EML
+#' document on a leaflet map and save the map as "map.png"
+#' @param eml Metadata using EML standard in XML format (read with xml2)
+#'
+#' @return The result of mapview::mapshot(), or NULL (invisibly) when no
+#' coverage has a complete set of bounding coordinates
+#' @export
+
+map_geographical_coverage <- function(eml) {
+  coverages <- xml2::xml_find_all(eml, "//geographicCoverage")
+
+  #Read each value relative to its own coverage node: a missing element
+  #becomes NA instead of shifting the values of the following coverages
+  text_of <- function(path) {
+    xml2::xml_text(xml2::xml_find_first(coverages, path), trim = TRUE)
+  }
+  bound <- function(side) {
+    as.numeric(text_of(paste0("./boundingCoordinates/", side, "BoundingCoordinate")))
+  }
+
+  geo_info <- data.frame(name = text_of("./geographicDescription"),
+                         west = bound("west"), east = bound("east"),
+                         south = bound("south"), north = bound("north"))
+  drawable <- complete.cases(geo_info[, c("west", "east", "south", "north")])
+  geo_info <- geo_info[drawable, ]
+  if (nrow(geo_info) == 0) {
+    print("No bounding coordinates found, skipping geographic coverage step.")
+    return(invisible(NULL))
+  }
+
+  map <- leaflet(geo_info) %>%
+    addProviderTiles("CartoDB.Positron")
+
+  #seq_len() rather than 1:nrow() so that an empty table is never iterated
+  for (i in seq_len(nrow(geo_info))) {
+    box <- geo_info[i, ]
+    if (box$west == box$east && box$south == box$north) {
+      #Zero-extent coverage: a single point
+      map <- map %>% addCircles(lng = box$west, lat = box$south, fillColor = "transparent")
+    } else {
+      #Any other extent, including a box collapsed along one axis only
+      map <- map %>% addRectangles(lng1 = box$west, lat1 = box$south,
+                                   lng2 = box$east, lat2 = box$north, fillColor = "transparent")
+    }
+  }
+  map <- map %>% addScaleBar()
+
+  mapview::mapshot(map, file = "map.png", remove_controls = c("zoomControl", "layersControl", "homeButton", "drawToolbar", "easyButton"))
+}
+
+doc <- read_xml(data)
+
+if (length(xml2::xml_find_all(doc, "//geographicCoverage")) == 0) {
+  print("No geographic coverage found, skipping geographic coverage step.")
+} else {
+  map_geographical_coverage(doc)
+}
+
diff -r 000000000000 -r cfe884e53600 test-data/EML.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/EML.xml Tue Oct 15 20:33:48 2024 +0000 @@ -0,0 +1,609 @@ + + + + + Dumont D Urville sea abiotic and physical parameters and Jupyter notebook + + + Marc + Eléaume + + Muséum National d'Histoire Naturelle + marc.eleaume@mnhn.fr + https://orcid.org/0000-0003-1999-1177 + + + + Lenaïg + G. + Hemery + + Pacific Northwest National Laboratory Marine Sciences Laboratory + lenaighemery@gmail.com,lenaig.hemery@pnnl.gov + https://orcid.org/0000-0001-5337-4514 + + + + Pauline + Seguineau + + Muséum National d'Histoire Naturelle + pauline.seguineau@mnhn.fr + https://orcid.org/0009-0009-5969-8478 + + + + Yvan + Le Bras + + Muséum National d'Histoire Naturelle + yvan.le-bras@mnhn.fr + https://orcid.org/0000-0002-8504-068X + + 2024-05-28 + + Antarctica and the Southern Ocean play a central role in regulating the Earth climate and its singularity dating back 25 Mya also includes ecological processes that need to be better understood. The Dumont D’Urville sea located off George V and Adélie Land, is one of the better known East-Antarctic marine area displaying a diversity of abiotic and physical parameters that have been shown to drive the distribution of marine organisms. The dataset presented here contribute to our understanding of these interactions, providing essential information for ongoing research and conservation efforts in this Antarctic ecosystem. 
This dataset presents a table containing abiotic and physical parameters specific to the Dumont D’Urville Sea and a Jupyter notebook to execute a R script in the ecoregionalization Galaxy workflow. The abiotic and physical parameters were first presented in the research article 'Predicting habitat preferences for Anthometrina adriani (Echinodermata) on the East Antarctic continental shelf' by Hemery et al. (2011). The jupyter notebook is dedicated to the pivot_wider function from the tidyr R package. This notebook is the final part of the data preparation for the ecoregionalization Galaxy workflow. + + + + Antarctica + Ocean circulation model + Southern Ocean + Dumont D'Urville sea + CEAMARC + Abiotic and physical parameters + Ecoregionalization + Tidyr + R package + Jupyter notebook + Pivot wider function + + + + + + + This information is released under the Creative Commons license - Attribution - CC BY (https://creativecommons.org/licenses/by/4.0/). The consumer of these data ("Data User" herein) is required to cite it appropriately in any publication that results from its use. The Data User should realize that these data may be actively used by others for ongoing research and that coordination may be necessary to prevent duplicate publication. The Data User is urged to contact the authors of these data if any questions about methodology or results occur. Where appropriate, the Data User is encouraged to consider collaboration or co-authorship with the authors. The Data User should realize that misinterpretation of data may occur if used out of context of the original study. While substantial efforts are made to ensure the accuracy of data and associated documentation, complete accuracy of data sets cannot be guaranteed. All data are made available "as is." The Data User should be aware, however, that data are updated periodically and it is the responsibility of the Data User to check for new versions of the data. 
The data authors and the repository where these data were obtained shall not be liable for damages resulting from any use or misinterpretation of the data. Thank you. + + + + + Dumont D'Urville sampling border + + 139.22 + 145.53 + -65.57 + -67.01 + + + + + + 2007-12-01 + + + 2008-01-31 + + + + + + http://purl.obolibrary.org/obo/IAO_0000136 + http://ncicb.nci.nih.gov/xml/owl/EVS/Thesaurus.owl#C18007 + + + + Marc + Eléaume + + Muséum National d'Histoire Naturelle + marc.eleaume@mnhn.fr + https://orcid.org/0000-0003-1999-1177 + + + + + Abiotic and physical parameters in this dataset were taken from oceanographic model and in situ measurements (Hemery et al., 2011). Here we quote the relevant section of the “Materials and methods” part from the study: “Abiotic or physical parameters. Two different categories of abiotic parameters were used (Fig. 2): parameters likely to be subject to daily or seasonal variability (temperature, salinity, current magnitude, general current direction and sea-ice concentration) and parameters with long-term stability (bathymetry, slope, rugosity and seabed sediments). Parameters with short-term variability are taken from an oceanographic model, whereas parameters with long-term stability are derived from in situ measurements. Physical oceanography. Physical oceanographic parameters near the seabed (temperature, salinity, mean current magnitude, standard deviations of these 3 parameters, maximum current magnitude and general current direction) are taken from a climatologically forced ocean circulation model. The model was run for a total of 23 yr. A spinup phase of 20 yr was required for the model to reach quasi-equilibrium. The mean and SD were calculated by using 6-hourly model data for the last 3 yr. Sea ice growth rate was calculated directly from special sensor microwave imager (SSM/I) observations (Tamura et al. 2008). 
The model is based on the Rutgers/University of California Los Angeles Regional Ocean Model System (ROMS; Shchepetkin & McWilliams 2005) and is identical to the one described by B. K. Galton-Fenzi et al. (unpubl.). The model used here, initially developed for regional modelling studies of the Amery Ice Shelf/Ocean system and has been used in circum-Antarctic modelling studies, is able to simulate ice/ocean interactions at a high level of realism (Galton-Fenzi 2009, 2010). For the region of this study, the model is able to reproduce the circulation patterns and water mass properties when compared with oceanographic measurements taken in the vicinity of the George V and Adélie basins (A. Meijers pers. comm.). The model domain extends from 135.77° E to 158.08° E and from 69.417° S to 62.724° S. The southern boundary of the model is a closed, solid, free slip wall and the eastern and western boundaries are partially open. The horizontal grid resolution is between 2.16 km near the southern boundary to 2.88 km near the northern boundary. There are 31 vertical levels that are concentrated towards the top and bottom of the model domain. The parameters used here were taken from the lowest vertical level in the model that lies immediately adjacent to the seabed. The choice of mixing and advection schemes follows the choices that were successfully used by Dinniman et al. (2003, 2007) for studies of the shelf seas near the Ross Ice Shelf. The melting and freezing formulation uses the full 3-equation formulation and dynamics frazil ice model used in the studies of Galton-Fenzi (2009, 2010). Lateral boundary fields (potential temperature, salinity and currents) on the open boundaries are relaxed to monthly climatologies from ECCO2 (Menemenlis et al. 2008, Wunsch et al. 2009). Ten primary tidal constituents were added as a free-surface forcing. 
The tidal amplitudes and phase are calculated with a nonstandard ROMS subroutine, based on tidal information from the Proudman Oceanographic Laboratory (Murray 1964) and modified to be included within ROMS, yielding a standard tidal prediction. The bathymetry and the ice-draft information come from a version of R-TOPO (Timmermann et al. 2010) that was modified to include the high-resolution bathymetric data (outlined below, Beaman et al. 2011) and knowledge of the glacial ice drafts in the region (B. Legresy pers.comm.). The open ocean surface fluxes are modified by an imposed climatological sea-ice cover that includes polynyas, derived from SSM/I observations (Tamura et al. 2008). During summer, the Tamura et al. (2008) data are supplemented with open-water heat and salt fluxes by using the monthly climatologies from the NCEP-2 (Kanamitsu et al. 2002). Bathymetry and seabed sediments. A bathymetry model based on multibeam swath sonar and single beam bathymetry data was produced at about 250 m resolution for the study area (Beaman et al. 2011). A raster map of the slope gradient was generated from this bathymetry model by using ESRI ArcGIS 9.2 Spatial Analysis Tools and a raster map of the rugosity was generated by using Benthic Terrain Modeler tools. Sediment grabs provided substratum composition data, such as the percentage of gravel, mud, sand, biogenic carbonate and biogenic silica at sample sites (Beaman & O’Brien 2009). These data are used as a broad-scale representation of the seafloor substratum.” (Hemery et al., 2011) + + + + + + ceamarc_env + A table containing abiotic and physical parameters specific to the Dumont D'Urville Sea that were first presented in the research article "Predicting habitat preferences for Anthometrina adriani (Echinodermata) on the East Antarctic continental shelf" by Hemery et al. (2011). 
+ + ceamarc_env.tsv + 15573372 + 7e21041af224ad58f685f37f68a49c5b + + + 1 + \n + column + + \t + + + + + + + long + Longitude is a geographic coordinate that specifies the east–west position of a point + float + + + + degree + + + real + + 139.22 + 145.53 + + + + + + -9999 + no data available + + + + lat + Latitude is a geographic coordinate that specifies the north–south position of a point. + float + + + + degree + + + real + + -67.01 + -65.57 + + + + + + -9999 + no data available + + + + Carbo + Percentage of biogenic carbonate + float + + + + percent + + + real + + 0.78 + 5.62 + + + + + + -9999 + no data available + + + + Grav + Percentage of gravel in the seabed + float + + + + percent + + + real + + -0.01 + 29.55 + + + + + + -9999 + no data available + + + + Maxbearing + Maximum current bearing + float + + + + radian + + + real + + 0.000201518007088453 + 6.28 + + + + + + -9999 + no data available + + + + Maxmagnit + Maximum current magnitude + float + + + + meterPerSecond + + + real + + 0.000266201008344069 + 0.49 + + + + + + -9999 + no data available + + + + Meancurmag + Mean current magnitude + float + + + + meterPerSecond + + + real + + 0.01 + 0.26 + + + + + + -9999 + no data available + + + + Meansal + Mean salinity of the sea + float + + + + PSU + + + real + + 34.52 + 34.77 + + + + + + -9999 + no data available + + + + Meantheta + Mean temperature of the sea + float + + + + degreeCelsius + + + real + + -1.86 + -0.09 + + + + + + -9999 + no data available + + + + Mud + Percentage of mud in the seabed + float + + + + percent + + + real + + -2.04 + 85.6 + + + + + + -9999 + no data available + + + + Prof + Depth of the sea + float + + + + meter + + + integer + + -1200 + -130 + + + + + + -9999 + no data available + + + + Rugosity + Rugosity of the seabed + float + + + + dimensionless + + + real + + 1 + 1.01 + + + + + + -9999 + no data available + + + + Sand + Percentage of sand in the seabed + float + + + + percent + + + real + + 34.29 + 73.92 + + + + + + 
-9999 + no data available + + + + Seaice_prod + Seaice production in meter per year + float + + + + meterPerYear + + + real + + -2.21 + 13.31 + + + + + + -9999 + no data available + + + + Sili + Percentage of biogenic silica in the seabed + float + + + + percent + + + real + + 0.69 + 17.1 + + + + + + -9999 + no data available + + + + Slope + Slope of the seabed + float + + + + degree + + + real + + -0.29 + 13.18 + + + + + + -9999 + no data available + + + + Standcurmag + Current magnitude standard deviation + float + + + + meterPerSecond + + + real + + 0.01 + 0.08 + + + + + + -9999 + no data available + + + + Standsal + Salinity standard deviation + float + + + + PSU + + + real + + 0.00584563100710511 + 0.26 + + + + + + -9999 + no data available + + + + Standtheta + Temperature standard deviation + float + + + + degreeCelsius + + + real + + 0.03 + 0.52 + + + + + + -9999 + no data available + + + + 155823 + + + pivot_wider_jupytool_notebook + This jupyter notebook is dedicated to the pivot_wider function from the tidyr R package. It is the final part of the data preparation for the ecoregionalization Galaxy workflow. + + pivot_wider_jupytool_notebook.ipynb + 2794 + 2065faa032869e3da5f20b56c7904290 + + + Unknown + + + + executable + + + + + + + 1 PSU = 1g/kg + + + 0 °C + 273,15 = 273,15 Kelvin + + + meter per year + + + + + + + + EMLassemblyline + 3.5.5 + + + +