larch_artemis: larch_artemis.py comparison

comparison larch_artemis.py @ 5:7acb53ffb96f draft

planemo upload for repository https://github.com/MaterialsGalaxy/larch-tools/tree/main/larch_artemis commit 4814f53888643f1d3667789050914675fffb7d59

author	muon-spectroscopy-computational-project
date	Fri, 23 Aug 2024 13:46:13 +0000
parents	39ab361e6d59
children

comparison

equal deleted inserted replaced

-:39ab361e6d59
+:7acb53ffb96f
 gds_val = 0.0
 gds_expr = ""
 try:
 gds_val = float(data_dict[par_idx]["value"])
 except ValueError:
-gds_val = 0.00
+continue
 gds_expr = data_dict[par_idx]["expr"]
 gds_vary = (
 True
 if str(data_dict[par_idx]["vary"]).strip().capitalize() == "True"
 else False
 if one_par is not None:
 dgs_group.__setattr__(gds_name, one_par)
 return dgs_group
-def plot_rmr(path: str, data_set, rmin, rmax):
+def plot_rmr(path: str, datasets: list, rmin, rmax):
 plt.figure()
-plt.plot(data_set.data.r, data_set.data.chir_mag, color="b")
+for i, dataset in enumerate(datasets):
-plt.plot(data_set.data.r, data_set.data.chir_re, color="b", label="expt.")
+plt.subplot(len(datasets), 1, i + 1)
-plt.plot(data_set.model.r, data_set.model.chir_mag, color="r")
+data = dataset.data
-plt.plot(data_set.model.r, data_set.model.chir_re, color="r", label="fit")
+model = dataset.model
-plt.ylabel(
+plt.plot(data.r, data.chir_mag, color="b")
-"Magnitude of Fourier Transform of "
+plt.plot(data.r, data.chir_re, color="b", label="expt.")
-r"$k^2 \cdot \chi$/$\mathrm{\AA}^{-3}$"
+plt.plot(model.r, model.chir_mag, color="r")
-)
+plt.plot(model.r, model.chir_re, color="r", label="fit")
-plt.xlabel(r"Radial distance/$\mathrm{\AA}$")
+plt.ylabel(
-plt.xlim(0, 5)
+"Magnitude of Fourier Transform of "
+r"$k^2 \cdot \chi$/$\mathrm{\AA}^{-3}$"
-plt.fill(
+)
-[rmin, rmin, rmax, rmax],
+plt.xlabel(r"Radial distance/$\mathrm{\AA}$")
-[-rmax, rmax, rmax, -rmax],
+plt.axvspan(xmin=rmin, xmax=rmax, color="g", alpha=0.1)
-color="g",
+plt.legend()
-alpha=0.1,
-)
-plt.text(rmax - 0.65, -rmax + 0.5, "fit range")
-plt.legend()
 plt.savefig(path, format="png")
 plt.close("all")
-def plot_chikr(path: str, data_set, rmin, rmax, kmin, kmax):
+def plot_chikr(path: str, datasets, rmin, rmax, kmin, kmax):
 fig = plt.figure(figsize=(16, 4))
-ax1 = fig.add_subplot(121)
+for i, dataset in enumerate(datasets):
-ax2 = fig.add_subplot(122)
+data = dataset.data
-ax1.plot(
+model = dataset.model
-data_set.data.k,
+ax1 = fig.add_subplot(len(datasets), 2, 2*i + 1)
-data_set.data.chi * data_set.data.k**2,
+ax2 = fig.add_subplot(len(datasets), 2, 2*i + 2)
-color="b",
+ax1.plot(data.k, data.chi * data.k**2, color="b", label="expt.")
-label="expt.",
+ax1.plot(model.k, model.chi * data.k**2, color="r", label="fit")
-)
+ax1.set_xlabel(r"$k (\mathrm{\AA})^{-1}$")
-ax1.plot(
+ax1.set_ylabel(r"$k^2$ $\chi (k)(\mathrm{\AA})^{-2}$")
-data_set.model.k,
+ax1.axvspan(xmin=kmin, xmax=kmax, color="g", alpha=0.1)
-data_set.model.chi * data_set.data.k**2,
+ax1.legend()
-color="r",
-label="fit",
+ax2.plot(data.r, data.chir_mag, color="b", label="expt.")
-)
+ax2.plot(model.r, model.chir_mag, color="r", label="fit")
-ax1.set_xlim(0, 15)
+ax2.set_xlim(0, 5)
-ax1.set_xlabel(r"$k (\mathrm{\AA})^{-1}$")
+ax2.set_xlabel(r"$R(\mathrm{\AA})$")
-ax1.set_ylabel(r"$k^2$ $\chi (k)(\mathrm{\AA})^{-2}$")
+ax2.set_ylabel(r"$|\chi(R)|(\mathrm{\AA}^{-3})$")
+ax2.legend(loc="upper right")
-ax1.fill(
+ax2.axvspan(xmin=rmin, xmax=rmax, color="g", alpha=0.1)
-[kmin, kmin, kmax, kmax],
-[-rmax, rmax, rmax, -rmax],
-color="g",
-alpha=0.1,
-)
-ax1.text(kmax - 1.65, -rmax + 0.5, "fit range")
-ax1.legend()
-ax2.plot(data_set.data.r, data_set.data.chir_mag, color="b", label="expt.")
-ax2.plot(data_set.model.r, data_set.model.chir_mag, color="r", label="fit")
-ax2.set_xlim(0, 5)
-ax2.set_xlabel(r"$R(\mathrm{\AA})$")
-ax2.set_ylabel(r"$|\chi(R)|(\mathrm{\AA}^{-3})$")
-ax2.legend(loc="upper right")
-ax2.fill(
-[rmin, rmin, rmax, rmax],
-[-rmax, rmax, rmax, -rmax],
-color="g",
-alpha=0.1,
-)
-ax2.text(rmax - 0.65, -rmax + 0.5, "fit range")
 fig.savefig(path, format="png")
 plt.close("all")
 def read_gds(gds_file):
 def read_selected_paths_list(file_name):
 sp_dict = read_csv_data(file_name)
 sp_list = []
-for path_id in sp_dict:
+for path_dict in sp_dict.values():
-filename = sp_dict[path_id]["filename"]
+filename = path_dict["filename"]
+if not os.path.isfile(filename):
+raise FileNotFoundError(
+f"{filename} not found, check paths in the Selected Paths "
+"table match those in the zipped directory structure."
+)
 print(f"Reading selected path for file {filename}")
 new_path = FeffPathGroup(
 filename=filename,
-label=sp_dict[path_id]["label"],
+label=path_dict["label"],
-s02=sp_dict[path_id]["s02"],
+degen=path_dict["degen"] if path_dict["degen"] != "" else None,
-e0=sp_dict[path_id]["e0"],
+s02=path_dict["s02"],
-sigma2=sp_dict[path_id]["sigma2"],
+e0=path_dict["e0"],
-deltar=sp_dict[path_id]["deltar"],
+sigma2=path_dict["sigma2"],
+deltar=path_dict["deltar"],
 )
 sp_list.append(new_path)
 return sp_list
-def run_fit(data_group, gds, selected_paths, fv):
+def run_fit(
+data_groups: list, gds, pathlist, fv, selected_path_ids: list = None
+):
 # create the transform group (prepare the fit space).
 trans = TransformGroup(
 fitspace=fv["fitspace"],
 kmin=fv["kmin"],
 kmax=fv["kmax"],
 window=fv["window"],
 rmin=fv["rmin"],
 rmax=fv["rmax"],
 )
-dset = FeffitDataSet(
+datasets = []
-data=data_group, pathlist=selected_paths, transform=trans
+for i, data_group in enumerate(data_groups):
-)
+if selected_path_ids:
+selected_paths = []
-out = feffit(gds, dset)
+for path_id in selected_path_ids[i]:
-return dset, out
+selected_paths.append(pathlist[path_id - 1])
+dataset = FeffitDataSet(
+data=data_group, pathlist=selected_paths, transform=trans
+)
+else:
+dataset = FeffitDataSet(
+data=data_group, pathlist=pathlist, transform=trans
+)
+datasets.append(dataset)
+out = feffit(gds, datasets)
+return datasets, out
 def main(
-prj_file: str,
+prj_file: list,
 gds_file: str,
 sp_file: str,
 fit_vars: dict,
 plot_graph: bool,
 series_id: str = "",
 ) -> Group:
 report_path = f"report/fit_report{series_id}.txt"
 rmr_path = f"rmr/rmr{series_id}.png"
 chikr_path = f"chikr/chikr{series_id}.png"
+gds = read_gds(gds_file)
+pathlist = read_selected_paths_list(sp_file)
 # calc_with_defaults will hang indefinitely (>6 hours recorded) if the
 # data contains any NaNs - consider adding an early error here if this is
 # not fixed in Larch?
-data_group = read_group(prj_file)
+selected_path_ids = []
+if isinstance(prj_file[0], dict):
-print(f"Fitting project from file {data_group.filename}")
+data_groups = []
+for dataset in prj_file:
-gds = read_gds(gds_file)
+data_groups.append(read_group(dataset["prj_file"]))
-selected_paths = read_selected_paths_list(sp_file)
+selected_path_ids.append([p["path_id"] for p in dataset["paths"]])
-dset, out = run_fit(data_group, gds, selected_paths, fit_vars)
+else:
+data_groups = [read_group(p) for p in prj_file]
+print(f"Fitting project from file {[d.filename for d in data_groups]}")
+datasets, out = run_fit(
+data_groups,
+gds,
+pathlist,
+fit_vars,
+selected_path_ids=selected_path_ids,
+)
 fit_report = feffit_report(out)
 with open(report_path, "w") as fit_report_file:
 fit_report_file.write(fit_report)
 if plot_graph:
-plot_rmr(rmr_path, dset, fit_vars["rmin"], fit_vars["rmax"])
+plot_rmr(rmr_path, datasets, fit_vars["rmin"], fit_vars["rmax"])
 plot_chikr(
 chikr_path,
-dset,
+datasets,
 fit_vars["rmin"],
 fit_vars["rmax"],
 fit_vars["kmin"],
 fit_vars["kmax"],
 )
 rows = [[f"{c['variable']:>12s}" for c in report_criteria]]
 for series_index, series_file in enumerate(filepaths):
 series_id = str(series_index).zfill(id_length)
 try:
 out = main(
-series_file,
+[series_file],
 gds_file,
 sp_file,
 fit_vars,
 plot_graph,
 f"_{series_id}",
 input_values = json.load(open(sys.argv[4], "r", encoding="utf-8"))
 fit_vars = input_values["fit_vars"]
 plot_graph = input_values["plot_graph"]
 if input_values["execution"]["execution"] == "parallel":
-main(prj_file, gds_file, sp_file, fit_vars, plot_graph)
+main([prj_file], gds_file, sp_file, fit_vars, plot_graph)
+elif input_values["execution"]["execution"] == "simultaneous":
+dataset_dicts = input_values["execution"]["simultaneous"]
+main(dataset_dicts, gds_file, sp_file, fit_vars, plot_graph)
 else:
 if os.path.isdir(prj_file):
 # Sort the unzipped directory, all filenames should be zero-padded
 filepaths = [
 os.path.join(prj_file, p) for p in os.listdir(prj_file)

Mercurial > repos > muon-spectroscopy-computational-project > larch_artemis

comparison larch_artemis.py @ 5:7acb53ffb96f draft