Cleanup

2021-03-03 14:56:38 +01:00 · 2021-03-03 14:56:38 +01:00 · 426bb16792
commit 426bb16792
parent 554716fc9a
3 changed files with 1 additions and 400 deletions
--- a/pyzebra/init.py
+++ b/pyzebra/init.py
@ -1,6 +1,5 @@
 from pyzebra.anatric import *
-from pyzebra.ccl_io import export_1D, load_1D, parse_1D
-from pyzebra.fit2 import fitccl
+from pyzebra.ccl_io import *
 from pyzebra.h5 import *
 from pyzebra.xtal import *
 from pyzebra.ccl_process import *
--- a/pyzebra/fit2.py
+++ b/pyzebra/fit2.py
@ -1,231 +0,0 @@
-import numpy as np
-import uncertainties as u
-from lmfit import Model, Parameters
-from scipy.integrate import simps
-
-
-def bin_data(array, binsize):
-    if isinstance(binsize, int) and 0 < binsize < len(array):
-        return [
-            np.mean(array[binsize * i : binsize * i + binsize])
-            for i in range(int(np.ceil(len(array) / binsize)))
-        ]
-    else:
-        print("Binsize need to be positive integer smaller than lenght of array")
-        return array
-
-
-def find_nearest(array, value):
-    # find nearest value and return index
-    array = np.asarray(array)
-    idx = (np.abs(array - value)).argmin()
-    return idx
-
-
-def create_uncertanities(y, y_err):
-    # create array with uncertanities for error propagation
-    combined = np.array([])
-    for i in range(len(y)):
-        part = u.ufloat(y[i], y_err[i])
-        combined = np.append(combined, part)
-    return combined
-
-
-def fitccl(
-    scan,
-    value,
-    vary,
-    constraints_min,
-    constraints_max,
-    numfit_min=None,
-    numfit_max=None,
-    binning=None,
-):
-    """Made for fitting of ccl date where 1 peak is expected. Allows for combination of gaussian and linear model combination
-    :param scan: scan in the data dict (i.e. M123)
-    :param guess: initial guess for the fitting, if none, some values are added automatically in order (see below)
-    :param vary: True if parameter can vary during fitting, False if it to be fixed
-    :param numfit_min: minimal value on x axis for numerical integration - if none is centre of gaussian minus 3 sigma
-    :param numfit_max: maximal value on x axis for numerical integration - if none is centre of gaussian plus 3 sigma
-    :param constraints_min: min constranits value for fit
-    :param constraints_max: max constranits value for fit
-    :param binning : binning of the data
-    :return data dict with additional values
-    order for guess, vary, constraints_min, constraints_max:
-    [Gaussian centre, Gaussian sigma, Gaussian amplitude, background slope, background intercept]
-    examples:
-    guess = [None, None, 100,  0, None]
-    vary = [True, True, True, True,  True]
-    constraints_min = [23, None, 50, 0, 0]
-    constraints_min = [80, None, 1000, 0, 100]
-    """
-    if "peak_indexes" not in scan:
-        scan["peak_indexes"] = []
-
-    if len(scan["peak_indexes"]) > 1:
-        # return in case of more than 1 peaks
-        return
-
-    if binning is None or binning == 0 or binning == 1:
-        x = list(scan["omega"])
-        y = list(scan["Counts"])
-        y_err = list(np.sqrt(y)) if scan.get("sigma", None) is None else list(scan["sigma"])
-        if not scan["peak_indexes"]:
-            centre = np.mean(x)
-        else:
-            centre = x[int(scan["peak_indexes"])]
-    else:
-        x = list(scan["omega"])
-        if not scan["peak_indexes"]:
-            centre = np.mean(x)
-        else:
-            centre = x[int(scan["peak_indexes"])]
-        x = bin_data(x, binning)
-        y = list(scan["Counts"])
-        y_err = list(np.sqrt(y)) if scan.get("sigma", None) is None else list(scan["sigma"])
-        combined = bin_data(create_uncertanities(y, y_err), binning)
-        y = [combined[i].n for i in range(len(combined))]
-        y_err = [combined[i].s for i in range(len(combined))]
-
-    if len(scan["peak_indexes"]) == 0:
-        # Case for no peak, gaussian in centre, sigma as 20% of range
-        peak_index = find_nearest(x, np.mean(x))
-        value[0] = centre if value[0] is None else value[0]
-        value[1] = (x[-1] - x[0]) / 5 if value[1] is None else value[1]
-        value[2] = 50 if value[2] is None else value[2]
-        value[3] = 0 if value[3] is None else value[3]
-        value[4] = np.mean(y) if value[4] is None else value[4]
-        constraints_min[2] = 0
-
-    elif len(scan["peak_indexes"]) == 1:
-        # case for one peak, takse into account users guesses
-        peak_height = scan["peak_heights"]
-        value[0] = centre if value[0] is None else value[0]
-        value[1] = 0.1 if value[1] is None else value[1]
-        value[2] = float(peak_height / 10) if value[2] is None else float(value[2])
-        value[3] = 0 if value[3] is None else value[3]
-        value[4] = np.median(x) if value[4] is None else value[4]
-        constraints_min[0] = np.min(x) if constraints_min[0] is None else constraints_min[0]
-        constraints_max[0] = np.max(x) if constraints_max[0] is None else constraints_max[0]
-
-    def gaussian(x, g_cen, g_width, g_amp):
-        """1-d gaussian: gaussian(x, amp, cen, wid)"""
-        return (g_amp / (np.sqrt(2 * np.pi) * g_width)) * np.exp(
-            -((x - g_cen) ** 2) / (2 * g_width ** 2)
-        )
-
-    def background(x, slope, intercept):
-        """background"""
-        return slope * (x - centre) + intercept
-
-    mod = Model(gaussian) + Model(background)
-    params = Parameters()
-    params.add_many(
-        ("g_cen", value[0], bool(vary[0]), np.min(x), np.max(x), None, None),
-        ("g_width", value[1], bool(vary[1]), constraints_min[1], constraints_max[1], None, None),
-        ("g_amp", value[2], bool(vary[2]), constraints_min[2], constraints_max[2], None, None),
-        ("slope", value[3], bool(vary[3]), constraints_min[3], constraints_max[3], None, None),
-        ("intercept", value[4], bool(vary[4]), constraints_min[4], constraints_max[4], None, None),
-    )
-    # the weighted fit
-    weights = [np.abs(1 / val) if val != 0 else 1 for val in y_err]
-    try:
-        result = mod.fit(y, params, weights=weights, x=x, calc_covar=True)
-    except ValueError:
-        print(f"Couldn't fit scan {scan['idx']}")
-        return
-
-    if result.params["g_amp"].stderr is None:
-        result.params["g_amp"].stderr = result.params["g_amp"].value
-    elif result.params["g_amp"].stderr > result.params["g_amp"].value:
-        result.params["g_amp"].stderr = result.params["g_amp"].value
-
-    # u.ufloat to work with uncertanities
-    fit_area = u.ufloat(result.params["g_amp"].value, result.params["g_amp"].stderr)
-    comps = result.eval_components()
-
-    if len(scan["peak_indexes"]) == 0:
-        # for case of no peak, there is no reason to integrate, therefore fit and int are equal
-        int_area = fit_area
-
-    elif len(scan["peak_indexes"]) == 1:
-        gauss_3sigmamin = find_nearest(
-            x, result.params["g_cen"].value - 3 * result.params["g_width"].value
-        )
-        gauss_3sigmamax = find_nearest(
-            x, result.params["g_cen"].value + 3 * result.params["g_width"].value
-        )
-        # numfit_min = gauss_3sigmamin if numfit_min is None else find_nearest(x, numfit_min)
-        # numfit_max = gauss_3sigmamax if numfit_max is None else find_nearest(x, numfit_max)
-        numfit_min = 0 if numfit_min is None else find_nearest(x, numfit_min)
-        numfit_max = len(x)-1 if numfit_max is None else find_nearest(x, numfit_max)
-
-        it = -1
-        while abs(numfit_max - numfit_min) < 3:
-            # in the case the peak is very thin and numerical integration would be on zero omega
-            # difference, finds closes values
-            it = it + 1
-            numfit_min = find_nearest(
-                x,
-                result.params["g_cen"].value - 3 * (1 + it / 10) * result.params["g_width"].value,
-            )
-            numfit_max = find_nearest(
-                x,
-                result.params["g_cen"].value + 3 * (1 + it / 10) * result.params["g_width"].value,
-            )
-
-        if x[numfit_min] < np.min(x):
-            # makes sure that the values supplied by user lay in the omega range
-            # can be ommited for users who know what they're doing
-            numfit_min = gauss_3sigmamin
-            print("Minimal integration value outside of x range")
-        elif x[numfit_min] >= x[numfit_max]:
-            numfit_min = gauss_3sigmamin
-            print("Minimal integration value higher than maximal")
-        else:
-            pass
-        if x[numfit_max] > np.max(x):
-            numfit_max = gauss_3sigmamax
-            print("Maximal integration value outside of x range")
-        elif x[numfit_max] <= x[numfit_min]:
-            numfit_max = gauss_3sigmamax
-            print("Maximal integration value lower than minimal")
-        else:
-            pass
-
-
-        count_errors = create_uncertanities(y, y_err)
-        # create error vector for numerical integration propagation
-        num_int_area = simps(count_errors[numfit_min:numfit_max], x[numfit_min:numfit_max])
-        slope_err = u.ufloat(result.params["slope"].value, result.params["slope"].stderr)
-        # pulls the nominal and error values from fit (slope)
-        intercept_err = u.ufloat(
-            result.params["intercept"].value, result.params["intercept"].stderr
-        )
-        # pulls the nominal and error values from fit (intercept)
-
-        background_errors = np.array([])
-        for j in range(len(x[numfit_min:numfit_max])):
-            # creates nominal and error vector for numerical integration of background
-            bg = slope_err * (x[j] - centre) + intercept_err
-            background_errors = np.append(background_errors, bg)
-
-        num_int_background = simps(background_errors, x[numfit_min:numfit_max])
-        int_area = num_int_area - num_int_background
-
-    d = {}
-    for pars in result.params:
-        d[str(pars)] = (result.params[str(pars)].value, result.params[str(pars)].vary)
-
-    print("Scan", scan["idx"])
-    print(result.fit_report())
-
-    d["ratio"] = (result.params["g_amp"].value - int_area.n) / result.params["g_amp"].value
-    d["int_area"] = int_area
-    d["fit_area"] = u.ufloat(result.params["g_amp"].value, result.params["g_amp"].stderr)
-    d["full_report"] = result.fit_report()
-    d["result"] = result
-    d["comps"] = comps
-    d["numfit"] = [numfit_min, numfit_max]
-    d["x_fit"] = x
-    scan["fit"] = d
--- a/pyzebra/fitvol3.py
+++ b/pyzebra/fitvol3.py
@ -1,167 +0,0 @@
-import numpy as np
-from lmfit import Model, Parameters
-from scipy.integrate import simps
-import matplotlib.pyplot as plt
-import uncertainties as u
-from lmfit.models import GaussianModel
-from lmfit.models import VoigtModel
-from lmfit.models import PseudoVoigtModel
-
-
-def bin_data(array, binsize):
-    if isinstance(binsize, int) and 0 < binsize < len(array):
-        return [
-            np.mean(array[binsize * i : binsize * i + binsize])
-            for i in range(int(np.ceil(len(array) / binsize)))
-        ]
-    else:
-        print("Binsize need to be positive integer smaller than lenght of array")
-        return array
-
-
-def create_uncertanities(y, y_err):
-    # create array with uncertanities for error propagation
-    combined = np.array([])
-    for i in range(len(y)):
-        part = u.ufloat(y[i], y_err[i])
-        combined = np.append(combined, part)
-    return combined
-
-
-def find_nearest(array, value):
-    # find nearest value and return index
-    array = np.asarray(array)
-    idx = (np.abs(array - value)).argmin()
-    return idx
-
-
-# predefined peak positions
-# peaks = [6.2,  8.1, 9.9, 11.5]
-peaks = [23.5, 24.5]
-# peaks = [24]
-def fitccl(scan, variable="omega", peak_type="gauss", binning=None):
-
-    x = list(scan[variable])
-    y = list(scan["Counts"])
-    peak_centre = np.mean(x)
-    if binning is None or binning == 0 or binning == 1:
-        x = list(scan[variable])
-        y = list(scan["Counts"])
-        y_err = list(np.sqrt(y)) if scan.get("sigma", None) is None else list(scan["sigma"])
-        print(scan["peak_indexes"])
-        if not scan["peak_indexes"]:
-            peak_centre = np.mean(x)
-        else:
-            centre = x[int(scan["peak_indexes"])]
-    else:
-        x = list(scan[variable])
-        if not scan["peak_indexes"]:
-            peak_centre = np.mean(x)
-        else:
-            peak_centre = x[int(scan["peak_indexes"])]
-        x = bin_data(x, binning)
-        y = list(scan["Counts"])
-        y_err = list(np.sqrt(y)) if scan.get("sigma", None) is None else list(scan["sigma"])
-        combined = bin_data(create_uncertanities(y, y_err), binning)
-        y = [combined[i].n for i in range(len(combined))]
-        y_err = [combined[i].s for i in range(len(combined))]
-
-    def background(x, slope, intercept):
-        """background"""
-        return slope * (x - peak_centre) + intercept
-
-    def gaussian(x, center, g_sigma, amplitude):
-        """1-d gaussian: gaussian(x, amp, cen, wid)"""
-        return (amplitude / (np.sqrt(2.0 * np.pi) * g_sigma)) * np.exp(
-            -((x - center) ** 2) / (2 * g_sigma ** 2)
-        )
-
-    def lorentzian(x, center, l_sigma, amplitude):
-        """1d lorentzian"""
-        return (amplitude / (1 + ((1 * x - center) / l_sigma) ** 2)) / (np.pi * l_sigma)
-
-    def pseudoVoigt1(x, center, g_sigma, amplitude, l_sigma, fraction):
-        """PseudoVoight peak with different widths of lorenzian and gaussian"""
-        return (1 - fraction) * gaussian(x, center, g_sigma, amplitude) + fraction * (
-            lorentzian(x, center, l_sigma, amplitude)
-        )
-
-    mod = Model(background)
-    params = Parameters()
-    params.add_many(
-        ("slope", 0, True, None, None, None, None), ("intercept", 0, False, None, None, None, None)
-    )
-    for i in range(len(peaks)):
-        if peak_type == "gauss":
-            mod = mod + GaussianModel(prefix="p%d_" % (i + 1))
-            params.add(str("p%d_" % (i + 1) + "amplitude"), 20, True, 0, None, None)
-            params.add(str("p%d_" % (i + 1) + "center"), peaks[i], True, None, None, None)
-            params.add(str("p%d_" % (i + 1) + "sigma"), 0.2, True, 0, 5, None)
-        elif peak_type == "voigt":
-            mod = mod + VoigtModel(prefix="p%d_" % (i + 1))
-            params.add(str("p%d_" % (i + 1) + "amplitude"), 20, True, 0, None, None)
-            params.add(str("p%d_" % (i + 1) + "center"), peaks[i], True, None, None, None)
-            params.add(str("p%d_" % (i + 1) + "sigma"), 0.2, True, 0, 3, None)
-            params.add(str("p%d_" % (i + 1) + "gamma"), 0.2, True, 0, 5, None)
-        elif peak_type == "pseudovoigt":
-            mod = mod + PseudoVoigtModel(prefix="p%d_" % (i + 1))
-            params.add(str("p%d_" % (i + 1) + "amplitude"), 20, True, 0, None, None)
-            params.add(str("p%d_" % (i + 1) + "center"), peaks[i], True, None, None, None)
-            params.add(str("p%d_" % (i + 1) + "sigma"), 0.2, True, 0, 5, None)
-            params.add(str("p%d_" % (i + 1) + "fraction"), 0.5, True, -5, 5, None)
-        elif peak_type == "pseudovoigt1":
-            mod = mod + Model(pseudoVoigt1, prefix="p%d_" % (i + 1))
-            params.add(str("p%d_" % (i + 1) + "amplitude"), 20, True, 0, None, None)
-            params.add(str("p%d_" % (i + 1) + "center"), peaks[i], True, None, None, None)
-            params.add(str("p%d_" % (i + 1) + "g_sigma"), 0.2, True, 0, 5, None)
-            params.add(str("p%d_" % (i + 1) + "l_sigma"), 0.2, True, 0, 5, None)
-            params.add(str("p%d_" % (i + 1) + "fraction"), 0.5, True, 0, 1, None)
-    # add parameters
-
-    result = mod.fit(
-        y, params, weights=[np.abs(1 / y_err[i]) for i in range(len(y_err))], x=x, calc_covar=True
-    )
-
-    comps = result.eval_components()
-
-    reportstring = list()
-    for keys in result.params:
-        if result.params[keys].value is not None:
-            str2 = np.around(result.params[keys].value, 3)
-        else:
-            str2 = 0
-        if result.params[keys].stderr is not None:
-            str3 = np.around(result.params[keys].stderr, 3)
-        else:
-            str3 = 0
-        reportstring.append("%s = %2.3f +/- %2.3f" % (keys, str2, str3))
-
-    reportstring = "\n".join(reportstring)
-
-    plt.figure(figsize=(20, 10))
-    plt.plot(x, result.best_fit, "k-", label="Best fit")
-
-    plt.plot(x, y, "b-", label="Original data")
-    plt.plot(x, comps["background"], "g--", label="Line component")
-    for i in range(len(peaks)):
-        plt.plot(
-            x,
-            comps[str("p%d_" % (i + 1))],
-            "r--",
-        )
-        plt.fill_between(x, comps[str("p%d_" % (i + 1))], alpha=0.4, label=str("p%d_" % (i + 1)))
-    plt.legend()
-    plt.text(
-        np.min(x),
-        np.max(y),
-        reportstring,
-        fontsize=9,
-        verticalalignment="top",
-    )
-    plt.title(str(peak_type))
-
-    plt.xlabel("Omega [deg]")
-    plt.ylabel("Counts [a.u.]")
-    plt.show()
-
-    print(result.fit_report())