import logging import os import sys import numpy as np from orsopy import fileio from .command_line import expand_file_list from .file_reader import AmorData from .header import Header from .options import EOSConfig from .instrument import Grid class AmorReduction: def __init__(self, config: EOSConfig): self.experiment_config = config.experiment self.reader_config = config.reader self.reduction_config = config.reductoin self.output_config = config.output self.grid = Grid(config.reductoin.qResolution) self.header = Header() def reduce(self): if not os.path.exists(f'{self.reader_config.dataPath}'): logging.debug(f'Creating destination path {self.reader_config.dataPath}') os.system(f'mkdir {self.reader_config.dataPath}') # load or create normalisation matrix if self.reduction_config.normalisationFileIdentifier: self.create_normalisation_map(self.reduction_config.normalisationFileIdentifier[0]) else: self.norm_lz = self.grid.lz() self.normAngle = 1. logging.warning('normalisation matrix: none requested') # load R(q_z) curve to be subtracted: if self.reduction_config.subtract: self.sq_q, self.sR_q, self.sdR_q, self.sFileName = self.loadRqz(self.reduction_config.subtract) logging.warning(f'loaded background file: {self.sFileName}') self.header.reduction.corrections.append(f'background from \'{self.sFileName}\' subtracted') self.subtract = True else: self.subtract = False # load measurement data and do the reduction self.datasetsRqz = [] self.datasetsRlt = [] for i, short_notation in enumerate(self.reduction_config.fileIdentifier): self.read_file_block(i, short_notation) # output logging.warning('output:') if 'Rqz.ort' in self.output_config.outputFormats: self.save_Rqz() if 'Rlt.ort' in self.output_config.outputFormats: self.save_Rtl() def read_file_block(self, i, short_notation): logging.warning('reading input:') self.header.measurement_data_files = [] self.file_reader = AmorData(header=self.header, reader_config=self.reader_config, config=self.experiment_config, short_notation=short_notation) if self.reduction_config.timeSlize: self.read_timeslices(i) else: self.read_unsliced(i) def read_unsliced(self, i): lamda_e = self.file_reader.lamda_e detZ_e = self.file_reader.detZ_e qz_lz, ref_lz, err_lz, res_lz, lamda_lz, theta_lz, int_lz, self.mask_lz = self.project_on_lz( self.file_reader, self.norm_lz, self.normAngle, lamda_e, detZ_e) try: ref_lz *= self.reduction_config.scale[i] err_lz *= self.reduction_config.scale[i] except IndexError: ref_lz *= self.reduction_config.scale[-1] err_lz *= self.reduction_config.scale[-1] if 'Rqz.ort' in self.output_config.outputFormats: headerRqz = self.header.orso_header() headerRqz.data_set = f'Nr {i} : mu = {self.file_reader.mu:6.3f} deg' # projection on q-grid q_q, R_q, dR_q, dq_q = self.project_on_qz(qz_lz, ref_lz, err_lz, res_lz, self.norm_lz, self.mask_lz) filter_q = np.where((self.experiment_config.qzRange[0]0, filter_q, False) if len(filter_q[filter_q]) > 0: scale = np.sum(R_q[filter_q]**2/dR_q[filter_q]) / np.sum(R_q[filter_q]/dR_q[filter_q]) else: logging.warning(f'# automatic scaling not possible') scale = 1. else: filter_q = np.where(np.isnan(pR_q*R_q), False, True) filter_q = np.where(R_q>0, filter_q, False) filter_q = np.where(pR_q>0, filter_q, False) if len(filter_q[filter_q]) > 0: scale = np.sum(R_q[filter_q]**3 * pR_q[filter_q] / (dR_q[filter_q]**2 * pdR_q[filter_q]**2)) \ / np.sum(R_q[filter_q]**2 * pR_q[filter_q]**2 / (dR_q[filter_q]**2 * pdR_q[filter_q]**2)) else: logging.warning(f'# automatic scaling not possible') scale = 1. R_q /= scale dR_q /= scale logging.debug(f'# scaling factor = {scale}') return R_q, dR_q def project_on_qz(self, q_lz, R_lz, dR_lz, dq_lz, norm_lz, mask_lz): q_q = self.grid.q() mask_lzf = mask_lz.flatten() q_lzf = q_lz.flatten()[mask_lzf] R_lzf = R_lz.flatten()[mask_lzf] dR_lzf = dR_lz.flatten()[mask_lzf] dq_lzf = dq_lz.flatten()[mask_lzf] norm_lzf = norm_lz.flatten()[mask_lzf] N_q = np.histogram(q_lzf, bins = q_q, weights = norm_lzf )[0] N_q = np.where(N_q > 0, N_q, np.nan) R_q = np.histogram(q_lzf, bins = q_q, weights = norm_lzf * R_lzf )[0] R_q = R_q / N_q dR_q = np.histogram(q_lzf, bins = q_q, weights = (norm_lzf * dR_lzf)**2 )[0] dR_q = np.sqrt( dR_q ) / N_q # TODO: different error propagations for dR and dq! N_q = np.histogram(q_lzf, bins = q_q, weights = norm_lzf**2 )[0] N_q = np.where(N_q > 0, N_q, np.nan) dq_q = np.histogram(q_lzf, bins = q_q, weights = (norm_lzf * dq_lzf)**2 )[0] dq_q = np.sqrt( dq_q / N_q ) q_q = 0.5 * (q_q + np.roll(q_q, 1)) return q_q[1:], R_q, dR_q, dq_q def loadRqz(self, name): fname = os.path.join(self.reader_config.dataPath, name) if os.path.exists(fname): fileName = fname elif os.path.exists(f'{fname}.Rqz.ort'): fileName = f'{fname}.Rqz.ort' else: sys.exit(f'### the background file \'{fname}\' does not exist! => stopping') q_q, Sq_q, dS_q = np.loadtxt(fileName, usecols=(0, 1, 2), comments='#', unpack=True) return q_q, Sq_q, dS_q, fileName def create_normalisation_map(self, short_notation): dataPath = self.reader_config.dataPath normalisation_list = expand_file_list(short_notation) name = str(normalisation_list[0]) for i in range(1, len(normalisation_list), 1): name = f'{name}_{normalisation_list[i]}' n_path = os.path.join(dataPath, f'{name}.norm') if os.path.exists(n_path): logging.info(f'# normalisation matrix: found and using {n_path}') self.norm_lz = np.loadtxt(f'{dataPath}/{name}.norm') with open(n_path, 'r') as fh: fh.readline() self.normFileList = fh.readline().split('[')[1].split(']')[0].replace('\'', '').split(', ') self.normAngle = float(fh.readline().split('= ')[1]) for i, entry in enumerate(self.normFileList): self.normFileList[i] = entry.split('/')[-1] self.header.measurement_additional_files = self.normFileList else: logging.info(f'# normalisation matrix: using the files {normalisation_list}') fromHDF = AmorData(header=self.header, reader_config=self.reader_config, config=self.experiment_config, short_notation=short_notation, norm=True) self.normAngle = fromHDF.nu - fromHDF.mu lamda_e = fromHDF.lamda_e detZ_e = fromHDF.detZ_e self.norm_lz, bins_l, bins_z = np.histogram2d(lamda_e, detZ_e, bins = (self.grid.lamda(), self.grid.z())) self.norm_lz = np.where(self.norm_lz>0, self.norm_lz, np.nan) # correct for the SM reflectivity lamda_l = self.grid.lamda() theta_z = self.normAngle + fromHDF.delta_z lamda_lz = (self.grid.lz().T*lamda_l[:-1]).T theta_lz = self.grid.lz()*theta_z qz_lz = 4.0*np.pi * np.sin(np.deg2rad(theta_lz)) / lamda_lz Rsm_lz = np.ones(np.shape(qz_lz)) Rsm_lz = np.where(qz_lz>0.0217, 1-(qz_lz-0.0217)*(0.0625/0.0217), Rsm_lz) Rsm_lz = np.where(qz_lz>0.0217*5, np.nan, Rsm_lz) self.norm_lz = self.norm_lz / Rsm_lz if len(lamda_e) > 1e6: head = ('normalisation matrix based on the measurements\n' f'{fromHDF.file_list}\n' f'nu - mu = {self.normAngle}\n' f'shape= {np.shape(self.norm_lz)} (lambda, z)\n' f'measured at mu = {fromHDF.mu:6.3f} deg\n' f'N(l_lambda, z) = theta(z) / sum_i=-1..1 I(l_lambda+i, z)') head = head.replace('../', '') head = head.replace('./', '') head = head.replace('raw/', '') np.savetxt(f'{dataPath}/{name}.norm', self.norm_lz, header = head) self.normFileList = fromHDF.file_list self.header.reduction.corrections.append('normalisation with \'additional files\'') def project_on_lz(self, fromHDF, norm_lz, normAngle, lamda_e, detZ_e): # projection on lambda-z-grid lamda_l = self.grid.lamda() theta_z = fromHDF.nu - fromHDF.mu + fromHDF.delta_z lamda_lz = (self.grid.lz().T*lamda_l[:-1]).T theta_lz = self.grid.lz()*theta_z thetaN_z = fromHDF.delta_z + normAngle thetaN_lz = np.ones(np.shape(norm_lz))*thetaN_z thetaN_lz = np.where(np.absolute(thetaN_lz)>5e-3, thetaN_lz, np.nan) mask_lz = np.where(np.isnan(norm_lz), False, True) mask_lz = np.logical_and(mask_lz, np.where(np.absolute(thetaN_lz)>5e-3, True, False)) mask_lz = np.logical_and(mask_lz, np.where(np.absolute(theta_lz)>5e-3, True, False)) if self.reduction_config.thetaRange[1]<12: mask_lz = np.logical_and(mask_lz, np.where(theta_lz >= self.reduction_config.thetaRange[0], True, False)) mask_lz = np.logical_and(mask_lz, np.where(theta_lz <= self.reduction_config.thetaRange[1], True, False)) if self.reduction_config.thetaRangeR[1]<12: t0 = fromHDF.nu - fromHDF.mu mask_lz = np.logical_and(mask_lz, np.where(theta_lz-t0 >= self.reduction_config.thetaRangeR[0], True, False)) mask_lz = np.logical_and(mask_lz, np.where(theta_lz-t0 <= self.reduction_config.thetaRangeR[1], True, False)) if self.experiment_config.lambdaRange[1]<15: mask_lz = np.logical_and(mask_lz, np.where(lamda_lz >= self.experiment_config.lambdaRange[0], True, False)) mask_lz = np.logical_and(mask_lz, np.where(lamda_lz <= self.experiment_config.lambdaRange[1], True, False)) # gravity correction #theta_lz += np.rad2deg( np.arctan( 3.07e-10 * (fromHDF.detectorDistance + detXdist_e) * lamda_lz**2 ) ) theta_lz += np.rad2deg( np.arctan( 3.07e-10 * fromHDF.detectorDistance * lamda_lz**2 ) ) z_z = enumerate(theta_z) qz_lz = 4.0*np.pi * np.sin(np.deg2rad(theta_lz)) / lamda_lz int_lz, bins_l, bins_z = np.histogram2d(lamda_e, detZ_e, bins = (lamda_l, self.grid.z())) # cut normalisation sample horizon int_lz = np.where(mask_lz, int_lz, np.nan) thetaF_lz = np.where(mask_lz, theta_lz, np.nan) ref_lz = (int_lz * np.absolute(thetaN_lz)) / (norm_lz * np.absolute(thetaF_lz)) err_lz = ref_lz * np.sqrt( 1/(int_lz+.1) + 1/norm_lz ) res_lz = np.ones((np.shape(lamda_l[:-1])[0], np.shape(theta_z)[0])) * 0.022**2 res_lz = res_lz + (0.008/theta_lz)**2 res_lz = qz_lz * np.sqrt(res_lz) return qz_lz, ref_lz, err_lz, res_lz, lamda_lz, theta_lz, int_lz, mask_lz @staticmethod def histogram2d_lz(lamda_e, detZ_e, bins): """ Perform binning operation equivalent to numpy bin2d for the sepcial case of the second dimension using integer positions (pre-defined pixels). Based on the devide_bin algorithm below. """ dimension = bins[1].shape[0]-1 if not (np.array(bins[1])==np.arange(dimension+1)).all(): raise ValueError("histogram2d_lz requires second bin dimension to be contigous integer range") binning = AmorReduction.devide_bin(lamda_e, detZ_e.astype(np.int64), bins[0], dimension) return np.array(binning), bins[0], bins[1] @staticmethod def devide_bin(lambda_e, position_e, lamda_edges, dimension): ''' Use a divide and conquer strategy to bin the data. For the actual binning the numpy bincount function is used, as it is much faster than histogram for counting of integer values. :param lambda_e: Array of wavelength for each event :param position_e: Array of positional indices for each event :param lamda_edges: The edges of bins to be used for the histogram :param dimension: position number of buckets in output arrray :return: 2D list of dimensions (lambda, x) of counts ''' if len(lambda_e)==0: # no more events in range, return empty bins return [np.zeros(dimension, dtype=int).tolist()]*(len(lamda_edges)-1) if len(lamda_edges)==2: # deepest recursion reached, all items should be within the two ToF edges return [np.bincount(position_e, minlength=dimension).tolist()] # split all events into two time of flight regions split_idx = len(lamda_edges)//2 left_region = lambda_e