Refactor split_scans

2022-06-20 16:08:36 +02:00 · 2022-06-20 16:08:36 +02:00 · 7214746af1
commit 7214746af1
parent 9c6a7d5991
1 changed files with 93 additions and 66 deletions
--- a/nafuma/xanes/io.py
+++ b/nafuma/xanes/io.py
@ -3,93 +3,119 @@ import matplotlib.pyplot as plt
 import os
 import numpy as np
 import nafuma.auxillary as aux
 from nafuma.xanes.calib import find_element
-def split_xanes_scan(root, destination=None, replace=False):
+def split_scan_data(data: dict, options={}):
    required_options = ['save', 'save_folder', 'replace', 'add_rois']
    default_options = {
        'save': False,
        'save_folder': '.',
        'replace': False,
        'add_rois': False
    }
    options = aux.update_options(options=options, required_options=required_options, default_options=default_options)
    #root is the path to the beamtime-folder
    #destination should be the path to the processed data
    #insert a for-loop to go through all the folders.dat-files in the folder root\xanes\raw
    # FIXME Only adding this variable to pass the Linting-tests - will refactor this later
    filename = 'dummy'
-    with open(filename, 'r') as f:
+    if not isinstance(data['path'], list):
-        lines = f.readlines()
+        data['path'] = [data['path']]
-    datas = []
+    all_scans = []
    data = []
    headers = []
    header = ''
    start = False
-    for line in lines:
+    for filename in data['path']:
        if line[0:2] == "#L":
            start = True
            header = line[2:].split()
            continue
-        elif line[0:2] == "#C":
+        with open(filename, 'r') as f:
-            start = False
+            lines = f.readlines()
-            if data:
+        scan_datas, scan_data = [], []
-                datas.append(data)
+        headers, header = [], ''
-                data = []
+        read_data = False
-            if header:
+        for line in lines:
-                headers.append(header)
+            # Header line starts with #L - reads headers, and toggles data read-in on
-                header = ''
+            if line[0:2] == "#L":
                header, read_data = line[2:].split(), True
                continue
            # First line after data started with #C - stops data read-in
            elif line[0:2] == "#C":
                read_data = False
                if scan_data:
                    scan_datas.append(scan_data); scan_data = []
                if header:
                    headers.append(header); header = ''
            # Ignore line if read-in not toggled       
            if read_data == False:
                continue
            # Read in data if it is
            else:
                scan_data.append(line.split())
-
+        edges = {'Mn': [], 'Fe': [], 'Co': [], 'Ni': []}
        if start == False:
            continue
        else:
            data.append(line.split())
        for i, scan_data in enumerate(scan_datas):
            xanes_df = pd.DataFrame(scan_data).apply(pd.to_numeric)
            xanes_df.columns = headers[i]
            if not ('xmap_roi00' in headers[i]) and (not 'xmap_roi01' in headers[i]):
                continue 
-    edges = {'Mn': [6.0, 6.1, 6.2, 6.3, 6.4, 6.5], 'Fe': [6.8, 6.9, 7.0, 7.1, 7.2], 'Co': [7.6, 7.7, 7.8, 7.9], 'Ni': [8.1, 8.2, 8.3, 8.4, 8.5]}
+            edge = find_element({'xanes_data_original': xanes_df})
-    edge_count = {'Mn': 0, 'Fe': 0, 'Co': 0, 'Ni': 0}
+            edges[edge].append(xanes_df)
-    for ind, data in enumerate(datas):
+        if options['add']:
        df = pd.DataFrame(data)
        df.columns = headers[ind]
-        edge_start = np.round((float(df["ZapEnergy"].min())), 1)
+            added_edges = {'Mn': [], 'Fe': [], 'Co': [], 'Ni': []}
            for edge, scans in edges.items():
                if scans:
                    xanes_df = scans[0]
-        for edge, energies in edges.items():
+                    for i, scan in enumerate(scans):
-            if edge_start in energies:
+                        if i > 0:
-                edge_actual = edge
+
-                edge_count[edge] += 1
+                            if 'xmap_roi00' in xanes_df.columns:
                                xanes_df['xmap_roi00'] += scan['xmap_roi00']
                            if 'xmap_roi01' in xanes_df.columns:
                                xanes_df['xmap_roi01'] += scan['xmap_roi01']
                    added_edges[edge].append(xanes_df)
            edges = added_edges
        if options['save']:
            if not os.path.isdir(options['save_folder']):
                os.makedirs(options['save_folder'])
            filename = os.path.basename(filename).split('.')[0]
-        filename = filename.split('/')[-1]
+            for edge, scans in edges.items():
-        count = str(edge_count[edge_actual]).zfill(4)
+                for i, scan in enumerate(scans):
-
+                    count = '' if options['add'] else '_'+str(i).zfill(4)
-        
+                    path = os.path.join(options['save_folder'], f'{filename}_{edge}{count}.dat')
-        # Save 
+                    scan.to_csv(path)
-        if destination:
+
-            cwd = os.getcwd()
+        all_scans.append(edges)
            if not os.path.isdir(destination):
                os.mkdir(destination)
            os.chdir(destination)
            df.to_csv('{}_{}_{}.dat'.format(filename.split('.')[0], edge_actual, count))
            os.chdir(cwd)
        else:
            df.to_csv('{}_{}_{}.dat'.format(filename.split('.')[0], edge_actual, count))
    return all_scans
@ -117,6 +143,7 @@ def read_data(data: dict, options={}) -> pd.DataFrame:
        columns.append(filename)
        scan_data = pd.read_csv(filename)
        scan_data = scan_data[[determine_active_roi(scan_data)]]
        xanes_data = pd.concat([xanes_data, scan_data], axis=1)