Source code for utils.file_reader

import json
import os
import time

import numpy as np
import pandas as pd


class FileReader:
    """Readers that load text, Excel, SLANS ``.svl`` and JSON files.

    The instance keeps no state; every reader takes the path of the file to
    load and returns a pandas ``DataFrame`` or a plain dictionary.
    """

    # (result key, text searched for in a line) pairs used by ``svl_reader``.
    # The key and the searched text differ for the electric field entry: the
    # code looks for 'MAXIMUM ELEC.FIELD' but stores under 'MAXIMUM ELEC. FIELD'.
    _SVL_FIELDS = (
        ('FREQUENCY', 'FREQUENCY'),
        ('LENGTH OF WAVE', 'LENGTH OF WAVE'),
        ('WAVE VALUE', 'WAVE VALUE'),
        ('QUALITY FACTOR', 'QUALITY FACTOR'),
        ('STORED ENERGY', 'STORED ENERGY'),
        ('TRANSIT TIME', 'TRANSIT TIME'),
        ('EFFECTIVE IMPEDANCE', 'EFFECTIVE IMPEDANCE'),
        ('SHUNT IMPEDANCE', 'SHUNT IMPEDANCE'),
        ('MAXIMUM MAG. FIELD', 'MAXIMUM MAG. FIELD'),
        ('MAXIMUM ELEC. FIELD', 'MAXIMUM ELEC.FIELD'),
        ('ACCELERATION', 'ACCELERATION'),
        ('ACCELERATION RATE', 'ACCELERATION RATE'),
        ('AVERAGE E.FIELD ON AXIS', 'AVERAGE E.FIELD ON AXIS'),
        ('KM (Emax/Accel.rate)', 'KM (Emax/Accel.rate)'),
        ('KH (Hmax*Z0/Accel.rate)', 'KH (Hmax*Z0/Accel.rate)'),
    )

    def __init__(self):
        """Create a reader; nothing is stored on the instance."""
        pass

    def to_pd_dataframe(self):
        """Placeholder: prints a message and returns ``None``."""
        print("it works")
        # TAKES IN PYTHON DICTIONARY AS ARGUMENT AND RETURNS PANDAS DATAFRAME
        pass

    def txt_reader(self, filename, delimeter=None):
        """Read a delimited text file of numbers into a DataFrame.

        Parameters
        ----------
        filename : str
            Path of the text file to read.
        delimeter : str, optional
            Separator handed to ``str.split``. ``None`` (the default) splits
            on any run of whitespace.

        Returns
        -------
        pandas.DataFrame
            One row per line of the file, with columns labelled ``"0"``,
            ``"1"``, ... Rows shorter than the longest one are padded with
            missing values. An empty file yields an empty DataFrame.

        Raises
        ------
        ValueError
            If a non-empty token cannot be converted to ``float``.
        """
        rows = []
        with open(filename, 'r') as f:
            for raw in f:
                tokens = raw.strip().split(delimeter)
                # Empty tokens come from repeated or trailing delimiters.
                rows.append([float(tok) for tok in tokens if tok != ''])

        # Width of the widest row; 0 when the file has no lines at all.
        width = max((len(row) for row in rows), default=0)
        for row in rows:
            row.extend([None] * (width - len(row)))

        # Column-oriented dictionary keyed by the column position as a string.
        data_dict = {f"{col}": [row[col] for row in rows] for col in range(width)}

        return pd.DataFrame.from_dict(data_dict, orient='index').transpose()

    def excel_reader(self, filename):
        """Read every sheet of an Excel workbook.

        Parameters
        ----------
        filename : str
            Path of the workbook.

        Returns
        -------
        dict
            Maps each sheet name to the DataFrame parsed from that sheet.
        """
        # The context manager closes the workbook handle once parsing is done.
        with pd.ExcelFile(filename) as workbook:
            return {sheet: workbook.parse(sheet) for sheet in workbook.sheet_names}

    def svl_reader(self, filename):
        """Collect the numeric results listed in a ``.svl`` text file.

        Each line is searched for a set of fixed labels; for every label found
        the first number following it is appended to that label's list.

        Parameters
        ----------
        filename : str
            Path of the file to scan.

        Returns
        -------
        dict
            Maps each label to the list of values found, in file order.
            ``'TITLE'`` holds the raw lines that contain ``'*SLANS*'``.

        Raises
        ------
        ValueError
            If a line contains ``'CAVITY RADIUS'`` but not ``'LENGTH'``.
        """
        results = {'TITLE': [], 'CAVITY RADIUS': [], 'LENGTH': []}
        results.update({key: [] for key, _ in self._SVL_FIELDS})

        with open(filename, 'r') as f:
            for line in f:
                if '*SLANS*' in line:
                    results['TITLE'].append(line)

                # The cavity length is read from the same line as the radius.
                if 'CAVITY RADIUS' in line:
                    results['CAVITY RADIUS'].append(self._process_line(line, 'CAVITY RADIUS'))
                    results['LENGTH'].append(self._process_line(line, 'LENGTH'))

                for key, marker in self._SVL_FIELDS:
                    if marker not in line:
                        continue
                    # 'ACCELERATION' is a prefix of 'ACCELERATION RATE'; lines
                    # mentioning RATE belong to the latter only.
                    if key == 'ACCELERATION' and 'RATE' in line:
                        continue
                    results[key].append(self._process_line(line, marker))

        return results

    def top_reader(self):
        """Placeholder: not implemented, returns ``None``."""
        pass

    @staticmethod
    def json_reader(filename, header=None):
        """Read a JSON file into a DataFrame.

        If the first row of the loaded frame is labelled ``"IC"``, the values
        of that row are expanded into their own DataFrame (one row per original
        column) with the columns ``A, B, ai, bi, Ri, L, Req, alpha``. Otherwise
        the frame is returned as loaded.

        Parameters
        ----------
        filename : str
            Path of the JSON file.
        header : list, optional
            Replacement column names. Applied only when its length matches the
            number of columns; otherwise a message is printed and the original
            names are kept.

        Returns
        -------
        pandas.DataFrame
            The expanded ``"IC"`` table when the expansion succeeds, else the
            frame produced by ``pandas.read_json``.
        """
        df = pd.read_json(filename)

        if header:
            n_columns = len(df.columns)
            if len(header) == n_columns:
                df.columns = header
            else:
                print(f'Expected header length of {n_columns}, got {len(header)}.')

        # Best effort: any failure means the file does not have the expected
        # layout, in which case the plain frame is returned.
        try:
            first_row = df[:][:1].loc["IC"]
            dd = first_row.apply(pd.Series)
            # No ``inplace`` keyword: it was removed in pandas 2.0 and
            # set_axis already returns a new object.
            dd = dd.set_axis(["A", "B", "ai", "bi", "Ri", "L", "Req", "alpha"], axis=1)
        except Exception:
            return df

        return dd  # dd is a dataframe whose columns are the cavity geometry variables

    def pam_reader(self):
        """Placeholder: not implemented, returns ``None``."""
        pass

    def _process_line(self, line, request):
        """Return the first number that follows ``request`` in ``line``.

        Parameters
        ----------
        line : str
            Text to search.
        request : str
            Label that must occur in ``line``.

        Returns
        -------
        float or int
            The first space-separated token at or after ``request`` that
            parses as ``float``; ``0`` when no token does.

        Raises
        ------
        ValueError
            If ``request`` does not occur in ``line``.
        """
        # Keep only the text starting at the requested label.
        tail = line[line.index(request):]
        for token in tail.strip().split(" "):
            try:
                return float(token)
            except ValueError:
                continue
        return 0

    @staticmethod
    def _merge_json_files(sources, destination):
        """Merge the JSON objects in ``sources`` (later files win) into ``destination``."""
        merged = {}
        for path in sources:
            with open(path, 'r') as fh:
                merged.update(json.load(fh))

        with open(destination, 'w') as file:
            file.write(json.dumps(merged, indent=4, separators=(',', ': ')))

    def _combineDict(self, args):
        """Merge the three population and three freq_diff result files.

        Reads ``Results/population*.json`` and ``Results/freq_diff*.json`` and
        writes the merged objects to ``population.json`` and ``freq_diff.json``
        in the current working directory.

        Parameters
        ----------
        args
            Unused; kept so existing callers keep working.
        """
        self._merge_json_files(
            ('Results/population.json', 'Results/population2.json', 'Results/population3.json'),
            'population.json',
        )
        self._merge_json_files(
            ('Results/freq_diff.json', 'Results/freq_diff2.json', 'Results/freq_diff3.json'),
            'freq_diff.json',
        )

    def _updateDict(self, d1, d2):
        """Extend every value of ``d1`` with the value stored under the same key in ``d2``.

        ``d1`` is modified in place and returned. Keys present only in ``d2``
        are ignored.

        Raises
        ------
        KeyError
            If a key of ``d1`` is missing from ``d2``.
        """
        for key in d1:
            d1[key] += d2[key]

        return d1


if __name__ == '__main__':
    # Manual smoke test: loads a sample JSON file from a hard-coded local path
    # and prints the result. The commented blocks are earlier usage examples.
    fr = FileReader()
    # txt = fr.txt_reader(r"D:\Dropbox\2D_Codes\ABCI_software\Python_ABCI\node_editor/SLANS/Cavity382/cavity_mm.pam")
    # fr.txt_reader(r"D:\Dropbox\2D_Codes\ABCI_software\Python_ABCI\node_editor/SLANS/Cavity1/cavity_mm_7.af")
    # df = fr.excel_reader(r'D:\Dropbox\2D_Codes\ABCI_software\Python_ABCI\Dataframe_full_data.xlsx')
    # print([[x] for x in df["Midcell node_editor"].iloc[0][1:8]])
    # print(len(df["Midcell node_editor"]))
    # print([[x] for x in df["Midcell node_editor"].iloc[0][8:20]])
    # print([[x] for x in df["Midcell node_editor"].iloc[0][10:11]])

    # # dataframe from json
    # dir = r'D:\Dropbox\2D_Codes\ABCI_software\Python_ABCI\Cavity Population/pseudo_shape_space.json'
    # df = fr.json_reader(dir, ['A', 'B', 'a', 'b', 'Ri', 'L'])
    # for value in df.to_dict(orient='list').values():
    #     print(value)

    # # svl reader
    # dir = r'D:\Dropbox\2D_Codes\ABCI_software\Python_ABCI\node_editor\SLANS\Cavity_process_0/cavity_mm.svl'
    # d = fr.svl_reader(dir)
    # print(d['FREQUENCY'])

    # json reader
    durr = r"D:\Dropbox\CavityDesignHub\SampleProject\Cavities\test.json"

    d = fr.json_reader(durr)
    print(type(d))
    print(d)

    # Expand the "IC" row into its own dataframe, but only when json_reader
    # handed back the raw frame; if it already returned the expanded table
    # there is no "IC" row and the lookup would raise KeyError.
    if len(d.index) > 0 and d.index[0] == "IC":
        t = d[:][:1].loc["IC"]
        dd = t.apply(pd.Series)
        # No ``inplace`` keyword: it was removed in pandas 2.0 and set_axis
        # already returns a new object.
        dd = dd.set_axis(["A", "B", "a", "b", "Ri", "L", "Req", "alpha"], axis=1)