# trexio/src/generator.py

import json

from os import listdir
from os.path import isfile, join, dirname, abspath

# Directory that contains this script and the directory one level above it;
# the JSON configuration is read from the latter.
fileDir = dirname(abspath(__file__))
parentDir = dirname(fileDir)

with open(join(parentDir,'trex.json'), 'r') as json_file:
    config0 = json.loads(json_file.read())

print('Metadata I/O currently not supported')
# TODO: the metadata group is dropped until its I/O is implemented
del config0['metadata']

# Keep only the groups that are processed for now
config = {
    name: content
    for name, content in config0.items()
    if name in ('nucleus', 'ecp')
}

groups = list(config)

# Collect the symbolic (non-numeric) dimensions referenced in the configuration.
#   dim_variables : symbolic dimension name ('.' replaced by '_') -> 0
#   dim_dict      : group name -> unique symbolic dimensions used in that group
#                   (groups without any symbolic dimension get no entry)
dim_variables = {}
dim_list = []
dim_dict = {}
for grname, group_entries in config.items():
    # Start a fresh list per group so that every dimension of the group is
    # accumulated, not only the last one encountered
    dim_list = []
    for entry in group_entries.values():
        # the second element of an entry is iterated as its list of dimensions
        for dim in entry[1]:
            if dim.isdigit():
                # fixed-size dimension, not a variable
                continue
            tmp = dim.replace('.','_')
            dim_variables[tmp] = 0
            # compare the converted name, i.e. the form that is actually stored
            if tmp not in dim_list:
                dim_list.append(tmp)
    if dim_list:
        dim_dict[grname] = dim_list

#print(dim_variables)
#print(dim_dict)

# Split the configuration entries into
#   datasets : entries with at least one dimension (full entry is kept)
#   numbers  : dimensionless entries that are not used as a dimension
#              (only the first element of the entry is kept)
# Keys have the form '<group>_<name>'.
datasets = {}
numbers = {}
for group_name, group_entries in config.items():
    for entry_name, entry in group_entries.items():
        full_name = f'{group_name}_{entry_name}'
        if entry[1]:
            datasets[full_name] = entry
        elif full_name not in dim_variables:
            numbers[full_name] = entry[0]

print('Strings I/O currently not supported')
# TODO, for now remove char-related stuff

# Type names accepted in the configuration and the C type used for each
c_types = {'float': 'double', 'int': 'int64_t'}

# datasets_nostr: dataset name -> {'dtype': C type, 'dims': dimensions with
# '.' replaced by '_'}; datasets whose type mentions 'char' are left out.
datasets_nostr = {}
for k, v in datasets.items():
    if 'char' in v[0]:
        continue
    if v[0] not in c_types:
        # Fail loudly instead of reusing the type of the previous dataset
        raise ValueError(f"Unsupported data type '{v[0]}' for dataset '{k}'")
    datasets_nostr[k] = {
        'dtype': c_types[v[0]],
        'dims': [dim.replace('.','_') for dim in v[1]],
    }

#print(datasets_nostr)
#print(numbers)

#print(attributes)
#print(groups)

# Left empty here
file_list = []

# Directory with the HDF5 templates, located next to this script
temp_path = join(fileDir,'templates_hdf5')

# Templates that are never populated by the loops below
files_exclude = ['prefix_hdf5.c', 'prefix_hdf5.h', 'suffix_hdf5.h', 'templator_hdf5.org']

# Regular files of the template directory, minus the excluded ones
files = []
for entry in listdir(temp_path):
    if entry in files_exclude:
        continue
    if isfile(join(temp_path, entry)):
        files.append(entry)

# A template holds functions when its name contains one of these markers;
# every other template is considered auxiliary.
func_markers = ('read_', 'write_', 'rw_')
files_funcs = []
files_auxil = []
for entry in files:
    if any(marker in entry for marker in func_markers):
        files_funcs.append(entry)
    else:
        files_auxil.append(entry)

# Function templates split by what they operate on
files_funcs_dsets = [entry for entry in files_funcs if 'dset' in entry]
files_funcs_nums  = [entry for entry in files_funcs if 'num' in entry]

# Build the files with functions for the dimensioning variables.
# Each template is instantiated once per entry of dim_variables and all
# instances are concatenated into 'populated/pop_<template name>'.
for fname in files_funcs_nums:
    fname_new = 'populated/pop_' + fname

    # Read the template once instead of re-opening it for every dimension
    with open(join(temp_path, fname), 'r') as f_in:
        template_lines = f_in.readlines()

    # Mode 'w': running the generator again replaces the previous output
    # instead of appending a second copy of every function to it
    with open(join(temp_path, fname_new), 'w') as f_out:
        for dim in dim_variables:

            # group name = part of the variable name before the first '_'
            grname = dim.split('_')[0]

            for line in template_lines:
                if '$' in line:
                    # the num placeholders go first, then the plain group ones
                    populated = line.replace('$GROUP_NUM$', dim.upper())
                    populated = populated.replace('$group_num$', dim)
                    populated = populated.replace('$group$', grname)
                    populated = populated.replace('$GROUP$', grname.upper())
                    f_out.write(populated)
                else:
                    f_out.write(line)

# Build the files with functions for the datasets.
# Each template is instantiated once per entry of datasets_nostr and all
# instances are concatenated into 'populated/pop_<template name>'.

# HDF5 type keyword used for each C type of datasets_nostr
h5_types = {'double': 'double', 'int64_t': 'long'}

for fname in files_funcs_dsets:
    fname_new = 'populated/pop_' + fname

    # Read the template once instead of re-opening it for every dataset
    with open(join(temp_path, fname), 'r') as f_in:
        template_lines = f_in.readlines()

    # Mode 'w': running the generator again replaces the previous output
    # instead of appending a second copy of every function to it
    with open(join(temp_path, fname_new), 'w') as f_out:
        for dset,params in datasets_nostr.items():

            # group name = part of the dataset name before the first '_'
            grname = dset.split('_')[0]

            if params['dtype'] not in h5_types:
                # Fail loudly instead of reusing the type of the previous dataset
                raise ValueError(f"No HDF5 type known for '{params['dtype']}' (dataset '{dset}')")
            h5_dtype = h5_types[params['dtype']]

            # Dimensions given by a variable rather than by a fixed number
            symbolic_dims = [dim for dim in params['dims'] if not dim.isdigit()]
            if len(symbolic_dims) > 1:
                print("TODO: this only populate 1 dim and not all !")

            # Placeholders in the order they have to be substituted: the
            # combined '$group$_$group_dset$' forms must be handled before
            # the plain '$group$' ones.
            replacements = [
                ('$GROUP$_$GROUP_DSET$', dset.upper()),
                ('$group$_$group_dset$', dset),
                ('$group_dset$', dset),
                ('$group_dset_dtype$', params['dtype']),
                ('$group_dset_h5_dtype$', h5_dtype),
                ('$group_dset_h5_dtype$'.upper(), h5_dtype.upper()),
            ]
            if symbolic_dims:
                # only the first symbolic dimension is populated for now
                replacements.append(('$group_dset_dim$', symbolic_dims[0]))
            replacements.append(('$group$', grname))
            replacements.append(('$GROUP$', grname.upper()))

            # Every template line is written exactly once per dataset, and
            # only after all of its placeholders have been substituted
            for line in template_lines:
                if '$' in line:
                    populated = line
                    for placeholder, value in replacements:
                        populated = populated.replace(placeholder, value)
                    f_out.write(populated)
                else:
                    f_out.write(line)

# Populate the auxiliary templates. A template line is repeated
#   - once per dataset      if it mentions a dataset placeholder,
#   - once per num variable if it mentions a num placeholder,
#   - once per group        if it mentions a group placeholder,
# and copied unchanged otherwise. The checks are made in that order.
for fname in ['def_hdf5.c', 'basic_hdf5.c', 'struct_hdf5.h'] :
    fname_new = 'populated/pop_' + fname
    with open(f'{temp_path}/{fname}', 'r') as f_in, \
         open(f'{temp_path}/{fname_new}', 'w') as f_out :
        for line in f_in :
            if any(tag in line for tag in ('$group_dset$', '$GROUP_DSET$')) :
                expanded = [
                    line.replace('$GROUP$_$GROUP_DSET$', dset.upper())
                        .replace('$group_dset$', dset)
                    for dset in datasets_nostr
                ]
            elif any(tag in line for tag in ('$group_num$', '$GROUP_NUM$')) :
                expanded = [
                    line.replace('$GROUP_NUM$', num.upper())
                        .replace('$group_num$', num)
                    for num in dim_variables
                ]
            elif any(tag in line for tag in ('$group$', '$GROUP$')) :
                expanded = [
                    line.replace('$group$', grname)
                        .replace('$GROUP$', grname.upper())
                    for grname in config
                ]
            else:
                expanded = [line]
            f_out.writelines(expanded)
initial generator 2021-03-05 16:50:44 +01:00			`import json`

dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`from os import listdir`
proper path-ing using os.path 2021-03-10 10:27:44 +01:00			`from os.path import isfile, join, dirname, abspath`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00
proper path-ing using os.path 2021-03-10 10:27:44 +01:00			`fileDir = dirname(abspath(__file__))`
			`parentDir = dirname(fileDir)`

			`with open(join(parentDir,'trex.json'), 'r') as f:`
initial generator 2021-03-05 16:50:44 +01:00			`config0 = json.load(f)`

			`print('Metadata I/O currently not supported')`
			`# TODO, for now remove metadata-related stuff`
			`del config0['metadata']`

			`config = {}`
			`for k,v in config0.items():`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`if k == 'nucleus' or k == 'ecp':`
initial generator 2021-03-05 16:50:44 +01:00			`config[k] = v`

dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`#print(config)`
initial generator 2021-03-05 16:50:44 +01:00
			`groups = [group for group in config.keys()]`

			`dim_variables = {}`
			`dim_list = []`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`dim_dict = {}`
initial generator 2021-03-05 16:50:44 +01:00			`for k1,v1 in config.items():`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`grname = k1`
initial generator 2021-03-05 16:50:44 +01:00			`for v2 in v1.values():`
			`for dim in v2[1]:`
			`if not dim.isdigit():`
			`tmp = dim.replace('.','_')`
			`dim_variables[tmp] = 0`
			`if dim not in dim_list:`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`dim_list.append(tmp)`

			`dim_dict[grname] = dim_list`
			`dim_list = []`

proper path-ing using os.path 2021-03-10 10:27:44 +01:00			`#print(dim_variables)`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`#print(dim_dict)`
initial generator 2021-03-05 16:50:44 +01:00
			`datasets = {}`
			`numbers = {}`
			`for k1,v1 in config.items():`
			`for k2,v2 in v1.items():`
			`if len(v2[1]) > 0:`
			`datasets[f'{k1}_{k2}'] = v2`
			`else:`
			`var_name = f'{k1}_{k2}'`
			`if var_name not in dim_variables.keys():`
			`numbers[var_name] = v2[0]`

			`print('Strings I/O currently not supported')`
			`# TODO, for now remove char-related stuff`
			`datasets_nostr = {}`
			`for k,v in datasets.items():`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`tmp_dict = {}`
initial generator 2021-03-05 16:50:44 +01:00			`if 'char' not in v[0]:`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`if v[0] == 'float':`
			`datatype = 'double'`
			`elif v[0] == 'int':`
			`datatype = 'int64_t'`
			`tmp_dict['dtype'] = datatype`
			`tmp_dict['dims'] = [dim.replace('.','_') for dim in v[1]]`
			`datasets_nostr[k] = tmp_dict`
initial generator 2021-03-05 16:50:44 +01:00
			`#print(datasets_nostr)`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`#print(numbers)`
initial generator 2021-03-05 16:50:44 +01:00
			`#print(attributes)`
			`#print(groups)`

dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`#file_list = ['temp_trexio_hdf5.c']`
			`file_list = []`

proper path-ing using os.path 2021-03-10 10:27:44 +01:00			`temp_path = join(fileDir,'templates_hdf5')`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00
			`files_exclude = ['prefix_hdf5.c', 'prefix_hdf5.h', 'suffix_hdf5.h', 'templator_hdf5.org']`
initial generator 2021-03-05 16:50:44 +01:00
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`files = [f for f in listdir(temp_path) if isfile(join(temp_path, f)) and f not in files_exclude]`
			`#print(files)`

			`files_funcs = [f for f in files if 'read_' in f or 'write_' in f or 'rw_' in f ]`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`files_funcs_dsets = [f for f in files_funcs if 'dset' in f]`
			`files_funcs_nums = [f for f in files_funcs if 'num' in f]`

dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`files_auxil = [f for f in files if not ('read_' in f or 'write_' in f or 'rw_' in f)]`

TODO: properly populate dimensions in write_dset 2021-03-09 16:31:12 +01:00			`# build files with functions`
			`for fname in files_funcs_nums:`
			`fname_new = 'populated/pop_' + fname`
			`for dim in dim_variables.keys():`

			`grname = dim.split('_')[0]`

			`with open(f'{temp_path}/{fname}', 'r') as f_in :`
			`with open(f'{temp_path}/{fname_new}', 'a') as f_out :`
			`for line in f_in :`
			`if '$' in line:`
			`templine1 = line.replace('$GROUP_NUM$', dim.upper())`
			`templine2 = templine1.replace('$group_num$', dim)`

			`templine1 = templine2.replace('$group$', grname)`
			`templine2 = templine1.replace('$GROUP$', grname.upper())`

			`f_out.write(templine2)`
			`else:`
			`f_out.write(line)`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00
			`# build files with functions`
TODO: properly populate dimensions in write_dset 2021-03-09 16:31:12 +01:00			`for fname in files_funcs_dsets:`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`fname_new = 'populated/pop_' + fname`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`for dset,params in datasets_nostr.items():`

			`grname = dset.split('_')[0]`

			`with open(f'{temp_path}/{fname}', 'r') as f_in :`
			`with open(f'{temp_path}/{fname_new}', 'a') as f_out :`
			`for line in f_in :`
			`if '$' in line:`
			`templine1 = line.replace('$GROUP$_$GROUP_DSET$', dset.upper())`
			`templine2 = templine1.replace('$group$_$group_dset$', dset)`

			`templine1 = templine2.replace('$group_dset$', dset)`
			`templine2 = templine1`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`templine1 = templine2.replace('$group_dset_dtype$', params['dtype'])`
			`templine2 = templine1`

			`if params['dtype'] == 'double':`
			`h5_dtype = 'double'`
			`elif params['dtype'] == 'int64_t':`
			`h5_dtype = 'long'`

			`templine1 = templine2.replace('$group_dset_h5_dtype$', h5_dtype)`
			`templine2 = templine1.replace('$group_dset_h5_dtype$'.upper(), h5_dtype.upper())`

			`for dim in params['dims']:`
			`if dim.isdigit():`
			`continue`
			`else:`
TODO: properly populate dimensions in write_dset 2021-03-09 16:31:12 +01:00			`print("TODO: this only populate 1 dim and not all !")`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`templine1 = templine2.replace('$group_dset_dim$', dim)`
			`templine2 = templine1`
TODO: properly populate dimensions in write_dset 2021-03-09 16:31:12 +01:00
			`f_out.write(templine2)`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00
			`templine1 = templine2.replace('$group$', grname)`
			`templine2 = templine1.replace('$GROUP$', grname.upper())`

			`f_out.write(templine2)`
			`else:`
			`f_out.write(line)`
initial generator 2021-03-05 16:50:44 +01:00
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`# build files with $group$ and $group$-based`
wip: generate read/write_dset functions 2021-03-09 15:48:32 +01:00			`for fname in ['def_hdf5.c', 'basic_hdf5.c', 'struct_hdf5.h'] :`
dummy generator for auxiliary files 2021-03-09 11:58:47 +01:00			`fname_new = 'populated/pop_' + fname`
			`with open(f'{temp_path}/{fname}', 'r') as f_in :`
			`with open(f'{temp_path}/{fname_new}', 'w') as f_out :`
			`for line in f_in :`
			`if '$group_dset$' in line or '$GROUP_DSET$' in line :`
			`for dset in datasets_nostr.keys():`
			`templine1 = line.replace('$GROUP$_$GROUP_DSET$', dset.upper())`
			`templine2 = templine1.replace('$group_dset$', dset)`
			`f_out.write(templine2)`
			`elif '$group_num$' in line or '$GROUP_NUM$' in line :`
			`for num in dim_variables.keys():`
			`templine1 = line.replace('$GROUP_NUM$', num.upper())`
			`templine2 = templine1.replace('$group_num$', num)`
			`f_out.write(templine2)`
			`elif '$group$' in line or '$GROUP$' in line :`
			`for grname in config.keys():`
			`templine1 = line.replace('$group$', grname)`
			`templine2 = templine1.replace('$GROUP$', grname.upper())`
			`f_out.write(templine2)`
initial generator 2021-03-05 16:50:44 +01:00			`else:`
			`f_out.write(line)`