1
0
mirror of https://github.com/TREX-CoE/trexio.git synced 2024-08-24 22:21:43 +02:00
trexio/src/generator.py

182 lines
6.5 KiB
Python
Raw Normal View History

2021-03-05 16:50:44 +01:00
import json
2021-03-09 11:58:47 +01:00
from os import listdir
2021-03-10 10:27:44 +01:00
from os.path import isfile, join, dirname, abspath
2021-03-09 11:58:47 +01:00
2021-03-10 10:27:44 +01:00
# Resolve the directory holding this script and its parent directory; the
# JSON configuration file 'trex.json' is read from the parent directory.
fileDir = dirname(abspath(__file__))
parentDir = dirname(fileDir)

config_path = join(parentDir, 'trex.json')
with open(config_path, 'r') as f:
    config0 = json.load(f)

print('Metadata I/O currently not supported')
# TODO, for now remove metadata-related stuff
del config0['metadata']

# Only the 'nucleus' and 'ecp' groups are kept for code generation.
config = {
    name: content
    for name, content in config0.items()
    if name in ('nucleus', 'ecp')
}

# Names of the retained groups, in configuration order.
groups = list(config)
# Collect the symbolic (non-numeric) dimensions used by every group.
#
# Each entry of a group is indexed as entry[1] to obtain its list of
# dimensions. A dimension made only of digits is a fixed size and is skipped;
# any other dimension is a variable name in which '.' is replaced by '_'.
#
#   dim_variables : maps every normalized dimension name to the placeholder 0
#   dim_dict      : maps each group name to the list of distinct normalized
#                   dimension names used inside that group
dim_variables = {}
dim_list = []
dim_dict = {}
for k1, v1 in config.items():
    grname = k1
    for v2 in v1.values():
        for dim in v2[1]:
            if dim.isdigit():
                continue
            tmp = dim.replace('.', '_')
            dim_variables[tmp] = 0
            # The list stores normalized names, so the duplicate check must
            # use the normalized name as well; testing the raw name would
            # never match a dotted dimension and would append it repeatedly.
            if tmp not in dim_list:
                dim_list.append(tmp)

    dim_dict[grname] = dim_list
    # Start a fresh list for the next group.
    dim_list = []
2021-03-05 16:50:44 +01:00
# Split the configuration entries into datasets and plain numbers.
#
# An entry with a non-empty dimension list (entry[1]) is a dataset and is
# stored whole under '<group>_<name>'. An entry without dimensions is a number
# and only its type (entry[0]) is stored, unless the name is already known as
# a dimensioning variable.
datasets = {}
numbers = {}
for k1, v1 in config.items():
    for k2, v2 in v1.items():
        var_name = f'{k1}_{k2}'
        if v2[1]:
            datasets[var_name] = v2
        elif var_name not in dim_variables:
            numbers[var_name] = v2[0]

print('Strings I/O currently not supported')
# TODO, for now remove char-related stuff

# Configuration type name -> type name stored under 'dtype'.
dtype_map = {'float': 'double', 'int': 'int64_t'}

# Datasets without the char-based ones, described by their 'dtype' and by
# their dimension names with '.' replaced by '_'.
datasets_nostr = {}
for k, v in datasets.items():
    if 'char' in v[0]:
        continue
    if v[0] not in dtype_map:
        # Fail loudly rather than reuse the type of a previously processed
        # dataset (or hit an undefined name on the first iteration).
        raise ValueError(f'Unsupported data type {v[0]!r} for dataset {k!r}')
    datasets_nostr[k] = {
        'dtype': dtype_map[v[0]],
        'dims': [dim.replace('.', '_') for dim in v[1]],
    }
2021-03-09 11:58:47 +01:00
file_list = []

# Templates are read from the 'templates_hdf5' directory next to this script.
temp_path = join(fileDir, 'templates_hdf5')
# Entries of the template directory that are never processed here.
files_exclude = ['prefix_hdf5.c', 'prefix_hdf5.h', 'suffix_hdf5.h', 'templator_hdf5.org']

# Regular files of the template directory, minus the excluded ones.
files = []
for entry in listdir(temp_path):
    if entry in files_exclude:
        continue
    if isfile(join(temp_path, entry)):
        files.append(entry)

# A template whose name contains 'read_', 'write_' or 'rw_' is a function
# template; every other template is an auxiliary one.
files_funcs = []
files_auxil = []
for entry in files:
    if 'read_' in entry or 'write_' in entry or 'rw_' in entry:
        files_funcs.append(entry)
    else:
        files_auxil.append(entry)

# Function templates are further selected by the 'dset' / 'num' substring.
files_funcs_dsets = [name for name in files_funcs if 'dset' in name]
files_funcs_nums = [name for name in files_funcs if 'num' in name]
# Populate the 'num' function templates: for every dimensioning variable the
# whole template is appended to 'populated/pop_<template>' with its
# placeholders substituted.
for fname in files_funcs_nums:
    fname_new = 'populated/pop_' + fname
    template_path = f'{temp_path}/{fname}'
    output_path = f'{temp_path}/{fname_new}'
    for dim in dim_variables:
        # The group name is the part of the variable name before the first '_'.
        grname = dim.split('_')[0]
        # Applied in this order to every line of the template.
        substitutions = (
            ('$GROUP_NUM$', dim.upper()),
            ('$group_num$', dim),
            ('$group$', grname),
            ('$GROUP$', grname.upper()),
        )
        # Append mode: the output accumulates one copy of the template per
        # dimensioning variable.
        with open(template_path, 'r') as f_in, \
             open(output_path, 'a') as f_out:
            for line in f_in:
                # Every placeholder contains '$', so a line without '$' goes
                # through the substitutions unchanged.
                for placeholder, value in substitutions:
                    line = line.replace(placeholder, value)
                f_out.write(line)
# Populate the 'dset' function templates: for every supported dataset the
# whole template is appended to 'populated/pop_<template>' with its
# placeholders substituted.

# Stored 'dtype' name -> type name used for the '$group_dset_h5_dtype$'
# placeholder (also substituted in upper case).
h5_dtype_map = {'double': 'double', 'int64_t': 'long'}

for fname in files_funcs_dsets:
    fname_new = 'populated/pop_' + fname
    for dset, params in datasets_nostr.items():
        # The group name is the part of the dataset name before the first '_'.
        grname = dset.split('_')[0]
        h5_dtype = h5_dtype_map[params['dtype']]
        # Append mode: the output accumulates one copy of the template per
        # dataset.
        with open(f'{temp_path}/{fname}', 'r') as f_in, \
             open(f'{temp_path}/{fname_new}', 'a') as f_out:
            for line in f_in:
                if '$' not in line:
                    # No placeholder on this line: copy it verbatim.
                    f_out.write(line)
                    continue

                # Combined '<group>_<dataset>' placeholders first, then the
                # dataset-only ones.
                newline = line.replace('$GROUP$_$GROUP_DSET$', dset.upper())
                newline = newline.replace('$group$_$group_dset$', dset)
                newline = newline.replace('$group_dset$', dset)
                newline = newline.replace('$group_dset_dtype$', params['dtype'])
                newline = newline.replace('$group_dset_h5_dtype$', h5_dtype)
                newline = newline.replace('$GROUP_DSET_H5_DTYPE$', h5_dtype.upper())

                for dim in params['dims']:
                    if dim.isdigit():
                        continue
                    # Only the first non-numeric dimension takes effect: once
                    # the placeholder is replaced, later iterations find
                    # nothing left to substitute.
                    print("TODO: this only populate 1 dim and not all !")
                    newline = newline.replace('$group_dset_dim$', dim)

                newline = newline.replace('$group$', grname)
                newline = newline.replace('$GROUP$', grname.upper())
                # Write the line exactly once, after every placeholder has
                # been substituted, so no partly substituted or duplicated
                # line reaches the output.
                f_out.write(newline)
2021-03-05 16:50:44 +01:00
2021-03-09 11:58:47 +01:00
# Populate the group-level files. A template line holding a dataset, number
# or group placeholder is repeated once per dataset, dimensioning variable or
# group respectively; any other line is copied unchanged. The output file is
# overwritten on every run.
for fname in ['def_hdf5.c', 'basic_hdf5.c', 'struct_hdf5.h']:
    fname_new = 'populated/pop_' + fname
    with open(f'{temp_path}/{fname}', 'r') as f_in, \
         open(f'{temp_path}/{fname_new}', 'w') as f_out:
        for line in f_in:
            if '$group_dset$' in line or '$GROUP_DSET$' in line:
                # One copy of the line per supported dataset.
                expanded = [
                    line.replace('$GROUP$_$GROUP_DSET$', dset.upper())
                        .replace('$group_dset$', dset)
                    for dset in datasets_nostr
                ]
            elif '$group_num$' in line or '$GROUP_NUM$' in line:
                # One copy of the line per dimensioning variable.
                expanded = [
                    line.replace('$GROUP_NUM$', num.upper())
                        .replace('$group_num$', num)
                    for num in dim_variables
                ]
            elif '$group$' in line or '$GROUP$' in line:
                # One copy of the line per group.
                expanded = [
                    line.replace('$group$', grname)
                        .replace('$GROUP$', grname.upper())
                    for grname in config
                ]
            else:
                expanded = [line]
            f_out.writelines(expanded)