1
0
mirror of https://github.com/TREX-CoE/trexio.git synced 2025-01-07 03:43:25 +01:00
trexio/tests/io_dset_sparse.c

269 lines
8.1 KiB
C
Raw Normal View History

2023-05-02 14:45:51 +02:00
#include "trexio.h"
#include <assert.h>
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#define N_CHUNKS 4
2023-05-02 14:45:51 +02:00
static int test_write_dset_sparse (const char* file_name, const back_end_t backend, const int64_t offset, const int64_t mo_num) {
2023-05-02 14:45:51 +02:00
/* Try to write an array of sparse data into the TREXIO file */
trexio_t* file = NULL;
trexio_exit_code rc;
/*================= START OF TEST ==================*/
// open file in 'write' mode
file = trexio_open(file_name, 'w', backend, &rc);
assert (file != NULL);
assert (rc == TREXIO_SUCCESS);
// parameters to be written
int32_t* index;
double* value;
int64_t size = mo_num/2;
2023-05-02 14:45:51 +02:00
index = calloc(4L*size, sizeof(int32_t));
value = calloc(size, sizeof(double));
2023-05-02 14:45:51 +02:00
for(int i=0; i<size; i++){
index[4*i] = i;
index[4*i+1] = i+1;
index[4*i+2] = i+2;
index[4*i+3] = i+3;
2023-05-02 14:45:51 +02:00
value[i] = 3.14 + (double) i;
}
// write mo_num which will be used to determine the optimal size of int indices
2023-05-13 12:28:17 +02:00
if (trexio_has_mo_num(file) == TREXIO_HAS_NOT) {
rc = trexio_write_mo_num(file, mo_num);
assert(rc == TREXIO_SUCCESS);
}
2023-05-02 14:45:51 +02:00
// write dataset chunks of sparse data in the file (including FAKE statements)
2023-05-13 12:01:00 +02:00
uint64_t chunk_size = (uint64_t) size/N_CHUNKS;
chunk_size = chunk_size > 0 ? chunk_size : (uint64_t) size;
int n_chunks = size/chunk_size;
2023-06-02 19:37:53 +02:00
printf("chunk_size = %ld\n", (long) chunk_size);
2023-05-13 12:01:00 +02:00
printf("n_chunks = %d\n", n_chunks);
2023-05-13 12:28:17 +02:00
uint64_t offset_f = 0UL + offset;
2023-05-02 14:45:51 +02:00
uint64_t offset_d = 0UL;
// write n_chunks times using write_sparse
2023-05-13 12:01:00 +02:00
while(offset_d < size) {
2023-05-13 12:28:17 +02:00
if (offset_d+chunk_size > size) chunk_size = size-offset_d;
2023-06-02 19:37:53 +02:00
printf("chunk_size = %ld\n", (long) chunk_size);
2023-05-13 12:28:17 +02:00
if (chunk_size == 0L) break;
2023-05-02 14:45:51 +02:00
rc = trexio_write_mo_2e_int_eri(file, offset_f, chunk_size, &index[4*offset_d], &value[offset_d]);
printf("%5d: %s\n", __LINE__, trexio_string_of_error(rc));
2023-05-02 14:45:51 +02:00
assert(rc == TREXIO_SUCCESS);
offset_d += chunk_size;
offset_f += chunk_size;
}
// close current session
rc = trexio_close(file);
assert (rc == TREXIO_SUCCESS);
// free the allocated memeory
free(index);
free(value);
/*================= END OF TEST ==================*/
return 0;
}
/*
 * Check which groups and sparse datasets the TREXIO file reports as present.
 *
 *   file_name : path of the TREXIO file, opened here in 'r' mode
 *   backend   : back end passed to trexio_open
 *
 * Expects the mo_2e_int group and its eri dataset to exist, and the rdm group
 * and the eri_lr dataset to be absent. Any mismatch trips an assert;
 * the function returns 0 otherwise.
 */
static int test_has_dset_sparse (const char* file_name, const back_end_t backend) {

  /*================= START OF TEST ==================*/

  // open the file for reading
  trexio_exit_code status;
  trexio_t* const trex = trexio_open(file_name, 'r', backend, &status);
  assert (trex != NULL);
  assert (status == TREXIO_SUCCESS);

  // the mo_2e_int group has to be there
  status = trexio_has_mo_2e_int(trex);
  assert (status == TREXIO_SUCCESS);

  // the rdm group must not be there
  status = trexio_has_rdm(trex);
  assert (status == TREXIO_HAS_NOT);

  // mo_2e_int_eri_lr must be absent (only the non-lr component is written in this unit test)
  status = trexio_has_mo_2e_int_eri_lr(trex);
  assert (status == TREXIO_HAS_NOT);

  // ask again: the previous has_ call must not have created a file/dset as a side effect
  status = trexio_has_mo_2e_int_eri_lr(trex);
  assert (status == TREXIO_HAS_NOT);

  // the previously written mo_2e_int_eri has to be there
  status = trexio_has_mo_2e_int_eri(trex);
  assert (status == TREXIO_SUCCESS);

  // close current session
  status = trexio_close(trex);
  assert (status == TREXIO_SUCCESS);

  /*================= END OF TEST ==================*/

  return 0;
}
static int test_read_dset_sparse (const char* file_name, const back_end_t backend, const int64_t offset) {
/* Try to read one chunk of dataset of sparse data in the TREXIO file */
trexio_t* file = NULL;
trexio_exit_code rc;
/*================= START OF TEST ==================*/
// open file
file = trexio_open(file_name, 'r', backend, &rc);
assert (file != NULL);
assert (rc == TREXIO_SUCCESS);
int32_t mo_num = 0;
rc = trexio_read_mo_num(file, &mo_num);
assert(rc == TREXIO_SUCCESS);
printf("%5d: mo_num = %d\n", __LINE__, mo_num);
const int64_t size = mo_num/2;
2023-05-02 14:45:51 +02:00
// define arrays to read into
int32_t* index_read;
double* value_read;
uint64_t size_r = mo_num;
2023-05-02 14:45:51 +02:00
index_read = (int32_t*) calloc(4L*size_r,sizeof(int32_t));
value_read = (double*) calloc(size_r,sizeof(double));
// specify the read parameters, here:
// 1 chunk of 10 elements using offset of 40 (i.e. lines No. 40--59) into elements of the array starting from 5
int64_t chunk_read = size/3;
2023-05-13 12:01:00 +02:00
chunk_read = chunk_read < 2 ? 2 : chunk_read;
int64_t offset_file_read = 1;
2023-05-02 14:45:51 +02:00
int64_t read_size_check;
read_size_check = chunk_read;
if (offset != 0L) offset_file_read += offset;
// read one chunk using the aforementioned parameters
2023-05-13 12:01:00 +02:00
rc = trexio_read_mo_2e_int_eri(file, offset_file_read, &chunk_read, &index_read[0], &value_read[0]);
printf("%5d: %s\n", __LINE__, trexio_string_of_error(rc));
2023-05-13 12:01:00 +02:00
/*
for (int i=0 ; i<chunk_read ; ++i) {
2023-06-02 19:37:53 +02:00
printf("%d %d | %ld %ld %ld\n", i, index_read[i], (long) offset, (long) offset_file_read, (long) chunk_read);
}
2023-05-13 12:01:00 +02:00
*/
2023-05-13 12:28:17 +02:00
//assert(rc == TREXIO_SUCCESS);
2023-05-02 14:45:51 +02:00
assert(chunk_read == read_size_check);
2023-05-13 12:28:17 +02:00
assert(index_read[0] == offset_file_read-offset);
2023-05-13 12:01:00 +02:00
2023-05-02 14:45:51 +02:00
// now attempt to read so that one encounters end of file during reading (i.e. offset_file_read + chunk_read > size_max)
int64_t size_max;
rc = trexio_read_mo_2e_int_eri_size(file, &size_max);
assert(rc == TREXIO_SUCCESS);
2023-05-13 12:01:00 +02:00
offset_file_read = size_max-chunk_read+1;
int64_t eof_read_size_check = size_max - offset_file_read; // if offset_file_read=97 => only 3 integrals will be read out of total of 100
2023-05-02 14:45:51 +02:00
// read one chunk that will reach EOF and return TREXIO_END code
2023-05-13 12:01:00 +02:00
rc = trexio_read_mo_2e_int_eri(file, offset_file_read, &chunk_read, &index_read[0], &value_read[0]);
printf("%5d: %s\n", __LINE__, trexio_string_of_error(rc));
2023-05-02 14:45:51 +02:00
assert(rc == TREXIO_END);
2023-05-13 12:01:00 +02:00
printf("%d %d x\n", (int32_t) index_read[0], (int32_t) (4L*offset_file_read));
2023-06-02 19:37:53 +02:00
printf("%ld %ld\n", (long) chunk_read, (long) eof_read_size_check);
2023-05-02 14:45:51 +02:00
assert(chunk_read == eof_read_size_check);
2023-05-13 12:28:17 +02:00
printf("%d %d\n", index_read[0] , (int32_t) (offset_file_read - offset));
assert(index_read[0] == (int32_t) offset_file_read - offset);
2023-05-02 14:45:51 +02:00
// close current session
rc = trexio_close(file);
assert (rc == TREXIO_SUCCESS);
// free the memory
free(index_read);
free(value_read);
/*================= END OF TEST ==================*/
return 0;
}
/*
 * Compare the stored size of the sparse mo_2e_int_eri dataset with an expected value.
 *
 *   file_name  : path of the TREXIO file, opened here in 'r' mode
 *   backend    : back end passed to trexio_open
 *   size_check : size that trexio_read_mo_2e_int_eri_size has to report
 *
 * Any mismatch trips an assert; the function returns 0 otherwise.
 */
static int test_read_dset_sparse_size (const char* file_name, const back_end_t backend, const int64_t size_check) {

  /*================= START OF TEST ==================*/

  // open the file for reading
  trexio_exit_code status;
  trexio_t* const trex = trexio_open(file_name, 'r', backend, &status);
  assert (trex != NULL);
  assert (status == TREXIO_SUCCESS);

  // query the size of the dataset stored in the file
  int64_t n_stored;
  status = trexio_read_mo_2e_int_eri_size(trex, &n_stored);
  assert (status == TREXIO_SUCCESS);

  // print both numbers before comparing them
  printf("%5d: %ld %ld\n", __LINE__, (long) n_stored, (long) size_check);
  assert (n_stored == size_check);

  // close current session
  status = trexio_close(trex);
  assert (status == TREXIO_SUCCESS);

  /*================= END OF TEST ==================*/

  return 0;
}
int main(){
/*============== Test launcher ================*/
int rc;
rc = system(RM_COMMAND);
assert (rc == 0);
2023-05-13 12:28:17 +02:00
int32_t mo_num[8] = {6,12,30,62,252,510,1020,9000};
2023-05-13 12:01:00 +02:00
for (int i=0 ; i<8 ; ++i) {
2023-05-02 14:45:51 +02:00
2023-05-13 12:01:00 +02:00
printf("%5d: mo_num = %d\n", __LINE__, mo_num[i]);
const int64_t size = mo_num[i]/2;
// check the first write attempt (SIZE elements written in N_CHUNKS chunks)
2023-05-13 12:01:00 +02:00
test_write_dset_sparse (TREXIO_FILE, TEST_BACKEND, 0, mo_num[i]);
test_has_dset_sparse (TREXIO_FILE, TEST_BACKEND);
test_read_dset_sparse (TREXIO_FILE, TEST_BACKEND, 0);
test_read_dset_sparse_size(TREXIO_FILE, TEST_BACKEND, size);
2023-05-02 14:45:51 +02:00
// check the second write attempt (SIZE elements written in N_CHUNKS chunks)
2023-05-13 12:01:00 +02:00
test_write_dset_sparse (TREXIO_FILE, TEST_BACKEND, size, mo_num[i]);
test_read_dset_sparse (TREXIO_FILE, TEST_BACKEND, size);
2023-05-13 12:28:17 +02:00
test_read_dset_sparse_size(TREXIO_FILE, TEST_BACKEND, 2*size);
rc = system(RM_COMMAND);
assert (rc == 0);
}
2023-05-02 14:45:51 +02:00
return 0;
}