10
0
mirror of https://github.com/LCPQ/quantum_package synced 2024-12-23 04:43:50 +01:00

Fixed CASSD

This commit is contained in:
Anthony Scemama 2017-04-12 20:23:04 +02:00
parent 11aeaa91c7
commit e0183e998c
8 changed files with 62 additions and 59 deletions

View File

@ -41,8 +41,8 @@ subroutine run_selection_slave(thread,iproc,energy)
if (done) then if (done) then
ctask = ctask - 1 ctask = ctask - 1
else else
integer :: i_generator, i_generator_start, i_generator_max, step, N integer :: i_generator, N
read (task,*) i_generator_start, i_generator_max, step, N read (task,*) i_generator, N
if(buf%N == 0) then if(buf%N == 0) then
! Only first time ! Only first time
call create_selection_buffer(N, N*2, buf) call create_selection_buffer(N, N*2, buf)
@ -50,9 +50,7 @@ subroutine run_selection_slave(thread,iproc,energy)
else else
if(N /= buf%N) stop "N changed... wtf man??" if(N /= buf%N) stop "N changed... wtf man??"
end if end if
do i_generator=i_generator_start,i_generator_max,step
call select_connected(i_generator,energy,pt2,buf) call select_connected(i_generator,energy,pt2,buf)
enddo
endif endif
if(done .or. ctask == size(task_id)) then if(done .or. ctask == size(task_id)) then

View File

@ -1215,34 +1215,41 @@ subroutine ZMQ_selection(N_in, pt2)
implicit none implicit none
character*(512) :: task
integer(ZMQ_PTR) :: zmq_to_qp_run_socket integer(ZMQ_PTR) :: zmq_to_qp_run_socket
integer, intent(in) :: N_in integer, intent(in) :: N_in
type(selection_buffer) :: b type(selection_buffer) :: b
integer :: i, N integer :: i, N
integer, external :: omp_get_thread_num integer, external :: omp_get_thread_num
double precision, intent(out) :: pt2(N_states) double precision, intent(out) :: pt2(N_states)
integer, parameter :: maxtasks=10000
N = max(N_in,1)
if (.True.) then if (.True.) then
PROVIDE pt2_e0_denominator PROVIDE pt2_e0_denominator
N = max(N_in,1)
provide nproc provide nproc
call new_parallel_job(zmq_to_qp_run_socket,"selection") call new_parallel_job(zmq_to_qp_run_socket,"selection")
call zmq_put_psi(zmq_to_qp_run_socket,1,pt2_e0_denominator,size(pt2_e0_denominator)) call zmq_put_psi(zmq_to_qp_run_socket,1,pt2_e0_denominator,size(pt2_e0_denominator))
call create_selection_buffer(N, N*2, b) call create_selection_buffer(N, N*2, b)
endif endif
integer :: i_generator, i_generator_start, i_generator_max, step character*(20*maxtasks) :: task
task = ' '
step = int(5000000.d0 / dble(N_int * N_states * elec_num * elec_num * mo_tot_num * mo_tot_num )) integer :: k
step = max(1,step) k=0
do i= 1, N_det_generators,step do i= 1, N_det_generators
i_generator_start = i k = k+1
i_generator_max = min(i+step-1,N_det_generators) write(task(20*(k-1)+1:20*k),'(I9,1X,I9,''|'')') i, N
write(task,*) i_generator_start, i_generator_max, 1, N k = k+20
if (k>20*maxtasks) then
k=0
call add_task_to_taskserver(zmq_to_qp_run_socket,task) call add_task_to_taskserver(zmq_to_qp_run_socket,task)
end do endif
enddo
if (k > 0) then
call add_task_to_taskserver(zmq_to_qp_run_socket,task)
endif
call zmq_set_running(zmq_to_qp_run_socket) call zmq_set_running(zmq_to_qp_run_socket)
!$OMP PARALLEL DEFAULT(shared) SHARED(b, pt2) PRIVATE(i) NUM_THREADS(nproc+1) !$OMP PARALLEL DEFAULT(shared) SHARED(b, pt2) PRIVATE(i) NUM_THREADS(nproc+1)
@ -1250,7 +1257,6 @@ subroutine ZMQ_selection(N_in, pt2)
if (i==0) then if (i==0) then
call selection_collector(b, pt2) call selection_collector(b, pt2)
else else
call sleep(1)
call selection_slave_inproc(i) call selection_slave_inproc(i)
endif endif
!$OMP END PARALLEL !$OMP END PARALLEL
@ -1261,6 +1267,7 @@ subroutine ZMQ_selection(N_in, pt2)
if (s2_eig) then if (s2_eig) then
call make_s2_eigenfunction call make_s2_eigenfunction
endif endif
call save_wavefunction
endif endif
end subroutine end subroutine

View File

@ -24,7 +24,6 @@ subroutine ZMQ_selection(N_in, pt2)
call create_selection_buffer(N, N*2, b) call create_selection_buffer(N, N*2, b)
endif endif
! Ugly, but variable-length strings don't work as expected with gfortran < 4.8 :-(
character*(20*maxtasks) :: task character*(20*maxtasks) :: task
task = ' ' task = ' '

View File

@ -44,8 +44,8 @@ subroutine bielec_integrals_index_reverse(i,j,k,l,i1)
l(1) = ceiling(0.5d0*(dsqrt(8.d0*dble(i2)+1.d0)-1.d0)) l(1) = ceiling(0.5d0*(dsqrt(8.d0*dble(i2)+1.d0)-1.d0))
i3 = i1 - ishft(i2*i2-i2,-1) i3 = i1 - ishft(i2*i2-i2,-1)
k(1) = ceiling(0.5d0*(dsqrt(8.d0*dble(i3)+1.d0)-1.d0)) k(1) = ceiling(0.5d0*(dsqrt(8.d0*dble(i3)+1.d0)-1.d0))
j(1) = i2 - ishft(l(1)*l(1)-l(1),-1) j(1) = int(i2 - ishft(l(1)*l(1)-l(1),-1),4)
i(1) = i3 - ishft(k(1)*k(1)-k(1),-1) i(1) = int(i3 - ishft(k(1)*k(1)-k(1),-1),4)
!ijkl !ijkl
i(2) = i(1) !ilkj i(2) = i(1) !ilkj

View File

@ -26,7 +26,7 @@ subroutine svd(A,LDA,U,LDU,D,Vt,LDVt,m,n)
lwork = -1 lwork = -1
call dgesvd('A','A', m, n, A_tmp, LDA, & call dgesvd('A','A', m, n, A_tmp, LDA, &
D, U, LDU, Vt, LDVt, work, lwork, info) D, U, LDU, Vt, LDVt, work, lwork, info)
lwork = work(1) lwork = int(work(1))
deallocate(work) deallocate(work)
allocate(work(lwork)) allocate(work(lwork))
@ -149,7 +149,7 @@ subroutine ortho_qr(A,LDA,m,n)
allocate (jpvt(n), tau(n), work(1)) allocate (jpvt(n), tau(n), work(1))
LWORK=-1 LWORK=-1
call dgeqrf( m, n, A, LDA, TAU, WORK, LWORK, INFO ) call dgeqrf( m, n, A, LDA, TAU, WORK, LWORK, INFO )
LWORK=2*WORK(1) LWORK=2*int(WORK(1))
deallocate(WORK) deallocate(WORK)
allocate(WORK(LWORK)) allocate(WORK(LWORK))
call dgeqrf(m, n, A, LDA, TAU, WORK, LWORK, INFO ) call dgeqrf(m, n, A, LDA, TAU, WORK, LWORK, INFO )
@ -293,7 +293,7 @@ subroutine get_pseudo_inverse(A,m,n,C,LDA)
print *, info, ': SVD failed' print *, info, ': SVD failed'
stop stop
endif endif
lwork = work(1) lwork = int(work(1))
deallocate(work) deallocate(work)
allocate(work(lwork)) allocate(work(lwork))
call dgesvd('S','A', m, n, A_tmp, m,D,U,m,Vt,n,work,lwork,info) call dgesvd('S','A', m, n, A_tmp, m,D,U,m,Vt,n,work,lwork,info)

View File

@ -105,7 +105,7 @@ subroutine map_load_from_disk(filename,map)
map % map(i) % value => map % consolidated_value ( map % consolidated_idx (i+1) :) map % map(i) % value => map % consolidated_value ( map % consolidated_idx (i+1) :)
map % map(i) % key => map % consolidated_key ( map % consolidated_idx (i+1) :) map % map(i) % key => map % consolidated_key ( map % consolidated_idx (i+1) :)
map % map(i) % sorted = .True. map % map(i) % sorted = .True.
n_elements = map % consolidated_idx (i+2) - k n_elements = int( map % consolidated_idx (i+2) - k, 4)
k = map % consolidated_idx (i+2) k = map % consolidated_idx (i+2)
map % map(i) % map_size = n_elements map % map(i) % map_size = n_elements
map % map(i) % n_elements = n_elements map % map(i) % n_elements = n_elements

View File

@ -53,17 +53,17 @@ module map_module
end module map_module end module map_module
real function map_mb(map) double precision function map_mb(map)
use map_module use map_module
use omp_lib use omp_lib
implicit none implicit none
type (map_type), intent(in) :: map type (map_type), intent(in) :: map
integer(map_size_kind) :: i integer(map_size_kind) :: i
map_mb = 8+map_size_kind+map_size_kind+omp_lock_kind+4 map_mb = dble(8+map_size_kind+map_size_kind+omp_lock_kind+4)
do i=0,map%map_size do i=0,map%map_size
map_mb = map_mb + map%map(i)%map_size*(cache_key_kind+integral_kind) +& map_mb = map_mb + dble(map%map(i)%map_size*(cache_key_kind+integral_kind) +&
8+8+4+cache_map_size_kind+cache_map_size_kind+omp_lock_kind 8+8+4+cache_map_size_kind+cache_map_size_kind+omp_lock_kind)
enddo enddo
map_mb = map_mb / (1024.d0*1024.d0) map_mb = map_mb / (1024.d0*1024.d0)
end end
@ -406,7 +406,7 @@ subroutine map_update(map, key, value, sze, thr)
call cache_map_reallocate(local_map, local_map%n_elements + local_map%n_elements) call cache_map_reallocate(local_map, local_map%n_elements + local_map%n_elements)
call cache_map_shrink(local_map,thr) call cache_map_shrink(local_map,thr)
endif endif
cache_key = iand(key(i),map_mask) cache_key = int(iand(key(i),map_mask),2)
local_map%n_elements = local_map%n_elements + 1 local_map%n_elements = local_map%n_elements + 1
local_map%value(local_map%n_elements) = value(i) local_map%value(local_map%n_elements) = value(i)
local_map%key(local_map%n_elements) = cache_key local_map%key(local_map%n_elements) = cache_key
@ -464,7 +464,7 @@ subroutine map_append(map, key, value, sze)
if (n_elements == map%map(idx_cache)%map_size) then if (n_elements == map%map(idx_cache)%map_size) then
call cache_map_reallocate(map%map(idx_cache), n_elements+ ishft(n_elements,-1)) call cache_map_reallocate(map%map(idx_cache), n_elements+ ishft(n_elements,-1))
endif endif
cache_key = iand(key(i),map_mask) cache_key = int(iand(key(i),map_mask),2)
map%map(idx_cache)%value(n_elements) = value(i) map%map(idx_cache)%value(n_elements) = value(i)
map%map(idx_cache)%key(n_elements) = cache_key map%map(idx_cache)%key(n_elements) = cache_key
map%map(idx_cache)%n_elements = n_elements map%map(idx_cache)%n_elements = n_elements
@ -615,7 +615,7 @@ subroutine search_key_big_interval(key,X,sze,idx,ibegin_in,iend_in)
idx = -1 idx = -1
return return
endif endif
cache_key = iand(key,map_mask) cache_key = int(iand(key,map_mask),2)
ibegin = min(ibegin_in,sze) ibegin = min(ibegin_in,sze)
iend = min(iend_in,sze) iend = min(iend_in,sze)
if ((cache_key > X(ibegin)) .and. (cache_key < X(iend))) then if ((cache_key > X(ibegin)) .and. (cache_key < X(iend))) then
@ -723,7 +723,7 @@ subroutine search_key_value_big_interval(key,value,X,Y,sze,idx,ibegin_in,iend_in
value = 0.d0 value = 0.d0
return return
endif endif
cache_key = iand(key,map_mask) cache_key = int(iand(key,map_mask),2)
ibegin = min(ibegin_in,sze) ibegin = min(ibegin_in,sze)
iend = min(iend_in,sze) iend = min(iend_in,sze)
if ((cache_key > X(ibegin)) .and. (cache_key < X(iend))) then if ((cache_key > X(ibegin)) .and. (cache_key < X(iend))) then

View File

@ -292,18 +292,17 @@ BEGIN_TEMPLATE
! contains the new order of the elements. ! contains the new order of the elements.
! iradix should be -1 in input. ! iradix should be -1 in input.
END_DOC END_DOC
$int_type, intent(in) :: isize integer*$int_type, intent(in) :: isize
$int_type, intent(inout) :: iorder(isize) integer*$int_type, intent(inout) :: iorder(isize)
$type, intent(inout) :: x(isize) integer*$type, intent(inout) :: x(isize)
integer, intent(in) :: iradix integer, intent(in) :: iradix
integer :: iradix_new integer :: iradix_new
$type, allocatable :: x2(:), x1(:) integer*$type, allocatable :: x2(:), x1(:)
$type :: i4 integer*$type :: i4
$int_type, allocatable :: iorder1(:),iorder2(:) integer*$int_type, allocatable :: iorder1(:),iorder2(:)
$int_type :: i0, i1, i2, i3, i integer*$int_type :: i0, i1, i2, i3, i
integer, parameter :: integer_size=$octets integer, parameter :: integer_size=$octets
$type, parameter :: zero=$zero integer*$type :: mask
$type :: mask
integer :: nthreads, omp_get_num_threads integer :: nthreads, omp_get_num_threads
!DIR$ ATTRIBUTES ALIGN : 128 :: iorder1,iorder2, x2, x1 !DIR$ ATTRIBUTES ALIGN : 128 :: iorder1,iorder2, x2, x1
@ -311,16 +310,16 @@ BEGIN_TEMPLATE
! Find most significant bit ! Find most significant bit
i0 = 0_8 i0 = 0_$int_type
i4 = -1_8 i4 = -1_$type
do i=1,isize do i=1,isize
i4 = max(i4,x(i)) i4 = max(i4,x(i))
enddo enddo
i3 = i4 ! Type conversion i3 = int(i4,$int_type)
iradix_new = integer_size-1-leadz(i3) iradix_new = integer_size-1-leadz(i3)
mask = ibset(zero,iradix_new) mask = ibset(0_$type,iradix_new)
nthreads = 1 nthreads = 1
! nthreads = 1+ishft(omp_get_num_threads(),-1) ! nthreads = 1+ishft(omp_get_num_threads(),-1)
@ -331,22 +330,22 @@ BEGIN_TEMPLATE
stop stop
endif endif
i1=1_8 i1=1_$int_type
i2=1_8 i2=1_$int_type
do i=1,isize do i=1,isize
if (iand(mask,x(i)) == zero) then if (iand(mask,x(i)) == 0_$type) then
iorder1(i1) = iorder(i) iorder1(i1) = iorder(i)
x1(i1) = x(i) x1(i1) = x(i)
i1 = i1+1_8 i1 = i1+1_$int_type
else else
iorder2(i2) = iorder(i) iorder2(i2) = iorder(i)
x2(i2) = x(i) x2(i2) = x(i)
i2 = i2+1_8 i2 = i2+1_$int_type
endif endif
enddo enddo
i1=i1-1_8 i1=i1-1_$int_type
i2=i2-1_8 i2=i2-1_$int_type
do i=1,i1 do i=1,i1
iorder(i0+i) = iorder1(i) iorder(i0+i) = iorder1(i)
@ -399,12 +398,12 @@ BEGIN_TEMPLATE
endif endif
mask = ibset(zero,iradix) mask = ibset(0_$type,iradix)
i0=1 i0=1
i1=1 i1=1
do i=1,isize do i=1,isize
if (iand(mask,x(i)) == zero) then if (iand(mask,x(i)) == 0_$type) then
iorder(i0) = iorder(i) iorder(i0) = iorder(i)
x(i0) = x(i) x(i0) = x(i)
i0 = i0+1 i0 = i0+1
@ -443,12 +442,12 @@ BEGIN_TEMPLATE
end end
SUBST [ X, type, octets, is_big, big, int_type, zero ] SUBST [ X, type, octets, is_big, big, int_type ]
i ; integer ; 32 ; .False. ; ; integer ; 0;; i ; 4 ; 32 ; .False. ; ; 4 ;;
i8 ; integer*8 ; 32 ; .False. ; ; integer ; 0_8;; i8 ; 8 ; 32 ; .False. ; ; 4 ;;
i2 ; integer*2 ; 32 ; .False. ; ; integer ; 0;; i2 ; 2 ; 32 ; .False. ; ; 4 ;;
i ; integer ; 64 ; .True. ; _big ; integer*8 ; 0 ;; i ; 4 ; 64 ; .True. ; _big ; 8 ;;
i8 ; integer*8 ; 64 ; .True. ; _big ; integer*8 ; 0_8 ;; i8 ; 8 ; 64 ; .True. ; _big ; 8 ;;
END_TEMPLATE END_TEMPLATE