BEGIN_PROVIDER [ integer, pt2_stoch_istate ] implicit none BEGIN_DOC ! State for stochatsic PT2 END_DOC pt2_stoch_istate = 1 END_PROVIDER BEGIN_PROVIDER [ integer, pt2_N_teeth ] &BEGIN_PROVIDER [ integer, pt2_minDetInFirstTeeth ] &BEGIN_PROVIDER [ integer, pt2_n_tasks_max ] &BEGIN_PROVIDER [ integer, pt2_F, (N_det_generators) ] implicit none logical, external :: testTeethBuilding integer :: i integer :: e e = elec_num - n_core_orb * 2 pt2_n_tasks_max = 1+min((e*(e-1))/2, int(dsqrt(dble(N_det_generators)))/10) do i=1,N_det_generators if (maxval(dabs(psi_coef_sorted_gen(i,1:N_states))) > 0.001d0) then pt2_F(i) = pt2_n_tasks_max else pt2_F(i) = 1 endif enddo if(N_det_generators < 1024) then pt2_minDetInFirstTeeth = 1 pt2_N_teeth = 1 else pt2_minDetInFirstTeeth = min(5, N_det_generators) do pt2_N_teeth=100,2,-1 if(testTeethBuilding(pt2_minDetInFirstTeeth, pt2_N_teeth)) exit end do end if call write_int(6,pt2_N_teeth,'Number of comb teeth') END_PROVIDER logical function testTeethBuilding(minF, N) implicit none integer, intent(in) :: minF, N integer :: n0, i double precision :: u0, Wt, r double precision, allocatable :: tilde_w(:), tilde_cW(:) integer, external :: dress_find_sample allocate(tilde_w(N_det_generators), tilde_cW(0:N_det_generators)) do i=1,N_det_generators tilde_w(i) = psi_coef_sorted_gen(i,pt2_stoch_istate)**2 + 1.d-20 enddo double precision :: norm norm = 0.d0 do i=N_det_generators,1,-1 norm += tilde_w(i) enddo tilde_w(:) = tilde_w(:) / norm tilde_cW(0) = -1.d0 do i=1,N_det_generators tilde_cW(i) = tilde_cW(i-1) + tilde_w(i) enddo tilde_cW(:) = tilde_cW(:) + 1.d0 n0 = 0 testTeethBuilding = .false. do u0 = tilde_cW(n0) r = tilde_cW(n0 + minF) Wt = (1d0 - u0) / dble(N) if (dabs(Wt) <= 1.d-3) then return endif if(Wt >= r - u0) then testTeethBuilding = .true. return end if n0 += 1 if(N_det_generators - n0 < minF * N) then return end if end do stop "exited testTeethBuilding" end function subroutine ZMQ_pt2(E, pt2,relative_error, error) use f77_zmq use selection_types implicit none integer(ZMQ_PTR) :: zmq_to_qp_run_socket, zmq_socket_pull integer, external :: omp_get_thread_num double precision, intent(in) :: relative_error, E(N_states) double precision, intent(out) :: pt2(N_states),error(N_states) integer :: i double precision, external :: omp_get_wtime double precision :: state_average_weight_save(N_states), w(N_states) integer(ZMQ_PTR), external :: new_zmq_to_qp_run_socket if (N_det < max(10,N_states)) then pt2=0.d0 call ZMQ_selection(0, pt2) error(:) = 0.d0 else state_average_weight_save(:) = state_average_weight(:) do pt2_stoch_istate=1,N_states state_average_weight(:) = 0.d0 state_average_weight(pt2_stoch_istate) = 1.d0 TOUCH state_average_weight pt2_stoch_istate provide nproc pt2_F mo_bielec_integrals_in_map mo_mono_elec_integral pt2_w psi_selectors print *, '========== ================= ================= =================' print *, ' Samples Energy Stat. Error Seconds ' print *, '========== ================= ================= =================' call new_parallel_job(zmq_to_qp_run_socket, zmq_socket_pull, 'pt2') integer, external :: zmq_put_psi integer, external :: zmq_put_N_det_generators integer, external :: zmq_put_N_det_selectors integer, external :: zmq_put_dvector integer, external :: zmq_put_ivector if (zmq_put_psi(zmq_to_qp_run_socket,1) == -1) then stop 'Unable to put psi on ZMQ server' endif if (zmq_put_N_det_generators(zmq_to_qp_run_socket, 1) == -1) then stop 'Unable to put N_det_generators on ZMQ server' endif if (zmq_put_N_det_selectors(zmq_to_qp_run_socket, 1) == -1) then stop 'Unable to put N_det_selectors on ZMQ server' endif if (zmq_put_dvector(zmq_to_qp_run_socket,1,'energy',pt2_e0_denominator,size(pt2_e0_denominator)) == -1) then stop 'Unable to put energy on ZMQ server' endif if (zmq_put_dvector(zmq_to_qp_run_socket,1,'state_average_weight',state_average_weight,N_states) == -1) then stop 'Unable to put state_average_weight on ZMQ server' endif if (zmq_put_ivector(zmq_to_qp_run_socket,1,'pt2_stoch_istate',pt2_stoch_istate,1) == -1) then stop 'Unable to put pt2_stoch_istate on ZMQ server' endif if (zmq_put_dvector(zmq_to_qp_run_socket,1,'threshold_selectors',threshold_selectors,1) == -1) then stop 'Unable to put threshold_selectors on ZMQ server' endif if (zmq_put_dvector(zmq_to_qp_run_socket,1,'threshold_generators',threshold_generators,1) == -1) then stop 'Unable to put threshold_generators on ZMQ server' endif integer, external :: add_task_to_taskserver character(len=:), allocatable :: task allocate(character(len=100000) :: task) integer :: j,k,ipos ipos=0 do i=1,N_det_generators if (pt2_F(i) > 1) then ipos += 1 endif enddo call write_int(6,ipos,'Number of fragmented tasks') ipos=1 do i= 1, N_det_generators do j=1,pt2_F(pt2_J(i)) write(task(ipos:ipos+20),'(I9,1X,I9,''|'')') j, pt2_J(i) ipos += 20 if (ipos > len(task)-20) then if (add_task_to_taskserver(zmq_to_qp_run_socket,trim(task(1:ipos))) == -1) then stop 'Unable to add task to task server' endif ipos=1 endif end do enddo if (ipos > 1) then if (add_task_to_taskserver(zmq_to_qp_run_socket,trim(task(1:ipos))) == -1) then stop 'Unable to add task to task server' endif endif integer, external :: zmq_set_running if (zmq_set_running(zmq_to_qp_run_socket) == -1) then print *, irp_here, ': Failed in zmq_set_running' endif integer :: nproc_target nproc_target = nproc double precision :: mem mem = 8.d0 * N_det * (N_int * 2.d0 * 3.d0 + 3.d0 + 5.d0) / (1024.d0**3) call write_double(6,mem,'Estimated memory/thread (Gb)') if (qp_max_mem > 0) then nproc_target = max(1,int(dble(qp_max_mem)/mem)) nproc_target = min(nproc_target,nproc) endif call omp_set_nested(.true.) !$OMP PARALLEL DEFAULT(shared) NUM_THREADS(nproc_target+1) & !$OMP PRIVATE(i) i = omp_get_thread_num() if (i==0) then call pt2_collector(zmq_socket_pull, E(pt2_stoch_istate),relative_error, w, error) pt2(pt2_stoch_istate) = w(pt2_stoch_istate) else call pt2_slave_inproc(i) endif !$OMP END PARALLEL call end_parallel_job(zmq_to_qp_run_socket, zmq_socket_pull, 'pt2') print *, '========== ================= ================= =================' enddo ! call omp_set_nested(.false.) FREE pt2_stoch_istate state_average_weight(:) = state_average_weight_save(:) TOUCH state_average_weight endif do k=N_det+1,N_states pt2(k) = 0.d0 enddo end subroutine subroutine pt2_slave_inproc(i) implicit none integer, intent(in) :: i call run_pt2_slave(1,i,pt2_e0_denominator) end subroutine pt2_collector(zmq_socket_pull, E, relative_error, pt2, error) use f77_zmq use selection_types use bitmasks implicit none integer(ZMQ_PTR), intent(in) :: zmq_socket_pull double precision, intent(in) :: relative_error, E double precision, intent(out) :: pt2(N_states), error(N_states) double precision, allocatable :: eI(:,:), eI_task(:,:), S(:), S2(:) integer(ZMQ_PTR),external :: new_zmq_to_qp_run_socket integer(ZMQ_PTR) :: zmq_to_qp_run_socket integer, external :: zmq_delete_tasks integer, external :: zmq_abort integer, external :: pt2_find_sample integer :: more, n, i, p, c, t, n_tasks, U integer, allocatable :: task_id(:) integer, allocatable :: index(:) double precision, external :: omp_get_wtime double precision :: v, x, avg, eqt, E0 double precision :: time, time0 integer, allocatable :: f(:) logical, allocatable :: d(:) zmq_to_qp_run_socket = new_zmq_to_qp_run_socket() allocate(task_id(pt2_n_tasks_max), index(pt2_n_tasks_max), f(N_det_generators)) allocate(d(N_det_generators+1)) allocate(eI(N_states, N_det_generators), eI_task(N_states, pt2_n_tasks_max)) allocate(S(pt2_N_teeth+1), S2(pt2_N_teeth+1)) pt2(:) = -huge(1.) S(:) = 0d0 S2(:) = 0d0 n = 1 t = 0 U = 0 eI(:,:) = 0d0 f(:) = pt2_F(:) d(:) = .false. n_tasks = 0 E0 = E more = 1 time0 = omp_get_wtime() do while (n <= N_det_generators) if(f(pt2_J(n)) == 0) then d(pt2_J(n)) = .true. do while(d(U+1)) U += 1 end do ! Deterministic part do while(t <= pt2_N_teeth) if(U >= pt2_n_0(t+1)) then t=t+1 E0 = 0.d0 do i=pt2_n_0(t),1,-1 E0 += eI(pt2_stoch_istate, i) end do else exit end if end do ! Add Stochastic part c = pt2_R(n) if(c > 0) then x = 0d0 do p=pt2_N_teeth, 1, -1 v = pt2_u_0 + pt2_W_T * (pt2_u(c) + dble(p-1)) i = pt2_find_sample(v, pt2_cW) x += eI(pt2_stoch_istate, i) * pt2_W_T / pt2_w(i) S(p) += x S2(p) += x**2 end do avg = E0 + S(t) / dble(c) pt2(pt2_stoch_istate) = avg ! 1/(N-1.5) : see Brugger, The American Statistician (23) 4 p. 32 (1969) if(c > 2) then eqt = dabs((S2(t) / c) - (S(t)/c)**2) ! dabs for numerical stability eqt = sqrt(eqt / (dble(c) - 1.5d0)) error(pt2_stoch_istate) = eqt if(mod(c,10)==0 .or. n==N_det_generators) then print '(G10.3, 2X, F16.10, 2X, G16.3, 2X, F16.4, A20)', c, avg+E, eqt, time-time0, '' if( dabs(error(pt2_stoch_istate) / pt2(pt2_stoch_istate)) < relative_error) then if (zmq_abort(zmq_to_qp_run_socket) == -1) then call sleep(10) if (zmq_abort(zmq_to_qp_run_socket) == -1) then print *, irp_here, ': Error in sending abort signal (2)' endif endif endif endif endif time = omp_get_wtime() end if n += 1 else if(more == 0) then exit else call pull_pt2_results(zmq_socket_pull, index, eI_task, task_id, n_tasks) if (zmq_delete_tasks(zmq_to_qp_run_socket,zmq_socket_pull,task_id,n_tasks,more) == -1) then stop 'Unable to delete tasks' endif do i=1,n_tasks eI(:, index(i)) += eI_task(:, i) f(index(i)) -= 1 end do end if end do call end_zmq_to_qp_run_socket(zmq_to_qp_run_socket) end subroutine integer function pt2_find_sample(v, w) implicit none double precision, intent(in) :: v, w(0:N_det_generators) integer :: i,l,r l = 0 r = N_det_generators do while(r-l > 1) i = (r+l) / 2 if(w(i) < v) then l = i else r = i end if end do i = r do r=i+1,N_det_generators if (w(r) /= w(i)) then exit endif enddo pt2_find_sample = r-1 end function BEGIN_PROVIDER[ integer, pt2_J, (N_det_generators)] &BEGIN_PROVIDER[ double precision, pt2_u, (N_det_generators)] &BEGIN_PROVIDER[ integer, pt2_R, (N_det_generators)] implicit none integer :: N_c, N_j, U, t, i double precision :: v logical, allocatable :: d(:) integer, external :: pt2_find_sample allocate(d(N_det_generators)) pt2_R(:) = 0 N_c = 0 N_j = pt2_n_0(1) d(:) = .false. do i=1,N_j d(i) = .true. pt2_J(i) = i end do integer :: m integer, allocatable :: seed(:) call random_seed(size=m) allocate(seed(m)) do i=1,m seed(i) = i enddo call random_seed(put=seed) deallocate(seed) call RANDOM_NUMBER(pt2_u) call RANDOM_NUMBER(pt2_u) U = 0 do while(N_j < N_det_generators) !ADD_COMB N_c += 1 do t=0, pt2_N_teeth-1 v = pt2_u_0 + pt2_W_T * (dble(t) + pt2_u(N_c)) i = pt2_find_sample(v, pt2_cW) if(.not. d(i)) then N_j += 1 pt2_J(N_j) = i d(i) = .true. end if end do pt2_R(N_j) = N_c !FILL_TOOTH do while(U < N_det_generators) U += 1 if(.not. d(U)) then N_j += 1 pt2_J(N_j) = U d(U) = .true. exit; end if end do enddo if(N_det_generators > 1) then pt2_R(N_det_generators-1) = 0 pt2_R(N_det_generators) = N_c end if END_PROVIDER BEGIN_PROVIDER [ double precision, pt2_w, (N_det_generators) ] &BEGIN_PROVIDER [ double precision, pt2_cW, (0:N_det_generators) ] &BEGIN_PROVIDER [ double precision, pt2_W_T ] &BEGIN_PROVIDER [ double precision, pt2_u_0 ] &BEGIN_PROVIDER [ integer, pt2_n_0, (pt2_N_teeth+1) ] implicit none integer :: i, t double precision, allocatable :: tilde_w(:), tilde_cW(:) double precision :: r, tooth_width integer, external :: pt2_find_sample allocate(tilde_w(N_det_generators), tilde_cW(0:N_det_generators)) tilde_cW(0) = 0d0 do i=1,N_det_generators tilde_w(i) = psi_coef_sorted_gen(i,pt2_stoch_istate)**2 + 1.d-20 enddo double precision :: norm norm = 0.d0 do i=N_det_generators,1,-1 norm += tilde_w(i) enddo tilde_w(:) = tilde_w(:) / norm tilde_cW(0) = -1.d0 do i=1,N_det_generators tilde_cW(i) = tilde_cW(i-1) + tilde_w(i) enddo tilde_cW(:) = tilde_cW(:) + 1.d0 pt2_n_0(1) = 0 do pt2_u_0 = tilde_cW(pt2_n_0(1)) r = tilde_cW(pt2_n_0(1) + pt2_minDetInFirstTeeth) pt2_W_T = (1d0 - pt2_u_0) / dble(pt2_N_teeth) if(pt2_W_T >= r - pt2_u_0) then exit end if pt2_n_0(1) += 1 if(N_det_generators - pt2_n_0(1) < pt2_minDetInFirstTeeth * pt2_N_teeth) then stop "teeth building failed" end if end do !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! do t=2, pt2_N_teeth r = pt2_u_0 + pt2_W_T * dble(t-1) pt2_n_0(t) = pt2_find_sample(r, tilde_cW) end do pt2_n_0(pt2_N_teeth+1) = N_det_generators !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! pt2_w(:pt2_n_0(1)) = tilde_w(:pt2_n_0(1)) do t=1, pt2_N_teeth tooth_width = tilde_cW(pt2_n_0(t+1)) - tilde_cW(pt2_n_0(t)) if (tooth_width == 0.d0) then tooth_width = sum(tilde_w(pt2_n_0(t):pt2_n_0(t+1))) endif ASSERT(tooth_width > 0.d0) do i=pt2_n_0(t)+1, pt2_n_0(t+1) pt2_w(i) = tilde_w(i) * pt2_W_T / tooth_width end do end do pt2_cW(0) = 0d0 do i=1,N_det_generators pt2_cW(i) = pt2_cW(i-1) + pt2_w(i) end do pt2_n_0(pt2_N_teeth+1) = N_det_generators END_PROVIDER