mirror of
https://github.com/QuantumPackage/qp2.git
synced 2025-01-08 20:33:20 +01:00
Fixing Davidson
This commit is contained in:
parent
da61f60ba4
commit
f1e14f0851
@ -13,6 +13,7 @@ end
|
|||||||
subroutine davidson_slave_tcp(i)
|
subroutine davidson_slave_tcp(i)
|
||||||
implicit none
|
implicit none
|
||||||
integer, intent(in) :: i
|
integer, intent(in) :: i
|
||||||
|
call sleep(1) ! Let the master start
|
||||||
call davidson_run_slave(0,i)
|
call davidson_run_slave(0,i)
|
||||||
end
|
end
|
||||||
|
|
||||||
@ -42,48 +43,18 @@ subroutine davidson_run_slave(thread,iproc)
|
|||||||
zmq_socket_push = new_zmq_push_socket(thread)
|
zmq_socket_push = new_zmq_push_socket(thread)
|
||||||
|
|
||||||
|
|
||||||
integer :: ierr, doexit
|
|
||||||
do
|
|
||||||
doexit = 0
|
|
||||||
if (connect_to_taskserver(zmq_to_qp_run_socket,worker_id,thread) == -1) then
|
|
||||||
call sleep( int(1.5+float(mpi_rank)/10.) )
|
|
||||||
if (connect_to_taskserver(zmq_to_qp_run_socket,worker_id,thread) == -1) then
|
|
||||||
doexit=1
|
|
||||||
endif
|
|
||||||
endif
|
|
||||||
|
|
||||||
IRP_IF MPI
|
if (connect_to_taskserver(zmq_to_qp_run_socket,worker_id,thread) == -1) then
|
||||||
include 'mpif.h'
|
return
|
||||||
integer :: sendbuf, recvbuf
|
endif
|
||||||
sendbuf = doexit
|
if (zmq_get_N_states_diag_notouch(zmq_to_qp_run_socket,1) == -1) then
|
||||||
recvbuf = doexit
|
if (disconnect_from_taskserver(zmq_to_qp_run_socket,worker_id) == -1) then
|
||||||
call MPI_ALLREDUCE(sendbuf, recvbuf, 1, MPI_INTEGER, MPI_SUM, MPI_COMM_WORLD, ierr)
|
continue
|
||||||
if (ierr /= MPI_SUCCESS) then
|
|
||||||
print *, irp_here//': Unable to reduce '
|
|
||||||
stop -1
|
|
||||||
endif
|
|
||||||
doexit = recvbuf
|
|
||||||
IRP_ENDIF
|
|
||||||
|
|
||||||
if (doexit == 0) then
|
|
||||||
exit
|
|
||||||
else
|
|
||||||
if (thread == 0) then
|
|
||||||
print *, irp_here, ': Connection failed. Exiting Davidson.'
|
|
||||||
return
|
|
||||||
endif
|
|
||||||
endif
|
endif
|
||||||
enddo
|
return
|
||||||
|
endif
|
||||||
|
|
||||||
do
|
! SOFT_TOUCH N_states_diag
|
||||||
if (zmq_get_N_states_diag_notouch(zmq_to_qp_run_socket,1) == -1) then
|
|
||||||
call sleep(1)
|
|
||||||
print *, irp_here, ': waiting for N_states_diag'
|
|
||||||
else
|
|
||||||
exit
|
|
||||||
endif
|
|
||||||
enddo
|
|
||||||
SOFT_TOUCH N_states_diag
|
|
||||||
|
|
||||||
call davidson_slave_work(zmq_to_qp_run_socket, zmq_socket_push, N_states_diag, N_det, worker_id)
|
call davidson_slave_work(zmq_to_qp_run_socket, zmq_socket_push, N_states_diag, N_det, worker_id)
|
||||||
|
|
||||||
|
@ -663,17 +663,16 @@ integer function connect_to_taskserver(zmq_to_qp_run_socket,worker_id,thread)
|
|||||||
rc = f77_zmq_recv(zmq_to_qp_run_socket, message, 510, 0)
|
rc = f77_zmq_recv(zmq_to_qp_run_socket, message, 510, 0)
|
||||||
message = trim(message(1:rc))
|
message = trim(message(1:rc))
|
||||||
if(message(1:5) == "error") then
|
if(message(1:5) == "error") then
|
||||||
connect_to_taskserver = -1
|
go to 10
|
||||||
return
|
|
||||||
end if
|
end if
|
||||||
read(message,*, end=10, err=10) reply, state, worker_id, address
|
read(message,*, end=10, err=10) reply, state, worker_id, address
|
||||||
if (trim(reply) /= 'connect_reply') then
|
if (trim(reply) /= 'connect_reply') then
|
||||||
connect_to_taskserver = -1
|
go to 10
|
||||||
return
|
|
||||||
endif
|
endif
|
||||||
if (trim(state) /= zmq_state) then
|
if (trim(state) /= zmq_state) then
|
||||||
integer, external :: disconnect_from_taskserver_state
|
integer, external :: disconnect_from_taskserver_state
|
||||||
if (disconnect_from_taskserver_state(zmq_to_qp_run_socket, worker_id, state) == -1) then
|
if (disconnect_from_taskserver_state(zmq_to_qp_run_socket, worker_id, state) == -1) then
|
||||||
|
print *, irp_here//': Wrong zmq_state. Disconnecting.'
|
||||||
continue
|
continue
|
||||||
endif
|
endif
|
||||||
connect_to_taskserver = -1
|
connect_to_taskserver = -1
|
||||||
@ -682,6 +681,7 @@ integer function connect_to_taskserver(zmq_to_qp_run_socket,worker_id,thread)
|
|||||||
|
|
||||||
return
|
return
|
||||||
10 continue
|
10 continue
|
||||||
|
print *, irp_here//': '//trim(message)
|
||||||
connect_to_taskserver = -1
|
connect_to_taskserver = -1
|
||||||
end
|
end
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user