/orcd/pool/004/jahn/centos7/MITgcm_gfortran-mpi/verification/deep_anelastic/tr_run.vecinv ../../../tools/tst_2+2 -mpi All -command "mpirun -n 4 -hostfile /tmp/machinefile.54697 ./mitgcmuv" cmdEXE='mpirun -n 4 -hostfile /tmp/machinefile.54697 ./mitgcmuv' from previous run STDOUT.0000, lastPick=' 18 ckptA' ; iter='18' ; sufx='ckptA' prepare parameter file 'data.tst' : prepare file 'data.tst' : done diff data.tst data 42,45c42,43 < nIter0=18, < nTimeSteps=4, < # nIter0=0, < # nTimeSteps=18, --- > nIter0=0, > nTimeSteps=18, 48,49c46,47 < # pChkptFreq=86400., < # chkptFreq=0., --- > pChkptFreq=86400., > chkptFreq=0., link back: temp_tst/pickup*.ckptA* rename ckptA -> 0000000018 for all: pickup rnp_loc: pickup.ckptA pickup.0000000018 start-end iter: 18 , 20 , 22 sufix: '0000000018' '0000000020' '0000000022' cmdEXE=mpirun -n 4 -hostfile /tmp/machinefile.54697 ./mitgcmuv ==> START RUN 2 x 2 it STOP NORMAL END STOP NORMAL END STOP NORMAL END STOP NORMAL END ==> END RUN 2 x 2 it listP= pickup rnp_loc: pickup.ckptA pickup.0000000022 move_outp: res_2it ==> START RUN 1iA STOP NORMAL END STOP NORMAL END STOP NORMAL END STOP NORMAL END ==> END RUN 1iA rnp_loc: pickup.ckptA pickup.0000000020 move_outp: res_1iA ==> START RUN 1iB STOP ABNORMAL END: S/R MDS_READ_FIELD [node669:mpi_rank_2][handle_cqe] Send desc error in msg to 3, wc_opcode=0 [node669:mpi_rank_2][handle_cqe] Msg from 3: wc.status=12, wc.wr_id=0x2134040, wc.opcode=0, vbuf->phead->type=0 = MPIDI_CH3_PKT_EAGER_SEND [node669:mpi_rank_0][handle_cqe] Send desc error in msg to 3, wc_opcode=0 [node669:mpi_rank_2][handle_cqe] src/mpid/ch3/channels/mrail/src/gen2/ibv_channel_manager.c:548: [] Got completion with error 12, vendor code=0x81, dest rank=3 : No such file or directory (2) [node669:mpi_rank_0][handle_cqe] Msg from 3: wc.status=12, wc.wr_id=0x212e040, wc.opcode=0, vbuf->phead->type=0 = MPIDI_CH3_PKT_EAGER_SEND [node669:mpi_rank_0][handle_cqe] src/mpid/ch3/channels/mrail/src/gen2/ibv_channel_manager.c:548: [] Got completion with error 12, vendor code=0x81, dest rank=3 : No such file or directory (2) ==> RUN 1iB STOP without writing pickup => exit