FYI: Ralph's out today. He'll be back tomorrow. I'm not really part of this ORTE discussion, but I am curious about a code style that I see in this commit: assigning ORTE_EPOCH_INVALID to a field, and then immediately overwriting that field with another value. E.g.:
> peer_name.jobid = ORTE_PROC_MY_NAME->jobid; > peer_name.vpid = peer_idx; > + peer_name.epoch = ORTE_EPOCH_INVALID; > peer_name.epoch = orte_ess.proc_get_epoch(&peer_name); This technique is used throughout this patch. What is the purpose of this? As I understand it, this won't squash any valgrind warnings, and may even get eliminated by the compiler as dead code because it seems to be useless. On Aug 8, 2011, at 11:11 AM, wbl...@osl.iu.edu wrote: > Author: wbland > Date: 2011-08-08 11:11:55 EDT (Mon, 08 Aug 2011) > New Revision: 25015 > URL: https://svn.open-mpi.org/trac/ompi/changeset/25015 > > Log: > Make sure that the epoch is initialized everywhere so we don't get weird > output > during valgrind. This shouldn't have caused any problems with any actual > execution. Just extra warnings in valgrind. > > > Text files modified: > trunk/ompi/mca/crcp/bkmrk/crcp_bkmrk_pml.c | 2 ++ > > trunk/ompi/proc/proc.c | 2 +- > > trunk/orte/mca/ess/alps/ess_alps_module.c | 1 + > > trunk/orte/mca/ess/env/ess_env_module.c | 1 + > > trunk/orte/mca/ess/lsf/ess_lsf_module.c | 1 + > > trunk/orte/mca/ess/slave/ess_slave_module.c | 1 + > > trunk/orte/mca/ess/slurm/ess_slurm_module.c | 1 + > > trunk/orte/mca/grpcomm/base/grpcomm_base_coll.c | 12 +++++++----- > > trunk/orte/mca/iof/hnp/iof_hnp.c | 1 + > > trunk/orte/mca/odls/base/odls_base_default_fns.c | 1 + > > trunk/orte/mca/odls/base/odls_base_open.c | 1 + > > trunk/orte/mca/plm/base/plm_base_launch_support.c | 1 + > > trunk/orte/mca/plm/base/plm_base_orted_cmds.c | 2 ++ > > trunk/orte/mca/plm/base/plm_base_receive.c | 1 + > > trunk/orte/mca/rmaps/base/rmaps_base_support_fns.c | 3 +++ > > trunk/orte/mca/rmaps/rank_file/rmaps_rank_file.c | 1 + > > trunk/orte/mca/rmaps/seq/rmaps_seq.c | 1 + > > trunk/orte/mca/rml/oob/rml_oob_component.c | 4 ---- > > trunk/orte/mca/routed/binomial/routed_binomial.c | 4 ++++ > > trunk/orte/mca/routed/cm/routed_cm.c | 4 ++++ > > trunk/orte/mca/routed/linear/routed_linear.c | 2 ++ > > 
trunk/orte/mca/routed/radix/routed_radix.c | 3 +++ > > trunk/orte/mca/routed/slave/routed_slave.c | 1 + > > trunk/orte/mca/sstore/central/sstore_central_global.c | 1 + > > trunk/orte/mca/sstore/stage/sstore_stage_global.c | 1 + > > trunk/orte/orted/orted_comm.c | 1 + > > trunk/orte/test/system/oob_stress.c | 2 +- > > trunk/orte/test/system/orte_ring.c | 2 ++ > > trunk/orte/test/system/orte_spawn.c | 1 + > > 29 files changed, 48 insertions(+), 11 deletions(-) > > Modified: trunk/ompi/mca/crcp/bkmrk/crcp_bkmrk_pml.c > ============================================================================== > --- trunk/ompi/mca/crcp/bkmrk/crcp_bkmrk_pml.c (original) > +++ trunk/ompi/mca/crcp/bkmrk/crcp_bkmrk_pml.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -5284,6 +5284,7 @@ > */ > peer_name.jobid = ORTE_PROC_MY_NAME->jobid; > peer_name.vpid = peer_idx; > + peer_name.epoch = ORTE_EPOCH_INVALID; > peer_name.epoch = orte_ess.proc_get_epoch(&peer_name); > > if( NULL == (peer_ref = find_peer(peer_name))) { > @@ -5345,6 +5346,7 @@ > > peer_name.jobid = ORTE_PROC_MY_NAME->jobid; > peer_name.vpid = peer_idx; > + peer_name.epoch = ORTE_EPOCH_INVALID; > peer_name.epoch = orte_ess.proc_get_epoch(&peer_name); > > if ( 0 > (ret = orte_rml.recv_buffer_nb(&peer_name, > > Modified: trunk/ompi/proc/proc.c > ============================================================================== > --- trunk/ompi/proc/proc.c (original) > +++ trunk/ompi/proc/proc.c 2011-08-08 11:11:55 EDT (Mon, 08 Aug 2011) > @@ -362,7 +362,7 @@ > > /* Does not change: proc->proc_name.vpid */ > proc->proc_name.jobid = ORTE_PROC_MY_NAME->jobid; > - > + proc->proc_name.epoch = ORTE_EPOCH_INVALID; > proc->proc_name.epoch = orte_ess.proc_get_epoch(&proc->proc_name); > > /* Make sure to clear the local flag before we set it below */ > > Modified: trunk/orte/mca/ess/alps/ess_alps_module.c > ============================================================================== > --- trunk/orte/mca/ess/alps/ess_alps_module.c 
(original) > +++ trunk/orte/mca/ess/alps/ess_alps_module.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -351,6 +351,7 @@ > > ORTE_PROC_MY_NAME->jobid = jobid; > ORTE_PROC_MY_NAME->vpid = (orte_vpid_t) cnos_get_rank() + starting_vpid; > + ORTE_PROC_MY_NAME->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_NAME->epoch = orte_ess.proc_get_epoch(ORTE_PROC_MY_NAME); > > OPAL_OUTPUT_VERBOSE((1, orte_ess_base_output, > > Modified: trunk/orte/mca/ess/env/ess_env_module.c > ============================================================================== > --- trunk/orte/mca/ess/env/ess_env_module.c (original) > +++ trunk/orte/mca/ess/env/ess_env_module.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -392,6 +392,7 @@ > > ORTE_PROC_MY_NAME->jobid = jobid; > ORTE_PROC_MY_NAME->vpid = vpid; > + ORTE_PROC_MY_NAME->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_NAME->epoch = orte_ess.proc_get_epoch(ORTE_PROC_MY_NAME); > > OPAL_OUTPUT_VERBOSE((1, orte_ess_base_output, > > Modified: trunk/orte/mca/ess/lsf/ess_lsf_module.c > ============================================================================== > --- trunk/orte/mca/ess/lsf/ess_lsf_module.c (original) > +++ trunk/orte/mca/ess/lsf/ess_lsf_module.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -357,6 +357,7 @@ > > ORTE_PROC_MY_NAME->jobid = jobid; > ORTE_PROC_MY_NAME->vpid = vpid; > + ORTE_PROC_MY_NAME->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_NAME->epoch = orte_ess.proc_get_epoch(ORTE_PROC_MY_NAME); > > /* fix up the base name and make it the "real" name */ > > Modified: trunk/orte/mca/ess/slave/ess_slave_module.c > ============================================================================== > --- trunk/orte/mca/ess/slave/ess_slave_module.c (original) > +++ trunk/orte/mca/ess/slave/ess_slave_module.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -280,6 +280,7 @@ > > ORTE_PROC_MY_NAME->jobid = jobid; > ORTE_PROC_MY_NAME->vpid = vpid; > + ORTE_PROC_MY_NAME->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_NAME->epoch = 
orte_ess.proc_get_epoch(ORTE_PROC_MY_NAME); > > OPAL_OUTPUT_VERBOSE((1, orte_ess_base_output, > > Modified: trunk/orte/mca/ess/slurm/ess_slurm_module.c > ============================================================================== > --- trunk/orte/mca/ess/slurm/ess_slurm_module.c (original) > +++ trunk/orte/mca/ess/slurm/ess_slurm_module.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -368,6 +368,7 @@ > /* fix up the vpid and make it the "real" vpid */ > slurm_nodeid = atoi(getenv("SLURM_NODEID")); > ORTE_PROC_MY_NAME->vpid = vpid + slurm_nodeid; > + ORTE_PROC_MY_NAME->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_NAME->epoch = orte_ess.proc_get_epoch(ORTE_PROC_MY_NAME); > > OPAL_OUTPUT_VERBOSE((1, orte_ess_base_output, > > Modified: trunk/orte/mca/grpcomm/base/grpcomm_base_coll.c > ============================================================================== > --- trunk/orte/mca/grpcomm/base/grpcomm_base_coll.c (original) > +++ trunk/orte/mca/grpcomm/base/grpcomm_base_coll.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -168,7 +168,7 @@ > if (vpids[0] == ORTE_PROC_MY_NAME->vpid) { > /* I send first */ > peer.vpid = vpids[1]; > - > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > > /* setup a temp buffer so I can inform the other side as to the > @@ -226,7 +226,7 @@ > opal_dss.pack(&buf, &num_entries, 1, OPAL_INT32); > opal_dss.copy_payload(&buf, sendbuf); > peer.vpid = vpids[0]; > - > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > > OPAL_OUTPUT_VERBOSE((5, orte_grpcomm_base.output, > @@ -320,7 +320,7 @@ > /* first send my current contents */ > nv = (rank - distance + np) % np; > peer.vpid = vpids[nv]; > - > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > > OBJ_CONSTRUCT(&buf, opal_buffer_t); > @@ -340,7 +340,7 @@ > num_recvd = 0; > nv = (rank + distance) % np; > peer.vpid = vpids[nv]; > - > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = 
orte_ess.proc_get_epoch(&peer); > > OBJ_CONSTRUCT(&bucket, opal_buffer_t); > @@ -439,7 +439,7 @@ > /* first send my current contents */ > nv = rank ^ distance; > peer.vpid = vpids[nv]; > - > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > > OBJ_CONSTRUCT(&buf, opal_buffer_t); > @@ -646,6 +646,7 @@ > proc.jobid = jobid; > proc.vpid = 0; > while (proc.vpid < jobdat->num_procs && 0 < > opal_list_get_size(&daemon_tree)) { > + proc.epoch = ORTE_EPOCH_INVALID; > proc.epoch = orte_ess.proc_get_epoch(&proc); > > /* get the daemon that hosts this proc */ > @@ -712,6 +713,7 @@ > /* send it */ > my_parent.jobid = ORTE_PROC_MY_NAME->jobid; > my_parent.vpid = orte_routed.get_routing_tree(NULL); > + my_parent.epoch = ORTE_EPOCH_INVALID; > my_parent.epoch = orte_ess.proc_get_epoch(&my_parent); > > OPAL_OUTPUT_VERBOSE((5, orte_grpcomm_base.output, > > Modified: trunk/orte/mca/iof/hnp/iof_hnp.c > ============================================================================== > --- trunk/orte/mca/iof/hnp/iof_hnp.c (original) > +++ trunk/orte/mca/iof/hnp/iof_hnp.c 2011-08-08 11:11:55 EDT (Mon, 08 Aug > 2011) > @@ -281,6 +281,7 @@ > &mca_iof_hnp_component.sinks); > sink->daemon.jobid = ORTE_PROC_MY_NAME->jobid; > sink->daemon.vpid = proc->node->daemon->name.vpid; > + sink->daemon.epoch = ORTE_EPOCH_INVALID; > sink->daemon.epoch = orte_ess.proc_get_epoch(&sink->daemon); > } > } > > Modified: trunk/orte/mca/odls/base/odls_base_default_fns.c > ============================================================================== > --- trunk/orte/mca/odls/base/odls_base_default_fns.c (original) > +++ trunk/orte/mca/odls/base/odls_base_default_fns.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -734,6 +734,7 @@ > proc.jobid = jobdat->jobid; > for (j=0; j < jobdat->num_procs; j++) { > proc.vpid = j; > + proc.epoch = ORTE_EPOCH_INVALID; > proc.epoch = orte_ess.proc_get_epoch(&proc); > /* get the vpid of the daemon that is to host this proc */ > if 
(ORTE_VPID_INVALID == (host_daemon = > orte_ess.proc_get_daemon(&proc))) { > > Modified: trunk/orte/mca/odls/base/odls_base_open.c > ============================================================================== > --- trunk/orte/mca/odls/base/odls_base_open.c (original) > +++ trunk/orte/mca/odls/base/odls_base_open.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -200,6 +200,7 @@ > * will be in the job - we'll check later > */ > nm->name.vpid = rank; > + nm->name.epoch = ORTE_EPOCH_INVALID; > nm->name.epoch = orte_ess.proc_get_epoch(&nm->name); > } > opal_list_append(&orte_odls_globals.xterm_ranks, &nm->item); > > Modified: trunk/orte/mca/plm/base/plm_base_launch_support.c > ============================================================================== > --- trunk/orte/mca/plm/base/plm_base_launch_support.c (original) > +++ trunk/orte/mca/plm/base/plm_base_launch_support.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -377,6 +377,7 @@ > /* push stdin - the IOF will know what to do with the specified target */ > name.jobid = job; > name.vpid = jdata->stdin_target; > + name.epoch = ORTE_EPOCH_INVALID; > name.epoch = orte_ess.proc_get_epoch(&name); > > if (ORTE_SUCCESS != (rc = orte_iof.push(&name, ORTE_IOF_STDIN, 0))) { > > Modified: trunk/orte/mca/plm/base/plm_base_orted_cmds.c > ============================================================================== > --- trunk/orte/mca/plm/base/plm_base_orted_cmds.c (original) > +++ trunk/orte/mca/plm/base/plm_base_orted_cmds.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -163,6 +163,7 @@ > continue; > } > peer.vpid = v; > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > > /* don't worry about errors on the send here - just > @@ -339,6 +340,7 @@ > continue; > } > peer.vpid = v; > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > /* check to see if this daemon is known to be "dead" */ > if (proc->state > ORTE_PROC_STATE_UNTERMINATED) { > > 
Modified: trunk/orte/mca/plm/base/plm_base_receive.c > ============================================================================== > --- trunk/orte/mca/plm/base/plm_base_receive.c (original) > +++ trunk/orte/mca/plm/base/plm_base_receive.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -394,6 +394,7 @@ > break; > } > name.vpid = vpid; > + name.epoch = ORTE_EPOCH_INVALID; > name.epoch = orte_ess.proc_get_epoch(&name); > > /* unpack the pid */ > > Modified: trunk/orte/mca/rmaps/base/rmaps_base_support_fns.c > ============================================================================== > --- trunk/orte/mca/rmaps/base/rmaps_base_support_fns.c (original) > +++ trunk/orte/mca/rmaps/base/rmaps_base_support_fns.c 2011-08-08 > 11:11:55 EDT (Mon, 08 Aug 2011) > @@ -559,6 +559,7 @@ > } > } > proc->name.vpid = vpid; > + proc->name.epoch = ORTE_EPOCH_INVALID; > proc->name.epoch = orte_ess.proc_get_epoch(&proc->name); > /* If there is an invalid epoch here, it's because it > doesn't exist yet. */ > if (ORTE_NODE_RANK_INVALID == proc->name.epoch) { > @@ -600,6 +601,7 @@ > } > } > proc->name.vpid = vpid; > + proc->name.epoch = ORTE_EPOCH_INVALID; > proc->name.epoch = orte_ess.proc_get_epoch(&proc->name); > } > if (NULL == opal_pointer_array_get_item(jdata->procs, > proc->name.vpid)) { > @@ -1012,6 +1014,7 @@ > return ORTE_ERR_OUT_OF_RESOURCE; > } > proc->name.vpid = jdata->num_procs; /* take the next available vpid > */ > + proc->name.epoch = ORTE_EPOCH_INVALID; > proc->name.epoch = orte_ess.proc_get_epoch(&proc->name); > proc->node = node; > proc->nodename = node->name; > > Modified: trunk/orte/mca/rmaps/rank_file/rmaps_rank_file.c > ============================================================================== > --- trunk/orte/mca/rmaps/rank_file/rmaps_rank_file.c (original) > +++ trunk/orte/mca/rmaps/rank_file/rmaps_rank_file.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -502,6 +502,7 @@ > } > proc->name.vpid = rank; > /* Either init or update the epoch. 
*/ > + proc->name.epoch = ORTE_EPOCH_INVALID; > proc->name.epoch = orte_ess.proc_get_epoch(&proc->name); > > proc->slot_list = strdup(rfmap->slot_list); > > Modified: trunk/orte/mca/rmaps/seq/rmaps_seq.c > ============================================================================== > --- trunk/orte/mca/rmaps/seq/rmaps_seq.c (original) > +++ trunk/orte/mca/rmaps/seq/rmaps_seq.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -235,6 +235,7 @@ > } > /* assign the vpid */ > proc->name.vpid = vpid++; > + proc->name.epoch = ORTE_EPOCH_INVALID; > proc->name.epoch = orte_ess.proc_get_epoch(&proc->name); > > /* add to the jdata proc array */ > > Modified: trunk/orte/mca/rml/oob/rml_oob_component.c > ============================================================================== > --- trunk/orte/mca/rml/oob/rml_oob_component.c (original) > +++ trunk/orte/mca/rml/oob/rml_oob_component.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -363,7 +363,6 @@ > origin = hdr->origin; > > next = orte_routed.get_route(&hdr->destination); > -#if 0 > if (next.vpid == ORTE_VPID_INVALID) { > opal_output(0, > "%s:queued progress tried routing message from %s to > %s:%d, can't find route", > @@ -374,7 +373,6 @@ > opal_backtrace_print(stderr); > orte_errmgr.abort(ORTE_ERROR_DEFAULT_EXIT_CODE, NULL); > } > -#endif > > if (OPAL_EQUAL == orte_util_compare_name_fields(ORTE_NS_CMP_ALL, > &next, ORTE_PROC_MY_NAME)) { > opal_output(0, "%s:queued progress trying to get message from %s > to %s:%d, routing loop", > @@ -475,7 +473,6 @@ > > next = orte_routed.get_route(&hdr->destination); > if (next.vpid == ORTE_VPID_INVALID) { > -#if 0 > opal_output(0, "%s:route_callback tried routing message from %s to > %s:%d, can't find route", > ORTE_NAME_PRINT(ORTE_PROC_MY_NAME), > ORTE_NAME_PRINT(&origin), > @@ -483,7 +480,6 @@ > hdr->tag); > opal_backtrace_print(stderr); > orte_errmgr.abort(ORTE_ERROR_DEFAULT_EXIT_CODE, NULL); > -#endif > return; > } > > > Modified: 
trunk/orte/mca/routed/binomial/routed_binomial.c > ============================================================================== > --- trunk/orte/mca/routed/binomial/routed_binomial.c (original) > +++ trunk/orte/mca/routed/binomial/routed_binomial.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -274,6 +274,7 @@ > ORTE_NAME_PRINT(route))); > jfam->route.jobid = route->jobid; > jfam->route.vpid = route->vpid; > + jfam->route.epoch = ORTE_EPOCH_INVALID; > jfam->route.epoch = orte_ess.proc_get_epoch(&jfam->route); > > return ORTE_SUCCESS; > @@ -289,6 +290,7 @@ > jfam->job_family = jfamily; > jfam->route.jobid = route->jobid; > jfam->route.vpid = route->vpid; > + jfam->route.epoch = ORTE_EPOCH_INVALID; > jfam->route.epoch = orte_ess.proc_get_epoch(&jfam->route); > > opal_pointer_array_add(&orte_routed_jobfams, jfam); > @@ -459,6 +461,7 @@ > ret = &daemon; > > found: > + daemon.epoch = ORTE_EPOCH_INVALID; > daemon.epoch = orte_ess.proc_get_epoch(&daemon); > > OPAL_OUTPUT_VERBOSE((1, orte_routed_base_output, > @@ -1007,6 +1010,7 @@ > ORTE_PROC_MY_PARENT->vpid = binomial_tree(0, 0, ORTE_PROC_MY_NAME->vpid, > orte_process_info.max_procs, > &num_children, &my_children, NULL, true, > jobid); > + ORTE_PROC_MY_PARENT->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_PARENT->epoch = orte_ess.proc_get_epoch(ORTE_PROC_MY_PARENT); > > if (0 < opal_output_get_verbosity(orte_routed_base_output)) { > > Modified: trunk/orte/mca/routed/cm/routed_cm.c > ============================================================================== > --- trunk/orte/mca/routed/cm/routed_cm.c (original) > +++ trunk/orte/mca/routed/cm/routed_cm.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -257,6 +257,7 @@ > ORTE_NAME_PRINT(route))); > jfam->route.jobid = route->jobid; > jfam->route.vpid = route->vpid; > + jfam->route.epoch = ORTE_EPOCH_INVALID; > jfam->route.epoch = orte_ess.proc_get_epoch(&jfam->route); > > return ORTE_SUCCESS; > @@ -272,6 +273,7 @@ > jfam->job_family = jfamily; > jfam->route.jobid = 
route->jobid; > jfam->route.vpid = route->vpid; > + jfam->route.epoch = ORTE_EPOCH_INVALID; > jfam->route.epoch = orte_ess.proc_get_epoch(&jfam->route); > > opal_pointer_array_add(&orte_routed_jobfams, jfam); > @@ -365,6 +367,7 @@ > } > > /* Initialize daemon's epoch, based on its current vpid/jobid */ > + daemon.epoch = ORTE_EPOCH_INVALID; > daemon.epoch = orte_ess.proc_get_epoch(&daemon); > > /* if the daemon is me, then send direct to the target! */ > @@ -811,6 +814,7 @@ > */ > local_lifeline.jobid = proc->jobid; > local_lifeline.vpid = proc->vpid; > + local_lifeline.epoch = ORTE_EPOCH_INVALID; > local_lifeline.epoch = orte_ess.proc_get_epoch(&local_lifeline); > > lifeline = &local_lifeline; > > Modified: trunk/orte/mca/routed/linear/routed_linear.c > ============================================================================== > --- trunk/orte/mca/routed/linear/routed_linear.c (original) > +++ trunk/orte/mca/routed/linear/routed_linear.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -373,6 +373,7 @@ > } > > /* Initialize daemon's epoch, based on its current vpid/jobid */ > + daemon.epoch = ORTE_EPOCH_INVALID; > daemon.epoch = orte_ess.proc_get_epoch(&daemon); > > /* if the daemon is me, then send direct to the target! 
*/ > @@ -394,6 +395,7 @@ > /* we are at end of chain - wrap around */ > daemon.vpid = 0; > } > + daemon.epoch = ORTE_EPOCH_INVALID; > daemon.epoch = orte_ess.proc_get_epoch(&daemon); > ret = &daemon; > } > > Modified: trunk/orte/mca/routed/radix/routed_radix.c > ============================================================================== > --- trunk/orte/mca/routed/radix/routed_radix.c (original) > +++ trunk/orte/mca/routed/radix/routed_radix.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -413,6 +413,7 @@ > if (opal_bitmap_is_set_bit(&child->relatives, daemon.vpid)) { > /* yep - we need to step through this child */ > daemon.vpid = child->vpid; > + daemon.epoch = ORTE_EPOCH_INVALID; > daemon.epoch = orte_ess.proc_get_epoch(&daemon); > ret = &daemon; > goto found; > @@ -424,6 +425,7 @@ > * any of our children, so we have to step up through our parent > */ > daemon.vpid = ORTE_PROC_MY_PARENT->vpid; > + daemon.epoch = ORTE_EPOCH_INVALID; > daemon.epoch = orte_ess.proc_get_epoch(&daemon); > > ret = &daemon; > @@ -879,6 +881,7 @@ > ORTE_PROC_MY_PARENT->vpid = (Ii-Sum) % NInPrevLevel; > ORTE_PROC_MY_PARENT->vpid += (Sum - NInPrevLevel); > } > + ORTE_PROC_MY_PARENT->epoch = ORTE_EPOCH_INVALID; > ORTE_PROC_MY_PARENT->epoch = orte_ess.proc_get_epoch(ORTE_PROC_MY_PARENT); > > /* compute my direct children and the bitmap that shows which vpids > > Modified: trunk/orte/mca/routed/slave/routed_slave.c > ============================================================================== > --- trunk/orte/mca/routed/slave/routed_slave.c (original) > +++ trunk/orte/mca/routed/slave/routed_slave.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -275,6 +275,7 @@ > */ > local_lifeline.jobid = proc->jobid; > local_lifeline.vpid = proc->vpid; > + local_lifeline.epoch = ORTE_EPOCH_INVALID; > local_lifeline.epoch = orte_ess.proc_get_epoch(&local_lifeline); > > lifeline = &local_lifeline; > > Modified: trunk/orte/mca/sstore/central/sstore_central_global.c > 
============================================================================== > --- trunk/orte/mca/sstore/central/sstore_central_global.c (original) > +++ trunk/orte/mca/sstore/central/sstore_central_global.c 2011-08-08 > 11:11:55 EDT (Mon, 08 Aug 2011) > @@ -1216,6 +1216,7 @@ > > vpid_snapshot->process_name.jobid = handle_info->jobid; > vpid_snapshot->process_name.vpid = i; > + vpid_snapshot->process_name.epoch = ORTE_EPOCH_INVALID; > vpid_snapshot->process_name.epoch = > orte_ess.proc_get_epoch(&vpid_snapshot->process_name); > > vpid_snapshot->crs_comp = NULL; > > Modified: trunk/orte/mca/sstore/stage/sstore_stage_global.c > ============================================================================== > --- trunk/orte/mca/sstore/stage/sstore_stage_global.c (original) > +++ trunk/orte/mca/sstore/stage/sstore_stage_global.c 2011-08-08 11:11:55 EDT > (Mon, 08 Aug 2011) > @@ -1706,6 +1706,7 @@ > > vpid_snapshot->process_name.jobid = handle_info->jobid; > vpid_snapshot->process_name.vpid = i; > + vpid_snapshot->process_name.epoch = ORTE_EPOCH_INVALID; > vpid_snapshot->process_name.epoch = > orte_ess.proc_get_epoch(&vpid_snapshot->process_name); > > /* JJH: Currently we do not have this information since we do not save > > Modified: trunk/orte/orted/orted_comm.c > ============================================================================== > --- trunk/orte/orted/orted_comm.c (original) > +++ trunk/orte/orted/orted_comm.c 2011-08-08 11:11:55 EDT (Mon, 08 Aug > 2011) > @@ -129,6 +129,7 @@ > continue; > } > > + target.epoch = ORTE_EPOCH_INVALID; > if (ORTE_NODE_RANK_INVALID == (target.epoch = > orte_ess.proc_get_epoch(&target))) { > /* If we are trying to send to a previously failed process it's > * better to fail silently. 
*/ > > Modified: trunk/orte/test/system/oob_stress.c > ============================================================================== > --- trunk/orte/test/system/oob_stress.c (original) > +++ trunk/orte/test/system/oob_stress.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -74,7 +74,7 @@ > > for (j=1; j < count+1; j++) { > peer.vpid = (ORTE_PROC_MY_NAME->vpid + j) % > orte_process_info.num_procs; > - > + peer.epoch = ORTE_EPOCH_INVALID; > peer.epoch = orte_ess.proc_get_epoch(&peer); > > /* rank0 starts ring */ > > Modified: trunk/orte/test/system/orte_ring.c > ============================================================================== > --- trunk/orte/test/system/orte_ring.c (original) > +++ trunk/orte/test/system/orte_ring.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -41,6 +41,7 @@ > if( right_peer_orte_name.vpid >= num_peers ) { > right_peer_orte_name.vpid = 0; > } > + right_peer_orte_name.epoch = ORTE_EPOCH_INVALID; > right_peer_orte_name.epoch = > orte_ess.proc_get_epoch(&right_peer_orte_name); > > left_peer_orte_name.jobid = ORTE_PROC_MY_NAME->jobid; > @@ -48,6 +49,7 @@ > if( ORTE_PROC_MY_NAME->vpid == 0 ) { > left_peer_orte_name.vpid = num_peers - 1; > } > + left_peer_orte_name.epoch = ORTE_EPOCH_INVALID; > left_peer_orte_name.epoch = orte_ess.proc_get_epoch(&left_peer_orte_name); > > printf("My name is: %s -- PID %d\tMy Left Peer is %s\tMy Right Peer is > %s\n", > > Modified: trunk/orte/test/system/orte_spawn.c > ============================================================================== > --- trunk/orte/test/system/orte_spawn.c (original) > +++ trunk/orte/test/system/orte_spawn.c 2011-08-08 11:11:55 EDT (Mon, > 08 Aug 2011) > @@ -74,6 +74,7 @@ > for (i=0; i < app->num_procs; i++) { > name.vpid = i; > > + name.epoch = ORTE_EPOCH_INVALID; > name.epoch = orte_ess.proc_get_epoch(&name); > fprintf(stderr, "Parent: sending message to child %s\n", > ORTE_NAME_PRINT(&name)); > if (0 > (rc = orte_rml.send(&name, &msg, 1, MY_TAG, 0))) { > 
_______________________________________________ > svn-full mailing list > svn-f...@open-mpi.org > http://www.open-mpi.org/mailman/listinfo.cgi/svn-full -- Jeff Squyres jsquy...@cisco.com For corporate legal information go to: http://www.cisco.com/web/about/doing_business/legal/cri/