void _XMP_reflect__(_XMP_array_t *a) { int is_ordinal = 1; //_XMP_RETURN_IF_SINGLE; if (!a->is_allocated){ _xmp_set_reflect_flag = 0; return; } if (!_xmp_set_reflect_flag){ for (int i = 0; i < a->dim; i++){ _XMP_array_info_t *ai = &(a->info[i]); _xmp_lwidth[i] = ai->shadow_size_lo; _xmp_uwidth[i] = ai->shadow_size_hi; _xmp_is_periodic[i] = 0; } } _XMP_TSTART(t0); for (int i = 0; i < a->dim; i++){ _XMP_array_info_t *ai = &(a->info[i]); if (ai->shadow_type == _XMP_N_SHADOW_NONE){ continue; } else if (ai->shadow_type == _XMP_N_SHADOW_NORMAL){ _XMP_reflect_sched_t *reflect = ai->reflect_sched; if (_xmp_lwidth[i] || _xmp_uwidth[i]){ _XMP_ASSERT(reflect); /* if (!reflect->reflect_is_initialized || */ /* _xmp_lwidth[i] != reflect->lo_width || */ /* _xmp_uwidth[i] != reflect->hi_width || */ /* _xmp_is_periodic[i] != reflect->is_periodic){ */ /* reflect->lo_width = _xmp_lwidth[i]; */ /* reflect->hi_width = _xmp_uwidth[i]; */ /* reflect->is_periodic = _xmp_is_periodic[i]; */ /* if (_xmp_reflect_pack_flag){ */ /* _XMP_reflect_pcopy_sched_dim(a, i, _xmp_lwidth[i], _xmp_uwidth[i], _xmp_is_periodic[i], 0); */ /* } */ /* else { */ /* _XMP_reflect_normal_sched_dim(a, i, _xmp_lwidth[i], _xmp_uwidth[i], _xmp_is_periodic[i]); */ /* } */ /* reflect->reflect_is_initialized = 1; */ /* } */ if (!reflect->reflect_is_initialized || _xmp_lwidth[i] != reflect->lo_width || _xmp_uwidth[i] != reflect->hi_width || _xmp_is_periodic[i] != reflect->is_periodic){ if (_xmp_reflect_pack_flag){ _XMP_reflect_pcopy_sched_dim(a, i, _xmp_lwidth[i], _xmp_uwidth[i], _xmp_is_periodic[i], _XMP_COMM_REFLECT); } else { _XMP_reflect_normal_sched_dim(a, i, _xmp_lwidth[i], _xmp_uwidth[i], _xmp_is_periodic[i]); } reflect->reflect_is_initialized = 1; reflect->lo_width = _xmp_lwidth[i]; reflect->hi_width = _xmp_uwidth[i]; reflect->is_periodic = _xmp_is_periodic[i]; } if (_xmp_reflect_pack_flag && reflect->req[0] != MPI_REQUEST_NULL){ _XMP_TSTART(t0); _XMP_reflect_pack_dim(a, i, _xmp_lwidth, _xmp_uwidth, _xmp_is_periodic, _XMP_COMM_REFLECT); _XMP_TEND(xmptiming_.t_copy, t0); } _XMP_TSTART(t0); if (reflect->req[0] != MPI_REQUEST_NULL) // if req[0] isn't null, any others shouldn't be null. MPI_Startall(4, reflect->req); _XMP_TEND2(xmptiming_.t_comm, xmptiming_.tdim_comm[i], t0); if (is_ordinal){ _XMP_TSTART(t0); MPI_Waitall(4, reflect->req, MPI_STATUSES_IGNORE); _XMP_TEND2(xmptiming_.t_wait, xmptiming_.tdim_wait[i], t0); if (_xmp_reflect_pack_flag && reflect->req[0] != MPI_REQUEST_NULL){ _XMP_TSTART(t0); _XMP_reflect_unpack_dim(a, i, _xmp_lwidth, _xmp_uwidth, _xmp_is_periodic); _XMP_TEND(xmptiming_.t_copy, t0); } } } } else { /* _XMP_N_SHADOW_FULL */ _XMP_reflect_shadow_FULL(a->array_addr_p, a, i); } } _XMP_TEND(xmptiming_.t_sched, t0); // t0 = MPI_Wtime(); if (!is_ordinal) _XMP_reflect_wait(a, _xmp_lwidth, _xmp_uwidth, _xmp_is_periodic); // t_wait = t_wait + (MPI_Wtime() - t0); _xmp_set_reflect_flag = 0; for (int i = 0; i < a->dim; i++){ _xmp_lwidth[i] = 0; _xmp_uwidth[i] = 0; _xmp_is_periodic[i] = 0; } }
static void _XMP_reflect_sched(_XMP_array_t *a, int *lwidth, int *uwidth, int *is_periodic, int is_async, void *dev_addr) { _XMP_TSTART(t0); for (int i = 0; i < a->dim; i++){ _XMP_array_info_t *ai = &(a->info[i]); if (ai->shadow_type == _XMP_N_SHADOW_NONE){ continue; } else if (ai->shadow_type == _XMP_N_SHADOW_NORMAL){ _XMP_reflect_sched_t *reflect = ai->reflect_acc_sched; if(reflect == NULL){ reflect = _XMP_alloc(sizeof(_XMP_reflect_sched_t)); reflect->is_periodic = -1; /* not used yet */ reflect->datatype_lo = MPI_DATATYPE_NULL; reflect->datatype_hi = MPI_DATATYPE_NULL; for (int j = 0; j < 4; j++) reflect->req[j] = MPI_REQUEST_NULL; reflect->lo_send_buf = NULL; reflect->lo_recv_buf = NULL; reflect->hi_send_buf = NULL; reflect->hi_recv_buf = NULL; reflect->lo_send_host_buf = NULL; reflect->lo_recv_host_buf = NULL; reflect->hi_send_host_buf = NULL; reflect->hi_recv_host_buf = NULL; ai->reflect_acc_sched = reflect; }else{ // } if (1/*lwidth[i] || uwidth[i]*/){ _XMP_ASSERT(reflect); if (reflect->is_periodic == -1 /* not set yet */ || lwidth[i] != reflect->lo_width || uwidth[i] != reflect->hi_width || is_periodic[i] != reflect->is_periodic){ reflect->lo_width = lwidth[i]; reflect->hi_width = uwidth[i]; reflect->is_periodic = is_periodic[i]; if (/*_xmp_reflect_pack_flag && !is_async*/ 1){ _XMP_reflect_pcopy_sched_dim(a, i, lwidth[i], uwidth[i], is_periodic[i], dev_addr, lwidth, uwidth); } else { //_XMP_reflect_normal_sched_dim(a, i, lwidth[i], uwidth[i], is_periodic[i]); } } } } else { /* _XMP_N_SHADOW_FULL */ ; } } _XMP_TEND(xmptiming_.t_sched, t0); }