mpid_rma.c 15.6 KB
Newer Older
1
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil ; -*- */
2 3 4 5 6 7
/*
 *  (C) 2001 by Argonne National Laboratory.
 *      See COPYRIGHT in top-level directory.
 */

#include "mpidimpl.h"
8
#include "mpidrma.h"
9

Xin Zhao's avatar
Xin Zhao committed
10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
=== BEGIN_MPI_T_CVAR_INFO_BLOCK ===

cvars:
    - name        : MPIR_CVAR_CH3_RMA_SLOTS_SIZE
      category    : CH3
      type        : int
      default     : 262144
      class       : none
      verbosity   : MPI_T_VERBOSITY_USER_BASIC
      scope       : MPI_T_SCOPE_ALL_EQ
      description : >-
        Number of RMA slots during window creation. Each slot contains
        a linked list of target elements. The distribution of ranks among
        slots follows a round-robin pattern. Requires a positive value.

=== END_MPI_T_CVAR_INFO_BLOCK ===
*/

29 30 31

MPIU_THREADSAFE_INIT_DECL(initRMAoptions);

Xin Zhao's avatar
Xin Zhao committed
32
MPIDI_RMA_Win_list_t *MPIDI_RMA_Win_list = NULL, *MPIDI_RMA_Win_list_tail = NULL;
33 34
int num_active_issued_win = 0;
int num_passive_win = 0;
Xin Zhao's avatar
Xin Zhao committed
35

36
static int win_init(MPI_Aint size, int disp_unit, int create_flavor, int model,
37
                    MPID_Comm * comm_ptr, MPID_Win ** win_ptr);
38 39


40 41 42
#define MPID_WIN_FTABLE_SET_DEFAULTS(win_ptr)                   \
    do {                                                        \
        /* Get ptr to RMAFns, which is embedded in MPID_Win */  \
43
        MPID_RMAFns *ftable         = &(*(win_ptr))->RMAFns;    \
44
        ftable->Win_free            = MPIDI_Win_free;           \
45 46
        ftable->Win_attach          = MPIDI_Win_attach;         \
        ftable->Win_detach          = MPIDI_Win_detach;         \
47 48
        ftable->Win_shared_query    = MPIDI_Win_shared_query;   \
                                                                \
49 50 51
        ftable->Win_set_info        = MPIDI_Win_set_info;       \
        ftable->Win_get_info        = MPIDI_Win_get_info;       \
                                                                \
52 53 54
        ftable->Put                 = MPIDI_Put;                \
        ftable->Get                 = MPIDI_Get;                \
        ftable->Accumulate          = MPIDI_Accumulate;         \
55 56 57
        ftable->Get_accumulate      = MPIDI_Get_accumulate;     \
        ftable->Fetch_and_op        = MPIDI_Fetch_and_op;       \
        ftable->Compare_and_swap    = MPIDI_Compare_and_swap;   \
58
                                                                \
59 60 61 62
        ftable->Rput                = MPIDI_Rput;               \
        ftable->Rget                = MPIDI_Rget;               \
        ftable->Raccumulate         = MPIDI_Raccumulate;        \
        ftable->Rget_accumulate     = MPIDI_Rget_accumulate;    \
63 64 65 66 67 68 69 70 71 72 73 74 75
                                                                \
        ftable->Win_fence           = MPIDI_Win_fence;          \
        ftable->Win_post            = MPIDI_Win_post;           \
        ftable->Win_start           = MPIDI_Win_start;          \
        ftable->Win_complete        = MPIDI_Win_complete;       \
        ftable->Win_wait            = MPIDI_Win_wait;           \
        ftable->Win_test            = MPIDI_Win_test;           \
                                                                \
        ftable->Win_lock            = MPIDI_Win_lock;           \
        ftable->Win_unlock          = MPIDI_Win_unlock;         \
        ftable->Win_lock_all        = MPIDI_Win_lock_all;       \
        ftable->Win_unlock_all      = MPIDI_Win_unlock_all;     \
                                                                \
76 77 78 79
        ftable->Win_flush           = MPIDI_Win_flush;          \
        ftable->Win_flush_all       = MPIDI_Win_flush_all;      \
        ftable->Win_flush_local     = MPIDI_Win_flush_local;    \
        ftable->Win_flush_local_all = MPIDI_Win_flush_local_all;\
80 81 82 83
        ftable->Win_sync            = MPIDI_Win_sync;           \
    } while (0)


84
#undef FUNCNAME
85
#define FUNCNAME MPID_Win_create
86 87
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
88 89
int MPID_Win_create(void *base, MPI_Aint size, int disp_unit, MPID_Info * info,
                    MPID_Comm * comm_ptr, MPID_Win ** win_ptr)
90
{
91
    int mpi_errno = MPI_SUCCESS;
92

93
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_CREATE);
94

95 96
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_CREATE);

Wesley Bland's avatar
Wesley Bland committed
97 98
    /* Check to make sure the communicator hasn't already been revoked */
    if (comm_ptr->revoked) {
99
        MPIU_ERR_SETANDJUMP(mpi_errno, MPIX_ERR_REVOKED, "**revoked");
Wesley Bland's avatar
Wesley Bland committed
100 101
    }

102 103 104 105
    mpi_errno =
        win_init(size, disp_unit, MPI_WIN_FLAVOR_CREATE, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
106

107 108
    (*win_ptr)->base = base;

109 110 111
    mpi_errno = MPIDI_CH3U_Win_fns.create(base, size, disp_unit, info, comm_ptr, win_ptr);
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
112

113
  fn_fail:
114 115 116 117 118 119 120 121 122
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_CREATE);
    return mpi_errno;
}


#undef FUNCNAME
#define FUNCNAME MPID_Win_allocate
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
123 124
int MPID_Win_allocate(MPI_Aint size, int disp_unit, MPID_Info * info,
                      MPID_Comm * comm_ptr, void *baseptr, MPID_Win ** win_ptr)
125
{
126
    int mpi_errno = MPI_SUCCESS;
127
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_ALLOCATE);
128

129 130
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_ALLOCATE);

131 132 133 134 135
    mpi_errno =
        win_init(size, disp_unit, MPI_WIN_FLAVOR_ALLOCATE, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
136

137 138 139
    /* FOR ALLOCATE, alloc_shm info is default to set to TRUE */
    (*win_ptr)->info_args.alloc_shm = TRUE;

140 141
    if (info != NULL) {
        int alloc_shm_flag = 0;
142
        char shm_alloc_value[MPI_MAX_INFO_VAL + 1];
143
        MPIR_Info_get_impl(info, "alloc_shm", MPI_MAX_INFO_VAL, shm_alloc_value, &alloc_shm_flag);
144 145
        if ((alloc_shm_flag == 1) && (!strncmp(shm_alloc_value, "false", sizeof("false"))))
            (*win_ptr)->info_args.alloc_shm = FALSE;
146 147
    }

148
    mpi_errno = MPIDI_CH3U_Win_fns.allocate(size, disp_unit, info, comm_ptr, baseptr, win_ptr);
149 150 151
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
152

153
  fn_fail:
154 155 156 157 158 159 160 161 162
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_ALLOCATE);
    return mpi_errno;
}


#undef FUNCNAME
#define FUNCNAME MPID_Win_create_dynamic
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
163
int MPID_Win_create_dynamic(MPID_Info * info, MPID_Comm * comm_ptr, MPID_Win ** win_ptr)
164
{
165
    int mpi_errno = MPI_SUCCESS;
166

167
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_CREATE_DYNAMIC);
168

169
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_CREATE_DYNAMIC);
170

171 172 173
    mpi_errno = win_init(0 /* spec defines size to be 0 */ ,
                         1 /* spec defines disp_unit to be 1 */ ,
                         MPI_WIN_FLAVOR_DYNAMIC, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
174

175 176
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
177

178 179
    (*win_ptr)->base = MPI_BOTTOM;

180
    mpi_errno = MPIDI_CH3U_Win_fns.create_dynamic(info, comm_ptr, win_ptr);
181 182 183
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
184

185
  fn_fail:
186
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_CREATE_DYNAMIC);
187 188 189 190
    return mpi_errno;
}


191
/* The memory allocation functions */
192 193 194 195
#undef FUNCNAME
#define FUNCNAME MPID_Alloc_mem
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
196
void *MPID_Alloc_mem(size_t size, MPID_Info * info_ptr)
197
{
198
    void *ap = NULL;
199 200 201 202
    MPIDI_STATE_DECL(MPID_STATE_MPID_ALLOC_MEM);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_ALLOC_MEM);

203
    ap = MPIDI_Alloc_mem(size, info_ptr);
204

205 206 207 208 209 210 211 212 213
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_ALLOC_MEM);
    return ap;
}


#undef FUNCNAME
#define FUNCNAME MPID_Free_mem
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
214
int MPID_Free_mem(void *ptr)
215 216 217 218 219 220
{
    int mpi_errno = MPI_SUCCESS;
    MPIDI_STATE_DECL(MPID_STATE_MPID_FREE_MEM);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_FREE_MEM);

221
    mpi_errno = MPIDI_Free_mem(ptr);
222
    if (mpi_errno != MPI_SUCCESS) {
223
        MPIU_ERR_POP(mpi_errno);
224
    }
225 226

  fn_fail:
227
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_FREE_MEM);
228 229 230
    return mpi_errno;
}

231

232 233 234 235
#undef FUNCNAME
#define FUNCNAME MPID_Win_allocate_shared
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
236 237
int MPID_Win_allocate_shared(MPI_Aint size, int disp_unit, MPID_Info * info, MPID_Comm * comm_ptr,
                             void *base_ptr, MPID_Win ** win_ptr)
238
{
239
    int mpi_errno = MPI_SUCCESS;
240 241

    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_ALLOCATE_SHARED);
242

243 244
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_ALLOCATE_SHARED);

245 246 247 248
    mpi_errno =
        win_init(size, disp_unit, MPI_WIN_FLAVOR_SHARED, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
249

250 251 252 253 254
    /* FOR ALLOCATE_SHARED, alloc_shm info is default to set to TRUE */
    (*win_ptr)->info_args.alloc_shm = TRUE;

    if (info != NULL) {
        int alloc_shm_flag = 0;
255
        char shm_alloc_value[MPI_MAX_INFO_VAL + 1];
256 257 258 259 260 261
        MPIR_Info_get_impl(info, "alloc_shm", MPI_MAX_INFO_VAL, shm_alloc_value, &alloc_shm_flag);
        /* if value of 'alloc_shm' info is not set to true, throw an error */
        if (alloc_shm_flag == 1 && strncmp(shm_alloc_value, "true", sizeof("true")))
            MPIU_ERR_SETANDJUMP(mpi_errno, MPI_ERR_OTHER, "**infoval");
    }

262 263 264 265
    mpi_errno =
        MPIDI_CH3U_Win_fns.allocate_shared(size, disp_unit, info, comm_ptr, base_ptr, win_ptr);
    if (mpi_errno != MPI_SUCCESS)
        MPIU_ERR_POP(mpi_errno);
266

267
  fn_fail:
268 269 270
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_ALLOCATE_SHARED);
    return mpi_errno;
}
271 272 273 274 275 276 277


#undef FUNCNAME
#define FUNCNAME win_init
#undef FCNAME
#define FCNAME MPIU_QUOTE(FUNCNAME)
static int win_init(MPI_Aint size, int disp_unit, int create_flavor, int model,
278
                    MPID_Comm * comm_ptr, MPID_Win ** win_ptr)
279 280
{
    int mpi_errno = MPI_SUCCESS;
281
    int i;
282
    MPID_Comm *win_comm_ptr;
283
    int win_target_pool_size;
Xin Zhao's avatar
Xin Zhao committed
284 285
    MPIDI_RMA_Win_list_t *win_elem;
    MPIU_CHKPMEM_DECL(5);
286 287 288 289
    MPIDI_STATE_DECL(MPID_STATE_WIN_INIT);

    MPIDI_FUNC_ENTER(MPID_STATE_WIN_INIT);

290
    if (initRMAoptions) {
291
        MPIU_THREADSAFE_INIT_BLOCK_BEGIN(initRMAoptions);
292 293

        MPIDI_CH3_RMA_Init_Pvars();
294 295 296 297 298

        MPIU_THREADSAFE_INIT_CLEAR(initRMAoptions);
        MPIU_THREADSAFE_INIT_BLOCK_END(initRMAoptions);
    }

299 300 301
    *win_ptr = (MPID_Win *) MPIU_Handle_obj_alloc(&MPID_Win_mem);
    MPIU_ERR_CHKANDJUMP1(!(*win_ptr), mpi_errno, MPI_ERR_OTHER, "**nomem",
                         "**nomem %s", "MPID_Win_mem");
302 303

    mpi_errno = MPIR_Comm_dup_impl(comm_ptr, &win_comm_ptr);
304 305
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
306 307 308 309 310

    MPIU_Object_set_ref(*win_ptr, 1);

    /* (*win_ptr)->errhandler is set by upper level; */
    /* (*win_ptr)->base is set by caller; */
311 312 313 314 315 316
    (*win_ptr)->size = size;
    (*win_ptr)->disp_unit = disp_unit;
    (*win_ptr)->create_flavor = create_flavor;
    (*win_ptr)->model = model;
    (*win_ptr)->attributes = NULL;
    (*win_ptr)->comm_ptr = win_comm_ptr;
317

318
    (*win_ptr)->at_completion_counter = 0;
319 320 321 322
    /* (*win_ptr)->base_addrs[] is set by caller; */
    /* (*win_ptr)->sizes[] is set by caller; */
    /* (*win_ptr)->disp_units[] is set by caller; */
    /* (*win_ptr)->all_win_handles[] is set by caller; */
323
    (*win_ptr)->current_lock_type = MPID_LOCK_NONE;
324
    (*win_ptr)->shared_lock_ref_cnt = 0;
325 326 327 328
    (*win_ptr)->lock_queue = NULL;
    (*win_ptr)->epoch_state = MPIDI_EPOCH_NONE;
    (*win_ptr)->epoch_count = 0;
    (*win_ptr)->at_rma_ops_list = NULL;
329
    (*win_ptr)->at_rma_ops_list_tail = NULL;
330
    (*win_ptr)->shm_allocated = FALSE;
331 332
    (*win_ptr)->states.access_state = MPIDI_RMA_NONE;
    (*win_ptr)->states.exposure_state = MPIDI_RMA_NONE;
333
    (*win_ptr)->non_empty_slots = 0;
334
    (*win_ptr)->posted_ops_cnt = 0;
335
    (*win_ptr)->active_req_cnt = 0;
336 337 338 339 340 341 342 343
    (*win_ptr)->fence_sync_req = MPI_REQUEST_NULL;
    (*win_ptr)->start_req = NULL;
    (*win_ptr)->start_ranks_in_win_grp = NULL;
    (*win_ptr)->start_grp_size = 0;
    (*win_ptr)->lock_all_assert = 0;
    (*win_ptr)->lock_epoch_count = 0;
    (*win_ptr)->outstanding_locks = 0;
    (*win_ptr)->outstanding_unlocks = 0;
344

345
    /* Initialize the passive target lock state */
346
    MPIU_CHKPMEM_MALLOC((*win_ptr)->targets, struct MPIDI_Win_target_state *,
347
                        sizeof(struct MPIDI_Win_target_state) * MPIR_Comm_size(win_comm_ptr),
348 349 350 351
                        mpi_errno, "RMA target states array");

    for (i = 0; i < MPIR_Comm_size(win_comm_ptr); i++) {
        (*win_ptr)->targets[i].rma_ops_list = NULL;
352
        (*win_ptr)->targets[i].rma_ops_list_tail = NULL;
353
        (*win_ptr)->targets[i].remote_lock_state = MPIDI_CH3_WIN_LOCK_NONE;
354 355
    }

356
    /* Initialize the info flags */
357
    (*win_ptr)->info_args.no_locks = 0;
358
    (*win_ptr)->info_args.accumulate_ordering = MPIDI_ACC_ORDER_RAR | MPIDI_ACC_ORDER_RAW |
359 360 361
        MPIDI_ACC_ORDER_WAR | MPIDI_ACC_ORDER_WAW;
    (*win_ptr)->info_args.accumulate_ops = MPIDI_ACC_OPS_SAME_OP_NO_OP;
    (*win_ptr)->info_args.same_size = 0;
362
    (*win_ptr)->info_args.alloc_shared_noncontig = 0;
363
    (*win_ptr)->info_args.alloc_shm = FALSE;
364

365 366 367 368 369 370 371 372 373 374
    MPIU_CHKPMEM_MALLOC((*win_ptr)->op_pool_start, struct MPIDI_RMA_Op *,
                        sizeof(MPIDI_RMA_Op_t) * MPIR_CVAR_CH3_RMA_OP_WIN_POOL_SIZE, mpi_errno,
                        "RMA op pool");
    (*win_ptr)->op_pool = NULL;
    (*win_ptr)->op_pool_tail = NULL;
    for (i = 0; i < MPIR_CVAR_CH3_RMA_OP_WIN_POOL_SIZE; i++) {
        (*win_ptr)->op_pool_start[i].pool_type = MPIDI_RMA_POOL_WIN;
        MPL_LL_APPEND((*win_ptr)->op_pool, (*win_ptr)->op_pool_tail, &((*win_ptr)->op_pool_start[i]));
    }

375 376 377 378 379 380 381 382 383 384 385
    win_target_pool_size = MPIR_MIN(MPIR_CVAR_CH3_RMA_TARGET_WIN_POOL_SIZE, MPIR_Comm_size(win_comm_ptr));
    MPIU_CHKPMEM_MALLOC((*win_ptr)->target_pool_start, struct MPIDI_RMA_Target *,
                        sizeof(MPIDI_RMA_Target_t) * win_target_pool_size,
                        mpi_errno, "RMA target pool");
    (*win_ptr)->target_pool = NULL;
    (*win_ptr)->target_pool_tail = NULL;
    for (i = 0; i < win_target_pool_size; i++) {
        (*win_ptr)->target_pool_start[i].pool_type = MPIDI_RMA_POOL_WIN;
        MPL_LL_APPEND((*win_ptr)->target_pool, (*win_ptr)->target_pool_tail, &((*win_ptr)->target_pool_start[i]));
    }

Xin Zhao's avatar
Xin Zhao committed
386 387 388 389 390 391 392 393
    (*win_ptr)->num_slots = MPIR_MIN(MPIR_CVAR_CH3_RMA_SLOTS_SIZE, MPIR_Comm_size(win_comm_ptr));
    MPIU_CHKPMEM_MALLOC((*win_ptr)->slots, struct MPIDI_RMA_Slot *,
                        sizeof(MPIDI_RMA_Slot_t) * (*win_ptr)->num_slots, mpi_errno, "RMA slots");
    for (i = 0; i < (*win_ptr)->num_slots; i++) {
        (*win_ptr)->slots[i].target_list = NULL;
        (*win_ptr)->slots[i].target_list_tail = NULL;
    }

394 395
    MPID_WIN_FTABLE_SET_DEFAULTS(win_ptr);

Xin Zhao's avatar
Xin Zhao committed
396 397 398 399 400 401
    /* enqueue window into the global list */
    MPIU_CHKPMEM_MALLOC(win_elem, MPIDI_RMA_Win_list_t *, sizeof(MPIDI_RMA_Win_list_t), mpi_errno,
                        "Window list element");
    win_elem->win_ptr = *win_ptr;
    MPL_LL_APPEND(MPIDI_RMA_Win_list, MPIDI_RMA_Win_list_tail, win_elem);

402
  fn_exit:
403 404
    MPIDI_FUNC_EXIT(MPID_STATE_WIN_INIT);
    return mpi_errno;
405
  fn_fail:
406
    MPIU_CHKPMEM_REAP();
407 408
    goto fn_exit;
}
409 410 411 412 413 414


#undef FUNCNAME
#define FUNCNAME MPID_Win_set_info
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
415
int MPID_Win_set_info(MPID_Win * win, MPID_Info * info)
416 417 418 419 420 421 422
{
    int mpi_errno = MPI_SUCCESS;
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_SET_INFO);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_WIN_SET_INFO);

    mpi_errno = win->RMAFns.Win_set_info(win, info);
423 424 425
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
426

427
  fn_exit:
428 429
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_SET_INFO);
    return mpi_errno;
430
  fn_fail:
431 432 433 434 435 436 437 438
    goto fn_exit;
}


#undef FUNCNAME
#define FUNCNAME MPID_Win_get_info
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
439
int MPID_Win_get_info(MPID_Win * win, MPID_Info ** info_used)
440 441 442 443 444 445 446
{
    int mpi_errno = MPI_SUCCESS;
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_GET_INFO);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_WIN_GET_INFO);

    mpi_errno = win->RMAFns.Win_get_info(win, info_used);
447 448 449
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
450

451
  fn_exit:
452 453
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_GET_INFO);
    return mpi_errno;
454
  fn_fail:
455 456
    goto fn_exit;
}