mpid_rma.c 15.4 KB
Newer Older
1
/* -*- Mode: C; c-basic-offset:4 ; indent-tabs-mode:nil ; -*- */
2 3 4 5 6 7
/*
 *  (C) 2001 by Argonne National Laboratory.
 *      See COPYRIGHT in top-level directory.
 */

#include "mpidimpl.h"
8
#include "mpidrma.h"
9

Xin Zhao's avatar
Xin Zhao committed
10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
=== BEGIN_MPI_T_CVAR_INFO_BLOCK ===

cvars:
    - name        : MPIR_CVAR_CH3_RMA_SLOTS_SIZE
      category    : CH3
      type        : int
      default     : 262144
      class       : none
      verbosity   : MPI_T_VERBOSITY_USER_BASIC
      scope       : MPI_T_SCOPE_ALL_EQ
      description : >-
        Number of RMA slots during window creation. Each slot contains
        a linked list of target elements. The distribution of ranks among
        slots follows a round-robin pattern. Requires a positive value.

=== END_MPI_T_CVAR_INFO_BLOCK ===
*/

29 30 31

MPIU_THREADSAFE_INIT_DECL(initRMAoptions);

Xin Zhao's avatar
Xin Zhao committed
32 33
MPIDI_RMA_Win_list_t *MPIDI_RMA_Win_list = NULL, *MPIDI_RMA_Win_list_tail = NULL;

34
static int win_init(MPI_Aint size, int disp_unit, int create_flavor, int model,
35
                    MPID_Comm * comm_ptr, MPID_Win ** win_ptr);
36 37


38 39 40
#define MPID_WIN_FTABLE_SET_DEFAULTS(win_ptr)                   \
    do {                                                        \
        /* Get ptr to RMAFns, which is embedded in MPID_Win */  \
41
        MPID_RMAFns *ftable         = &(*(win_ptr))->RMAFns;    \
42
        ftable->Win_free            = MPIDI_Win_free;           \
43 44
        ftable->Win_attach          = MPIDI_Win_attach;         \
        ftable->Win_detach          = MPIDI_Win_detach;         \
45 46
        ftable->Win_shared_query    = MPIDI_Win_shared_query;   \
                                                                \
47 48 49
        ftable->Win_set_info        = MPIDI_Win_set_info;       \
        ftable->Win_get_info        = MPIDI_Win_get_info;       \
                                                                \
50 51 52
        ftable->Put                 = MPIDI_Put;                \
        ftable->Get                 = MPIDI_Get;                \
        ftable->Accumulate          = MPIDI_Accumulate;         \
53 54 55
        ftable->Get_accumulate      = MPIDI_Get_accumulate;     \
        ftable->Fetch_and_op        = MPIDI_Fetch_and_op;       \
        ftable->Compare_and_swap    = MPIDI_Compare_and_swap;   \
56
                                                                \
57 58 59 60
        ftable->Rput                = MPIDI_Rput;               \
        ftable->Rget                = MPIDI_Rget;               \
        ftable->Raccumulate         = MPIDI_Raccumulate;        \
        ftable->Rget_accumulate     = MPIDI_Rget_accumulate;    \
61 62 63 64 65 66 67 68 69 70 71 72 73
                                                                \
        ftable->Win_fence           = MPIDI_Win_fence;          \
        ftable->Win_post            = MPIDI_Win_post;           \
        ftable->Win_start           = MPIDI_Win_start;          \
        ftable->Win_complete        = MPIDI_Win_complete;       \
        ftable->Win_wait            = MPIDI_Win_wait;           \
        ftable->Win_test            = MPIDI_Win_test;           \
                                                                \
        ftable->Win_lock            = MPIDI_Win_lock;           \
        ftable->Win_unlock          = MPIDI_Win_unlock;         \
        ftable->Win_lock_all        = MPIDI_Win_lock_all;       \
        ftable->Win_unlock_all      = MPIDI_Win_unlock_all;     \
                                                                \
74 75 76 77
        ftable->Win_flush           = MPIDI_Win_flush;          \
        ftable->Win_flush_all       = MPIDI_Win_flush_all;      \
        ftable->Win_flush_local     = MPIDI_Win_flush_local;    \
        ftable->Win_flush_local_all = MPIDI_Win_flush_local_all;\
78 79 80 81
        ftable->Win_sync            = MPIDI_Win_sync;           \
    } while (0)


82
#undef FUNCNAME
83
#define FUNCNAME MPID_Win_create
84 85
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
86 87
int MPID_Win_create(void *base, MPI_Aint size, int disp_unit, MPID_Info * info,
                    MPID_Comm * comm_ptr, MPID_Win ** win_ptr)
88
{
89
    int mpi_errno = MPI_SUCCESS;
90

91
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_CREATE);
92

93 94
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_CREATE);

Wesley Bland's avatar
Wesley Bland committed
95 96
    /* Check to make sure the communicator hasn't already been revoked */
    if (comm_ptr->revoked) {
97
        MPIU_ERR_SETANDJUMP(mpi_errno, MPIX_ERR_REVOKED, "**revoked");
Wesley Bland's avatar
Wesley Bland committed
98 99
    }

100 101 102 103
    mpi_errno =
        win_init(size, disp_unit, MPI_WIN_FLAVOR_CREATE, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
104

105 106
    (*win_ptr)->base = base;

107 108 109
    mpi_errno = MPIDI_CH3U_Win_fns.create(base, size, disp_unit, info, comm_ptr, win_ptr);
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
110

111
  fn_fail:
112 113 114 115 116 117 118 119 120
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_CREATE);
    return mpi_errno;
}


#undef FUNCNAME
#define FUNCNAME MPID_Win_allocate
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
121 122
int MPID_Win_allocate(MPI_Aint size, int disp_unit, MPID_Info * info,
                      MPID_Comm * comm_ptr, void *baseptr, MPID_Win ** win_ptr)
123
{
124
    int mpi_errno = MPI_SUCCESS;
125
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_ALLOCATE);
126

127 128
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_ALLOCATE);

129 130 131 132 133
    mpi_errno =
        win_init(size, disp_unit, MPI_WIN_FLAVOR_ALLOCATE, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
134

135 136 137
    /* FOR ALLOCATE, alloc_shm info is default to set to TRUE */
    (*win_ptr)->info_args.alloc_shm = TRUE;

138 139
    if (info != NULL) {
        int alloc_shm_flag = 0;
140
        char shm_alloc_value[MPI_MAX_INFO_VAL + 1];
141
        MPIR_Info_get_impl(info, "alloc_shm", MPI_MAX_INFO_VAL, shm_alloc_value, &alloc_shm_flag);
142 143
        if ((alloc_shm_flag == 1) && (!strncmp(shm_alloc_value, "false", sizeof("false"))))
            (*win_ptr)->info_args.alloc_shm = FALSE;
144 145
    }

146
    mpi_errno = MPIDI_CH3U_Win_fns.allocate(size, disp_unit, info, comm_ptr, baseptr, win_ptr);
147 148 149
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
150

151
  fn_fail:
152 153 154 155 156 157 158 159 160
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_ALLOCATE);
    return mpi_errno;
}


#undef FUNCNAME
#define FUNCNAME MPID_Win_create_dynamic
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
161
int MPID_Win_create_dynamic(MPID_Info * info, MPID_Comm * comm_ptr, MPID_Win ** win_ptr)
162
{
163
    int mpi_errno = MPI_SUCCESS;
164

165
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_CREATE_DYNAMIC);
166

167
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_CREATE_DYNAMIC);
168

169 170 171
    mpi_errno = win_init(0 /* spec defines size to be 0 */ ,
                         1 /* spec defines disp_unit to be 1 */ ,
                         MPI_WIN_FLAVOR_DYNAMIC, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
172

173 174
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
175

176 177
    (*win_ptr)->base = MPI_BOTTOM;

178
    mpi_errno = MPIDI_CH3U_Win_fns.create_dynamic(info, comm_ptr, win_ptr);
179 180 181
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
182

183
  fn_fail:
184
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_CREATE_DYNAMIC);
185 186 187 188
    return mpi_errno;
}


189
/* The memory allocation functions */
190 191 192 193
#undef FUNCNAME
#define FUNCNAME MPID_Alloc_mem
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
194
void *MPID_Alloc_mem(size_t size, MPID_Info * info_ptr)
195
{
196
    void *ap = NULL;
197 198 199 200
    MPIDI_STATE_DECL(MPID_STATE_MPID_ALLOC_MEM);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_ALLOC_MEM);

201
    ap = MPIDI_Alloc_mem(size, info_ptr);
202

203 204 205 206 207 208 209 210 211
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_ALLOC_MEM);
    return ap;
}


#undef FUNCNAME
#define FUNCNAME MPID_Free_mem
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
212
int MPID_Free_mem(void *ptr)
213 214 215 216 217 218
{
    int mpi_errno = MPI_SUCCESS;
    MPIDI_STATE_DECL(MPID_STATE_MPID_FREE_MEM);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_FREE_MEM);

219
    mpi_errno = MPIDI_Free_mem(ptr);
220
    if (mpi_errno != MPI_SUCCESS) {
221
        MPIU_ERR_POP(mpi_errno);
222
    }
223 224

  fn_fail:
225
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_FREE_MEM);
226 227 228
    return mpi_errno;
}

229

230 231 232 233
#undef FUNCNAME
#define FUNCNAME MPID_Win_allocate_shared
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
234 235
int MPID_Win_allocate_shared(MPI_Aint size, int disp_unit, MPID_Info * info, MPID_Comm * comm_ptr,
                             void *base_ptr, MPID_Win ** win_ptr)
236
{
237
    int mpi_errno = MPI_SUCCESS;
238 239

    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_ALLOCATE_SHARED);
240

241 242
    MPIDI_RMA_FUNC_ENTER(MPID_STATE_MPID_WIN_ALLOCATE_SHARED);

243 244 245 246
    mpi_errno =
        win_init(size, disp_unit, MPI_WIN_FLAVOR_SHARED, MPI_WIN_UNIFIED, comm_ptr, win_ptr);
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
247

248 249 250 251 252
    /* FOR ALLOCATE_SHARED, alloc_shm info is default to set to TRUE */
    (*win_ptr)->info_args.alloc_shm = TRUE;

    if (info != NULL) {
        int alloc_shm_flag = 0;
253
        char shm_alloc_value[MPI_MAX_INFO_VAL + 1];
254 255 256 257 258 259
        MPIR_Info_get_impl(info, "alloc_shm", MPI_MAX_INFO_VAL, shm_alloc_value, &alloc_shm_flag);
        /* if value of 'alloc_shm' info is not set to true, throw an error */
        if (alloc_shm_flag == 1 && strncmp(shm_alloc_value, "true", sizeof("true")))
            MPIU_ERR_SETANDJUMP(mpi_errno, MPI_ERR_OTHER, "**infoval");
    }

260 261 262 263
    mpi_errno =
        MPIDI_CH3U_Win_fns.allocate_shared(size, disp_unit, info, comm_ptr, base_ptr, win_ptr);
    if (mpi_errno != MPI_SUCCESS)
        MPIU_ERR_POP(mpi_errno);
264

265
  fn_fail:
266 267 268
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_ALLOCATE_SHARED);
    return mpi_errno;
}
269 270 271 272 273 274 275


#undef FUNCNAME
#define FUNCNAME win_init
#undef FCNAME
#define FCNAME MPIU_QUOTE(FUNCNAME)
static int win_init(MPI_Aint size, int disp_unit, int create_flavor, int model,
276
                    MPID_Comm * comm_ptr, MPID_Win ** win_ptr)
277 278
{
    int mpi_errno = MPI_SUCCESS;
279
    int i;
280
    MPID_Comm *win_comm_ptr;
281
    int win_target_pool_size;
Xin Zhao's avatar
Xin Zhao committed
282 283
    MPIDI_RMA_Win_list_t *win_elem;
    MPIU_CHKPMEM_DECL(5);
284 285 286 287
    MPIDI_STATE_DECL(MPID_STATE_WIN_INIT);

    MPIDI_FUNC_ENTER(MPID_STATE_WIN_INIT);

288
    if (initRMAoptions) {
289
        MPIU_THREADSAFE_INIT_BLOCK_BEGIN(initRMAoptions);
290 291

        MPIDI_CH3_RMA_Init_Pvars();
292 293 294 295 296

        MPIU_THREADSAFE_INIT_CLEAR(initRMAoptions);
        MPIU_THREADSAFE_INIT_BLOCK_END(initRMAoptions);
    }

297 298 299
    *win_ptr = (MPID_Win *) MPIU_Handle_obj_alloc(&MPID_Win_mem);
    MPIU_ERR_CHKANDJUMP1(!(*win_ptr), mpi_errno, MPI_ERR_OTHER, "**nomem",
                         "**nomem %s", "MPID_Win_mem");
300 301

    mpi_errno = MPIR_Comm_dup_impl(comm_ptr, &win_comm_ptr);
302 303
    if (mpi_errno)
        MPIU_ERR_POP(mpi_errno);
304 305 306

    MPIU_Object_set_ref(*win_ptr, 1);

307
    (*win_ptr)->fence_issued = 0;
308 309
    /* (*win_ptr)->errhandler is set by upper level; */
    /* (*win_ptr)->base is set by caller; */
310 311 312 313 314 315 316 317
    (*win_ptr)->size = size;
    (*win_ptr)->disp_unit = disp_unit;
    (*win_ptr)->create_flavor = create_flavor;
    (*win_ptr)->model = model;
    (*win_ptr)->attributes = NULL;
    (*win_ptr)->start_group_ptr = NULL;
    (*win_ptr)->start_assert = 0;
    (*win_ptr)->comm_ptr = win_comm_ptr;
318

319
    (*win_ptr)->at_completion_counter = 0;
320 321 322 323
    /* (*win_ptr)->base_addrs[] is set by caller; */
    /* (*win_ptr)->sizes[] is set by caller; */
    /* (*win_ptr)->disp_units[] is set by caller; */
    /* (*win_ptr)->all_win_handles[] is set by caller; */
324
    (*win_ptr)->current_lock_type = MPID_LOCK_NONE;
325
    (*win_ptr)->shared_lock_ref_cnt = 0;
326 327 328 329
    (*win_ptr)->lock_queue = NULL;
    (*win_ptr)->epoch_state = MPIDI_EPOCH_NONE;
    (*win_ptr)->epoch_count = 0;
    (*win_ptr)->at_rma_ops_list = NULL;
330
    (*win_ptr)->at_rma_ops_list_tail = NULL;
331
    (*win_ptr)->shm_allocated = FALSE;
332 333
    (*win_ptr)->states.access_state = MPIDI_RMA_NONE;
    (*win_ptr)->states.exposure_state = MPIDI_RMA_NONE;
334
    (*win_ptr)->non_empty_slots = 0;
335
    (*win_ptr)->posted_ops_cnt = 0;
336
    (*win_ptr)->active_req_cnt = 0;
337

338
    /* Initialize the passive target lock state */
339
    MPIU_CHKPMEM_MALLOC((*win_ptr)->targets, struct MPIDI_Win_target_state *,
340
                        sizeof(struct MPIDI_Win_target_state) * MPIR_Comm_size(win_comm_ptr),
341 342 343 344
                        mpi_errno, "RMA target states array");

    for (i = 0; i < MPIR_Comm_size(win_comm_ptr); i++) {
        (*win_ptr)->targets[i].rma_ops_list = NULL;
345
        (*win_ptr)->targets[i].rma_ops_list_tail = NULL;
346
        (*win_ptr)->targets[i].remote_lock_state = MPIDI_CH3_WIN_LOCK_NONE;
347 348
    }

349
    /* Initialize the info flags */
350
    (*win_ptr)->info_args.no_locks = 0;
351
    (*win_ptr)->info_args.accumulate_ordering = MPIDI_ACC_ORDER_RAR | MPIDI_ACC_ORDER_RAW |
352 353 354
        MPIDI_ACC_ORDER_WAR | MPIDI_ACC_ORDER_WAW;
    (*win_ptr)->info_args.accumulate_ops = MPIDI_ACC_OPS_SAME_OP_NO_OP;
    (*win_ptr)->info_args.same_size = 0;
355
    (*win_ptr)->info_args.alloc_shared_noncontig = 0;
356
    (*win_ptr)->info_args.alloc_shm = FALSE;
357

358 359 360 361 362 363 364 365 366 367
    MPIU_CHKPMEM_MALLOC((*win_ptr)->op_pool_start, struct MPIDI_RMA_Op *,
                        sizeof(MPIDI_RMA_Op_t) * MPIR_CVAR_CH3_RMA_OP_WIN_POOL_SIZE, mpi_errno,
                        "RMA op pool");
    (*win_ptr)->op_pool = NULL;
    (*win_ptr)->op_pool_tail = NULL;
    for (i = 0; i < MPIR_CVAR_CH3_RMA_OP_WIN_POOL_SIZE; i++) {
        (*win_ptr)->op_pool_start[i].pool_type = MPIDI_RMA_POOL_WIN;
        MPL_LL_APPEND((*win_ptr)->op_pool, (*win_ptr)->op_pool_tail, &((*win_ptr)->op_pool_start[i]));
    }

368 369 370 371 372 373 374 375 376 377 378
    win_target_pool_size = MPIR_MIN(MPIR_CVAR_CH3_RMA_TARGET_WIN_POOL_SIZE, MPIR_Comm_size(win_comm_ptr));
    MPIU_CHKPMEM_MALLOC((*win_ptr)->target_pool_start, struct MPIDI_RMA_Target *,
                        sizeof(MPIDI_RMA_Target_t) * win_target_pool_size,
                        mpi_errno, "RMA target pool");
    (*win_ptr)->target_pool = NULL;
    (*win_ptr)->target_pool_tail = NULL;
    for (i = 0; i < win_target_pool_size; i++) {
        (*win_ptr)->target_pool_start[i].pool_type = MPIDI_RMA_POOL_WIN;
        MPL_LL_APPEND((*win_ptr)->target_pool, (*win_ptr)->target_pool_tail, &((*win_ptr)->target_pool_start[i]));
    }

Xin Zhao's avatar
Xin Zhao committed
379 380 381 382 383 384 385 386
    (*win_ptr)->num_slots = MPIR_MIN(MPIR_CVAR_CH3_RMA_SLOTS_SIZE, MPIR_Comm_size(win_comm_ptr));
    MPIU_CHKPMEM_MALLOC((*win_ptr)->slots, struct MPIDI_RMA_Slot *,
                        sizeof(MPIDI_RMA_Slot_t) * (*win_ptr)->num_slots, mpi_errno, "RMA slots");
    for (i = 0; i < (*win_ptr)->num_slots; i++) {
        (*win_ptr)->slots[i].target_list = NULL;
        (*win_ptr)->slots[i].target_list_tail = NULL;
    }

387 388
    MPID_WIN_FTABLE_SET_DEFAULTS(win_ptr);

Xin Zhao's avatar
Xin Zhao committed
389 390 391 392 393 394
    /* enqueue window into the global list */
    MPIU_CHKPMEM_MALLOC(win_elem, MPIDI_RMA_Win_list_t *, sizeof(MPIDI_RMA_Win_list_t), mpi_errno,
                        "Window list element");
    win_elem->win_ptr = *win_ptr;
    MPL_LL_APPEND(MPIDI_RMA_Win_list, MPIDI_RMA_Win_list_tail, win_elem);

395
  fn_exit:
396 397
    MPIDI_FUNC_EXIT(MPID_STATE_WIN_INIT);
    return mpi_errno;
398
  fn_fail:
399
    MPIU_CHKPMEM_REAP();
400 401
    goto fn_exit;
}
402 403 404 405 406 407


#undef FUNCNAME
#define FUNCNAME MPID_Win_set_info
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
408
int MPID_Win_set_info(MPID_Win * win, MPID_Info * info)
409 410 411 412 413 414 415
{
    int mpi_errno = MPI_SUCCESS;
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_SET_INFO);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_WIN_SET_INFO);

    mpi_errno = win->RMAFns.Win_set_info(win, info);
416 417 418
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
419

420
  fn_exit:
421 422
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_SET_INFO);
    return mpi_errno;
423
  fn_fail:
424 425 426 427 428 429 430 431
    goto fn_exit;
}


#undef FUNCNAME
#define FUNCNAME MPID_Win_get_info
#undef FCNAME
#define FCNAME MPIDI_QUOTE(FUNCNAME)
432
int MPID_Win_get_info(MPID_Win * win, MPID_Info ** info_used)
433 434 435 436 437 438 439
{
    int mpi_errno = MPI_SUCCESS;
    MPIDI_STATE_DECL(MPID_STATE_MPID_WIN_GET_INFO);

    MPIDI_FUNC_ENTER(MPID_STATE_MPID_WIN_GET_INFO);

    mpi_errno = win->RMAFns.Win_get_info(win, info_used);
440 441 442
    if (mpi_errno != MPI_SUCCESS) {
        MPIU_ERR_POP(mpi_errno);
    }
443

444
  fn_exit:
445 446
    MPIDI_FUNC_EXIT(MPID_STATE_MPID_WIN_GET_INFO);
    return mpi_errno;
447
  fn_fail:
448 449
    goto fn_exit;
}