margo.c 23.4 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11

/*
 * (C) 2015 The University of Chicago
 * 
 * See COPYRIGHT in top-level directory.
 */

#include <assert.h>
#include <unistd.h>
#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <math.h>
#include <abt.h>
#include <abt-snoozer.h>

#include "margo.h"
#include "margo-timer.h"
#include "utlist.h"
#include "uthash.h"
20

21 22
#define MERCURY_PROGRESS_TIMEOUT_UB 100 /* 100 milliseconds */

23 24 25 26 27 28 29 30 31 32 33 34 35
/* Hash key for multiplexed RPC registrations: an RPC id paired with a
 * multiplex id.  Code in this file that builds one of these zeroes the
 * whole struct with memset() first, because the key is hashed over
 * sizeof(key) bytes.
 */
struct mplex_key
{
    hg_id_t id;
    uint32_t mplex_id;
};

/* One entry in a margo instance's multiplex hash table: associates an
 * (RPC id, multiplex id) key with an Argobots pool.
 */
struct mplex_element
{
    struct mplex_key key;
    ABT_pool pool;
    UT_hash_handle hh; /* uthash handle; named "hh" in the HASH_* calls */
};

Philip Carns's avatar
Philip Carns committed
36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51
/* Running statistics for one diagnostic measurement. */
struct diag_data
{
    double min;        /* smallest sample recorded */
    double max;        /* largest sample recorded */
    double cumulative; /* sum of all samples */
    int count;         /* number of samples */
};

/* Fold one sample (__time) into a struct diag_data accumulator (__data).
 *
 * __data must be an lvalue of type struct diag_data.  __time is evaluated
 * exactly once.  The first sample recorded (count goes from 0 to 1) seeds
 * both min and max; without that, a zero-initialized accumulator would
 * report a minimum of 0 forever for positive samples.
 */
#define __DIAG_UPDATE(__data, __time)\
do {\
    double __diag_sample = (__time); \
    (__data).count++; \
    (__data).cumulative += __diag_sample; \
    if((__data).count == 1 || __diag_sample > (__data).max) \
        (__data).max = __diag_sample; \
    if((__data).count == 1 || __diag_sample < (__data).min) \
        (__data).min = __diag_sample; \
} while(0)

52 53
struct margo_instance
{
54
    /* provided by caller */
55 56
    hg_context_t *hg_context;
    hg_class_t *hg_class;
57 58 59
    ABT_pool handler_pool;
    ABT_pool progress_pool;

60
    /* internal to margo for this particular instance */
61 62
    ABT_thread hg_progress_tid;
    int hg_progress_shutdown_flag;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
63
    ABT_xstream progress_xstream;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
64 65 66
    int owns_progress_pool;
    ABT_xstream *rpc_xstreams;
    int num_handler_pool_threads;
67 68 69

    /* control logic for callers waiting on margo to be finalized */
    int finalize_flag;
70
    int waiters_in_progress_pool;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
71
    int refcount;
72 73 74
    ABT_mutex finalize_mutex;
    ABT_cond finalize_cond;

75
    int table_index;
76 77 78

    /* hash table to track multiplexed rpcs registered with margo */
    struct mplex_element *mplex_table;
Philip Carns's avatar
Philip Carns committed
79 80 81 82 83 84 85 86 87 88 89 90

    /* optional diagnostics data tracking */
    /* NOTE: technically the following fields are subject to races if they
     * are updated from more than one thread at a time.  We will be careful
     * to only update the counters from the progress_fn,
     * which will serialize access.
     */
    int diag_enabled;
    struct diag_data diag_trigger_elapsed;
    struct diag_data diag_progress_elapsed_zero_timeout;
    struct diag_data diag_progress_elapsed_nonzero_timeout;
    struct diag_data diag_progress_timeout_value;
91 92 93 94 95 96 97 98
};

/* Pairs a Mercury class with the margo instance that was initialized on it;
 * used as the element type of handler_mapping_table.
 */
struct margo_handler_mapping
{
    hg_class_t *class;
    margo_instance_id mid;
};

99 100 101 102 103 104 105
/* Argument handed to Mercury completion callbacks in this file. */
struct margo_cb_arg
{
    ABT_eventual *eventual; /* eventual the callback sets with the operation's result */
    margo_instance_id mid;  /* instance the operation was issued on */
    char in_pool;           /* nonzero if the issuer was counted in waiters_in_progress_pool */
};

106 107 108
/* Capacity of handler_mapping_table; margo_init_pool() refuses to create an
 * instance once this many are registered.
 */
#define MAX_HANDLER_MAPPING 8
/* Number of entries of handler_mapping_table currently in use. */
static int handler_mapping_table_size = 0;
/* Table associating Mercury classes with live margo instances. */
static struct margo_handler_mapping handler_mapping_table[MAX_HANDLER_MAPPING] = {0};
109

110
static void hg_progress_fn(void* foo);
111
static int margo_xstream_is_in_progress_pool(margo_instance_id mid);
112 113 114 115 116 117 118 119

/* Singly linked list node pairing a handler function pointer with a Mercury
 * handle.  NOTE(review): not referenced by any code in the part of the file
 * reviewed here -- confirm whether it is still needed.
 */
struct handler_entry
{
    void* fn;
    hg_handle_t handle;
    struct handler_entry *next; 
};

Jonathan Jenkins's avatar
Jonathan Jenkins committed
120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167
/**
 * Convenience initializer that sets up the Argobots pools for a margo
 * instance and then calls margo_init_pool().
 *
 * @param use_progress_thread nonzero: create a dedicated xstream (and pool)
 *        for the Mercury progress loop; zero: use the calling xstream's
 *        main pool
 * @param rpc_thread_count >0: create that many xstreams sharing a handler
 *        pool; 0: handlers use the calling xstream's main pool; <0:
 *        handlers share the progress pool
 * @param hg_context Mercury context to drive
 * @return the new instance, or MARGO_INSTANCE_NULL on failure
 */
margo_instance_id margo_init(int use_progress_thread, int rpc_thread_count,
    hg_context_t *hg_context)
{
    struct margo_instance *mid = MARGO_INSTANCE_NULL;
    ABT_xstream progress_xstream = ABT_XSTREAM_NULL;
    ABT_pool progress_pool = ABT_POOL_NULL;
    ABT_xstream *rpc_xstreams = NULL;
    ABT_xstream rpc_xstream = ABT_XSTREAM_NULL;
    ABT_pool rpc_pool = ABT_POOL_NULL;
    int ret;
    int i;

    if (use_progress_thread)
    {
        ret = ABT_snoozer_xstream_create(1, &progress_pool, &progress_xstream);
        if (ret != ABT_SUCCESS) goto err;
    }
    else
    {
        ret = ABT_xstream_self(&progress_xstream);
        if (ret != ABT_SUCCESS) goto err;
        ret = ABT_xstream_get_main_pools(progress_xstream, 1, &progress_pool);
        if (ret != ABT_SUCCESS) goto err;
    }

    if (rpc_thread_count > 0)
    {
        rpc_xstreams = malloc((size_t)rpc_thread_count * sizeof(*rpc_xstreams));
        if (rpc_xstreams == NULL) goto err;
        ret = ABT_snoozer_xstream_create(rpc_thread_count, &rpc_pool,
                rpc_xstreams);
        if (ret != ABT_SUCCESS)
        {
            /* The array was never filled in, so its contents are
             * indeterminate; release it here so the error path below does
             * not try to join/free garbage handles.
             */
            free(rpc_xstreams);
            rpc_xstreams = NULL;
            goto err;
        }
    }
    else if (rpc_thread_count == 0)
    {
        ret = ABT_xstream_self(&rpc_xstream);
        if (ret != ABT_SUCCESS) goto err;
        ret = ABT_xstream_get_main_pools(rpc_xstream, 1, &rpc_pool);
        if (ret != ABT_SUCCESS) goto err;
    }
    else
    {
        rpc_pool = progress_pool;
    }

    mid = margo_init_pool(progress_pool, rpc_pool, hg_context);
    if (mid == MARGO_INSTANCE_NULL) goto err;

    /* record what this function created so margo_cleanup() can undo it */
    mid->owns_progress_pool = use_progress_thread;
    mid->progress_xstream = progress_xstream;
    mid->num_handler_pool_threads = rpc_thread_count < 0 ? 0 : rpc_thread_count;
    mid->rpc_xstreams = rpc_xstreams;
    return mid;

err:
    if (use_progress_thread && progress_xstream != ABT_XSTREAM_NULL)
    {
        ABT_xstream_join(progress_xstream);
        ABT_xstream_free(&progress_xstream);
    }
    if (rpc_thread_count > 0 && rpc_xstreams != NULL)
    {
        for (i = 0; i < rpc_thread_count; i++)
        {
            ABT_xstream_join(rpc_xstreams[i]);
            ABT_xstream_free(&rpc_xstreams[i]);
        }
        free(rpc_xstreams);
    }
    return MARGO_INSTANCE_NULL;
}

margo_instance_id margo_init_pool(ABT_pool progress_pool, ABT_pool handler_pool,
Jonathan Jenkins's avatar
Jonathan Jenkins committed
193
    hg_context_t *hg_context)
194 195
{
    int ret;
196 197 198
    struct margo_instance *mid;

    if(handler_mapping_table_size >= MAX_HANDLER_MAPPING)
199
        return(MARGO_INSTANCE_NULL);
200 201 202

    mid = malloc(sizeof(*mid));
    if(!mid)
203
        return(MARGO_INSTANCE_NULL);
204
    memset(mid, 0, sizeof(*mid));
205

206 207 208
    ABT_mutex_create(&mid->finalize_mutex);
    ABT_cond_create(&mid->finalize_cond);

209 210
    mid->progress_pool = progress_pool;
    mid->handler_pool = handler_pool;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
211
    mid->hg_class = HG_Context_get_class(hg_context);
212
    mid->hg_context = hg_context;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
213
    mid->refcount = 1;
214

215 216 217 218 219 220 221 222
    ret = margo_timer_instance_init(mid);
    if(ret != 0)
    {
        fprintf(stderr, "Error: margo_timer_instance_init()\n");
        free(mid);
        return(MARGO_INSTANCE_NULL);
    }

223
    ret = ABT_thread_create(mid->progress_pool, hg_progress_fn, mid, 
224
        ABT_THREAD_ATTR_NULL, &mid->hg_progress_tid);
225 226 227
    if(ret != 0)
    {
        fprintf(stderr, "Error: ABT_thread_create()\n");
228
        free(mid);
229
        return(MARGO_INSTANCE_NULL);
230 231
    }

232 233 234 235 236 237
    handler_mapping_table[handler_mapping_table_size].mid = mid;
    handler_mapping_table[handler_mapping_table_size].class = mid->hg_class;
    mid->table_index = handler_mapping_table_size;
    handler_mapping_table_size++;

    return mid;
238 239
}

Jonathan Jenkins's avatar
Jonathan Jenkins committed
240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267
/* Release every resource owned by a margo instance and free the instance
 * itself.  Called by whichever of margo_finalize() /
 * margo_wait_for_finalize() drops the last reference.
 */
static void margo_cleanup(margo_instance_id mid)
{
    int i;
    struct mplex_element *element;
    struct mplex_element *tmp;

    margo_timer_instance_finalize(mid);

    ABT_mutex_free(&mid->finalize_mutex);
    ABT_cond_free(&mid->finalize_cond);

    /* only tear down xstreams that margo_init() created on our behalf */
    if (mid->owns_progress_pool)
    {
        ABT_xstream_join(mid->progress_xstream);
        ABT_xstream_free(&mid->progress_xstream);
    }

    if (mid->num_handler_pool_threads > 0)
    {
        for (i = 0; i < mid->num_handler_pool_threads; i++)
        {
            ABT_xstream_join(mid->rpc_xstreams[i]);
            ABT_xstream_free(&mid->rpc_xstreams[i]);
        }
        free(mid->rpc_xstreams);
    }

    /* free the entries malloc'd by margo_register_mplex() */
    HASH_ITER(hh, mid->mplex_table, element, tmp)
    {
        HASH_DEL(mid->mplex_table, element);
        free(element);
    }

    free(mid);
}

268
/**
 * Shut down a margo instance: stop the progress ULT, remove the instance
 * from the class-to-instance table, and wake any callers blocked in
 * margo_wait_for_finalize().  The instance is freed here only if no such
 * waiter still holds a reference; otherwise the last waiter frees it.
 *
 * @param mid instance to finalize
 */
void margo_finalize(margo_instance_id mid)
{
    int i;
    int do_cleanup;

    /* tell progress thread to wrap things up */
    mid->hg_progress_shutdown_flag = 1;

    /* wait for it to shutdown cleanly */
    ABT_thread_join(mid->hg_progress_tid);
    ABT_thread_free(&mid->hg_progress_tid);

    /* close the gap left by this instance in the mapping table; every entry
     * that moves down must have its recorded index updated too, otherwise a
     * later finalize of that instance would remove the wrong slot
     */
    for(i=mid->table_index; i<(handler_mapping_table_size-1); i++)
    {
        handler_mapping_table[i] = handler_mapping_table[i+1];
        handler_mapping_table[i].mid->table_index = i;
    }
    handler_mapping_table_size--;

    ABT_mutex_lock(mid->finalize_mutex);
    mid->finalize_flag = 1;
    ABT_cond_broadcast(mid->finalize_cond);

    mid->refcount--;
    do_cleanup = mid->refcount == 0;

    ABT_mutex_unlock(mid->finalize_mutex);

    /* if there was no one waiting on the finalize at the time of the
     * finalize broadcast, then we're safe to clean up. Otherwise, let the
     * last waiter do it
     */
    if (do_cleanup)
        margo_cleanup(mid);

    return;
}

/**
 * Block the caller until margo_finalize() has been called on the instance.
 * The waiter holds a reference on the instance while blocked; whichever
 * party drops the last reference performs the cleanup.
 *
 * @param mid instance to wait on
 */
void margo_wait_for_finalize(margo_instance_id mid)
{
    int in_pool = 0;
    int do_cleanup;

    /* Is this waiter in the same pool as the pool running the progress
     * thread?
     */
    if(margo_xstream_is_in_progress_pool(mid))
        in_pool = 1;

    ABT_mutex_lock(mid->finalize_mutex);

        /* let the progress loop know this ULT is idle, not runnable */
        mid->waiters_in_progress_pool += in_pool;
        mid->refcount++;

        while(!mid->finalize_flag)
            ABT_cond_wait(mid->finalize_cond, mid->finalize_mutex);

        mid->refcount--;
        do_cleanup = mid->refcount == 0;

    ABT_mutex_unlock(mid->finalize_mutex);

    if (do_cleanup)
        margo_cleanup(mid);

    return;
}

/* dedicated thread function to drive Mercury progress */
335
static void hg_progress_fn(void* foo)
336 337 338
{
    int ret;
    unsigned int actual_count;
339
    struct margo_instance *mid = (struct margo_instance *)foo;
340
    size_t size;
341 342
    unsigned int hg_progress_timeout = MERCURY_PROGRESS_TIMEOUT_UB;
    double next_timer_exp;
343
    int trigger_happened;
Philip Carns's avatar
Philip Carns committed
344 345
    double tm1, tm2;
    int diag_enabled = 0;
346

347
    while(!mid->hg_progress_shutdown_flag)
348
    {
349
        trigger_happened = 0;
350
        do {
Philip Carns's avatar
Philip Carns committed
351 352 353 354 355 356
            /* save value of instance diag variable, in case it is modified
             * while we are in loop 
             */
            diag_enabled = mid->diag_enabled;

            if(diag_enabled) tm1 = ABT_get_wtime();
357
            ret = HG_Trigger(mid->hg_context, 0, 1, &actual_count);
Philip Carns's avatar
Philip Carns committed
358 359 360 361 362 363
            if(diag_enabled)
            {
                tm2 = ABT_get_wtime();
                __DIAG_UPDATE(mid->diag_trigger_elapsed, (tm2-tm1));
            }

364 365
            if(ret == HG_SUCCESS && actual_count > 0)
                trigger_happened = 1;
366
        } while((ret == HG_SUCCESS) && actual_count && !mid->hg_progress_shutdown_flag);
367

368 369
        if(trigger_happened)
            ABT_thread_yield();
370

371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386
        ABT_pool_get_total_size(mid->progress_pool, &size);
        /* Are there any other threads executing in this pool that are *not*
         * blocked on margo_wait_for_finalize()?  If so then, we can't
         * sleep here or else those threads will not get a chance to
         * execute.
         */
        if(size > mid->waiters_in_progress_pool)
        {
            //printf("DEBUG: Margo progress function running while other ULTs are eligible for execution (size: %d, waiters: %d.\n", size, mid->waiters_in_progress_pool);

            /* TODO: this is being executed more than is necessary (i.e.
             * in cases where there are other legitimate ULTs eligible
             * for execution that are not blocking on any events, Margo
             * or otherwise). Maybe we need an abt scheduling tweak here
             * to make sure that this ULT is the lowest priority in that
             * scenario.
387
             */
388 389 390 391 392 393 394 395 396 397
            ret = HG_Progress(mid->hg_context, 0);
            if(ret == HG_SUCCESS)
            {
                /* Mercury completed something; loop around to trigger
                 * callbacks 
                 */
            }
            else if(ret == HG_TIMEOUT)
            {
                /* No completion; yield here to allow other ULTs to run */
Philip Carns's avatar
Philip Carns committed
398
                ABT_thread_yield();
399 400 401 402 403 404
            }
            else
            {
                /* TODO: error handling */
                fprintf(stderr, "WARNING: unexpected return code (%d) from HG_Progress()\n", ret);
            }
405 406 407
        }
        else
        {
408
            hg_progress_timeout = MERCURY_PROGRESS_TIMEOUT_UB;
409 410
            ret = margo_timer_get_next_expiration(mid, &next_timer_exp);
            if(ret == 0)
411
            {
412 413 414 415
                /* there is a queued timer, don't block long enough
                 * to keep this timer waiting
                 */
                if(next_timer_exp >= 0.0)
416
                {
417 418 419 420 421 422 423
                    next_timer_exp *= 1000; /* convert to milliseconds */
                    if(next_timer_exp < MERCURY_PROGRESS_TIMEOUT_UB)
                        hg_progress_timeout = (unsigned int)next_timer_exp;
                }
                else
                {
                    hg_progress_timeout = 0;
424
                }
425
            }
426 427 428 429 430 431
            ret = HG_Progress(mid->hg_context, hg_progress_timeout);
            if(ret != HG_SUCCESS && ret != HG_TIMEOUT)
            {
                /* TODO: error handling */
                fprintf(stderr, "WARNING: unexpected return code (%d) from HG_Progress()\n", ret);
            }
432
        }
433

434
        /* check for any expired timers */
435
        margo_check_timers(mid);
436 437
    }

438
    return;
439 440
}

441
/**
 * @param mid margo instance
 * @return pointer to the instance's handler pool field (points into the
 *         instance itself, so it is only valid while the instance exists)
 */
ABT_pool* margo_get_handler_pool(margo_instance_id mid)
{
    return(&mid->handler_pool);
}

446 447 448 449 450 451 452 453 454 455 456
/**
 * @param mid margo instance
 * @return the Mercury context stored in the instance
 */
hg_context_t* margo_get_context(margo_instance_id mid)
{
    hg_context_t *context = mid->hg_context;

    return context;
}

/**
 * @param mid margo instance
 * @return the Mercury class stored in the instance
 */
hg_class_t* margo_get_class(margo_instance_id mid)
{
    hg_class_t *cls = mid->hg_class;

    return cls;
}


Jonathan Jenkins's avatar
Jonathan Jenkins committed
457
static hg_return_t margo_cb(const struct hg_cb_info *info)
458 459
{
    hg_return_t hret = info->ret;
460
    struct margo_cb_arg* arg = info->arg;
461 462

    /* propagate return code out through eventual */
463
    ABT_eventual_set(*(arg->eventual), &hret, sizeof(hret));
464
    
465
#if 0
466 467
    if(arg->in_pool)
        arg->mid->waiters_in_progress_pool--;
468
#endif
469

470 471 472
    return(HG_SUCCESS);
}

473 474 475
/* Data passed to margo_forward_timeout_cb(): the handle of the forward
 * operation to cancel when its timer fires.
 */
typedef struct
{
    hg_handle_t handle;
} margo_forward_timeout_cb_dat;
477 478 479

static void margo_forward_timeout_cb(void *arg)
{
Shane Snyder's avatar
Shane Snyder committed
480 481
    margo_forward_timeout_cb_dat *timeout_cb_dat =
        (margo_forward_timeout_cb_dat *)arg;
482 483

    /* cancel the Mercury op if the forward timed out */
484
    HG_Cancel(timeout_cb_dat->handle);
485 486 487
    return;
}

488 489 490 491 492 493
/**
 * Forward an RPC and block the calling ULT until it completes or the
 * timeout expires.
 *
 * @param mid        margo instance
 * @param handle     Mercury handle of the RPC to forward
 * @param in_struct  input argument passed through to HG_Forward()
 * @param timeout_ms timeout handed to margo_timer_init()
 * @return HG_NOMEM_ERROR if the eventual cannot be created, HG_TIMEOUT if
 *         the operation was canceled (which is what the timer callback
 *         does), otherwise the code returned by HG_Forward() or delivered
 *         to the completion callback
 */
hg_return_t margo_forward_timed(
    margo_instance_id mid,
    hg_handle_t handle,
    void *in_struct,
    double timeout_ms)
{
    int ret;
    hg_return_t hret;
    ABT_eventual eventual;
    hg_return_t* waited_hret;
    margo_timer_t forward_timer;
    margo_forward_timeout_cb_dat timeout_cb_dat;
    struct margo_cb_arg arg;

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

    /* set a timer object to expire when this forward times out */
    timeout_cb_dat.handle = handle;
    margo_timer_init(mid, &forward_timer, margo_forward_timeout_cb,
        &timeout_cb_dat, timeout_ms);

    arg.eventual = &eventual;
    arg.mid = mid;
    /* waiter accounting is compiled out below; keep the field defined */
    arg.in_pool = 0;
#if 0
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
#endif
    hret = HG_Forward(handle, margo_cb, &arg, in_struct);
    if(hret == 0)
    {
        /* blocks this ULT until margo_cb() sets the eventual */
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    /* convert HG_CANCELED to HG_TIMEOUT to indicate op timed out */
    if(hret == HG_CANCELED)
        hret = HG_TIMEOUT;

    /* remove timer if it is still in place (i.e., not timed out) */
    if(hret != HG_TIMEOUT)
        margo_timer_destroy(mid, &forward_timer);

    ABT_eventual_free(&eventual);

    return(hret);
}


545
hg_return_t margo_forward(
546
    margo_instance_id mid,
547 548 549 550 551 552 553
    hg_handle_t handle,
    void *in_struct)
{
    hg_return_t hret = HG_TIMEOUT;
    ABT_eventual eventual;
    int ret;
    hg_return_t* waited_hret;
554
    struct margo_cb_arg arg;
555 556 557 558 559 560 561

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

562 563
    arg.eventual = &eventual;
    arg.mid = mid;
564
#if 0
565 566 567 568 569 570 571
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
572
#endif
573
    hret = HG_Forward(handle, margo_cb, &arg, in_struct);
Jonathan Jenkins's avatar
Jonathan Jenkins committed
574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593
    if(hret == 0)
    {
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    ABT_eventual_free(&eventual);

    return(hret);
}

/**
 * Send an RPC response and block the calling ULT until it completes.
 *
 * @param mid        margo instance
 * @param handle     Mercury handle of the RPC being answered
 * @param out_struct output argument passed through to HG_Respond()
 * @return HG_NOMEM_ERROR if the eventual cannot be created, otherwise the
 *         code returned by HG_Respond() or delivered to the completion
 *         callback
 */
hg_return_t margo_respond(
    margo_instance_id mid,
    hg_handle_t handle,
    void *out_struct)
{
    hg_return_t hret = HG_TIMEOUT;
    ABT_eventual eventual;
    int ret;
    hg_return_t* waited_hret;
    struct margo_cb_arg arg;

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);
    }

    arg.eventual = &eventual;
    arg.mid = mid;
    /* waiter accounting is compiled out below; keep the field defined */
    arg.in_pool = 0;
#if 0
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
#endif
    hret = HG_Respond(handle, margo_cb, &arg, out_struct);
    if(hret == 0)
    {
        /* blocks this ULT until margo_cb() sets the eventual */
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    ABT_eventual_free(&eventual);

    return(hret);
}

625

626
static hg_return_t margo_bulk_transfer_cb(const struct hg_cb_info *info)
627
{
628
    hg_return_t hret = info->ret;
629
    struct margo_cb_arg* arg = info->arg;
630 631

    /* propagate return code out through eventual */
632
    ABT_eventual_set(*(arg->eventual), &hret, sizeof(hret));
633
    
634 635 636
    if(arg->in_pool)
        arg->mid->waiters_in_progress_pool--;

637 638 639
    return(HG_SUCCESS);
}

Philip Carns's avatar
Philip Carns committed
640 641
struct lookup_cb_evt
{
642 643
    hg_return_t nret;
    hg_addr_t addr;
Philip Carns's avatar
Philip Carns committed
644 645
};

646
static hg_return_t margo_addr_lookup_cb(const struct hg_cb_info *info)
Philip Carns's avatar
Philip Carns committed
647 648
{
    struct lookup_cb_evt evt;
649 650
    evt.nret = info->ret;
    evt.addr = info->info.lookup.addr;
651
    struct margo_cb_arg* arg = info->arg;
Philip Carns's avatar
Philip Carns committed
652 653

    /* propagate return code out through eventual */
654 655
    ABT_eventual_set(*(arg->eventual), &evt, sizeof(evt));

656
#if 0
657 658
    if(arg->in_pool)
        arg->mid->waiters_in_progress_pool--;
659
#endif
Philip Carns's avatar
Philip Carns committed
660
    
661
    return(HG_SUCCESS);
Philip Carns's avatar
Philip Carns committed
662 663 664
}


665
hg_return_t margo_addr_lookup(
666
    margo_instance_id mid,
Philip Carns's avatar
Philip Carns committed
667
    const char   *name,
668
    hg_addr_t    *addr)
669
{
670
    hg_return_t nret;
Philip Carns's avatar
Philip Carns committed
671
    struct lookup_cb_evt *evt;
672 673
    ABT_eventual eventual;
    int ret;
674
    struct margo_cb_arg arg;
675

Philip Carns's avatar
Philip Carns committed
676
    ret = ABT_eventual_create(sizeof(*evt), &eventual);
677 678 679 680 681
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

682 683
    arg.eventual = &eventual;
    arg.mid = mid;
684
#if 0
685 686 687 688 689 690 691
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
692
#endif
Jonathan Jenkins's avatar
Jonathan Jenkins committed
693
    nret = HG_Addr_lookup(mid->hg_context, margo_addr_lookup_cb,
694
        &arg, name, HG_OP_ID_IGNORE);
695 696
    if(nret == 0)
    {
Philip Carns's avatar
Philip Carns committed
697 698 699
        ABT_eventual_wait(eventual, (void**)&evt);
        *addr = evt->addr;
        nret = evt->nret;
700 701 702 703 704 705 706
    }

    ABT_eventual_free(&eventual);

    return(nret);
}

707
hg_return_t margo_bulk_transfer(
708
    margo_instance_id mid,
709
    hg_bulk_op_t op,
710
    hg_addr_t origin_addr,
711 712 713 714 715 716 717 718 719 720
    hg_bulk_t origin_handle,
    size_t origin_offset,
    hg_bulk_t local_handle,
    size_t local_offset,
    size_t size)
{
    hg_return_t hret = HG_TIMEOUT;
    hg_return_t *waited_hret;
    ABT_eventual eventual;
    int ret;
721
    struct margo_cb_arg arg;
722 723 724 725 726 727 728

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

729 730 731 732 733 734 735 736 737
    arg.eventual = &eventual;
    arg.mid = mid;
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
738
    hret = HG_Bulk_transfer(mid->hg_context, margo_bulk_transfer_cb,
739
        &arg, op, origin_addr, origin_handle, origin_offset, local_handle,
Jonathan Jenkins's avatar
Jonathan Jenkins committed
740
        local_offset, size, HG_OP_ID_IGNORE);
741 742 743 744 745 746 747 748 749 750 751
    if(hret == 0)
    {
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    ABT_eventual_free(&eventual);

    return(hret);
}

752 753
typedef struct
{
754
    margo_instance_id mid;
755 756
    ABT_mutex mutex;
    ABT_cond cond;
Shane Snyder's avatar
Shane Snyder committed
757 758
    char is_asleep;
    char in_pool;
759 760 761 762 763 764 765
} margo_thread_sleep_cb_dat;

static void margo_thread_sleep_cb(void *arg)
{
    margo_thread_sleep_cb_dat *sleep_cb_dat =
        (margo_thread_sleep_cb_dat *)arg;

766
    /* decrement number of waiting threads */
767
    sleep_cb_dat->mid->waiters_in_progress_pool -=
Shane Snyder's avatar
Shane Snyder committed
768
        sleep_cb_dat->in_pool;
769

770 771
    /* wake up the sleeping thread */
    ABT_mutex_lock(sleep_cb_dat->mutex);
772
    sleep_cb_dat->is_asleep = 0;
773 774 775 776 777 778 779
    ABT_cond_signal(sleep_cb_dat->cond);
    ABT_mutex_unlock(sleep_cb_dat->mutex);

    return;
}

void margo_thread_sleep(
780
    margo_instance_id mid,
781 782
    double timeout_ms)
{
783
    int in_pool = 0;
784 785 786
    margo_timer_t sleep_timer;
    margo_thread_sleep_cb_dat sleep_cb_dat;

Shane Snyder's avatar
Shane Snyder committed
787 788 789
    if(margo_xstream_is_in_progress_pool(mid))
        in_pool = 1;

790
    /* set data needed for sleep callback */
791
    sleep_cb_dat.mid = mid;
792 793
    ABT_mutex_create(&(sleep_cb_dat.mutex));
    ABT_cond_create(&(sleep_cb_dat.cond));
794
    sleep_cb_dat.is_asleep = 1;
Shane Snyder's avatar
Shane Snyder committed
795
    sleep_cb_dat.in_pool = in_pool;
796 797

    /* initialize the sleep timer */
798
    margo_timer_init(mid, &sleep_timer, margo_thread_sleep_cb,
799 800
        &sleep_cb_dat, timeout_ms);

801
    /* increment number of waiting threads */
802
    mid->waiters_in_progress_pool += in_pool;
803

804 805
    /* yield thread for specified timeout */
    ABT_mutex_lock(sleep_cb_dat.mutex);
806 807
    while(sleep_cb_dat.is_asleep)
        ABT_cond_wait(sleep_cb_dat.cond, sleep_cb_dat.mutex);
808 809
    ABT_mutex_unlock(sleep_cb_dat.mutex);

810 811 812 813
    /* clean up */
    ABT_mutex_free(&sleep_cb_dat.mutex);
    ABT_cond_free(&sleep_cb_dat.cond);

814 815 816
    return;
}

817
/**
 * Find the margo instance registered for a Mercury class.
 *
 * @param cl Mercury class to look up
 * @return the matching instance, or NULL if none is registered
 */
margo_instance_id margo_hg_class_to_instance(hg_class_t *cl)
{
    int i;

    for(i=0; i<handler_mapping_table_size; i++)
    {
        if(handler_mapping_table[i].class == cl)
            return(handler_mapping_table[i].mid);
    }
    return(NULL);
}
828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845

/* Reports whether the calling xstream's first main pool is the instance's
 * progress pool: 1 if it is, 0 otherwise.
 */
static int margo_xstream_is_in_progress_pool(margo_instance_id mid)
{
    ABT_xstream self_xstream;
    ABT_pool main_pool;
    int ret;

    ret = ABT_xstream_self(&self_xstream);
    assert(ret == ABT_SUCCESS);
    ret = ABT_xstream_get_main_pools(self_xstream, 1, &main_pool);
    assert(ret == ABT_SUCCESS);

    return (main_pool == mid->progress_pool) ? 1 : 0;
}
Philip Carns's avatar
Philip Carns committed
846

847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865
/**
 * Find the pool registered for an (RPC id, multiplex id) pair.
 *
 * @param mid      margo instance
 * @param id       RPC id
 * @param mplex_id multiplex id; 0 selects the instance's handler pool
 * @param pool     [out] receives the pool on success
 * @return 0 on success, -1 if no registration matches
 */
int margo_lookup_mplex(margo_instance_id mid, hg_id_t id, uint32_t mplex_id, ABT_pool *pool)
{
    struct mplex_key key;
    struct mplex_element *element;

    if(!mplex_id)
    {
        *pool = mid->handler_pool;
        return(0);
    }

    /* zero first so any padding bytes hash consistently */
    memset(&key, 0, sizeof(key));
    key.id = id;
    key.mplex_id = mplex_id;

    HASH_FIND(hh, mid->mplex_table, &key, sizeof(key), element);
    if(!element)
        return(-1);

    assert(element->key.id == id && element->key.mplex_id == mplex_id);

    *pool = element->pool;

    return(0);
}

Philip Carns's avatar
Philip Carns committed
873 874
/**
 * Register a pool for an (RPC id, multiplex id) pair.
 *
 * @param mid      margo instance
 * @param id       RPC id
 * @param mplex_id multiplex id; MARGO_DEFAULT_MPLEX_ID is a no-op
 * @param pool     pool to associate with the pair
 * @return 0 on success (including when the pair is already registered, in
 *         which case the existing entry is left unchanged), -1 if
 *         allocation fails
 */
int margo_register_mplex(margo_instance_id mid, hg_id_t id, uint32_t mplex_id, ABT_pool pool)
{
    struct mplex_key key;
    struct mplex_element *element;

    /* nothing to do, we'll let the handler pool take this directly */
    if(mplex_id == MARGO_DEFAULT_MPLEX_ID)
        return(0);

    /* zero first so any padding bytes hash consistently */
    memset(&key, 0, sizeof(key));
    key.id = id;
    key.mplex_id = mplex_id;

    HASH_FIND(hh, mid->mplex_table, &key, sizeof(key), element);
    if(element)
        return(0);

    element = malloc(sizeof(*element));
    if(!element)
        return(-1);
    element->key = key;
    element->pool = pool;

    HASH_ADD(hh, mid->mplex_table, key, sizeof(key), element);

    return(0);
}
Philip Carns's avatar
Philip Carns committed
900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949


/**
 * Turn on diagnostics collection for an instance by setting its
 * diag_enabled flag.
 *
 * @param mid margo instance
 */
void margo_diag_start(margo_instance_id mid)
{
    mid->diag_enabled = 1;
    return;
}

/* Write one tab-separated line for a statistic: name, average, min, max,
 * count.  The average is reported as 0 when no samples were recorded, to
 * avoid dividing by a zero count.
 */
static void print_diag_data(FILE *file, const char* name, struct diag_data *data)
{
    double avg = 0.0;

    if(data->count > 0)
        avg = data->cumulative/data->count;

    fprintf(file, "%s\t%.9f\t%.9f\t%.9f\t%d\n", name, avg, data->min, data->max, data->count);
    return;
}

/**
 * Append the instance's diagnostics to a file, or print them to stdout.
 * Asserts that diagnostics were enabled on the instance.
 *
 * @param mid  margo instance
 * @param file output path opened in append mode, or "-" for stdout
 */
void margo_diag_dump(margo_instance_id mid, const char* file)
{
    FILE *outfile = stdout;
    time_t ltime;

    assert(mid->diag_enabled);

    /* anything other than "-" names a file to append to */
    if(strcmp("-", file) != 0)
    {
        outfile = fopen(file, "a");
        if(!outfile)
        {
            perror("fopen");
            return;
        }
    }

    /* TODO: retrieve self addr and include in output */
    /* TODO: support pattern substitution in file name to create unique
     * output files per process
     */

    time(&ltime);
    fprintf(outfile, "# Margo diagnostics\n");
    fprintf(outfile, "# %s\n", ctime(&ltime));
    fprintf(outfile, "# <stat>\t<avg>\t<min>\t<max>\t<count>\n");
    print_diag_data(outfile, "trigger_elapsed", &mid->diag_trigger_elapsed);

    /* never close stdout */
    if(outfile != stdout)
        fclose(outfile);
    
    return;
}