margo.c 24.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11

/*
 * (C) 2015 The University of Chicago
 * 
 * See COPYRIGHT in top-level directory.
 */

#include <assert.h>
#include <errno.h>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <unistd.h>

#include <abt.h>
#include <abt-snoozer.h>

#include "margo.h"
#include "margo-timer.h"
#include "utlist.h"
#include "uthash.h"
20

21 22
/* Upper bound on the timeout handed to HG_Progress() by the progress loop
 * when it is allowed to block.
 */
#define MERCURY_PROGRESS_TIMEOUT_UB 100 /* 100 milliseconds */

23 24 25 26 27 28 29 30 31 32 33 34 35
/* Key for the multiplexed-RPC hash table: an RPC id paired with a multiplex
 * id.  The table hashes the key as sizeof(key) raw bytes, which is why users
 * of this struct memset() it to zero before filling in the fields.
 */
struct mplex_key
{
    hg_id_t id;
    uint32_t mplex_id;
};

/* One entry of the per-instance multiplex hash table. */
struct mplex_element
{
    struct mplex_key key; /* lookup key (hashed as raw bytes) */
    ABT_pool pool;        /* pool recorded by margo_register_mplex() */
    UT_hash_handle hh;    /* uthash bookkeeping handle */
};

Philip Carns's avatar
Philip Carns committed
36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51
/* Running statistics for one diagnostic measurement; updated through
 * __DIAG_UPDATE() and printed by print_diag_data().
 */
struct diag_data
{
    double min;        /* smallest sample recorded */
    double max;        /* largest sample recorded */
    double cumulative; /* sum of all samples (avg = cumulative / count) */
    int count;         /* number of samples recorded */
};

/* Fold one sample (__time) into a struct diag_data lvalue (__data).
 *
 * The sample expression is evaluated exactly once.  The first sample
 * recorded (count == 0) seeds both min and max; without that, a
 * zero-initialized struct would report min == 0 forever for positive samples.
 */
#define __DIAG_UPDATE(__data, __time)\
do {\
    double __diag_sample = (__time); \
    if((__data).count == 0 || __diag_sample > (__data).max) \
        (__data).max = __diag_sample; \
    if((__data).count == 0 || __diag_sample < (__data).min) \
        (__data).min = __diag_sample; \
    (__data).count++; \
    (__data).cumulative += __diag_sample; \
} while(0)

52 53
struct margo_instance
{
54
    /* provided by caller */
55 56
    hg_context_t *hg_context;
    hg_class_t *hg_class;
57 58 59
    ABT_pool handler_pool;
    ABT_pool progress_pool;

60
    /* internal to margo for this particular instance */
61 62
    ABT_thread hg_progress_tid;
    int hg_progress_shutdown_flag;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
63
    ABT_xstream progress_xstream;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
64 65 66
    int owns_progress_pool;
    ABT_xstream *rpc_xstreams;
    int num_handler_pool_threads;
67 68 69

    /* control logic for callers waiting on margo to be finalized */
    int finalize_flag;
70
    int waiters_in_progress_pool;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
71
    int refcount;
72 73 74
    ABT_mutex finalize_mutex;
    ABT_cond finalize_cond;

75
    int table_index;
76 77 78

    /* hash table to track multiplexed rpcs registered with margo */
    struct mplex_element *mplex_table;
Philip Carns's avatar
Philip Carns committed
79 80 81 82 83 84 85 86 87 88 89 90

    /* optional diagnostics data tracking */
    /* NOTE: technically the following fields are subject to races if they
     * are updated from more than one thread at a time.  We will be careful
     * to only update the counters from the progress_fn,
     * which will serialize access.
     */
    int diag_enabled;
    struct diag_data diag_trigger_elapsed;
    struct diag_data diag_progress_elapsed_zero_timeout;
    struct diag_data diag_progress_elapsed_nonzero_timeout;
    struct diag_data diag_progress_timeout_value;
91 92 93 94 95 96 97 98
};

/* Associates a Mercury class with the margo instance created for it; see
 * margo_hg_class_to_instance().
 */
struct margo_handler_mapping
{
    hg_class_t *class;
    margo_instance_id mid;
};

99 100 101 102 103 104 105
/* Argument block handed to Mercury completion callbacks.  Callers in this
 * file allocate it on their own stack and block on the eventual until the
 * callback fires.
 */
struct margo_cb_arg
{
    ABT_eventual *eventual; /* eventual the callback sets to wake the caller */
    margo_instance_id mid;
    char in_pool;           /* nonzero if the caller was counted in
                             * mid->waiters_in_progress_pool
                             */
};

106 107 108
#define MAX_HANDLER_MAPPING 8
static int handler_mapping_table_size = 0;
static struct margo_handler_mapping handler_mapping_table[MAX_HANDLER_MAPPING] = {0};
109

110
static void hg_progress_fn(void* foo);
111
static int margo_xstream_is_in_progress_pool(margo_instance_id mid);
112 113 114 115 116 117 118 119

/* Singly linked list node pairing a function pointer with a Mercury handle.
 * NOTE(review): not referenced anywhere in the visible portion of this file;
 * confirm whether it is still needed.
 */
struct handler_entry
{
    void* fn;
    hg_handle_t handle;
    struct handler_entry *next; 
};

Jonathan Jenkins's avatar
Jonathan Jenkins committed
120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167
/**
 * Creates a margo instance, setting up the Argobots execution streams and
 * pools it needs before delegating to margo_init_pool().
 *
 * @param use_progress_thread nonzero: create a dedicated snoozer execution
 *        stream for the Mercury progress loop; zero: run the progress loop
 *        in the first main pool of the calling execution stream
 * @param rpc_thread_count >0: create that many snoozer execution streams
 *        sharing one handler pool; 0: use the caller's first main pool for
 *        handlers; <0: run handlers in the progress pool
 * @param hg_context Mercury context to drive
 * @returns the new instance, or MARGO_INSTANCE_NULL on failure
 */
margo_instance_id margo_init(int use_progress_thread, int rpc_thread_count,
    hg_context_t *hg_context)
{
    struct margo_instance *mid = MARGO_INSTANCE_NULL;
    ABT_xstream progress_xstream = ABT_XSTREAM_NULL;
    ABT_pool progress_pool = ABT_POOL_NULL;
    ABT_xstream *rpc_xstreams = NULL;
    ABT_xstream rpc_xstream = ABT_XSTREAM_NULL;
    ABT_pool rpc_pool = ABT_POOL_NULL;
    int ret;
    int i;

    if (use_progress_thread)
    {
        ret = ABT_snoozer_xstream_create(1, &progress_pool, &progress_xstream);
        if (ret != ABT_SUCCESS) goto err;
    }
    else
    {
        ret = ABT_xstream_self(&progress_xstream);
        if (ret != ABT_SUCCESS) goto err;
        ret = ABT_xstream_get_main_pools(progress_xstream, 1, &progress_pool);
        if (ret != ABT_SUCCESS) goto err;
    }

    if (rpc_thread_count > 0)
    {
        rpc_xstreams = malloc(rpc_thread_count * sizeof(*rpc_xstreams));
        if (rpc_xstreams == NULL) goto err;
        /* mark every slot as "not created" so that the error path never
         * joins or frees an uninitialized handle
         */
        for (i = 0; i < rpc_thread_count; i++)
            rpc_xstreams[i] = ABT_XSTREAM_NULL;
        ret = ABT_snoozer_xstream_create(rpc_thread_count, &rpc_pool,
                rpc_xstreams);
        if (ret != ABT_SUCCESS) goto err;
    }
    else if (rpc_thread_count == 0)
    {
        ret = ABT_xstream_self(&rpc_xstream);
        if (ret != ABT_SUCCESS) goto err;
        ret = ABT_xstream_get_main_pools(rpc_xstream, 1, &rpc_pool);
        if (ret != ABT_SUCCESS) goto err;
    }
    else
    {
        /* negative count: handlers share the progress pool */
        rpc_pool = progress_pool;
    }

    mid = margo_init_pool(progress_pool, rpc_pool, hg_context);
    if (mid == MARGO_INSTANCE_NULL) goto err;

    /* record what this function created so margo_cleanup() can undo it */
    mid->owns_progress_pool = use_progress_thread;
    mid->progress_xstream = progress_xstream;
    mid->num_handler_pool_threads = rpc_thread_count < 0 ? 0 : rpc_thread_count;
    mid->rpc_xstreams = rpc_xstreams;
    return mid;

err:
    /* only tear down execution streams that this function created */
    if (use_progress_thread && progress_xstream != ABT_XSTREAM_NULL)
    {
        ABT_xstream_join(progress_xstream);
        ABT_xstream_free(&progress_xstream);
    }
    if (rpc_thread_count > 0 && rpc_xstreams != NULL)
    {
        for (i = 0; i < rpc_thread_count; i++)
        {
            if (rpc_xstreams[i] == ABT_XSTREAM_NULL)
                continue;
            ABT_xstream_join(rpc_xstreams[i]);
            ABT_xstream_free(&rpc_xstreams[i]);
        }
        free(rpc_xstreams);
    }
    return MARGO_INSTANCE_NULL;
}

margo_instance_id margo_init_pool(ABT_pool progress_pool, ABT_pool handler_pool,
Jonathan Jenkins's avatar
Jonathan Jenkins committed
193
    hg_context_t *hg_context)
194 195
{
    int ret;
196 197 198
    struct margo_instance *mid;

    if(handler_mapping_table_size >= MAX_HANDLER_MAPPING)
199
        return(MARGO_INSTANCE_NULL);
200 201 202

    mid = malloc(sizeof(*mid));
    if(!mid)
203
        return(MARGO_INSTANCE_NULL);
204
    memset(mid, 0, sizeof(*mid));
205

206 207 208
    ABT_mutex_create(&mid->finalize_mutex);
    ABT_cond_create(&mid->finalize_cond);

209 210
    mid->progress_pool = progress_pool;
    mid->handler_pool = handler_pool;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
211
    mid->hg_class = HG_Context_get_class(hg_context);
212
    mid->hg_context = hg_context;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
213
    mid->refcount = 1;
214

215 216 217 218 219 220 221 222
    ret = margo_timer_instance_init(mid);
    if(ret != 0)
    {
        fprintf(stderr, "Error: margo_timer_instance_init()\n");
        free(mid);
        return(MARGO_INSTANCE_NULL);
    }

223
    ret = ABT_thread_create(mid->progress_pool, hg_progress_fn, mid, 
224
        ABT_THREAD_ATTR_NULL, &mid->hg_progress_tid);
225 226 227
    if(ret != 0)
    {
        fprintf(stderr, "Error: ABT_thread_create()\n");
228
        free(mid);
229
        return(MARGO_INSTANCE_NULL);
230 231
    }

232 233 234 235 236 237
    handler_mapping_table[handler_mapping_table_size].mid = mid;
    handler_mapping_table[handler_mapping_table_size].class = mid->hg_class;
    mid->table_index = handler_mapping_table_size;
    handler_mapping_table_size++;

    return mid;
238 239
}

Jonathan Jenkins's avatar
Jonathan Jenkins committed
240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267
/* Releases every resource owned by a margo instance and frees the instance
 * itself.  Called by whichever of margo_finalize() or
 * margo_wait_for_finalize() drops the reference count to zero.
 */
static void margo_cleanup(margo_instance_id mid)
{
    int i;
    struct mplex_element *element;
    struct mplex_element *tmp;

    margo_timer_instance_finalize(mid);

    ABT_mutex_free(&mid->finalize_mutex);
    ABT_cond_free(&mid->finalize_cond);

    /* entries are malloc'd by margo_register_mplex(); release them here so
     * the table does not leak with the instance
     */
    HASH_ITER(hh, mid->mplex_table, element, tmp)
    {
        HASH_DEL(mid->mplex_table, element);
        free(element);
    }

    /* only tear down execution streams that margo_init() created */
    if (mid->owns_progress_pool)
    {
        ABT_xstream_join(mid->progress_xstream);
        ABT_xstream_free(&mid->progress_xstream);
    }

    if (mid->num_handler_pool_threads > 0)
    {
        for (i = 0; i < mid->num_handler_pool_threads; i++)
        {
            ABT_xstream_join(mid->rpc_xstreams[i]);
            ABT_xstream_free(&mid->rpc_xstreams[i]);
        }
        free(mid->rpc_xstreams);
    }

    free(mid);
}

268
/**
 * Shuts down a margo instance: stops the progress ULT, removes the instance
 * from the class-to-instance table, and wakes everyone blocked in
 * margo_wait_for_finalize().
 *
 * @param mid instance to finalize.  It must not be used afterwards; it is
 *        freed either here or by the last waiter to wake up.
 */
void margo_finalize(margo_instance_id mid)
{
    int i;
    int do_cleanup;

    /* tell progress thread to wrap things up */
    mid->hg_progress_shutdown_flag = 1;

    /* wait for it to shutdown cleanly */
    ABT_thread_join(mid->hg_progress_tid);
    ABT_thread_free(&mid->hg_progress_tid);

    /* close the gap left by this instance in the mapping table, keeping
     * each shifted instance's table_index in sync with its new slot
     */
    for(i=mid->table_index; i<(handler_mapping_table_size-1); i++)
    {
        handler_mapping_table[i] = handler_mapping_table[i+1];
        handler_mapping_table[i].mid->table_index = i;
    }
    handler_mapping_table_size--;

    ABT_mutex_lock(mid->finalize_mutex);
    mid->finalize_flag = 1;
    ABT_cond_broadcast(mid->finalize_cond);

    /* drop the reference taken by margo_init_pool() */
    mid->refcount--;
    do_cleanup = mid->refcount == 0;

    ABT_mutex_unlock(mid->finalize_mutex);

    /* if there was noone waiting on the finalize at the time of the finalize
     * broadcast, then we're safe to clean up. Otherwise, let the finalizer do
     * it */
    if (do_cleanup)
        margo_cleanup(mid);

    return;
}

/**
 * Blocks the calling ULT until margo_finalize() has been called on mid.
 *
 * The waiter holds a reference on the instance while it is blocked; the last
 * reference holder to leave (this function or margo_finalize()) frees the
 * instance.
 *
 * @param mid instance to wait on; must not be used after this returns
 */
void margo_wait_for_finalize(margo_instance_id mid)
{
    int in_pool = 0;
    int do_cleanup;

    /* Is this waiter in the same pool as the pool running the progress
     * thread?
     */
    if(margo_xstream_is_in_progress_pool(mid))
        in_pool = 1;

    ABT_mutex_lock(mid->finalize_mutex);

        /* let the progress loop know this ULT is only waiting on margo */
        mid->waiters_in_progress_pool += in_pool;
        mid->refcount++;
            
        while(!mid->finalize_flag)
            ABT_cond_wait(mid->finalize_cond, mid->finalize_mutex);

        mid->refcount--;
        do_cleanup = mid->refcount == 0;

    ABT_mutex_unlock(mid->finalize_mutex);

    if (do_cleanup)
        margo_cleanup(mid);

    return;
}

/* dedicated thread function to drive Mercury progress */
335
static void hg_progress_fn(void* foo)
336 337 338
{
    int ret;
    unsigned int actual_count;
339
    struct margo_instance *mid = (struct margo_instance *)foo;
340
    size_t size;
341 342
    unsigned int hg_progress_timeout = MERCURY_PROGRESS_TIMEOUT_UB;
    double next_timer_exp;
343
    int trigger_happened;
Philip Carns's avatar
Philip Carns committed
344 345
    double tm1, tm2;
    int diag_enabled = 0;
346

347
    while(!mid->hg_progress_shutdown_flag)
348
    {
349
        trigger_happened = 0;
350
        do {
Philip Carns's avatar
Philip Carns committed
351 352 353 354 355 356
            /* save value of instance diag variable, in case it is modified
             * while we are in loop 
             */
            diag_enabled = mid->diag_enabled;

            if(diag_enabled) tm1 = ABT_get_wtime();
357
            ret = HG_Trigger(mid->hg_context, 0, 1, &actual_count);
Philip Carns's avatar
Philip Carns committed
358 359 360 361 362 363
            if(diag_enabled)
            {
                tm2 = ABT_get_wtime();
                __DIAG_UPDATE(mid->diag_trigger_elapsed, (tm2-tm1));
            }

364 365
            if(ret == HG_SUCCESS && actual_count > 0)
                trigger_happened = 1;
366
        } while((ret == HG_SUCCESS) && actual_count && !mid->hg_progress_shutdown_flag);
367

368 369
        if(trigger_happened)
            ABT_thread_yield();
370

371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386
        ABT_pool_get_total_size(mid->progress_pool, &size);
        /* Are there any other threads executing in this pool that are *not*
         * blocked on margo_wait_for_finalize()?  If so then, we can't
         * sleep here or else those threads will not get a chance to
         * execute.
         */
        if(size > mid->waiters_in_progress_pool)
        {
            //printf("DEBUG: Margo progress function running while other ULTs are eligible for execution (size: %d, waiters: %d.\n", size, mid->waiters_in_progress_pool);

            /* TODO: this is being executed more than is necessary (i.e.
             * in cases where there are other legitimate ULTs eligible
             * for execution that are not blocking on any events, Margo
             * or otherwise). Maybe we need an abt scheduling tweak here
             * to make sure that this ULT is the lowest priority in that
             * scenario.
387
             */
388
            if(diag_enabled) tm1 = ABT_get_wtime();
389
            ret = HG_Progress(mid->hg_context, 0);
390 391 392 393 394 395
            if(diag_enabled)
            {
                tm2 = ABT_get_wtime();
                __DIAG_UPDATE(mid->diag_progress_elapsed_zero_timeout, (tm2-tm1));
                __DIAG_UPDATE(mid->diag_progress_timeout_value, 0);
            }
396 397 398 399 400 401 402 403 404
            if(ret == HG_SUCCESS)
            {
                /* Mercury completed something; loop around to trigger
                 * callbacks 
                 */
            }
            else if(ret == HG_TIMEOUT)
            {
                /* No completion; yield here to allow other ULTs to run */
Philip Carns's avatar
Philip Carns committed
405
                ABT_thread_yield();
406 407 408 409 410 411
            }
            else
            {
                /* TODO: error handling */
                fprintf(stderr, "WARNING: unexpected return code (%d) from HG_Progress()\n", ret);
            }
412 413 414
        }
        else
        {
415
            hg_progress_timeout = MERCURY_PROGRESS_TIMEOUT_UB;
416 417
            ret = margo_timer_get_next_expiration(mid, &next_timer_exp);
            if(ret == 0)
418
            {
419 420 421 422
                /* there is a queued timer, don't block long enough
                 * to keep this timer waiting
                 */
                if(next_timer_exp >= 0.0)
423
                {
424 425 426 427 428 429 430
                    next_timer_exp *= 1000; /* convert to milliseconds */
                    if(next_timer_exp < MERCURY_PROGRESS_TIMEOUT_UB)
                        hg_progress_timeout = (unsigned int)next_timer_exp;
                }
                else
                {
                    hg_progress_timeout = 0;
431
                }
432
            }
433
            if(diag_enabled) tm1 = ABT_get_wtime();
434
            ret = HG_Progress(mid->hg_context, hg_progress_timeout);
435 436 437 438 439 440 441 442 443 444
            if(diag_enabled)
            {
                tm2 = ABT_get_wtime();
                if(hg_progress_timeout == 0)
                    __DIAG_UPDATE(mid->diag_progress_elapsed_zero_timeout, (tm2-tm1));
                else
                    __DIAG_UPDATE(mid->diag_progress_elapsed_nonzero_timeout, (tm2-tm1));
                    
                __DIAG_UPDATE(mid->diag_progress_timeout_value, hg_progress_timeout);
            }
445 446 447 448 449
            if(ret != HG_SUCCESS && ret != HG_TIMEOUT)
            {
                /* TODO: error handling */
                fprintf(stderr, "WARNING: unexpected return code (%d) from HG_Progress()\n", ret);
            }
450
        }
451

452
        /* check for any expired timers */
453
        margo_check_timers(mid);
454 455
    }

456
    return;
457 458
}

459
/**
 * @param mid margo instance
 * @returns pointer to the instance's handler pool field (the address of the
 *          field inside the instance, not a copy)
 */
ABT_pool* margo_get_handler_pool(margo_instance_id mid)
{
    return(&mid->handler_pool);
}

464 465 466 467 468 469 470 471 472 473 474
/**
 * @param mid margo instance
 * @returns the Mercury context the instance was created with
 */
hg_context_t* margo_get_context(margo_instance_id mid)
{
    hg_context_t *context = mid->hg_context;

    return context;
}

/**
 * @param mid margo instance
 * @returns the Mercury class recorded for the instance at init time
 */
hg_class_t* margo_get_class(margo_instance_id mid)
{
    hg_class_t *cl = mid->hg_class;

    return cl;
}


Jonathan Jenkins's avatar
Jonathan Jenkins committed
475
static hg_return_t margo_cb(const struct hg_cb_info *info)
476 477
{
    hg_return_t hret = info->ret;
478
    struct margo_cb_arg* arg = info->arg;
479 480

    /* propagate return code out through eventual */
481
    ABT_eventual_set(*(arg->eventual), &hret, sizeof(hret));
482
    
483
#if 0
484 485
    if(arg->in_pool)
        arg->mid->waiters_in_progress_pool--;
486
#endif
487

488 489 490
    return(HG_SUCCESS);
}

491 492 493
/* Argument for margo_forward_timeout_cb(): the handle whose in-flight
 * operation should be cancelled when the timer fires.
 */
typedef struct
{
    hg_handle_t handle;
} margo_forward_timeout_cb_dat;
495 496 497

static void margo_forward_timeout_cb(void *arg)
{
Shane Snyder's avatar
Shane Snyder committed
498 499
    margo_forward_timeout_cb_dat *timeout_cb_dat =
        (margo_forward_timeout_cb_dat *)arg;
500 501

    /* cancel the Mercury op if the forward timed out */
502
    HG_Cancel(timeout_cb_dat->handle);
503 504 505
    return;
}

506 507 508 509 510 511
/**
 * Forwards an RPC and blocks the calling ULT until it completes or the
 * timeout fires, whichever comes first.
 *
 * @param mid margo instance
 * @param handle Mercury handle identifying the RPC
 * @param in_struct input argument structure passed to HG_Forward()
 * @param timeout_ms timeout handed to the margo timer
 * @returns HG_NOMEM_ERROR if the eventual cannot be created, HG_TIMEOUT if
 *          the operation was cancelled (which is how the timeout is
 *          delivered), otherwise the code from HG_Forward() or from the
 *          completion callback
 */
hg_return_t margo_forward_timed(
    margo_instance_id mid,
    hg_handle_t handle,
    void *in_struct,
    double timeout_ms)
{
    int ret;
    hg_return_t hret;
    ABT_eventual eventual;
    hg_return_t* waited_hret;
    margo_timer_t forward_timer;
    margo_forward_timeout_cb_dat timeout_cb_dat;
    struct margo_cb_arg arg;

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

    /* set a timer object to expire when this forward times out */
    timeout_cb_dat.handle = handle;
    margo_timer_init(mid, &forward_timer, margo_forward_timeout_cb,
        &timeout_cb_dat, timeout_ms);

    arg.eventual = &eventual;
    arg.mid = mid;
    /* waiter accounting is disabled below; keep the field well-defined */
    arg.in_pool = 0;
#if 0
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
#endif
    hret = HG_Forward(handle, margo_cb, &arg, in_struct);
    if(hret == 0)
    {
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    /* convert HG_CANCELED to HG_TIMEOUT to indicate op timed out */
    if(hret == HG_CANCELED)
        hret = HG_TIMEOUT;

    /* remove timer if it is still in place (i.e., not timed out) */
    if(hret != HG_TIMEOUT)
        margo_timer_destroy(mid, &forward_timer);

    ABT_eventual_free(&eventual);

    return(hret);
}


563
hg_return_t margo_forward(
564
    margo_instance_id mid,
565 566 567 568 569 570 571
    hg_handle_t handle,
    void *in_struct)
{
    hg_return_t hret = HG_TIMEOUT;
    ABT_eventual eventual;
    int ret;
    hg_return_t* waited_hret;
572
    struct margo_cb_arg arg;
573 574 575 576 577 578 579

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

580 581
    arg.eventual = &eventual;
    arg.mid = mid;
582
#if 0
583 584 585 586 587 588 589
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
590
#endif
591
    hret = HG_Forward(handle, margo_cb, &arg, in_struct);
Jonathan Jenkins's avatar
Jonathan Jenkins committed
592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611
    if(hret == 0)
    {
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    ABT_eventual_free(&eventual);

    return(hret);
}

/**
 * Sends an RPC response and blocks the calling ULT until the send completes.
 *
 * @param mid margo instance
 * @param handle Mercury handle identifying the RPC being answered
 * @param out_struct output argument structure passed to HG_Respond()
 * @returns HG_NOMEM_ERROR if the eventual cannot be created, otherwise the
 *          code from HG_Respond() or from the completion callback
 */
hg_return_t margo_respond(
    margo_instance_id mid,
    hg_handle_t handle,
    void *out_struct)
{
    hg_return_t hret = HG_TIMEOUT;
    ABT_eventual eventual;
    int ret;
    hg_return_t* waited_hret;
    struct margo_cb_arg arg;

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);
    }

    arg.eventual = &eventual;
    arg.mid = mid;
    /* waiter accounting is disabled below; keep the field well-defined */
    arg.in_pool = 0;
#if 0
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
#endif
    hret = HG_Respond(handle, margo_cb, &arg, out_struct);
    if(hret == 0)
    {
        /* block until margo_cb() delivers the completion code */
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    ABT_eventual_free(&eventual);

    return(hret);
}

643

644
static hg_return_t margo_bulk_transfer_cb(const struct hg_cb_info *info)
645
{
646
    hg_return_t hret = info->ret;
647
    struct margo_cb_arg* arg = info->arg;
648 649

    /* propagate return code out through eventual */
650
    ABT_eventual_set(*(arg->eventual), &hret, sizeof(hret));
651
    
652 653 654
    if(arg->in_pool)
        arg->mid->waiters_in_progress_pool--;

655 656 657
    return(HG_SUCCESS);
}

Philip Carns's avatar
Philip Carns committed
658 659
struct lookup_cb_evt
{
660 661
    hg_return_t nret;
    hg_addr_t addr;
Philip Carns's avatar
Philip Carns committed
662 663
};

664
static hg_return_t margo_addr_lookup_cb(const struct hg_cb_info *info)
Philip Carns's avatar
Philip Carns committed
665 666
{
    struct lookup_cb_evt evt;
667 668
    evt.nret = info->ret;
    evt.addr = info->info.lookup.addr;
669
    struct margo_cb_arg* arg = info->arg;
Philip Carns's avatar
Philip Carns committed
670 671

    /* propagate return code out through eventual */
672 673
    ABT_eventual_set(*(arg->eventual), &evt, sizeof(evt));

674
#if 0
675 676
    if(arg->in_pool)
        arg->mid->waiters_in_progress_pool--;
677
#endif
Philip Carns's avatar
Philip Carns committed
678
    
679
    return(HG_SUCCESS);
Philip Carns's avatar
Philip Carns committed
680 681 682
}


683
hg_return_t margo_addr_lookup(
684
    margo_instance_id mid,
Philip Carns's avatar
Philip Carns committed
685
    const char   *name,
686
    hg_addr_t    *addr)
687
{
688
    hg_return_t nret;
Philip Carns's avatar
Philip Carns committed
689
    struct lookup_cb_evt *evt;
690 691
    ABT_eventual eventual;
    int ret;
692
    struct margo_cb_arg arg;
693

Philip Carns's avatar
Philip Carns committed
694
    ret = ABT_eventual_create(sizeof(*evt), &eventual);
695 696 697 698 699
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

700 701
    arg.eventual = &eventual;
    arg.mid = mid;
702
#if 0
703 704 705 706 707 708 709
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
710
#endif
Jonathan Jenkins's avatar
Jonathan Jenkins committed
711
    nret = HG_Addr_lookup(mid->hg_context, margo_addr_lookup_cb,
712
        &arg, name, HG_OP_ID_IGNORE);
713 714
    if(nret == 0)
    {
Philip Carns's avatar
Philip Carns committed
715 716 717
        ABT_eventual_wait(eventual, (void**)&evt);
        *addr = evt->addr;
        nret = evt->nret;
718 719 720 721 722 723 724
    }

    ABT_eventual_free(&eventual);

    return(nret);
}

725
hg_return_t margo_bulk_transfer(
726
    margo_instance_id mid,
727
    hg_bulk_op_t op,
728
    hg_addr_t origin_addr,
729 730 731 732 733 734 735 736 737 738
    hg_bulk_t origin_handle,
    size_t origin_offset,
    hg_bulk_t local_handle,
    size_t local_offset,
    size_t size)
{
    hg_return_t hret = HG_TIMEOUT;
    hg_return_t *waited_hret;
    ABT_eventual eventual;
    int ret;
739
    struct margo_cb_arg arg;
740 741 742 743 744 745 746

    ret = ABT_eventual_create(sizeof(hret), &eventual);
    if(ret != 0)
    {
        return(HG_NOMEM_ERROR);        
    }

747 748 749 750 751 752 753 754 755
    arg.eventual = &eventual;
    arg.mid = mid;
    if(margo_xstream_is_in_progress_pool(mid))
    {
        arg.in_pool = 1;
        mid->waiters_in_progress_pool++;
    }
    else
        arg.in_pool = 0;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
756
    hret = HG_Bulk_transfer(mid->hg_context, margo_bulk_transfer_cb,
757
        &arg, op, origin_addr, origin_handle, origin_offset, local_handle,
Jonathan Jenkins's avatar
Jonathan Jenkins committed
758
        local_offset, size, HG_OP_ID_IGNORE);
759 760 761 762 763 764 765 766 767 768 769
    if(hret == 0)
    {
        ABT_eventual_wait(eventual, (void**)&waited_hret);
        hret = *waited_hret;
    }

    ABT_eventual_free(&eventual);

    return(hret);
}

770 771
typedef struct
{
772
    margo_instance_id mid;
773 774
    ABT_mutex mutex;
    ABT_cond cond;
Shane Snyder's avatar
Shane Snyder committed
775 776
    char is_asleep;
    char in_pool;
777 778 779 780 781 782 783
} margo_thread_sleep_cb_dat;

static void margo_thread_sleep_cb(void *arg)
{
    margo_thread_sleep_cb_dat *sleep_cb_dat =
        (margo_thread_sleep_cb_dat *)arg;

784
    /* decrement number of waiting threads */
785
    sleep_cb_dat->mid->waiters_in_progress_pool -=
Shane Snyder's avatar
Shane Snyder committed
786
        sleep_cb_dat->in_pool;
787

788 789
    /* wake up the sleeping thread */
    ABT_mutex_lock(sleep_cb_dat->mutex);
790
    sleep_cb_dat->is_asleep = 0;
791 792 793 794 795 796 797
    ABT_cond_signal(sleep_cb_dat->cond);
    ABT_mutex_unlock(sleep_cb_dat->mutex);

    return;
}

void margo_thread_sleep(
798
    margo_instance_id mid,
799 800
    double timeout_ms)
{
801
    int in_pool = 0;
802 803 804
    margo_timer_t sleep_timer;
    margo_thread_sleep_cb_dat sleep_cb_dat;

Shane Snyder's avatar
Shane Snyder committed
805 806 807
    if(margo_xstream_is_in_progress_pool(mid))
        in_pool = 1;

808
    /* set data needed for sleep callback */
809
    sleep_cb_dat.mid = mid;
810 811
    ABT_mutex_create(&(sleep_cb_dat.mutex));
    ABT_cond_create(&(sleep_cb_dat.cond));
812
    sleep_cb_dat.is_asleep = 1;
Shane Snyder's avatar
Shane Snyder committed
813
    sleep_cb_dat.in_pool = in_pool;
814 815

    /* initialize the sleep timer */
816
    margo_timer_init(mid, &sleep_timer, margo_thread_sleep_cb,
817 818
        &sleep_cb_dat, timeout_ms);

819
    /* increment number of waiting threads */
820
    mid->waiters_in_progress_pool += in_pool;
821

822 823
    /* yield thread for specified timeout */
    ABT_mutex_lock(sleep_cb_dat.mutex);
824 825
    while(sleep_cb_dat.is_asleep)
        ABT_cond_wait(sleep_cb_dat.cond, sleep_cb_dat.mutex);
826 827
    ABT_mutex_unlock(sleep_cb_dat.mutex);

828 829 830 831
    /* clean up */
    ABT_mutex_free(&sleep_cb_dat.mutex);
    ABT_cond_free(&sleep_cb_dat.cond);

832 833 834
    return;
}

835
/**
 * Finds the margo instance registered for a Mercury class.
 *
 * @param cl Mercury class to look up
 * @returns the matching instance, or NULL if no live instance uses cl
 */
margo_instance_id margo_hg_class_to_instance(hg_class_t *cl)
{
    int i;

    /* linear scan; the table holds at most MAX_HANDLER_MAPPING entries */
    for(i=0; i<handler_mapping_table_size; i++)
    {
        if(handler_mapping_table[i].class == cl)
            return(handler_mapping_table[i].mid);
    }
    return(NULL);
}
846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863

/* Reports whether the calling execution stream's first main pool is the
 * progress pool of mid: 1 if it is, 0 if it is not.
 */
static int margo_xstream_is_in_progress_pool(margo_instance_id mid)
{
    ABT_xstream self_xstream;
    ABT_pool main_pool;
    int rc;

    rc = ABT_xstream_self(&self_xstream);
    assert(rc == ABT_SUCCESS);

    rc = ABT_xstream_get_main_pools(self_xstream, 1, &main_pool);
    assert(rc == ABT_SUCCESS);

    return (main_pool == mid->progress_pool) ? 1 : 0;
}
Philip Carns's avatar
Philip Carns committed
864

865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883
/**
 * Looks up the pool registered for an (RPC id, multiplex id) pair.
 *
 * @param mid margo instance
 * @param id RPC id
 * @param mplex_id multiplex id; 0 selects the instance's handler pool
 *        without consulting the table
 * @param pool [out] pool to use; written only on success
 * @returns 0 on success, -1 if nothing is registered for the pair
 */
int margo_lookup_mplex(margo_instance_id mid, hg_id_t id, uint32_t mplex_id, ABT_pool *pool)
{
    struct mplex_key key;
    struct mplex_element *element;

    if(!mplex_id)
    {
        *pool = mid->handler_pool;
        return(0);
    }

    /* the key is hashed as raw bytes, so zero any padding first */
    memset(&key, 0, sizeof(key));
    key.id = id;
    key.mplex_id = mplex_id;

    HASH_FIND(hh, mid->mplex_table, &key, sizeof(key), element);
    if(!element)
        return(-1);

    assert(element->key.id == id && element->key.mplex_id == mplex_id);

    *pool = element->pool;

    return(0);
}

Philip Carns's avatar
Philip Carns committed
891 892
/**
 * Registers the pool to use for an (RPC id, multiplex id) pair.
 *
 * @param mid margo instance
 * @param id RPC id
 * @param mplex_id multiplex id; MARGO_DEFAULT_MPLEX_ID is accepted and
 *        ignored (nothing is stored for it)
 * @param pool pool to associate with the pair
 * @returns 0 on success, including when the pair is already registered (the
 *          existing registration is kept); -1 if allocation fails
 */
int margo_register_mplex(margo_instance_id mid, hg_id_t id, uint32_t mplex_id, ABT_pool pool)
{
    struct mplex_key key;
    struct mplex_element *element;

    /* nothing to do, we'll let the handler pool take this directly */
    if(mplex_id == MARGO_DEFAULT_MPLEX_ID)
        return(0);

    /* the key is hashed as raw bytes, so zero any padding first */
    memset(&key, 0, sizeof(key));
    key.id = id;
    key.mplex_id = mplex_id;

    HASH_FIND(hh, mid->mplex_table, &key, sizeof(key), element);
    if(element)
        return(0);

    element = malloc(sizeof(*element));
    if(!element)
        return(-1);
    /* copy the key byte-for-byte: struct assignment is not guaranteed to
     * carry over the zeroed padding, and the stored key must hash and
     * compare identically to the one built in margo_lookup_mplex()
     */
    memcpy(&element->key, &key, sizeof(key));
    element->pool = pool;

    HASH_ADD(hh, mid->mplex_table, key, sizeof(key), element);

    return(0);
}
Philip Carns's avatar
Philip Carns committed
918 919 920 921 922 923 924


/**
 * Turns on diagnostics collection for an instance.  The progress loop reads
 * the flag on each pass and starts recording timing samples once it is set.
 *
 * @param mid margo instance
 */
void margo_diag_start(margo_instance_id mid)
{
    mid->diag_enabled = 1;
}

925
static void print_diag_data(FILE *file, const char* name, const char *description, struct diag_data *data)
Philip Carns's avatar
Philip Carns committed
926
{
927 928 929 930 931 932 933 934
    double avg;

    fprintf(file, "# %s\n", description);
    if(data->count != 0)
        avg = data->cumulative/data->count;
    else
        avg = 0;
    fprintf(file, "%s\t%.9f\t%.9f\t%.9f\t%d\n", name, avg, data->min, data->max, data->count);
Philip Carns's avatar
Philip Carns committed
935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967
    return;
}

/**
 * Appends the instance's diagnostic statistics to a file.
 *
 * Diagnostics must have been enabled with margo_diag_start(); this is
 * enforced with an assertion.
 *
 * @param mid margo instance
 * @param file path of the output file, opened in append mode; the string
 *        "-" selects stdout.  If the file cannot be opened, an error is
 *        reported with perror() and nothing is written.
 */
void margo_diag_dump(margo_instance_id mid, const char* file)
{
    FILE *outfile;
    time_t ltime;

    assert(mid->diag_enabled);

    if(strcmp("-", file) == 0)
    {
        outfile = stdout;
    }
    else
    {
        outfile = fopen(file, "a");
        if(!outfile)
        {
            perror("fopen");
            return;
        }
    }

    /* TODO: retrieve self addr and include in output */
    /* TODO: support pattern substitution in file name to create unique
     * output files per process
     */

    time(&ltime);
    fprintf(outfile, "# Margo diagnostics\n");
    fprintf(outfile, "# %s\n", ctime(&ltime));
    fprintf(outfile, "# <stat>\t<avg>\t<min>\t<max>\t<count>\n");
    print_diag_data(outfile, "trigger_elapsed", 
        "Time consumed by HG_Trigger()", 
        &mid->diag_trigger_elapsed);
    print_diag_data(outfile, "progress_elapsed_zero_timeout", 
        "Time consumed by HG_Progress() when called with timeout==0", 
        &mid->diag_progress_elapsed_zero_timeout);
    print_diag_data(outfile, "progress_elapsed_nonzero_timeout", 
        "Time consumed by HG_Progress() when called with timeout!=0", 
        &mid->diag_progress_elapsed_nonzero_timeout);
    print_diag_data(outfile, "progress_timeout_value", 
        "Timeout values passed to HG_Progress()", 
        &mid->diag_progress_timeout_value);

    /* stdout is not ours to close */
    if(outfile != stdout)
        fclose(outfile);
    
    return;
}