darshan-posix.c 58.7 KB
Newer Older
1
/*
Shane Snyder's avatar
Shane Snyder committed
2 3 4
 * Copyright (C) 2015 University of Chicago.
 * See COPYRIGHT notice in top-level directory.
 *
5 6
 */

7 8 9
#define _XOPEN_SOURCE 500
#define _GNU_SOURCE

10
#include "darshan-runtime-config.h"
11 12 13 14 15 16 17 18 19 20 21 22 23 24
#include <stdio.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <stdarg.h>
#include <string.h>
#include <time.h>
#include <stdlib.h>
#include <errno.h>
#include <sys/uio.h>
#include <sys/mman.h>
#include <search.h>
#include <assert.h>
25
#include <libgen.h>
Philip Carns's avatar
Philip Carns committed
26
#include <aio.h>
27
#include <pthread.h>
28

29
#include "utlist.h"
30
#include "darshan.h"
31
#include "darshan-dynamic.h"
32

33
/* Fallbacks for platforms without the explicit 64-bit large-file types.
 * NOTE(review): the HAVE_* macros are presumably provided by
 * darshan-runtime-config.h -- confirm.
 */
#ifndef HAVE_OFF64_T
typedef int64_t off64_t;
#endif
#ifndef HAVE_AIOCB64
/* no distinct 64-bit aio control block: alias it to the plain one */
#define aiocb64 aiocb
#endif
39

40

41 42
DARSHAN_FORWARD_DECL(open, int, (const char *path, int flags, ...));
DARSHAN_FORWARD_DECL(open64, int, (const char *path, int flags, ...));
43 44
DARSHAN_FORWARD_DECL(creat, int, (const char* path, mode_t mode));
DARSHAN_FORWARD_DECL(creat64, int, (const char* path, mode_t mode));
45 46 47 48
DARSHAN_FORWARD_DECL(mkstemp, int, (char *template));
DARSHAN_FORWARD_DECL(mkostemp, int, (char *template, int flags));
DARSHAN_FORWARD_DECL(mkstemps, int, (char *template, int suffixlen));
DARSHAN_FORWARD_DECL(mkostemps, int, (char *template, int suffixlen, int flags));
49 50 51 52 53 54 55 56
DARSHAN_FORWARD_DECL(read, ssize_t, (int fd, void *buf, size_t count));
DARSHAN_FORWARD_DECL(write, ssize_t, (int fd, const void *buf, size_t count));
DARSHAN_FORWARD_DECL(pread, ssize_t, (int fd, void *buf, size_t count, off_t offset));
DARSHAN_FORWARD_DECL(pwrite, ssize_t, (int fd, const void *buf, size_t count, off_t offset));
DARSHAN_FORWARD_DECL(pread64, ssize_t, (int fd, void *buf, size_t count, off64_t offset));
DARSHAN_FORWARD_DECL(pwrite64, ssize_t, (int fd, const void *buf, size_t count, off64_t offset));
DARSHAN_FORWARD_DECL(readv, ssize_t, (int fd, const struct iovec *iov, int iovcnt));
DARSHAN_FORWARD_DECL(writev, ssize_t, (int fd, const struct iovec *iov, int iovcnt));
57 58
DARSHAN_FORWARD_DECL(lseek, off_t, (int fd, off_t offset, int whence));
DARSHAN_FORWARD_DECL(lseek64, off64_t, (int fd, off64_t offset, int whence));
59 60 61 62 63 64
DARSHAN_FORWARD_DECL(__xstat, int, (int vers, const char* path, struct stat *buf));
DARSHAN_FORWARD_DECL(__xstat64, int, (int vers, const char* path, struct stat64 *buf));
DARSHAN_FORWARD_DECL(__lxstat, int, (int vers, const char* path, struct stat *buf));
DARSHAN_FORWARD_DECL(__lxstat64, int, (int vers, const char* path, struct stat64 *buf));
DARSHAN_FORWARD_DECL(__fxstat, int, (int vers, int fd, struct stat *buf));
DARSHAN_FORWARD_DECL(__fxstat64, int, (int vers, int fd, struct stat64 *buf));
65
#ifdef DARSHAN_WRAP_MMAP
Shane Snyder's avatar
Shane Snyder committed
66 67
DARSHAN_FORWARD_DECL(mmap, void*, (void *addr, size_t length, int prot, int flags, int fd, off_t offset));
DARSHAN_FORWARD_DECL(mmap64, void*, (void *addr, size_t length, int prot, int flags, int fd, off64_t offset));
68
#endif /* DARSHAN_WRAP_MMAP */
69 70
DARSHAN_FORWARD_DECL(fsync, int, (int fd));
DARSHAN_FORWARD_DECL(fdatasync, int, (int fd));
71
DARSHAN_FORWARD_DECL(close, int, (int fd));
72 73 74 75 76 77 78 79
DARSHAN_FORWARD_DECL(aio_read, int, (struct aiocb *aiocbp));
DARSHAN_FORWARD_DECL(aio_write, int, (struct aiocb *aiocbp));
DARSHAN_FORWARD_DECL(aio_read64, int, (struct aiocb64 *aiocbp));
DARSHAN_FORWARD_DECL(aio_write64, int, (struct aiocb64 *aiocbp));
DARSHAN_FORWARD_DECL(aio_return, ssize_t, (struct aiocb *aiocbp));
DARSHAN_FORWARD_DECL(aio_return64, ssize_t, (struct aiocb64 *aiocbp));
DARSHAN_FORWARD_DECL(lio_listio, int, (int mode, struct aiocb *const aiocb_list[], int nitems, struct sigevent *sevp));
DARSHAN_FORWARD_DECL(lio_listio64, int, (int mode, struct aiocb64 *const aiocb_list[], int nitems, struct sigevent *sevp));
80

81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98
/* The posix_file_record_ref structure maintains necessary runtime metadata
 * for the POSIX file record (darshan_posix_file structure, defined in
 * darshan-posix-log-format.h) pointed to by 'file_rec'. This metadata
 * assists with the instrumenting of specific statistics in the file record.
 *
 * RATIONALE: the POSIX module needs to track some stateful, volatile 
 * information about each open file (like the current file offset, most recent 
 * access time, etc.) to aid in instrumentation, but this information can't be
 * stored in the darshan_posix_file struct because we don't want it to appear in
 * the final darshan log file.  We therefore associate a posix_file_record_ref
 * struct with each darshan_posix_file struct in order to track this information
 * (i.e., the mapping between posix_file_record_ref structs to darshan_posix_file
 * structs is one-to-one).
 *
 * NOTE: we use the 'darshan_record_ref' interface (in darshan-common) to
 * associate different types of handles with this posix_file_record_ref struct.
 * This allows us to index this struct (and the underlying file record) by using
 * either the corresponding Darshan record identifier (derived from the filename)
99 100
 * or by a generated file descriptor, for instance. Note that, while there should
 * only be a single Darshan record identifier that indexes a posix_file_record_ref,
101 102
 * there could be multiple open file descriptors that index it.
 */
103
struct posix_file_record_ref
104
{
105
    struct darshan_posix_file *file_rec;
106 107 108
    int64_t offset;
    int64_t last_byte_read;
    int64_t last_byte_written;
Shane Snyder's avatar
Shane Snyder committed
109
    enum darshan_io_type last_io_type;
110 111 112
    double last_meta_end;
    double last_read_end;
    double last_write_end;
113
    void *access_root;
114
    int access_count;
115
    void *stride_root;
116
    int stride_count;
117
    struct posix_aio_tracker* aio_list;
118
    int fs_type; /* same as darshan_fs_info->fs_type */
119 120
};

121 122 123 124
/* Module-wide runtime state for the POSIX module: the containers holding
 * the file record references, plus what is needed to coordinate with
 * darshan-core at shutdown time.
 */
struct posix_runtime
{
    /* record references indexed by Darshan record identifier */
    void *rec_id_hash;
    /* the same references indexed by open file descriptor */
    void *fd_hash;
    /* NOTE(review): presumably the number of file records currently
     * tracked -- maintained outside this view, confirm.
     */
    int file_rec_count;
};

132 133 134 135 136
/* One node of a singly linked list describing an aio operation that has
 * been issued but not yet completed.
 */
struct posix_aio_tracker
{
    /* NOTE(review): presumably the timestamp taken when the operation was
     * issued -- the code that sets it is outside this view, confirm.
     */
    double tm1;
    /* the caller's aio control block, kept as an opaque lookup key */
    void *aiocbp;
    /* next tracker in the list, or NULL at the tail */
    struct posix_aio_tracker *next;
};
139

140 141 142
static void posix_runtime_initialize(
    void);
static struct posix_file_record_ref *posix_track_new_file_record(
143
    darshan_record_id rec_id, const char *path);
144 145 146 147
static void posix_aio_tracker_add(
    int fd, void *aiocbp);
static struct posix_aio_tracker* posix_aio_tracker_del(
    int fd, void *aiocbp);
148 149
static void posix_finalize_file_records(
    void *rec_ref_p);
150 151 152 153 154
static void posix_record_reduction_op(
    void* infile_v, void* inoutfile_v, int *len, MPI_Datatype *datatype);
static void posix_shared_record_variance(
    MPI_Comm mod_comm, struct darshan_posix_file *inrec_array,
    struct darshan_posix_file *outrec_array, int shared_rec_count);
155
static void posix_cleanup_runtime(
156
    void);
157 158

static void posix_shutdown(
159
    MPI_Comm mod_comm, darshan_record_id *shared_recs,
160
    int shared_rec_count, void **posix_buf, int *posix_buf_sz);
161

162 163 164 165 166
/* DXT tracing entry points, defined outside this file; invoked for each
 * recorded read/write when enable_dxt_io_trace is set
 */
extern void dxt_posix_write(
    darshan_record_id rec_id,
    int64_t offset,
    int64_t length,
    double start_time,
    double end_time);
extern void dxt_posix_read(
    darshan_record_id rec_id,
    int64_t offset,
    int64_t length,
    double start_time,
    double end_time);
167

168 169 170 171
/* module state; stays NULL until posix_runtime_initialize() has set it up */
static struct posix_runtime *posix_runtime = NULL;
/* recursive lock behind POSIX_LOCK()/POSIX_UNLOCK() */
static pthread_mutex_t posix_runtime_mutex = PTHREAD_RECURSIVE_MUTEX_INITIALIZER_NP;
/* NOTE(review): presumably this process's rank, -1 until assigned -- the
 * assignment is outside this view, confirm
 */
static int my_rank = -1;
/* user buffers are tested against this boundary to classify memory alignment */
static int darshan_mem_alignment = 1;
/* nonzero: every recorded read/write is also passed to the DXT tracer */
static int enable_dxt_io_trace = 0;
173

174 175 176
/* acquire / release the module-wide (recursive) runtime lock */
#define POSIX_LOCK() pthread_mutex_lock(&posix_runtime_mutex)
#define POSIX_UNLOCK() pthread_mutex_unlock(&posix_runtime_mutex)

/* Opens a recording section inside a wrapper.
 *
 * Takes the runtime lock and, unless darshan-core has disabled
 * instrumentation, initializes the module on first use.  When the module is
 * usable the macro falls through WITH THE LOCK HELD; the wrapper must end
 * the section with POSIX_POST_RECORD().  Otherwise the lock is dropped and
 * the enclosing function returns immediately -- which is why the wrapper
 * must have a local variable named 'ret' holding its return value.
 */
#define POSIX_PRE_RECORD() do { \
    int pre_record_ok = 0; \
    POSIX_LOCK(); \
    if(!darshan_core_disabled_instrumentation()) { \
        if(posix_runtime == NULL) \
            posix_runtime_initialize(); \
        pre_record_ok = (posix_runtime != NULL); \
    } \
    if(!pre_record_ok) { \
        POSIX_UNLOCK(); \
        return(ret); \
    } \
} while(0)

/* Closes a recording section opened by POSIX_PRE_RECORD(). */
#define POSIX_POST_RECORD() do { \
    POSIX_UNLOCK(); \
} while(0)
192

Philip Carns's avatar
Philip Carns committed
193
/* Records a completed open-like call.
 *
 * __ret   descriptor returned by the call (must be an lvalue; nothing is
 *         recorded when it is negative)
 * __path  path handed to the call
 * __mode  creation mode, stored in POSIX_MODE when nonzero
 * __tm1   timestamp taken before the call
 * __tm2   timestamp taken after the call
 *
 * The path is cleaned, excluded paths are skipped, and the file's record is
 * looked up by record id (created on first sight).  On success the tracked
 * offsets are reset, open counters and timestamps are updated, and the
 * descriptor is registered so later fd-based calls find the same record.
 */
#define POSIX_RECORD_OPEN(__ret, __path, __mode, __tm1, __tm2) do { \
    darshan_record_id open_rec_id; \
    struct posix_file_record_ref *open_ref = NULL; \
    struct darshan_posix_file *open_rec; \
    char *open_path; \
    if((__ret) < 0) break; \
    open_path = darshan_clean_file_path(__path); \
    /* cleaning failed: fall back to the caller's string (never freed) */ \
    if(open_path == NULL) open_path = (char *)(__path); \
    if(!darshan_core_excluded_path(open_path)) { \
        open_rec_id = darshan_core_gen_record_id(open_path); \
        open_ref = darshan_lookup_record_ref(posix_runtime->rec_id_hash, \
            &open_rec_id, sizeof(darshan_record_id)); \
        if(open_ref == NULL) \
            open_ref = posix_track_new_file_record(open_rec_id, open_path); \
    } \
    if(open_ref != NULL) { \
        open_rec = open_ref->file_rec; \
        if(__mode) \
            open_rec->counters[POSIX_MODE] = (__mode); \
        open_ref->offset = 0; \
        open_ref->last_byte_written = 0; \
        open_ref->last_byte_read = 0; \
        open_rec->counters[POSIX_OPENS] += 1; \
        /* keep the earliest open start time seen so far */ \
        if(open_rec->fcounters[POSIX_F_OPEN_START_TIMESTAMP] == 0 || \
         open_rec->fcounters[POSIX_F_OPEN_START_TIMESTAMP] > (__tm1)) \
            open_rec->fcounters[POSIX_F_OPEN_START_TIMESTAMP] = (__tm1); \
        open_rec->fcounters[POSIX_F_OPEN_END_TIMESTAMP] = (__tm2); \
        DARSHAN_TIMER_INC_NO_OVERLAP(open_rec->fcounters[POSIX_F_META_TIME], \
            __tm1, __tm2, open_ref->last_meta_end); \
        darshan_add_record_ref(&(posix_runtime->fd_hash), &(__ret), sizeof(int), open_ref); \
        darshan_instrument_fs_data(open_ref->fs_type, open_path, __ret); \
    } \
    /* single cleanup point: release the cleaned copy, if one was made */ \
    if(open_path != (__path)) free(open_path); \
} while(0)

228
/* Records a completed read-like call on a tracked descriptor.
 *
 * __ret           bytes read (nothing is recorded when negative)
 * __fd            descriptor read from (must be an lvalue)
 * __pread_flag    nonzero when the call carried an explicit offset
 * __pread_offset  that explicit offset (ignored otherwise)
 * __aligned       nonzero when the user buffer was memory aligned
 * __tm1, __tm2    timestamps taken before and after the call
 *
 * Descriptors with no registered record are ignored.
 */
#define POSIX_RECORD_READ(__ret, __fd, __pread_flag, __pread_offset, __aligned, __tm1, __tm2) do { \
    struct posix_file_record_ref *rd_ref; \
    struct darshan_posix_file *rd_rec; \
    size_t rd_stride = 0; \
    int64_t rd_off; \
    int64_t rd_prev_last; \
    int64_t rd_align; \
    double rd_elapsed = (__tm2) - (__tm1); \
    if((__ret) < 0) break; \
    rd_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &(__fd), sizeof(int)); \
    if(rd_ref == NULL) break; \
    rd_rec = rd_ref->file_rec; \
    /* explicit offset if the call had one, tracked offset otherwise */ \
    rd_off = (__pread_flag) ? (__pread_offset) : rd_ref->offset; \
    /* DXT to record detailed read tracing information */ \
    if(enable_dxt_io_trace) \
        dxt_posix_read(rd_rec->base_rec.id, rd_off, __ret, __tm1, __tm2); \
    /* classify against where the previous read ended */ \
    rd_prev_last = rd_ref->last_byte_read; \
    if(rd_off > rd_prev_last) { \
        rd_rec->counters[POSIX_SEQ_READS] += 1; \
        if(rd_off > 0 && rd_prev_last != 0) \
            rd_stride = rd_off - rd_prev_last - 1; \
    } \
    if(rd_off == (rd_prev_last + 1)) \
        rd_rec->counters[POSIX_CONSEC_READS] += 1; \
    rd_ref->last_byte_read = rd_off + (__ret) - 1; \
    rd_ref->offset = rd_off + (__ret); \
    if(rd_rec->counters[POSIX_MAX_BYTE_READ] < rd_ref->last_byte_read) \
        rd_rec->counters[POSIX_MAX_BYTE_READ] = rd_ref->last_byte_read; \
    rd_rec->counters[POSIX_BYTES_READ] += (__ret); \
    rd_rec->counters[POSIX_READS] += 1; \
    DARSHAN_BUCKET_INC(&(rd_rec->counters[POSIX_SIZE_READ_0_100]), __ret); \
    darshan_common_val_counter(&rd_ref->access_root, &rd_ref->access_count, __ret, \
        &(rd_rec->counters[POSIX_ACCESS1_ACCESS]), \
        &(rd_rec->counters[POSIX_ACCESS1_COUNT])); \
    darshan_common_val_counter(&rd_ref->stride_root, &rd_ref->stride_count, rd_stride, \
        &(rd_rec->counters[POSIX_STRIDE1_STRIDE]), \
        &(rd_rec->counters[POSIX_STRIDE1_COUNT])); \
    if(!(__aligned)) \
        rd_rec->counters[POSIX_MEM_NOT_ALIGNED] += 1; \
    rd_align = rd_rec->counters[POSIX_FILE_ALIGNMENT]; \
    if(rd_align > 0 && (rd_off % rd_align) != 0) \
        rd_rec->counters[POSIX_FILE_NOT_ALIGNED] += 1; \
    /* a read directly after a write counts as a read/write switch */ \
    if(rd_ref->last_io_type == DARSHAN_IO_WRITE) \
        rd_rec->counters[POSIX_RW_SWITCHES] += 1; \
    rd_ref->last_io_type = DARSHAN_IO_READ; \
    if(rd_rec->fcounters[POSIX_F_READ_START_TIMESTAMP] == 0 || \
     rd_rec->fcounters[POSIX_F_READ_START_TIMESTAMP] > (__tm1)) \
        rd_rec->fcounters[POSIX_F_READ_START_TIMESTAMP] = (__tm1); \
    rd_rec->fcounters[POSIX_F_READ_END_TIMESTAMP] = (__tm2); \
    /* remember the slowest read and how large it was */ \
    if(rd_rec->fcounters[POSIX_F_MAX_READ_TIME] < rd_elapsed) { \
        rd_rec->fcounters[POSIX_F_MAX_READ_TIME] = rd_elapsed; \
        rd_rec->counters[POSIX_MAX_READ_TIME_SIZE] = (__ret); \
    } \
    DARSHAN_TIMER_INC_NO_OVERLAP(rd_rec->fcounters[POSIX_F_READ_TIME], \
        __tm1, __tm2, rd_ref->last_read_end); \
} while(0)

286
/* Records a completed write-like call on a tracked descriptor.
 *
 * __ret            bytes written (nothing is recorded when negative)
 * __fd             descriptor written to (must be an lvalue)
 * __pwrite_flag    nonzero when the call carried an explicit offset
 * __pwrite_offset  that explicit offset (ignored otherwise)
 * __aligned        nonzero when the user buffer was memory aligned
 * __tm1, __tm2     timestamps taken before and after the call
 *
 * Descriptors with no registered record are ignored.
 */
#define POSIX_RECORD_WRITE(__ret, __fd, __pwrite_flag, __pwrite_offset, __aligned, __tm1, __tm2) do { \
    struct posix_file_record_ref *wr_ref; \
    struct darshan_posix_file *wr_rec; \
    size_t wr_stride = 0; \
    int64_t wr_off; \
    int64_t wr_prev_last; \
    int64_t wr_align; \
    double wr_elapsed = (__tm2) - (__tm1); \
    if((__ret) < 0) break; \
    wr_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &(__fd), sizeof(int)); \
    if(wr_ref == NULL) break; \
    wr_rec = wr_ref->file_rec; \
    /* explicit offset if the call had one, tracked offset otherwise */ \
    wr_off = (__pwrite_flag) ? (__pwrite_offset) : wr_ref->offset; \
    /* DXT to record detailed write tracing information */ \
    if(enable_dxt_io_trace) \
        dxt_posix_write(wr_rec->base_rec.id, wr_off, __ret, __tm1, __tm2); \
    /* classify against where the previous write ended */ \
    wr_prev_last = wr_ref->last_byte_written; \
    if(wr_off > wr_prev_last) { \
        wr_rec->counters[POSIX_SEQ_WRITES] += 1; \
        if(wr_off > 0 && wr_prev_last != 0) \
            wr_stride = wr_off - wr_prev_last - 1; \
    } \
    if(wr_off == (wr_prev_last + 1)) \
        wr_rec->counters[POSIX_CONSEC_WRITES] += 1; \
    wr_ref->last_byte_written = wr_off + (__ret) - 1; \
    wr_ref->offset = wr_off + (__ret); \
    if(wr_rec->counters[POSIX_MAX_BYTE_WRITTEN] < wr_ref->last_byte_written) \
        wr_rec->counters[POSIX_MAX_BYTE_WRITTEN] = wr_ref->last_byte_written; \
    wr_rec->counters[POSIX_BYTES_WRITTEN] += (__ret); \
    wr_rec->counters[POSIX_WRITES] += 1; \
    DARSHAN_BUCKET_INC(&(wr_rec->counters[POSIX_SIZE_WRITE_0_100]), __ret); \
    darshan_common_val_counter(&wr_ref->access_root, &wr_ref->access_count, __ret, \
        &(wr_rec->counters[POSIX_ACCESS1_ACCESS]), \
        &(wr_rec->counters[POSIX_ACCESS1_COUNT])); \
    darshan_common_val_counter(&wr_ref->stride_root, &wr_ref->stride_count, wr_stride, \
        &(wr_rec->counters[POSIX_STRIDE1_STRIDE]), \
        &(wr_rec->counters[POSIX_STRIDE1_COUNT])); \
    if(!(__aligned)) \
        wr_rec->counters[POSIX_MEM_NOT_ALIGNED] += 1; \
    wr_align = wr_rec->counters[POSIX_FILE_ALIGNMENT]; \
    if(wr_align > 0 && (wr_off % wr_align) != 0) \
        wr_rec->counters[POSIX_FILE_NOT_ALIGNED] += 1; \
    /* a write directly after a read counts as a read/write switch */ \
    if(wr_ref->last_io_type == DARSHAN_IO_READ) \
        wr_rec->counters[POSIX_RW_SWITCHES] += 1; \
    wr_ref->last_io_type = DARSHAN_IO_WRITE; \
    if(wr_rec->fcounters[POSIX_F_WRITE_START_TIMESTAMP] == 0 || \
     wr_rec->fcounters[POSIX_F_WRITE_START_TIMESTAMP] > (__tm1)) \
        wr_rec->fcounters[POSIX_F_WRITE_START_TIMESTAMP] = (__tm1); \
    wr_rec->fcounters[POSIX_F_WRITE_END_TIMESTAMP] = (__tm2); \
    /* remember the slowest write and how large it was */ \
    if(wr_rec->fcounters[POSIX_F_MAX_WRITE_TIME] < wr_elapsed) { \
        wr_rec->fcounters[POSIX_F_MAX_WRITE_TIME] = wr_elapsed; \
        wr_rec->counters[POSIX_MAX_WRITE_TIME_SIZE] = (__ret); \
    } \
    DARSHAN_TIMER_INC_NO_OVERLAP(wr_rec->fcounters[POSIX_F_WRITE_TIME], \
        __tm1, __tm2, wr_ref->last_write_end); \
} while(0)
343

344
/* Records a path-based stat call: resolves __path to its file record
 * (creating the record on first sight, skipping excluded paths) and then
 * applies POSIX_RECORD_STAT to it.  __tm1/__tm2 are the timestamps taken
 * before and after the call.
 */
#define POSIX_LOOKUP_RECORD_STAT(__path, __statbuf, __tm1, __tm2) do { \
    darshan_record_id stat_rec_id; \
    struct posix_file_record_ref *stat_ref = NULL; \
    char *stat_path = darshan_clean_file_path(__path); \
    /* cleaning failed: fall back to the caller's string (never freed) */ \
    if(stat_path == NULL) stat_path = (char *)(__path); \
    if(!darshan_core_excluded_path(stat_path)) { \
        stat_rec_id = darshan_core_gen_record_id(stat_path); \
        stat_ref = darshan_lookup_record_ref(posix_runtime->rec_id_hash, \
            &stat_rec_id, sizeof(darshan_record_id)); \
        if(stat_ref == NULL) \
            stat_ref = posix_track_new_file_record(stat_rec_id, stat_path); \
    } \
    if(stat_path != (__path)) free(stat_path); \
    if(stat_ref != NULL) { \
        POSIX_RECORD_STAT(stat_ref, __statbuf, __tm1, __tm2); \
    } \
} while(0)

362 363 364 365
/* Accounts one stat call against an already-resolved record reference:
 * adds the call's duration to the metadata timer and bumps POSIX_STATS.
 * __statbuf is accepted for symmetry with the callers but is not used.
 */
#define POSIX_RECORD_STAT(__rec_ref, __statbuf, __tm1, __tm2) do { \
    DARSHAN_TIMER_INC_NO_OVERLAP((__rec_ref)->file_rec->fcounters[POSIX_F_META_TIME], \
        __tm1, __tm2, (__rec_ref)->last_meta_end); \
    (__rec_ref)->file_rec->counters[POSIX_STATS] += 1; \
} while(0)

368

369 370 371 372
/**********************************************************
 *      Wrappers for POSIX I/O functions of interest      * 
 **********************************************************/

373
int DARSHAN_DECL(open)(const char *path, int flags, ...)
374 375 376 377 378
{
    int mode = 0;
    int ret;
    double tm1, tm2;

379 380
    MAP_OR_FAIL(open);

381
    if(flags & O_CREAT) 
382 383 384 385 386 387
    {
        va_list arg;
        va_start(arg, flags);
        mode = va_arg(arg, int);
        va_end(arg);

388
        tm1 = darshan_core_wtime();
389
        ret = __real_open(path, flags, mode);
390
        tm2 = darshan_core_wtime();
391 392 393
    }
    else
    {
394
        tm1 = darshan_core_wtime();
395
        ret = __real_open(path, flags);
396
        tm2 = darshan_core_wtime();
397 398
    }

399
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
400
    POSIX_RECORD_OPEN(ret, path, mode, tm1, tm2);
401
    POSIX_POST_RECORD();
402 403 404 405

    return(ret);
}

Shane Snyder's avatar
Shane Snyder committed
406 407 408 409 410 411
/* Wrapper for open64(): forwards to the real open64() while timing it,
 * then records a successful open against the file's POSIX record.
 *
 * The optional third argument (mode) is fetched from the variadic list
 * only when the flags call for it.  Per open(2) that is the case for both
 * O_CREAT and O_TMPFILE; without this, an O_TMPFILE open would reach the
 * real call with no mode argument at all.
 *
 * Returns whatever the real open64() returned.
 */
int DARSHAN_DECL(open64)(const char *path, int flags, ...)
{
    int mode = 0;
    int needs_mode;
    int ret;
    double tm1, tm2;

    MAP_OR_FAIL(open64);

    needs_mode = ((flags & O_CREAT) != 0);
#ifdef O_TMPFILE
    /* O_TMPFILE is a multi-bit flag, so compare against the full mask */
    if((flags & O_TMPFILE) == O_TMPFILE)
        needs_mode = 1;
#endif

    if(needs_mode)
    {
        va_list arg;
        va_start(arg, flags);
        mode = va_arg(arg, int);
        va_end(arg);

        tm1 = darshan_core_wtime();
        ret = __real_open64(path, flags, mode);
        tm2 = darshan_core_wtime();
    }
    else
    {
        tm1 = darshan_core_wtime();
        ret = __real_open64(path, flags);
        tm2 = darshan_core_wtime();
    }

    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, path, mode, tm1, tm2);
    POSIX_POST_RECORD();

    return(ret);
}

/* Wrapper for creat(): times the real call and records a successful
 * result as an open, including the creation mode.  Returns the real
 * call's result.
 */
int DARSHAN_DECL(creat)(const char* path, mode_t mode)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(creat);

    start_tm = darshan_core_wtime();
    ret = __real_creat(path, mode);
    end_tm = darshan_core_wtime();

    /* POSIX_PRE_RECORD may return 'ret' directly if recording is unavailable */
    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, path, mode, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

/* Wrapper for creat64(): times the real call and records a successful
 * result as an open, including the creation mode.  Returns the real
 * call's result.
 */
int DARSHAN_DECL(creat64)(const char* path, mode_t mode)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(creat64);

    start_tm = darshan_core_wtime();
    ret = __real_creat64(path, mode);
    end_tm = darshan_core_wtime();

    /* POSIX_PRE_RECORD may return 'ret' directly if recording is unavailable */
    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, path, mode, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

475 476 477 478 479 480 481 482 483 484 485
/* Wrapper for mkstemp(): times the real call and records a successful
 * result as an open of 'template' with no mode.  Returns the real call's
 * result.
 */
int DARSHAN_DECL(mkstemp)(char* template)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(mkstemp);

    start_tm = darshan_core_wtime();
    ret = __real_mkstemp(template);
    end_tm = darshan_core_wtime();

    /* POSIX_PRE_RECORD may return 'ret' directly if recording is unavailable */
    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, template, 0, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

/* Wrapper for mkostemp(): times the real call and records a successful
 * result as an open of 'template' with no mode.  Returns the real call's
 * result.
 */
int DARSHAN_DECL(mkostemp)(char* template, int flags)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(mkostemp);

    start_tm = darshan_core_wtime();
    ret = __real_mkostemp(template, flags);
    end_tm = darshan_core_wtime();

    /* POSIX_PRE_RECORD may return 'ret' directly if recording is unavailable */
    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, template, 0, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

/* Wrapper for mkstemps(): times the real call and records a successful
 * result as an open of 'template' with no mode.  Returns the real call's
 * result.
 */
int DARSHAN_DECL(mkstemps)(char* template, int suffixlen)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(mkstemps);

    start_tm = darshan_core_wtime();
    ret = __real_mkstemps(template, suffixlen);
    end_tm = darshan_core_wtime();

    /* POSIX_PRE_RECORD may return 'ret' directly if recording is unavailable */
    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, template, 0, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

/* Wrapper for mkostemps(): times the real call and records a successful
 * result as an open of 'template' with no mode.  Returns the real call's
 * result.
 */
int DARSHAN_DECL(mkostemps)(char* template, int suffixlen, int flags)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(mkostemps);

    start_tm = darshan_core_wtime();
    ret = __real_mkostemps(template, suffixlen, flags);
    end_tm = darshan_core_wtime();

    /* POSIX_PRE_RECORD may return 'ret' directly if recording is unavailable */
    POSIX_PRE_RECORD();
    POSIX_RECORD_OPEN(ret, template, 0, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

547 548 549 550 551 552
ssize_t DARSHAN_DECL(read)(int fd, void *buf, size_t count)
{
    ssize_t ret;
    int aligned_flag = 0;
    double tm1, tm2;

Shane Snyder's avatar
Shane Snyder committed
553
    MAP_OR_FAIL(read);
554

555
    if((unsigned long)buf % darshan_mem_alignment == 0) aligned_flag = 1;
556 557 558 559 560

    tm1 = darshan_core_wtime();
    ret = __real_read(fd, buf, count);
    tm2 = darshan_core_wtime();

561
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
562
    POSIX_RECORD_READ(ret, fd, 0, 0, aligned_flag, tm1, tm2);
563
    POSIX_POST_RECORD();
564 565 566 567 568 569 570 571 572 573 574 575

    return(ret);
}

ssize_t DARSHAN_DECL(write)(int fd, const void *buf, size_t count)
{
    ssize_t ret;
    int aligned_flag = 0;
    double tm1, tm2;

    MAP_OR_FAIL(write);

576
    if((unsigned long)buf % darshan_mem_alignment == 0) aligned_flag = 1;
577 578 579 580 581

    tm1 = darshan_core_wtime();
    ret = __real_write(fd, buf, count);
    tm2 = darshan_core_wtime();

582
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
583
    POSIX_RECORD_WRITE(ret, fd, 0, 0, aligned_flag, tm1, tm2);
584
    POSIX_POST_RECORD();
585 586 587 588 589 590 591 592 593 594 595 596

    return(ret);
}

ssize_t DARSHAN_DECL(pread)(int fd, void *buf, size_t count, off_t offset)
{
    ssize_t ret;
    int aligned_flag = 0;
    double tm1, tm2;

    MAP_OR_FAIL(pread);

597
    if((unsigned long)buf % darshan_mem_alignment == 0) aligned_flag = 1;
598 599 600 601 602

    tm1 = darshan_core_wtime();
    ret = __real_pread(fd, buf, count, offset);
    tm2 = darshan_core_wtime();

603
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
604
    POSIX_RECORD_READ(ret, fd, 1, offset, aligned_flag, tm1, tm2);
605
    POSIX_POST_RECORD();
606 607 608 609 610 611 612 613 614 615 616 617

    return(ret);
}

ssize_t DARSHAN_DECL(pwrite)(int fd, const void *buf, size_t count, off_t offset)
{
    ssize_t ret;
    int aligned_flag = 0;
    double tm1, tm2;

    MAP_OR_FAIL(pwrite);

618
    if((unsigned long)buf % darshan_mem_alignment == 0) aligned_flag = 1;
619 620 621 622 623

    tm1 = darshan_core_wtime();
    ret = __real_pwrite(fd, buf, count, offset);
    tm2 = darshan_core_wtime();

624
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
625
    POSIX_RECORD_WRITE(ret, fd, 1, offset, aligned_flag, tm1, tm2);
626
    POSIX_POST_RECORD();
627 628 629 630 631 632 633 634 635 636 637 638

    return(ret);
}

/* Wrapper for pread64(): times the real call and records it as a read at
 * the caller-supplied offset.  Returns the real call's result.
 */
ssize_t DARSHAN_DECL(pread64)(int fd, void *buf, size_t count, off64_t offset)
{
    ssize_t ret;
    double start_tm, end_tm;
    /* nonzero when buf falls on a darshan_mem_alignment boundary */
    int is_aligned = (((unsigned long)buf % darshan_mem_alignment) == 0);

    MAP_OR_FAIL(pread64);

    start_tm = darshan_core_wtime();
    ret = __real_pread64(fd, buf, count, offset);
    end_tm = darshan_core_wtime();

    POSIX_PRE_RECORD();
    POSIX_RECORD_READ(ret, fd, 1, offset, is_aligned, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

/* Wrapper for pwrite64(): times the real call and records it as a write at
 * the caller-supplied offset.  Returns the real call's result.
 */
ssize_t DARSHAN_DECL(pwrite64)(int fd, const void *buf, size_t count, off64_t offset)
{
    ssize_t ret;
    double start_tm, end_tm;
    /* nonzero when buf falls on a darshan_mem_alignment boundary */
    int is_aligned = (((unsigned long)buf % darshan_mem_alignment) == 0);

    MAP_OR_FAIL(pwrite64);

    start_tm = darshan_core_wtime();
    ret = __real_pwrite64(fd, buf, count, offset);
    end_tm = darshan_core_wtime();

    POSIX_PRE_RECORD();
    POSIX_RECORD_WRITE(ret, fd, 1, offset, is_aligned, start_tm, end_tm);
    POSIX_POST_RECORD();

    return(ret);
}

ssize_t DARSHAN_DECL(readv)(int fd, const struct iovec *iov, int iovcnt)
{
    ssize_t ret;
676
    int aligned_flag = 1;
677 678 679 680
    int i;
    double tm1, tm2;

    MAP_OR_FAIL(readv);
681

682 683 684 685
    for(i=0; i<iovcnt; i++)
    {
        if(((unsigned long)iov[i].iov_base % darshan_mem_alignment) != 0)
            aligned_flag = 0;
686
    }
687 688 689 690 691

    tm1 = darshan_core_wtime();
    ret = __real_readv(fd, iov, iovcnt);
    tm2 = darshan_core_wtime();

692
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
693
    POSIX_RECORD_READ(ret, fd, 0, 0, aligned_flag, tm1, tm2);
694
    POSIX_POST_RECORD();
695 696 697 698 699 700 701

    return(ret);
}

ssize_t DARSHAN_DECL(writev)(int fd, const struct iovec *iov, int iovcnt)
{
    ssize_t ret;
702
    int aligned_flag = 1;
703 704 705 706
    int i;
    double tm1, tm2;

    MAP_OR_FAIL(writev);
707

708 709 710 711
    for(i=0; i<iovcnt; i++)
    {
        if(((unsigned long)iov[i].iov_base % darshan_mem_alignment) != 0)
            aligned_flag = 0;
712
    }
713 714 715 716 717

    tm1 = darshan_core_wtime();
    ret = __real_writev(fd, iov, iovcnt);
    tm2 = darshan_core_wtime();

718
    POSIX_PRE_RECORD();
Philip Carns's avatar
Philip Carns committed
719
    POSIX_RECORD_WRITE(ret, fd, 0, 0, aligned_flag, tm1, tm2);
720
    POSIX_POST_RECORD();
721 722 723 724 725 726 727

    return(ret);
}

off_t DARSHAN_DECL(lseek)(int fd, off_t offset, int whence)
{
    off_t ret;
728
    struct posix_file_record_ref *rec_ref;
729 730 731 732 733 734 735 736 737 738
    double tm1, tm2;

    MAP_OR_FAIL(lseek);

    tm1 = darshan_core_wtime();
    ret = __real_lseek(fd, offset, whence);
    tm2 = darshan_core_wtime();

    if(ret >= 0)
    {
739
        POSIX_PRE_RECORD();
740 741
        rec_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &fd, sizeof(int));
        if(rec_ref)
742
        {
743
            rec_ref->offset = ret;
744
            DARSHAN_TIMER_INC_NO_OVERLAP(
745 746 747
                rec_ref->file_rec->fcounters[POSIX_F_META_TIME],
                tm1, tm2, rec_ref->last_meta_end);
            rec_ref->file_rec->counters[POSIX_SEEKS] += 1;
748
        }
749
        POSIX_POST_RECORD();
750 751 752 753 754 755 756 757
    }

    return(ret);
}

off_t DARSHAN_DECL(lseek64)(int fd, off_t offset, int whence)
{
    off_t ret;
758
    struct posix_file_record_ref *rec_ref;
759 760 761 762 763 764 765 766 767 768
    double tm1, tm2;

    MAP_OR_FAIL(lseek64);

    tm1 = darshan_core_wtime();
    ret = __real_lseek64(fd, offset, whence);
    tm2 = darshan_core_wtime();

    if(ret >= 0)
    {
769
        POSIX_PRE_RECORD();
770 771
        rec_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &fd, sizeof(int));
        if(rec_ref)
772
        {
773
            rec_ref->offset = ret;
774
            DARSHAN_TIMER_INC_NO_OVERLAP(
775 776 777
                rec_ref->file_rec->fcounters[POSIX_F_META_TIME],
                tm1, tm2, rec_ref->last_meta_end);
            rec_ref->file_rec->counters[POSIX_SEEKS] += 1;
778
        }
779
        POSIX_POST_RECORD();
780 781 782 783 784
    }

    return(ret);
}

785 786 787 788 789 790 791 792 793 794 795 796 797 798
/* Wrapper for __xstat(): times the real call and, when it succeeds on a
 * regular file, records a stat against the record for 'path'.  Returns the
 * real call's result.
 */
int DARSHAN_DECL(__xstat)(int vers, const char *path, struct stat *buf)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(__xstat);

    start_tm = darshan_core_wtime();
    ret = __real___xstat(vers, path, buf);
    end_tm = darshan_core_wtime();

    /* only successful stats of regular files are recorded */
    if(ret >= 0 && S_ISREG(buf->st_mode))
    {
        POSIX_PRE_RECORD();
        POSIX_LOOKUP_RECORD_STAT(path, buf, start_tm, end_tm);
        POSIX_POST_RECORD();
    }

    return(ret);
}

/* Wrapper for __xstat64(): times the real call and, when it succeeds on a
 * regular file, records a stat against the record for 'path'.  Returns the
 * real call's result.
 */
int DARSHAN_DECL(__xstat64)(int vers, const char *path, struct stat64 *buf)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(__xstat64);

    start_tm = darshan_core_wtime();
    ret = __real___xstat64(vers, path, buf);
    end_tm = darshan_core_wtime();

    /* only successful stats of regular files are recorded */
    if(ret >= 0 && S_ISREG(buf->st_mode))
    {
        POSIX_PRE_RECORD();
        POSIX_LOOKUP_RECORD_STAT(path, buf, start_tm, end_tm);
        POSIX_POST_RECORD();
    }

    return(ret);
}

/* Wrapper for __lxstat(): times the real call and, when it succeeds on a
 * regular file, records a stat against the record for 'path'.  Returns the
 * real call's result.
 */
int DARSHAN_DECL(__lxstat)(int vers, const char *path, struct stat *buf)
{
    double start_tm, end_tm;
    int ret;

    MAP_OR_FAIL(__lxstat);

    start_tm = darshan_core_wtime();
    ret = __real___lxstat(vers, path, buf);
    end_tm = darshan_core_wtime();

    /* only successful stats of regular files are recorded */
    if(ret >= 0 && S_ISREG(buf->st_mode))
    {
        POSIX_PRE_RECORD();
        POSIX_LOOKUP_RECORD_STAT(path, buf, start_tm, end_tm);
        POSIX_POST_RECORD();
    }

    return(ret);
}

/*
 * Wrapper for __lxstat64(): forwards to the real __lxstat64(), timing the
 * call, and then hands the result to the POSIX module's stat bookkeeping.
 *
 * vers - version argument, forwarded to the real call untouched
 * path - path of the file being queried
 * buf  - caller-supplied stat64 buffer, filled in by the real call
 *
 * Returns exactly what the real __lxstat64() returned. Nothing is recorded
 * if the real call failed or if the reported mode is not a regular file.
 */
int DARSHAN_DECL(__lxstat64)(int vers, const char *path, struct stat64 *buf)
{
    int ret;
    double tm1, tm2;

    MAP_OR_FAIL(__lxstat64);

    /* the two timestamps bracket only the real call */
    tm1 = darshan_core_wtime();
    ret = __real___lxstat64(vers, path, buf);
    tm2 = darshan_core_wtime();

    /* buf->st_mode is only inspected once ret is known to be non-negative */
    if(ret < 0 || !S_ISREG(buf->st_mode))
        return(ret);

    /* path, stat buffer and timestamps are passed to
     * POSIX_LOOKUP_RECORD_STAT (defined elsewhere in this file)
     */
    POSIX_PRE_RECORD();
    POSIX_LOOKUP_RECORD_STAT(path, buf, tm1, tm2);
    POSIX_POST_RECORD();

    return(ret);
}

int DARSHAN_DECL(__fxstat)(int vers, int fd, struct stat *buf)
{
    int ret;
872
    struct posix_file_record_ref *rec_ref;
873 874 875 876 877 878 879 880 881 882 883
    double tm1, tm2;

    MAP_OR_FAIL(__fxstat);

    tm1 = darshan_core_wtime();
    ret = __real___fxstat(vers, fd, buf);
    tm2 = darshan_core_wtime();

    if(ret < 0 || !S_ISREG(buf->st_mode))
        return(ret);

884
    POSIX_PRE_RECORD();
885 886
    rec_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &fd, sizeof(int));
    if(rec_ref)
887
    {
888
        POSIX_RECORD_STAT(rec_ref, buf, tm1, tm2);
889
    }
890
    POSIX_POST_RECORD();
891 892 893 894 895 896 897

    return(ret);
}

int DARSHAN_DECL(__fxstat64)(int vers, int fd, struct stat64 *buf)
{
    int ret;
898
    struct posix_file_record_ref *rec_ref;
899 900 901 902 903 904 905 906 907 908 909
    double tm1, tm2;

    MAP_OR_FAIL(__fxstat64);

    tm1 = darshan_core_wtime();
    ret = __real___fxstat64(vers, fd, buf);
    tm2 = darshan_core_wtime();

    if(ret < 0 || !S_ISREG(buf->st_mode))
        return(ret);

910
    POSIX_PRE_RECORD();
911 912
    rec_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &fd, sizeof(int));
    if(rec_ref)
913
    {
914
        POSIX_RECORD_STAT(rec_ref, buf, tm1, tm2);
915
    }
916
    POSIX_POST_RECORD();
917 918 919 920

    return(ret);
}

921
#ifdef DARSHAN_WRAP_MMAP
/*
 * Wrapper for mmap(): forwards to the real mmap() and, for file-backed
 * mappings of a descriptor that has a record reference, bumps that file's
 * POSIX_MMAPS counter. Only compiled when DARSHAN_WRAP_MMAP is defined.
 *
 * All arguments are forwarded to the real mmap() unchanged.
 *
 * Returns exactly what the real mmap() returned. No counter is touched when
 * the mapping is anonymous or has a negative fd, when the real call returns
 * MAP_FAILED, or when no record reference is found for `fd`.
 */
void* DARSHAN_DECL(mmap)(void *addr, size_t length, int prot, int flags,
    int fd, off_t offset)
{
    void* ret;
    struct posix_file_record_ref *rec_ref;

    MAP_OR_FAIL(mmap);

    if(fd < 0 || (flags & MAP_ANONYMOUS))
    {
        /* mmap is not associated with a backing file; skip all Darshan
         * characterization attempts.
         */
        return(__real_mmap(addr, length, prot, flags, fd, offset));
    }

    ret = __real_mmap(addr, length, prot, flags, fd, offset);
    if(ret == MAP_FAILED)
        return(ret);

    POSIX_PRE_RECORD();
    /* the descriptor value itself is the key into the fd hash */
    rec_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &fd, sizeof(int));
    if(rec_ref)
    {
        rec_ref->file_rec->counters[POSIX_MMAPS] += 1;
    }
    POSIX_POST_RECORD();

    return(ret);
}
#endif /* DARSHAN_WRAP_MMAP */
Shane Snyder's avatar
Shane Snyder committed
953

954
#ifdef DARSHAN_WRAP_MMAP
/*
 * Wrapper for mmap64(): forwards to the real mmap64() and, for file-backed
 * mappings of a descriptor that has a record reference, bumps that file's
 * POSIX_MMAPS counter. Only compiled when DARSHAN_WRAP_MMAP is defined.
 *
 * All arguments are forwarded to the real mmap64() unchanged.
 *
 * Returns exactly what the real mmap64() returned. No counter is touched
 * when the mapping is anonymous or has a negative fd, when the real call
 * returns MAP_FAILED, or when no record reference is found for `fd`.
 */
void* DARSHAN_DECL(mmap64)(void *addr, size_t length, int prot, int flags,
    int fd, off64_t offset)
{
    void* ret;
    struct posix_file_record_ref *rec_ref;

    MAP_OR_FAIL(mmap64);

    if(fd < 0 || (flags & MAP_ANONYMOUS))
    {
        /* mmap is not associated with a backing file; skip all Darshan
         * characterization attempts.
         */
        return(__real_mmap64(addr, length, prot, flags, fd, offset));
    }

    ret = __real_mmap64(addr, length, prot, flags, fd, offset);
    if(ret == MAP_FAILED)
        return(ret);

    POSIX_PRE_RECORD();
    /* the descriptor value itself is the key into the fd hash */
    rec_ref = darshan_lookup_record_ref(posix_runtime->fd_hash, &fd, sizeof(int));
    if(rec_ref)
    {
        rec_ref->file_rec->counters[POSIX_MMAPS] += 1;
    }
    POSIX_POST_RECORD();

    return(ret);
}
#endif /* DARSHAN_WRAP_MMAP */
Shane Snyder's avatar
Shane Snyder committed
986

987 988 989
int DARSHAN_DECL(fsync)(int fd)
{
    int ret;
990
    struct posix_file_record_ref *rec_ref;
991 992 993 994 995 996 997 998 999 1000 1001
    double tm1, tm2;