/*
 * Copyright (C) 2013 University of Chicago.
 * See COPYRIGHT notice in top-level directory.
 *
 */

/* I/O workload generator API to be used for reading I/O operations into
 * storage system simulations.  This API just describes the operations to be
 * executed; it does not service the operations.
 */

#ifndef CODES_WORKLOAD_H
#define CODES_WORKLOAD_H

#ifdef __cplusplus
extern "C" {
#endif

/* NOTE(review): this header uses uint64_t/int64_t, FILE, off_t and size_t but
 * includes no standard headers itself; presumably they arrive transitively
 * through <ross.h> -- confirm before reordering or removing these includes. */
#include <ross.h>
#include "configuration.h"

/* Size, in bytes, of the fixed-length path/name buffers embedded in the
 * workload parameter structs declared in this header. */
#define MAX_NAME_LENGTH_WKLD 512

/* implementations included with codes: one parameter struct per workload
 * implementation, each usable without the "struct" keyword */
typedef struct iomock_params iomock_params;
typedef struct iolang_params iolang_params;
typedef struct darshan_params darshan_params;
typedef struct recorder_params recorder_params;
typedef struct dumpi_trace_params dumpi_trace_params;
typedef struct checkpoint_wrkld_params checkpoint_wrkld_params;

/*
 * Parameters for the iomock workload implementation.
 * NOTE(review): the field notes marked "presumably" are inferred from the
 * field names only -- confirm against the generator source.
 */
struct iomock_params {
    uint64_t file_id;      /* presumably the file identifier used by the generated ops */
    int use_uniq_file_ids; /* flag; presumably selects distinct file ids */
    int is_write;          /* flag; presumably writes when set, reads otherwise */
    int num_requests;      /* presumably the number of requests to generate */
    int request_size;      /* presumably the size of each request */
    /*
     * For optimizing lookup: set higher (>= num ranks) to reduce collisions,
     * and 0 to use the default.
     */
    int rank_table_size;
};

46
struct iolang_params
47
{
Jonathan Jenkins's avatar
Jonathan Jenkins committed
48
    /* the rank count is defined in the workload config file */
49
    int num_cns;
50
51
    /* flag - use path to find kernel files relative to the metafile */
    int use_relpath;
Jonathan Jenkins's avatar
Jonathan Jenkins committed
52
    char io_kernel_meta_path[MAX_NAME_LENGTH_WKLD];
53
    /* set by config in the metadata path */
Jonathan Jenkins's avatar
Jonathan Jenkins committed
54
    char io_kernel_path[MAX_NAME_LENGTH_WKLD];
55
56
};

57
58
59
struct darshan_params
{
    char log_file_path[MAX_NAME_LENGTH_WKLD];
60
    int64_t aggregator_cnt;
61
62
};

63
64
65
struct recorder_params
{
    char trace_dir_path[MAX_NAME_LENGTH_WKLD];
66
    int64_t nprocs;
67
68
};

69
70
struct dumpi_trace_params {
   char file_name[MAX_NAME_LENGTH_WKLD];
71
   int num_net_traces;
72
73
74
75
#ifdef ENABLE_CORTEX
   char cortex_script[MAX_NAME_LENGTH_WKLD];
   char cortex_class[MAX_NAME_LENGTH_WKLD];
#endif
76
77
};

/* Parameters for the checkpoint workload implementation. */
struct checkpoint_wrkld_params
{
    int nprocs; /* number of workload processes */
    double checkpoint_sz; /* size of checkpoint, in TiB */
    double checkpoint_wr_bw; /* checkpoint write b/w, in GiB/s */
    int total_checkpoints; /* total number of checkpoint phases */
    double mtti; /* mean time to interrupt, in hours */
};

/* supported I/O operations
 *
 * Values are assigned implicitly after CODES_WK_END = 1, so the order of the
 * enumerators determines their numeric values; append new operations rather
 * than inserting them if any stored or exchanged value must stay stable.
 */
enum codes_workload_op_type
{
    /* terminator; there are no more operations for this rank */
    CODES_WK_END = 1,
    /* sleep/delay to simulate computation or other activity */
    CODES_WK_DELAY,
    /* block until specified ranks have reached the same point */
    CODES_WK_BARRIER,

    /* IO operations */
    /* open */
    CODES_WK_OPEN,
    /* close */
    CODES_WK_CLOSE,
    /* write */
    CODES_WK_WRITE,
    /* read */
    CODES_WK_READ,

    /* network operations (modelled after MPI operations) */
    /* blocking send operation */
    CODES_WK_SEND,
    /* blocking recv operation */
    CODES_WK_RECV,
    /* non-blocking send operation */
    CODES_WK_ISEND,
    /* non-blocking receive operation */
    CODES_WK_IRECV,
    /* broadcast operation */
    CODES_WK_BCAST,
    /* Allgather operation */
    CODES_WK_ALLGATHER,
    /* Allgatherv operation */
    CODES_WK_ALLGATHERV,
    /* Alltoall operation */
    CODES_WK_ALLTOALL,
    /* Alltoallv operation */
    CODES_WK_ALLTOALLV,
    /* Reduce operation */
    CODES_WK_REDUCE,
    /* Allreduce operation */
    CODES_WK_ALLREDUCE,
    /* Generic collective operation */
    CODES_WK_COL,
    /* Waitall operation */
    CODES_WK_WAITALL,
    /* Wait operation */
    CODES_WK_WAIT,
    /* Waitsome operation */
    CODES_WK_WAITSOME,
    /* Waitany operation */
    CODES_WK_WAITANY,
    /* Testall operation */
    CODES_WK_TESTALL,
    /* MPI request free operation */
    CODES_WK_REQ_FREE,

    /* for workloads that have events not yet handled
     * (eg the workload language) */
    CODES_WK_IGNORE
};

/* I/O operation paramaters */
struct codes_workload_op
{
    /* TODO: do we need different "classes" of operations to differentiate
     * between different APIs?
     */

Philip Carns's avatar
Philip Carns committed
157
    /* what type of operation this is */
158
    enum codes_workload_op_type op_type;
159
160
161
    /* currently only used by network workloads */
    double start_time;
    double end_time;
162
    double sim_start_time;
163

Philip Carns's avatar
Philip Carns committed
164
    /* parameters for each operation type */
165
166
167
168
    union
    {
        struct {
            double seconds;
169
	    double nsecs;
170
171
        } delay;
        struct {
Philip Carns's avatar
Philip Carns committed
172
            int count;  /* num ranks in barrier, -1 means "all" */
173
174
175
            int root;   /* root rank */
        } barrier;
        struct {
176
            uint64_t file_id;      /* integer identifier for the file */
177
178
179
            int create_flag;  /* file must be created, not just opened */
        } open;
        struct {
180
            uint64_t file_id;  /* file to operate on */
181
182
183
184
            off_t offset; /* offset and size */
            size_t size;
        } write;
        struct {
185
            uint64_t file_id;  /* file to operate on */
186
187
188
189
            off_t offset; /* offset and size */
            size_t size;
        } read;
        struct {
190
            uint64_t file_id;  /* file to operate on */
191
        } close;
192
193
194
195
        struct {
            /* TODO: not sure why source rank is here */
            int source_rank;/* source rank of MPI send message */
            int dest_rank; /* dest rank of MPI send message */
196
            int64_t num_bytes; /* number of bytes to be transferred over the network */
197
            int16_t data_type; /* MPI data type to be matched with the recv */
198
199
            int count; /* number of elements to be received */
            int tag; /* tag of the message */
200
            int32_t req_id;
201
202
203
204
205
206
        } send;
        struct {
            /* TODO: not sure why source rank is here */
            int source_rank;/* source rank of MPI recv message */
            int dest_rank;/* dest rank of MPI recv message */
            int num_bytes; /* number of bytes to be transferred over the network */
207
            int16_t data_type; /* MPI data type to be matched with the send */
208
209
            int count; /* number of elements to be sent */
            int tag; /* tag of the message */
210
            int32_t req_id;
211
212
213
214
215
        } recv;
        /* TODO: non-stub for other collectives */
        struct {
            int num_bytes;
        } collective;
216
217
        struct {
            int count;
218
            int32_t* req_ids;
219
220
        } waits;
        struct {
221
            int32_t req_id;
222
        } wait;
223
224
225
226
227
        struct
        {
            int32_t req_id;
        }
        free;
228
    }u;
229
230
};

// helper macro for implementations - call this if multi-app support not
// available. Reports an error through tw_error() when id is non-zero.
//
// The body is wrapped in do { } while (0) so that an "else" following the
// macro can never bind to the macro's internal "if", and id is parenthesized
// so that expression arguments (e.g. "a & b") are compared as a whole.
// The trailing ';' is kept on purpose: existing call sites may invoke the
// macro without their own semicolon.
#define APP_ID_UNSUPPORTED(id, name) \
    do { \
        if ((id) != 0) \
            tw_error(TW_LOC,\
                    "APP IDs not supported for %s generator, 0 required", name); \
    } while (0);

/*
 * Result of codes_workload_read_config(): the workload name and parameters
 * read from a CODES configuration file, which can then be passed to
 * codes_workload_load.
 */
typedef struct {
    const char *type;   /* workload name */
    void *params;       /* workload parameters */
} codes_workload_config_return;

247
248
249
// NOTE: some workloads (iolang, checkpoint) require information about the
// total number of ranks to correctly process traces/config files, etc. Other
// workload generators (darshan) ignore it
250
251
codes_workload_config_return codes_workload_read_config(
        ConfigHandle * handle,
252
253
254
        char const * section_name,
        char const * annotation,
        int num_ranks);
255
256
257

/* NOTE(review): presumably releases a codes_workload_config_return obtained
 * from codes_workload_read_config; the implementation is not in this header,
 * so confirm what is actually freed (the params, the struct, or both). */
void codes_workload_free_config_return(codes_workload_config_return *c);

/* load and initialize workload of type "type" with parameters specified by
 * "params".  The rank is the caller's relative rank within the collection
 * of processes that will participate in this workload. The app_id is the
 * "application" that the rank is participating in, used to differentiate
 * between multiple, concurrent workloads.
 *
 * This function is intended to be called by a compute node LP in a model
 * and may be called multiple times over the course of a
 * simulation in order to execute different application workloads.
 *
 * Returns an identifier that can be used to retrieve operations later.
 * Returns -1 on failure.
 */
int codes_workload_load(
        const char* type,
        const char* params,
        int app_id,
        int rank);

/* Retrieves the next I/O operation to execute.  The wkld_id is the
 * identifier returned by codes_workload_load().  The op argument is a pointer
 * to a structure to be filled in with I/O operation information.
 */
void codes_workload_get_next(
        int wkld_id,
        int app_id,
        int rank,
        struct codes_workload_op *op);

/* Reverse of codes_workload_get_next().
 * NOTE(review): op is presumably the operation that the matching
 * codes_workload_get_next() call produced -- confirm with the implementation.
 */
void codes_workload_get_next_rc(
        int wkld_id,
        int app_id,
        int rank,
        const struct codes_workload_op *op);

/* Another version of reverse handler; unlike codes_workload_get_next_rc it
 * takes no operation argument. */
void codes_workload_get_next_rc2(
                int wkld_id,
                int app_id,
                int rank);

/* Retrieve the number of ranks contained in a workload */
int codes_workload_get_rank_cnt(
        const char* type,
        const char* params,
        int app_id);

/* for debugging/logging: print an individual operation to the specified file */
void codes_workload_print_op(
        FILE *f,
        struct codes_workload_op *op,
        int app_id,
        int rank);

313
314
315
316
317
318
319
320
321
/* implementation structure */
struct codes_workload_method
{
    char *method_name; /* name of the generator */
    void * (*codes_workload_read_config) (
            ConfigHandle *handle, char const * section_name,
            char const * annotation, int num_ranks);
    int (*codes_workload_load)(const char* params, int app_id, int rank);
    void (*codes_workload_get_next)(int app_id, int rank, struct codes_workload_op *op);
322
    void (*codes_workload_get_next_rc2)(int app_id, int rank);
323
324
325
    int (*codes_workload_get_rank_cnt)(const char* params, int app_id);
};

326

/* dynamically add to the workload implementation table. Must be done BEFORE
 * calls to codes_workload_read_config or codes_workload_load */
void codes_workload_add_method(struct codes_workload_method const * method);

/* NOTE: there is deliberately no finalize function; we don't have any
 * reliable way to tell when a workload is truly done and will not
 * participate in further reverse computation.   The underlying generators
 * will shut down automatically once they have issued their last event.
 */

/* close the extern "C" block opened at the top of this header */
#ifdef __cplusplus
}
#endif

#endif /* CODES_WORKLOAD_H */

/*
 * Local variables:
 *  c-indent-level: 4
 *  c-basic-offset: 4
 *  indent-tabs-mode: nil
 * End:
 *
 * vim: ft=c ts=8 sts=4 sw=4 expandtab
 */