margo-regression.qsub 2.47 KB
Newer Older
Philip Carns's avatar
Philip Carns committed
1
2
#!/bin/bash
#COBALT -n 2
3
#COBALT -t 20
Philip Carns's avatar
Philip Carns committed
4
5
6
#COBALT --mode script
#COBALT -A radix-io
#COBALT -q debug-flat-quad
7
#COBALT -M carns@mcs.anl.gov
Philip Carns's avatar
Philip Carns committed
8

9
10
11
# XXX: the xalt module currently eats the '-M' flag that this script passes
#      to mercury-runner, so xalt is unloaded for now.
module unload xalt

12
13
14
15
16
# NOTE: needed as of January 2018 to avoid conflicts between MPI and
#       libfabric GNI provider
# NOTE: this is now set per run with the -e option to aprun instead of
#       being exported here
# export MPICH_GNI_NDREG_ENTRIES=2000

17
echo "## MPI (one way, double the latency for round trip):"
18
19
# MPI baseline measurement, for comparison with the Margo, fi_pingpong and
# mercury-runner measurements taken later in this script.
aprun -n 2 -N 1 ./osu_latency

20
21
22
23
24
25
26
27
# Margo over OFI/GNI: one round-trip latency run followed by two bandwidth
# runs that differ only in their -c value (1 and 8; presumably the
# concurrency level, going by the "8x concurrency" label).
# All three runs share the same aprun options and transport address, so
# those are spelled out once here.
gni_launch=(aprun -e MPICH_GNI_NDREG_ENTRIES=2000 -n 2 -N 1)
gni_addr='ofi+gni://ipogif0:5000'

echo "## Margo OFI/GNI (round trip, busy spin):"
"${gni_launch[@]}" ./margo-p2p-latency -i 100000 -n "$gni_addr" -t 0,0

echo "## Margo OFI/GNI (bw, busy spin):"
"${gni_launch[@]}" ./margo-p2p-bw -x 1048576 -n "$gni_addr" -c 1 -D 20 -t 0,0

echo "## Margo OFI/GNI (bw, 8x concurrency, busy spin):"
"${gni_launch[@]}" ./margo-p2p-bw -x 1048576 -n "$gni_addr" -c 8 -D 20 -t 0,0


28
echo "## Margo BMI/TCP (round trip):"
29
30
31
32
33
34
# Margo over BMI/TCP: a round-trip latency run, then bandwidth runs with
# -c 1 and -c 8. The aprun options and transport address common to all
# three runs are spelled out once here.
tcp_launch=(aprun -e MPICH_GNI_NDREG_ENTRIES=2000 -n 2 -N 1)
tcp_addr='bmi+tcp://'

"${tcp_launch[@]}" ./margo-p2p-latency -i 100000 -n "$tcp_addr"

echo "## Margo BMI/TCP (bw):"
"${tcp_launch[@]}" ./margo-p2p-bw -x 1048576 -n "$tcp_addr" -c 1 -D 20

echo "## Margo BMI/TCP (bw, 8x concurrency):"
"${tcp_launch[@]}" ./margo-p2p-bw -x 1048576 -n "$tcp_addr" -c 8 -D 20

35
# echo "## WARNING: Margo OFI/TCP (disabled because it hangs as of 8/10/2017)"
36
# aprun -n 2 -N 1 ./margo-p2p-latency -i 100000 -n ofi+tcp://ipogif0:5000
Philip Carns's avatar
Philip Carns committed
37

38

Philip Carns's avatar
Philip Carns committed
39
# figure out nodes and hostnames for use with fi_pingpong
40
# Collect the node ids for this job from the helper script; its output is
# split on whitespace, one array element per word. The fi_pingpong runs
# later in this script place the server on nodes[0] and the client on
# nodes[1], so at least two entries are required.
declare -a nodes=($(python /home/carns/bin/run_on_all_nids.py))
if (( ${#nodes[@]} < 2 )); then
    # Do not abort: the remaining benchmarks in this script do not use the
    # node list. Just make the problem visible in the job's error output.
    echo "## WARNING: expected at least 2 node ids but got ${#nodes[@]}; fi_pingpong results will not be valid" >&2
fi
Philip Carns's avatar
Philip Carns committed
41
42
# Build the server's hostname ("nid" followed by the node id zero-padded to
# five digits) from the first node id.
# The 10# prefix forces base-10 evaluation so that an id which already
# carries leading zeros (e.g. 00089) is not parsed as octal by printf's %d.
# An empty or unset id falls back to 0, which yields nid00000.
printf -v server_hostname 'nid%05d' "$(( 10#${nodes[0]:-0} ))"

43
echo "## fi_pingpong OFI/GNI (one way, double the usec/xfer for round trip):"
Philip Carns's avatar
Philip Carns committed
44
# Launch the fi_pingpong server side in the background on the first node,
# capturing its output in a per-job log file. The expansions are quoted so
# that an empty node id cannot make -L consume the following -b option as
# its argument.
aprun -n 1 -N 1 -L "${nodes[0]}" -b -p carns-test ./fi_pingpong -p gni -S 1 -I 10000 > "${COBALT_JOBID}.fi_pingpong_server.log" &
Philip Carns's avatar
Philip Carns committed
45
# Pause between launching the backgrounded fi_pingpong server and starting
# the client -- presumably to give the server time to come up first.
sleep 5
Philip Carns's avatar
Philip Carns committed
46
47
48
49
# Launch the fi_pingpong client in the background on the second node,
# pointing it at the server's hostname and capturing its output in a
# per-job log file. Expansions are quoted so an empty value cannot shift
# the remaining arguments.
aprun -n 1 -N 1 -L "${nodes[1]}" -b -p carns-test ./fi_pingpong -p gni -S 1 -I 10000 "$server_hostname" > "${COBALT_JOBID}.fi_pingpong_client.log" &

# Block until all backgrounded jobs have finished, then print the client's
# log so its results appear in the job output.
wait
cat "${COBALT_JOBID}.fi_pingpong_client.log"
Philip Carns's avatar
Philip Carns committed
50
51

# one more margo run, this time with diagnostics enabled
52
53
# echo "## Margo OFI/GNI (round trip) with diagnostics:"
# aprun -n 2 -N 1 ./margo-p2p-latency -i 100000 -n ofi+gni://ipogif0:5000 -d $COBALT_JOBID.diag
Philip Carns's avatar
Philip Carns committed
54

55
echo "## Mercury-runner OFI/GNI (round trip):"
56
# mercury-runner round-trip measurement over OFI/GNI. The -d argument is the
# current working directory; it is quoted so that a path containing
# whitespace is still passed as a single argument.
aprun -e MPICH_GNI_NDREG_ENTRIES=2000 -n 2 -N 1 ./mercury-runner -q -c 100000 -l 1 -m c -M -d "$(pwd)" 1 h0=ofi+gni://ipogif0:5000 h1