tests: add 'postk_master' branch tests
Change-Id: Ie0d4cfd0921aed89d2db6083c9eb068b1cfc1984
This commit is contained in:
@@ -1,508 +1,424 @@
|
||||
#include <sys/types.h>
|
||||
#include <sys/stat.h>
|
||||
#include <fcntl.h>
|
||||
#include <time.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
#include <stdint.h>
|
||||
#include <sys/mman.h>
|
||||
#include <unistd.h>
|
||||
#include <getopt.h>
|
||||
#include <sys/syscall.h> /* For SYS_xxx definitions */
|
||||
#include <sched.h>
|
||||
#include <errno.h>
|
||||
|
||||
#include <psm2.h> /* required for core PSM2 functions */
|
||||
#include <psm2_mq.h> /* required for PSM2 MQ functions (send, recv, etc) */
|
||||
|
||||
//#define DEBUG
|
||||
#ifdef DEBUG
|
||||
#define dprintf printf
|
||||
#else
|
||||
#define dprintf {}
|
||||
#endif
|
||||
|
||||
#define BUFFER_LENGTH /*8000000*/(1ULL<<12)
|
||||
#define CONNECT_ARRAY_SIZE 8
|
||||
void die(char *msg, int rc) {
|
||||
fprintf(stderr, "%s: %d\n", msg, rc);
|
||||
fflush(stderr);
|
||||
}
|
||||
|
||||
#define DIFFNSEC(end, start) ((end.tv_sec - start.tv_sec) * 1000000000UL + (end.tv_nsec - start.tv_nsec))
|
||||
|
||||
static inline void fixed_size_work() {
|
||||
asm volatile(
|
||||
"movq $0, %%rcx\n\t"
|
||||
"1:\t"
|
||||
"addq $1, %%rcx\n\t"
|
||||
"cmpq $99, %%rcx\n\t"
|
||||
"jle 1b\n\t"
|
||||
:
|
||||
:
|
||||
: "rcx", "cc");
|
||||
}
|
||||
|
||||
static inline void bulk_fsw(unsigned long n) {
|
||||
int j;
|
||||
for (j = 0; j < (n); j++) {
|
||||
fixed_size_work();
|
||||
}
|
||||
}
|
||||
|
||||
double nspw; /* nsec per work */
|
||||
unsigned long nsec;
|
||||
|
||||
void fwq_init() {
|
||||
struct timespec start, end;
|
||||
int i;
|
||||
clock_gettime(CLOCK_THREAD_CPUTIME_ID, &start);
|
||||
#define N_INIT 10000000
|
||||
bulk_fsw(N_INIT);
|
||||
clock_gettime(CLOCK_THREAD_CPUTIME_ID, &end);
|
||||
nsec = DIFFNSEC(end, start);
|
||||
nspw = nsec / (double)N_INIT;
|
||||
}
|
||||
|
||||
#if 1
|
||||
void fwq(long delay_nsec) {
|
||||
if (delay_nsec < 0) {
|
||||
return;
|
||||
//printf("%s: delay_nsec < 0\n", __FUNCTION__);
|
||||
}
|
||||
bulk_fsw(delay_nsec / nspw);
|
||||
}
|
||||
#else /* For machines with large core-to-core performance variation (e.g. OFP) */
|
||||
void fwq(long delay_nsec) {
|
||||
struct timespec start, end;
|
||||
clock_gettime(CLOCK_THREAD_CPUTIME_ID, &start);
|
||||
|
||||
while (1) {
|
||||
clock_gettime(CLOCK_THREAD_CPUTIME_ID, &end);
|
||||
if (DIFFNSEC(end, start) >= delay_nsec) {
|
||||
break;
|
||||
}
|
||||
bulk_fsw(2); /* ~150 ns per iteration on FOP */
|
||||
}
|
||||
}
|
||||
#endif
|
||||
|
||||
|
||||
static int print_cpu_last_executed_on() {
|
||||
char fn[256];
|
||||
char* result;
|
||||
pid_t tid = syscall(SYS_gettid);
|
||||
int fd;
|
||||
int offset;
|
||||
int mpi_errno = 0;
|
||||
|
||||
sprintf(fn, "/proc/%d/task/%d/stat", getpid(), (int)tid);
|
||||
//printf("fn=%s\n", fn);
|
||||
fd = open(fn, O_RDONLY);
|
||||
if(fd == -1) {
|
||||
printf("open() failed\n");
|
||||
goto fn_fail;
|
||||
}
|
||||
|
||||
result = malloc(65536);
|
||||
if(result == NULL) {
|
||||
printf("malloc() failed");
|
||||
goto fn_fail;
|
||||
}
|
||||
|
||||
int amount = 0;
|
||||
offset = 0;
|
||||
while(1) {
|
||||
amount = read(fd, result + offset, 65536);
|
||||
// printf("amount=%d\n", amount);
|
||||
if(amount == -1) {
|
||||
printf("read() failed");
|
||||
goto fn_fail;
|
||||
}
|
||||
if(amount == 0) {
|
||||
goto eof;
|
||||
}
|
||||
offset += amount;
|
||||
}
|
||||
eof:;
|
||||
//printf("result:%s\n", result);
|
||||
|
||||
char* next_delim = result;
|
||||
char* field;
|
||||
int i;
|
||||
for(i = 0; i < 39; i++) {
|
||||
field = strsep(&next_delim, " ");
|
||||
}
|
||||
|
||||
int cpu = sched_getcpu();
|
||||
if(cpu == -1) {
|
||||
printf("getpu() failed\n");
|
||||
goto fn_fail;
|
||||
}
|
||||
|
||||
printf("compute thread,pmi_rank=%02d,stat-cpu=%02d,sched_getcpu=%02d,pid=%d,tid=%d\n", atoi(getenv("PMI_RANK")), atoi(field), cpu, getpid(), tid); fflush(stdout);
|
||||
fn_exit:
|
||||
free(result);
|
||||
return mpi_errno;
|
||||
fn_fail:
|
||||
mpi_errno = -1;
|
||||
goto fn_exit;
|
||||
}
|
||||
|
||||
static inline int on_same_node(int ppn, int me, int you) {
|
||||
return (me / ppn == you / ppn);
|
||||
}
|
||||
|
||||
/* Helper functions to find the server's PSM2 endpoint identifier (epid). */
|
||||
psm2_epid_t find_server(int rank) {
|
||||
FILE *fp = NULL;
|
||||
psm2_epid_t server_epid = 0;
|
||||
char fn[256];
|
||||
printf("%s: enter\n", __FUNCTION__); fflush(stdout);
|
||||
|
||||
sprintf(fn, "psm2-demo-server-epid-%d", rank);
|
||||
printf("PSM2 client waiting for epid mapping file to appear...\n"); fflush(stdout);
|
||||
while (!fp) {
|
||||
sleep(1);
|
||||
fp = fopen(fn, "r");
|
||||
}
|
||||
fscanf(fp, "%lx", &server_epid);
|
||||
fclose(fp);
|
||||
printf("PSM2 client found server epid = 0x%lx\n", server_epid);
|
||||
return server_epid;
|
||||
}
|
||||
|
||||
void write_epid_to_file(int rank, psm2_epid_t myepid) {
|
||||
FILE *fp;
|
||||
char fn[256];
|
||||
printf("%s: enter\n", __FUNCTION__);
|
||||
sprintf(fn, "psm2-demo-server-epid-%d", rank);
|
||||
fp = fopen(fn, "w");
|
||||
if (!fp) {
|
||||
fprintf(stderr,
|
||||
"Exiting, couldn't write server's epid mapping file: ");
|
||||
die(strerror(errno), errno);
|
||||
}
|
||||
fprintf(fp, "0x%lx", myepid);
|
||||
fclose(fp);
|
||||
printf("PSM2 server wrote epid = 0x%lx to file.\n", myepid);
|
||||
return;
|
||||
}
|
||||
|
||||
psm2_uuid_t uuid;
|
||||
psm2_ep_t myep;
|
||||
psm2_epid_t myepid;
|
||||
psm2_epid_t server_epid;
|
||||
psm2_epid_t epid_array[CONNECT_ARRAY_SIZE];
|
||||
int epid_array_mask[CONNECT_ARRAY_SIZE];
|
||||
psm2_error_t epid_connect_errors[CONNECT_ARRAY_SIZE];
|
||||
psm2_epaddr_t epaddr_array[CONNECT_ARRAY_SIZE];
|
||||
|
||||
int my_psm2_init(int my_rank, int server_rank) {
|
||||
struct psm2_ep_open_opts o;
|
||||
int rc;
|
||||
int ver_major = PSM2_VERNO_MAJOR;
|
||||
int ver_minor = PSM2_VERNO_MINOR;
|
||||
|
||||
printf("%s: my_rank=%d,server_rank=%d\n", __FUNCTION__, my_rank, server_rank); fflush(stdout);
|
||||
memset(uuid, 0, sizeof(psm2_uuid_t)); /* Use a UUID of zero */
|
||||
/* Try to initialize PSM2 with the requested library version.
|
||||
* * In this example, given the use of the PSM2_VERNO_MAJOR and MINOR
|
||||
* * as defined in the PSM2 headers, ensure that we are linking with
|
||||
* * the same version of PSM2 as we compiled against. */
|
||||
|
||||
if ((rc = psm2_init(&ver_major, &ver_minor)) != PSM2_OK) {
|
||||
die("couldn't init", rc);
|
||||
}
|
||||
printf("PSM2 init done.\n");
|
||||
/* Setup the endpoint options struct */
|
||||
if ((rc = psm2_ep_open_opts_get_defaults(&o)) != PSM2_OK) {
|
||||
die("couldn't set default opts", rc);
|
||||
}
|
||||
printf("PSM2 opts_get_defaults done.\n");
|
||||
/* Attempt to open a PSM2 endpoint. This allocates hardware resources. */
|
||||
if ((rc = psm2_ep_open(uuid, &o, &myep, &myepid)) != PSM2_OK) {
|
||||
die("couldn't psm2_ep_open()", rc);
|
||||
}
|
||||
printf("PSM2 endpoint open done.\n");
|
||||
|
||||
return 0;
|
||||
}
|
||||
int my_psm2_connect(int my_rank, int server_rank) {
|
||||
int rc;
|
||||
int is_server = (my_rank == server_rank) ? 1 : 0;
|
||||
printf("%s: my_rank=%d,server_rank=%d\n", __FUNCTION__, my_rank, server_rank); fflush(stdout);
|
||||
if (is_server) {
|
||||
write_epid_to_file(my_rank, myepid);
|
||||
} else {
|
||||
server_epid = find_server(server_rank);
|
||||
}
|
||||
printf("%s: epid exchange done\n", __FUNCTION__); fflush(stdout);
|
||||
if (is_server) {
|
||||
/* Server does nothing here. A connection does not have to be
|
||||
* * established to receive messages. */
|
||||
printf("PSM2 server up.\n");
|
||||
} else {
|
||||
/* Setup connection request info */
|
||||
/* PSM2 can connect to a single epid per request,
|
||||
* * or an arbitrary number of epids in a single connect call.
|
||||
* * For this example, use part of an array of
|
||||
* * connection requests. */
|
||||
memset(epid_array_mask, 0, sizeof(int) * CONNECT_ARRAY_SIZE);
|
||||
epid_array[0] = server_epid;
|
||||
epid_array_mask[0] = 1;
|
||||
/* Begin the connection process.
|
||||
* * note that if a requested epid is not responding,
|
||||
* * the connect call will still return OK.
|
||||
* * The errors array will contain the state of individual
|
||||
* * connection requests. */
|
||||
if ((rc = psm2_ep_connect(myep,
|
||||
CONNECT_ARRAY_SIZE,
|
||||
epid_array,
|
||||
epid_array_mask,
|
||||
epid_connect_errors,
|
||||
epaddr_array,
|
||||
0 /* no timeout */
|
||||
)) != PSM2_OK) {
|
||||
die("couldn't ep_connect", rc);
|
||||
return -1;
|
||||
}
|
||||
printf("PSM2 connect request processed.\n");
|
||||
/* Now check if our connection to the server is ready */
|
||||
if (epid_connect_errors[0] != PSM2_OK) {
|
||||
die("couldn't connect to server", epid_connect_errors[0]);
|
||||
return -1;
|
||||
}
|
||||
printf("PSM2 client-server connection established.\n");
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
char msgbuf[BUFFER_LENGTH];
|
||||
|
||||
int my_psm2_sendrecv(int rank, int sender, int receiver) {
|
||||
int is_server = (rank == receiver) ? 1 : 0;
|
||||
int rc;
|
||||
psm2_mq_t q;
|
||||
psm2_mq_req_t req_mq;
|
||||
//char msgbuf[BUFFER_LENGTH];
|
||||
|
||||
register long rsp asm ("rsp");
|
||||
printf("rsp=%lx.msgbuf=%p\n", rsp, msgbuf); fflush(stdout);
|
||||
|
||||
memset(msgbuf, 0, BUFFER_LENGTH);
|
||||
|
||||
/* Setup our PSM2 message queue */
|
||||
if ((rc = psm2_mq_init(myep, PSM2_MQ_ORDERMASK_NONE, NULL, 0, &q))
|
||||
!= PSM2_OK) {
|
||||
die("couldn't initialize PSM2 MQ", rc);
|
||||
}
|
||||
printf("PSM2 MQ init done.\n");
|
||||
if (is_server) {
|
||||
psm2_mq_tag_t t = {0xABCD};
|
||||
psm2_mq_tag_t tm = {-1};
|
||||
/* Post the receive request */
|
||||
if ((rc = psm2_mq_irecv2(q, PSM2_MQ_ANY_ADDR,
|
||||
&t, /* message tag */
|
||||
&tm, /* message tag mask */
|
||||
0, /* no flags */
|
||||
msgbuf, BUFFER_LENGTH,
|
||||
NULL, /* no context to add */
|
||||
&req_mq /* track irecv status */
|
||||
)) != PSM2_OK) {
|
||||
die("couldn't post psm2_mq_irecv()", rc);
|
||||
}
|
||||
printf("PSM2 MQ irecv() posted\n");
|
||||
/* Wait until the message arrives */
|
||||
if ((rc = psm2_mq_wait(&req_mq, NULL)) != PSM2_OK) {
|
||||
die("couldn't wait for the irecv", rc);
|
||||
}
|
||||
printf("PSM2 MQ wait() done.\n");
|
||||
printf("Message from client:\n");
|
||||
printf("%s", msgbuf);
|
||||
|
||||
if (is_server) {
|
||||
char fn[256];
|
||||
sprintf(fn, "psm2-demo-server-epid-%d", rank);
|
||||
unlink(fn);
|
||||
}
|
||||
} else {
|
||||
/* Say hello */
|
||||
snprintf(msgbuf, BUFFER_LENGTH,
|
||||
"Hello world from epid=0x%lx, pid=%d.\n",
|
||||
myepid, getpid());
|
||||
psm2_mq_tag_t t = {0xABCD};
|
||||
if ((rc = psm2_mq_send2(q,
|
||||
epaddr_array[0], /* destination epaddr */
|
||||
PSM2_MQ_FLAG_SENDSYNC, /* no flags */
|
||||
&t, /* tag */
|
||||
msgbuf, BUFFER_LENGTH
|
||||
)) != PSM2_OK) {
|
||||
die("couldn't post psm2_mq_isend", rc);
|
||||
}
|
||||
printf("PSM2 MQ send() done.\n");
|
||||
}
|
||||
/* Close down the MQ */
|
||||
if ((rc = psm2_mq_finalize(q)) != PSM2_OK) {
|
||||
die("couldn't psm2_mq_finalize()", rc);
|
||||
}
|
||||
printf("PSM2 MQ finalized.\n");
|
||||
/* Close our ep, releasing all hardware resources.
|
||||
* * Try to close all connections properly */
|
||||
if ((rc = psm2_ep_close(myep, PSM2_EP_CLOSE_GRACEFUL,
|
||||
0 /* no timeout */)) != PSM2_OK) {
|
||||
die("couldn't psm2_ep_close()", rc);
|
||||
}
|
||||
printf("PSM2 ep closed.\n");
|
||||
/* Release all local PSM2 resources */
|
||||
if ((rc = psm2_finalize()) != PSM2_OK) {
|
||||
die("couldn't psm2_finalize()", rc);
|
||||
}
|
||||
printf("PSM2 shut down, exiting.\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
static struct option options[] = {
|
||||
{
|
||||
.name = "ppn",
|
||||
.has_arg = required_argument,
|
||||
.flag = NULL,
|
||||
.val = 'P',
|
||||
},
|
||||
/* end */
|
||||
{ NULL, 0, NULL, 0, },
|
||||
};
|
||||
|
||||
struct thr_arg {
|
||||
pthread_barrier_t bar;
|
||||
pthread_t pthread;
|
||||
int rank;
|
||||
int ppn;
|
||||
int nproc;
|
||||
int server_rank;
|
||||
};
|
||||
|
||||
struct thr_arg thr_arg;
|
||||
|
||||
void *progress_fn(void *arg) {
|
||||
struct thr_arg *thr_arg = (struct thr_arg *)arg;
|
||||
int rc;
|
||||
int i;
|
||||
|
||||
rc = syscall(732);
|
||||
if (rc == -1)
|
||||
fprintf(stdout, "CT09100 progress_fn running on Linux OK\n");
|
||||
else {
|
||||
fprintf(stdout, "CT09100 progress_fn running on McKernel NG (%d)\n", rc);
|
||||
}
|
||||
|
||||
printf("progress,enter\n");
|
||||
|
||||
pthread_barrier_wait(&thr_arg->bar);
|
||||
|
||||
pthread_barrier_wait(&thr_arg->bar);
|
||||
|
||||
|
||||
printf("progress,exit\n");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
int main(int argc, char **argv) {
|
||||
int rc;
|
||||
int actual;
|
||||
int nproc;
|
||||
int ppn = -1;
|
||||
int my_rank = -1, size = -1;
|
||||
int i, j;
|
||||
struct timespec start, end;
|
||||
long t_pure_l, t_overall_l;
|
||||
long t_pure, t_overall;
|
||||
int opt;
|
||||
pthread_barrierattr_t barrierattr;
|
||||
|
||||
fwq_init();
|
||||
|
||||
while ((opt = getopt_long(argc, argv, "+P:", options, NULL)) != -1) {
|
||||
switch (opt) {
|
||||
case 'P':
|
||||
ppn = atoi(optarg);
|
||||
break;
|
||||
default: /* '?' */
|
||||
printf("unknown option %c\n", optopt);
|
||||
exit(1);
|
||||
}
|
||||
}
|
||||
|
||||
if (ppn == -1) {
|
||||
printf("specify ppn with --ppn");
|
||||
exit(1);
|
||||
}
|
||||
|
||||
char *rank_str = getenv("PMI_RANK");
|
||||
if (!rank_str) {
|
||||
printf("getenv failed\n");
|
||||
exit(1);
|
||||
}
|
||||
my_rank = atoi(rank_str);
|
||||
printf("my_rank=%d\n", my_rank); fflush(stdout);
|
||||
|
||||
nproc = 2;
|
||||
|
||||
if (my_rank == 0) {
|
||||
printf("tid=%d,pid=%d,nproc=%d\n", syscall(__NR_gettid), getpid(), nproc);
|
||||
printf("nsec=%ld, nspw=%f\n", nsec, nspw);
|
||||
}
|
||||
|
||||
|
||||
/* Spawn a thread */
|
||||
thr_arg.rank = my_rank;
|
||||
thr_arg.ppn = ppn;
|
||||
thr_arg.nproc = nproc;
|
||||
thr_arg.server_rank = ppn + (my_rank % ppn);
|
||||
|
||||
pthread_barrierattr_init(&barrierattr);
|
||||
pthread_barrier_init(&thr_arg.bar, &barrierattr, nproc);
|
||||
|
||||
char *uti_str = getenv("DISABLE_UTI");
|
||||
int uti_val = uti_str ? atoi(uti_str) : 0;
|
||||
if (!uti_val) {
|
||||
rc = syscall(731, 1, NULL);
|
||||
if (rc) {
|
||||
fprintf(stdout, "CT09003 INFO: uti not available (rc=%d)\n", rc);
|
||||
} else {
|
||||
fprintf(stdout, "CT09003 INFO: uti available\n");
|
||||
}
|
||||
} else {
|
||||
fprintf(stdout, "CT09003 INFO: uti disabled\n");
|
||||
}
|
||||
|
||||
rc = pthread_create(&thr_arg.pthread, NULL, progress_fn, &thr_arg);
|
||||
if (rc){
|
||||
fprintf(stdout, "pthread_create: %d\n", rc);
|
||||
exit(1);
|
||||
}
|
||||
|
||||
pthread_barrier_wait(&thr_arg.bar);
|
||||
|
||||
my_psm2_init(thr_arg.rank, thr_arg.server_rank);
|
||||
my_psm2_connect(thr_arg.rank, thr_arg.server_rank);
|
||||
|
||||
for (i = 0; i < thr_arg.nproc; i++) {
|
||||
if (!on_same_node(thr_arg.ppn, thr_arg.rank, i)) {
|
||||
if (thr_arg.rank < i) {
|
||||
my_psm2_sendrecv(thr_arg.rank, thr_arg.rank, i);
|
||||
} else {
|
||||
my_psm2_sendrecv(thr_arg.rank, i, thr_arg.rank);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
pthread_barrier_wait(&thr_arg.bar);
|
||||
|
||||
pthread_join(thr_arg.pthread, NULL);
|
||||
|
||||
fn_exit:
|
||||
return 0;
|
||||
fn_fail:
|
||||
goto fn_exit;
|
||||
}
|
||||
#include <sys/types.h>
|
||||
#include <sys/stat.h>
|
||||
#include <fcntl.h>
|
||||
#include <time.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
#include <stdint.h>
|
||||
#include <sys/mman.h>
|
||||
#include <unistd.h>
|
||||
#include <getopt.h>
|
||||
#include <sys/syscall.h> /* For SYS_xxx definitions */
|
||||
#include <sched.h>
|
||||
#include <errno.h>
|
||||
#include <psm2.h> /* required for core PSM2 functions */
|
||||
#include <psm2_mq.h> /* required for PSM2 MQ functions (send, recv, etc) */
|
||||
#include "util.h"
|
||||
#include "fwq.h"
|
||||
|
||||
//#define DEBUG
|
||||
#ifdef DEBUG
|
||||
#define dprintf printf
|
||||
#else
|
||||
#define dprintf {}
|
||||
#endif
|
||||
|
||||
#define BUFFER_LENGTH /*8000000*/(1ULL<<12)
|
||||
#define CONNECT_ARRAY_SIZE 8
|
||||
void die(char *msg, int rc)
|
||||
{
|
||||
fprintf(stderr, "%s: %d\n", msg, rc);
|
||||
fflush(stderr);
|
||||
}
|
||||
|
||||
static inline int on_same_node(int ppn, int me, int you)
|
||||
{
|
||||
return (me / ppn == you / ppn);
|
||||
}
|
||||
|
||||
/* Helper functions to find the server's PSM2 endpoint identifier (epid). */
|
||||
psm2_epid_t find_server(int rank)
|
||||
{
|
||||
FILE *fp = NULL;
|
||||
psm2_epid_t server_epid = 0;
|
||||
char fn[256];
|
||||
|
||||
printf("%s: enter\n", __func__); fflush(stdout);
|
||||
|
||||
sprintf(fn, "psm2-demo-server-epid-%d", rank);
|
||||
printf("PSM2 client waiting for epid mapping file to appear...\n");
|
||||
fflush(stdout);
|
||||
|
||||
while (!fp) {
|
||||
sleep(1);
|
||||
fp = fopen(fn, "r");
|
||||
}
|
||||
fscanf(fp, "%lx", &server_epid);
|
||||
fclose(fp);
|
||||
printf("PSM2 client found server epid = 0x%lx\n", server_epid);
|
||||
return server_epid;
|
||||
}
|
||||
|
||||
void write_epid_to_file(int rank, psm2_epid_t myepid)
|
||||
{
|
||||
FILE *fp;
|
||||
char fn[256];
|
||||
|
||||
printf("%s: enter\n", __func__);
|
||||
sprintf(fn, "psm2-demo-server-epid-%d", rank);
|
||||
fp = fopen(fn, "w");
|
||||
if (!fp) {
|
||||
fprintf(stderr,
|
||||
"Exiting, couldn't write server's epid mapping file: ");
|
||||
die(strerror(errno), errno);
|
||||
}
|
||||
fprintf(fp, "0x%lx", myepid);
|
||||
fclose(fp);
|
||||
printf("PSM2 server wrote epid = 0x%lx to file.\n", myepid);
|
||||
}
|
||||
|
||||
psm2_uuid_t uuid;
|
||||
psm2_ep_t myep;
|
||||
psm2_epid_t myepid;
|
||||
psm2_epid_t server_epid;
|
||||
psm2_epid_t epid_array[CONNECT_ARRAY_SIZE];
|
||||
int epid_array_mask[CONNECT_ARRAY_SIZE];
|
||||
psm2_error_t epid_connect_errors[CONNECT_ARRAY_SIZE];
|
||||
psm2_epaddr_t epaddr_array[CONNECT_ARRAY_SIZE];
|
||||
|
||||
int my_psm2_init(int my_rank, int server_rank)
|
||||
{
|
||||
struct psm2_ep_open_opts o;
|
||||
int rc;
|
||||
int ver_major = PSM2_VERNO_MAJOR;
|
||||
int ver_minor = PSM2_VERNO_MINOR;
|
||||
|
||||
printf("%s: my_rank=%d,server_rank=%d\n",
|
||||
__func__, my_rank, server_rank);
|
||||
fflush(stdout);
|
||||
memset(uuid, 0, sizeof(psm2_uuid_t)); /* Use a UUID of zero */
|
||||
/* Try to initialize PSM2 with the requested library version.
|
||||
* In this example, given the use of the PSM2_VERNO_MAJOR and MINOR
|
||||
* as defined in the PSM2 headers, ensure that we are linking with
|
||||
* the same version of PSM2 as we compiled against.
|
||||
*/
|
||||
|
||||
if ((rc = psm2_init(&ver_major, &ver_minor)) != PSM2_OK) {
|
||||
die("couldn't init", rc);
|
||||
}
|
||||
printf("PSM2 init done.\n");
|
||||
/* Setup the endpoint options struct */
|
||||
if ((rc = psm2_ep_open_opts_get_defaults(&o)) != PSM2_OK) {
|
||||
die("couldn't set default opts", rc);
|
||||
}
|
||||
printf("PSM2 opts_get_defaults done.\n");
|
||||
/* Attempt to open a PSM2 endpoint. This allocates hardware resources.
|
||||
*/
|
||||
if ((rc = psm2_ep_open(uuid, &o, &myep, &myepid)) != PSM2_OK) {
|
||||
die("couldn't psm2_ep_open()", rc);
|
||||
}
|
||||
printf("PSM2 endpoint open done.\n");
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
int my_psm2_connect(int my_rank, int server_rank)
|
||||
{
|
||||
int rc;
|
||||
int is_server = (my_rank == server_rank) ? 1 : 0;
|
||||
|
||||
printf("%s: my_rank=%d,server_rank=%d\n",
|
||||
__func__, my_rank, server_rank);
|
||||
fflush(stdout);
|
||||
if (is_server) {
|
||||
write_epid_to_file(my_rank, myepid);
|
||||
} else {
|
||||
server_epid = find_server(server_rank);
|
||||
}
|
||||
printf("%s: epid exchange done\n", __func__);
|
||||
fflush(stdout);
|
||||
if (is_server) {
|
||||
/* Server does nothing here. A connection does not have to be
|
||||
* established to receive messages.
|
||||
*/
|
||||
printf("PSM2 server up.\n");
|
||||
} else {
|
||||
/* Setup connection request info */
|
||||
/* PSM2 can connect to a single epid per request,
|
||||
* or an arbitrary number of epids in a single connect call.
|
||||
* For this example, use part of an array of
|
||||
* connection requests.
|
||||
*/
|
||||
memset(epid_array_mask, 0, sizeof(int) * CONNECT_ARRAY_SIZE);
|
||||
epid_array[0] = server_epid;
|
||||
epid_array_mask[0] = 1;
|
||||
/* Begin the connection process.
|
||||
* note that if a requested epid is not responding,
|
||||
* the connect call will still return OK.
|
||||
* The errors array will contain the state of individual
|
||||
* connection requests.
|
||||
*/
|
||||
if ((rc = psm2_ep_connect(myep,
|
||||
CONNECT_ARRAY_SIZE,
|
||||
epid_array,
|
||||
epid_array_mask,
|
||||
epid_connect_errors,
|
||||
epaddr_array,
|
||||
0 /* no timeout */
|
||||
)) != PSM2_OK) {
|
||||
die("couldn't ep_connect", rc);
|
||||
return -1;
|
||||
}
|
||||
printf("PSM2 connect request processed.\n");
|
||||
/* Now check if our connection to the server is ready */
|
||||
if (epid_connect_errors[0] != PSM2_OK) {
|
||||
die("couldn't connect to server",
|
||||
epid_connect_errors[0]);
|
||||
return -1;
|
||||
}
|
||||
printf("PSM2 client-server connection established.\n");
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
char msgbuf[BUFFER_LENGTH];
|
||||
|
||||
int my_psm2_sendrecv(int rank, int sender, int receiver)
|
||||
{
|
||||
int is_server = (rank == receiver) ? 1 : 0;
|
||||
int rc;
|
||||
psm2_mq_t q;
|
||||
psm2_mq_req_t req_mq;
|
||||
//char msgbuf[BUFFER_LENGTH];
|
||||
|
||||
register long rsp asm ("rsp");
|
||||
printf("rsp=%lx.msgbuf=%p\n", rsp, msgbuf); fflush(stdout);
|
||||
|
||||
memset(msgbuf, 0, BUFFER_LENGTH);
|
||||
|
||||
/* Setup our PSM2 message queue */
|
||||
if ((rc = psm2_mq_init(myep, PSM2_MQ_ORDERMASK_NONE, NULL, 0, &q))
|
||||
!= PSM2_OK) {
|
||||
die("couldn't initialize PSM2 MQ", rc);
|
||||
}
|
||||
printf("PSM2 MQ init done.\n");
|
||||
if (is_server) {
|
||||
psm2_mq_tag_t t = {0xABCD};
|
||||
psm2_mq_tag_t tm = {-1};
|
||||
/* Post the receive request */
|
||||
if ((rc = psm2_mq_irecv2(q, PSM2_MQ_ANY_ADDR,
|
||||
&t, /* message tag */
|
||||
&tm, /* message tag mask */
|
||||
0, /* no flags */
|
||||
msgbuf, BUFFER_LENGTH,
|
||||
NULL, /* no context to add */
|
||||
&req_mq /* track irecv status */
|
||||
)) != PSM2_OK) {
|
||||
die("couldn't post psm2_mq_irecv()", rc);
|
||||
}
|
||||
printf("PSM2 MQ irecv() posted\n");
|
||||
/* Wait until the message arrives */
|
||||
if ((rc = psm2_mq_wait(&req_mq, NULL)) != PSM2_OK) {
|
||||
die("couldn't wait for the irecv", rc);
|
||||
}
|
||||
printf("PSM2 MQ wait() done.\n");
|
||||
printf("Message from client:\n");
|
||||
printf("%s", msgbuf);
|
||||
|
||||
if (is_server) {
|
||||
char fn[256];
|
||||
|
||||
sprintf(fn, "psm2-demo-server-epid-%d", rank);
|
||||
unlink(fn);
|
||||
}
|
||||
} else {
|
||||
/* Say hello */
|
||||
snprintf(msgbuf, BUFFER_LENGTH,
|
||||
"Hello world from epid=0x%lx, pid=%d.\n",
|
||||
myepid, getpid());
|
||||
psm2_mq_tag_t t = {0xABCD};
|
||||
|
||||
if ((rc = psm2_mq_send2(q,
|
||||
epaddr_array[0], /* destination epaddr */
|
||||
PSM2_MQ_FLAG_SENDSYNC, /* no flags */
|
||||
&t, /* tag */
|
||||
msgbuf, BUFFER_LENGTH
|
||||
)) != PSM2_OK) {
|
||||
die("couldn't post psm2_mq_isend", rc);
|
||||
}
|
||||
printf("PSM2 MQ send() done.\n");
|
||||
}
|
||||
/* Close down the MQ */
|
||||
if ((rc = psm2_mq_finalize(q)) != PSM2_OK) {
|
||||
die("couldn't psm2_mq_finalize()", rc);
|
||||
}
|
||||
printf("PSM2 MQ finalized.\n");
|
||||
/* Close our ep, releasing all hardware resources.
|
||||
* Try to close all connections properly
|
||||
*/
|
||||
if ((rc = psm2_ep_close(myep, PSM2_EP_CLOSE_GRACEFUL,
|
||||
0 /* no timeout */)) != PSM2_OK) {
|
||||
die("couldn't psm2_ep_close()", rc);
|
||||
}
|
||||
printf("PSM2 ep closed.\n");
|
||||
/* Release all local PSM2 resources */
|
||||
if ((rc = psm2_finalize()) != PSM2_OK) {
|
||||
die("couldn't psm2_finalize()", rc);
|
||||
}
|
||||
printf("PSM2 shut down, exiting.\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
static struct option options[] = {
|
||||
{
|
||||
.name = "ppn",
|
||||
.has_arg = required_argument,
|
||||
.flag = NULL,
|
||||
.val = 'P',
|
||||
},
|
||||
/* end */
|
||||
{ NULL, 0, NULL, 0, },
|
||||
};
|
||||
|
||||
struct thr_arg {
|
||||
pthread_barrier_t bar;
|
||||
pthread_t pthread;
|
||||
int rank;
|
||||
int ppn;
|
||||
int nproc;
|
||||
int server_rank;
|
||||
};
|
||||
|
||||
struct thr_arg thr_arg;
|
||||
|
||||
void *progress_fn(void *arg)
|
||||
{
|
||||
struct thr_arg *thr_arg = (struct thr_arg *)arg;
|
||||
int rc;
|
||||
int i;
|
||||
|
||||
rc = syscall(732);
|
||||
if (rc == -1)
|
||||
fprintf(stdout, "CT09100 %s running on Linux OK\n",
|
||||
__func__);
|
||||
else {
|
||||
fprintf(stdout, "CT09100 %s running on McKernel NG (%d)\n",
|
||||
__func__, rc);
|
||||
}
|
||||
|
||||
printf("progress,enter\n");
|
||||
|
||||
pthread_barrier_wait(&thr_arg->bar);
|
||||
|
||||
pthread_barrier_wait(&thr_arg->bar);
|
||||
|
||||
|
||||
printf("progress,exit\n");
|
||||
return NULL;
|
||||
}
|
||||
|
||||
int main(int argc, char **argv)
|
||||
{
|
||||
int rc;
|
||||
int actual;
|
||||
int nproc;
|
||||
int ppn = -1;
|
||||
int my_rank = -1, size = -1;
|
||||
int i, j;
|
||||
struct timespec start, end;
|
||||
long t_pure_l, t_overall_l;
|
||||
long t_pure, t_overall;
|
||||
int opt;
|
||||
pthread_barrierattr_t barrierattr;
|
||||
|
||||
fwq_init();
|
||||
|
||||
while ((opt = getopt_long(argc, argv, "+P:", options, NULL)) != -1) {
|
||||
switch (opt) {
|
||||
case 'P':
|
||||
ppn = atoi(optarg);
|
||||
break;
|
||||
default: /* '?' */
|
||||
printf("unknown option %c\n", optopt);
|
||||
exit(1);
|
||||
}
|
||||
}
|
||||
|
||||
if (ppn == -1) {
|
||||
printf("specify ppn with --ppn");
|
||||
exit(1);
|
||||
}
|
||||
|
||||
char *rank_str = getenv("PMI_RANK");
|
||||
|
||||
if (!rank_str) {
|
||||
printf("getenv failed\n");
|
||||
exit(1);
|
||||
}
|
||||
my_rank = atoi(rank_str);
|
||||
printf("my_rank=%d\n", my_rank); fflush(stdout);
|
||||
|
||||
nproc = 2;
|
||||
|
||||
if (my_rank == 0) {
|
||||
printf("tid=%d,pid=%d,nproc=%d\n",
|
||||
syscall(__NR_gettid), getpid(), nproc);
|
||||
printf("nsec=%ld, nspw=%f\n", nsec, nspw);
|
||||
}
|
||||
|
||||
|
||||
/* Spawn a thread */
|
||||
thr_arg.rank = my_rank;
|
||||
thr_arg.ppn = ppn;
|
||||
thr_arg.nproc = nproc;
|
||||
thr_arg.server_rank = ppn + (my_rank % ppn);
|
||||
|
||||
pthread_barrierattr_init(&barrierattr);
|
||||
pthread_barrier_init(&thr_arg.bar, &barrierattr, nproc);
|
||||
|
||||
char *uti_str = getenv("DISABLE_UTI");
|
||||
int uti_val = uti_str ? atoi(uti_str) : 0;
|
||||
|
||||
if (!uti_val) {
|
||||
rc = syscall(731, 1, NULL);
|
||||
if (rc) {
|
||||
fprintf(stdout,
|
||||
"CT09003 INFO: uti not available (rc=%d)\n",
|
||||
rc);
|
||||
} else {
|
||||
fprintf(stdout, "CT09003 INFO: uti available\n");
|
||||
}
|
||||
} else {
|
||||
fprintf(stdout, "CT09003 INFO: uti disabled\n");
|
||||
}
|
||||
|
||||
rc = pthread_create(&thr_arg.pthread, NULL, progress_fn, &thr_arg);
|
||||
if (rc) {
|
||||
fprintf(stdout, "pthread_create: %d\n", rc);
|
||||
exit(1);
|
||||
}
|
||||
|
||||
pthread_barrier_wait(&thr_arg.bar);
|
||||
|
||||
my_psm2_init(thr_arg.rank, thr_arg.server_rank);
|
||||
my_psm2_connect(thr_arg.rank, thr_arg.server_rank);
|
||||
|
||||
for (i = 0; i < thr_arg.nproc; i++) {
|
||||
if (!on_same_node(thr_arg.ppn, thr_arg.rank, i)) {
|
||||
if (thr_arg.rank < i) {
|
||||
my_psm2_sendrecv(thr_arg.rank, thr_arg.rank, i);
|
||||
} else {
|
||||
my_psm2_sendrecv(thr_arg.rank, i, thr_arg.rank);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
pthread_barrier_wait(&thr_arg.bar);
|
||||
|
||||
pthread_join(thr_arg.pthread, NULL);
|
||||
|
||||
fn_exit:
|
||||
return 0;
|
||||
fn_fail:
|
||||
goto fn_exit;
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user