Logo Search packages:      
Sourcecode: libibverbs version File versions  Download package

ud_pingpong.c

/*
 * Copyright (c) 2005 Topspin Communications.  All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *        copyright notice, this list of conditions and the following
 *        disclaimer in the documentation and/or other materials
 *        provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

#if HAVE_CONFIG_H
#  include <config.h>
#endif /* HAVE_CONFIG_H */

#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <string.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <sys/time.h>
#include <netdb.h>
#include <malloc.h>
#include <getopt.h>
#include <arpa/inet.h>
#include <time.h>

#include "pingpong.h"

enum {
      PINGPONG_RECV_WRID = 1,
      PINGPONG_SEND_WRID = 2,
};

static int page_size;

struct pingpong_context {
      struct ibv_context      *context;
      struct ibv_comp_channel *channel;
      struct ibv_pd           *pd;
      struct ibv_mr           *mr;
      struct ibv_cq           *cq;
      struct ibv_qp           *qp;
      struct ibv_ah           *ah;
      void              *buf;
      int                size;
      int                rx_depth;
      int                pending;
};

struct pingpong_dest {
      int lid;
      int qpn;
      int psn;
};

static int pp_connect_ctx(struct pingpong_context *ctx, int port, int my_psn,
                    struct pingpong_dest *dest)
{
      struct ibv_qp_attr attr;
      struct ibv_ah_attr ah_attr = {
            .is_global     = 0,
            .dlid          = dest->lid,
            .sl            = 0,
            .src_path_bits = 0,
            .port_num      = port
      };

      attr.qp_state           = IBV_QPS_RTR;

      if (ibv_modify_qp(ctx->qp, &attr, IBV_QP_STATE)) {
            fprintf(stderr, "Failed to modify QP to RTR\n");
            return 1;
      }

      attr.qp_state         = IBV_QPS_RTS;
      attr.sq_psn     = my_psn;

      if (ibv_modify_qp(ctx->qp, &attr,
                    IBV_QP_STATE              |
                    IBV_QP_SQ_PSN)) {
            fprintf(stderr, "Failed to modify QP to RTS\n");
            return 1;
      }

      ctx->ah = ibv_create_ah(ctx->pd, &ah_attr);
      if (!ctx->ah) {
            fprintf(stderr, "Failed to create AH\n");
            return 1;
      }

      return 0;
}

static struct pingpong_dest *pp_client_exch_dest(const char *servername, int port,
                                     const struct pingpong_dest *my_dest)
{
      struct addrinfo *res, *t;
      struct addrinfo hints = {
            .ai_family   = AF_UNSPEC,
            .ai_socktype = SOCK_STREAM
      };
      char *service;
      char msg[sizeof "0000:000000:000000"];
      int n;
      int sockfd = -1;
      struct pingpong_dest *rem_dest = NULL;

      if (asprintf(&service, "%d", port) < 0)
            return NULL;

      n = getaddrinfo(servername, service, &hints, &res);

      if (n < 0) {
            fprintf(stderr, "%s for %s:%d\n", gai_strerror(n), servername, port);
            return NULL;
      }

      for (t = res; t; t = t->ai_next) {
            sockfd = socket(t->ai_family, t->ai_socktype, t->ai_protocol);
            if (sockfd >= 0) {
                  if (!connect(sockfd, t->ai_addr, t->ai_addrlen))
                        break;
                  close(sockfd);
                  sockfd = -1;
            }
      }

      freeaddrinfo(res);

      if (sockfd < 0) {
            fprintf(stderr, "Couldn't connect to %s:%d\n", servername, port);
            return NULL;
      }

      sprintf(msg, "%04x:%06x:%06x", my_dest->lid, my_dest->qpn, my_dest->psn);
      if (write(sockfd, msg, sizeof msg) != sizeof msg) {
            fprintf(stderr, "Couldn't send local address\n");
            goto out;
      }

      if (read(sockfd, msg, sizeof msg) != sizeof msg) {
            perror("client read");
            fprintf(stderr, "Couldn't read remote address\n");
            goto out;
      }

      write(sockfd, "done", sizeof "done");

      rem_dest = malloc(sizeof *rem_dest);
      if (!rem_dest)
            goto out;

      sscanf(msg, "%x:%x:%x", &rem_dest->lid, &rem_dest->qpn, &rem_dest->psn);

out:
      close(sockfd);
      return rem_dest;
}

static struct pingpong_dest *pp_server_exch_dest(struct pingpong_context *ctx,
                                     int ib_port, int port,
                                     const struct pingpong_dest *my_dest)
{
      struct addrinfo *res, *t;
      struct addrinfo hints = {
            .ai_flags    = AI_PASSIVE,
            .ai_family   = AF_UNSPEC,
            .ai_socktype = SOCK_STREAM
      };
      char *service;
      char msg[sizeof "0000:000000:000000"];
      int n;
      int sockfd = -1, connfd;
      struct pingpong_dest *rem_dest = NULL;

      if (asprintf(&service, "%d", port) < 0)
            return NULL;

      n = getaddrinfo(NULL, service, &hints, &res);

      if (n < 0) {
            fprintf(stderr, "%s for port %d\n", gai_strerror(n), port);
            return NULL;
      }

      for (t = res; t; t = t->ai_next) {
            sockfd = socket(t->ai_family, t->ai_socktype, t->ai_protocol);
            if (sockfd >= 0) {
                  n = 1;

                  setsockopt(sockfd, SOL_SOCKET, SO_REUSEADDR, &n, sizeof n);

                  if (!bind(sockfd, t->ai_addr, t->ai_addrlen))
                        break;
                  close(sockfd);
                  sockfd = -1;
            }
      }

      freeaddrinfo(res);

      if (sockfd < 0) {
            fprintf(stderr, "Couldn't listen to port %d\n", port);
            return NULL;
      }

      listen(sockfd, 1);
      connfd = accept(sockfd, NULL, 0);
      close(sockfd);
      if (connfd < 0) {
            fprintf(stderr, "accept() failed\n");
            return NULL;
      }

      n = read(connfd, msg, sizeof msg);
      if (n != sizeof msg) {
            perror("server read");
            fprintf(stderr, "%d/%d: Couldn't read remote address\n", n, (int) sizeof msg);
            goto out;
      }

      rem_dest = malloc(sizeof *rem_dest);
      if (!rem_dest)
            goto out;

      sscanf(msg, "%x:%x:%x", &rem_dest->lid, &rem_dest->qpn, &rem_dest->psn);

      if (pp_connect_ctx(ctx, ib_port, my_dest->psn, rem_dest)) {
            fprintf(stderr, "Couldn't connect to remote QP\n");
            free(rem_dest);
            rem_dest = NULL;
            goto out;
      }

      sprintf(msg, "%04x:%06x:%06x", my_dest->lid, my_dest->qpn, my_dest->psn);
      if (write(connfd, msg, sizeof msg) != sizeof msg) {
            fprintf(stderr, "Couldn't send local address\n");
            free(rem_dest);
            rem_dest = NULL;
            goto out;
      }

      read(connfd, msg, sizeof msg);

out:
      close(connfd);
      return rem_dest;
}

static struct pingpong_context *pp_init_ctx(struct ibv_device *ib_dev, int size,
                                  int rx_depth, int port,
                                  int use_event)
{
      struct pingpong_context *ctx;

      ctx = malloc(sizeof *ctx);
      if (!ctx)
            return NULL;

      ctx->size     = size;
      ctx->rx_depth = rx_depth;

      ctx->buf = memalign(page_size, size + 40);
      if (!ctx->buf) {
            fprintf(stderr, "Couldn't allocate work buf.\n");
            return NULL;
      }

      memset(ctx->buf, 0, size + 40);

      ctx->context = ibv_open_device(ib_dev);
      if (!ctx->context) {
            fprintf(stderr, "Couldn't get context for %s\n",
                  ibv_get_device_name(ib_dev));
            return NULL;
      }

      if (use_event) {
            ctx->channel = ibv_create_comp_channel(ctx->context);
            if (!ctx->channel) {
                  fprintf(stderr, "Couldn't create completion channel\n");
                  return NULL;
            }
      } else
            ctx->channel = NULL;

      ctx->pd = ibv_alloc_pd(ctx->context);
      if (!ctx->pd) {
            fprintf(stderr, "Couldn't allocate PD\n");
            return NULL;
      }

      ctx->mr = ibv_reg_mr(ctx->pd, ctx->buf, size + 40, IBV_ACCESS_LOCAL_WRITE);
      if (!ctx->mr) {
            fprintf(stderr, "Couldn't register MR\n");
            return NULL;
      }

      ctx->cq = ibv_create_cq(ctx->context, rx_depth + 1, NULL,
                        ctx->channel, 0);
      if (!ctx->cq) {
            fprintf(stderr, "Couldn't create CQ\n");
            return NULL;
      }

      {
            struct ibv_qp_init_attr attr = {
                  .send_cq = ctx->cq,
                  .recv_cq = ctx->cq,
                  .cap     = {
                        .max_send_wr  = 1,
                        .max_recv_wr  = rx_depth,
                        .max_send_sge = 1,
                        .max_recv_sge = 1
                  },
                  .qp_type = IBV_QPT_UD,
            };

            ctx->qp = ibv_create_qp(ctx->pd, &attr);
            if (!ctx->qp)  {
                  fprintf(stderr, "Couldn't create QP\n");
                  return NULL;
            }
      }

      {
            struct ibv_qp_attr attr;

            attr.qp_state        = IBV_QPS_INIT;
            attr.pkey_index      = 0;
            attr.port_num        = port;
            attr.qkey            = 0x11111111;

            if (ibv_modify_qp(ctx->qp, &attr,
                          IBV_QP_STATE              |
                          IBV_QP_PKEY_INDEX         |
                          IBV_QP_PORT               |
                          IBV_QP_QKEY)) {
                  fprintf(stderr, "Failed to modify QP to INIT\n");
                  return NULL;
            }
      }

      return ctx;
}

int pp_close_ctx(struct pingpong_context *ctx)
{
      if (ibv_destroy_qp(ctx->qp)) {
            fprintf(stderr, "Couldn't destroy QP\n");
            return 1;
      }

      if (ibv_destroy_cq(ctx->cq)) {
            fprintf(stderr, "Couldn't destroy CQ\n");
            return 1;
      }

      if (ibv_dereg_mr(ctx->mr)) {
            fprintf(stderr, "Couldn't deregister MR\n");
            return 1;
      }

      if (ibv_destroy_ah(ctx->ah)) {
            fprintf(stderr, "Couldn't destroy AH\n");
            return 1;
      }

      if (ibv_dealloc_pd(ctx->pd)) {
            fprintf(stderr, "Couldn't deallocate PD\n");
            return 1;
      }

      if (ctx->channel) {
            if (ibv_destroy_comp_channel(ctx->channel)) {
                  fprintf(stderr, "Couldn't destroy completion channel\n");
                  return 1;
            }
      }

      if (ibv_close_device(ctx->context)) {
            fprintf(stderr, "Couldn't release context\n");
            return 1;
      }

      free(ctx->buf);
      free(ctx);

      return 0;
}

static int pp_post_recv(struct pingpong_context *ctx, int n)
{
      struct ibv_sge list = {
            .addr = (uintptr_t) ctx->buf,
            .length = ctx->size + 40,
            .lkey = ctx->mr->lkey
      };
      struct ibv_recv_wr wr = {
            .wr_id          = PINGPONG_RECV_WRID,
            .sg_list    = &list,
            .num_sge    = 1,
      };
      struct ibv_recv_wr *bad_wr;
      int i;

      for (i = 0; i < n; ++i)
            if (ibv_post_recv(ctx->qp, &wr, &bad_wr))
                  break;

      return i;
}

static int pp_post_send(struct pingpong_context *ctx, uint32_t qpn)
{
      struct ibv_sge list = {
            .addr = (uintptr_t) ctx->buf + 40,
            .length = ctx->size,
            .lkey = ctx->mr->lkey
      };
      struct ibv_send_wr wr = {
            .wr_id          = PINGPONG_SEND_WRID,
            .sg_list    = &list,
            .num_sge    = 1,
            .opcode     = IBV_WR_SEND,
            .send_flags = IBV_SEND_SIGNALED,
            .wr         = {
                  .ud = {
                         .ah          = ctx->ah,
                         .remote_qpn  = qpn,
                         .remote_qkey = 0x11111111
                   }
            }
      };
      struct ibv_send_wr *bad_wr;

      return ibv_post_send(ctx->qp, &wr, &bad_wr);
}

static void usage(const char *argv0)
{
      printf("Usage:\n");
      printf("  %s            start a server and wait for connection\n", argv0);
      printf("  %s <host>     connect to server at <host>\n", argv0);
      printf("\n");
      printf("Options:\n");
      printf("  -p, --port=<port>      listen on/connect to port <port> (default 18515)\n");
      printf("  -d, --ib-dev=<dev>     use IB device <dev> (default first device found)\n");
      printf("  -i, --ib-port=<port>   use port <port> of IB device (default 1)\n");
      printf("  -s, --size=<size>      size of message to exchange (default 2048)\n");
      printf("  -r, --rx-depth=<dep>   number of receives to post at a time (default 500)\n");
      printf("  -n, --iters=<iters>    number of exchanges (default 1000)\n");
      printf("  -e, --events           sleep on CQ events (default poll)\n");
}

int main(int argc, char *argv[])
{
      struct ibv_device      **dev_list;
      struct ibv_device *ib_dev;
      struct pingpong_context *ctx;
      struct pingpong_dest     my_dest;
      struct pingpong_dest    *rem_dest;
      struct timeval           start, end;
      char                    *ib_devname = NULL;
      char                    *servername = NULL;
      int                      port = 18515;
      int                      ib_port = 1;
      int                      size = 2048;
      int                      rx_depth = 500;
      int                      iters = 1000;
      int                      use_event = 0;
      int                      routs;
      int                      rcnt, scnt;
      int                      num_cq_events = 0;

      srand48(getpid() * time(NULL));

      while (1) {
            int c;

            static struct option long_options[] = {
                  { .name = "port",     .has_arg = 1, .val = 'p' },
                  { .name = "ib-dev",   .has_arg = 1, .val = 'd' },
                  { .name = "ib-port",  .has_arg = 1, .val = 'i' },
                  { .name = "size",     .has_arg = 1, .val = 's' },
                  { .name = "rx-depth", .has_arg = 1, .val = 'r' },
                  { .name = "iters",    .has_arg = 1, .val = 'n' },
                  { .name = "events",   .has_arg = 0, .val = 'e' },
                  { 0 }
            };

            c = getopt_long(argc, argv, "p:d:i:s:r:n:e", long_options, NULL);
            if (c == -1)
                  break;

            switch (c) {
            case 'p':
                  port = strtol(optarg, NULL, 0);
                  if (port < 0 || port > 65535) {
                        usage(argv[0]);
                        return 1;
                  }
                  break;

            case 'd':
                  ib_devname = strdupa(optarg);
                  break;

            case 'i':
                  ib_port = strtol(optarg, NULL, 0);
                  if (ib_port < 0) {
                        usage(argv[0]);
                        return 1;
                  }
                  break;

            case 's':
                  size = strtol(optarg, NULL, 0);
                  break;

            case 'r':
                  rx_depth = strtol(optarg, NULL, 0);
                  break;

            case 'n':
                  iters = strtol(optarg, NULL, 0);
                  break;

            case 'e':
                  ++use_event;
                  break;

            default:
                  usage(argv[0]);
                  return 1;
            }
      }

      if (optind == argc - 1)
            servername = strdupa(argv[optind]);
      else if (optind < argc) {
            usage(argv[0]);
            return 1;
      }

      page_size = sysconf(_SC_PAGESIZE);

      dev_list = ibv_get_device_list(NULL);
      if (!dev_list) {
            fprintf(stderr, "No IB devices found\n");
            return 1;
      }

      if (!ib_devname) {
            ib_dev = *dev_list;
            if (!ib_dev) {
                  fprintf(stderr, "No IB devices found\n");
                  return 1;
            }
      } else {
            int i;
            for (i = 0; dev_list[i]; ++i)
                  if (!strcmp(ibv_get_device_name(dev_list[i]), ib_devname))
                        break;
            ib_dev = dev_list[i];
            if (!ib_dev) {
                  fprintf(stderr, "IB device %s not found\n", ib_devname);
                  return 1;
            }
      }

      ctx = pp_init_ctx(ib_dev, size, rx_depth, ib_port, use_event);
      if (!ctx)
            return 1;

      routs = pp_post_recv(ctx, ctx->rx_depth);
      if (routs < ctx->rx_depth) {
            fprintf(stderr, "Couldn't post receive (%d)\n", routs);
            return 1;
      }

      if (use_event)
            if (ibv_req_notify_cq(ctx->cq, 0)) {
                  fprintf(stderr, "Couldn't request CQ notification\n");
                  return 1;
            }

      my_dest.lid = pp_get_local_lid(ctx->context, ib_port);
      my_dest.qpn = ctx->qp->qp_num;
      my_dest.psn = lrand48() & 0xffffff;
      if (!my_dest.lid) {
            fprintf(stderr, "Couldn't get local LID\n");
            return 1;
      }

      printf("  local address:  LID 0x%04x, QPN 0x%06x, PSN 0x%06x\n",
             my_dest.lid, my_dest.qpn, my_dest.psn);

      if (servername)
            rem_dest = pp_client_exch_dest(servername, port, &my_dest);
      else
            rem_dest = pp_server_exch_dest(ctx, ib_port, port, &my_dest);

      if (!rem_dest)
            return 1;

      printf("  remote address: LID 0x%04x, QPN 0x%06x, PSN 0x%06x\n",
             rem_dest->lid, rem_dest->qpn, rem_dest->psn);

      if (servername)
            if (pp_connect_ctx(ctx, ib_port, my_dest.psn, rem_dest))
                  return 1;

      ctx->pending = PINGPONG_RECV_WRID;

      if (servername) {
            if (pp_post_send(ctx, rem_dest->qpn)) {
                  fprintf(stderr, "Couldn't post send\n");
                  return 1;
            }
            ctx->pending |= PINGPONG_SEND_WRID;
      }

      if (gettimeofday(&start, NULL)) {
            perror("gettimeofday");
            return 1;
      }

      rcnt = scnt = 0;
      while (rcnt < iters || scnt < iters) {
            if (use_event) {
                  struct ibv_cq *ev_cq;
                  void          *ev_ctx;

                  if (ibv_get_cq_event(ctx->channel, &ev_cq, &ev_ctx)) {
                        fprintf(stderr, "Failed to get cq_event\n");
                        return 1;
                  }

                  ++num_cq_events;

                  if (ev_cq != ctx->cq) {
                        fprintf(stderr, "CQ event for unknown CQ %p\n", ev_cq);
                        return 1;
                  }

                  if (ibv_req_notify_cq(ctx->cq, 0)) {
                        fprintf(stderr, "Couldn't request CQ notification\n");
                        return 1;
                  }
            }

            {
                  struct ibv_wc wc[2];
                  int ne, i;

                  do {
                        ne = ibv_poll_cq(ctx->cq, 2, wc);
                        if (ne < 0) {
                              fprintf(stderr, "poll CQ failed %d\n", ne);
                              return 1;
                        }
                  } while (!use_event && ne < 1);

                  for (i = 0; i < ne; ++i) {
                        if (wc[i].status != IBV_WC_SUCCESS) {
                              fprintf(stderr, "Failed status %d for wr_id %d\n",
                                    wc[i].status, (int) wc[i].wr_id);
                              return 1;
                        }

                        switch ((int) wc[i].wr_id) {
                        case PINGPONG_SEND_WRID:
                              ++scnt;
                              break;

                        case PINGPONG_RECV_WRID:
                              if (--routs <= 1) {
                                    routs += pp_post_recv(ctx, ctx->rx_depth - routs);
                                    if (routs < ctx->rx_depth) {
                                          fprintf(stderr,
                                                "Couldn't post receive (%d)\n",
                                                routs);
                                          return 1;
                                    }
                              }

                              ++rcnt;
                              break;

                        default:
                              fprintf(stderr, "Completion for unknown wr_id %d\n",
                                    (int) wc[i].wr_id);
                              return 1;
                        }

                        ctx->pending &= ~(int) wc[i].wr_id;
                        if (scnt < iters && !ctx->pending) {
                              if (pp_post_send(ctx, rem_dest->qpn)) {
                                    fprintf(stderr, "Couldn't post send\n");
                                    return 1;
                              }
                              ctx->pending = PINGPONG_RECV_WRID |
                                           PINGPONG_SEND_WRID;
                        }
                  }
            }
      }

      if (gettimeofday(&end, NULL)) {
            perror("gettimeofday");
            return 1;
      }

      {
            float usec = (end.tv_sec - start.tv_sec) * 1000000 +
                  (end.tv_usec - start.tv_usec);
            long long bytes = (long long) size * iters * 2;

            printf("%lld bytes in %.2f seconds = %.2f Mbit/sec\n",
                   bytes, usec / 1000000., bytes * 8. / usec);
            printf("%d iters in %.2f seconds = %.2f usec/iter\n",
                   iters, usec / 1000000., usec / iters);
      }

      ibv_ack_cq_events(ctx->cq, num_cq_events);

      if (pp_close_ctx(ctx))
            return 1;

      ibv_free_device_list(dev_list);
      free(rem_dest);

      return 0;
}

Generated by  Doxygen 1.6.0   Back to index