| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| #define _GNU_SOURCE |
| #include <config.h> |
| |
| #include <endian.h> |
| #include <stdio.h> |
| #include <unistd.h> |
| #include <stdlib.h> |
| #include <errno.h> |
| #include <string.h> |
| #include <linux/ip.h> |
| #include <dirent.h> |
| #include <netinet/in.h> |
| |
| #include <util/compiler.h> |
| #include <util/symver.h> |
| #include <infiniband/cmd_write.h> |
| |
| #include "ibverbs.h" |
| #include <net/if.h> |
| #include <net/if_arp.h> |
| #include "neigh.h" |
| |
| #undef ibv_query_port |
| |
| int __attribute__((const)) ibv_rate_to_mult(enum ibv_rate rate) |
| { |
| switch (rate) { |
| case IBV_RATE_2_5_GBPS: return 1; |
| case IBV_RATE_5_GBPS: return 2; |
| case IBV_RATE_10_GBPS: return 4; |
| case IBV_RATE_20_GBPS: return 8; |
| case IBV_RATE_30_GBPS: return 12; |
| case IBV_RATE_40_GBPS: return 16; |
| case IBV_RATE_60_GBPS: return 24; |
| case IBV_RATE_80_GBPS: return 32; |
| case IBV_RATE_120_GBPS: return 48; |
| case IBV_RATE_28_GBPS: return 11; |
| case IBV_RATE_50_GBPS: return 20; |
| case IBV_RATE_400_GBPS: return 160; |
| case IBV_RATE_600_GBPS: return 240; |
| default: return -1; |
| } |
| } |
| |
| enum ibv_rate __attribute__((const)) mult_to_ibv_rate(int mult) |
| { |
| switch (mult) { |
| case 1: return IBV_RATE_2_5_GBPS; |
| case 2: return IBV_RATE_5_GBPS; |
| case 4: return IBV_RATE_10_GBPS; |
| case 8: return IBV_RATE_20_GBPS; |
| case 12: return IBV_RATE_30_GBPS; |
| case 16: return IBV_RATE_40_GBPS; |
| case 24: return IBV_RATE_60_GBPS; |
| case 32: return IBV_RATE_80_GBPS; |
| case 48: return IBV_RATE_120_GBPS; |
| case 11: return IBV_RATE_28_GBPS; |
| case 20: return IBV_RATE_50_GBPS; |
| case 160: return IBV_RATE_400_GBPS; |
| case 240: return IBV_RATE_600_GBPS; |
| default: return IBV_RATE_MAX; |
| } |
| } |
| |
| int __attribute__((const)) ibv_rate_to_mbps(enum ibv_rate rate) |
| { |
| switch (rate) { |
| case IBV_RATE_2_5_GBPS: return 2500; |
| case IBV_RATE_5_GBPS: return 5000; |
| case IBV_RATE_10_GBPS: return 10000; |
| case IBV_RATE_20_GBPS: return 20000; |
| case IBV_RATE_30_GBPS: return 30000; |
| case IBV_RATE_40_GBPS: return 40000; |
| case IBV_RATE_60_GBPS: return 60000; |
| case IBV_RATE_80_GBPS: return 80000; |
| case IBV_RATE_120_GBPS: return 120000; |
| case IBV_RATE_14_GBPS: return 14062; |
| case IBV_RATE_56_GBPS: return 56250; |
| case IBV_RATE_112_GBPS: return 112500; |
| case IBV_RATE_168_GBPS: return 168750; |
| case IBV_RATE_25_GBPS: return 25781; |
| case IBV_RATE_100_GBPS: return 103125; |
| case IBV_RATE_200_GBPS: return 206250; |
| case IBV_RATE_300_GBPS: return 309375; |
| case IBV_RATE_28_GBPS: return 28125; |
| case IBV_RATE_50_GBPS: return 53125; |
| case IBV_RATE_400_GBPS: return 425000; |
| case IBV_RATE_600_GBPS: return 637500; |
| default: return -1; |
| } |
| } |
| |
| enum ibv_rate __attribute__((const)) mbps_to_ibv_rate(int mbps) |
| { |
| switch (mbps) { |
| case 2500: return IBV_RATE_2_5_GBPS; |
| case 5000: return IBV_RATE_5_GBPS; |
| case 10000: return IBV_RATE_10_GBPS; |
| case 20000: return IBV_RATE_20_GBPS; |
| case 30000: return IBV_RATE_30_GBPS; |
| case 40000: return IBV_RATE_40_GBPS; |
| case 60000: return IBV_RATE_60_GBPS; |
| case 80000: return IBV_RATE_80_GBPS; |
| case 120000: return IBV_RATE_120_GBPS; |
| case 14062: return IBV_RATE_14_GBPS; |
| case 56250: return IBV_RATE_56_GBPS; |
| case 112500: return IBV_RATE_112_GBPS; |
| case 168750: return IBV_RATE_168_GBPS; |
| case 25781: return IBV_RATE_25_GBPS; |
| case 103125: return IBV_RATE_100_GBPS; |
| case 206250: return IBV_RATE_200_GBPS; |
| case 309375: return IBV_RATE_300_GBPS; |
| case 28125: return IBV_RATE_28_GBPS; |
| case 53125: return IBV_RATE_50_GBPS; |
| case 425000: return IBV_RATE_400_GBPS; |
| case 637500: return IBV_RATE_600_GBPS; |
| default: return IBV_RATE_MAX; |
| } |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_query_device, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_context *context, |
| struct ibv_device_attr *device_attr) |
| { |
| return get_ops(context)->query_device(context, device_attr); |
| } |
| |
| int __lib_query_port(struct ibv_context *context, uint8_t port_num, |
| struct ibv_port_attr *port_attr, size_t port_attr_len) |
| { |
| |
| |
| |
| if (port_attr_len < sizeof(struct ibv_port_attr)) { |
| struct ibv_port_attr tmp_attr = {}; |
| int rc; |
| |
| rc = get_ops(context)->query_port(context, port_num, |
| &tmp_attr); |
| if (rc) |
| return rc; |
| |
| memcpy(port_attr, &tmp_attr, port_attr_len); |
| return 0; |
| } |
| |
| memset(port_attr, 0, port_attr_len); |
| return get_ops(context)->query_port(context, port_num, port_attr); |
| } |
| |
| struct _compat_ibv_port_attr { |
| enum ibv_port_state state; |
| enum ibv_mtu max_mtu; |
| enum ibv_mtu active_mtu; |
| int gid_tbl_len; |
| uint32_t port_cap_flags; |
| uint32_t max_msg_sz; |
| uint32_t bad_pkey_cntr; |
| uint32_t qkey_viol_cntr; |
| uint16_t pkey_tbl_len; |
| uint16_t lid; |
| uint16_t sm_lid; |
| uint8_t lmc; |
| uint8_t max_vl_num; |
| uint8_t sm_sl; |
| uint8_t subnet_timeout; |
| uint8_t init_type_reply; |
| uint8_t active_width; |
| uint8_t active_speed; |
| uint8_t phys_state; |
| uint8_t link_layer; |
| uint8_t flags; |
| }; |
| |
| LATEST_SYMVER_FUNC(ibv_query_port, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_context *context, uint8_t port_num, |
| struct _compat_ibv_port_attr *port_attr) |
| { |
| return __lib_query_port(context, port_num, |
| (struct ibv_port_attr *)port_attr, |
| sizeof(*port_attr)); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_query_gid, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_context *context, uint8_t port_num, |
| int index, union ibv_gid *gid) |
| { |
| struct verbs_device *verbs_device = verbs_get_device(context->device); |
| char attr[41]; |
| uint16_t val; |
| int i; |
| |
| if (ibv_read_ibdev_sysfs_file(attr, sizeof(attr), verbs_device->sysfs, |
| "ports/%d/gids/%d", port_num, index) < 0) |
| return -1; |
| |
| for (i = 0; i < 8; ++i) { |
| if (sscanf(attr + i * 5, "%hx", &val) != 1) |
| return -1; |
| gid->raw[i * 2 ] = val >> 8; |
| gid->raw[i * 2 + 1] = val & 0xff; |
| } |
| |
| return 0; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_query_pkey, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_context *context, uint8_t port_num, |
| int index, __be16 *pkey) |
| { |
| struct verbs_device *verbs_device = verbs_get_device(context->device); |
| char attr[8]; |
| uint16_t val; |
| |
| if (ibv_read_ibdev_sysfs_file(attr, sizeof(attr), verbs_device->sysfs, |
| "ports/%d/pkeys/%d", port_num, index) < 0) |
| return -1; |
| |
| if (sscanf(attr, "%hx", &val) != 1) |
| return -1; |
| |
| *pkey = htobe16(val); |
| return 0; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_get_pkey_index, 1_5, "IBVERBS_1.5", |
| int, |
| struct ibv_context *context, uint8_t port_num, __be16 pkey) |
| { |
| __be16 pkey_i; |
| int i, ret; |
| |
| for (i = 0; ; i++) { |
| ret = ibv_query_pkey(context, port_num, i, &pkey_i); |
| if (ret < 0) |
| return ret; |
| if (pkey == pkey_i) |
| return i; |
| } |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_alloc_pd, 1_1, "IBVERBS_1.1", |
| struct ibv_pd *, |
| struct ibv_context *context) |
| { |
| struct ibv_pd *pd; |
| |
| pd = get_ops(context)->alloc_pd(context); |
| if (pd) |
| pd->context = context; |
| |
| return pd; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_dealloc_pd, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_pd *pd) |
| { |
| return get_ops(pd->context)->dealloc_pd(pd); |
| } |
| |
| #undef ibv_reg_mr |
| LATEST_SYMVER_FUNC(ibv_reg_mr, 1_1, "IBVERBS_1.1", |
| struct ibv_mr *, |
| struct ibv_pd *pd, void *addr, |
| size_t length, int access) |
| { |
| struct ibv_mr *mr; |
| |
| if (ibv_dontfork_range(addr, length)) |
| return NULL; |
| |
| mr = get_ops(pd->context)->reg_mr(pd, addr, length, (uintptr_t) addr, |
| access); |
| if (mr) { |
| mr->context = pd->context; |
| mr->pd = pd; |
| mr->addr = addr; |
| mr->length = length; |
| } else |
| ibv_dofork_range(addr, length); |
| |
| return mr; |
| } |
| |
| #undef ibv_reg_mr_iova |
| struct ibv_mr *ibv_reg_mr_iova(struct ibv_pd *pd, void *addr, size_t length, |
| uint64_t iova, int access) |
| { |
| struct ibv_mr *mr; |
| |
| if (ibv_dontfork_range(addr, length)) |
| return NULL; |
| |
| mr = get_ops(pd->context)->reg_mr(pd, addr, length, iova, access); |
| if (mr) { |
| mr->context = pd->context; |
| mr->pd = pd; |
| mr->addr = addr; |
| mr->length = length; |
| } else |
| ibv_dofork_range(addr, length); |
| |
| return mr; |
| } |
| |
| struct ibv_mr *ibv_reg_mr_iova2(struct ibv_pd *pd, void *addr, size_t length, |
| uint64_t iova, unsigned int access) |
| { |
| struct verbs_device *device = verbs_get_device(pd->context->device); |
| |
| if (!(device->core_support & IB_UVERBS_CORE_SUPPORT_OPTIONAL_MR_ACCESS)) |
| access &= ~IBV_ACCESS_OPTIONAL_RANGE; |
| |
| return ibv_reg_mr_iova(pd, addr, length, iova, access); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_rereg_mr, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_mr *mr, int flags, |
| struct ibv_pd *pd, void *addr, |
| size_t length, int access) |
| { |
| int dofork_onfail = 0; |
| int err; |
| void *old_addr; |
| size_t old_len; |
| |
| if (verbs_get_mr(mr)->mr_type != IBV_MR_TYPE_MR) { |
| errno = EINVAL; |
| return IBV_REREG_MR_ERR_INPUT; |
| } |
| |
| if (flags & ~IBV_REREG_MR_FLAGS_SUPPORTED) { |
| errno = EINVAL; |
| return IBV_REREG_MR_ERR_INPUT; |
| } |
| |
| if ((flags & IBV_REREG_MR_CHANGE_TRANSLATION) && |
| (!length || !addr)) { |
| errno = EINVAL; |
| return IBV_REREG_MR_ERR_INPUT; |
| } |
| |
| if (access && !(flags & IBV_REREG_MR_CHANGE_ACCESS)) { |
| errno = EINVAL; |
| return IBV_REREG_MR_ERR_INPUT; |
| } |
| |
| if (flags & IBV_REREG_MR_CHANGE_TRANSLATION) { |
| err = ibv_dontfork_range(addr, length); |
| if (err) |
| return IBV_REREG_MR_ERR_DONT_FORK_NEW; |
| dofork_onfail = 1; |
| } |
| |
| old_addr = mr->addr; |
| old_len = mr->length; |
| err = get_ops(mr->context)->rereg_mr(verbs_get_mr(mr), |
| flags, pd, addr, |
| length, access); |
| if (!err) { |
| if (flags & IBV_REREG_MR_CHANGE_PD) |
| mr->pd = pd; |
| if (flags & IBV_REREG_MR_CHANGE_TRANSLATION) { |
| mr->addr = addr; |
| mr->length = length; |
| err = ibv_dofork_range(old_addr, old_len); |
| if (err) |
| return IBV_REREG_MR_ERR_DO_FORK_OLD; |
| } |
| } else { |
| err = IBV_REREG_MR_ERR_CMD; |
| if (dofork_onfail) { |
| if (ibv_dofork_range(addr, length)) |
| err = IBV_REREG_MR_ERR_CMD_AND_DO_FORK_NEW; |
| } |
| } |
| |
| return err; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_dereg_mr, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_mr *mr) |
| { |
| int ret; |
| void *addr = mr->addr; |
| size_t length = mr->length; |
| enum ibv_mr_type type = verbs_get_mr(mr)->mr_type; |
| |
| ret = get_ops(mr->context)->dereg_mr(verbs_get_mr(mr)); |
| if (!ret && type == IBV_MR_TYPE_MR) |
| ibv_dofork_range(addr, length); |
| |
| return ret; |
| } |
| |
| struct ibv_comp_channel *ibv_create_comp_channel(struct ibv_context *context) |
| { |
| struct ibv_create_comp_channel req; |
| struct ib_uverbs_create_comp_channel_resp resp; |
| struct ibv_comp_channel *channel; |
| |
| channel = malloc(sizeof *channel); |
| if (!channel) |
| return NULL; |
| |
| req.core_payload = (struct ib_uverbs_create_comp_channel){}; |
| if (execute_cmd_write(context, IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL, |
| &req, sizeof(req), &resp, sizeof(resp))) { |
| free(channel); |
| return NULL; |
| } |
| |
| channel->context = context; |
| channel->fd = resp.fd; |
| channel->refcnt = 0; |
| |
| return channel; |
| } |
| |
| int ibv_destroy_comp_channel(struct ibv_comp_channel *channel) |
| { |
| struct ibv_context *context; |
| int ret; |
| |
| context = channel->context; |
| pthread_mutex_lock(&context->mutex); |
| |
| if (channel->refcnt) { |
| ret = EBUSY; |
| goto out; |
| } |
| |
| close(channel->fd); |
| free(channel); |
| ret = 0; |
| |
| out: |
| pthread_mutex_unlock(&context->mutex); |
| |
| return ret; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_create_cq, 1_1, "IBVERBS_1.1", |
| struct ibv_cq *, |
| struct ibv_context *context, int cqe, void *cq_context, |
| struct ibv_comp_channel *channel, int comp_vector) |
| { |
| struct ibv_cq *cq; |
| |
| cq = get_ops(context)->create_cq(context, cqe, channel, comp_vector); |
| |
| if (cq) |
| verbs_init_cq(cq, context, channel, cq_context); |
| |
| return cq; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_resize_cq, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_cq *cq, int cqe) |
| { |
| return get_ops(cq->context)->resize_cq(cq, cqe); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_destroy_cq, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_cq *cq) |
| { |
| struct ibv_comp_channel *channel = cq->channel; |
| int ret; |
| |
| ret = get_ops(cq->context)->destroy_cq(cq); |
| |
| if (channel) { |
| if (!ret) { |
| pthread_mutex_lock(&channel->context->mutex); |
| --channel->refcnt; |
| pthread_mutex_unlock(&channel->context->mutex); |
| } |
| } |
| |
| return ret; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_get_cq_event, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_comp_channel *channel, |
| struct ibv_cq **cq, void **cq_context) |
| { |
| struct ib_uverbs_comp_event_desc ev; |
| |
| if (read(channel->fd, &ev, sizeof ev) != sizeof ev) |
| return -1; |
| |
| *cq = (struct ibv_cq *) (uintptr_t) ev.cq_handle; |
| *cq_context = (*cq)->cq_context; |
| |
| get_ops((*cq)->context)->cq_event(*cq); |
| |
| return 0; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_ack_cq_events, 1_1, "IBVERBS_1.1", |
| void, |
| struct ibv_cq *cq, unsigned int nevents) |
| { |
| pthread_mutex_lock(&cq->mutex); |
| cq->comp_events_completed += nevents; |
| pthread_cond_signal(&cq->cond); |
| pthread_mutex_unlock(&cq->mutex); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_create_srq, 1_1, "IBVERBS_1.1", |
| struct ibv_srq *, |
| struct ibv_pd *pd, |
| struct ibv_srq_init_attr *srq_init_attr) |
| { |
| struct ibv_srq *srq; |
| |
| srq = get_ops(pd->context)->create_srq(pd, srq_init_attr); |
| if (srq) { |
| srq->context = pd->context; |
| srq->srq_context = srq_init_attr->srq_context; |
| srq->pd = pd; |
| srq->events_completed = 0; |
| pthread_mutex_init(&srq->mutex, NULL); |
| pthread_cond_init(&srq->cond, NULL); |
| } |
| |
| return srq; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_modify_srq, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_srq *srq, |
| struct ibv_srq_attr *srq_attr, |
| int srq_attr_mask) |
| { |
| return get_ops(srq->context)->modify_srq(srq, srq_attr, srq_attr_mask); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_query_srq, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_srq *srq, struct ibv_srq_attr *srq_attr) |
| { |
| return get_ops(srq->context)->query_srq(srq, srq_attr); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_destroy_srq, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_srq *srq) |
| { |
| return get_ops(srq->context)->destroy_srq(srq); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_create_qp, 1_1, "IBVERBS_1.1", |
| struct ibv_qp *, |
| struct ibv_pd *pd, |
| struct ibv_qp_init_attr *qp_init_attr) |
| { |
| struct ibv_qp *qp = get_ops(pd->context)->create_qp(pd, qp_init_attr); |
| |
| if (qp) { |
| qp->context = pd->context; |
| qp->qp_context = qp_init_attr->qp_context; |
| qp->pd = pd; |
| qp->send_cq = qp_init_attr->send_cq; |
| qp->recv_cq = qp_init_attr->recv_cq; |
| qp->srq = qp_init_attr->srq; |
| qp->qp_type = qp_init_attr->qp_type; |
| qp->state = IBV_QPS_RESET; |
| qp->events_completed = 0; |
| pthread_mutex_init(&qp->mutex, NULL); |
| pthread_cond_init(&qp->cond, NULL); |
| } |
| |
| return qp; |
| } |
| |
| struct ibv_qp_ex *ibv_qp_to_qp_ex(struct ibv_qp *qp) |
| { |
| struct verbs_qp *vqp = (struct verbs_qp *)qp; |
| |
| if (vqp->comp_mask & VERBS_QP_EX) |
| return &vqp->qp_ex; |
| return NULL; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_query_qp, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_qp *qp, struct ibv_qp_attr *attr, |
| int attr_mask, |
| struct ibv_qp_init_attr *init_attr) |
| { |
| int ret; |
| |
| ret = get_ops(qp->context)->query_qp(qp, attr, attr_mask, init_attr); |
| if (ret) |
| return ret; |
| |
| if (attr_mask & IBV_QP_STATE) |
| qp->state = attr->qp_state; |
| |
| return 0; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_modify_qp, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_qp *qp, struct ibv_qp_attr *attr, |
| int attr_mask) |
| { |
| int ret; |
| |
| ret = get_ops(qp->context)->modify_qp(qp, attr, attr_mask); |
| if (ret) |
| return ret; |
| |
| if (attr_mask & IBV_QP_STATE) |
| qp->state = attr->qp_state; |
| |
| return 0; |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_destroy_qp, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_qp *qp) |
| { |
| return get_ops(qp->context)->destroy_qp(qp); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_create_ah, 1_1, "IBVERBS_1.1", |
| struct ibv_ah *, |
| struct ibv_pd *pd, struct ibv_ah_attr *attr) |
| { |
| struct ibv_ah *ah = get_ops(pd->context)->create_ah(pd, attr); |
| |
| if (ah) { |
| ah->context = pd->context; |
| ah->pd = pd; |
| } |
| |
| return ah; |
| } |
| |
| |
| |
| |
| #define V1_TYPE "IB/RoCE v1" |
| #define V2_TYPE "RoCE v2" |
| int ibv_query_gid_type(struct ibv_context *context, uint8_t port_num, |
| unsigned int index, enum ibv_gid_type *type) |
| { |
| struct verbs_device *verbs_device = verbs_get_device(context->device); |
| char buff[11]; |
| |
| |
| |
| |
| errno = 0; |
| if (ibv_read_ibdev_sysfs_file(buff, sizeof(buff), verbs_device->sysfs, |
| "ports/%d/gid_attrs/types/%d", port_num, |
| index) <= 0) { |
| char *dir_path; |
| DIR *dir; |
| |
| if (errno == EINVAL) { |
| |
| |
| |
| *type = IBV_GID_TYPE_IB_ROCE_V1; |
| return 0; |
| } |
| if (asprintf(&dir_path, "%s/%s/%d/%s/", |
| verbs_device->sysfs->ibdev_path, "ports", port_num, |
| "gid_attrs") < 0) |
| return -1; |
| dir = opendir(dir_path); |
| free(dir_path); |
| if (!dir) { |
| if (errno == ENOENT) |
| |
| |
| |
| |
| *type = IBV_GID_TYPE_IB_ROCE_V1; |
| else |
| return -1; |
| } else { |
| closedir(dir); |
| errno = EFAULT; |
| return -1; |
| } |
| } else { |
| if (!strcmp(buff, V1_TYPE)) { |
| *type = IBV_GID_TYPE_IB_ROCE_V1; |
| } else if (!strcmp(buff, V2_TYPE)) { |
| *type = IBV_GID_TYPE_ROCE_V2; |
| } else { |
| errno = ENOTSUP; |
| return -1; |
| } |
| } |
| |
| return 0; |
| } |
| |
| static int ibv_find_gid_index(struct ibv_context *context, uint8_t port_num, |
| union ibv_gid *gid, enum ibv_gid_type gid_type) |
| { |
| enum ibv_gid_type sgid_type = 0; |
| union ibv_gid sgid; |
| int i = 0, ret; |
| |
| do { |
| ret = ibv_query_gid(context, port_num, i, &sgid); |
| if (!ret) { |
| ret = ibv_query_gid_type(context, port_num, i, |
| &sgid_type); |
| } |
| i++; |
| } while (!ret && (memcmp(&sgid, gid, sizeof(*gid)) || |
| (gid_type != sgid_type))); |
| |
| return ret ? ret : i - 1; |
| } |
| |
| static inline void map_ipv4_addr_to_ipv6(__be32 ipv4, struct in6_addr *ipv6) |
| { |
| ipv6->s6_addr32[0] = 0; |
| ipv6->s6_addr32[1] = 0; |
| ipv6->s6_addr32[2] = htobe32(0x0000FFFF); |
| ipv6->s6_addr32[3] = ipv4; |
| } |
| |
| static inline __sum16 ipv4_calc_hdr_csum(uint16_t *data, unsigned int num_hwords) |
| { |
| unsigned int i = 0; |
| uint32_t sum = 0; |
| |
| for (i = 0; i < num_hwords; i++) |
| sum += *(data++); |
| |
| sum = (sum & 0xffff) + (sum >> 16); |
| |
| return (__force __sum16)~sum; |
| } |
| |
| static inline int get_grh_header_version(struct ibv_grh *grh) |
| { |
| int ip6h_version = (be32toh(grh->version_tclass_flow) >> 28) & 0xf; |
| struct iphdr *ip4h = (struct iphdr *)((void *)grh + 20); |
| struct iphdr ip4h_checked; |
| |
| if (ip6h_version != 6) { |
| if (ip4h->version == 4) |
| return 4; |
| errno = EPROTONOSUPPORT; |
| return -1; |
| } |
| |
| if (ip4h->ihl != 5) |
| return 6; |
| |
| |
| |
| |
| |
| memcpy(&ip4h_checked, ip4h, sizeof(ip4h_checked)); |
| |
| |
| |
| ip4h_checked.check = 0; |
| ip4h_checked.check = ipv4_calc_hdr_csum((uint16_t *)&ip4h_checked, 10); |
| |
| if (ip4h->check == ip4h_checked.check) |
| return 4; |
| return 6; |
| } |
| |
| static inline void set_ah_attr_generic_fields(struct ibv_ah_attr *ah_attr, |
| struct ibv_wc *wc, |
| struct ibv_grh *grh, |
| uint8_t port_num) |
| { |
| uint32_t flow_class; |
| |
| flow_class = be32toh(grh->version_tclass_flow); |
| ah_attr->grh.flow_label = flow_class & 0xFFFFF; |
| ah_attr->dlid = wc->slid; |
| ah_attr->sl = wc->sl; |
| ah_attr->src_path_bits = wc->dlid_path_bits; |
| ah_attr->port_num = port_num; |
| } |
| |
| static inline int set_ah_attr_by_ipv4(struct ibv_context *context, |
| struct ibv_ah_attr *ah_attr, |
| struct iphdr *ip4h, uint8_t port_num) |
| { |
| union ibv_gid sgid; |
| int ret; |
| |
| |
| if (IN_CLASSD(be32toh(ip4h->daddr))) { |
| errno = EINVAL; |
| return -1; |
| } |
| |
| map_ipv4_addr_to_ipv6(ip4h->daddr, (struct in6_addr *)&sgid); |
| ret = ibv_find_gid_index(context, port_num, &sgid, |
| IBV_GID_TYPE_ROCE_V2); |
| if (ret < 0) |
| return ret; |
| |
| map_ipv4_addr_to_ipv6(ip4h->saddr, |
| (struct in6_addr *)&ah_attr->grh.dgid); |
| ah_attr->grh.sgid_index = (uint8_t) ret; |
| ah_attr->grh.hop_limit = ip4h->ttl; |
| ah_attr->grh.traffic_class = ip4h->tos; |
| |
| return 0; |
| } |
| |
| #define IB_NEXT_HDR 0x1b |
| static inline int set_ah_attr_by_ipv6(struct ibv_context *context, |
| struct ibv_ah_attr *ah_attr, |
| struct ibv_grh *grh, uint8_t port_num) |
| { |
| uint32_t flow_class; |
| uint32_t sgid_type; |
| int ret; |
| |
| |
| if (grh->dgid.raw[0] == 0xFF) { |
| errno = EINVAL; |
| return -1; |
| } |
| |
| ah_attr->grh.dgid = grh->sgid; |
| if (grh->next_hdr == IPPROTO_UDP) { |
| sgid_type = IBV_GID_TYPE_ROCE_V2; |
| } else if (grh->next_hdr == IB_NEXT_HDR) { |
| sgid_type = IBV_GID_TYPE_IB_ROCE_V1; |
| } else { |
| errno = EPROTONOSUPPORT; |
| return -1; |
| } |
| |
| ret = ibv_find_gid_index(context, port_num, &grh->dgid, |
| sgid_type); |
| if (ret < 0) |
| return ret; |
| |
| ah_attr->grh.sgid_index = (uint8_t) ret; |
| flow_class = be32toh(grh->version_tclass_flow); |
| ah_attr->grh.hop_limit = grh->hop_limit; |
| ah_attr->grh.traffic_class = (flow_class >> 20) & 0xFF; |
| |
| return 0; |
| } |
| |
| int ibv_init_ah_from_wc(struct ibv_context *context, uint8_t port_num, |
| struct ibv_wc *wc, struct ibv_grh *grh, |
| struct ibv_ah_attr *ah_attr) |
| { |
| int version; |
| int ret = 0; |
| |
| memset(ah_attr, 0, sizeof *ah_attr); |
| set_ah_attr_generic_fields(ah_attr, wc, grh, port_num); |
| |
| if (wc->wc_flags & IBV_WC_GRH) { |
| ah_attr->is_global = 1; |
| version = get_grh_header_version(grh); |
| |
| if (version == 4) |
| ret = set_ah_attr_by_ipv4(context, ah_attr, |
| (struct iphdr *)((void *)grh + 20), |
| port_num); |
| else if (version == 6) |
| ret = set_ah_attr_by_ipv6(context, ah_attr, grh, |
| port_num); |
| else |
| ret = -1; |
| } |
| |
| return ret; |
| } |
| |
| struct ibv_ah *ibv_create_ah_from_wc(struct ibv_pd *pd, struct ibv_wc *wc, |
| struct ibv_grh *grh, uint8_t port_num) |
| { |
| struct ibv_ah_attr ah_attr; |
| int ret; |
| |
| ret = ibv_init_ah_from_wc(pd->context, port_num, wc, grh, &ah_attr); |
| if (ret) |
| return NULL; |
| |
| return ibv_create_ah(pd, &ah_attr); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_destroy_ah, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_ah *ah) |
| { |
| return get_ops(ah->context)->destroy_ah(ah); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_attach_mcast, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_qp *qp, const union ibv_gid *gid, uint16_t lid) |
| { |
| return get_ops(qp->context)->attach_mcast(qp, gid, lid); |
| } |
| |
| LATEST_SYMVER_FUNC(ibv_detach_mcast, 1_1, "IBVERBS_1.1", |
| int, |
| struct ibv_qp *qp, const union ibv_gid *gid, uint16_t lid) |
| { |
| return get_ops(qp->context)->detach_mcast(qp, gid, lid); |
| } |
| |
| static inline int ipv6_addr_v4mapped(const struct in6_addr *a) |
| { |
| return IN6_IS_ADDR_V4MAPPED(&a->s6_addr32) || |
| |
| (a->s6_addr32[0] == htobe32(0xff0e0000) && |
| ((a->s6_addr32[1] | |
| (a->s6_addr32[2] ^ htobe32(0x0000ffff))) == 0UL)); |
| } |
| |
| struct peer_address { |
| void *address; |
| uint32_t size; |
| }; |
| |
| static inline int create_peer_from_gid(int family, void *raw_gid, |
| struct peer_address *peer_address) |
| { |
| switch (family) { |
| case AF_INET: |
| peer_address->address = raw_gid + 12; |
| peer_address->size = 4; |
| break; |
| case AF_INET6: |
| peer_address->address = raw_gid; |
| peer_address->size = 16; |
| break; |
| default: |
| return -1; |
| } |
| |
| return 0; |
| } |
| |
| #define NEIGH_GET_DEFAULT_TIMEOUT_MS 3000 |
| int ibv_resolve_eth_l2_from_gid(struct ibv_context *context, |
| struct ibv_ah_attr *attr, |
| uint8_t eth_mac[ETHERNET_LL_SIZE], |
| uint16_t *vid) |
| { |
| int dst_family; |
| int src_family; |
| int oif; |
| struct get_neigh_handler neigh_handler; |
| union ibv_gid sgid; |
| int ether_len; |
| struct peer_address src; |
| struct peer_address dst; |
| uint16_t ret_vid; |
| int ret = -EINVAL; |
| int err; |
| |
| err = ibv_query_gid(context, attr->port_num, |
| attr->grh.sgid_index, &sgid); |
| |
| if (err) |
| return err; |
| |
| err = neigh_init_resources(&neigh_handler, |
| NEIGH_GET_DEFAULT_TIMEOUT_MS); |
| |
| if (err) |
| return err; |
| |
| dst_family = ipv6_addr_v4mapped((struct in6_addr *)attr->grh.dgid.raw) ? |
| AF_INET : AF_INET6; |
| src_family = ipv6_addr_v4mapped((struct in6_addr *)sgid.raw) ? |
| AF_INET : AF_INET6; |
| |
| if (create_peer_from_gid(dst_family, attr->grh.dgid.raw, &dst)) |
| goto free_resources; |
| |
| if (create_peer_from_gid(src_family, &sgid.raw, &src)) |
| goto free_resources; |
| |
| if (neigh_set_dst(&neigh_handler, dst_family, dst.address, |
| dst.size)) |
| goto free_resources; |
| |
| if (neigh_set_src(&neigh_handler, src_family, src.address, |
| src.size)) |
| goto free_resources; |
| |
| oif = neigh_get_oif_from_src(&neigh_handler); |
| |
| if (oif > 0) |
| neigh_set_oif(&neigh_handler, oif); |
| else |
| goto free_resources; |
| |
| ret = -EHOSTUNREACH; |
| |
| |
| if (process_get_neigh(&neigh_handler)) |
| goto free_resources; |
| |
| if (vid) { |
| ret_vid = neigh_get_vlan_id_from_dev(&neigh_handler); |
| |
| if (ret_vid <= 0xfff) |
| neigh_set_vlan_id(&neigh_handler, ret_vid); |
| } |
| |
| |
| ether_len = neigh_get_ll(&neigh_handler, |
| eth_mac, |
| sizeof(uint8_t) * ETHERNET_LL_SIZE); |
| |
| if (ether_len <= 0) |
| goto free_resources; |
| |
| if (vid) |
| *vid = ret_vid; |
| |
| ret = 0; |
| |
| free_resources: |
| neigh_free_resources(&neigh_handler); |
| |
| return ret; |
| } |