blob: 8addee43a381138dddc2022ee55c9c68a90e452e [file]
// SPDX-License-Identifier: GPL-2.0-or-later
/*
* Copyright (c) 2012,2016,2017,2025 Stefan Metzmacher
*/
#include "internal.h"
#include "../common/smb2status.h"
static int smbdirect_connect_setup_connection(struct smbdirect_socket *sc);
static int smbdirect_connect_resolve_addr(struct smbdirect_socket *sc,
const struct sockaddr *src,
const struct sockaddr *dst);
static int smbdirect_connect_rdma_event_handler(struct rdma_cm_id *id,
struct rdma_cm_event *event);
static int smbdirect_connect_negotiate_start(struct smbdirect_socket *sc);
static void smbdirect_connect_negotiate_send_done(struct ib_cq *cq, struct ib_wc *wc);
static void smbdirect_connect_negotiate_recv_done(struct ib_cq *cq, struct ib_wc *wc);
int smbdirect_connect(struct smbdirect_socket *sc, const struct sockaddr *dst)
{
const struct sockaddr *src = NULL;
union {
struct sockaddr sa;
struct sockaddr_storage ss;
} src_addr = {
.sa = {
.sa_family = AF_UNSPEC,
},
};
int ret;
if (sc->first_error)
return -ENOTCONN;
if (sc->status != SMBDIRECT_SOCKET_CREATED)
return -EALREADY;
if (WARN_ON_ONCE(!sc->rdma.cm_id))
return -EINVAL;
src_addr.ss = sc->rdma.cm_id->route.addr.src_addr;
if (src_addr.sa.sa_family != AF_UNSPEC)
src = &src_addr.sa;
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_INFO,
"connect: src: %pISpsfc dst: %pISpsfc\n",
src, dst);
ret = smbdirect_connect_setup_connection(sc);
if (ret)
return ret;
ret = smbdirect_connect_resolve_addr(sc, src, dst);
if (ret)
return ret;
/*
* The rest happens async via smbdirect_connect_rdma_event_handler()
* the caller will decide to wait or not.
*/
return 0;
}
__SMBDIRECT_EXPORT_SYMBOL__(smbdirect_connect);
static int smbdirect_connect_setup_connection(struct smbdirect_socket *sc)
{
rdma_lock_handler(sc->rdma.cm_id);
sc->rdma.cm_id->event_handler = smbdirect_connect_rdma_event_handler;
rdma_unlock_handler(sc->rdma.cm_id);
if (SMBDIRECT_CHECK_STATUS_WARN(sc, SMBDIRECT_SOCKET_CREATED))
return -EINVAL;
sc->status = SMBDIRECT_SOCKET_RESOLVE_ADDR_NEEDED;
return 0;
}
static int smbdirect_connect_resolve_addr(struct smbdirect_socket *sc,
const struct sockaddr *src,
const struct sockaddr *dst)
{
const struct smbdirect_socket_parameters *sp = &sc->parameters;
struct sockaddr *src_addr = NULL;
struct sockaddr *dst_addr = NULL;
int ret;
src_addr = (struct sockaddr *)src;
if (src_addr && src_addr->sa_family == AF_UNSPEC)
src_addr = NULL;
dst_addr = (struct sockaddr *)dst;
if (SMBDIRECT_CHECK_STATUS_WARN(sc, SMBDIRECT_SOCKET_RESOLVE_ADDR_NEEDED))
return -EINVAL;
sc->status = SMBDIRECT_SOCKET_RESOLVE_ADDR_RUNNING;
sc->rdma.expected_event = RDMA_CM_EVENT_ADDR_RESOLVED;
ret = rdma_resolve_addr(sc->rdma.cm_id, src_addr, dst_addr,
sp->resolve_addr_timeout_msec);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"rdma_resolve_addr() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
return ret;
}
return 0;
}
static int smbdirect_connect_resolve_route(struct smbdirect_socket *sc)
{
const struct smbdirect_socket_parameters *sp = &sc->parameters;
int ret;
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_RESOLVE_ROUTE_NEEDED))
return sc->first_error;
sc->status = SMBDIRECT_SOCKET_RESOLVE_ROUTE_RUNNING;
sc->rdma.expected_event = RDMA_CM_EVENT_ROUTE_RESOLVED;
ret = rdma_resolve_route(sc->rdma.cm_id, sp->resolve_route_timeout_msec);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"rdma_resolve_route() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
return ret;
}
return 0;
}
static int smbdirect_connect_rdma_connect(struct smbdirect_socket *sc)
{
struct smbdirect_socket_parameters *sp = &sc->parameters;
struct rdma_conn_param conn_param;
__be32 ird_ord_hdr[2];
int ret;
sc->ib.dev = sc->rdma.cm_id->device;
if (!smbdirect_frwr_is_supported(&sc->ib.dev->attrs)) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"Fast Registration Work Requests (FRWR) is not supported device %.*s\n",
IB_DEVICE_NAME_MAX,
sc->ib.dev->name);
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"Device capability flags = %llx max_fast_reg_page_list_len = %u\n",
sc->ib.dev->attrs.device_cap_flags,
sc->ib.dev->attrs.max_fast_reg_page_list_len);
return -EPROTONOSUPPORT;
}
if (sp->flags & SMBDIRECT_FLAG_PORT_RANGE_ONLY_IB &&
!rdma_ib_or_roce(sc->ib.dev, sc->rdma.cm_id->port_num)) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"Not IB: device: %.*s IW:%u local: %pISpsfc remote: %pISpsfc\n",
IB_DEVICE_NAME_MAX,
sc->ib.dev->name,
rdma_protocol_iwarp(sc->ib.dev, sc->rdma.cm_id->port_num),
&sc->rdma.cm_id->route.addr.src_addr,
&sc->rdma.cm_id->route.addr.dst_addr);
return -EPROTONOSUPPORT;
}
if (sp->flags & SMBDIRECT_FLAG_PORT_RANGE_ONLY_IW &&
!rdma_protocol_iwarp(sc->ib.dev, sc->rdma.cm_id->port_num)) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"Not IW: device: %.*s IB:%u local: %pISpsfc remote: %pISpsfc\n",
IB_DEVICE_NAME_MAX,
sc->ib.dev->name,
rdma_ib_or_roce(sc->ib.dev, sc->rdma.cm_id->port_num),
&sc->rdma.cm_id->route.addr.src_addr,
&sc->rdma.cm_id->route.addr.dst_addr);
return -EPROTONOSUPPORT;
}
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_INFO,
"rdma connect: device: %.*s local: %pISpsfc remote: %pISpsfc\n",
IB_DEVICE_NAME_MAX,
sc->ib.dev->name,
&sc->rdma.cm_id->route.addr.src_addr,
&sc->rdma.cm_id->route.addr.dst_addr);
sp->max_frmr_depth = min_t(u32, sp->max_frmr_depth,
sc->ib.dev->attrs.max_fast_reg_page_list_len);
sc->mr_io.type = IB_MR_TYPE_MEM_REG;
if (sc->ib.dev->attrs.kernel_cap_flags & IBK_SG_GAPS_REG)
sc->mr_io.type = IB_MR_TYPE_SG_GAPS;
sp->responder_resources = min_t(u8, sp->responder_resources,
sc->ib.dev->attrs.max_qp_rd_atom);
smbdirect_log_rdma_mr(sc, SMBDIRECT_LOG_INFO,
"responder_resources=%d\n",
sp->responder_resources);
ret = smbdirect_connection_create_qp(sc);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_create_qp() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
return ret;
}
memset(&conn_param, 0, sizeof(conn_param));
conn_param.initiator_depth = sp->initiator_depth;
conn_param.responder_resources = sp->responder_resources;
/* Need to send IRD/ORD in private data for iWARP */
if (rdma_protocol_iwarp(sc->ib.dev, sc->rdma.cm_id->port_num)) {
ird_ord_hdr[0] = cpu_to_be32(conn_param.responder_resources);
ird_ord_hdr[1] = cpu_to_be32(conn_param.initiator_depth);
conn_param.private_data = ird_ord_hdr;
conn_param.private_data_len = sizeof(ird_ord_hdr);
} else {
conn_param.private_data = NULL;
conn_param.private_data_len = 0;
}
conn_param.retry_count = SMBDIRECT_RDMA_CM_RETRY;
conn_param.rnr_retry_count = SMBDIRECT_RDMA_CM_RNR_RETRY;
conn_param.flow_control = 0;
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_RDMA_CONNECT_NEEDED))
return sc->first_error;
sc->status = SMBDIRECT_SOCKET_RDMA_CONNECT_RUNNING;
sc->rdma.expected_event = RDMA_CM_EVENT_ESTABLISHED;
ret = rdma_connect_locked(sc->rdma.cm_id, &conn_param);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"rdma_connect_locked() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
return ret;
}
/*
* start with the rdma connect timeout and SMBDIRECT_KEEPALIVE_PENDING
* so that the timer will cause a disconnect.
*/
INIT_DELAYED_WORK(&sc->idle.timer_work, smbdirect_connection_idle_timer_work);
sc->idle.keepalive = SMBDIRECT_KEEPALIVE_PENDING;
mod_delayed_work(sc->workqueues.idle, &sc->idle.timer_work,
msecs_to_jiffies(sp->rdma_connect_timeout_msec));
return 0;
}
static int smbdirect_connect_rdma_event_handler(struct rdma_cm_id *id,
struct rdma_cm_event *event)
{
struct smbdirect_socket *sc = id->context;
u8 peer_initiator_depth;
u8 peer_responder_resources;
int ret;
/*
* cma_cm_event_handler() has
* lockdep_assert_held(&id_priv->handler_mutex);
*
* Mutexes are not allowed in interrupts,
* and we rely on not being in an interrupt here,
* as we might sleep.
*
* We didn't timeout so we cancel our idle timer,
* it will be scheduled again if needed.
*/
WARN_ON_ONCE(in_interrupt());
sc->idle.keepalive = SMBDIRECT_KEEPALIVE_NONE;
cancel_delayed_work_sync(&sc->idle.timer_work);
if (event->status || event->event != sc->rdma.expected_event) {
int lvl = SMBDIRECT_LOG_ERR;
ret = -ECONNABORTED;
if (event->event == RDMA_CM_EVENT_REJECTED)
ret = -ECONNREFUSED;
if (event->event == RDMA_CM_EVENT_DEVICE_REMOVAL)
ret = -ENETDOWN;
if (IS_ERR(SMBDIRECT_DEBUG_ERR_PTR(event->status)))
ret = event->status;
if (ret == -ENODEV)
lvl = SMBDIRECT_LOG_INFO;
smbdirect_log_rdma_event(sc, lvl,
"%s (first_error=%1pe, expected=%s) => event=%s status=%d => ret=%1pe\n",
smbdirect_socket_status_string(sc->status),
SMBDIRECT_DEBUG_ERR_PTR(sc->first_error),
rdma_event_msg(sc->rdma.expected_event),
rdma_event_msg(event->event),
event->status,
SMBDIRECT_DEBUG_ERR_PTR(ret));
smbdirect_socket_schedule_cleanup_lvl(sc,
lvl,
ret);
return 0;
}
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_INFO,
"%s (first_error=%1pe) event=%s\n",
smbdirect_socket_status_string(sc->status),
SMBDIRECT_DEBUG_ERR_PTR(sc->first_error),
rdma_event_msg(event->event));
if (sc->first_error)
return 0;
switch (event->event) {
case RDMA_CM_EVENT_ADDR_RESOLVED:
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_RESOLVE_ADDR_RUNNING))
return 0;
sc->status = SMBDIRECT_SOCKET_RESOLVE_ROUTE_NEEDED;
ret = smbdirect_connect_resolve_route(sc);
if (ret)
smbdirect_socket_schedule_cleanup(sc, ret);
return 0;
case RDMA_CM_EVENT_ROUTE_RESOLVED:
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_RESOLVE_ROUTE_RUNNING))
return 0;
sc->status = SMBDIRECT_SOCKET_RDMA_CONNECT_NEEDED;
ret = smbdirect_connect_rdma_connect(sc);
if (ret)
smbdirect_socket_schedule_cleanup(sc, ret);
return 0;
case RDMA_CM_EVENT_ESTABLISHED:
smbdirect_connection_rdma_established(sc);
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_RDMA_CONNECT_RUNNING))
return 0;
sc->status = SMBDIRECT_SOCKET_NEGOTIATE_NEEDED;
/*
* Here we work around an inconsistency between
* iWarp and other devices (at least rxe and irdma using RoCEv2)
*/
if (rdma_protocol_iwarp(id->device, id->port_num)) {
/*
* iWarp devices report the peer's values
* with the perspective of the peer here.
* Tested with siw and irdma (in iwarp mode)
* We need to change to our perspective here,
* so we need to switch the values.
*/
peer_initiator_depth = event->param.conn.responder_resources;
peer_responder_resources = event->param.conn.initiator_depth;
} else {
/*
* Non iWarp devices report the peer's values
* already changed to our perspective here.
* Tested with rxe and irdma (in roce mode).
*/
peer_initiator_depth = event->param.conn.initiator_depth;
peer_responder_resources = event->param.conn.responder_resources;
}
smbdirect_connection_negotiate_rdma_resources(sc,
peer_initiator_depth,
peer_responder_resources,
&event->param.conn);
ret = smbdirect_connect_negotiate_start(sc);
if (ret)
smbdirect_socket_schedule_cleanup(sc, ret);
return 0;
default:
break;
}
/*
* This is an internal error
*/
WARN_ON_ONCE(sc->rdma.expected_event != RDMA_CM_EVENT_ESTABLISHED);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return 0;
}
static int smbdirect_connect_negotiate_start(struct smbdirect_socket *sc)
{
const struct smbdirect_socket_parameters *sp = &sc->parameters;
struct smbdirect_recv_io *recv_io = NULL;
struct smbdirect_send_io *send_io = NULL;
struct smbdirect_negotiate_req *nreq = NULL;
int ret;
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_NEGOTIATE_NEEDED))
return sc->first_error;
sc->status = SMBDIRECT_SOCKET_NEGOTIATE_RUNNING;
ret = smbdirect_connection_create_mem_pools(sc);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_create_mem_pools() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
goto create_mem_pools_failed;
}
/*
* There is only a single batch credit
*/
atomic_set(&sc->send_io.bcredits.count, 1);
/*
* Initialize the local credits to post
* IB_WR_SEND[_WITH_INV].
*/
atomic_set(&sc->send_io.lcredits.count, sp->send_credit_target);
recv_io = smbdirect_connection_get_recv_io(sc);
if (WARN_ON_ONCE(!recv_io)) {
ret = -EINVAL;
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_get_recv_io() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
goto get_recv_io_failed;
}
recv_io->cqe.done = smbdirect_connect_negotiate_recv_done;
send_io = smbdirect_connection_alloc_send_io(sc);
if (IS_ERR(send_io)) {
ret = PTR_ERR(send_io);
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_alloc_send_io() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
goto alloc_send_io_failed;
}
send_io->cqe.done = smbdirect_connect_negotiate_send_done;
nreq = (struct smbdirect_negotiate_req *)send_io->packet;
nreq->min_version = cpu_to_le16(SMBDIRECT_V1);
nreq->max_version = cpu_to_le16(SMBDIRECT_V1);
nreq->reserved = 0;
nreq->credits_requested = cpu_to_le16(sp->send_credit_target);
nreq->preferred_send_size = cpu_to_le32(sp->max_send_size);
nreq->max_receive_size = cpu_to_le32(sp->max_recv_size);
nreq->max_fragmented_size = cpu_to_le32(sp->max_fragmented_recv_size);
smbdirect_log_negotiate(sc, SMBDIRECT_LOG_INFO,
"ReqOut: %s%x, %s%x, %s%u, %s%u, %s%u, %s%u\n",
"MinVersion=0x",
le16_to_cpu(nreq->min_version),
"MaxVersion=0x",
le16_to_cpu(nreq->max_version),
"CreditsRequested=",
le16_to_cpu(nreq->credits_requested),
"PreferredSendSize=",
le32_to_cpu(nreq->preferred_send_size),
"MaxRecvSize=",
le32_to_cpu(nreq->max_receive_size),
"MaxFragmentedSize=",
le32_to_cpu(nreq->max_fragmented_size));
send_io->sge[0].addr = ib_dma_map_single(sc->ib.dev,
nreq,
sizeof(*nreq),
DMA_TO_DEVICE);
ret = ib_dma_mapping_error(sc->ib.dev, send_io->sge[0].addr);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"ib_dma_mapping_error() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
goto dma_mapping_failed;
}
send_io->sge[0].length = sizeof(*nreq);
send_io->sge[0].lkey = sc->ib.pd->local_dma_lkey;
send_io->num_sge = 1;
ib_dma_sync_single_for_device(sc->ib.dev,
send_io->sge[0].addr,
send_io->sge[0].length,
DMA_TO_DEVICE);
smbdirect_log_rdma_send(sc, SMBDIRECT_LOG_INFO,
"sge addr=0x%llx length=%u lkey=0x%x\n",
send_io->sge[0].addr,
send_io->sge[0].length,
send_io->sge[0].lkey);
/*
* Now post the recv_io buffer in order to get
* the negotiate response
*/
sc->recv_io.expected = SMBDIRECT_EXPECT_NEGOTIATE_REP;
ret = smbdirect_connection_post_recv_io(recv_io);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_post_recv_io() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
goto post_recv_io_failed;
}
send_io->wr.next = NULL;
send_io->wr.wr_cqe = &send_io->cqe;
send_io->wr.sg_list = send_io->sge;
send_io->wr.num_sge = send_io->num_sge;
send_io->wr.opcode = IB_WR_SEND;
send_io->wr.send_flags = IB_SEND_SIGNALED;
ret = smbdirect_connection_post_send_wr(sc, &send_io->wr);
if (ret) {
/* if we reach here, post send failed */
smbdirect_log_rdma_send(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_post_send_wr() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
goto post_send_wr_failed;
}
/*
* start with the negotiate timeout and SMBDIRECT_KEEPALIVE_PENDING
* so that the timer will cause a disconnect.
*/
sc->idle.keepalive = SMBDIRECT_KEEPALIVE_PENDING;
mod_delayed_work(sc->workqueues.idle, &sc->idle.timer_work,
msecs_to_jiffies(sp->negotiate_timeout_msec));
return 0;
post_send_wr_failed:
/*
* ib_dma_unmap_single is called in
* smbdirect_connection_free_send_io()
*/
smbdirect_connection_free_send_io(send_io);
/*
* recv_io is given to the rdma layer,
* we should not put it even on error
* nor call smbdirect_connection_destroy_mem_pools()
* it will be cleaned up during disconnect.
*/
return ret;
post_recv_io_failed:
/*
* ib_dma_unmap_single is called in
* smbdirect_connection_free_send_io()
*/
dma_mapping_failed:
smbdirect_connection_free_send_io(send_io);
alloc_send_io_failed:
smbdirect_connection_put_recv_io(recv_io);
get_recv_io_failed:
smbdirect_connection_destroy_mem_pools(sc);
create_mem_pools_failed:
return ret;
}
static void smbdirect_connect_negotiate_send_done(struct ib_cq *cq, struct ib_wc *wc)
{
struct smbdirect_send_io *send_io =
container_of(wc->wr_cqe, struct smbdirect_send_io, cqe);
struct smbdirect_socket *sc = send_io->socket;
smbdirect_log_rdma_send(sc, SMBDIRECT_LOG_INFO,
"smbdirect_send_io completed. status='%s (%d)', opcode=%d\n",
ib_wc_status_msg(wc->status), wc->status, wc->opcode);
/* Note this frees wc->wr_cqe, but not wc */
smbdirect_connection_free_send_io(send_io);
atomic_dec(&sc->send_io.pending.count);
if (unlikely(wc->status != IB_WC_SUCCESS || WARN_ON_ONCE(wc->opcode != IB_WC_SEND))) {
if (wc->status != IB_WC_WR_FLUSH_ERR)
smbdirect_log_rdma_send(sc, SMBDIRECT_LOG_ERR,
"wc->status=%s (%d) wc->opcode=%d\n",
ib_wc_status_msg(wc->status), wc->status, wc->opcode);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
}
static void smbdirect_connect_negotiate_recv_work(struct work_struct *work);
static void smbdirect_connect_negotiate_recv_done(struct ib_cq *cq, struct ib_wc *wc)
{
struct smbdirect_recv_io *recv_io =
container_of(wc->wr_cqe, struct smbdirect_recv_io, cqe);
struct smbdirect_socket *sc = recv_io->socket;
unsigned long flags;
if (unlikely(wc->status != IB_WC_SUCCESS || WARN_ON_ONCE(wc->opcode != IB_WC_RECV))) {
if (wc->status != IB_WC_WR_FLUSH_ERR)
smbdirect_log_rdma_recv(sc, SMBDIRECT_LOG_ERR,
"wc->status=%s (%d) wc->opcode=%d\n",
ib_wc_status_msg(wc->status), wc->status, wc->opcode);
goto error;
}
smbdirect_log_rdma_recv(sc, SMBDIRECT_LOG_INFO,
"smbdirect_recv_io completed. status='%s (%d)', opcode=%d\n",
ib_wc_status_msg(wc->status), wc->status, wc->opcode);
/*
* This is an internal error!
*/
if (WARN_ON_ONCE(sc->recv_io.expected != SMBDIRECT_EXPECT_NEGOTIATE_REP))
goto error;
/*
* Don't reset timer to the keepalive interval in
* this will be done in smbdirect_accept_direct_negotiate_recv_work.
*/
ib_dma_sync_single_for_cpu(sc->ib.dev,
recv_io->sge.addr,
recv_io->sge.length,
DMA_FROM_DEVICE);
/*
* Only remember recv_io if it has enough bytes,
* this gives smbdirect_accept_negotiate_recv_work enough
* information in order to disconnect if it was not
* valid.
*/
sc->recv_io.reassembly.full_packet_received = true;
if (wc->byte_len >= sizeof(struct smbdirect_negotiate_resp))
smbdirect_connection_reassembly_append_recv_io(sc, recv_io, 0);
else
smbdirect_connection_put_recv_io(recv_io);
/*
* We continue via the workqueue as we may have
* complex work that might sleep.
*
* So we defer further processing of the negotiation
* to smbdirect_connect_negotiate_recv_work().
*/
spin_lock_irqsave(&sc->connect.lock, flags);
if (!sc->first_error) {
INIT_WORK(&sc->connect.work, smbdirect_connect_negotiate_recv_work);
if (sc->status == SMBDIRECT_SOCKET_NEGOTIATE_RUNNING)
queue_work(sc->workqueues.connect, &sc->connect.work);
}
spin_unlock_irqrestore(&sc->connect.lock, flags);
return;
error:
/*
* recv_io.posted.refill_work is still disabled,
* so smbdirect_connection_put_recv_io() won't
* start it.
*/
smbdirect_connection_put_recv_io(recv_io);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
}
static void smbdirect_connect_negotiate_recv_work(struct work_struct *work)
{
struct smbdirect_socket *sc =
container_of(work, struct smbdirect_socket, connect.work);
struct smbdirect_socket_parameters *sp = &sc->parameters;
struct smbdirect_recv_io *recv_io;
struct smbdirect_negotiate_resp *nrep;
unsigned long flags;
u16 negotiated_version;
u16 credits_requested;
u16 credits_granted;
u32 status;
u32 max_readwrite_size;
u32 preferred_send_size;
u32 max_receive_size;
u32 max_fragmented_size;
int posted;
int ret;
if (sc->first_error)
return;
/*
* make sure we won't start again...
*/
disable_work(work);
/*
* Reset timer to the keepalive interval in
* order to trigger our next keepalive message.
*/
sc->idle.keepalive = SMBDIRECT_KEEPALIVE_NONE;
mod_delayed_work(sc->workqueues.idle, &sc->idle.timer_work,
msecs_to_jiffies(sp->keepalive_interval_msec));
/*
* If smbdirect_connect_negotiate_recv_done() detected an
* invalid request we want to disconnect.
*/
recv_io = smbdirect_connection_reassembly_first_recv_io(sc);
if (!recv_io) {
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
spin_lock_irqsave(&sc->recv_io.reassembly.lock, flags);
sc->recv_io.reassembly.queue_length--;
list_del(&recv_io->list);
spin_unlock_irqrestore(&sc->recv_io.reassembly.lock, flags);
smbdirect_connection_put_recv_io(recv_io);
if (SMBDIRECT_CHECK_STATUS_DISCONNECT(sc, SMBDIRECT_SOCKET_NEGOTIATE_RUNNING))
return;
/*
* Note recv_io is already part of the free list,
* as we just called smbdirect_connection_put_recv_io(),
* but it won't be reused before we call
* smbdirect_connection_recv_io_refill() below.
*/
nrep = (struct smbdirect_negotiate_resp *)recv_io->packet;
negotiated_version = le16_to_cpu(nrep->negotiated_version);
credits_requested = le16_to_cpu(nrep->credits_requested);
credits_granted = le16_to_cpu(nrep->credits_granted);
status = le32_to_cpu(nrep->status);
max_readwrite_size = le32_to_cpu(nrep->max_readwrite_size);
preferred_send_size = le32_to_cpu(nrep->preferred_send_size);
max_receive_size = le32_to_cpu(nrep->max_receive_size);
max_fragmented_size = le32_to_cpu(nrep->max_fragmented_size);
smbdirect_log_negotiate(sc, SMBDIRECT_LOG_INFO,
"RepIn: %s%x, %s%x, %s%x, %s%u, %s%u, %s%x, %s%u, %s%u, %s%u, %s%u\n",
"MinVersion=0x",
le16_to_cpu(nrep->min_version),
"MaxVersion=0x",
le16_to_cpu(nrep->max_version),
"NegotiatedVersion=0x",
le16_to_cpu(nrep->negotiated_version),
"CreditsRequested=",
le16_to_cpu(nrep->credits_requested),
"CreditsGranted=",
le16_to_cpu(nrep->credits_granted),
"Status=0x",
le32_to_cpu(nrep->status),
"MaxReadWriteSize=",
le32_to_cpu(nrep->max_readwrite_size),
"PreferredSendSize=",
le32_to_cpu(nrep->preferred_send_size),
"MaxRecvSize=",
le32_to_cpu(nrep->max_receive_size),
"MaxFragmentedSize=",
le32_to_cpu(nrep->max_fragmented_size));
if (negotiated_version != SMBDIRECT_V1) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: negotiated_version=0x%x\n",
negotiated_version);
smbdirect_socket_schedule_cleanup(sc, -ECONNREFUSED);
return;
}
if (status != le32_to_cpu(STATUS_SUCCESS)) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: status=0x%x != 0x0\n",
status);
smbdirect_socket_schedule_cleanup(sc, -ECONNREFUSED);
return;
}
if (max_receive_size < SMBDIRECT_MIN_RECEIVE_SIZE) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: max_receive_size=%u < %u\n",
max_receive_size,
SMBDIRECT_MIN_RECEIVE_SIZE);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
if (max_fragmented_size < SMBDIRECT_MIN_FRAGMENTED_SIZE) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: max_fragmented_size=%u < %u\n",
max_fragmented_size,
SMBDIRECT_MIN_FRAGMENTED_SIZE);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
if (credits_granted == 0) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: credits_granted == 0\n");
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
if (credits_requested == 0) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: credits_requested == 0\n");
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
if (preferred_send_size > sp->max_recv_size) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: preferred_send_size=%u > max_recv_size=%u\n",
preferred_send_size,
sp->max_recv_size);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
/*
* We take the value from the peer, which is checked to be higher than 0,
* but we limit it to the max value we support in order to have
* the main logic simpler.
*/
sc->recv_io.credits.target = credits_requested;
sc->recv_io.credits.target = min_t(u16, sc->recv_io.credits.target,
sp->recv_credit_max);
/*
* At least the value of SMBDIRECT_MIN_RECEIVE_SIZE is used.
*/
sp->max_recv_size = min_t(u32, sp->max_recv_size, preferred_send_size);
sp->max_recv_size = max_t(u32, sp->max_recv_size, SMBDIRECT_MIN_RECEIVE_SIZE);
/*
* We already sent our sp->max_fragmented_recv_size
* to the peer, so we can't lower it here any more.
*
* TODO: but if the peer lowered sp->max_recv_size
* we will have to adjust our number of buffers.
*
* But for now we keep it as the cifs.ko code
* worked before.
*/
/*
* Note nrep->max_receive_size was already checked against
* SMBDIRECT_MIN_RECEIVE_SIZE above.
*/
sp->max_send_size = min_t(u32, sp->max_send_size, max_receive_size);
/*
* Make sure the resulting max_frmr_depth is at least 1,
* which means max_read_write_size needs to be at least PAGE_SIZE.
*/
sp->max_read_write_size = min_t(u32, sp->max_frmr_depth * PAGE_SIZE,
max_readwrite_size);
if (sp->max_read_write_size < PAGE_SIZE) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"invalid: max_readwrite_size=%u < PAGE_SIZE(%lu)\n",
max_readwrite_size,
PAGE_SIZE);
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
sp->max_frmr_depth = sp->max_read_write_size / PAGE_SIZE;
/*
* Note nrep->credits_granted was already checked against 0 above.
*/
atomic_set(&sc->send_io.credits.count, credits_granted);
/*
* Note nrep->max_fragmented_size was already checked against
* SMBDIRECT_MIN_FRAGMENTED_SIZE above.
*/
sp->max_fragmented_send_size = max_fragmented_size;
ret = smbdirect_connection_create_mr_list(sc);
if (ret) {
smbdirect_log_rdma_mr(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_create_mr_list() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
smbdirect_socket_schedule_cleanup(sc, ret);
return;
}
/*
* Prepare for receiving data_transfer messages
*/
sc->recv_io.reassembly.full_packet_received = true;
sc->recv_io.expected = SMBDIRECT_EXPECT_DATA_TRANSFER;
list_for_each_entry(recv_io, &sc->recv_io.free.list, list)
recv_io->cqe.done = smbdirect_connection_recv_io_done;
recv_io = NULL;
/*
* We should at least post 1 smbdirect_recv_io!
*/
posted = smbdirect_connection_recv_io_refill(sc);
if (posted < 1) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connection_recv_io_refill() failed %1pe\n",
SMBDIRECT_DEBUG_ERR_PTR(ret));
smbdirect_socket_schedule_cleanup(sc, -ECONNABORTED);
return;
}
/*
* smbdirect_connection_negotiation_done()
* will setup all required things and wake up
* the waiter.
*/
smbdirect_connection_negotiation_done(sc);
}
int smbdirect_connect_sync(struct smbdirect_socket *sc,
const struct sockaddr *dst)
{
int ret;
ret = smbdirect_connect(sc, dst);
if (ret) {
smbdirect_log_rdma_event(sc, SMBDIRECT_LOG_ERR,
"smbdirect_connect(%pISpsfc) failed %1pe\n",
dst, SMBDIRECT_DEBUG_ERR_PTR(ret));
return ret;
}
ret = smbdirect_connection_wait_for_connected(sc);
if (ret) {
int lvl = SMBDIRECT_LOG_ERR;
if (ret == -ENODEV)
lvl = SMBDIRECT_LOG_INFO;
smbdirect_log_rdma_event(sc, lvl,
"wait for smbdirect_connect(%pISpsfc) failed %1pe\n",
dst, SMBDIRECT_DEBUG_ERR_PTR(ret));
return ret;
}
return 0;
}
__SMBDIRECT_EXPORT_SYMBOL__(smbdirect_connect_sync);