Commit 647e18e3, authored by Chuck Lever, committed by J. Bruce Fields

svcrdma: Clean up RPC-over-RDMA Call header decoder

Replace C structure-based XDR decoding with pointer arithmetic.
Pointer arithmetic is considered more portable.

Rename the "decode" functions. Nothing is decoded here, they
perform only transport header sanity checking. Use existing XDR
naming conventions to help readability.

Straight-line the hot path:
 - relocate the dprintk call sites out of line
 - remove unnecessary byte-swapping
 - reduce count of conditional branches

Deprecate RDMA_MSGP. It's not properly spec'd by RFC5666, and
therefore never used by any V1 client.

Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: J. Bruce Fields <bfields@redhat.com>
parent 98fc21d3
 /*
+ * Copyright (c) 2016 Oracle. All rights reserved.
  * Copyright (c) 2005-2006 Network Appliance, Inc. All rights reserved.
  *
  * This software is available to you under a choice of one of two
@@ -47,102 +48,43 @@
 #define RPCDBG_FACILITY RPCDBG_SVCXPRT
-/*
- * Decodes a read chunk list. The expected format is as follows:
- * descrim : xdr_one
- * position : __be32 offset into XDR stream
- * handle : __be32 RKEY
- * . . .
- * end-of-list: xdr_zero
- */
-static __be32 *decode_read_list(__be32 *va, __be32 *vaend)
+static __be32 *xdr_check_read_list(__be32 *p, __be32 *end)
 {
-	struct rpcrdma_read_chunk *ch = (struct rpcrdma_read_chunk *)va;
-	while (ch->rc_discrim != xdr_zero) {
-		if (((unsigned long)ch + sizeof(struct rpcrdma_read_chunk)) >
-		    (unsigned long)vaend) {
-			dprintk("svcrdma: vaend=%p, ch=%p\n", vaend, ch);
+	__be32 *next;
+	while (*p++ != xdr_zero) {
+		next = p + rpcrdma_readchunk_maxsz - 1;
+		if (next > end)
 			return NULL;
-		}
-		ch++;
+		p = next;
 	}
-	return &ch->rc_position;
+	return p;
 }
-/*
- * Decodes a write chunk list. The expected format is as follows:
- * descrim : xdr_one
- * nchunks : <count>
- * handle : __be32 RKEY ---+
- * length : __be32 <len of segment> |
- * offset : remove va + <count>
- * . . . |
- * ---+
- */
-static __be32 *decode_write_list(__be32 *va, __be32 *vaend)
+static __be32 *xdr_check_write_list(__be32 *p, __be32 *end)
 {
-	unsigned long start, end;
-	int nchunks;
-	struct rpcrdma_write_array *ary =
-		(struct rpcrdma_write_array *)va;
-	/* Check for not write-array */
-	if (ary->wc_discrim == xdr_zero)
-		return &ary->wc_nchunks;
-	if ((unsigned long)ary + sizeof(struct rpcrdma_write_array) >
-	    (unsigned long)vaend) {
-		dprintk("svcrdma: ary=%p, vaend=%p\n", ary, vaend);
-		return NULL;
-	}
-	nchunks = be32_to_cpu(ary->wc_nchunks);
-	start = (unsigned long)&ary->wc_array[0];
-	end = (unsigned long)vaend;
-	if (nchunks < 0 ||
-	    nchunks > (SIZE_MAX - start) / sizeof(struct rpcrdma_write_chunk) ||
-	    (start + (sizeof(struct rpcrdma_write_chunk) * nchunks)) > end) {
-		dprintk("svcrdma: ary=%p, wc_nchunks=%d, vaend=%p\n",
-			ary, nchunks, vaend);
-		return NULL;
-	}
-	/*
-	 * rs_length is the 2nd 4B field in wc_target and taking its
-	 * address skips the list terminator
-	 */
-	return &ary->wc_array[nchunks].wc_target.rs_length;
+	__be32 *next;
+	while (*p++ != xdr_zero) {
+		next = p + 1 + be32_to_cpup(p) * rpcrdma_segment_maxsz;
+		if (next > end)
+			return NULL;
+		p = next;
+	}
+	return p;
 }
-static __be32 *decode_reply_array(__be32 *va, __be32 *vaend)
+static __be32 *xdr_check_reply_chunk(__be32 *p, __be32 *end)
 {
-	unsigned long start, end;
-	int nchunks;
-	struct rpcrdma_write_array *ary =
-		(struct rpcrdma_write_array *)va;
-	/* Check for no reply-array */
-	if (ary->wc_discrim == xdr_zero)
-		return &ary->wc_nchunks;
-	if ((unsigned long)ary + sizeof(struct rpcrdma_write_array) >
-	    (unsigned long)vaend) {
-		dprintk("svcrdma: ary=%p, vaend=%p\n", ary, vaend);
-		return NULL;
-	}
-	nchunks = be32_to_cpu(ary->wc_nchunks);
-	start = (unsigned long)&ary->wc_array[0];
-	end = (unsigned long)vaend;
-	if (nchunks < 0 ||
-	    nchunks > (SIZE_MAX - start) / sizeof(struct rpcrdma_write_chunk) ||
-	    (start + (sizeof(struct rpcrdma_write_chunk) * nchunks)) > end) {
-		dprintk("svcrdma: ary=%p, wc_nchunks=%d, vaend=%p\n",
-			ary, nchunks, vaend);
-		return NULL;
+	__be32 *next;
+	if (*p++ != xdr_zero) {
+		next = p + 1 + be32_to_cpup(p) * rpcrdma_segment_maxsz;
+		if (next > end)
+			return NULL;
+		p = next;
 	}
-	return (__be32 *)&ary->wc_array[nchunks];
+	return p;
 }
 /**
@@ -158,87 +100,71 @@ static __be32 *decode_reply_array(__be32 *va, __be32 *vaend)
  */
 int svc_rdma_xdr_decode_req(struct xdr_buf *rq_arg)
 {
-	struct rpcrdma_msg *rmsgp;
-	__be32 *va, *vaend;
-	unsigned int len;
-	u32 hdr_len;
+	__be32 *p, *end, *rdma_argp;
+	unsigned int hdr_len;
 	/* Verify that there's enough bytes for header + something */
-	if (rq_arg->len <= RPCRDMA_HDRLEN_ERR) {
-		dprintk("svcrdma: header too short = %d\n",
-			rq_arg->len);
-		return -EINVAL;
-	}
-	rmsgp = (struct rpcrdma_msg *)rq_arg->head[0].iov_base;
-	if (rmsgp->rm_vers != rpcrdma_version) {
-		dprintk("%s: bad version %u\n", __func__,
-			be32_to_cpu(rmsgp->rm_vers));
-		return -EPROTONOSUPPORT;
-	}
-	switch (be32_to_cpu(rmsgp->rm_type)) {
-	case RDMA_MSG:
-	case RDMA_NOMSG:
+	if (rq_arg->len <= RPCRDMA_HDRLEN_ERR)
+		goto out_short;
+	rdma_argp = rq_arg->head[0].iov_base;
+	if (*(rdma_argp + 1) != rpcrdma_version)
+		goto out_version;
+	switch (*(rdma_argp + 3)) {
+	case rdma_msg:
+	case rdma_nomsg:
 		break;
-	case RDMA_DONE:
-		/* Just drop it */
-		dprintk("svcrdma: dropping RDMA_DONE message\n");
-		return 0;
-	case RDMA_ERROR:
-		/* Possible if this is a backchannel reply.
-		 * XXX: We should cancel this XID, though.
-		 */
-		dprintk("svcrdma: dropping RDMA_ERROR message\n");
-		return 0;
-	case RDMA_MSGP:
-		/* Pull in the extra for the padded case, bump our pointer */
-		rmsgp->rm_body.rm_padded.rm_align =
-			be32_to_cpu(rmsgp->rm_body.rm_padded.rm_align);
-		rmsgp->rm_body.rm_padded.rm_thresh =
-			be32_to_cpu(rmsgp->rm_body.rm_padded.rm_thresh);
-		va = &rmsgp->rm_body.rm_padded.rm_pempty[4];
-		rq_arg->head[0].iov_base = va;
-		len = (u32)((unsigned long)va - (unsigned long)rmsgp);
-		rq_arg->head[0].iov_len -= len;
-		if (len > rq_arg->len)
-			return -EINVAL;
-		return len;
-	default:
-		dprintk("svcrdma: bad rdma procedure (%u)\n",
-			be32_to_cpu(rmsgp->rm_type));
-		return -EINVAL;
-	}
-	/* The chunk list may contain either a read chunk list or a write
-	 * chunk list and a reply chunk list.
-	 */
-	va = &rmsgp->rm_body.rm_chunks[0];
-	vaend = (__be32 *)((unsigned long)rmsgp + rq_arg->len);
-	va = decode_read_list(va, vaend);
-	if (!va) {
-		dprintk("svcrdma: failed to decode read list\n");
-		return -EINVAL;
-	}
-	va = decode_write_list(va, vaend);
-	if (!va) {
-		dprintk("svcrdma: failed to decode write list\n");
-		return -EINVAL;
-	}
-	va = decode_reply_array(va, vaend);
-	if (!va) {
-		dprintk("svcrdma: failed to decode reply chunk\n");
-		return -EINVAL;
+	case rdma_done:
+		goto out_drop;
+	case rdma_error:
+		goto out_drop;
+	default:
+		goto out_proc;
 	}
-	rq_arg->head[0].iov_base = va;
-	hdr_len = (unsigned long)va - (unsigned long)rmsgp;
+	end = (__be32 *)((unsigned long)rdma_argp + rq_arg->len);
+	p = xdr_check_read_list(rdma_argp + 4, end);
+	if (!p)
+		goto out_inval;
+	p = xdr_check_write_list(p, end);
+	if (!p)
+		goto out_inval;
+	p = xdr_check_reply_chunk(p, end);
+	if (!p)
+		goto out_inval;
+	if (p > end)
+		goto out_inval;
+	rq_arg->head[0].iov_base = p;
+	hdr_len = (unsigned long)p - (unsigned long)rdma_argp;
 	rq_arg->head[0].iov_len -= hdr_len;
 	return hdr_len;
+out_short:
+	dprintk("svcrdma: header too short = %d\n", rq_arg->len);
+	return -EINVAL;
+out_version:
+	dprintk("svcrdma: bad xprt version: %u\n",
+		be32_to_cpup(rdma_argp + 1));
+	return -EPROTONOSUPPORT;
+out_drop:
+	dprintk("svcrdma: dropping RDMA_DONE/ERROR message\n");
+	return 0;
+out_proc:
+	dprintk("svcrdma: bad rdma procedure (%u)\n",
+		be32_to_cpup(rdma_argp + 3));
+	return -EINVAL;
+out_inval:
+	dprintk("svcrdma: failed to parse transport header\n");
+	return -EINVAL;
 }
 int svc_rdma_xdr_encode_error(struct svcxprt_rdma *xprt,
...
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment