ixgbe: reset before SRIOV init to avoid mailbox issues
[cascardo/linux.git] / net / rxrpc / sendmsg.c
1 /* AF_RXRPC sendmsg() implementation.
2  *
3  * Copyright (C) 2007, 2016 Red Hat, Inc. All Rights Reserved.
4  * Written by David Howells (dhowells@redhat.com)
5  *
6  * This program is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU General Public Licence
8  * as published by the Free Software Foundation; either version
9  * 2 of the Licence, or (at your option) any later version.
10  */
11
12 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
13
14 #include <linux/net.h>
15 #include <linux/gfp.h>
16 #include <linux/skbuff.h>
17 #include <linux/export.h>
18 #include <net/sock.h>
19 #include <net/af_rxrpc.h>
20 #include "ar-internal.h"
21
/*
 * Operation requested by a sendmsg() call.  rxrpc_sendmsg_cmsg() starts from
 * RXRPC_CMD_SEND_DATA and switches to another command when it finds the
 * matching control message.
 */
22 enum rxrpc_command {
23         RXRPC_CMD_SEND_DATA,            /* send data message (default when no command cmsg is given) */
24         RXRPC_CMD_SEND_ABORT,           /* request abort generation (RXRPC_ABORT cmsg) */
25         RXRPC_CMD_ACCEPT,               /* [server] accept incoming call (RXRPC_ACCEPT cmsg) */
26         RXRPC_CMD_REJECT_BUSY,          /* [server] reject a call as busy; NOTE(review): no cmsg in this file selects it */
27 };
28
29 /*
30  * wait for space to appear in the transmit/ACK window
31  * - caller holds the socket locked
32  */
33 static int rxrpc_wait_for_tx_window(struct rxrpc_sock *rx,
34                                     struct rxrpc_call *call,
35                                     long *timeo)
36 {
37         DECLARE_WAITQUEUE(myself, current);
38         int ret;
39
40         _enter(",{%u,%u,%u}",
41                call->tx_hard_ack, call->tx_top, call->tx_winsize);
42
43         add_wait_queue(&call->waitq, &myself);
44
45         for (;;) {
46                 set_current_state(TASK_INTERRUPTIBLE);
47                 ret = 0;
48                 if (call->tx_top - call->tx_hard_ack < call->tx_winsize)
49                         break;
50                 if (call->state >= RXRPC_CALL_COMPLETE) {
51                         ret = -call->error;
52                         break;
53                 }
54                 if (signal_pending(current)) {
55                         ret = sock_intr_errno(*timeo);
56                         break;
57                 }
58
59                 trace_rxrpc_transmit(call, rxrpc_transmit_wait);
60                 release_sock(&rx->sk);
61                 *timeo = schedule_timeout(*timeo);
62                 lock_sock(&rx->sk);
63         }
64
65         remove_wait_queue(&call->waitq, &myself);
66         set_current_state(TASK_RUNNING);
67         _leave(" = %d", ret);
68         return ret;
69 }
70
71 /*
72  * Schedule an instant Tx resend.
73  */
74 static inline void rxrpc_instant_resend(struct rxrpc_call *call, int ix)
75 {
76         spin_lock_bh(&call->lock);
77
78         if (call->state < RXRPC_CALL_COMPLETE) {
79                 call->rxtx_annotations[ix] = RXRPC_TX_ANNO_RETRANS;
80                 if (!test_and_set_bit(RXRPC_CALL_EV_RESEND, &call->events))
81                         rxrpc_queue_call(call);
82         }
83
84         spin_unlock_bh(&call->lock);
85 }
86
87 /*
88  * Queue a DATA packet for transmission, set the resend timeout and send the
89  * packet immediately
90  */
91 static void rxrpc_queue_packet(struct rxrpc_call *call, struct sk_buff *skb,
92                                bool last)
93 {
94         struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
95         rxrpc_seq_t seq = sp->hdr.seq;
96         int ret, ix;
97
98         _net("queue skb %p [%d]", skb, seq);
99
100         ASSERTCMP(seq, ==, call->tx_top + 1);
101
102         ix = seq & RXRPC_RXTX_BUFF_MASK;
103         rxrpc_get_skb(skb, rxrpc_skb_tx_got);
104         call->rxtx_annotations[ix] = RXRPC_TX_ANNO_UNACK;
105         smp_wmb();
106         call->rxtx_buffer[ix] = skb;
107         call->tx_top = seq;
108         if (last) {
109                 set_bit(RXRPC_CALL_TX_LAST, &call->flags);
110                 trace_rxrpc_transmit(call, rxrpc_transmit_queue_last);
111         } else if (sp->hdr.flags & RXRPC_REQUEST_ACK) {
112                 trace_rxrpc_transmit(call, rxrpc_transmit_queue_reqack);
113         } else {
114                 trace_rxrpc_transmit(call, rxrpc_transmit_queue);
115         }
116
117         if (last || call->state == RXRPC_CALL_SERVER_ACK_REQUEST) {
118                 _debug("________awaiting reply/ACK__________");
119                 write_lock_bh(&call->state_lock);
120                 switch (call->state) {
121                 case RXRPC_CALL_CLIENT_SEND_REQUEST:
122                         call->state = RXRPC_CALL_CLIENT_AWAIT_REPLY;
123                         break;
124                 case RXRPC_CALL_SERVER_ACK_REQUEST:
125                         call->state = RXRPC_CALL_SERVER_SEND_REPLY;
126                         if (!last)
127                                 break;
128                 case RXRPC_CALL_SERVER_SEND_REPLY:
129                         call->state = RXRPC_CALL_SERVER_AWAIT_ACK;
130                         break;
131                 default:
132                         break;
133                 }
134                 write_unlock_bh(&call->state_lock);
135         }
136
137         _proto("Tx DATA %%%u { #%u }", sp->hdr.serial, sp->hdr.seq);
138
139         if (seq == 1 && rxrpc_is_client_call(call))
140                 rxrpc_expose_client_call(call);
141
142         sp->resend_at = jiffies + rxrpc_resend_timeout;
143         ret = rxrpc_send_data_packet(call->conn, skb);
144         if (ret < 0) {
145                 _debug("need instant resend %d", ret);
146                 rxrpc_instant_resend(call, ix);
147         }
148
149         rxrpc_free_skb(skb, rxrpc_skb_tx_freed);
150         _leave("");
151 }
152
153 /*
154  * Convert a host-endian header into a network-endian header.
155  */
156 static void rxrpc_insert_header(struct sk_buff *skb)
157 {
158         struct rxrpc_wire_header whdr;
159         struct rxrpc_skb_priv *sp = rxrpc_skb(skb);
160
161         whdr.epoch      = htonl(sp->hdr.epoch);
162         whdr.cid        = htonl(sp->hdr.cid);
163         whdr.callNumber = htonl(sp->hdr.callNumber);
164         whdr.seq        = htonl(sp->hdr.seq);
165         whdr.serial     = htonl(sp->hdr.serial);
166         whdr.type       = sp->hdr.type;
167         whdr.flags      = sp->hdr.flags;
168         whdr.userStatus = sp->hdr.userStatus;
169         whdr.securityIndex = sp->hdr.securityIndex;
170         whdr._rsvd      = htons(sp->hdr._rsvd);
171         whdr.serviceId  = htons(sp->hdr.serviceId);
172
173         memcpy(skb->head, &whdr, sizeof(whdr));
174 }
175
176 /*
177  * send data through a socket
178  * - must be called in process context
179  * - caller holds the socket locked
     *
     * The payload of @msg is copied into DATA packets; each packet is handed to
     * rxrpc_queue_packet() once it is full, or once the message is exhausted and
     * MSG_MORE is not set.  A packet that is still being filled on exit is parked
     * in call->tx_pending and picked up again by the next invocation.
     *
     * @len is not referenced in the body; the amount to send is taken from
     * msg_data_left(@msg).
     *
     * Returns the number of bytes copied from @msg on success (also when an
     * allocation or window wait fails after some data was copied), or a negative
     * error: -EPIPE if the socket has an error or is shut down for sending,
     * -EAGAIN if nonblocking and the Tx window is full, -EFAULT if copying from
     * the message failed, the negated call error if the call completed
     * meanwhile, or whatever the window wait, skb allocation or packet
     * securing step reported.
180  */
181 static int rxrpc_send_data(struct rxrpc_sock *rx,
182                            struct rxrpc_call *call,
183                            struct msghdr *msg, size_t len)
184 {
185         struct rxrpc_skb_priv *sp;
186         struct sk_buff *skb;
187         struct sock *sk = &rx->sk;
188         long timeo;
189         bool more;
190         int ret, copied;
191
192         timeo = sock_sndtimeo(sk, msg->msg_flags & MSG_DONTWAIT);
193
194         /* this should be in poll */
195         sk_clear_bit(SOCKWQ_ASYNC_NOSPACE, sk);
196
197         if (sk->sk_err || (sk->sk_shutdown & SEND_SHUTDOWN))
198                 return -EPIPE;
199
            /* With MSG_MORE a short final packet is kept back rather than
             * queued, and no packet is flagged as the last one.
             */
200         more = msg->msg_flags & MSG_MORE;
201
            /* Take over any partially filled packet left by a previous call;
             * it is put back at "out" if still incomplete.
             */
202         skb = call->tx_pending;
203         call->tx_pending = NULL;
204         rxrpc_see_skb(skb, rxrpc_skb_tx_seen);
205
206         copied = 0;
207         do {
208                 if (!skb) {
209                         size_t size, chunk, max, space;
210
211                         _debug("alloc");
212
                            /* Tx window full: fail with -EAGAIN if nonblocking,
                             * otherwise sleep until there is room.
                             */
213                         if (call->tx_top - call->tx_hard_ack >=
214                             call->tx_winsize) {
215                                 ret = -EAGAIN;
216                                 if (msg->msg_flags & MSG_DONTWAIT)
217                                         goto maybe_error;
218                                 ret = rxrpc_wait_for_tx_window(rx, call,
219                                                                &timeo);
220                                 if (ret < 0)
221                                         goto maybe_error;
222                         }
223
                            /* Largest payload: the jumbo data length less the
                             * security overhead, rounded down to the connection's
                             * alignment (the masking assumes size_align is a
                             * power of two - TODO confirm).
                             */
224                         max = RXRPC_JUMBO_DATALEN;
225                         max -= call->conn->security_size;
226                         max &= ~(call->conn->size_align - 1UL);
227
                            /* Only shrink the buffer to the remaining data if no
                             * more data is to follow.
                             */
228                         chunk = max;
229                         if (chunk > msg_data_left(msg) && !more)
230                                 chunk = msg_data_left(msg);
231
                            /* Add alignment slack beyond the payload; the padding
                             * added before securing the packet is put there.
                             */
232                         space = chunk + call->conn->size_align;
233                         space &= ~(call->conn->size_align - 1UL);
234
235                         size = space + call->conn->header_size;
236
237                         _debug("SIZE: %zu/%zu/%zu", chunk, space, size);
238
239                         /* create a buffer that we can retain until it's ACK'd */
240                         skb = sock_alloc_send_skb(
241                                 sk, size, msg->msg_flags & MSG_DONTWAIT, &ret);
242                         if (!skb)
243                                 goto maybe_error;
244
245                         rxrpc_new_skb(skb, rxrpc_skb_tx_new);
246
247                         _debug("ALLOC SEND %p", skb);
248
                            /* skb->mark is used below as the count of data bytes
                             * added to this packet, so it must start at zero.
                             */
249                         ASSERTCMP(skb->mark, ==, 0);
250
                            /* Reserve room for the header and account for it in
                             * skb->len; the header bytes themselves are written
                             * at skb->head once the packet is complete.
                             */
251                         _debug("HS: %u", call->conn->header_size);
252                         skb_reserve(skb, call->conn->header_size);
253                         skb->len += call->conn->header_size;
254
                            /* sp->remain is the number of data bytes that may
                             * still be added, capped by the buffer's tailroom.
                             */
255                         sp = rxrpc_skb(skb);
256                         sp->remain = chunk;
257                         if (sp->remain > skb_tailroom(skb))
258                                 sp->remain = skb_tailroom(skb);
259
260                         _net("skb: hr %d, tr %d, hl %d, rm %d",
261                                skb_headroom(skb),
262                                skb_tailroom(skb),
263                                skb_headlen(skb),
264                                sp->remain);
265
266                         skb->ip_summed = CHECKSUM_UNNECESSARY;
267                 }
268
269                 _debug("append");
270                 sp = rxrpc_skb(skb);
271
272                 /* append next segment of data to the current buffer */
273                 if (msg_data_left(msg) > 0) {
                            /* Copy as much as fits: limited by the tailroom, the
                             * data left in the message and the packet's remaining
                             * payload allowance.
                             */
274                         int copy = skb_tailroom(skb);
275                         ASSERTCMP(copy, >, 0);
276                         if (copy > msg_data_left(msg))
277                                 copy = msg_data_left(msg);
278                         if (copy > sp->remain)
279                                 copy = sp->remain;
280
281                         _debug("add");
282                         ret = skb_add_data(skb, &msg->msg_iter, copy);
283                         _debug("added");
284                         if (ret < 0)
285                                 goto efault;
286                         sp->remain -= copy;
287                         skb->mark += copy;
288                         copied += copy;
289                 }
290
291                 /* check for the far side aborting the call or a network error
292                  * occurring */
293                 if (call->state == RXRPC_CALL_COMPLETE)
294                         goto call_terminated;
295
296                 /* add the packet to the send queue if it's now full */
                    /* (or if the message is exhausted and no more is to follow) */
297                 if (sp->remain <= 0 ||
298                     (msg_data_left(msg) == 0 && !more)) {
299                         struct rxrpc_connection *conn = call->conn;
300                         uint32_t seq;
301                         size_t pad;
302
303                         /* pad out if we're using security */
                            /* so that security_size plus the data length is a
                             * multiple of size_align
                             */
304                         if (conn->security_ix) {
305                                 pad = conn->security_size + skb->mark;
306                                 pad = conn->size_align - pad;
307                                 pad &= conn->size_align - 1;
308                                 _debug("pad %zu", pad);
309                                 if (pad)
310                                         memset(skb_put(skb, pad), 0, pad);
311                         }
312
313                         seq = call->tx_top + 1;
314
                            /* Fill in the host-endian header kept in the skb's
                             * private data.
                             */
315                         sp->hdr.epoch   = conn->proto.epoch;
316                         sp->hdr.cid     = call->cid;
317                         sp->hdr.callNumber = call->call_id;
318                         sp->hdr.seq     = seq;
319                         sp->hdr.serial  = atomic_inc_return(&conn->serial);
320                         sp->hdr.type    = RXRPC_PACKET_TYPE_DATA;
321                         sp->hdr.userStatus = 0;
322                         sp->hdr.securityIndex = call->security_ix;
323                         sp->hdr._rsvd   = 0;
324                         sp->hdr.serviceId = call->service_id;
325
                            /* LAST_PACKET when this ends the message; otherwise
                             * MORE_PACKETS if the Tx window still has room.  An
                             * ACK is requested on odd sequence numbers while the
                             * caller has more data to come (the test parses as
                             * more && (seq & 1)).
                             */
326                         sp->hdr.flags = conn->out_clientflag;
327                         if (msg_data_left(msg) == 0 && !more)
328                                 sp->hdr.flags |= RXRPC_LAST_PACKET;
329                         else if (call->tx_top - call->tx_hard_ack <
330                                  call->tx_winsize)
331                                 sp->hdr.flags |= RXRPC_MORE_PACKETS;
332                         if (more && seq & 1)
333                                 sp->hdr.flags |= RXRPC_REQUEST_ACK;
334
                            /* The security op is given the data length and a
                             * pointer to just past the wire header.  On failure
                             * the skb stays in hand and is parked in tx_pending
                             * at "out".
                             */
335                         ret = conn->security->secure_packet(
336                                 call, skb, skb->mark,
337                                 skb->head + sizeof(struct rxrpc_wire_header));
338                         if (ret < 0)
339                                 goto out;
340
341                         rxrpc_insert_header(skb);
342                         rxrpc_queue_packet(call, skb, !msg_data_left(msg) && !more);
                            /* Handed over to the Tx buffer; start a fresh packet
                             * on the next iteration.
                             */
343                         skb = NULL;
344                 }
345         } while (msg_data_left(msg) > 0);
346
347 success:
348         ret = copied;
349 out:
            /* Park any incomplete packet (or NULL) for the next call. */
350         call->tx_pending = skb;
351         _leave(" = %d", ret);
352         return ret;
353
354 call_terminated:
            /* The call completed under us: discard the packet being built.
             * call->tx_pending was cleared on entry and is left NULL.
             */
355         rxrpc_free_skb(skb, rxrpc_skb_tx_freed);
356         _leave(" = %d", -call->error);
357         return -call->error;
358
359 maybe_error:
            /* Report a partial write in preference to the error. */
360         if (copied)
361                 goto success;
362         goto out;
363
364 efault:
            /* NOTE(review): unlike maybe_error, this returns -EFAULT even if
             * earlier data was already copied and queued.
             */
365         ret = -EFAULT;
366         goto out;
367 }
368
369 /*
370  * extract control messages from the sendmsg() control buffer
371  */
372 static int rxrpc_sendmsg_cmsg(struct msghdr *msg,
373                               unsigned long *user_call_ID,
374                               enum rxrpc_command *command,
375                               u32 *abort_code,
376                               bool *_exclusive)
377 {
378         struct cmsghdr *cmsg;
379         bool got_user_ID = false;
380         int len;
381
382         *command = RXRPC_CMD_SEND_DATA;
383
384         if (msg->msg_controllen == 0)
385                 return -EINVAL;
386
387         for_each_cmsghdr(cmsg, msg) {
388                 if (!CMSG_OK(msg, cmsg))
389                         return -EINVAL;
390
391                 len = cmsg->cmsg_len - CMSG_ALIGN(sizeof(struct cmsghdr));
392                 _debug("CMSG %d, %d, %d",
393                        cmsg->cmsg_level, cmsg->cmsg_type, len);
394
395                 if (cmsg->cmsg_level != SOL_RXRPC)
396                         continue;
397
398                 switch (cmsg->cmsg_type) {
399                 case RXRPC_USER_CALL_ID:
400                         if (msg->msg_flags & MSG_CMSG_COMPAT) {
401                                 if (len != sizeof(u32))
402                                         return -EINVAL;
403                                 *user_call_ID = *(u32 *) CMSG_DATA(cmsg);
404                         } else {
405                                 if (len != sizeof(unsigned long))
406                                         return -EINVAL;
407                                 *user_call_ID = *(unsigned long *)
408                                         CMSG_DATA(cmsg);
409                         }
410                         _debug("User Call ID %lx", *user_call_ID);
411                         got_user_ID = true;
412                         break;
413
414                 case RXRPC_ABORT:
415                         if (*command != RXRPC_CMD_SEND_DATA)
416                                 return -EINVAL;
417                         *command = RXRPC_CMD_SEND_ABORT;
418                         if (len != sizeof(*abort_code))
419                                 return -EINVAL;
420                         *abort_code = *(unsigned int *) CMSG_DATA(cmsg);
421                         _debug("Abort %x", *abort_code);
422                         if (*abort_code == 0)
423                                 return -EINVAL;
424                         break;
425
426                 case RXRPC_ACCEPT:
427                         if (*command != RXRPC_CMD_SEND_DATA)
428                                 return -EINVAL;
429                         *command = RXRPC_CMD_ACCEPT;
430                         if (len != 0)
431                                 return -EINVAL;
432                         break;
433
434                 case RXRPC_EXCLUSIVE_CALL:
435                         *_exclusive = true;
436                         if (len != 0)
437                                 return -EINVAL;
438                         break;
439                 default:
440                         return -EINVAL;
441                 }
442         }
443
444         if (!got_user_ID)
445                 return -EINVAL;
446         _leave(" = 0");
447         return 0;
448 }
449
450 /*
451  * Create a new client call for sendmsg().
452  */
453 static struct rxrpc_call *
454 rxrpc_new_client_call_for_sendmsg(struct rxrpc_sock *rx, struct msghdr *msg,
455                                   unsigned long user_call_ID, bool exclusive)
456 {
457         struct rxrpc_conn_parameters cp;
458         struct rxrpc_call *call;
459         struct key *key;
460
461         DECLARE_SOCKADDR(struct sockaddr_rxrpc *, srx, msg->msg_name);
462
463         _enter("");
464
465         if (!msg->msg_name)
466                 return ERR_PTR(-EDESTADDRREQ);
467
468         key = rx->key;
469         if (key && !rx->key->payload.data[0])
470                 key = NULL;
471
472         memset(&cp, 0, sizeof(cp));
473         cp.local                = rx->local;
474         cp.key                  = rx->key;
475         cp.security_level       = rx->min_sec_level;
476         cp.exclusive            = rx->exclusive | exclusive;
477         cp.service_id           = srx->srx_service;
478         call = rxrpc_new_client_call(rx, &cp, srx, user_call_ID, GFP_KERNEL);
479
480         _leave(" = %p\n", call);
481         return call;
482 }
483
484 /*
485  * send a message forming part of a client call through an RxRPC socket
486  * - caller holds the socket locked
487  * - the socket may be either a client socket or a server socket
488  */
489 int rxrpc_do_sendmsg(struct rxrpc_sock *rx, struct msghdr *msg, size_t len)
490 {
491         enum rxrpc_command cmd;
492         struct rxrpc_call *call;
493         unsigned long user_call_ID = 0;
494         bool exclusive = false;
495         u32 abort_code = 0;
496         int ret;
497
498         _enter("");
499
500         ret = rxrpc_sendmsg_cmsg(msg, &user_call_ID, &cmd, &abort_code,
501                                  &exclusive);
502         if (ret < 0)
503                 return ret;
504
505         if (cmd == RXRPC_CMD_ACCEPT) {
506                 if (rx->sk.sk_state != RXRPC_SERVER_LISTENING)
507                         return -EINVAL;
508                 call = rxrpc_accept_call(rx, user_call_ID, NULL);
509                 if (IS_ERR(call))
510                         return PTR_ERR(call);
511                 rxrpc_put_call(call, rxrpc_call_put);
512                 return 0;
513         }
514
515         call = rxrpc_find_call_by_user_ID(rx, user_call_ID);
516         if (!call) {
517                 if (cmd != RXRPC_CMD_SEND_DATA)
518                         return -EBADSLT;
519                 call = rxrpc_new_client_call_for_sendmsg(rx, msg, user_call_ID,
520                                                          exclusive);
521                 if (IS_ERR(call))
522                         return PTR_ERR(call);
523         }
524
525         _debug("CALL %d USR %lx ST %d on CONN %p",
526                call->debug_id, call->user_call_ID, call->state, call->conn);
527
528         if (call->state >= RXRPC_CALL_COMPLETE) {
529                 /* it's too late for this call */
530                 ret = -ESHUTDOWN;
531         } else if (cmd == RXRPC_CMD_SEND_ABORT) {
532                 ret = 0;
533                 if (rxrpc_abort_call("CMD", call, 0, abort_code, ECONNABORTED))
534                         ret = rxrpc_send_call_packet(call,
535                                                      RXRPC_PACKET_TYPE_ABORT);
536         } else if (cmd != RXRPC_CMD_SEND_DATA) {
537                 ret = -EINVAL;
538         } else if (rxrpc_is_client_call(call) &&
539                    call->state != RXRPC_CALL_CLIENT_SEND_REQUEST) {
540                 /* request phase complete for this client call */
541                 ret = -EPROTO;
542         } else if (rxrpc_is_service_call(call) &&
543                    call->state != RXRPC_CALL_SERVER_ACK_REQUEST &&
544                    call->state != RXRPC_CALL_SERVER_SEND_REPLY) {
545                 /* Reply phase not begun or not complete for service call. */
546                 ret = -EPROTO;
547         } else {
548                 ret = rxrpc_send_data(rx, call, msg, len);
549         }
550
551         rxrpc_put_call(call, rxrpc_call_put);
552         _leave(" = %d", ret);
553         return ret;
554 }
555
556 /**
557  * rxrpc_kernel_send_data - Allow a kernel service to send data on a call
558  * @sock: The socket the call is on
559  * @call: The call to send data through
560  * @msg: The data to send
561  * @len: The amount of data to send
562  *
563  * Allow a kernel service to send data on a call.  The call must be in an state
564  * appropriate to sending data.  No control data should be supplied in @msg,
565  * nor should an address be supplied.  MSG_MORE should be flagged if there's
566  * more data to come, otherwise this data will end the transmission phase.
567  */
568 int rxrpc_kernel_send_data(struct socket *sock, struct rxrpc_call *call,
569                            struct msghdr *msg, size_t len)
570 {
571         int ret;
572
573         _enter("{%d,%s},", call->debug_id, rxrpc_call_states[call->state]);
574
575         ASSERTCMP(msg->msg_name, ==, NULL);
576         ASSERTCMP(msg->msg_control, ==, NULL);
577
578         lock_sock(sock->sk);
579
580         _debug("CALL %d USR %lx ST %d on CONN %p",
581                call->debug_id, call->user_call_ID, call->state, call->conn);
582
583         if (call->state >= RXRPC_CALL_COMPLETE) {
584                 ret = -ESHUTDOWN; /* it's too late for this call */
585         } else if (call->state != RXRPC_CALL_CLIENT_SEND_REQUEST &&
586                    call->state != RXRPC_CALL_SERVER_ACK_REQUEST &&
587                    call->state != RXRPC_CALL_SERVER_SEND_REPLY) {
588                 ret = -EPROTO; /* request phase complete for this client call */
589         } else {
590                 ret = rxrpc_send_data(rxrpc_sk(sock->sk), call, msg, len);
591         }
592
593         release_sock(sock->sk);
594         _leave(" = %d", ret);
595         return ret;
596 }
597 EXPORT_SYMBOL(rxrpc_kernel_send_data);
598
599 /**
600  * rxrpc_kernel_abort_call - Allow a kernel service to abort a call
601  * @sock: The socket the call is on
602  * @call: The call to be aborted
603  * @abort_code: The abort code to stick into the ABORT packet
604  * @error: Local error value
605  * @why: 3-char string indicating why.
606  *
607  * Allow a kernel service to abort a call, if it's still in an abortable state.
608  */
609 void rxrpc_kernel_abort_call(struct socket *sock, struct rxrpc_call *call,
610                              u32 abort_code, int error, const char *why)
611 {
612         _enter("{%d},%d,%d,%s", call->debug_id, abort_code, error, why);
613
614         lock_sock(sock->sk);
615
616         if (rxrpc_abort_call(why, call, 0, abort_code, error))
617                 rxrpc_send_call_packet(call, RXRPC_PACKET_TYPE_ABORT);
618
619         release_sock(sock->sk);
620         _leave("");
621 }
622
623 EXPORT_SYMBOL(rxrpc_kernel_abort_call);