]> git.proxmox.com Git - mirror_ovs.git/blob - lib/vconn.c
openflow: Table maintenance commands for Geneve options.
[mirror_ovs.git] / lib / vconn.c
1 /*
2 * Copyright (c) 2008, 2009, 2010, 2011, 2012, 2013, 2014, 2015 Nicira, Inc.
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #include <config.h>
18 #include "vconn-provider.h"
19 #include <errno.h>
20 #include <inttypes.h>
21 #include <netinet/in.h>
22 #include <poll.h>
23 #include <stdlib.h>
24 #include <string.h>
25 #include "coverage.h"
26 #include "dynamic-string.h"
27 #include "fatal-signal.h"
28 #include "flow.h"
29 #include "ofp-errors.h"
30 #include "ofp-msgs.h"
31 #include "ofp-print.h"
32 #include "ofp-util.h"
33 #include "ofpbuf.h"
34 #include "openflow/nicira-ext.h"
35 #include "openflow/openflow.h"
36 #include "packets.h"
37 #include "poll-loop.h"
38 #include "random.h"
39 #include "util.h"
40 #include "openvswitch/vlog.h"
41 #include "socket-util.h"
42
43 VLOG_DEFINE_THIS_MODULE(vconn);
44
45 COVERAGE_DEFINE(vconn_open);
46 COVERAGE_DEFINE(vconn_received);
47 COVERAGE_DEFINE(vconn_sent);
48
49 /* State of an active vconn.*/
50 enum vconn_state {
51 /* This is the ordinary progression of states. */
52 VCS_CONNECTING, /* Underlying vconn is not connected. */
53 VCS_SEND_HELLO, /* Waiting to send OFPT_HELLO message. */
54 VCS_RECV_HELLO, /* Waiting to receive OFPT_HELLO message. */
55 VCS_CONNECTED, /* Connection established. */
56
57 /* These states are entered only when something goes wrong. */
58 VCS_SEND_ERROR, /* Sending OFPT_ERROR message. */
59 VCS_DISCONNECTED /* Connection failed or connection closed. */
60 };
61
62 static const struct vconn_class *vconn_classes[] = {
63 &tcp_vconn_class,
64 &unix_vconn_class,
65 #ifdef HAVE_OPENSSL
66 &ssl_vconn_class,
67 #endif
68 };
69
70 static const struct pvconn_class *pvconn_classes[] = {
71 &ptcp_pvconn_class,
72 &punix_pvconn_class,
73 #ifdef HAVE_OPENSSL
74 &pssl_pvconn_class,
75 #endif
76 };
77
78 /* Rate limit for individual OpenFlow messages going over the vconn, output at
79 * DBG level. This is very high because, if these are enabled, it is because
80 * we really need to see them. */
81 static struct vlog_rate_limit ofmsg_rl = VLOG_RATE_LIMIT_INIT(600, 600);
82
83 /* Rate limit for OpenFlow message parse errors. These always indicate a bug
84 * in the peer and so there's not much point in showing a lot of them. */
85 static struct vlog_rate_limit bad_ofmsg_rl = VLOG_RATE_LIMIT_INIT(1, 5);
86
87 static int do_recv(struct vconn *, struct ofpbuf **);
88 static int do_send(struct vconn *, struct ofpbuf *);
89
90 /* Check the validity of the vconn class structures. */
91 static void
92 check_vconn_classes(void)
93 {
94 #ifndef NDEBUG
95 size_t i;
96
97 for (i = 0; i < ARRAY_SIZE(vconn_classes); i++) {
98 const struct vconn_class *class = vconn_classes[i];
99 ovs_assert(class->name != NULL);
100 ovs_assert(class->open != NULL);
101 if (class->close || class->recv || class->send
102 || class->run || class->run_wait || class->wait) {
103 ovs_assert(class->close != NULL);
104 ovs_assert(class->recv != NULL);
105 ovs_assert(class->send != NULL);
106 ovs_assert(class->wait != NULL);
107 } else {
108 /* This class delegates to another one. */
109 }
110 }
111
112 for (i = 0; i < ARRAY_SIZE(pvconn_classes); i++) {
113 const struct pvconn_class *class = pvconn_classes[i];
114 ovs_assert(class->name != NULL);
115 ovs_assert(class->listen != NULL);
116 if (class->close || class->accept || class->wait) {
117 ovs_assert(class->close != NULL);
118 ovs_assert(class->accept != NULL);
119 ovs_assert(class->wait != NULL);
120 } else {
121 /* This class delegates to another one. */
122 }
123 }
124 #endif
125 }
126
127 /* Prints information on active (if 'active') and passive (if 'passive')
128 * connection methods supported by the vconn. If 'bootstrap' is true, also
129 * advertises options to bootstrap the CA certificate. */
130 void
131 vconn_usage(bool active, bool passive, bool bootstrap OVS_UNUSED)
132 {
133 /* Really this should be implemented via callbacks into the vconn
134 * providers, but that seems too heavy-weight to bother with at the
135 * moment. */
136
137 printf("\n");
138 if (active) {
139 printf("Active OpenFlow connection methods:\n");
140 printf(" tcp:IP[:PORT] "
141 "PORT (default: %d) at remote IP\n", OFP_PORT);
142 #ifdef HAVE_OPENSSL
143 printf(" ssl:IP[:PORT] "
144 "SSL PORT (default: %d) at remote IP\n", OFP_PORT);
145 #endif
146 printf(" unix:FILE Unix domain socket named FILE\n");
147 }
148
149 if (passive) {
150 printf("Passive OpenFlow connection methods:\n");
151 printf(" ptcp:[PORT][:IP] "
152 "listen to TCP PORT (default: %d) on IP\n",
153 OFP_PORT);
154 #ifdef HAVE_OPENSSL
155 printf(" pssl:[PORT][:IP] "
156 "listen for SSL on PORT (default: %d) on IP\n",
157 OFP_PORT);
158 #endif
159 printf(" punix:FILE "
160 "listen on Unix domain socket FILE\n");
161 }
162
163 #ifdef HAVE_OPENSSL
164 printf("PKI configuration (required to use SSL):\n"
165 " -p, --private-key=FILE file with private key\n"
166 " -c, --certificate=FILE file with certificate for private key\n"
167 " -C, --ca-cert=FILE file with peer CA certificate\n");
168 if (bootstrap) {
169 printf(" --bootstrap-ca-cert=FILE file with peer CA certificate "
170 "to read or create\n");
171 }
172 #endif
173 }
174
175 /* Given 'name', a connection name in the form "TYPE:ARGS", stores the class
176 * named "TYPE" into '*classp' and returns 0. Returns EAFNOSUPPORT and stores
177 * a null pointer into '*classp' if 'name' is in the wrong form or if no such
178 * class exists. */
179 static int
180 vconn_lookup_class(const char *name, const struct vconn_class **classp)
181 {
182 size_t prefix_len;
183
184 prefix_len = strcspn(name, ":");
185 if (name[prefix_len] != '\0') {
186 size_t i;
187
188 for (i = 0; i < ARRAY_SIZE(vconn_classes); i++) {
189 const struct vconn_class *class = vconn_classes[i];
190 if (strlen(class->name) == prefix_len
191 && !memcmp(class->name, name, prefix_len)) {
192 *classp = class;
193 return 0;
194 }
195 }
196 }
197
198 *classp = NULL;
199 return EAFNOSUPPORT;
200 }
201
202 /* Returns 0 if 'name' is a connection name in the form "TYPE:ARGS" and TYPE is
203 * a supported connection type, otherwise EAFNOSUPPORT. */
204 int
205 vconn_verify_name(const char *name)
206 {
207 const struct vconn_class *class;
208 return vconn_lookup_class(name, &class);
209 }
210
211 /* Attempts to connect to an OpenFlow device. 'name' is a connection name in
212 * the form "TYPE:ARGS", where TYPE is an active vconn class's name and ARGS
213 * are vconn class-specific.
214 *
215 * The vconn will automatically negotiate an OpenFlow protocol version
216 * acceptable to both peers on the connection. The version negotiated will be
217 * one of those in the 'allowed_versions' bitmap: version 'x' is allowed if
218 * allowed_versions & (1 << x) is nonzero. If 'allowed_versions' is zero, then
219 * OFPUTIL_DEFAULT_VERSIONS are allowed.
220 *
221 * Returns 0 if successful, otherwise a positive errno value. If successful,
222 * stores a pointer to the new connection in '*vconnp', otherwise a null
223 * pointer. */
224 int
225 vconn_open(const char *name, uint32_t allowed_versions, uint8_t dscp,
226 struct vconn **vconnp)
227 {
228 const struct vconn_class *class;
229 struct vconn *vconn;
230 char *suffix_copy;
231 int error;
232
233 COVERAGE_INC(vconn_open);
234 check_vconn_classes();
235
236 if (!allowed_versions) {
237 allowed_versions = OFPUTIL_DEFAULT_VERSIONS;
238 }
239
240 /* Look up the class. */
241 error = vconn_lookup_class(name, &class);
242 if (!class) {
243 goto error;
244 }
245
246 /* Call class's "open" function. */
247 suffix_copy = xstrdup(strchr(name, ':') + 1);
248 error = class->open(name, allowed_versions, suffix_copy, &vconn, dscp);
249 free(suffix_copy);
250 if (error) {
251 goto error;
252 }
253
254 /* Success. */
255 ovs_assert(vconn->state != VCS_CONNECTING || vconn->vclass->connect);
256 *vconnp = vconn;
257 return 0;
258
259 error:
260 *vconnp = NULL;
261 return error;
262 }
263
264 /* Allows 'vconn' to perform maintenance activities, such as flushing output
265 * buffers. */
266 void
267 vconn_run(struct vconn *vconn)
268 {
269 if (vconn->state == VCS_CONNECTING ||
270 vconn->state == VCS_SEND_HELLO ||
271 vconn->state == VCS_RECV_HELLO) {
272 vconn_connect(vconn);
273 }
274
275 if (vconn->vclass->run) {
276 (vconn->vclass->run)(vconn);
277 }
278 }
279
280 /* Arranges for the poll loop to wake up when 'vconn' needs to perform
281 * maintenance activities. */
282 void
283 vconn_run_wait(struct vconn *vconn)
284 {
285 if (vconn->state == VCS_CONNECTING ||
286 vconn->state == VCS_SEND_HELLO ||
287 vconn->state == VCS_RECV_HELLO) {
288 vconn_connect_wait(vconn);
289 }
290
291 if (vconn->vclass->run_wait) {
292 (vconn->vclass->run_wait)(vconn);
293 }
294 }
295
296 /* Returns 0 if 'vconn' is healthy (connecting or connected), a positive errno
297 * value if the connection died abnormally (connection failed or aborted), or
298 * EOF if the connection was closed in a normal way. */
299 int
300 vconn_get_status(const struct vconn *vconn)
301 {
302 return vconn->error == EAGAIN ? 0 : vconn->error;
303 }
304
305 int
306 vconn_open_block(const char *name, uint32_t allowed_versions, uint8_t dscp,
307 struct vconn **vconnp)
308 {
309 struct vconn *vconn;
310 int error;
311
312 fatal_signal_run();
313
314 error = vconn_open(name, allowed_versions, dscp, &vconn);
315 if (!error) {
316 error = vconn_connect_block(vconn);
317 }
318
319 if (error) {
320 vconn_close(vconn);
321 *vconnp = NULL;
322 } else {
323 *vconnp = vconn;
324 }
325 return error;
326 }
327
328 /* Closes 'vconn'. */
329 void
330 vconn_close(struct vconn *vconn)
331 {
332 if (vconn != NULL) {
333 char *name = vconn->name;
334 (vconn->vclass->close)(vconn);
335 free(name);
336 }
337 }
338
339 /* Returns the name of 'vconn', that is, the string passed to vconn_open(). */
340 const char *
341 vconn_get_name(const struct vconn *vconn)
342 {
343 return vconn->name;
344 }
345
346 /* Returns the allowed_versions of 'vconn', that is,
347 * the allowed_versions passed to vconn_open(). */
348 uint32_t
349 vconn_get_allowed_versions(const struct vconn *vconn)
350 {
351 return vconn->allowed_versions;
352 }
353
354 /* Sets the allowed_versions of 'vconn', overriding
355 * the allowed_versions passed to vconn_open(). */
356 void
357 vconn_set_allowed_versions(struct vconn *vconn, uint32_t allowed_versions)
358 {
359 vconn->allowed_versions = allowed_versions;
360 }
361
362 /* Returns the OpenFlow version negotiated with the peer, or -1 if version
363 * negotiation is not yet complete.
364 *
365 * A vconn that has successfully connected (that is, vconn_connect() or
366 * vconn_send() or vconn_recv() has returned 0) always negotiated a version. */
367 int
368 vconn_get_version(const struct vconn *vconn)
369 {
370 return vconn->version ? vconn->version : -1;
371 }
372
373 /* By default, a vconn accepts only OpenFlow messages whose version matches the
374 * one negotiated for the connection. A message received with a different
375 * version is an error that causes the vconn to drop the connection.
376 *
377 * This functions allows 'vconn' to accept messages with any OpenFlow version.
378 * This is useful in the special case where 'vconn' is used as an rconn
379 * "monitor" connection (see rconn_add_monitor()), that is, where 'vconn' is
380 * used as a target for mirroring OpenFlow messages for debugging and
381 * troubleshooting.
382 *
383 * This function should be called after a successful vconn_open() or
384 * pvconn_accept() but before the connection completes, that is, before
385 * vconn_connect() returns success. Otherwise, messages that arrive on 'vconn'
386 * beforehand with an unexpected version will the vconn to drop the
387 * connection. */
388 void
389 vconn_set_recv_any_version(struct vconn *vconn)
390 {
391 vconn->recv_any_version = true;
392 }
393
394 static void
395 vcs_connecting(struct vconn *vconn)
396 {
397 int retval = (vconn->vclass->connect)(vconn);
398 ovs_assert(retval != EINPROGRESS);
399 if (!retval) {
400 vconn->state = VCS_SEND_HELLO;
401 } else if (retval != EAGAIN) {
402 vconn->state = VCS_DISCONNECTED;
403 vconn->error = retval;
404 }
405 }
406
407 static void
408 vcs_send_hello(struct vconn *vconn)
409 {
410 struct ofpbuf *b;
411 int retval;
412
413 b = ofputil_encode_hello(vconn->allowed_versions);
414 retval = do_send(vconn, b);
415 if (!retval) {
416 vconn->state = VCS_RECV_HELLO;
417 } else {
418 ofpbuf_delete(b);
419 if (retval != EAGAIN) {
420 vconn->state = VCS_DISCONNECTED;
421 vconn->error = retval;
422 }
423 }
424 }
425
426 static char *
427 version_bitmap_to_string(uint32_t bitmap)
428 {
429 struct ds s;
430
431 ds_init(&s);
432 if (!bitmap) {
433 ds_put_cstr(&s, "no versions");
434 } else if (is_pow2(bitmap)) {
435 ds_put_cstr(&s, "version ");
436 ofputil_format_version(&s, leftmost_1bit_idx(bitmap));
437 } else if (is_pow2((bitmap >> 1) + 1)) {
438 ds_put_cstr(&s, "version ");
439 ofputil_format_version(&s, leftmost_1bit_idx(bitmap));
440 ds_put_cstr(&s, " and earlier");
441 } else {
442 ds_put_cstr(&s, "versions ");
443 ofputil_format_version_bitmap(&s, bitmap);
444 }
445 return ds_steal_cstr(&s);
446 }
447
448 static void
449 vcs_recv_hello(struct vconn *vconn)
450 {
451 struct ofpbuf *b;
452 int retval;
453
454 retval = do_recv(vconn, &b);
455 if (!retval) {
456 enum ofptype type;
457 enum ofperr error;
458
459 error = ofptype_decode(&type, b->data);
460 if (!error && type == OFPTYPE_HELLO) {
461 char *peer_s, *local_s;
462 uint32_t common_versions;
463
464 if (!ofputil_decode_hello(b->data, &vconn->peer_versions)) {
465 struct ds msg = DS_EMPTY_INITIALIZER;
466 ds_put_format(&msg, "%s: unknown data in hello:\n",
467 vconn->name);
468 ds_put_hex_dump(&msg, b->data, b->size, 0, true);
469 VLOG_WARN_RL(&bad_ofmsg_rl, "%s", ds_cstr(&msg));
470 ds_destroy(&msg);
471 }
472
473 local_s = version_bitmap_to_string(vconn->allowed_versions);
474 peer_s = version_bitmap_to_string(vconn->peer_versions);
475
476 common_versions = vconn->peer_versions & vconn->allowed_versions;
477 if (!common_versions) {
478 vconn->version = leftmost_1bit_idx(vconn->peer_versions);
479 VLOG_WARN_RL(&bad_ofmsg_rl,
480 "%s: version negotiation failed (we support "
481 "%s, peer supports %s)",
482 vconn->name, local_s, peer_s);
483 vconn->state = VCS_SEND_ERROR;
484 } else {
485 vconn->version = leftmost_1bit_idx(common_versions);
486 VLOG_DBG("%s: negotiated OpenFlow version 0x%02x "
487 "(we support %s, peer supports %s)", vconn->name,
488 vconn->version, local_s, peer_s);
489 vconn->state = VCS_CONNECTED;
490 }
491
492 free(local_s);
493 free(peer_s);
494
495 ofpbuf_delete(b);
496 return;
497 } else {
498 char *s = ofp_to_string(b->data, b->size, 1);
499 VLOG_WARN_RL(&bad_ofmsg_rl,
500 "%s: received message while expecting hello: %s",
501 vconn->name, s);
502 free(s);
503 retval = EPROTO;
504 ofpbuf_delete(b);
505 }
506 }
507
508 if (retval != EAGAIN) {
509 vconn->state = VCS_DISCONNECTED;
510 vconn->error = retval == EOF ? ECONNRESET : retval;
511 }
512 }
513
514 static void
515 vcs_send_error(struct vconn *vconn)
516 {
517 struct ofpbuf *b;
518 char s[128];
519 int retval;
520 char *local_s, *peer_s;
521
522 local_s = version_bitmap_to_string(vconn->allowed_versions);
523 peer_s = version_bitmap_to_string(vconn->peer_versions);
524 snprintf(s, sizeof s, "We support %s, you support %s, no common versions.",
525 local_s, peer_s);
526 free(peer_s);
527 free(local_s);
528
529 b = ofperr_encode_hello(OFPERR_OFPHFC_INCOMPATIBLE, vconn->version, s);
530 retval = do_send(vconn, b);
531 if (retval) {
532 ofpbuf_delete(b);
533 }
534 if (retval != EAGAIN) {
535 vconn->state = VCS_DISCONNECTED;
536 vconn->error = retval ? retval : EPROTO;
537 }
538 }
539
540 /* Tries to complete the connection on 'vconn'. If 'vconn''s connection is
541 * complete, returns 0 if the connection was successful or a positive errno
542 * value if it failed. If the connection is still in progress, returns
543 * EAGAIN. */
544 int
545 vconn_connect(struct vconn *vconn)
546 {
547 enum vconn_state last_state;
548
549 do {
550 last_state = vconn->state;
551 switch (vconn->state) {
552 case VCS_CONNECTING:
553 vcs_connecting(vconn);
554 break;
555
556 case VCS_SEND_HELLO:
557 vcs_send_hello(vconn);
558 break;
559
560 case VCS_RECV_HELLO:
561 vcs_recv_hello(vconn);
562 break;
563
564 case VCS_CONNECTED:
565 return 0;
566
567 case VCS_SEND_ERROR:
568 vcs_send_error(vconn);
569 break;
570
571 case VCS_DISCONNECTED:
572 return vconn->error;
573
574 default:
575 OVS_NOT_REACHED();
576 }
577 } while (vconn->state != last_state);
578
579 return EAGAIN;
580 }
581
582 /* Tries to receive an OpenFlow message from 'vconn'. If successful, stores
583 * the received message into '*msgp' and returns 0. The caller is responsible
584 * for destroying the message with ofpbuf_delete(). On failure, returns a
585 * positive errno value and stores a null pointer into '*msgp'. On normal
586 * connection close, returns EOF.
587 *
588 * vconn_recv will not block waiting for a packet to arrive. If no packets
589 * have been received, it returns EAGAIN immediately. */
590 int
591 vconn_recv(struct vconn *vconn, struct ofpbuf **msgp)
592 {
593 struct ofpbuf *msg;
594 int retval;
595
596 retval = vconn_connect(vconn);
597 if (!retval) {
598 retval = do_recv(vconn, &msg);
599 }
600 if (!retval && !vconn->recv_any_version) {
601 const struct ofp_header *oh = msg->data;
602 if (oh->version != vconn->version) {
603 enum ofptype type;
604
605 if (ofptype_decode(&type, msg->data)
606 || (type != OFPTYPE_HELLO &&
607 type != OFPTYPE_ERROR &&
608 type != OFPTYPE_ECHO_REQUEST &&
609 type != OFPTYPE_ECHO_REPLY)) {
610 struct ofpbuf *reply;
611
612 VLOG_ERR_RL(&bad_ofmsg_rl, "%s: received OpenFlow version "
613 "0x%02"PRIx8" != expected %02x",
614 vconn->name, oh->version, vconn->version);
615
616 /* Send a "bad version" reply, if we can. */
617 reply = ofperr_encode_reply(OFPERR_OFPBRC_BAD_VERSION, oh);
618 retval = vconn_send(vconn, reply);
619 if (retval) {
620 VLOG_INFO_RL(&bad_ofmsg_rl,
621 "%s: failed to queue error reply (%s)",
622 vconn->name, ovs_strerror(retval));
623 ofpbuf_delete(reply);
624 }
625
626 /* Suppress the received message, as if it had not arrived. */
627 retval = EAGAIN;
628 ofpbuf_delete(msg);
629 }
630 }
631 }
632
633 *msgp = retval ? NULL : msg;
634 return retval;
635 }
636
637 static int
638 do_recv(struct vconn *vconn, struct ofpbuf **msgp)
639 {
640 int retval = (vconn->vclass->recv)(vconn, msgp);
641 if (!retval) {
642 COVERAGE_INC(vconn_received);
643 if (VLOG_IS_DBG_ENABLED()) {
644 char *s = ofp_to_string((*msgp)->data, (*msgp)->size, 1);
645 VLOG_DBG_RL(&ofmsg_rl, "%s: received: %s", vconn->name, s);
646 free(s);
647 }
648 }
649 return retval;
650 }
651
652 /* Tries to queue 'msg' for transmission on 'vconn'. If successful, returns 0,
653 * in which case ownership of 'msg' is transferred to the vconn. Success does
654 * not guarantee that 'msg' has been or ever will be delivered to the peer,
655 * only that it has been queued for transmission.
656 *
657 * Returns a positive errno value on failure, in which case the caller
658 * retains ownership of 'msg'.
659 *
660 * vconn_send will not block. If 'msg' cannot be immediately accepted for
661 * transmission, it returns EAGAIN immediately. */
662 int
663 vconn_send(struct vconn *vconn, struct ofpbuf *msg)
664 {
665 int retval = vconn_connect(vconn);
666 if (!retval) {
667 retval = do_send(vconn, msg);
668 }
669 return retval;
670 }
671
672 static int
673 do_send(struct vconn *vconn, struct ofpbuf *msg)
674 {
675 int retval;
676
677 ovs_assert(msg->size >= sizeof(struct ofp_header));
678
679 ofpmsg_update_length(msg);
680 if (!VLOG_IS_DBG_ENABLED()) {
681 COVERAGE_INC(vconn_sent);
682 retval = (vconn->vclass->send)(vconn, msg);
683 } else {
684 char *s = ofp_to_string(msg->data, msg->size, 1);
685 retval = (vconn->vclass->send)(vconn, msg);
686 if (retval != EAGAIN) {
687 VLOG_DBG_RL(&ofmsg_rl, "%s: sent (%s): %s",
688 vconn->name, ovs_strerror(retval), s);
689 }
690 free(s);
691 }
692 return retval;
693 }
694
695 /* Same as vconn_connect(), except that it waits until the connection on
696 * 'vconn' completes or fails. Thus, it will never return EAGAIN. */
697 int
698 vconn_connect_block(struct vconn *vconn)
699 {
700 int error;
701
702 while ((error = vconn_connect(vconn)) == EAGAIN) {
703 vconn_run(vconn);
704 vconn_run_wait(vconn);
705 vconn_connect_wait(vconn);
706 poll_block();
707 }
708 ovs_assert(error != EINPROGRESS);
709
710 return error;
711 }
712
713 /* Same as vconn_send, except that it waits until 'msg' can be transmitted. */
714 int
715 vconn_send_block(struct vconn *vconn, struct ofpbuf *msg)
716 {
717 int retval;
718
719 fatal_signal_run();
720
721 while ((retval = vconn_send(vconn, msg)) == EAGAIN) {
722 vconn_run(vconn);
723 vconn_run_wait(vconn);
724 vconn_send_wait(vconn);
725 poll_block();
726 }
727 return retval;
728 }
729
730 /* Same as vconn_recv, except that it waits until a message is received. */
731 int
732 vconn_recv_block(struct vconn *vconn, struct ofpbuf **msgp)
733 {
734 int retval;
735
736 fatal_signal_run();
737
738 while ((retval = vconn_recv(vconn, msgp)) == EAGAIN) {
739 vconn_run(vconn);
740 vconn_run_wait(vconn);
741 vconn_recv_wait(vconn);
742 poll_block();
743 }
744 return retval;
745 }
746
747 static int
748 vconn_recv_xid__(struct vconn *vconn, ovs_be32 xid, struct ofpbuf **replyp,
749 void (*error_reporter)(const struct ofp_header *))
750 {
751 for (;;) {
752 ovs_be32 recv_xid;
753 struct ofpbuf *reply;
754 const struct ofp_header *oh;
755 enum ofptype type;
756 int error;
757
758 error = vconn_recv_block(vconn, &reply);
759 if (error) {
760 *replyp = NULL;
761 return error;
762 }
763 oh = reply->data;
764 recv_xid = oh->xid;
765 if (xid == recv_xid) {
766 *replyp = reply;
767 return 0;
768 }
769
770 error = ofptype_decode(&type, oh);
771 if (!error && type == OFPTYPE_ERROR && error_reporter) {
772 error_reporter(oh);
773 } else {
774 VLOG_DBG_RL(&bad_ofmsg_rl, "%s: received reply with xid %08"PRIx32
775 " != expected %08"PRIx32,
776 vconn->name, ntohl(recv_xid), ntohl(xid));
777 }
778 ofpbuf_delete(reply);
779 }
780 }
781
782 /* Waits until a message with a transaction ID matching 'xid' is received on
783 * 'vconn'. Returns 0 if successful, in which case the reply is stored in
784 * '*replyp' for the caller to examine and free. Otherwise returns a positive
785 * errno value, or EOF, and sets '*replyp' to null.
786 *
787 * 'request' is always destroyed, regardless of the return value. */
788 int
789 vconn_recv_xid(struct vconn *vconn, ovs_be32 xid, struct ofpbuf **replyp)
790 {
791 return vconn_recv_xid__(vconn, xid, replyp, NULL);
792 }
793
794 static int
795 vconn_transact__(struct vconn *vconn, struct ofpbuf *request,
796 struct ofpbuf **replyp,
797 void (*error_reporter)(const struct ofp_header *))
798 {
799 ovs_be32 send_xid = ((struct ofp_header *) request->data)->xid;
800 int error;
801
802 *replyp = NULL;
803 error = vconn_send_block(vconn, request);
804 if (error) {
805 ofpbuf_delete(request);
806 }
807 return error ? error : vconn_recv_xid__(vconn, send_xid, replyp,
808 error_reporter);
809 }
810
811 /* Sends 'request' to 'vconn' and blocks until it receives a reply with a
812 * matching transaction ID. Returns 0 if successful, in which case the reply
813 * is stored in '*replyp' for the caller to examine and free. Otherwise
814 * returns a positive errno value, or EOF, and sets '*replyp' to null.
815 *
816 * 'request' should be an OpenFlow request that requires a reply. Otherwise,
817 * if there is no reply, this function can end up blocking forever (or until
818 * the peer drops the connection).
819 *
820 * 'request' is always destroyed, regardless of the return value. */
821 int
822 vconn_transact(struct vconn *vconn, struct ofpbuf *request,
823 struct ofpbuf **replyp)
824 {
825 return vconn_transact__(vconn, request, replyp, NULL);
826 }
827
828 /* Sends 'request' followed by a barrier request to 'vconn', then blocks until
829 * it receives a reply to the barrier. If successful, stores the reply to
830 * 'request' in '*replyp', if one was received, and otherwise NULL, then
831 * returns 0. Otherwise returns a positive errno value, or EOF, and sets
832 * '*replyp' to null.
833 *
834 * This function is useful for sending an OpenFlow request that doesn't
835 * ordinarily include a reply but might report an error in special
836 * circumstances.
837 *
838 * 'request' is always destroyed, regardless of the return value. */
839 int
840 vconn_transact_noreply(struct vconn *vconn, struct ofpbuf *request,
841 struct ofpbuf **replyp)
842 {
843 ovs_be32 request_xid;
844 ovs_be32 barrier_xid;
845 struct ofpbuf *barrier;
846 int error;
847
848 *replyp = NULL;
849
850 /* Send request. */
851 request_xid = ((struct ofp_header *) request->data)->xid;
852 error = vconn_send_block(vconn, request);
853 if (error) {
854 ofpbuf_delete(request);
855 return error;
856 }
857
858 /* Send barrier. */
859 barrier = ofputil_encode_barrier_request(vconn_get_version(vconn));
860 barrier_xid = ((struct ofp_header *) barrier->data)->xid;
861 error = vconn_send_block(vconn, barrier);
862 if (error) {
863 ofpbuf_delete(barrier);
864 return error;
865 }
866
867 for (;;) {
868 struct ofpbuf *msg;
869 ovs_be32 msg_xid;
870 int error;
871
872 error = vconn_recv_block(vconn, &msg);
873 if (error) {
874 ofpbuf_delete(*replyp);
875 *replyp = NULL;
876 return error;
877 }
878
879 msg_xid = ((struct ofp_header *) msg->data)->xid;
880 if (msg_xid == request_xid) {
881 if (*replyp) {
882 VLOG_WARN_RL(&bad_ofmsg_rl, "%s: duplicate replies with "
883 "xid %08"PRIx32, vconn->name, ntohl(msg_xid));
884 ofpbuf_delete(*replyp);
885 }
886 *replyp = msg;
887 } else {
888 ofpbuf_delete(msg);
889 if (msg_xid == barrier_xid) {
890 return 0;
891 } else {
892 VLOG_DBG_RL(&bad_ofmsg_rl, "%s: reply with xid %08"PRIx32
893 " != expected %08"PRIx32" or %08"PRIx32,
894 vconn->name, ntohl(msg_xid),
895 ntohl(request_xid), ntohl(barrier_xid));
896 }
897 }
898 }
899 }
900
901 /* vconn_transact_noreply() for a list of "struct ofpbuf"s, sent one by one.
902 * All of the requests on 'requests' are always destroyed, regardless of the
903 * return value. */
904 int
905 vconn_transact_multiple_noreply(struct vconn *vconn, struct ovs_list *requests,
906 struct ofpbuf **replyp)
907 {
908 struct ofpbuf *request;
909
910 LIST_FOR_EACH_POP (request, list_node, requests) {
911 int error;
912
913 error = vconn_transact_noreply(vconn, request, replyp);
914 if (error || *replyp) {
915 ofpbuf_list_delete(requests);
916 return error;
917 }
918 }
919
920 *replyp = NULL;
921 return 0;
922 }
923
924 static enum ofperr
925 vconn_bundle_reply_validate(struct ofpbuf *reply,
926 struct ofputil_bundle_ctrl_msg *request,
927 void (*error_reporter)(const struct ofp_header *))
928 {
929 const struct ofp_header *oh;
930 enum ofptype type;
931 enum ofperr error;
932 struct ofputil_bundle_ctrl_msg rbc;
933
934 oh = reply->data;
935 error = ofptype_decode(&type, oh);
936 if (error) {
937 return error;
938 }
939
940 if (type == OFPTYPE_ERROR) {
941 error_reporter(oh);
942 return ofperr_decode_msg(oh, NULL);
943 }
944 if (type != OFPTYPE_BUNDLE_CONTROL) {
945 return OFPERR_OFPBRC_BAD_TYPE;
946 }
947
948 error = ofputil_decode_bundle_ctrl(oh, &rbc);
949 if (error) {
950 return error;
951 }
952
953 if (rbc.bundle_id != request->bundle_id) {
954 return OFPERR_OFPBFC_BAD_ID;
955 }
956
957 if (rbc.type != request->type + 1) {
958 return OFPERR_OFPBFC_BAD_TYPE;
959 }
960
961 return 0;
962 }
963
964 /* Send bundle control message 'bc' of 'type' via 'vconn', and wait for either
965 * an error or the corresponding bundle control message response.
966 *
967 * 'error_reporter' is called for any error responses received, which may be
968 * also regarding earlier OpenFlow messages than this bundle control message.
969 *
970 * Returns errno value, or 0 when successful. */
971 static int
972 vconn_bundle_control_transact(struct vconn *vconn,
973 struct ofputil_bundle_ctrl_msg *bc,
974 uint16_t type,
975 void (*error_reporter)(const struct ofp_header *))
976 {
977 struct ofpbuf *request, *reply;
978 int error;
979 enum ofperr ofperr;
980
981 bc->type = type;
982 request = ofputil_encode_bundle_ctrl_request(vconn->version, bc);
983 ofpmsg_update_length(request);
984 error = vconn_transact__(vconn, request, &reply, error_reporter);
985 if (error) {
986 return error;
987 }
988
989 ofperr = vconn_bundle_reply_validate(reply, bc, error_reporter);
990 if (ofperr) {
991 VLOG_WARN_RL(&bad_ofmsg_rl, "Bundle %s failed (%s).",
992 type == OFPBCT_OPEN_REQUEST ? "open"
993 : type == OFPBCT_CLOSE_REQUEST ? "close"
994 : type == OFPBCT_COMMIT_REQUEST ? "commit"
995 : type == OFPBCT_DISCARD_REQUEST ? "discard"
996 : "control message",
997 ofperr_to_string(ofperr));
998 }
999 ofpbuf_delete(reply);
1000
1001 return ofperr ? EPROTO : 0;
1002 }
1003
1004 /* Checks if error responses can be received on 'vconn'. */
1005 static void
1006 vconn_recv_error(struct vconn *vconn,
1007 void (*error_reporter)(const struct ofp_header *))
1008 {
1009 int error;
1010
1011 do {
1012 struct ofpbuf *reply;
1013
1014 error = vconn_recv(vconn, &reply);
1015 if (!error) {
1016 const struct ofp_header *oh;
1017 enum ofptype type;
1018 enum ofperr ofperr;
1019
1020 oh = reply->data;
1021 ofperr = ofptype_decode(&type, oh);
1022 if (!ofperr && type == OFPTYPE_ERROR) {
1023 error_reporter(oh);
1024 } else {
1025 VLOG_DBG_RL(&bad_ofmsg_rl,
1026 "%s: received unexpected reply with xid %08"PRIx32,
1027 vconn->name, ntohl(oh->xid));
1028 }
1029 ofpbuf_delete(reply);
1030 }
1031 } while (!error);
1032 }
1033
1034 static int
1035 vconn_bundle_add_msg(struct vconn *vconn, struct ofputil_bundle_ctrl_msg *bc,
1036 struct ofpbuf *msg,
1037 void (*error_reporter)(const struct ofp_header *))
1038 {
1039 struct ofputil_bundle_add_msg bam;
1040 struct ofpbuf *request;
1041 int error;
1042
1043 bam.bundle_id = bc->bundle_id;
1044 bam.flags = bc->flags;
1045 bam.msg = msg->data;
1046
1047 request = ofputil_encode_bundle_add(vconn->version, &bam);
1048 ofpmsg_update_length(request);
1049
1050 error = vconn_send_block(vconn, request);
1051 if (!error) {
1052 /* Check for an error return, so that the socket buffer does not become
1053 * full of errors. */
1054 vconn_recv_error(vconn, error_reporter);
1055 }
1056 return error;
1057 }
1058
1059 int
1060 vconn_bundle_transact(struct vconn *vconn, struct ovs_list *requests,
1061 uint16_t flags,
1062 void (*error_reporter)(const struct ofp_header *))
1063 {
1064 struct ofputil_bundle_ctrl_msg bc;
1065 struct ofpbuf *request;
1066 int error;
1067
1068 memset(&bc, 0, sizeof bc);
1069 bc.flags = flags;
1070 error = vconn_bundle_control_transact(vconn, &bc, OFPBCT_OPEN_REQUEST,
1071 error_reporter);
1072 if (error) {
1073 return error;
1074 }
1075
1076 LIST_FOR_EACH (request, list_node, requests) {
1077 error = vconn_bundle_add_msg(vconn, &bc, request, error_reporter);
1078 if (error) {
1079 break;
1080 }
1081 }
1082
1083 if (!error) {
1084 error = vconn_bundle_control_transact(vconn, &bc,
1085 OFPBCT_COMMIT_REQUEST,
1086 error_reporter);
1087 } else {
1088 /* Do not overwrite the error code from vconn_bundle_add_msg().
1089 * Any error in discard should be either reported or logged, so it
1090 * should not get lost. */
1091 vconn_bundle_control_transact(vconn, &bc, OFPBCT_DISCARD_REQUEST,
1092 error_reporter);
1093 }
1094 return error;
1095 }
1096
1097 void
1098 vconn_wait(struct vconn *vconn, enum vconn_wait_type wait)
1099 {
1100 ovs_assert(wait == WAIT_CONNECT || wait == WAIT_RECV || wait == WAIT_SEND);
1101
1102 switch (vconn->state) {
1103 case VCS_CONNECTING:
1104 wait = WAIT_CONNECT;
1105 break;
1106
1107 case VCS_SEND_HELLO:
1108 case VCS_SEND_ERROR:
1109 wait = WAIT_SEND;
1110 break;
1111
1112 case VCS_RECV_HELLO:
1113 wait = WAIT_RECV;
1114 break;
1115
1116 case VCS_CONNECTED:
1117 break;
1118
1119 case VCS_DISCONNECTED:
1120 poll_immediate_wake();
1121 return;
1122 }
1123 (vconn->vclass->wait)(vconn, wait);
1124 }
1125
1126 void
1127 vconn_connect_wait(struct vconn *vconn)
1128 {
1129 vconn_wait(vconn, WAIT_CONNECT);
1130 }
1131
1132 void
1133 vconn_recv_wait(struct vconn *vconn)
1134 {
1135 vconn_wait(vconn, WAIT_RECV);
1136 }
1137
1138 void
1139 vconn_send_wait(struct vconn *vconn)
1140 {
1141 vconn_wait(vconn, WAIT_SEND);
1142 }
1143
1144 /* Given 'name', a connection name in the form "TYPE:ARGS", stores the class
1145 * named "TYPE" into '*classp' and returns 0. Returns EAFNOSUPPORT and stores
1146 * a null pointer into '*classp' if 'name' is in the wrong form or if no such
1147 * class exists. */
1148 static int
1149 pvconn_lookup_class(const char *name, const struct pvconn_class **classp)
1150 {
1151 size_t prefix_len;
1152
1153 prefix_len = strcspn(name, ":");
1154 if (name[prefix_len] != '\0') {
1155 size_t i;
1156
1157 for (i = 0; i < ARRAY_SIZE(pvconn_classes); i++) {
1158 const struct pvconn_class *class = pvconn_classes[i];
1159 if (strlen(class->name) == prefix_len
1160 && !memcmp(class->name, name, prefix_len)) {
1161 *classp = class;
1162 return 0;
1163 }
1164 }
1165 }
1166
1167 *classp = NULL;
1168 return EAFNOSUPPORT;
1169 }
1170
1171 /* Returns 0 if 'name' is a connection name in the form "TYPE:ARGS" and TYPE is
1172 * a supported connection type, otherwise EAFNOSUPPORT. */
1173 int
1174 pvconn_verify_name(const char *name)
1175 {
1176 const struct pvconn_class *class;
1177 return pvconn_lookup_class(name, &class);
1178 }
1179
1180 /* Attempts to start listening for OpenFlow connections. 'name' is a
1181 * connection name in the form "TYPE:ARGS", where TYPE is an passive vconn
1182 * class's name and ARGS are vconn class-specific.
1183 *
1184 * vconns accepted by the pvconn will automatically negotiate an OpenFlow
1185 * protocol version acceptable to both peers on the connection. The version
1186 * negotiated will be one of those in the 'allowed_versions' bitmap: version
1187 * 'x' is allowed if allowed_versions & (1 << x) is nonzero. If
1188 * 'allowed_versions' is zero, then OFPUTIL_DEFAULT_VERSIONS are allowed.
1189 *
1190 * Returns 0 if successful, otherwise a positive errno value. If successful,
1191 * stores a pointer to the new connection in '*pvconnp', otherwise a null
1192 * pointer. */
1193 int
1194 pvconn_open(const char *name, uint32_t allowed_versions, uint8_t dscp,
1195 struct pvconn **pvconnp)
1196 {
1197 const struct pvconn_class *class;
1198 struct pvconn *pvconn;
1199 char *suffix_copy;
1200 int error;
1201
1202 check_vconn_classes();
1203
1204 if (!allowed_versions) {
1205 allowed_versions = OFPUTIL_DEFAULT_VERSIONS;
1206 }
1207
1208 /* Look up the class. */
1209 error = pvconn_lookup_class(name, &class);
1210 if (!class) {
1211 goto error;
1212 }
1213
1214 /* Call class's "open" function. */
1215 suffix_copy = xstrdup(strchr(name, ':') + 1);
1216 error = class->listen(name, allowed_versions, suffix_copy, &pvconn, dscp);
1217 free(suffix_copy);
1218 if (error) {
1219 goto error;
1220 }
1221
1222 /* Success. */
1223 *pvconnp = pvconn;
1224 return 0;
1225
1226 error:
1227 *pvconnp = NULL;
1228 return error;
1229 }
1230
1231 /* Returns the name that was used to open 'pvconn'. The caller must not
1232 * modify or free the name. */
1233 const char *
1234 pvconn_get_name(const struct pvconn *pvconn)
1235 {
1236 return pvconn->name;
1237 }
1238
1239 /* Closes 'pvconn'. */
1240 void
1241 pvconn_close(struct pvconn *pvconn)
1242 {
1243 if (pvconn != NULL) {
1244 char *name = pvconn->name;
1245 (pvconn->pvclass->close)(pvconn);
1246 free(name);
1247 }
1248 }
1249
1250 /* Tries to accept a new connection on 'pvconn'. If successful, stores the new
1251 * connection in '*new_vconn' and returns 0. Otherwise, returns a positive
1252 * errno value.
1253 *
1254 * The new vconn will automatically negotiate an OpenFlow protocol version
1255 * acceptable to both peers on the connection. The version negotiated will be
1256 * no lower than 'min_version' and no higher than 'max_version'.
1257 *
1258 * pvconn_accept() will not block waiting for a connection. If no connection
1259 * is ready to be accepted, it returns EAGAIN immediately. */
1260 int
1261 pvconn_accept(struct pvconn *pvconn, struct vconn **new_vconn)
1262 {
1263 int retval = (pvconn->pvclass->accept)(pvconn, new_vconn);
1264 if (retval) {
1265 *new_vconn = NULL;
1266 } else {
1267 ovs_assert((*new_vconn)->state != VCS_CONNECTING
1268 || (*new_vconn)->vclass->connect);
1269 }
1270 return retval;
1271 }
1272
1273 void
1274 pvconn_wait(struct pvconn *pvconn)
1275 {
1276 (pvconn->pvclass->wait)(pvconn);
1277 }
1278
1279 /* Initializes 'vconn' as a new vconn named 'name', implemented via 'class'.
1280 * The initial connection status, supplied as 'connect_status', is interpreted
1281 * as follows:
1282 *
1283 * - 0: 'vconn' is connected. Its 'send' and 'recv' functions may be
1284 * called in the normal fashion.
1285 *
1286 * - EAGAIN: 'vconn' is trying to complete a connection. Its 'connect'
1287 * function should be called to complete the connection.
1288 *
1289 * - Other positive errno values indicate that the connection failed with
1290 * the specified error.
1291 *
1292 * After calling this function, vconn_close() must be used to destroy 'vconn',
1293 * otherwise resources will be leaked.
1294 *
1295 * The caller retains ownership of 'name'. */
1296 void
1297 vconn_init(struct vconn *vconn, const struct vconn_class *class,
1298 int connect_status, const char *name, uint32_t allowed_versions)
1299 {
1300 memset(vconn, 0, sizeof *vconn);
1301 vconn->vclass = class;
1302 vconn->state = (connect_status == EAGAIN ? VCS_CONNECTING
1303 : !connect_status ? VCS_SEND_HELLO
1304 : VCS_DISCONNECTED);
1305 vconn->error = connect_status;
1306 vconn->allowed_versions = allowed_versions;
1307 vconn->name = xstrdup(name);
1308 ovs_assert(vconn->state != VCS_CONNECTING || class->connect);
1309 }
1310
1311 void
1312 pvconn_init(struct pvconn *pvconn, const struct pvconn_class *class,
1313 const char *name, uint32_t allowed_versions)
1314 {
1315 pvconn->pvclass = class;
1316 pvconn->name = xstrdup(name);
1317 pvconn->allowed_versions = allowed_versions;
1318 }