X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=lib%2Frconn.c;h=ea45134fea3bcaf02ec4a34a12abe104a530b9af;hb=6f643e4946016399f0b217c2226284e3892b6267;hp=181cae59940b89c2390ddc37f5edb97de698b938;hpb=3b01baa3970139c3a195017ab1ea3e42761e3db2;p=sliver-openvswitch.git diff --git a/lib/rconn.c b/lib/rconn.c index 181cae599..ea45134fe 100644 --- a/lib/rconn.c +++ b/lib/rconn.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2008, 2009 Nicira Networks. + * Copyright (c) 2008, 2009, 2010 Nicira Networks. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -76,6 +76,7 @@ struct rconn { time_t last_connected; unsigned int packets_sent; unsigned int seqno; + int last_error; /* In S_ACTIVE and S_IDLE, probably_admitted reports whether we believe * that the peer has made a (positive) admission control decision on our @@ -111,6 +112,18 @@ struct rconn { * a response. */ int probe_interval; /* Secs of inactivity before sending probe. */ + /* When we create a vconn we obtain these values, to save them past the end + * of the vconn's lifetime. Otherwise, in-band control will only allow + * traffic when a vconn is actually open, but it is nice to allow ARP to + * complete even between connection attempts, and it is also polite to + * allow traffic from other switches to go through to the controller + * whether or not we are connected. + * + * We don't cache the local port, because that changes from one connection + * attempt to the next. */ + uint32_t local_ip, remote_ip; + uint16_t remote_port; + /* Messages sent or received are copied to the monitor connections. */ #define MAX_MONITORS 8 struct vconn *monitors[8]; @@ -121,8 +134,10 @@ static unsigned int elapsed_in_this_state(const struct rconn *); static unsigned int timeout(const struct rconn *); static bool timed_out(const struct rconn *); static void state_transition(struct rconn *, enum state); +static void set_vconn_name(struct rconn *, const char *name); static int try_send(struct rconn *); static int reconnect(struct rconn *); +static void report_error(struct rconn *, int error); static void disconnect(struct rconn *, int error); static void flush_queue(struct rconn *); static void question_connectivity(struct rconn *); @@ -159,11 +174,11 @@ rconn_new_from_vconn(const char *name, struct vconn *vconn) * 'max_backoff' is the maximum number of seconds between attempts to connect * to the peer. The actual interval starts at 1 second and doubles on each * failure until it reaches 'max_backoff'. If 0 is specified, the default of - * 60 seconds is used. */ + * 8 seconds is used. */ struct rconn * rconn_create(int probe_interval, int max_backoff) { - struct rconn *rc = xcalloc(1, sizeof *rc); + struct rconn *rc = xzalloc(sizeof *rc); rc->state = S_VOID; rc->state_entered = time_now(); @@ -175,7 +190,7 @@ rconn_create(int probe_interval, int max_backoff) queue_init(&rc->txq); rc->backoff = 0; - rc->max_backoff = max_backoff ? max_backoff : 60; + rc->max_backoff = max_backoff ? max_backoff : 8; rc->backoff_deadline = TIME_MIN; rc->last_received = time_now(); rc->last_connected = time_now(); @@ -236,8 +251,7 @@ int rconn_connect(struct rconn *rc, const char *name) { rconn_disconnect(rc); - free(rc->name); - rc->name = xstrdup(name); + set_vconn_name(rc, name); rc->reliable = true; return reconnect(rc); } @@ -248,8 +262,7 @@ rconn_connect_unreliably(struct rconn *rc, { assert(vconn != NULL); rconn_disconnect(rc); - free(rc->name); - rc->name = xstrdup(name); + set_vconn_name(rc, name); rc->reliable = false; rc->vconn = vconn; rc->last_connected = time_now(); @@ -261,6 +274,7 @@ void rconn_reconnect(struct rconn *rc) { if (rc->state & (S_ACTIVE | S_IDLE)) { + VLOG_INFO("%s: disconnecting", rc->name); disconnect(rc, 0); } } @@ -273,8 +287,7 @@ rconn_disconnect(struct rconn *rc) vconn_close(rc->vconn); rc->vconn = NULL; } - free(rc->name); - rc->name = xstrdup("void"); + set_vconn_name(rc, "void"); rc->reliable = false; rc->backoff = 0; @@ -303,13 +316,13 @@ rconn_destroy(struct rconn *rc) } static unsigned int -timeout_VOID(const struct rconn *rc UNUSED) +timeout_VOID(const struct rconn *rc OVS_UNUSED) { return UINT_MAX; } static void -run_VOID(struct rconn *rc UNUSED) +run_VOID(struct rconn *rc OVS_UNUSED) { /* Nothing to do. */ } @@ -323,12 +336,15 @@ reconnect(struct rconn *rc) rc->n_attempted_connections++; retval = vconn_open(rc->name, OFP_VERSION, &rc->vconn); if (!retval) { + rc->remote_ip = vconn_get_remote_ip(rc->vconn); + rc->local_ip = vconn_get_local_ip(rc->vconn); + rc->remote_port = vconn_get_remote_port(rc->vconn); rc->backoff_deadline = time_now() + rc->backoff; state_transition(rc, S_CONNECTING); } else { VLOG_WARN("%s: connection failed (%s)", rc->name, strerror(retval)); rc->backoff_deadline = TIME_MAX; /* Prevent resetting backoff. */ - disconnect(rc, 0); + disconnect(rc, retval); } return retval; } @@ -368,7 +384,7 @@ run_CONNECTING(struct rconn *rc) } else if (timed_out(rc)) { VLOG_INFO("%s: connection timed out", rc->name); rc->backoff_deadline = TIME_MAX; /* Prevent resetting backoff. */ - disconnect(rc, 0); + disconnect(rc, ETIMEDOUT); } } @@ -433,7 +449,7 @@ run_IDLE(struct rconn *rc) VLOG_ERR("%s: no response to inactivity probe after %u " "seconds, disconnecting", rc->name, elapsed_in_this_state(rc)); - disconnect(rc, 0); + disconnect(rc, ETIMEDOUT); } else { do_tx_work(rc); } @@ -446,6 +462,15 @@ void rconn_run(struct rconn *rc) { int old_state; + size_t i; + + if (rc->vconn) { + vconn_run(rc->vconn); + } + for (i = 0; i < rc->n_monitors; i++) { + vconn_run(rc->monitors[i]); + } + do { old_state = rc->state; switch (rc->state) { @@ -463,7 +488,17 @@ rconn_run(struct rconn *rc) void rconn_run_wait(struct rconn *rc) { - unsigned int timeo = timeout(rc); + unsigned int timeo; + size_t i; + + if (rc->vconn) { + vconn_run_wait(rc->vconn); + } + for (i = 0; i < rc->n_monitors; i++) { + vconn_run_wait(rc->monitors[i]); + } + + timeo = timeout(rc); if (timeo != UINT_MAX) { unsigned int expires = sat_add(rc->state_entered, timeo); unsigned int remaining = sat_sub(expires, time_now()); @@ -486,7 +521,7 @@ rconn_recv(struct rconn *rc) int error = vconn_recv(rc->vconn, &buffer); if (!error) { copy_to_monitor(rc, buffer); - if (is_admitted_msg(buffer) + if (rc->probably_admitted || is_admitted_msg(buffer) || time_now() - rc->last_connected >= 30) { rc->probably_admitted = true; rc->last_admitted = time_now(); @@ -498,6 +533,7 @@ rconn_recv(struct rconn *rc) } return buffer; } else if (error != EAGAIN) { + report_error(rc, error); disconnect(rc, error); } } @@ -534,7 +570,7 @@ rconn_send(struct rconn *rc, struct ofpbuf *b, if (rconn_is_connected(rc)) { COVERAGE_INC(rconn_queued); copy_to_monitor(rc, b); - b->private = counter; + b->private_p = counter; if (counter) { rconn_packet_counter_inc(counter); } @@ -624,31 +660,38 @@ rconn_is_connected(const struct rconn *rconn) return is_connected_state(rconn->state); } -/* Returns 0 if 'rconn' is connected. Otherwise, if 'rconn' is in a "failure - * mode" (that is, it is not connected), returns the number of seconds that it - * has been in failure mode, ignoring any times that it connected but the - * controller's admission control policy caused it to be quickly - * disconnected. */ +/* Returns true if 'rconn' is connected and thought to have been accepted by + * the peer's admission-control policy. */ +bool +rconn_is_admitted(const struct rconn *rconn) +{ + return (rconn_is_connected(rconn) + && rconn->last_admitted >= rconn->last_connected); +} + +/* Returns 0 if 'rconn' is currently connected and considered to have been + * accepted by the peer's admission-control policy, otherwise the number of + * seconds since 'rconn' was last in such a state. */ int rconn_failure_duration(const struct rconn *rconn) { - return rconn_is_connected(rconn) ? 0 : time_now() - rconn->last_admitted; + return rconn_is_admitted(rconn) ? 0 : time_now() - rconn->last_admitted; } -/* Returns the IP address of the peer, or 0 if the peer is not connected over - * an IP-based protocol or if its IP address is not known. */ +/* Returns the IP address of the peer, or 0 if the peer's IP address is not + * known. */ uint32_t rconn_get_remote_ip(const struct rconn *rconn) { - return rconn->vconn ? vconn_get_remote_ip(rconn->vconn) : 0; + return rconn->remote_ip; } -/* Returns the transport port of the peer, or 0 if the peer does not - * contain a port or if the port is not known. */ +/* Returns the transport port of the peer, or 0 if the peer's port is not + * known. */ uint16_t rconn_get_remote_port(const struct rconn *rconn) { - return rconn->vconn ? vconn_get_remote_port(rconn->vconn) : 0; + return rconn->remote_port; } /* Returns the IP address used to connect to the peer, or 0 if the @@ -657,7 +700,7 @@ rconn_get_remote_port(const struct rconn *rconn) uint32_t rconn_get_local_ip(const struct rconn *rconn) { - return rconn->vconn ? vconn_get_local_ip(rconn->vconn) : 0; + return rconn->local_ip; } /* Returns the transport port used to connect to the peer, or 0 if the @@ -769,6 +812,22 @@ rconn_get_connection_seqno(const struct rconn *rc) { return rc->seqno; } + +/* Returns a value that explains why 'rc' last disconnected: + * + * - 0 means that the last disconnection was caused by a call to + * rconn_disconnect(), or that 'rc' is new and has not yet completed its + * initial connection or connection attempt. + * + * - EOF means that the connection was closed in the normal way by the peer. + * + * - A positive integer is an errno value that represents the error. + */ +int +rconn_get_last_error(const struct rconn *rc) +{ + return rc->last_error; +} struct rconn_packet_counter * rconn_packet_counter_create(void) @@ -805,6 +864,19 @@ rconn_packet_counter_dec(struct rconn_packet_counter *c) } } +/* Set the name of the remote vconn to 'name' and clear out the cached IP + * address and port information, since changing the name also likely changes + * these values. */ +static void +set_vconn_name(struct rconn *rc, const char *name) +{ + free(rc->name); + rc->name = xstrdup(name); + rc->local_ip = 0; + rc->remote_ip = 0; + rc->remote_port = 0; +} + /* Tries to send a packet from 'rc''s send buffer. Returns 0 if successful, * otherwise a positive errno value. */ static int @@ -812,10 +884,11 @@ try_send(struct rconn *rc) { int retval = 0; struct ofpbuf *next = rc->txq.head->next; - struct rconn_packet_counter *counter = rc->txq.head->private; + struct rconn_packet_counter *counter = rc->txq.head->private_p; retval = vconn_send(rc->vconn, rc->txq.head); if (retval) { if (retval != EAGAIN) { + report_error(rc, retval); disconnect(rc, retval); } return retval; @@ -829,26 +902,41 @@ try_send(struct rconn *rc) return 0; } -/* Disconnects 'rc'. 'error' is used only for logging purposes. If it is - * nonzero, then it should be EOF to indicate the connection was closed by the - * peer in a normal fashion or a positive errno value. */ +/* Reports that 'error' caused 'rc' to disconnect. 'error' may be a positive + * errno value, or it may be EOF to indicate that the connection was closed + * normally. */ +static void +report_error(struct rconn *rc, int error) +{ + if (error == EOF) { + /* If 'rc' isn't reliable, then we don't really expect this connection + * to last forever anyway (probably it's a connection that we received + * via accept()), so use DBG level to avoid cluttering the logs. */ + enum vlog_level level = rc->reliable ? VLL_INFO : VLL_DBG; + VLOG(level, "%s: connection closed by peer", rc->name); + } else { + VLOG_WARN("%s: connection dropped (%s)", rc->name, strerror(error)); + } +} + +/* Disconnects 'rc' and records 'error' as the error that caused 'rc''s last + * disconnection: + * + * - 0 means that this disconnection is due to a request by 'rc''s client, + * not due to any kind of network error. + * + * - EOF means that the connection was closed in the normal way by the peer. + * + * - A positive integer is an errno value that represents the error. + */ static void disconnect(struct rconn *rc, int error) { + rc->last_error = error; if (rc->reliable) { time_t now = time_now(); if (rc->state & (S_CONNECTING | S_ACTIVE | S_IDLE)) { - if (error > 0) { - VLOG_WARN("%s: connection dropped (%s)", - rc->name, strerror(error)); - } else if (error == EOF) { - if (rc->reliable) { - VLOG_INFO("%s: connection closed by peer", rc->name); - } - } else { - VLOG_INFO("%s: connection dropped", rc->name); - } vconn_close(rc->vconn); rc->vconn = NULL; flush_queue(rc); @@ -881,7 +969,7 @@ flush_queue(struct rconn *rc) } while (rc->txq.n > 0) { struct ofpbuf *b = queue_pop_head(&rc->txq); - struct rconn_packet_counter *counter = b->private; + struct rconn_packet_counter *counter = b->private_p; if (counter) { rconn_packet_counter_dec(counter); }