X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=vswitchd%2Fovs-brcompatd.c;h=b5037056e41ac28cc452b1ff27c8e763fb937f8e;hb=939ff2674caa93d15b607bc514932533490ff2a0;hp=b7627e01ef1f59f5982c765b22ab67d5fe6a8423;hpb=9852694f9e9ac12868463094b894a1da61535a7f;p=sliver-openvswitch.git diff --git a/vswitchd/ovs-brcompatd.c b/vswitchd/ovs-brcompatd.c index b7627e01e..b5037056e 100644 --- a/vswitchd/ovs-brcompatd.c +++ b/vswitchd/ovs-brcompatd.c @@ -1,4 +1,4 @@ -/* Copyright (c) 2008, 2009 Nicira Networks +/* Copyright (c) 2008, 2009, 2010 Nicira Networks * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -39,7 +39,7 @@ #include "dirs.h" #include "dynamic-string.h" #include "fatal-signal.h" -#include "fault.h" +#include "json.h" #include "leak-checker.h" #include "netdev.h" #include "netlink.h" @@ -75,10 +75,6 @@ static void usage(void) NO_RETURN; static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(5, 60); -/* Maximum number of milliseconds to wait for the config file to be - * unlocked. If set to zero, no waiting will occur. */ -static int lock_timeout = 500; - /* Maximum number of milliseconds to wait before pruning port entries that * no longer exist. If set to zero, ports are never pruned. */ static int prune_timeout = 5000; @@ -376,12 +372,97 @@ ovs_insert_bridge(const struct ovsrec_open_vswitch *ovs, free(bridges); } +static struct json * +where_uuid_equals(const struct uuid *uuid) +{ + return + json_array_create_1( + json_array_create_3( + json_string_create("_uuid"), + json_string_create("=="), + json_array_create_2( + json_string_create("uuid"), + json_string_create_nocopy( + xasprintf(UUID_FMT, UUID_ARGS(uuid)))))); +} + +/* Commits 'txn'. If 'wait_for_reload' is true, also waits for Open vSwitch to + reload the configuration before returning. + + Returns EAGAIN if the caller should try the operation again, 0 on success, + otherwise a positive errno value. */ +static int +commit_txn(struct ovsdb_idl_txn *txn, bool wait_for_reload) +{ + struct ovsdb_idl *idl = ovsdb_idl_txn_get_idl (txn); + enum ovsdb_idl_txn_status status; + int64_t next_cfg = 0; + + if (wait_for_reload) { + const struct ovsrec_open_vswitch *ovs = ovsrec_open_vswitch_first(idl); + struct json *where = where_uuid_equals(&ovs->header_.uuid); + ovsdb_idl_txn_increment(txn, "Open_vSwitch", "next_cfg", where); + json_destroy(where); + } + status = ovsdb_idl_txn_commit_block(txn); + if (wait_for_reload && status == TXN_SUCCESS) { + next_cfg = ovsdb_idl_txn_get_increment_new_value(txn); + } + ovsdb_idl_txn_destroy(txn); + + switch (status) { + case TXN_INCOMPLETE: + NOT_REACHED(); + + case TXN_ABORTED: + VLOG_ERR_RL(&rl, "OVSDB transaction unexpectedly aborted"); + return ECONNABORTED; + + case TXN_UNCHANGED: + return 0; + + case TXN_SUCCESS: + if (wait_for_reload) { + for (;;) { + /* We can't use 'ovs' any longer because ovsdb_idl_run() can + * destroy it. */ + const struct ovsrec_open_vswitch *ovs2; + + ovsdb_idl_run(idl); + OVSREC_OPEN_VSWITCH_FOR_EACH (ovs2, idl) { + if (ovs2->cur_cfg >= next_cfg) { + goto done; + } + } + ovsdb_idl_wait(idl); + poll_block(); + } + done: ; + } + return 0; + + case TXN_TRY_AGAIN: + VLOG_ERR_RL(&rl, "OVSDB transaction needs retry"); + return EAGAIN; + + case TXN_ERROR: + VLOG_ERR_RL(&rl, "OVSDB transaction failed: %s", + ovsdb_idl_txn_get_error(txn)); + return EBUSY; + + default: + NOT_REACHED(); + } +} + static int -add_bridge(const struct ovsrec_open_vswitch *ovs, const char *br_name) +add_bridge(struct ovsdb_idl *idl, const struct ovsrec_open_vswitch *ovs, + const char *br_name) { struct ovsrec_bridge *br; struct ovsrec_port *port; struct ovsrec_interface *iface; + struct ovsdb_idl_txn *txn; if (find_bridge(ovs, br_name)) { VLOG_WARN("addbr %s: bridge %s exists", br_name, br_name); @@ -408,6 +489,10 @@ add_bridge(const struct ovsrec_open_vswitch *ovs, const char *br_name) return EEXIST; } + txn = ovsdb_idl_txn_create(idl); + + ovsdb_idl_txn_add_comment(txn, "ovs-brcompatd: addbr %s", br_name); + iface = ovsrec_interface_insert(txn_from_openvswitch(ovs)); ovsrec_interface_set_name(iface, br_name); @@ -421,9 +506,7 @@ add_bridge(const struct ovsrec_open_vswitch *ovs, const char *br_name) ovs_insert_bridge(ovs, br); - VLOG_INFO("addbr %s: success", br_name); - - return 0; + return commit_txn(txn, true); } static void @@ -452,46 +535,107 @@ add_port(const struct ovsrec_open_vswitch *ovs, free(ports); } +/* Deletes 'port' from 'br'. + * + * After calling this function, 'port' must not be referenced again. */ static void -del_port(const struct ovsrec_bridge *br, const char *port_name) +del_port(const struct ovsrec_bridge *br, const struct ovsrec_port *port) { - size_t i, j; - struct ovsrec_port *port_rec = NULL; + struct ovsrec_port **ports; + size_t i, n; + + /* Remove 'port' from the bridge's list of ports. */ + ports = xmalloc(sizeof *br->ports * br->n_ports); + for (i = n = 0; i < br->n_ports; i++) { + if (br->ports[i] != port) { + ports[n++] = br->ports[i]; + } + } + ovsrec_bridge_set_ports(br, ports, n); + free(ports); + + /* Delete all of the port's interfaces. */ + for (i = 0; i < port->n_interfaces; i++) { + ovsrec_interface_delete(port->interfaces[i]); + } + + /* Delete the port itself. */ + ovsrec_port_delete(port); +} + +/* Delete 'iface' from 'port' (which must be within 'br'). If 'iface' was + * 'port''s only interface, delete 'port' from 'br' also. + * + * After calling this function, 'iface' must not be referenced again. */ +static void +del_interface(const struct ovsrec_bridge *br, + const struct ovsrec_port *port, + const struct ovsrec_interface *iface) +{ + if (port->n_interfaces == 1) { + del_port(br, port); + } else { + struct ovsrec_interface **ifaces; + size_t i, n; + + ifaces = xmalloc(sizeof *port->interfaces * port->n_interfaces); + for (i = n = 0; i < port->n_interfaces; i++) { + if (port->interfaces[i] != iface) { + ifaces[n++] = port->interfaces[i]; + } + } + ovsrec_port_set_interfaces(port, ifaces, n); + free(ifaces); + ovsrec_interface_delete(iface); + } +} + +/* Find and return a port within 'br' named 'port_name'. */ +static const struct ovsrec_port * +find_port(const struct ovsrec_bridge *br, const char *port_name) +{ + size_t i; for (i = 0; i < br->n_ports; i++) { struct ovsrec_port *port = br->ports[i]; if (!strcmp(port_name, port->name)) { - port_rec = port; - } - for (j = 0; j < port->n_interfaces; j++) { - struct ovsrec_interface *iface = port->interfaces[j]; - if (!strcmp(port_name, iface->name)) { - ovsrec_interface_delete(iface); - } + return port; } } + return NULL; +} + +/* Find and return an interface within 'br' named 'iface_name'. */ +static const struct ovsrec_interface * +find_interface(const struct ovsrec_bridge *br, const char *iface_name, + struct ovsrec_port **portp) +{ + size_t i; - /* xxx Probably can move this into the "for" loop. */ - if (port_rec) { - struct ovsrec_port **ports; - size_t n; + for (i = 0; i < br->n_ports; i++) { + struct ovsrec_port *port = br->ports[i]; + size_t j; - ports = xmalloc(sizeof *br->ports * br->n_ports); - for (i = n = 0; i < br->n_ports; i++) { - if (br->ports[i] != port_rec) { - ports[n++] = br->ports[i]; + for (j = 0; j < port->n_interfaces; j++) { + struct ovsrec_interface *iface = port->interfaces[j]; + if (!strcmp(iface->name, iface_name)) { + *portp = port; + return iface; } } - ovsrec_bridge_set_ports(br, ports, n); - free(ports); } + + *portp = NULL; + return NULL; } -static int -del_bridge(const struct ovsrec_open_vswitch *ovs, const char *br_name) +static int +del_bridge(struct ovsdb_idl *idl, + const struct ovsrec_open_vswitch *ovs, const char *br_name) { struct ovsrec_bridge *br = find_bridge(ovs, br_name); struct ovsrec_bridge **bridges; + struct ovsdb_idl_txn *txn; size_t i, n; if (!br) { @@ -499,10 +643,29 @@ del_bridge(const struct ovsrec_open_vswitch *ovs, const char *br_name) return ENXIO; } - del_port(br, br_name); + txn = ovsdb_idl_txn_create(idl); - ovsrec_bridge_delete(br); + ovsdb_idl_txn_add_comment(txn, "ovs-brcompatd: delbr %s", br_name); + + /* Delete everything that the bridge points to, then delete the bridge + * itself. */ + while (br->n_ports > 0) { + del_port(br, br->ports[0]); + } + for (i = 0; i < br->n_mirrors; i++) { + ovsrec_mirror_delete(br->mirrors[i]); + } + if (br->netflow) { + ovsrec_netflow_delete(br->netflow); + } + if (br->sflow) { + ovsrec_sflow_delete(br->sflow); + } + if (br->controller) { + ovsrec_controller_delete(br->controller); + } + /* Remove 'br' from the vswitch's list of bridges. */ bridges = xmalloc(sizeof *ovs->bridges * ovs->n_bridges); for (i = n = 0; i < ovs->n_bridges; i++) { if (ovs->bridges[i] != br) { @@ -512,9 +675,10 @@ del_bridge(const struct ovsrec_open_vswitch *ovs, const char *br_name) ovsrec_open_vswitch_set_bridges(ovs, bridges, n); free(bridges); - VLOG_INFO("delbr %s: success", br_name); + /* Delete the bridge itself. */ + ovsrec_bridge_delete(br); - return 0; + return commit_txn(txn, true); } static int @@ -589,7 +753,8 @@ send_simple_reply(uint32_t seq, int error) } static int -handle_bridge_cmd(const struct ovsrec_open_vswitch *ovs, +handle_bridge_cmd(struct ovsdb_idl *idl, + const struct ovsrec_open_vswitch *ovs, struct ofpbuf *buffer, bool add) { const char *br_name; @@ -598,7 +763,14 @@ handle_bridge_cmd(const struct ovsrec_open_vswitch *ovs, error = parse_command(buffer, &seq, &br_name, NULL, NULL, NULL); if (!error) { - error = add ? add_bridge(ovs, br_name) : del_bridge(ovs, br_name); + int retval; + + do { + retval = (add ? add_bridge : del_bridge)(idl, ovs, br_name); + VLOG_INFO_RL(&rl, "%sbr %s: %s", + add ? "add" : "del", br_name, strerror(retval)); + } while (retval == EAGAIN); + send_simple_reply(seq, error); } return error; @@ -610,7 +782,8 @@ static const struct nl_policy brc_port_policy[] = { }; static int -handle_port_cmd(const struct ovsrec_open_vswitch *ovs, +handle_port_cmd(struct ovsdb_idl *idl, + const struct ovsrec_open_vswitch *ovs, struct ofpbuf *buffer, bool add) { const char *cmd_name = add ? "add-if" : "del-if"; @@ -631,12 +804,27 @@ handle_port_cmd(const struct ovsrec_open_vswitch *ovs, cmd_name, br_name, port_name, port_name); error = EINVAL; } else { - if (add) { - add_port(ovs, br, port_name); - } else { - del_port(br, port_name); - } - VLOG_INFO("%s %s %s: success", cmd_name, br_name, port_name); + do { + struct ovsdb_idl_txn *txn = ovsdb_idl_txn_create(idl); + + if (add) { + ovsdb_idl_txn_add_comment(txn, "ovs-brcompatd: add-if %s", + port_name); + add_port(ovs, br, port_name); + } else { + const struct ovsrec_port *port = find_port(br, port_name); + if (port) { + ovsdb_idl_txn_add_comment(txn, + "ovs-brcompatd: del-if %s", + port_name); + del_port(br, port); + } + } + + error = commit_txn(txn, true); + VLOG_INFO_RL(&rl, "%s %s %s: %s", + cmd_name, br_name, port_name, strerror(error)); + } while (error == EAGAIN); } send_simple_reply(seq, error); } @@ -760,8 +948,8 @@ handle_fdb_query_cmd(const struct ovsrec_open_vswitch *ovs, struct mac *mac = &local_macs[n_local_macs]; struct netdev *netdev; - error = netdev_open(iface_name, NETDEV_ETH_TYPE_NONE, &netdev); - if (netdev) { + error = netdev_open_default(iface_name, &netdev); + if (!error) { if (!netdev_get_etheraddr(netdev, mac->addr)) { n_local_macs++; } @@ -949,12 +1137,12 @@ handle_get_ports_cmd(const struct ovsrec_open_vswitch *ovs, } static void -brc_recv_update(const struct ovsrec_open_vswitch *ovs) +brc_recv_update(struct ovsdb_idl *idl) { int retval; struct ofpbuf *buffer; struct genlmsghdr *genlmsghdr; - + const struct ovsrec_open_vswitch *ovs; buffer = NULL; do { @@ -983,21 +1171,31 @@ brc_recv_update(const struct ovsrec_open_vswitch *ovs) goto error; } + /* Get the Open vSwitch configuration. Just drop the request on the floor + * if a valid configuration doesn't exist. (We could check this earlier, + * but we want to drain pending Netlink messages even when there is no Open + * vSwitch configuration.) */ + ovs = ovsrec_open_vswitch_first(idl); + if (!ovs) { + VLOG_WARN_RL(&rl, "could not find valid configuration to update"); + goto error; + } + switch (genlmsghdr->cmd) { case BRC_GENL_C_DP_ADD: - handle_bridge_cmd(ovs, buffer, true); + handle_bridge_cmd(idl, ovs, buffer, true); break; case BRC_GENL_C_DP_DEL: - handle_bridge_cmd(ovs, buffer, false); + handle_bridge_cmd(idl, ovs, buffer, false); break; case BRC_GENL_C_PORT_ADD: - handle_port_cmd(ovs, buffer, true); + handle_port_cmd(idl, ovs, buffer, true); break; case BRC_GENL_C_PORT_DEL: - handle_port_cmd(ovs, buffer, false); + handle_port_cmd(idl, ovs, buffer, false); break; case BRC_GENL_C_FDB_QUERY: @@ -1014,7 +1212,7 @@ brc_recv_update(const struct ovsrec_open_vswitch *ovs) default: VLOG_WARN_RL(&rl, "received unknown brc netlink command: %d\n", - genlmsghdr->cmd); + genlmsghdr->cmd); break; } @@ -1023,10 +1221,10 @@ error: return; } -#if 0 /* Check for interface configuration changes announced through RTNL. */ static void -rtnl_recv_update(void) +rtnl_recv_update(struct ovsdb_idl *idl, + const struct ovsrec_open_vswitch *ovs) { struct ofpbuf *buf; @@ -1068,27 +1266,35 @@ rtnl_recv_update(void) return; } - if (cfg_lock(NULL, lock_timeout)) { - /* Couldn't lock config file. */ - /* xxx this should try again and print error msg. */ - ofpbuf_delete(buf); - return; - } - if (!netdev_exists(port_name)) { /* Network device is really gone. */ - struct svec ports; + struct ovsdb_idl_txn *txn; + const struct ovsrec_interface *iface; + struct ovsrec_port *port; + struct ovsrec_bridge *br; VLOG_INFO("network device %s destroyed, " "removing from bridge %s", port_name, br_name); - svec_init(&ports); - cfg_get_all_keys(&ports, "bridge.%s.port", br_name); - svec_sort(&ports); - if (svec_contains(&ports, port_name)) { - del_port(br_name, port_name); + br = find_bridge(ovs, br_name); + if (!br) { + VLOG_WARN("no bridge named %s from which to remove %s", + br_name, port_name); + ofpbuf_delete(buf); + return; + } + + txn = ovsdb_idl_txn_create(idl); + + iface = find_interface(br, port_name, &port); + if (iface) { + del_interface(br, port, iface); + ovsdb_idl_txn_add_comment(txn, + "ovs-brcompatd: destroy port %s", + port_name); } - svec_destroy(&ports); + + commit_txn(txn, false); } else { /* A network device by that name exists even though the kernel * told us it had disappeared. Probably, what happened was @@ -1135,12 +1341,10 @@ rtnl_recv_update(void) "a device by that name exists (XS Tools 5.0.0?)", port_name); } - cfg_unlock(); } ofpbuf_delete(buf); } } -#endif int main(int argc, char *argv[]) @@ -1148,11 +1352,10 @@ main(int argc, char *argv[]) struct unixctl_server *unixctl; const char *remote; struct ovsdb_idl *idl; - unsigned int idl_seqno; int retval; + proctitle_init(argc, argv); set_program_name(argv[0]); - register_fault_handlers(); time_init(); vlog_init(); vlog_set_levels(VLM_ANY_MODULE, VLF_CONSOLE, VLL_WARN); @@ -1161,13 +1364,14 @@ main(int argc, char *argv[]) remote = parse_options(argc, argv); signal(SIGPIPE, SIG_IGN); process_init(); + ovsrec_init(); die_if_already_running(); - daemonize(); + daemonize_start(); retval = unixctl_server_create(NULL, &unixctl); if (retval) { - ovs_fatal(retval, "could not listen for vlog connections"); + exit(EXIT_FAILURE); } if (brc_open(&brc_sock)) { @@ -1181,45 +1385,29 @@ main(int argc, char *argv[]) } } + daemonize_complete(); + idl = ovsdb_idl_create(remote, &ovsrec_idl_class); - idl_seqno = ovsdb_idl_get_seqno(idl); for (;;) { const struct ovsrec_open_vswitch *ovs; - struct ovsdb_idl_txn *txn; - int status; - unsigned int new_idl_seqno; ovsdb_idl_run(idl); - /* xxx Complete hack to get around bad ovs! */ - new_idl_seqno = ovsdb_idl_get_seqno(idl); - if (new_idl_seqno == idl_seqno) { - ovsdb_idl_wait(idl); - poll_block(); - printf("xxx trying again...\n"); - idl_seqno = new_idl_seqno; - continue; - } + unixctl_server_run(unixctl); + brc_recv_update(idl); ovs = ovsrec_open_vswitch_first(idl); - if (!ovs) { - /* XXX it would be more user-friendly to create a record ourselves - * (while verifying that the table is empty before doing so). */ - ovs_fatal(0, "%s: database does not contain any Open vSwitch " - "configuration", remote); + if (!ovs && ovsdb_idl_has_ever_connected(idl)) { + static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 1); + VLOG_WARN_RL(&rl, "%s: database does not contain any Open vSwitch " + "configuration", remote); } - - txn = ovsdb_idl_txn_create(idl); - - unixctl_server_run(unixctl); - brc_recv_update(ovs); netdev_run(); -#if 0 /* If 'prune_timeout' is non-zero, we actively prune from the - * config file any 'bridge..port' entries that are no - * longer valid. We use two methods: + * configuration of port entries that are no longer valid. We + * use two methods: * * 1) The kernel explicitly notifies us of removed ports * through the RTNL messages. @@ -1227,46 +1415,16 @@ main(int argc, char *argv[]) * 2) We periodically check all ports associated with bridges * to see if they no longer exist. */ - if (prune_timeout) { - rtnl_recv_update(); + if (ovs && prune_timeout) { + rtnl_recv_update(idl, ovs); +#if 0 prune_ports(); +#endif nl_sock_wait(rtnl_sock, POLLIN); poll_timer_wait(prune_timeout); } -#endif - - while ((status = ovsdb_idl_txn_commit(txn)) == TXN_INCOMPLETE) { - ovsdb_idl_run(idl); - ovsdb_idl_wait(idl); - ovsdb_idl_txn_wait(txn); - poll_block(); - } - ovsdb_idl_txn_destroy(txn); - - switch (status) { - case TXN_INCOMPLETE: - NOT_REACHED(); - - case TXN_ABORTED: - /* Should not happen--we never call ovsdb_idl_txn_abort(). */ - ovs_fatal(0, "transaction aborted"); - - case TXN_SUCCESS: - break; - - case TXN_TRY_AGAIN: - /* xxx Handle this better! */ - printf("xxx We need to try again!\n"); - break; - case TXN_ERROR: - /* xxx Is this what we want to do? */ - ovs_fatal(0, "transaction error"); - - default: - NOT_REACHED(); - } nl_sock_wait(brc_sock, POLLIN); ovsdb_idl_wait(idl); @@ -1305,7 +1463,6 @@ static const char * parse_options(int argc, char *argv[]) { enum { - OPT_LOCK_TIMEOUT = UCHAR_MAX + 1, OPT_PRUNE_TIMEOUT, OPT_APPCTL_COMMAND, VLOG_OPTION_ENUMS, @@ -1314,7 +1471,6 @@ parse_options(int argc, char *argv[]) static struct option long_options[] = { {"help", no_argument, 0, 'h'}, {"version", no_argument, 0, 'V'}, - {"lock-timeout", required_argument, 0, OPT_LOCK_TIMEOUT}, {"prune-timeout", required_argument, 0, OPT_PRUNE_TIMEOUT}, {"appctl-command", required_argument, 0, OPT_APPCTL_COMMAND}, DAEMON_LONG_OPTIONS, @@ -1342,10 +1498,6 @@ parse_options(int argc, char *argv[]) OVS_PRINT_VERSION(0, 0); exit(EXIT_SUCCESS); - case OPT_LOCK_TIMEOUT: - lock_timeout = atoi(optarg); - break; - case OPT_PRUNE_TIMEOUT: prune_timeout = atoi(optarg) * 1000; break; @@ -1390,7 +1542,6 @@ usage(void) printf("\nConfiguration options:\n" " --appctl-command=COMMAND shell command to run ovs-appctl\n" " --prune-timeout=SECS wait at most SECS before pruning ports\n" - " --lock-timeout=MSECS wait at most MSECS for CONFIG to unlock\n" ); daemon_usage(); vlog_usage();