2 * Copyright (c) 2008, 2009, 2010, 2011 Nicira, Inc.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
19 #include <arpa/inet.h>
23 #include "byte-order.h"
24 #include "collectors.h"
27 #include "lib/netflow.h"
30 #include "ofproto/netflow.h"
32 #include "poll-loop.h"
33 #include "socket-util.h"
/* NOTE(review): presumably registers this file's log messages (such as the
 * VLOG_WARN_RL() call further down) under the module name "netflow" --
 * confirm against the vlog header. */
38 VLOG_DEFINE_THIS_MODULE(netflow);
41 uint8_t engine_type; /* Value of engine_type to use. */
42 uint8_t engine_id; /* Value of engine_id to use. */
43 long long int boot_time; /* Time when netflow_create() was called. */
44 struct collectors *collectors; /* NetFlow collectors. */
45 bool add_id_to_iface; /* Put the 7 least significant bits of
46 * 'engine_id' into the most significant
47 * bits of the interface fields. */
/* Written into the header's 'flow_seq' field and incremented each time
 * gen_netflow_rec() starts a new packet. */
48 uint32_t netflow_cnt; /* Flow sequence number for NetFlow. */
49 struct ofpbuf packet; /* NetFlow packet being accumulated. */
/* Kept in milliseconds: netflow_set_options() multiplies the configured value
 * by 1000, and it is added to time_msec()-based timestamps.  A value of zero
 * is special-cased by netflow_run() and netflow_wait(). */
50 long long int active_timeout; /* Timeout for flows that are still active. */
51 long long int next_timeout; /* Next scheduled active timeout. */
52 long long int reconfig_time; /* When we reconfigured the timeouts. */
/* Entries are inserted with the hash computed by netflow_flow_hash(). */
54 struct hmap flows; /* Contains 'netflow_flows'. */
58 struct hmap_node hmap_node;
60 long long int last_expired; /* Time this flow last timed out. */
61 long long int created; /* Time flow was created since time out. */
63 ofp_port_t output_iface; /* Output interface index. */
/* Only the low 8 bits are exported: gen_netflow_rec() casts this value to
 * uint8_t when filling in the record. */
64 uint16_t tcp_flags; /* Bitwise-OR of all TCP flags seen. */
/* The next seven fields are the lookup key: netflow_flow_lookup() compares
 * exactly these against the corresponding 'struct flow' members. */
66 ofp_port_t in_port; /* Input port. */
67 ovs_be32 nw_src; /* IPv4 source address. */
68 ovs_be32 nw_dst; /* IPv4 destination address. */
69 uint8_t nw_tos; /* IP ToS (including DSCP and ECN). */
70 uint8_t nw_proto; /* IP protocol. */
71 ovs_be16 tp_src; /* TCP/UDP/SCTP source port. */
72 ovs_be16 tp_dst; /* TCP/UDP/SCTP destination port. */
/* The counters below accumulate between exports; netflow_expire__() resets
 * 'packet_count' and 'byte_count' to zero after exporting them. */
74 uint64_t packet_count; /* Packets from subrules. */
75 uint64_t byte_count; /* Bytes from subrules. */
76 long long int used; /* Last-used time (0 if never used). */
/* Forward declarations of file-local helpers that are used before their
 * definitions further down. */
79 static struct netflow_flow *netflow_flow_lookup(const struct netflow *,
81 static uint32_t netflow_flow_hash(const struct flow *);
82 static void netflow_expire__(struct netflow *, struct netflow_flow *);
/* Marks in 'wc' the fields of 'flow' that NetFlow accounting depends on.
 *
 * The function first tests whether 'flow' is IPv4 (ETH_TYPE_IP).  The mask
 * updates below set every bit of nw_proto, nw_src, nw_dst, tp_src and tp_dst,
 * and OR the DSCP bits (IP_DSCP_MASK) into the nw_tos mask, leaving any other
 * nw_tos mask bits as they were. */
85 netflow_mask_wc(struct flow *flow, struct flow_wildcards *wc)
87 if (flow->dl_type != htons(ETH_TYPE_IP)) {
90 memset(&wc->masks.nw_proto, 0xff, sizeof wc->masks.nw_proto);
91 memset(&wc->masks.nw_src, 0xff, sizeof wc->masks.nw_src);
92 memset(&wc->masks.nw_dst, 0xff, sizeof wc->masks.nw_dst);
93 memset(&wc->masks.tp_src, 0xff, sizeof wc->masks.tp_src);
94 memset(&wc->masks.tp_dst, 0xff, sizeof wc->masks.tp_dst);
95 wc->masks.nw_tos |= IP_DSCP_MASK;
/* Appends one NetFlow v5 record describing 'nf_flow' to the packet being
 * accumulated in 'nf->packet', reporting 'packet_count' packets and
 * 'byte_count' bytes.  Both counts are 32-bit because they are written with
 * htonl().
 *
 * If the packet buffer is empty, a v5 header is written first.  The header's
 * record count is incremented for every record appended, and is checked
 * against the 30-record limit once the record has been filled in. */
99 gen_netflow_rec(struct netflow *nf, struct netflow_flow *nf_flow,
100 uint32_t packet_count, uint32_t byte_count)
102 struct netflow_v5_header *nf_hdr;
103 struct netflow_v5_record *nf_rec;
/* A zero-sized buffer means no packet is in progress, so start one with a
 * freshly initialized header. */
105 if (!nf->packet.size) {
108 time_wall_timespec(&now);
110 nf_hdr = ofpbuf_put_zeros(&nf->packet, sizeof *nf_hdr);
111 nf_hdr->version = htons(NETFLOW_V5_VERSION);
112 nf_hdr->count = htons(0);
/* Uptime is expressed in milliseconds since 'boot_time'. */
113 nf_hdr->sysuptime = htonl(time_msec() - nf->boot_time);
114 nf_hdr->unix_secs = htonl(now.tv_sec);
115 nf_hdr->unix_nsecs = htonl(now.tv_nsec);
/* The sequence number advances once per packet header written here. */
116 nf_hdr->flow_seq = htonl(nf->netflow_cnt++);
117 nf_hdr->engine_type = nf->engine_type;
118 nf_hdr->engine_id = nf->engine_id;
119 nf_hdr->sampling_interval = htons(0);
/* The header sits at the start of the buffer; account for the record that is
 * about to be appended. */
122 nf_hdr = nf->packet.data;
123 nf_hdr->count = htons(ntohs(nf_hdr->count) + 1);
125 nf_rec = ofpbuf_put_zeros(&nf->packet, sizeof *nf_rec);
126 nf_rec->src_addr = nf_flow->nw_src;
127 nf_rec->dst_addr = nf_flow->nw_dst;
128 nf_rec->nexthop = htonl(0);
/* With 'add_id_to_iface' set, the low 7 bits of 'engine_id' occupy the top 7
 * bits of each 16-bit interface field and the port number is truncated to the
 * remaining 9 bits (0x1ff). */
129 if (nf->add_id_to_iface) {
130 uint16_t iface = (nf->engine_id & 0x7f) << 9;
131 nf_rec->input = htons(iface | (ofp_to_u16(nf_flow->in_port) & 0x1ff));
132 nf_rec->output = htons(iface
133 | (ofp_to_u16(nf_flow->output_iface) & 0x1ff));
135 nf_rec->input = htons(ofp_to_u16(nf_flow->in_port));
136 nf_rec->output = htons(ofp_to_u16(nf_flow->output_iface));
138 nf_rec->packet_count = htonl(packet_count);
139 nf_rec->byte_count = htonl(byte_count);
/* Like the header's sysuptime, record timestamps are relative to
 * 'boot_time'. */
140 nf_rec->init_time = htonl(nf_flow->created - nf->boot_time);
141 nf_rec->used_time = htonl(MAX(nf_flow->created, nf_flow->used)
143 if (nf_flow->nw_proto == IPPROTO_ICMP) {
144 /* In NetFlow, the ICMP type and code are concatenated and
145 * placed in the 'dst_port' field. */
/* Assigning to uint8_t keeps only the low byte of each host-order value. */
146 uint8_t type = ntohs(nf_flow->tp_src);
147 uint8_t code = ntohs(nf_flow->tp_dst);
148 nf_rec->src_port = htons(0);
149 nf_rec->dst_port = htons((type << 8) | code);
151 nf_rec->src_port = nf_flow->tp_src;
152 nf_rec->dst_port = nf_flow->tp_dst;
/* The record field is 8 bits wide, so the upper bits of the accumulated
 * 16-bit TCP flags are dropped by the cast. */
154 nf_rec->tcp_flags = (uint8_t) nf_flow->tcp_flags;
155 nf_rec->ip_proto = nf_flow->nw_proto;
/* Only the DSCP bits of the ToS byte are exported. */
156 nf_rec->ip_tos = nf_flow->nw_tos & IP_DSCP_MASK;
158 /* NetFlow messages are limited to 30 records. */
159 if (ntohs(nf_hdr->count) >= 30) {
/* Folds 'stats' for 'flow', whose traffic leaves through 'output_iface', into
 * the per-flow NetFlow accounting kept in 'nf'.
 *
 * The tracking entry is looked up with netflow_flow_lookup().  A new entry is
 * allocated with xzalloc(), filled in from 'flow' and inserted into
 * 'nf->flows' (NOTE(review): presumably only when the lookup finds nothing --
 * confirm).  If the entry's recorded output interface differs from
 * 'output_iface', the statistics accumulated so far are exported through
 * netflow_expire__() and accounting restarts for the new interface. */
165 netflow_flow_update(struct netflow *nf, struct flow *flow,
166 ofp_port_t output_iface,
167 const struct dpif_flow_stats *stats)
169 struct netflow_flow *nf_flow;
172 /* NetFlow only reports on IP packets. */
173 if (flow->dl_type != htons(ETH_TYPE_IP)) {
177 nf_flow = netflow_flow_lookup(nf, flow);
179 nf_flow = xzalloc(sizeof *nf_flow);
180 nf_flow->in_port = flow->in_port.ofp_port;
181 nf_flow->nw_src = flow->nw_src;
182 nf_flow->nw_dst = flow->nw_dst;
183 nf_flow->nw_tos = flow->nw_tos;
184 nf_flow->nw_proto = flow->nw_proto;
185 nf_flow->tp_src = flow->tp_src;
186 nf_flow->tp_dst = flow->tp_dst;
187 nf_flow->created = stats->used;
188 nf_flow->output_iface = output_iface;
189 hmap_insert(&nf->flows, &nf_flow->hmap_node, netflow_flow_hash(flow));
/* A change of output interface ends the current record: export what has been
 * accumulated, then restart the creation time for the new interface. */
192 if (nf_flow->output_iface != output_iface) {
193 netflow_expire__(nf, nf_flow);
194 nf_flow->created = stats->used;
195 nf_flow->output_iface = output_iface;
/* Accumulate the new statistics on top of what is already pending export. */
198 nf_flow->packet_count += stats->n_packets;
199 nf_flow->byte_count += stats->n_bytes;
200 nf_flow->tcp_flags |= stats->tcp_flags;
/* 'used' only ever moves forward. */
202 used = MAX(nf_flow->used, stats->used);
203 if (nf_flow->used != used) {
204 nf_flow->used = used;
/* Restart the active-timeout clock when timeouts are disabled, when the flow
 * has never expired, or when the timeouts were reconfigured after the flow's
 * last expiration. */
205 if (!nf->active_timeout || !nf_flow->last_expired
206 || nf->reconfig_time > nf_flow->last_expired) {
207 /* Keep the time updated to prevent a flood of expiration in
209 nf_flow->last_expired = time_msec();
/* Exports the packet and byte counts accumulated in 'nf_flow' through
 * gen_netflow_rec() and then resets the flow's accumulated state ('created',
 * 'packet_count', 'byte_count' and 'tcp_flags') to zero.  Also advances
 * 'last_expired' by one active-timeout interval. */
215 netflow_expire__(struct netflow *nf, struct netflow_flow *nf_flow)
217 uint64_t pkts, bytes;
219 pkts = nf_flow->packet_count;
220 bytes = nf_flow->byte_count;
/* Move the flow's active-timeout reference point forward by one interval. */
222 nf_flow->last_expired += nf->active_timeout;
/* Byte totals above 175 * 2**32 are treated as bogus and only logged; smaller
 * totals are split into records that each fit 32-bit counters.
 *
 * NOTE(review): 'n_recs' below evaluates to 0 when 'bytes' is 0, which would
 * make the divisions that follow divide by zero -- confirm that flows with
 * zero counts are filtered out before this point. */
228 if ((bytes >> 32) <= 175) {
229 /* NetFlow v5 records are limited to 32-bit counters. If we've wrapped
230 * a counter, send as multiple records so we don't lose track of any
231 * traffic. We try to evenly distribute the packet and byte counters,
232 * so that the bytes-per-packet lengths don't look wonky across the
235 int n_recs = (bytes + UINT32_MAX - 1) / UINT32_MAX;
236 uint32_t pkt_count = pkts / n_recs;
237 uint32_t byte_count = bytes / n_recs;
239 gen_netflow_rec(nf, nf_flow, pkt_count, byte_count);
245 /* In 600 seconds, a 10GbE link can theoretically transmit 75 * 10**10
246 * == 175 * 2**32 bytes. The byte counter is bigger than that, so it's
247 * probably a bug--for example, the netdev code uses UINT64_MAX to
248 * report "unknown value", and perhaps that has leaked through to here.
250 * We wouldn't want to hit the loop above in this case, because it
251 * would try to send up to UINT32_MAX netflow records, which would take
254 static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 1);
256 VLOG_WARN_RL(&rl, "impossible byte counter %"PRIu64, bytes);
259 /* Update flow tracking data. */
260 nf_flow->created = 0;
261 nf_flow->packet_count = 0;
262 nf_flow->byte_count = 0;
263 nf_flow->tcp_flags = 0;
/* Looks up the NetFlow tracking entry for 'flow' in 'nf' and exports its
 * accumulated statistics through netflow_expire__(). */
267 netflow_expire(struct netflow *nf, struct flow *flow)
269 struct netflow_flow *nf_flow = netflow_flow_lookup(nf, flow);
272 netflow_expire__(nf, nf_flow);
/* Removes the NetFlow tracking entry for 'flow' from 'nf->flows'.
 *
 * The entry's packet and byte counters are asserted to be zero, so any
 * accumulated statistics must already have been exported (netflow_expire__()
 * zeroes both counters) before this is called. */
277 netflow_flow_clear(struct netflow *nf, struct flow *flow)
279 struct netflow_flow *nf_flow = netflow_flow_lookup(nf, flow);
282 ovs_assert(!nf_flow->packet_count);
283 ovs_assert(!nf_flow->byte_count);
284 hmap_remove(&nf->flows, &nf_flow->hmap_node);
289 /* Returns true if it's time to send out a round of NetFlow active timeouts,
290 * false otherwise. */
292 netflow_run(struct netflow *nf)
294 long long int now = time_msec();
295 struct netflow_flow *nf_flow, *next;
/* Hand any accumulated packet to the collectors first. */
297 if (nf->packet.size) {
298 collectors_send(nf->collectors, nf->packet.data, nf->packet.size);
/* Active-timeout processing applies only when a timeout is configured and the
 * scheduled time has been reached. */
302 if (!nf->active_timeout || now < nf->next_timeout) {
/* Schedule the next scan 1000 ms from now. */
306 nf->next_timeout = now + 1000;
/* The _SAFE iterator is used because entries may be removed during the
 * walk. */
308 HMAP_FOR_EACH_SAFE (nf_flow, next, hmap_node, &nf->flows) {
309 if (now > nf_flow->last_expired + nf->active_timeout) {
/* Sample idleness before expiring: netflow_expire__() advances
 * 'last_expired', which would change the result of this comparison. */
310 bool idle = nf_flow->used < nf_flow->last_expired;
311 netflow_expire__(nf, nf_flow);
314 /* If the netflow_flow hasn't been used in a while, it's
315 * possible the upper layer lost track of it. */
316 hmap_remove(&nf->flows, &nf_flow->hmap_node);
/* Registers the wake-up conditions for 'nf' with the poll loop: a timer at
 * 'next_timeout' when an active timeout is configured, and an immediate
 * wake-up when a packet is waiting in 'nf->packet'. */
324 netflow_wait(struct netflow *nf)
326 if (nf->active_timeout) {
327 poll_timer_wait_until(nf->next_timeout);
329 if (nf->packet.size) {
330 poll_immediate_wake();
/* Applies 'nf_options' to 'nf': copies the engine type, engine id and
 * 'add_id_to_iface' setting, replaces the collector set, and updates the
 * active timeout.
 *
 * A negative 'nf_options->active_timeout' selects NF_ACTIVE_TIMEOUT_DEFAULT.
 * The chosen value is multiplied by 1000 before being stored, so
 * 'nf->active_timeout' is in milliseconds. */
335 netflow_set_options(struct netflow *nf,
336 const struct netflow_options *nf_options)
339 long long int old_timeout;
341 nf->engine_type = nf_options->engine_type;
342 nf->engine_id = nf_options->engine_id;
343 nf->add_id_to_iface = nf_options->add_id_to_iface;
/* The previous collector set is destroyed before the new one is created.
 * NOTE(review): the result of collectors_create() is not used on this line --
 * confirm whether it can fail and whether that should be reported. */
345 collectors_destroy(nf->collectors);
346 collectors_create(&nf_options->collectors, 0, &nf->collectors);
348 old_timeout = nf->active_timeout;
349 if (nf_options->active_timeout >= 0) {
350 nf->active_timeout = nf_options->active_timeout;
352 nf->active_timeout = NF_ACTIVE_TIMEOUT_DEFAULT;
354 nf->active_timeout *= 1000;
/* Both values are in milliseconds here.  On a change, record when it happened
 * and make the next active-timeout scan due immediately. */
355 if (old_timeout != nf->active_timeout) {
356 nf->reconfig_time = time_msec();
357 nf->next_timeout = time_msec();
/* Allocate the NetFlow state.  NOTE(review): xzalloc() presumably returns
 * zeroed memory, in which case the NULL/false assignments below only restate
 * the defaults explicitly -- confirm. */
366 struct netflow *nf = xzalloc(sizeof *nf);
/* 'boot_time' is the reference point for the uptime and record timestamps
 * computed in gen_netflow_rec(). */
369 nf->boot_time = time_msec();
370 nf->collectors = NULL;
371 nf->add_id_to_iface = false;
373 hmap_init(&nf->flows);
/* NOTE(review): 1500 is presumably the initial buffer size in bytes --
 * confirm against ofpbuf_init(). */
374 ofpbuf_init(&nf->packet, 1500);
/* Tears down 'nf': releases the accumulated packet buffer with
 * ofpbuf_uninit() and destroys the collector set. */
379 netflow_destroy(struct netflow *nf)
382 ofpbuf_uninit(&nf->packet);
383 collectors_destroy(nf->collectors);
/* Searches for the NetFlow tracking entry that corresponds to 'flow'.
 *
 * Candidates are taken from the bucket selected by netflow_flow_hash(flow).
 * A candidate matches when its in_port, nw_src, nw_dst, nw_tos, nw_proto,
 * tp_src and tp_dst all equal the corresponding fields of 'flow'. */
390 static struct netflow_flow *
391 netflow_flow_lookup(const struct netflow *nf, const struct flow *flow)
393 struct netflow_flow *nf_flow;
395 HMAP_FOR_EACH_WITH_HASH (nf_flow, hmap_node, netflow_flow_hash(flow),
397 if (flow->in_port.ofp_port == nf_flow->in_port
398 && flow->nw_src == nf_flow->nw_src
399 && flow->nw_dst == nf_flow->nw_dst
400 && flow->nw_tos == nf_flow->nw_tos
401 && flow->nw_proto == nf_flow->nw_proto
402 && flow->tp_src == nf_flow->tp_src
403 && flow->tp_dst == nf_flow->tp_dst) {
/* Computes the hash used to place and find 'flow' in the NetFlow flow table.
 *
 * The seven fields mixed in are the same ones netflow_flow_lookup() compares:
 * in_port, nw_src, nw_dst, nw_tos, nw_proto, tp_src and tp_dst.  Addresses
 * and ports are converted to host byte order before hashing. */
412 netflow_flow_hash(const struct flow *flow)
416 hash = mhash_add(hash, (OVS_FORCE uint32_t) flow->in_port.ofp_port);
417 hash = mhash_add(hash, ntohl(flow->nw_src));
418 hash = mhash_add(hash, ntohl(flow->nw_dst));
419 hash = mhash_add(hash, flow->nw_tos);
420 hash = mhash_add(hash, flow->nw_proto);
421 hash = mhash_add(hash, ntohs(flow->tp_src));
422 hash = mhash_add(hash, ntohs(flow->tp_dst));
/* NOTE(review): 28 is presumably the number of bytes hashed (seven 32-bit
 * words) -- confirm against mhash_finish(). */
424 return mhash_finish(hash, 28);