X-Git-Url: http://git.cascardo.eti.br/?a=blobdiff_plain;f=ofproto%2Fnetflow.c;h=f1b6fbe2d1a2c4e3d2a186e228deff153aa6136b;hb=994fcc5a15d32b16e249eaa97c7948a75ba370bd;hp=2e32f219cb5c10848dba79b9333e656381a562b3;hpb=4e022ec09e14ac89add74c1b4b8e3ff3873edbf0;p=cascardo%2Fovs.git diff --git a/ofproto/netflow.c b/ofproto/netflow.c index 2e32f219c..f1b6fbe2d 100644 --- a/ofproto/netflow.c +++ b/ofproto/netflow.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2008, 2009, 2010, 2011 Nicira, Inc. + * Copyright (c) 2008, 2009, 2010, 2011, 2013, 2014, 2015 Nicira, Inc. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -22,6 +22,7 @@ #include #include "byte-order.h" #include "collectors.h" +#include "dpif.h" #include "flow.h" #include "lib/netflow.h" #include "ofpbuf.h" @@ -32,7 +33,7 @@ #include "socket-util.h" #include "timeval.h" #include "util.h" -#include "vlog.h" +#include "openvswitch/vlog.h" VLOG_DEFINE_THIS_MODULE(netflow); @@ -49,24 +50,62 @@ struct netflow { long long int active_timeout; /* Timeout for flows that are still active. */ long long int next_timeout; /* Next scheduled active timeout. */ long long int reconfig_time; /* When we reconfigured the timeouts. */ + + struct hmap flows; /* Contains 'netflow_flows'. */ + + struct ovs_refcount ref_cnt; +}; + +struct netflow_flow { + struct hmap_node hmap_node; + + long long int last_expired; /* Time this flow last timed out. */ + long long int created; /* Time flow was created since time out. */ + + ofp_port_t output_iface; /* Output interface index. */ + uint16_t tcp_flags; /* Bitwise-OR of all TCP flags seen. */ + + ofp_port_t in_port; /* Input port. */ + ovs_be32 nw_src; /* IPv4 source address. */ + ovs_be32 nw_dst; /* IPv4 destination address. */ + uint8_t nw_tos; /* IP ToS (including DSCP and ECN). */ + uint8_t nw_proto; /* IP protocol. */ + ovs_be16 tp_src; /* TCP/UDP/SCTP source port. */ + ovs_be16 tp_dst; /* TCP/UDP/SCTP destination port. */ + + uint64_t packet_count; /* Packets from subrules. */ + uint64_t byte_count; /* Bytes from subrules. */ + long long int used; /* Last-used time (0 if never used). */ }; +static struct ovs_mutex mutex = OVS_MUTEX_INITIALIZER; +static atomic_count netflow_count = ATOMIC_COUNT_INIT(0); + +static struct netflow_flow *netflow_flow_lookup(const struct netflow *, + const struct flow *) + OVS_REQUIRES(mutex); +static uint32_t netflow_flow_hash(const struct flow *); +static void netflow_expire__(struct netflow *, struct netflow_flow *) + OVS_REQUIRES(mutex); +static void netflow_run__(struct netflow *) OVS_REQUIRES(mutex); + void -netflow_mask_wc(struct flow_wildcards *wc) +netflow_mask_wc(const struct flow *flow, struct flow_wildcards *wc) { - memset(&wc->masks.dl_type, 0xff, sizeof wc->masks.dl_type); + if (flow->dl_type != htons(ETH_TYPE_IP)) { + return; + } memset(&wc->masks.nw_proto, 0xff, sizeof wc->masks.nw_proto); memset(&wc->masks.nw_src, 0xff, sizeof wc->masks.nw_src); memset(&wc->masks.nw_dst, 0xff, sizeof wc->masks.nw_dst); - memset(&wc->masks.tp_src, 0xff, sizeof wc->masks.tp_src); - memset(&wc->masks.tp_dst, 0xff, sizeof wc->masks.tp_dst); + flow_unwildcard_tp_ports(flow, wc); wc->masks.nw_tos |= IP_DSCP_MASK; } static void gen_netflow_rec(struct netflow *nf, struct netflow_flow *nf_flow, - struct ofexpired *expired, uint32_t packet_count, uint32_t byte_count) + OVS_REQUIRES(mutex) { struct netflow_v5_header *nf_hdr; struct netflow_v5_record *nf_rec; @@ -82,7 +121,6 @@ gen_netflow_rec(struct netflow *nf, struct netflow_flow *nf_flow, nf_hdr->sysuptime = htonl(time_msec() - nf->boot_time); nf_hdr->unix_secs = htonl(now.tv_sec); nf_hdr->unix_nsecs = htonl(now.tv_nsec); - nf_hdr->flow_seq = htonl(nf->netflow_cnt++); nf_hdr->engine_type = nf->engine_type; nf_hdr->engine_id = nf->engine_id; nf_hdr->sampling_interval = htons(0); @@ -90,77 +128,131 @@ gen_netflow_rec(struct netflow *nf, struct netflow_flow *nf_flow, nf_hdr = nf->packet.data; nf_hdr->count = htons(ntohs(nf_hdr->count) + 1); + nf_hdr->flow_seq = htonl(nf->netflow_cnt++); nf_rec = ofpbuf_put_zeros(&nf->packet, sizeof *nf_rec); - nf_rec->src_addr = expired->flow.nw_src; - nf_rec->dst_addr = expired->flow.nw_dst; + nf_rec->src_addr = nf_flow->nw_src; + nf_rec->dst_addr = nf_flow->nw_dst; nf_rec->nexthop = htonl(0); if (nf->add_id_to_iface) { uint16_t iface = (nf->engine_id & 0x7f) << 9; - nf_rec->input = htons(iface - | (ofp_to_u16(expired->flow.in_port.ofp_port) & 0x1ff)); + nf_rec->input = htons(iface | (ofp_to_u16(nf_flow->in_port) & 0x1ff)); nf_rec->output = htons(iface | (ofp_to_u16(nf_flow->output_iface) & 0x1ff)); } else { - nf_rec->input = htons(ofp_to_u16(expired->flow.in_port.ofp_port)); + nf_rec->input = htons(ofp_to_u16(nf_flow->in_port)); nf_rec->output = htons(ofp_to_u16(nf_flow->output_iface)); } nf_rec->packet_count = htonl(packet_count); nf_rec->byte_count = htonl(byte_count); nf_rec->init_time = htonl(nf_flow->created - nf->boot_time); - nf_rec->used_time = htonl(MAX(nf_flow->created, expired->used) + nf_rec->used_time = htonl(MAX(nf_flow->created, nf_flow->used) - nf->boot_time); - if (expired->flow.nw_proto == IPPROTO_ICMP) { + if (nf_flow->nw_proto == IPPROTO_ICMP) { /* In NetFlow, the ICMP type and code are concatenated and * placed in the 'dst_port' field. */ - uint8_t type = ntohs(expired->flow.tp_src); - uint8_t code = ntohs(expired->flow.tp_dst); + uint8_t type = ntohs(nf_flow->tp_src); + uint8_t code = ntohs(nf_flow->tp_dst); nf_rec->src_port = htons(0); nf_rec->dst_port = htons((type << 8) | code); } else { - nf_rec->src_port = expired->flow.tp_src; - nf_rec->dst_port = expired->flow.tp_dst; + nf_rec->src_port = nf_flow->tp_src; + nf_rec->dst_port = nf_flow->tp_dst; } - nf_rec->tcp_flags = nf_flow->tcp_flags; - nf_rec->ip_proto = expired->flow.nw_proto; - nf_rec->ip_tos = expired->flow.nw_tos & IP_DSCP_MASK; + nf_rec->tcp_flags = (uint8_t) nf_flow->tcp_flags; + nf_rec->ip_proto = nf_flow->nw_proto; + nf_rec->ip_tos = nf_flow->nw_tos & IP_DSCP_MASK; /* NetFlow messages are limited to 30 records. */ if (ntohs(nf_hdr->count) >= 30) { - netflow_run(nf); + netflow_run__(nf); } } void -netflow_expire(struct netflow *nf, struct netflow_flow *nf_flow, - struct ofexpired *expired) +netflow_flow_update(struct netflow *nf, const struct flow *flow, + ofp_port_t output_iface, + const struct dpif_flow_stats *stats) + OVS_EXCLUDED(mutex) { - uint64_t pkt_delta = expired->packet_count - nf_flow->packet_count_off; - uint64_t byte_delta = expired->byte_count - nf_flow->byte_count_off; + struct netflow_flow *nf_flow; + long long int used; + + /* NetFlow only reports on IP packets. */ + if (flow->dl_type != htons(ETH_TYPE_IP)) { + return; + } + + ovs_mutex_lock(&mutex); + nf_flow = netflow_flow_lookup(nf, flow); + if (!nf_flow) { + nf_flow = xzalloc(sizeof *nf_flow); + nf_flow->in_port = flow->in_port.ofp_port; + nf_flow->nw_src = flow->nw_src; + nf_flow->nw_dst = flow->nw_dst; + nf_flow->nw_tos = flow->nw_tos; + nf_flow->nw_proto = flow->nw_proto; + nf_flow->tp_src = flow->tp_src; + nf_flow->tp_dst = flow->tp_dst; + nf_flow->created = stats->used; + nf_flow->output_iface = output_iface; + hmap_insert(&nf->flows, &nf_flow->hmap_node, netflow_flow_hash(flow)); + } + + if (nf_flow->output_iface != output_iface) { + netflow_expire__(nf, nf_flow); + nf_flow->created = stats->used; + nf_flow->output_iface = output_iface; + } + + nf_flow->packet_count += stats->n_packets; + nf_flow->byte_count += stats->n_bytes; + nf_flow->tcp_flags |= stats->tcp_flags; + + used = MAX(nf_flow->used, stats->used); + if (nf_flow->used != used) { + nf_flow->used = used; + if (!nf->active_timeout || !nf_flow->last_expired + || nf->reconfig_time > nf_flow->last_expired) { + /* Keep the time updated to prevent a flood of expiration in + * the future. */ + nf_flow->last_expired = time_msec(); + } + } + + ovs_mutex_unlock(&mutex); +} + +static void +netflow_expire__(struct netflow *nf, struct netflow_flow *nf_flow) + OVS_REQUIRES(mutex) +{ + uint64_t pkts, bytes; + + pkts = nf_flow->packet_count; + bytes = nf_flow->byte_count; nf_flow->last_expired += nf->active_timeout; - /* NetFlow only reports on IP packets and we should only report flows - * that actually have traffic. */ - if (expired->flow.dl_type != htons(ETH_TYPE_IP) || pkt_delta == 0) { + if (pkts == 0) { return; } - if ((byte_delta >> 32) <= 175) { + if ((bytes >> 32) <= 175) { /* NetFlow v5 records are limited to 32-bit counters. If we've wrapped * a counter, send as multiple records so we don't lose track of any * traffic. We try to evenly distribute the packet and byte counters, * so that the bytes-per-packet lengths don't look wonky across the * records. */ - while (byte_delta) { - int n_recs = (byte_delta + UINT32_MAX - 1) / UINT32_MAX; - uint32_t pkt_count = pkt_delta / n_recs; - uint32_t byte_count = byte_delta / n_recs; + while (bytes) { + int n_recs = (bytes + UINT32_MAX - 1) / UINT32_MAX; + uint32_t pkt_count = pkts / n_recs; + uint32_t byte_count = bytes / n_recs; - gen_netflow_rec(nf, nf_flow, expired, pkt_count, byte_count); + gen_netflow_rec(nf, nf_flow, pkt_count, byte_count); - pkt_delta -= pkt_count; - byte_delta -= byte_count; + pkts -= pkt_count; + bytes -= byte_count; } } else { /* In 600 seconds, a 10GbE link can theoretically transmit 75 * 10**10 @@ -174,52 +266,95 @@ netflow_expire(struct netflow *nf, struct netflow_flow *nf_flow, */ static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 1); - VLOG_WARN_RL(&rl, "impossible byte counter %"PRIu64, byte_delta); + VLOG_WARN_RL(&rl, "impossible byte counter %"PRIu64, bytes); } /* Update flow tracking data. */ - nf_flow->created = 0; - nf_flow->packet_count_off = expired->packet_count; - nf_flow->byte_count_off = expired->byte_count; + nf_flow->packet_count = 0; + nf_flow->byte_count = 0; nf_flow->tcp_flags = 0; } +void +netflow_flow_clear(struct netflow *nf, const struct flow *flow) + OVS_EXCLUDED(mutex) +{ + struct netflow_flow *nf_flow; + + ovs_mutex_lock(&mutex); + nf_flow = netflow_flow_lookup(nf, flow); + if (nf_flow) { + netflow_expire__(nf, nf_flow); + hmap_remove(&nf->flows, &nf_flow->hmap_node); + free(nf_flow); + } + ovs_mutex_unlock(&mutex); +} + /* Returns true if it's time to send out a round of NetFlow active timeouts, * false otherwise. */ -bool -netflow_run(struct netflow *nf) +static void +netflow_run__(struct netflow *nf) OVS_REQUIRES(mutex) { + long long int now = time_msec(); + struct netflow_flow *nf_flow, *next; + if (nf->packet.size) { collectors_send(nf->collectors, nf->packet.data, nf->packet.size); nf->packet.size = 0; } - if (nf->active_timeout && time_msec() >= nf->next_timeout) { - nf->next_timeout = time_msec() + 1000; - return true; - } else { - return false; + if (!nf->active_timeout || now < nf->next_timeout) { + return; } + + nf->next_timeout = now + 1000; + + HMAP_FOR_EACH_SAFE (nf_flow, next, hmap_node, &nf->flows) { + if (now > nf_flow->last_expired + nf->active_timeout) { + bool idle = nf_flow->used < nf_flow->last_expired; + netflow_expire__(nf, nf_flow); + + if (idle) { + /* If the netflow_flow hasn't been used in a while, it's + * possible the upper layer lost track of it. */ + hmap_remove(&nf->flows, &nf_flow->hmap_node); + free(nf_flow); + } + } + } +} + +void +netflow_run(struct netflow *nf) +{ + ovs_mutex_lock(&mutex); + netflow_run__(nf); + ovs_mutex_unlock(&mutex); } void -netflow_wait(struct netflow *nf) +netflow_wait(struct netflow *nf) OVS_EXCLUDED(mutex) { + ovs_mutex_lock(&mutex); if (nf->active_timeout) { poll_timer_wait_until(nf->next_timeout); } if (nf->packet.size) { poll_immediate_wake(); } + ovs_mutex_unlock(&mutex); } int netflow_set_options(struct netflow *nf, const struct netflow_options *nf_options) + OVS_EXCLUDED(mutex) { int error = 0; long long int old_timeout; + ovs_mutex_lock(&mutex); nf->engine_type = nf_options->engine_type; nf->engine_id = nf_options->engine_id; nf->add_id_to_iface = nf_options->add_id_to_iface; @@ -238,6 +373,7 @@ netflow_set_options(struct netflow *nf, nf->reconfig_time = time_msec(); nf->next_timeout = time_msec(); } + ovs_mutex_unlock(&mutex); return error; } @@ -246,71 +382,87 @@ struct netflow * netflow_create(void) { struct netflow *nf = xzalloc(sizeof *nf); + nf->engine_type = 0; nf->engine_id = 0; nf->boot_time = time_msec(); nf->collectors = NULL; nf->add_id_to_iface = false; nf->netflow_cnt = 0; + hmap_init(&nf->flows); + ovs_refcount_init(&nf->ref_cnt); ofpbuf_init(&nf->packet, 1500); + atomic_count_inc(&netflow_count); return nf; } -void -netflow_destroy(struct netflow *nf) +struct netflow * +netflow_ref(const struct netflow *nf_) { + struct netflow *nf = CONST_CAST(struct netflow *, nf_); if (nf) { - ofpbuf_uninit(&nf->packet); - collectors_destroy(nf->collectors); - free(nf); + ovs_refcount_ref(&nf->ref_cnt); } + return nf; } -/* Initializes a new 'nf_flow' given that the caller has already cleared it to - * all-zero-bits. */ void -netflow_flow_init(struct netflow_flow *nf_flow OVS_UNUSED) +netflow_unref(struct netflow *nf) { - /* Nothing to do. */ + if (nf && ovs_refcount_unref_relaxed(&nf->ref_cnt) == 1) { + atomic_count_dec(&netflow_count); + collectors_destroy(nf->collectors); + ofpbuf_uninit(&nf->packet); + free(nf); + } } -void -netflow_flow_clear(struct netflow_flow *nf_flow) +/* Returns true if there exist any netflow objects, false otherwise. + * Callers must cope with transient false positives, i.e., there is no tight + * synchronization with the count and the actual existence of netflow objects. + */ +bool +netflow_exists(void) { - ofp_port_t output_iface = nf_flow->output_iface; - - memset(nf_flow, 0, sizeof *nf_flow); - nf_flow->output_iface = output_iface; + return atomic_count_get(&netflow_count) > 0; } + +/* Helpers. */ -void -netflow_flow_update_time(struct netflow *nf, struct netflow_flow *nf_flow, - long long int used) +static struct netflow_flow * +netflow_flow_lookup(const struct netflow *nf, const struct flow *flow) + OVS_REQUIRES(mutex) { - if (!nf_flow->created) { - nf_flow->created = used; + struct netflow_flow *nf_flow; + + HMAP_FOR_EACH_WITH_HASH (nf_flow, hmap_node, netflow_flow_hash(flow), + &nf->flows) { + if (flow->in_port.ofp_port == nf_flow->in_port + && flow->nw_src == nf_flow->nw_src + && flow->nw_dst == nf_flow->nw_dst + && flow->nw_tos == nf_flow->nw_tos + && flow->nw_proto == nf_flow->nw_proto + && flow->tp_src == nf_flow->tp_src + && flow->tp_dst == nf_flow->tp_dst) { + return nf_flow; + } } - if (!nf || !nf->active_timeout || !nf_flow->last_expired || - nf->reconfig_time > nf_flow->last_expired) { - /* Keep the time updated to prevent a flood of expiration in - * the future. */ - nf_flow->last_expired = time_msec(); - } + return NULL; } -void -netflow_flow_update_flags(struct netflow_flow *nf_flow, uint8_t tcp_flags) +static uint32_t +netflow_flow_hash(const struct flow *flow) { - nf_flow->tcp_flags |= tcp_flags; -} + uint32_t hash = 0; -bool -netflow_active_timeout_expired(struct netflow *nf, struct netflow_flow *nf_flow) -{ - if (nf->active_timeout) { - return time_msec() > nf_flow->last_expired + nf->active_timeout; - } + hash = hash_add(hash, (OVS_FORCE uint32_t) flow->in_port.ofp_port); + hash = hash_add(hash, ntohl(flow->nw_src)); + hash = hash_add(hash, ntohl(flow->nw_dst)); + hash = hash_add(hash, flow->nw_tos); + hash = hash_add(hash, flow->nw_proto); + hash = hash_add(hash, ntohs(flow->tp_src)); + hash = hash_add(hash, ntohs(flow->tp_dst)); - return false; + return hash_finish(hash, 28); }