| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | /*
 | 
					
						
							| 
									
										
										
										
											2010-10-08 16:36:13 -07:00
										 |  |  |  * Copyright (c) 2009, 2010 Nicira Networks. | 
					
						
							|  |  |  |  * Copyright (c) 2009 InMon Corp. | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |  * | 
					
						
							|  |  |  |  * Licensed under the Apache License, Version 2.0 (the "License"); | 
					
						
							|  |  |  |  * you may not use this file except in compliance with the License. | 
					
						
							|  |  |  |  * You may obtain a copy of the License at: | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  *     http://www.apache.org/licenses/LICENSE-2.0
 | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  |  * distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  |  * See the License for the specific language governing permissions and | 
					
						
							|  |  |  |  * limitations under the License. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <config.h>
 | 
					
						
							|  |  |  | #include "ofproto-sflow.h"
 | 
					
						
							|  |  |  | #include <inttypes.h>
 | 
					
						
							|  |  |  | #include <stdlib.h>
 | 
					
						
							|  |  |  | #include "collectors.h"
 | 
					
						
							|  |  |  | #include "dpif.h"
 | 
					
						
							|  |  |  | #include "compiler.h"
 | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  | #include "hash.h"
 | 
					
						
							|  |  |  | #include "hmap.h"
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | #include "netdev.h"
 | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  | #include "netlink.h"
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | #include "ofpbuf.h"
 | 
					
						
							|  |  |  | #include "ofproto.h"
 | 
					
						
							| 
									
										
										
										
											2010-10-08 16:26:21 -07:00
										 |  |  | #include "packets.h"
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | #include "poll-loop.h"
 | 
					
						
							|  |  |  | #include "sflow_api.h"
 | 
					
						
							|  |  |  | #include "socket-util.h"
 | 
					
						
							|  |  |  | #include "timeval.h"
 | 
					
						
							|  |  |  | #include "vlog.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-19 14:47:01 -07:00
										 |  |  | VLOG_DEFINE_THIS_MODULE(sflow); | 
					
						
							| 
									
										
										
										
											2010-07-16 11:02:49 -07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | struct ofproto_sflow_port { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     struct hmap_node hmap_node; /* In struct ofproto_sflow's "ports" hmap. */ | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     struct netdev *netdev;      /* Underlying network device, for stats. */ | 
					
						
							|  |  |  |     SFLDataSource_instance dsi; /* sFlow library's notion of port number. */ | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     uint16_t odp_port;          /* ODP port number. */ | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | struct ofproto_sflow { | 
					
						
							|  |  |  |     struct ofproto *ofproto; | 
					
						
							|  |  |  |     struct collectors *collectors; | 
					
						
							|  |  |  |     SFLAgent *sflow_agent; | 
					
						
							|  |  |  |     struct ofproto_sflow_options *options; | 
					
						
							|  |  |  |     struct dpif *dpif; | 
					
						
							|  |  |  |     time_t next_tick; | 
					
						
							|  |  |  |     size_t n_flood, n_all; | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     struct hmap ports;          /* Contains "struct ofproto_sflow_port"s. */ | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  | static void ofproto_sflow_del_port__(struct ofproto_sflow *, | 
					
						
							|  |  |  |                                      struct ofproto_sflow_port *); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | #define RECEIVER_INDEX 1
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 5); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-11 11:07:59 -08:00
										 |  |  | static bool | 
					
						
							|  |  |  | nullable_string_is_equal(const char *a, const char *b) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     return a ? b && !strcmp(a, b) : !b; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | static bool | 
					
						
							|  |  |  | ofproto_sflow_options_equal(const struct ofproto_sflow_options *a, | 
					
						
							|  |  |  |                             const struct ofproto_sflow_options *b) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     return (svec_equal(&a->targets, &b->targets) | 
					
						
							|  |  |  |             && a->sampling_rate == b->sampling_rate | 
					
						
							|  |  |  |             && a->polling_interval == b->polling_interval | 
					
						
							|  |  |  |             && a->header_len == b->header_len | 
					
						
							|  |  |  |             && a->sub_id == b->sub_id | 
					
						
							| 
									
										
										
										
											2010-01-11 11:07:59 -08:00
										 |  |  |             && nullable_string_is_equal(a->agent_device, b->agent_device) | 
					
						
							|  |  |  |             && nullable_string_is_equal(a->control_ip, b->control_ip)); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static struct ofproto_sflow_options * | 
					
						
							|  |  |  | ofproto_sflow_options_clone(const struct ofproto_sflow_options *old) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow_options *new = xmemdup(old, sizeof *old); | 
					
						
							| 
									
										
										
										
											2010-01-11 11:07:59 -08:00
										 |  |  |     svec_clone(&new->targets, &old->targets); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     new->agent_device = old->agent_device ? xstrdup(old->agent_device) : NULL; | 
					
						
							|  |  |  |     new->control_ip = old->control_ip ? xstrdup(old->control_ip) : NULL; | 
					
						
							|  |  |  |     return new; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static void | 
					
						
							|  |  |  | ofproto_sflow_options_destroy(struct ofproto_sflow_options *options) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (options) { | 
					
						
							| 
									
										
										
										
											2010-01-11 11:07:59 -08:00
										 |  |  |         svec_destroy(&options->targets); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         free(options->agent_device); | 
					
						
							|  |  |  |         free(options->control_ip); | 
					
						
							|  |  |  |         free(options); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* sFlow library callback to allocate memory. */ | 
					
						
							|  |  |  | static void * | 
					
						
							| 
									
										
										
										
											2010-02-11 10:59:47 -08:00
										 |  |  | sflow_agent_alloc_cb(void *magic OVS_UNUSED, SFLAgent *agent OVS_UNUSED, | 
					
						
							|  |  |  |                      size_t bytes) | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | { | 
					
						
							|  |  |  |     return calloc(1, bytes); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* sFlow library callback to free memory. */ | 
					
						
							|  |  |  | static int | 
					
						
							| 
									
										
										
										
											2010-02-11 10:59:47 -08:00
										 |  |  | sflow_agent_free_cb(void *magic OVS_UNUSED, SFLAgent *agent OVS_UNUSED, | 
					
						
							|  |  |  |                     void *obj) | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | { | 
					
						
							|  |  |  |     free(obj); | 
					
						
							|  |  |  |     return 0; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* sFlow library callback to report error. */ | 
					
						
							|  |  |  | static void | 
					
						
							| 
									
										
										
										
											2010-02-11 10:59:47 -08:00
										 |  |  | sflow_agent_error_cb(void *magic OVS_UNUSED, SFLAgent *agent OVS_UNUSED, | 
					
						
							|  |  |  |                      char *msg) | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | { | 
					
						
							|  |  |  |     VLOG_WARN("sFlow agent error: %s", msg); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* sFlow library callback to send datagram. */ | 
					
						
							|  |  |  | static void | 
					
						
							| 
									
										
										
										
											2010-02-11 10:59:47 -08:00
										 |  |  | sflow_agent_send_packet_cb(void *os_, SFLAgent *agent OVS_UNUSED, | 
					
						
							|  |  |  |                            SFLReceiver *receiver OVS_UNUSED, u_char *pkt, | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |                            uint32_t pktLen) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow *os = os_; | 
					
						
							|  |  |  |     collectors_send(os->collectors, pkt, pktLen); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  | static struct ofproto_sflow_port * | 
					
						
							|  |  |  | ofproto_sflow_find_port(const struct ofproto_sflow *os, uint16_t odp_port) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow_port *osp; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-17 10:33:10 -07:00
										 |  |  |     HMAP_FOR_EACH_IN_BUCKET (osp, hmap_node, | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |                              hash_int(odp_port, 0), &os->ports) { | 
					
						
							|  |  |  |         if (osp->odp_port == odp_port) { | 
					
						
							|  |  |  |             return osp; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     return NULL; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | static void | 
					
						
							|  |  |  | sflow_agent_get_counters(void *os_, SFLPoller *poller, | 
					
						
							|  |  |  |                          SFL_COUNTERS_SAMPLE_TYPE *cs) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow *os = os_; | 
					
						
							|  |  |  |     SFLCounters_sample_element elem; | 
					
						
							|  |  |  |     struct ofproto_sflow_port *osp; | 
					
						
							|  |  |  |     SFLIf_counters *counters; | 
					
						
							|  |  |  |     struct netdev_stats stats; | 
					
						
							|  |  |  |     enum netdev_flags flags; | 
					
						
							|  |  |  |     uint32_t current; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     osp = ofproto_sflow_find_port(os, poller->bridgePort); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     if (!osp) { | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     elem.tag = SFLCOUNTERS_GENERIC; | 
					
						
							|  |  |  |     counters = &elem.counterBlock.generic; | 
					
						
							|  |  |  |     counters->ifIndex = SFL_DS_INDEX(poller->dsi); | 
					
						
							|  |  |  |     counters->ifType = 6; | 
					
						
							|  |  |  |     if (!netdev_get_features(osp->netdev, ¤t, NULL, NULL, NULL)) { | 
					
						
							| 
									
										
										
										
											2010-01-11 11:08:29 -08:00
										 |  |  |       /* The values of ifDirection come from MAU MIB (RFC 2668): 0 = unknown,
 | 
					
						
							|  |  |  |          1 = full-duplex, 2 = half-duplex, 3 = in, 4=out */ | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         counters->ifSpeed = netdev_features_to_bps(current); | 
					
						
							|  |  |  |         counters->ifDirection = (netdev_features_is_full_duplex(current) | 
					
						
							|  |  |  |                                  ? 1 : 2); | 
					
						
							|  |  |  |     } else { | 
					
						
							|  |  |  |         counters->ifSpeed = 100000000; | 
					
						
							| 
									
										
										
										
											2010-01-11 11:08:29 -08:00
										 |  |  |         counters->ifDirection = 0; | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     } | 
					
						
							|  |  |  |     if (!netdev_get_flags(osp->netdev, &flags) && flags & NETDEV_UP) { | 
					
						
							|  |  |  |         counters->ifStatus = 1; /* ifAdminStatus up. */ | 
					
						
							| 
									
										
										
										
											2010-10-27 15:29:16 -07:00
										 |  |  |         if (netdev_get_carrier(osp->netdev)) { | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |             counters->ifStatus |= 2; /* ifOperStatus us. */ | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } else { | 
					
						
							|  |  |  |         counters->ifStatus = 0;  /* Down. */ | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* XXX
 | 
					
						
							|  |  |  |        1. Is the multicast counter filled in? | 
					
						
							|  |  |  |        2. Does the multicast counter include broadcasts? | 
					
						
							|  |  |  |        3. Does the rx_packets counter include multicasts/broadcasts? | 
					
						
							|  |  |  |     */ | 
					
						
							|  |  |  |     netdev_get_stats(osp->netdev, &stats); | 
					
						
							|  |  |  |     counters->ifInOctets = stats.rx_bytes; | 
					
						
							|  |  |  |     counters->ifInUcastPkts = stats.rx_packets; | 
					
						
							|  |  |  |     counters->ifInMulticastPkts = stats.multicast; | 
					
						
							|  |  |  |     counters->ifInBroadcastPkts = -1; | 
					
						
							|  |  |  |     counters->ifInDiscards = stats.rx_dropped; | 
					
						
							|  |  |  |     counters->ifInErrors = stats.rx_errors; | 
					
						
							|  |  |  |     counters->ifInUnknownProtos = -1; | 
					
						
							|  |  |  |     counters->ifOutOctets = stats.tx_bytes; | 
					
						
							|  |  |  |     counters->ifOutUcastPkts = stats.tx_packets; | 
					
						
							|  |  |  |     counters->ifOutMulticastPkts = -1; | 
					
						
							|  |  |  |     counters->ifOutBroadcastPkts = -1; | 
					
						
							|  |  |  |     counters->ifOutDiscards = stats.tx_dropped; | 
					
						
							|  |  |  |     counters->ifOutErrors = stats.tx_errors; | 
					
						
							|  |  |  |     counters->ifPromiscuousMode = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     SFLADD_ELEMENT(cs, &elem); | 
					
						
							|  |  |  |     sfl_poller_writeCountersSample(poller, cs); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* Obtains an address to use for the local sFlow agent and stores it into
 | 
					
						
							|  |  |  |  * '*agent_addr'.  Returns true if successful, false on failure. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * The sFlow agent address should be a local IP address that is persistent and | 
					
						
							|  |  |  |  * reachable over the network, if possible.  The IP address associated with | 
					
						
							|  |  |  |  * 'agent_device' is used if it has one, and otherwise 'control_ip', the IP | 
					
						
							|  |  |  |  * address used to talk to the controller. */ | 
					
						
							|  |  |  | static bool | 
					
						
							|  |  |  | sflow_choose_agent_address(const char *agent_device, const char *control_ip, | 
					
						
							|  |  |  |                            SFLAddress *agent_addr) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct in_addr in4; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     memset(agent_addr, 0, sizeof *agent_addr); | 
					
						
							|  |  |  |     agent_addr->type = SFLADDRESSTYPE_IP_V4; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (agent_device) { | 
					
						
							|  |  |  |         struct netdev *netdev; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-02-05 15:58:27 -08:00
										 |  |  |         if (!netdev_open_default(agent_device, &netdev)) { | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |             int error = netdev_get_in4(netdev, &in4, NULL); | 
					
						
							|  |  |  |             netdev_close(netdev); | 
					
						
							|  |  |  |             if (!error) { | 
					
						
							|  |  |  |                 goto success; | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (control_ip && !lookup_ip(control_ip, &in4)) { | 
					
						
							|  |  |  |         goto success; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     VLOG_ERR("could not determine IP address for sFlow agent"); | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | success: | 
					
						
							|  |  |  |     agent_addr->address.ip_v4.addr = in4.s_addr; | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_clear(struct ofproto_sflow *os) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (os->sflow_agent) { | 
					
						
							|  |  |  |         sfl_agent_release(os->sflow_agent); | 
					
						
							|  |  |  |         os->sflow_agent = NULL; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     collectors_destroy(os->collectors); | 
					
						
							|  |  |  |     os->collectors = NULL; | 
					
						
							|  |  |  |     ofproto_sflow_options_destroy(os->options); | 
					
						
							|  |  |  |     os->options = NULL; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Turn off sampling to save CPU cycles. */ | 
					
						
							|  |  |  |     dpif_set_sflow_probability(os->dpif, 0); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool | 
					
						
							|  |  |  | ofproto_sflow_is_enabled(const struct ofproto_sflow *os) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     return os->collectors != NULL; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | struct ofproto_sflow * | 
					
						
							|  |  |  | ofproto_sflow_create(struct dpif *dpif) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow *os; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     os = xcalloc(1, sizeof *os); | 
					
						
							|  |  |  |     os->dpif = dpif; | 
					
						
							|  |  |  |     os->next_tick = time_now() + 1; | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     hmap_init(&os->ports); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     return os; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_destroy(struct ofproto_sflow *os) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (os) { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |         struct ofproto_sflow_port *osp, *next; | 
					
						
							| 
									
										
										
										
											2010-05-07 09:29:02 -07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         ofproto_sflow_clear(os); | 
					
						
							| 
									
										
										
										
											2010-09-17 10:33:10 -07:00
										 |  |  |         HMAP_FOR_EACH_SAFE (osp, next, hmap_node, &os->ports) { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |             ofproto_sflow_del_port__(os, osp); | 
					
						
							| 
									
										
										
										
											2010-05-07 09:29:02 -07:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |         hmap_destroy(&os->ports); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         free(os); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | static void | 
					
						
							|  |  |  | ofproto_sflow_add_poller(struct ofproto_sflow *os, | 
					
						
							|  |  |  |                          struct ofproto_sflow_port *osp, uint16_t odp_port) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     SFLPoller *poller = sfl_agent_addPoller(os->sflow_agent, &osp->dsi, os, | 
					
						
							|  |  |  |                                             sflow_agent_get_counters); | 
					
						
							|  |  |  |     sfl_poller_set_sFlowCpInterval(poller, os->options->polling_interval); | 
					
						
							|  |  |  |     sfl_poller_set_sFlowCpReceiver(poller, RECEIVER_INDEX); | 
					
						
							|  |  |  |     sfl_poller_set_bridgePort(poller, odp_port); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
											  
											
												sflow: Fix sFlow sampling structure.
According to Neil McKee, in an email archived at
http://openvswitch.org/pipermail/dev_openvswitch.org/2010-January/000934.html:
    The containment rule is that a given sflow-datasource (sampler or
    poller) should be scoped within only one sflow-agent (or
    sub-agent).  So the issue arrises when you have two
    switches/datapaths defined on the same host being managed with
    the same IP address: each switch is a separate sub-agent, so they
    can run independently (e.g. with their own sequence numbers) but
    they can't both claim to speak for the same sflow-datasource.
    Specifically, they can't both represent the <ifindex>:0
    data-source.  This containment rule is necessary so that the
    sFlow collector can scale and combine the results accurately.
    One option would be to stick with the <ifindex>:0 data-source but
    elevate it to be global across all bridges, with a global
    sample_pool and a global sflow_agent.  Not tempting.  Better to
    go the other way and allow each interface to have it's own
    sampler, just as it already has it's own poller.  The ifIndex
    numbers are globally unique across all switches/datapaths on the
    host, so the containment is now clean.  Datasource <ifindex>:5
    might be on one switch, whille <ifindex>:7 can be on another.
    Other benefits are that 1) you can support the option of
    overriding the default sampling-rate on an interface-by-interface
    basis, and 2) this is how most sFlow implementations are coded,
    so there will be no surprises or interoperability issues with any
    sFlow collectors out there.
This commit implements the approach suggested by Neil.
This commit uses an atomic_t to represent the sampling pool.  This is
because we do want access to it to be atomic, but we expect that it will
"mostly" be accessed from a single CPU at a time.  Perhaps this is a bad
assumption; we can always switch to another form of synchronization later.
CC: Neil McKee <neil.mckee@inmon.com>
											
										 
											2010-01-20 13:52:42 -08:00
										 |  |  | static void | 
					
						
							|  |  |  | ofproto_sflow_add_sampler(struct ofproto_sflow *os, | 
					
						
							| 
									
										
										
										
											2010-05-05 13:26:23 -07:00
										 |  |  | 			  struct ofproto_sflow_port *osp) | 
					
						
							| 
									
										
											  
											
												sflow: Fix sFlow sampling structure.
According to Neil McKee, in an email archived at
http://openvswitch.org/pipermail/dev_openvswitch.org/2010-January/000934.html:
    The containment rule is that a given sflow-datasource (sampler or
    poller) should be scoped within only one sflow-agent (or
    sub-agent).  So the issue arrises when you have two
    switches/datapaths defined on the same host being managed with
    the same IP address: each switch is a separate sub-agent, so they
    can run independently (e.g. with their own sequence numbers) but
    they can't both claim to speak for the same sflow-datasource.
    Specifically, they can't both represent the <ifindex>:0
    data-source.  This containment rule is necessary so that the
    sFlow collector can scale and combine the results accurately.
    One option would be to stick with the <ifindex>:0 data-source but
    elevate it to be global across all bridges, with a global
    sample_pool and a global sflow_agent.  Not tempting.  Better to
    go the other way and allow each interface to have it's own
    sampler, just as it already has it's own poller.  The ifIndex
    numbers are globally unique across all switches/datapaths on the
    host, so the containment is now clean.  Datasource <ifindex>:5
    might be on one switch, whille <ifindex>:7 can be on another.
    Other benefits are that 1) you can support the option of
    overriding the default sampling-rate on an interface-by-interface
    basis, and 2) this is how most sFlow implementations are coded,
    so there will be no surprises or interoperability issues with any
    sFlow collectors out there.
This commit implements the approach suggested by Neil.
This commit uses an atomic_t to represent the sampling pool.  This is
because we do want access to it to be atomic, but we expect that it will
"mostly" be accessed from a single CPU at a time.  Perhaps this is a bad
assumption; we can always switch to another form of synchronization later.
CC: Neil McKee <neil.mckee@inmon.com>
											
										 
											2010-01-20 13:52:42 -08:00
										 |  |  | { | 
					
						
							|  |  |  |     SFLSampler *sampler = sfl_agent_addSampler(os->sflow_agent, &osp->dsi); | 
					
						
							| 
									
										
										
										
											2010-05-05 13:26:23 -07:00
										 |  |  |     sfl_sampler_set_sFlowFsPacketSamplingRate(sampler, os->options->sampling_rate); | 
					
						
							|  |  |  |     sfl_sampler_set_sFlowFsMaximumHeaderSize(sampler, os->options->header_len); | 
					
						
							| 
									
										
											  
											
												sflow: Fix sFlow sampling structure.
According to Neil McKee, in an email archived at
http://openvswitch.org/pipermail/dev_openvswitch.org/2010-January/000934.html:
    The containment rule is that a given sflow-datasource (sampler or
    poller) should be scoped within only one sflow-agent (or
    sub-agent).  So the issue arrises when you have two
    switches/datapaths defined on the same host being managed with
    the same IP address: each switch is a separate sub-agent, so they
    can run independently (e.g. with their own sequence numbers) but
    they can't both claim to speak for the same sflow-datasource.
    Specifically, they can't both represent the <ifindex>:0
    data-source.  This containment rule is necessary so that the
    sFlow collector can scale and combine the results accurately.
    One option would be to stick with the <ifindex>:0 data-source but
    elevate it to be global across all bridges, with a global
    sample_pool and a global sflow_agent.  Not tempting.  Better to
    go the other way and allow each interface to have it's own
    sampler, just as it already has it's own poller.  The ifIndex
    numbers are globally unique across all switches/datapaths on the
    host, so the containment is now clean.  Datasource <ifindex>:5
    might be on one switch, whille <ifindex>:7 can be on another.
    Other benefits are that 1) you can support the option of
    overriding the default sampling-rate on an interface-by-interface
    basis, and 2) this is how most sFlow implementations are coded,
    so there will be no surprises or interoperability issues with any
    sFlow collectors out there.
This commit implements the approach suggested by Neil.
This commit uses an atomic_t to represent the sampling pool.  This is
because we do want access to it to be atomic, but we expect that it will
"mostly" be accessed from a single CPU at a time.  Perhaps this is a bad
assumption; we can always switch to another form of synchronization later.
CC: Neil McKee <neil.mckee@inmon.com>
											
										 
											2010-01-20 13:52:42 -08:00
										 |  |  |     sfl_sampler_set_sFlowFsReceiver(sampler, RECEIVER_INDEX); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_add_port(struct ofproto_sflow *os, uint16_t odp_port, | 
					
						
							|  |  |  |                        const char *netdev_name) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow_port *osp; | 
					
						
							|  |  |  |     struct netdev *netdev; | 
					
						
							|  |  |  |     uint32_t ifindex; | 
					
						
							|  |  |  |     int error; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     ofproto_sflow_del_port(os, odp_port); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Open network device. */ | 
					
						
							| 
									
										
										
										
											2010-02-05 15:58:27 -08:00
										 |  |  |     error = netdev_open_default(netdev_name, &netdev); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     if (error) { | 
					
						
							|  |  |  |         VLOG_WARN_RL(&rl, "failed to open network device \"%s\": %s", | 
					
						
							|  |  |  |                      netdev_name, strerror(error)); | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Add to table of ports. */ | 
					
						
							|  |  |  |     osp = xmalloc(sizeof *osp); | 
					
						
							|  |  |  |     osp->netdev = netdev; | 
					
						
							|  |  |  |     ifindex = netdev_get_ifindex(netdev); | 
					
						
							|  |  |  |     if (ifindex <= 0) { | 
					
						
							|  |  |  |         ifindex = (os->sflow_agent->subId << 16) + odp_port; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     SFL_DS_SET(osp->dsi, 0, ifindex, 0); | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     osp->odp_port = odp_port; | 
					
						
							|  |  |  |     hmap_insert(&os->ports, &osp->hmap_node, hash_int(odp_port, 0)); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-05-05 13:26:23 -07:00
										 |  |  |     /* Add poller and sampler. */ | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     if (os->sflow_agent) { | 
					
						
							|  |  |  |         ofproto_sflow_add_poller(os, osp, odp_port); | 
					
						
							| 
									
										
										
										
											2010-05-05 13:26:23 -07:00
										 |  |  |         ofproto_sflow_add_sampler(os, osp); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  | static void | 
					
						
							|  |  |  | ofproto_sflow_del_port__(struct ofproto_sflow *os, | 
					
						
							|  |  |  |                          struct ofproto_sflow_port *osp) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (os->sflow_agent) { | 
					
						
							|  |  |  |         sfl_agent_removePoller(os->sflow_agent, &osp->dsi); | 
					
						
							|  |  |  |         sfl_agent_removeSampler(os->sflow_agent, &osp->dsi); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     netdev_close(osp->netdev); | 
					
						
							|  |  |  |     hmap_remove(&os->ports, &osp->hmap_node); | 
					
						
							|  |  |  |     free(osp); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_del_port(struct ofproto_sflow *os, uint16_t odp_port) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     struct ofproto_sflow_port *osp = ofproto_sflow_find_port(os, odp_port); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     if (osp) { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |         ofproto_sflow_del_port__(os, osp); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_set_options(struct ofproto_sflow *os, | 
					
						
							|  |  |  |                           const struct ofproto_sflow_options *options) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     struct ofproto_sflow_port *osp; | 
					
						
							|  |  |  |     bool options_changed; | 
					
						
							|  |  |  |     SFLReceiver *receiver; | 
					
						
							|  |  |  |     SFLAddress agentIP; | 
					
						
							|  |  |  |     time_t now; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-11 11:09:14 -08:00
										 |  |  |     if (!options->targets.n || !options->sampling_rate) { | 
					
						
							|  |  |  |         /* No point in doing any work if there are no targets or nothing to
 | 
					
						
							|  |  |  |          * sample. */ | 
					
						
							|  |  |  |         ofproto_sflow_clear(os); | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     options_changed = (!os->options | 
					
						
							|  |  |  |                        || !ofproto_sflow_options_equal(options, os->options)); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Configure collectors if options have changed or if we're shortchanged in
 | 
					
						
							|  |  |  |      * collectors (which indicates that opening one or more of the configured | 
					
						
							|  |  |  |      * collectors failed, so that we should retry). */ | 
					
						
							|  |  |  |     if (options_changed | 
					
						
							|  |  |  |         || collectors_count(os->collectors) < options->targets.n) { | 
					
						
							|  |  |  |         collectors_destroy(os->collectors); | 
					
						
							| 
									
										
										
										
											2010-02-10 11:04:30 -08:00
										 |  |  |         collectors_create(&options->targets, SFL_DEFAULT_COLLECTOR_PORT, | 
					
						
							|  |  |  |                           &os->collectors); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         if (os->collectors == NULL) { | 
					
						
							| 
									
										
										
										
											2010-01-11 11:09:14 -08:00
										 |  |  |             VLOG_WARN_RL(&rl, "no collectors could be initialized, " | 
					
						
							|  |  |  |                          "sFlow disabled"); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |             ofproto_sflow_clear(os); | 
					
						
							|  |  |  |             return; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Avoid reconfiguring if options didn't change. */ | 
					
						
							|  |  |  |     if (!options_changed) { | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     ofproto_sflow_options_destroy(os->options); | 
					
						
							|  |  |  |     os->options = ofproto_sflow_options_clone(options); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Choose agent IP address. */ | 
					
						
							|  |  |  |     if (!sflow_choose_agent_address(options->agent_device, | 
					
						
							|  |  |  |                                     options->control_ip, &agentIP)) { | 
					
						
							|  |  |  |         ofproto_sflow_clear(os); | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Create agent. */ | 
					
						
							|  |  |  |     VLOG_INFO("creating sFlow agent %d", options->sub_id); | 
					
						
							|  |  |  |     if (os->sflow_agent) { | 
					
						
							|  |  |  |         sfl_agent_release(os->sflow_agent); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     os->sflow_agent = xcalloc(1, sizeof *os->sflow_agent); | 
					
						
							| 
									
										
										
										
											2010-06-08 17:18:48 -07:00
										 |  |  |     now = time_wall(); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     sfl_agent_init(os->sflow_agent, | 
					
						
							|  |  |  |                    &agentIP, | 
					
						
							|  |  |  |                    options->sub_id, | 
					
						
							|  |  |  |                    now,         /* Boot time. */ | 
					
						
							|  |  |  |                    now,         /* Current time. */ | 
					
						
							|  |  |  |                    os,          /* Pointer supplied to callbacks. */ | 
					
						
							|  |  |  |                    sflow_agent_alloc_cb, | 
					
						
							|  |  |  |                    sflow_agent_free_cb, | 
					
						
							|  |  |  |                    sflow_agent_error_cb, | 
					
						
							|  |  |  |                    sflow_agent_send_packet_cb); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     receiver = sfl_agent_addReceiver(os->sflow_agent); | 
					
						
							| 
									
										
										
										
											2010-01-11 11:10:01 -08:00
										 |  |  |     sfl_receiver_set_sFlowRcvrOwner(receiver, "Open vSwitch sFlow"); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     sfl_receiver_set_sFlowRcvrTimeout(receiver, 0xffffffff); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Set the sampling_rate down in the datapath. */ | 
					
						
							|  |  |  |     dpif_set_sflow_probability(os->dpif, | 
					
						
							|  |  |  |                                MAX(1, UINT32_MAX / options->sampling_rate)); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
											  
											
												sflow: Fix sFlow sampling structure.
According to Neil McKee, in an email archived at
http://openvswitch.org/pipermail/dev_openvswitch.org/2010-January/000934.html:
    The containment rule is that a given sflow-datasource (sampler or
    poller) should be scoped within only one sflow-agent (or
    sub-agent).  So the issue arrises when you have two
    switches/datapaths defined on the same host being managed with
    the same IP address: each switch is a separate sub-agent, so they
    can run independently (e.g. with their own sequence numbers) but
    they can't both claim to speak for the same sflow-datasource.
    Specifically, they can't both represent the <ifindex>:0
    data-source.  This containment rule is necessary so that the
    sFlow collector can scale and combine the results accurately.
    One option would be to stick with the <ifindex>:0 data-source but
    elevate it to be global across all bridges, with a global
    sample_pool and a global sflow_agent.  Not tempting.  Better to
    go the other way and allow each interface to have it's own
    sampler, just as it already has it's own poller.  The ifIndex
    numbers are globally unique across all switches/datapaths on the
    host, so the containment is now clean.  Datasource <ifindex>:5
    might be on one switch, whille <ifindex>:7 can be on another.
    Other benefits are that 1) you can support the option of
    overriding the default sampling-rate on an interface-by-interface
    basis, and 2) this is how most sFlow implementations are coded,
    so there will be no surprises or interoperability issues with any
    sFlow collectors out there.
This commit implements the approach suggested by Neil.
This commit uses an atomic_t to represent the sampling pool.  This is
because we do want access to it to be atomic, but we expect that it will
"mostly" be accessed from a single CPU at a time.  Perhaps this is a bad
assumption; we can always switch to another form of synchronization later.
CC: Neil McKee <neil.mckee@inmon.com>
											
										 
											2010-01-20 13:52:42 -08:00
										 |  |  |     /* Add samplers and pollers for the currently known ports. */ | 
					
						
							| 
									
										
										
										
											2010-09-17 10:33:10 -07:00
										 |  |  |     HMAP_FOR_EACH (osp, hmap_node, &os->ports) { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |         ofproto_sflow_add_poller(os, osp, osp->odp_port); | 
					
						
							| 
									
										
										
										
											2010-05-05 13:26:23 -07:00
										 |  |  |         ofproto_sflow_add_sampler(os, osp); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-06 10:24:52 -08:00
										 |  |  | static int | 
					
						
							|  |  |  | ofproto_sflow_odp_port_to_ifindex(const struct ofproto_sflow *os, | 
					
						
							|  |  |  |                                   uint16_t odp_port) | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2010-07-19 11:43:05 -07:00
										 |  |  |     struct ofproto_sflow_port *osp = ofproto_sflow_find_port(os, odp_port); | 
					
						
							| 
									
										
										
										
											2010-01-06 10:24:52 -08:00
										 |  |  |     return osp ? SFL_DS_INDEX(osp->dsi) : 0; | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | void | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  | ofproto_sflow_received(struct ofproto_sflow *os, | 
					
						
							|  |  |  |                        const struct dpif_upcall *upcall, | 
					
						
							|  |  |  |                        const struct flow *flow) | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | { | 
					
						
							|  |  |  |     SFL_FLOW_SAMPLE_TYPE fs; | 
					
						
							|  |  |  |     SFLFlow_sample_element hdrElem; | 
					
						
							|  |  |  |     SFLSampled_header *header; | 
					
						
							|  |  |  |     SFLFlow_sample_element switchElem; | 
					
						
							| 
									
										
											  
											
												sflow: Fix sFlow sampling structure.
According to Neil McKee, in an email archived at
http://openvswitch.org/pipermail/dev_openvswitch.org/2010-January/000934.html:
    The containment rule is that a given sflow-datasource (sampler or
    poller) should be scoped within only one sflow-agent (or
    sub-agent).  So the issue arrises when you have two
    switches/datapaths defined on the same host being managed with
    the same IP address: each switch is a separate sub-agent, so they
    can run independently (e.g. with their own sequence numbers) but
    they can't both claim to speak for the same sflow-datasource.
    Specifically, they can't both represent the <ifindex>:0
    data-source.  This containment rule is necessary so that the
    sFlow collector can scale and combine the results accurately.
    One option would be to stick with the <ifindex>:0 data-source but
    elevate it to be global across all bridges, with a global
    sample_pool and a global sflow_agent.  Not tempting.  Better to
    go the other way and allow each interface to have it's own
    sampler, just as it already has it's own poller.  The ifIndex
    numbers are globally unique across all switches/datapaths on the
    host, so the containment is now clean.  Datasource <ifindex>:5
    might be on one switch, whille <ifindex>:7 can be on another.
    Other benefits are that 1) you can support the option of
    overriding the default sampling-rate on an interface-by-interface
    basis, and 2) this is how most sFlow implementations are coded,
    so there will be no surprises or interoperability issues with any
    sFlow collectors out there.
This commit implements the approach suggested by Neil.
This commit uses an atomic_t to represent the sampling pool.  This is
because we do want access to it to be atomic, but we expect that it will
"mostly" be accessed from a single CPU at a time.  Perhaps this is a bad
assumption; we can always switch to another form of synchronization later.
CC: Neil McKee <neil.mckee@inmon.com>
											
										 
											2010-01-20 13:52:42 -08:00
										 |  |  |     SFLSampler *sampler; | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  |     unsigned int left; | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     struct nlattr *a; | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  |     size_t n_outputs; | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     /* Build a flow sample */ | 
					
						
							|  |  |  |     memset(&fs, 0, sizeof fs); | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     fs.input = ofproto_sflow_odp_port_to_ifindex(os, flow->in_port); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     fs.output = 0;              /* Filled in correctly below. */ | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     fs.sample_pool = upcall->sample_pool; | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | 
 | 
					
						
							| 
									
										
											  
											
												sflow: Fix sFlow sampling structure.
According to Neil McKee, in an email archived at
http://openvswitch.org/pipermail/dev_openvswitch.org/2010-January/000934.html:
    The containment rule is that a given sflow-datasource (sampler or
    poller) should be scoped within only one sflow-agent (or
    sub-agent).  So the issue arrises when you have two
    switches/datapaths defined on the same host being managed with
    the same IP address: each switch is a separate sub-agent, so they
    can run independently (e.g. with their own sequence numbers) but
    they can't both claim to speak for the same sflow-datasource.
    Specifically, they can't both represent the <ifindex>:0
    data-source.  This containment rule is necessary so that the
    sFlow collector can scale and combine the results accurately.
    One option would be to stick with the <ifindex>:0 data-source but
    elevate it to be global across all bridges, with a global
    sample_pool and a global sflow_agent.  Not tempting.  Better to
    go the other way and allow each interface to have it's own
    sampler, just as it already has it's own poller.  The ifIndex
    numbers are globally unique across all switches/datapaths on the
    host, so the containment is now clean.  Datasource <ifindex>:5
    might be on one switch, whille <ifindex>:7 can be on another.
    Other benefits are that 1) you can support the option of
    overriding the default sampling-rate on an interface-by-interface
    basis, and 2) this is how most sFlow implementations are coded,
    so there will be no surprises or interoperability issues with any
    sFlow collectors out there.
This commit implements the approach suggested by Neil.
This commit uses an atomic_t to represent the sampling pool.  This is
because we do want access to it to be atomic, but we expect that it will
"mostly" be accessed from a single CPU at a time.  Perhaps this is a bad
assumption; we can always switch to another form of synchronization later.
CC: Neil McKee <neil.mckee@inmon.com>
											
										 
											2010-01-20 13:52:42 -08:00
										 |  |  |     /* We are going to give it to the sampler that represents this input port.
 | 
					
						
							|  |  |  |      * By implementing "ingress-only" sampling like this we ensure that we | 
					
						
							|  |  |  |      * never have to offer the same sample to more than one sampler. */ | 
					
						
							|  |  |  |     sampler = sfl_agent_getSamplerByIfIndex(os->sflow_agent, fs.input); | 
					
						
							|  |  |  |     if (!sampler) { | 
					
						
							|  |  |  |         VLOG_WARN_RL(&rl, "no sampler for input ifIndex (%"PRIu32")", | 
					
						
							|  |  |  |                      fs.input); | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     /* Sampled header. */ | 
					
						
							|  |  |  |     memset(&hdrElem, 0, sizeof hdrElem); | 
					
						
							|  |  |  |     hdrElem.tag = SFLFLOW_HEADER; | 
					
						
							|  |  |  |     header = &hdrElem.flowType.header; | 
					
						
							|  |  |  |     header->header_protocol = SFLHEADER_ETHERNET_ISO8023; | 
					
						
							| 
									
										
										
										
											2010-05-05 13:24:03 -07:00
										 |  |  |     /* The frame_length should include the Ethernet FCS (4 bytes),
 | 
					
						
							|  |  |  |        but it has already been stripped,  so we need to add 4 here. */ | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     header->frame_length = upcall->packet->size + 4; | 
					
						
							| 
									
										
										
										
											2010-05-05 13:24:03 -07:00
										 |  |  |     /* Ethernet FCS stripped off. */ | 
					
						
							|  |  |  |     header->stripped = 4; | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     header->header_length = MIN(upcall->packet->size, | 
					
						
							|  |  |  |                                 sampler->sFlowFsMaximumHeaderSize); | 
					
						
							|  |  |  |     header->header_bytes = upcall->packet->data; | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     /* Add extended switch element. */ | 
					
						
							|  |  |  |     memset(&switchElem, 0, sizeof(switchElem)); | 
					
						
							|  |  |  |     switchElem.tag = SFLFLOW_EX_SWITCH; | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     switchElem.flowType.sw.src_vlan = vlan_tci_to_vid(flow->vlan_tci); | 
					
						
							|  |  |  |     switchElem.flowType.sw.src_priority = vlan_tci_to_pcp(flow->vlan_tci); | 
					
						
							| 
									
										
										
										
											2010-05-05 13:24:27 -07:00
										 |  |  |      /* Initialize the output VLAN and priority to be the same as the input,
 | 
					
						
							|  |  |  |         but these fields can be overriden below if affected by an action. */ | 
					
						
							|  |  |  |     switchElem.flowType.sw.dst_vlan = switchElem.flowType.sw.src_vlan; | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     switchElem.flowType.sw.dst_priority = switchElem.flowType.sw.src_priority; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Figure out the output ports. */ | 
					
						
							|  |  |  |     n_outputs = 0; | 
					
						
							| 
									
										
											  
											
												datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other.  To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace.  This means that userspace can intelligently figure out
what to do:
   - If userspace's notion of the flow for the packet matches the kernel's,
     then nothing special is necessary.
   - If the kernel has a more specific notion for the flow than userspace,
     for example if the kernel decoded IPv6 headers but userspace stopped
     at the Ethernet type (because it does not understand IPv6), then again
     nothing special is necessary: userspace can still set up the flow in
     the usual way.
   - If userspace has a more specific notion for the flow than the kernel,
     for example if userspace decoded an IPv6 header but the kernel
     stopped at the Ethernet type, then userspace can forward the packet
     manually, without setting up a flow in the kernel.  (This case is
     bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently.  This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes.  The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace.  I'm not entirely pleased with how I did it.  I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome.  Not changing anything wasn't an option,
unfortunately.  At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace.  But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
											
										 
											2011-01-24 14:59:57 -08:00
										 |  |  |     NL_ATTR_FOR_EACH_UNSAFE (a, left, upcall->actions, upcall->actions_len) { | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  |         ovs_be16 tci; | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  |         switch (nl_attr_type(a)) { | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         case ODPAT_OUTPUT: | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  |             fs.output = ofproto_sflow_odp_port_to_ifindex(os, | 
					
						
							|  |  |  |                                                           nl_attr_get_u32(a)); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |             n_outputs++; | 
					
						
							|  |  |  |             break; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 16:26:21 -07:00
										 |  |  |         case ODPAT_SET_DL_TCI: | 
					
						
							| 
									
										
										
										
											2010-12-10 10:40:58 -08:00
										 |  |  |             tci = nl_attr_get_be16(a); | 
					
						
							| 
									
										
										
										
											2010-10-18 11:18:10 -07:00
										 |  |  |             switchElem.flowType.sw.dst_vlan = vlan_tci_to_vid(tci); | 
					
						
							|  |  |  |             switchElem.flowType.sw.dst_priority = vlan_tci_to_pcp(tci); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |             break; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         default: | 
					
						
							|  |  |  |             break; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2010-01-11 11:09:43 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     /* Set output port, as defined by http://www.sflow.org/sflow_version_5.txt
 | 
					
						
							|  |  |  |        (search for "Input/output port information"). */ | 
					
						
							| 
									
										
										
										
											2010-01-08 16:10:01 -08:00
										 |  |  |     if (!n_outputs) { | 
					
						
							|  |  |  |         /* This value indicates that the packet was dropped for an unknown
 | 
					
						
							|  |  |  |          * reason. */ | 
					
						
							|  |  |  |         fs.output = 0x40000000 | 256; | 
					
						
							|  |  |  |     } else if (n_outputs > 1 || !fs.output) { | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |         /* Setting the high bit means "multiple output ports". */ | 
					
						
							|  |  |  |         fs.output = 0x80000000 | n_outputs; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /* Submit the flow sample to be encoded into the next datagram. */ | 
					
						
							|  |  |  |     SFLADD_ELEMENT(&fs, &hdrElem); | 
					
						
							|  |  |  |     SFLADD_ELEMENT(&fs, &switchElem); | 
					
						
							|  |  |  |     sfl_sampler_writeFlowSample(sampler, &fs); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_run(struct ofproto_sflow *os) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (ofproto_sflow_is_enabled(os)) { | 
					
						
							|  |  |  |         time_t now = time_now(); | 
					
						
							|  |  |  |         if (now >= os->next_tick) { | 
					
						
							| 
									
										
										
										
											2010-06-08 17:18:48 -07:00
										 |  |  |             sfl_agent_tick(os->sflow_agent, time_wall()); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |             os->next_tick = now + 1; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void | 
					
						
							|  |  |  | ofproto_sflow_wait(struct ofproto_sflow *os) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (ofproto_sflow_is_enabled(os)) { | 
					
						
							| 
									
										
										
										
											2010-05-12 12:53:07 -07:00
										 |  |  |         poll_timer_wait_until(os->next_tick * 1000LL); | 
					
						
							| 
									
										
										
										
											2010-01-04 13:08:37 -08:00
										 |  |  |     } | 
					
						
							|  |  |  | } |