2009-06-15 15:11:30 -07:00
|
|
|
/*
|
2010-05-27 09:24:11 -07:00
|
|
|
* Copyright (c) 2009, 2010 Nicira Networks.
|
2009-06-15 15:11:30 -07:00
|
|
|
* Distributed under the terms of the GNU GPL version 2.
|
|
|
|
*
|
|
|
|
* Significant portions of this file may be copied from parts of the Linux
|
|
|
|
* kernel, by Linus Torvalds and others.
|
|
|
|
*/
|
|
|
|
|
2009-07-08 13:19:16 -07:00
|
|
|
#ifndef FLOW_H
|
|
|
|
#define FLOW_H 1
|
|
|
|
|
|
|
|
#include <linux/kernel.h>
|
2010-12-10 14:38:25 -08:00
|
|
|
#include <linux/netlink.h>
|
2009-07-08 13:19:16 -07:00
|
|
|
#include <linux/spinlock.h>
|
|
|
|
#include <linux/types.h>
|
|
|
|
#include <linux/rcupdate.h>
|
2010-08-24 16:00:27 -07:00
|
|
|
#include <linux/if_ether.h>
|
2010-07-15 19:22:07 -07:00
|
|
|
#include <linux/jiffies.h>
|
2010-05-27 09:24:11 -07:00
|
|
|
#include <linux/time.h>
|
2009-07-08 13:19:16 -07:00
|
|
|
|
|
|
|
#include "openvswitch/datapath-protocol.h"
|
2010-04-02 16:46:18 -04:00
|
|
|
#include "table.h"
|
2009-07-08 13:19:16 -07:00
|
|
|
|
|
|
|
struct sk_buff;
|
|
|
|
|
|
|
|
struct sw_flow_actions {
|
|
|
|
struct rcu_head rcu;
|
2010-12-10 10:40:58 -08:00
|
|
|
u32 actions_len;
|
|
|
|
struct nlattr actions[];
|
2009-07-08 13:19:16 -07:00
|
|
|
};
|
|
|
|
|
2011-01-23 18:44:44 -08:00
|
|
|
struct sw_flow_key {
|
|
|
|
__be64 tun_id; /* Encapsulating tunnel ID. */
|
|
|
|
__be32 nw_src; /* IP source address. */
|
|
|
|
__be32 nw_dst; /* IP destination address. */
|
|
|
|
u16 in_port; /* Input switch port. */
|
|
|
|
__be16 dl_tci; /* 0 if no VLAN, VLAN_TAG_PRESENT set otherwise. */
|
|
|
|
__be16 dl_type; /* Ethernet frame type. */
|
|
|
|
__be16 tp_src; /* TCP/UDP source port. */
|
|
|
|
__be16 tp_dst; /* TCP/UDP destination port. */
|
|
|
|
u8 dl_src[ETH_ALEN]; /* Ethernet source address. */
|
|
|
|
u8 dl_dst[ETH_ALEN]; /* Ethernet destination address. */
|
|
|
|
u8 nw_proto; /* IP protocol or lower 8 bits of ARP opcode. */
|
|
|
|
u8 nw_tos; /* IP ToS (DSCP field, 6 bits). */
|
|
|
|
};
|
|
|
|
|
2009-07-08 13:19:16 -07:00
|
|
|
struct sw_flow {
|
|
|
|
struct rcu_head rcu;
|
2010-04-02 16:46:18 -04:00
|
|
|
struct tbl_node tbl_node;
|
|
|
|
|
2011-01-23 18:44:44 -08:00
|
|
|
struct sw_flow_key key;
|
2010-12-04 11:50:53 -08:00
|
|
|
struct sw_flow_actions __rcu *sf_acts;
|
2009-07-08 13:19:16 -07:00
|
|
|
|
2010-08-29 09:49:51 -07:00
|
|
|
atomic_t refcnt;
|
|
|
|
bool dead;
|
|
|
|
|
2009-07-08 13:19:16 -07:00
|
|
|
spinlock_t lock; /* Lock for values below. */
|
2010-07-15 19:22:07 -07:00
|
|
|
unsigned long used; /* Last used time (in jiffies). */
|
2009-07-08 13:19:16 -07:00
|
|
|
u64 packet_count; /* Number of packets matched. */
|
|
|
|
u64 byte_count; /* Number of bytes matched. */
|
|
|
|
u8 tcp_flags; /* Union of seen TCP flags. */
|
|
|
|
};
|
|
|
|
|
2010-08-24 16:00:27 -07:00
|
|
|
struct arp_eth_header
|
|
|
|
{
|
|
|
|
__be16 ar_hrd; /* format of hardware address */
|
|
|
|
__be16 ar_pro; /* format of protocol address */
|
|
|
|
unsigned char ar_hln; /* length of hardware address */
|
|
|
|
unsigned char ar_pln; /* length of protocol address */
|
|
|
|
__be16 ar_op; /* ARP opcode (command) */
|
|
|
|
|
|
|
|
/* Ethernet+IPv4 specific members. */
|
|
|
|
unsigned char ar_sha[ETH_ALEN]; /* sender hardware address */
|
|
|
|
unsigned char ar_sip[4]; /* sender IP address */
|
|
|
|
unsigned char ar_tha[ETH_ALEN]; /* target hardware address */
|
|
|
|
unsigned char ar_tip[4]; /* target IP address */
|
2010-12-11 23:29:22 -08:00
|
|
|
} __packed;
|
2010-08-24 16:00:27 -07:00
|
|
|
|
2010-07-26 18:46:27 -07:00
|
|
|
int flow_init(void);
|
|
|
|
void flow_exit(void);
|
2009-07-08 13:19:16 -07:00
|
|
|
|
2010-07-26 18:46:27 -07:00
|
|
|
struct sw_flow *flow_alloc(void);
|
2009-07-08 13:19:16 -07:00
|
|
|
void flow_deferred_free(struct sw_flow *);
|
2010-07-26 18:46:27 -07:00
|
|
|
void flow_free_tbl(struct tbl_node *);
|
|
|
|
|
2010-12-10 10:40:58 -08:00
|
|
|
struct sw_flow_actions *flow_actions_alloc(u32 actions_len);
|
2009-07-08 13:19:16 -07:00
|
|
|
void flow_deferred_free_acts(struct sw_flow_actions *);
|
2010-07-26 18:46:27 -07:00
|
|
|
|
2010-08-29 09:49:51 -07:00
|
|
|
void flow_hold(struct sw_flow *);
|
|
|
|
void flow_put(struct sw_flow *);
|
|
|
|
|
2011-01-23 18:44:44 -08:00
|
|
|
int flow_extract(struct sk_buff *, u16 in_port, struct sw_flow_key *, bool *is_frag);
|
2009-07-08 13:19:16 -07:00
|
|
|
void flow_used(struct sw_flow *, struct sk_buff *);
|
|
|
|
|
2011-01-23 18:44:44 -08:00
|
|
|
u32 flow_hash(const struct sw_flow_key *);
|
2010-04-02 16:46:18 -04:00
|
|
|
int flow_cmp(const struct tbl_node *, void *target);
|
2009-07-08 13:19:16 -07:00
|
|
|
|
2011-01-23 18:44:44 -08:00
|
|
|
/* By my calculations currently the longest valid nlattr-formatted flow key is
|
|
|
|
* 80 bytes long, so this leaves some safety margin.
|
|
|
|
*/
|
|
|
|
#define FLOW_BUFSIZE 96
|
|
|
|
|
datapath: Report kernel's flow key when passing packets up to userspace.
One of the goals for Open vSwitch is to decouple kernel and userspace
software, so that either one can be upgraded or rolled back independent of
the other. To do this in full generality, it must be possible to change
the kernel's idea of the flow key separately from the userspace version.
This commit takes one step in that direction by making the kernel report
its idea of the flow that a packet belongs to whenever it passes a packet
up to userspace. This means that userspace can intelligently figure out
what to do:
- If userspace's notion of the flow for the packet matches the kernel's,
then nothing special is necessary.
- If the kernel has a more specific notion for the flow than userspace,
for example if the kernel decoded IPv6 headers but userspace stopped
at the Ethernet type (because it does not understand IPv6), then again
nothing special is necessary: userspace can still set up the flow in
the usual way.
- If userspace has a more specific notion for the flow than the kernel,
for example if userspace decoded an IPv6 header but the kernel
stopped at the Ethernet type, then userspace can forward the packet
manually, without setting up a flow in the kernel. (This case is
bad from a performance point of view, but at least it is correct.)
This commit does not actually make userspace flexible enough to handle
changes in the kernel flow key structure, although userspace does now
have enough information to do that intelligently. This will have to wait
for later commits.
This commit is bigger than it would otherwise be because it is rolled
together with changing "struct odp_msg" to a sequence of Netlink
attributes. The alternative, to do each of those changes in a separate
patch, seemed like overkill because it meant that either we would have to
introduce and then kill off Netlink attributes for in_port and tun_id, if
Netlink conversion went first, or shove yet another variable-length header
into the stuff already after odp_msg, if adding the flow key to odp_msg
went first.
This commit will slow down performance of checksumming packets sent up to
userspace. I'm not entirely pleased with how I did it. I considered a
couple of alternatives, but none of them seemed that much better.
Suggestions welcome. Not changing anything wasn't an option,
unfortunately. At any rate some slowdown will become unavoidable when OVS
actually starts using Netlink instead of just Netlink framing.
(Actually, I thought of one option where we could avoid that: make
userspace do the checksum instead, by passing csum_start and csum_offset as
part of what goes to userspace. But that's not perfect either.)
Signed-off-by: Ben Pfaff <blp@nicira.com>
Acked-by: Jesse Gross <jesse@nicira.com>
2011-01-24 14:59:57 -08:00
|
|
|
u32 flow_to_nlattrs(const struct sw_flow_key *, struct sk_buff *);
|
2011-01-23 18:44:44 -08:00
|
|
|
int flow_copy_from_user(struct sw_flow_key *, const struct nlattr __user *ukey, u32 key_len);
|
|
|
|
int flow_copy_to_user(struct nlattr __user *ukey, const struct sw_flow_key *, u32 key_len);
|
|
|
|
|
2010-07-23 13:05:25 -07:00
|
|
|
static inline struct sw_flow *flow_cast(const struct tbl_node *node)
|
|
|
|
{
|
|
|
|
return container_of(node, struct sw_flow, tbl_node);
|
|
|
|
}
|
|
|
|
|
2009-07-08 13:19:16 -07:00
|
|
|
#endif /* flow.h */
|