mirror of
				https://github.com/openvswitch/ovs
				synced 2025-10-25 15:07:05 +00:00 
			
		
		
		
	datapath: Mega flow implementation
Add wildcarded flow support in the kernel datapath. Wildcarded flows can improve OVS flow set up performance by avoiding sending matching new flows to the user space program. The exact performance boost will largely depend on the wildcarded flow hit rate. In case all new flows hit wildcarded flows, the flow set up rate is within 5% of that of the Linux bridge module. Pravin has made significant contributions to this patch, including API clean ups and bug fixes. Co-authored-by: Pravin B Shelar <pshelar@nicira.com> Signed-off-by: Pravin B Shelar <pshelar@nicira.com> Signed-off-by: Andy Zhou <azhou@nicira.com> [jesse: Additional documentation, fix memory leak, and improve validation.] Signed-off-by: Jesse Gross <jesse@nicira.com>
This commit is contained in:
		| @@ -91,6 +91,46 @@ Often we ellipsize arguments not important to the discussion, e.g.: | ||||
|     in_port(1), eth(...), eth_type(0x0800), ipv4(...), tcp(...) | ||||
|  | ||||
|  | ||||
| Wildcarded flow key format | ||||
| -------------------------- | ||||
|  | ||||
| A wildcarded flow is described with two sequences of Netlink attributes | ||||
| passed over the Netlink socket. A flow key, exactly as described above, and an | ||||
| optional corresponding flow mask. | ||||
|  | ||||
| A wildcarded flow can represent a group of exact match flows. Each '1' bit | ||||
| in the mask specifies an exact match with the corresponding bit in the flow key. | ||||
| A '0' bit specifies a don't care bit, which will match either a '1' or '0' bit | ||||
| of an incoming packet. Using wildcarded flows can improve the flow set up rate | ||||
| by reducing the number of new flows that the user space program must process. | ||||
|  | ||||
| Support for the mask Netlink attribute is optional for both the kernel and user | ||||
| space program. The kernel can ignore the mask attribute, installing an exact | ||||
| match flow, or reduce the number of don't care bits in the kernel to less than | ||||
| what was specified by the user space program. In this case, variations in bits | ||||
| that the kernel does not implement will simply result in additional flow setups. | ||||
| The kernel module will also work with user space programs that neither support | ||||
| nor supply flow mask attributes. | ||||
|  | ||||
| Since the kernel may ignore or modify wildcard bits, it can be difficult for | ||||
| the userspace program to know exactly what matches are installed. There are | ||||
| two possible approaches: reactively install flows as they miss the kernel | ||||
| flow table (and therefore not attempt to determine wildcard changes at all) | ||||
| or use the kernel's response messages to determine the installed wildcards. | ||||
|  | ||||
| When interacting with userspace, the kernel should maintain the match portion | ||||
| of the key exactly as originally installed. This provides a handle to | ||||
| identify the flow for all future operations. However, when reporting the | ||||
| mask of an installed flow, the mask should include any restrictions imposed | ||||
| by the kernel. | ||||
|  | ||||
| The behavior when using overlapping wildcarded flows is undefined. It is the | ||||
| responsibility of the user space program to ensure that any incoming packet | ||||
| can match at most one flow, wildcarded or not. The current implementation | ||||
| performs best-effort detection of overlapping wildcarded flows and may reject | ||||
| some but not all of them. However, this behavior may change in future versions. | ||||
|  | ||||
|  | ||||
| Basic rule for evolving flow keys | ||||
| --------------------------------- | ||||
|  | ||||
|   | ||||
| @@ -1,5 +1,5 @@ | ||||
| /* | ||||
|  * Copyright (c) 2007-2012 Nicira, Inc. | ||||
|  * Copyright (c) 2007-2013 Nicira, Inc. | ||||
|  * | ||||
|  * This program is free software; you can redistribute it and/or | ||||
|  * modify it under the terms of version 2 of the GNU General Public | ||||
| @@ -173,7 +173,7 @@ static void destroy_dp_rcu(struct rcu_head *rcu) | ||||
| { | ||||
| 	struct datapath *dp = container_of(rcu, struct datapath, rcu); | ||||
|  | ||||
| 	ovs_flow_tbl_destroy((__force struct flow_table *)dp->table); | ||||
| 	ovs_flow_tbl_destroy((__force struct flow_table *)dp->table, false); | ||||
| 	free_percpu(dp->stats_percpu); | ||||
| 	release_net(ovs_dp_get_net(dp)); | ||||
| 	kfree(dp->ports); | ||||
| @@ -234,19 +234,18 @@ void ovs_dp_process_received_packet(struct vport *p, struct sk_buff *skb) | ||||
| 	struct sw_flow_key key; | ||||
| 	u64 *stats_counter; | ||||
| 	int error; | ||||
| 	int key_len; | ||||
|  | ||||
| 	stats = this_cpu_ptr(dp->stats_percpu); | ||||
|  | ||||
| 	/* Extract flow from 'skb' into 'key'. */ | ||||
| 	error = ovs_flow_extract(skb, p->port_no, &key, &key_len); | ||||
| 	error = ovs_flow_extract(skb, p->port_no, &key); | ||||
| 	if (unlikely(error)) { | ||||
| 		kfree_skb(skb); | ||||
| 		return; | ||||
| 	} | ||||
|  | ||||
| 	/* Look up flow. */ | ||||
| 	flow = ovs_flow_tbl_lookup(rcu_dereference(dp->table), &key, key_len); | ||||
| 	flow = ovs_flow_lookup(rcu_dereference(dp->table), &key); | ||||
| 	if (unlikely(!flow)) { | ||||
| 		struct dp_upcall_info upcall; | ||||
|  | ||||
| @@ -443,7 +442,7 @@ static int queue_userspace_packet(struct net *net, int dp_ifindex, | ||||
| 	upcall->dp_ifindex = dp_ifindex; | ||||
|  | ||||
| 	nla = nla_nest_start(user_skb, OVS_PACKET_ATTR_KEY); | ||||
| 	ovs_flow_to_nlattrs(upcall_info->key, user_skb); | ||||
| 	ovs_flow_to_nlattrs(upcall_info->key, upcall_info->key, user_skb); | ||||
| 	nla_nest_end(user_skb, nla); | ||||
|  | ||||
| 	if (upcall_info->userdata) | ||||
| @@ -476,7 +475,7 @@ static int flush_flows(struct datapath *dp) | ||||
|  | ||||
| 	rcu_assign_pointer(dp->table, new_table); | ||||
|  | ||||
| 	ovs_flow_tbl_deferred_destroy(old_table); | ||||
| 	ovs_flow_tbl_destroy(old_table, true); | ||||
| 	return 0; | ||||
| } | ||||
|  | ||||
| @@ -619,10 +618,12 @@ static int validate_tp_port(const struct sw_flow_key *flow_key) | ||||
| static int validate_and_copy_set_tun(const struct nlattr *attr, | ||||
| 				     struct sw_flow_actions **sfa) | ||||
| { | ||||
| 	struct ovs_key_ipv4_tunnel tun_key; | ||||
| 	struct sw_flow_match match; | ||||
| 	struct sw_flow_key key; | ||||
| 	int err, start; | ||||
|  | ||||
| 	err = ipv4_tun_from_nlattr(nla_data(attr), &tun_key); | ||||
| 	ovs_match_init(&match, &key, NULL); | ||||
| 	err = ipv4_tun_from_nlattr(nla_data(attr), &match, false); | ||||
| 	if (err) | ||||
| 		return err; | ||||
|  | ||||
| @@ -630,7 +631,8 @@ static int validate_and_copy_set_tun(const struct nlattr *attr, | ||||
| 	if (start < 0) | ||||
| 		return start; | ||||
|  | ||||
| 	err = add_action(sfa, OVS_KEY_ATTR_IPV4_TUNNEL, &tun_key, sizeof(tun_key)); | ||||
| 	err = add_action(sfa, OVS_KEY_ATTR_IPV4_TUNNEL, &match.key->tun_key, | ||||
| 			sizeof(match.key->tun_key)); | ||||
| 	add_nested_action_end(*sfa, start); | ||||
|  | ||||
| 	return err; | ||||
| @@ -871,7 +873,6 @@ static int ovs_packet_cmd_execute(struct sk_buff *skb, struct genl_info *info) | ||||
| 	struct ethhdr *eth; | ||||
| 	int len; | ||||
| 	int err; | ||||
| 	int key_len; | ||||
|  | ||||
| 	err = -EINVAL; | ||||
| 	if (!a[OVS_PACKET_ATTR_PACKET] || !a[OVS_PACKET_ATTR_KEY] || | ||||
| @@ -904,11 +905,11 @@ static int ovs_packet_cmd_execute(struct sk_buff *skb, struct genl_info *info) | ||||
| 	if (IS_ERR(flow)) | ||||
| 		goto err_kfree_skb; | ||||
|  | ||||
| 	err = ovs_flow_extract(packet, -1, &flow->key, &key_len); | ||||
| 	err = ovs_flow_extract(packet, -1, &flow->key); | ||||
| 	if (err) | ||||
| 		goto err_flow_free; | ||||
|  | ||||
| 	err = ovs_flow_metadata_from_nlattrs(flow, key_len, a[OVS_PACKET_ATTR_KEY]); | ||||
| 	err = ovs_flow_metadata_from_nlattrs(flow, a[OVS_PACKET_ATTR_KEY]); | ||||
| 	if (err) | ||||
| 		goto err_flow_free; | ||||
| 	acts = ovs_flow_actions_alloc(nla_len(a[OVS_PACKET_ATTR_ACTIONS])); | ||||
| @@ -936,13 +937,13 @@ static int ovs_packet_cmd_execute(struct sk_buff *skb, struct genl_info *info) | ||||
| 	local_bh_enable(); | ||||
| 	rcu_read_unlock(); | ||||
|  | ||||
| 	ovs_flow_free(flow); | ||||
| 	ovs_flow_free(flow, false); | ||||
| 	return err; | ||||
|  | ||||
| err_unlock: | ||||
| 	rcu_read_unlock(); | ||||
| err_flow_free: | ||||
| 	ovs_flow_free(flow); | ||||
| 	ovs_flow_free(flow, false); | ||||
| err_kfree_skb: | ||||
| 	kfree_skb(packet); | ||||
| err: | ||||
| @@ -1061,7 +1062,8 @@ static int set_action_to_attr(const struct nlattr *a, struct sk_buff *skb) | ||||
| 		if (!start) | ||||
| 			return -EMSGSIZE; | ||||
|  | ||||
| 		err = ipv4_tun_to_nlattr(skb, nla_data(ovs_key)); | ||||
| 		err = ipv4_tun_to_nlattr(skb, | ||||
| 				nla_data(ovs_key), nla_data(ovs_key)); | ||||
| 		if (err) | ||||
| 			return err; | ||||
| 		nla_nest_end(skb, start); | ||||
| @@ -1109,6 +1111,7 @@ static size_t ovs_flow_cmd_msg_size(const struct sw_flow_actions *acts) | ||||
| { | ||||
| 	return NLMSG_ALIGN(sizeof(struct ovs_header)) | ||||
| 		+ nla_total_size(key_attr_size()) /* OVS_FLOW_ATTR_KEY */ | ||||
| 		+ nla_total_size(key_attr_size()) /* OVS_FLOW_ATTR_MASK */ | ||||
| 		+ nla_total_size(sizeof(struct ovs_flow_stats)) /* OVS_FLOW_ATTR_STATS */ | ||||
| 		+ nla_total_size(1) /* OVS_FLOW_ATTR_TCP_FLAGS */ | ||||
| 		+ nla_total_size(8) /* OVS_FLOW_ATTR_USED */ | ||||
| @@ -1138,14 +1141,28 @@ static int ovs_flow_cmd_fill_info(struct sw_flow *flow, struct datapath *dp, | ||||
|  | ||||
| 	ovs_header->dp_ifindex = get_dpifindex(dp); | ||||
|  | ||||
| 	/* Fill flow key. */ | ||||
| 	nla = nla_nest_start(skb, OVS_FLOW_ATTR_KEY); | ||||
| 	if (!nla) | ||||
| 		goto nla_put_failure; | ||||
| 	err = ovs_flow_to_nlattrs(&flow->key, skb); | ||||
|  | ||||
| 	err = ovs_flow_to_nlattrs(&flow->unmasked_key, | ||||
| 			&flow->unmasked_key, skb); | ||||
| 	if (err) | ||||
| 		goto error; | ||||
| 	nla_nest_end(skb, nla); | ||||
|  | ||||
| 	nla = nla_nest_start(skb, OVS_FLOW_ATTR_MASK); | ||||
| 	if (!nla) | ||||
| 		goto nla_put_failure; | ||||
|  | ||||
| 	err = ovs_flow_to_nlattrs(&flow->key, | ||||
| 			&ovsl_dereference(flow->mask)->key, skb); | ||||
| 	if (err) | ||||
| 		goto error; | ||||
|  | ||||
| 	nla_nest_end(skb, nla); | ||||
|  | ||||
| 	spin_lock_bh(&flow->lock); | ||||
| 	used = flow->used; | ||||
| 	stats.n_packets = flow->packet_count; | ||||
| @@ -1229,19 +1246,23 @@ static int ovs_flow_cmd_new_or_set(struct sk_buff *skb, struct genl_info *info) | ||||
| 	struct nlattr **a = info->attrs; | ||||
| 	struct ovs_header *ovs_header = info->userhdr; | ||||
| 	struct sw_flow_key key; | ||||
| 	struct sw_flow *flow; | ||||
| 	struct sw_flow *flow = NULL; | ||||
| 	struct sw_flow_mask mask; | ||||
| 	struct sk_buff *reply; | ||||
| 	struct datapath *dp; | ||||
| 	struct flow_table *table; | ||||
| 	struct sw_flow_actions *acts = NULL; | ||||
| 	struct sw_flow_match match; | ||||
| 	int error; | ||||
| 	int key_len; | ||||
|  | ||||
| 	/* Extract key. */ | ||||
| 	error = -EINVAL; | ||||
| 	if (!a[OVS_FLOW_ATTR_KEY]) | ||||
| 		goto error; | ||||
| 	error = ovs_flow_from_nlattrs(&key, &key_len, a[OVS_FLOW_ATTR_KEY]); | ||||
|  | ||||
| 	ovs_match_init(&match, &key, &mask); | ||||
| 	error = ovs_match_from_nlattrs(&match, | ||||
| 			a[OVS_FLOW_ATTR_KEY], a[OVS_FLOW_ATTR_MASK]); | ||||
| 	if (error) | ||||
| 		goto error; | ||||
|  | ||||
| @@ -1267,8 +1288,11 @@ static int ovs_flow_cmd_new_or_set(struct sk_buff *skb, struct genl_info *info) | ||||
| 		goto err_unlock_ovs; | ||||
|  | ||||
| 	table = ovsl_dereference(dp->table); | ||||
| 	flow = ovs_flow_tbl_lookup(table, &key, key_len); | ||||
|  | ||||
| 	/* Check if this is a duplicate flow */ | ||||
| 	flow = ovs_flow_lookup(table, &key); | ||||
| 	if (!flow) { | ||||
| 		struct sw_flow_mask *mask_p; | ||||
| 		/* Bail out if we're not allowed to create a new flow. */ | ||||
| 		error = -ENOENT; | ||||
| 		if (info->genlhdr->cmd == OVS_FLOW_CMD_SET) | ||||
| @@ -1281,7 +1305,7 @@ static int ovs_flow_cmd_new_or_set(struct sk_buff *skb, struct genl_info *info) | ||||
| 			new_table = ovs_flow_tbl_expand(table); | ||||
| 			if (!IS_ERR(new_table)) { | ||||
| 				rcu_assign_pointer(dp->table, new_table); | ||||
| 				ovs_flow_tbl_deferred_destroy(table); | ||||
| 				ovs_flow_tbl_destroy(table, true); | ||||
| 				table = ovsl_dereference(dp->table); | ||||
| 			} | ||||
| 		} | ||||
| @@ -1294,18 +1318,37 @@ static int ovs_flow_cmd_new_or_set(struct sk_buff *skb, struct genl_info *info) | ||||
| 		} | ||||
| 		clear_stats(flow); | ||||
|  | ||||
| 		/* Make sure mask is unique in the system */ | ||||
| 		mask_p = ovs_sw_flow_mask_find(table, &mask); | ||||
| 		if (!mask_p) { | ||||
| 			/* Allocate a new mask if none exists. */ | ||||
| 			mask_p = ovs_sw_flow_mask_alloc(); | ||||
| 			if (!mask_p) | ||||
| 				goto err_flow_free; | ||||
| 			mask_p->key = mask.key; | ||||
| 			mask_p->range = mask.range; | ||||
| 			ovs_sw_flow_mask_insert(table, mask_p); | ||||
| 		} | ||||
|  | ||||
| 		ovs_sw_flow_mask_add_ref(mask_p); | ||||
| 		rcu_assign_pointer(flow->mask, mask_p); | ||||
| 		rcu_assign_pointer(flow->sf_acts, acts); | ||||
|  | ||||
| 		/* Put flow in bucket. */ | ||||
| 		ovs_flow_tbl_insert(table, flow, &key, key_len); | ||||
| 		ovs_flow_insert(table, flow, &key, match.range.end); | ||||
|  | ||||
| 		reply = ovs_flow_cmd_build_info(flow, dp, info->snd_portid, | ||||
| 						info->snd_seq, | ||||
| 						OVS_FLOW_CMD_NEW); | ||||
| 						info->snd_seq, OVS_FLOW_CMD_NEW); | ||||
| 	} else { | ||||
| 		/* We found a matching flow. */ | ||||
| 		struct sw_flow_actions *old_acts; | ||||
|  | ||||
| 		/* Make sure it has the same unmasked key. */ | ||||
| 		if (!ovs_flow_cmp_unmasked_key(flow, &key, match.range.end)) { | ||||
| 			error = -EINVAL; | ||||
| 			goto err_unlock_ovs; | ||||
| 		} | ||||
|  | ||||
| 		/* Bail out if we're not allowed to modify an existing flow. | ||||
| 		 * We accept NLM_F_CREATE in place of the intended NLM_F_EXCL | ||||
| 		 * because Generic Netlink treats the latter as a dump | ||||
| @@ -1341,6 +1384,8 @@ static int ovs_flow_cmd_new_or_set(struct sk_buff *skb, struct genl_info *info) | ||||
| 				ovs_dp_flow_multicast_group.id,	PTR_ERR(reply)); | ||||
| 	return 0; | ||||
|  | ||||
| err_flow_free: | ||||
| 	ovs_flow_free(flow, false); | ||||
| err_unlock_ovs: | ||||
| 	ovs_unlock(); | ||||
| err_kfree: | ||||
| @@ -1358,12 +1403,14 @@ static int ovs_flow_cmd_get(struct sk_buff *skb, struct genl_info *info) | ||||
| 	struct sw_flow *flow; | ||||
| 	struct datapath *dp; | ||||
| 	struct flow_table *table; | ||||
| 	struct sw_flow_match match; | ||||
| 	int err; | ||||
| 	int key_len; | ||||
|  | ||||
| 	if (!a[OVS_FLOW_ATTR_KEY]) | ||||
| 		return -EINVAL; | ||||
| 	err = ovs_flow_from_nlattrs(&key, &key_len, a[OVS_FLOW_ATTR_KEY]); | ||||
|  | ||||
| 	ovs_match_init(&match, &key, NULL); | ||||
| 	err = ovs_match_from_nlattrs(&match, a[OVS_FLOW_ATTR_KEY], NULL); | ||||
| 	if (err) | ||||
| 		return err; | ||||
|  | ||||
| @@ -1375,7 +1422,7 @@ static int ovs_flow_cmd_get(struct sk_buff *skb, struct genl_info *info) | ||||
| 	} | ||||
|  | ||||
| 	table = ovsl_dereference(dp->table); | ||||
| 	flow = ovs_flow_tbl_lookup(table, &key, key_len); | ||||
| 	flow = ovs_flow_lookup_unmasked_key(table, &match); | ||||
| 	if (!flow) { | ||||
| 		err = -ENOENT; | ||||
| 		goto unlock; | ||||
| @@ -1404,8 +1451,8 @@ static int ovs_flow_cmd_del(struct sk_buff *skb, struct genl_info *info) | ||||
| 	struct sw_flow *flow; | ||||
| 	struct datapath *dp; | ||||
| 	struct flow_table *table; | ||||
| 	struct sw_flow_match match; | ||||
| 	int err; | ||||
| 	int key_len; | ||||
|  | ||||
| 	ovs_lock(); | ||||
| 	dp = get_dp(sock_net(skb->sk), ovs_header->dp_ifindex); | ||||
| @@ -1418,12 +1465,14 @@ static int ovs_flow_cmd_del(struct sk_buff *skb, struct genl_info *info) | ||||
| 		err = flush_flows(dp); | ||||
| 		goto unlock; | ||||
| 	} | ||||
| 	err = ovs_flow_from_nlattrs(&key, &key_len, a[OVS_FLOW_ATTR_KEY]); | ||||
|  | ||||
| 	ovs_match_init(&match, &key, NULL); | ||||
| 	err = ovs_match_from_nlattrs(&match, a[OVS_FLOW_ATTR_KEY], NULL); | ||||
| 	if (err) | ||||
| 		goto unlock; | ||||
|  | ||||
| 	table = ovsl_dereference(dp->table); | ||||
| 	flow = ovs_flow_tbl_lookup(table, &key, key_len); | ||||
| 	flow = ovs_flow_lookup_unmasked_key(table, &match); | ||||
| 	if (!flow) { | ||||
| 		err = -ENOENT; | ||||
| 		goto unlock; | ||||
| @@ -1435,13 +1484,13 @@ static int ovs_flow_cmd_del(struct sk_buff *skb, struct genl_info *info) | ||||
| 		goto unlock; | ||||
| 	} | ||||
|  | ||||
| 	ovs_flow_tbl_remove(table, flow); | ||||
| 	ovs_flow_remove(table, flow); | ||||
|  | ||||
| 	err = ovs_flow_cmd_fill_info(flow, dp, reply, info->snd_portid, | ||||
| 				     info->snd_seq, 0, OVS_FLOW_CMD_DEL); | ||||
| 	BUG_ON(err < 0); | ||||
|  | ||||
| 	ovs_flow_deferred_free(flow); | ||||
| 	ovs_flow_free(flow, true); | ||||
| 	ovs_unlock(); | ||||
|  | ||||
| 	ovs_notify(reply, info, &ovs_dp_flow_multicast_group); | ||||
| @@ -1472,7 +1521,7 @@ static int ovs_flow_cmd_dump(struct sk_buff *skb, struct netlink_callback *cb) | ||||
|  | ||||
| 		bucket = cb->args[0]; | ||||
| 		obj = cb->args[1]; | ||||
| 		flow = ovs_flow_tbl_next(table, &bucket, &obj); | ||||
| 		flow = ovs_flow_dump_next(table, &bucket, &obj); | ||||
| 		if (!flow) | ||||
| 			break; | ||||
|  | ||||
| @@ -1705,7 +1754,7 @@ err_destroy_ports_array: | ||||
| err_destroy_percpu: | ||||
| 	free_percpu(dp->stats_percpu); | ||||
| err_destroy_table: | ||||
| 	ovs_flow_tbl_destroy(ovsl_dereference(dp->table)); | ||||
| 	ovs_flow_tbl_destroy(ovsl_dereference(dp->table), false); | ||||
| err_free_dp: | ||||
| 	release_net(ovs_dp_get_net(dp)); | ||||
| 	kfree(dp); | ||||
| @@ -2357,7 +2406,7 @@ static void rehash_flow_table(struct work_struct *work) | ||||
| 			new_table = ovs_flow_tbl_rehash(old_table); | ||||
| 			if (!IS_ERR(new_table)) { | ||||
| 				rcu_assign_pointer(dp->table, new_table); | ||||
| 				ovs_flow_tbl_deferred_destroy(old_table); | ||||
| 				ovs_flow_tbl_destroy(old_table, true); | ||||
| 			} | ||||
| 		} | ||||
| 	} | ||||
|   | ||||
							
								
								
									
										1278
									
								
								datapath/flow.c
									
									
									
									
									
								
							
							
						
						
									
										1278
									
								
								datapath/flow.c
									
									
									
									
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -1,5 +1,5 @@ | ||||
| /* | ||||
|  * Copyright (c) 2007-2011 Nicira, Inc. | ||||
|  * Copyright (c) 2007-2013 Nicira, Inc. | ||||
|  * | ||||
|  * This program is free software; you can redistribute it and/or | ||||
|  * modify it under the terms of version 2 of the GNU General Public | ||||
| @@ -33,6 +33,8 @@ | ||||
| #include <net/inet_ecn.h> | ||||
|  | ||||
| struct sk_buff; | ||||
| struct sw_flow_mask; | ||||
| struct flow_table; | ||||
|  | ||||
| struct sw_flow_actions { | ||||
| 	struct rcu_head rcu; | ||||
| @@ -120,6 +122,8 @@ struct sw_flow { | ||||
| 	u32 hash; | ||||
|  | ||||
| 	struct sw_flow_key key; | ||||
| 	struct sw_flow_key unmasked_key; | ||||
| 	struct sw_flow_mask __rcu *mask; | ||||
| 	struct sw_flow_actions __rcu *sf_acts; | ||||
|  | ||||
| 	spinlock_t lock;	/* Lock for values below. */ | ||||
| @@ -129,6 +133,25 @@ struct sw_flow { | ||||
| 	u8 tcp_flags;		/* Union of seen TCP flags. */ | ||||
| }; | ||||
|  | ||||
| struct sw_flow_key_range { | ||||
| 	size_t start; | ||||
| 	size_t end; | ||||
| }; | ||||
|  | ||||
| static inline u16 ovs_sw_flow_key_range_actual_size(const struct sw_flow_key_range *range) | ||||
| { | ||||
| 	return range->end - range->start; | ||||
| } | ||||
|  | ||||
| struct sw_flow_match { | ||||
| 	struct sw_flow_key *key; | ||||
| 	struct sw_flow_key_range range; | ||||
| 	struct sw_flow_mask *mask; | ||||
| }; | ||||
|  | ||||
| void ovs_match_init(struct sw_flow_match *match, | ||||
| 		struct sw_flow_key *key, struct sw_flow_mask *mask); | ||||
|  | ||||
| struct arp_eth_header { | ||||
| 	__be16      ar_hrd;	/* format of hardware address   */ | ||||
| 	__be16      ar_pro;	/* format of protocol address   */ | ||||
| @@ -148,21 +171,21 @@ void ovs_flow_exit(void); | ||||
|  | ||||
| struct sw_flow *ovs_flow_alloc(void); | ||||
| void ovs_flow_deferred_free(struct sw_flow *); | ||||
| void ovs_flow_free(struct sw_flow *); | ||||
| void ovs_flow_free(struct sw_flow *, bool deferred); | ||||
|  | ||||
| struct sw_flow_actions *ovs_flow_actions_alloc(int actions_len); | ||||
| void ovs_flow_deferred_free_acts(struct sw_flow_actions *); | ||||
|  | ||||
| int ovs_flow_extract(struct sk_buff *, u16 in_port, struct sw_flow_key *, | ||||
| 		     int *key_lenp); | ||||
| int ovs_flow_extract(struct sk_buff *, u16 in_port, struct sw_flow_key *); | ||||
| void ovs_flow_used(struct sw_flow *, struct sk_buff *); | ||||
| u64 ovs_flow_used_time(unsigned long flow_jiffies); | ||||
|  | ||||
| int ovs_flow_to_nlattrs(const struct sw_flow_key *, struct sk_buff *); | ||||
| int ovs_flow_from_nlattrs(struct sw_flow_key *swkey, int *key_lenp, | ||||
| int ovs_flow_to_nlattrs(const struct sw_flow_key *, | ||||
| 		const struct sw_flow_key *, struct sk_buff *); | ||||
| int ovs_match_from_nlattrs(struct sw_flow_match *match, | ||||
| 		      const struct nlattr *, | ||||
| 		      const struct nlattr *); | ||||
| int ovs_flow_metadata_from_nlattrs(struct sw_flow *flow, int key_len, | ||||
| 				   const struct nlattr *attr); | ||||
| int ovs_flow_metadata_from_nlattrs(struct sw_flow *flow, | ||||
| 		const struct nlattr *attr); | ||||
|  | ||||
| #define MAX_ACTIONS_BUFSIZE	(32 * 1024) | ||||
| #define TBL_MIN_BUCKETS		1024 | ||||
| @@ -171,6 +194,7 @@ struct flow_table { | ||||
| 	struct flex_array *buckets; | ||||
| 	unsigned int count, n_buckets; | ||||
| 	struct rcu_head rcu; | ||||
| 	struct list_head mask_list; | ||||
| 	int node_ver; | ||||
| 	u32 hash_seed; | ||||
| 	bool keep_flows; | ||||
| @@ -186,22 +210,55 @@ static inline int ovs_flow_tbl_need_to_expand(struct flow_table *table) | ||||
| 	return (table->count > table->n_buckets); | ||||
| } | ||||
|  | ||||
| struct sw_flow *ovs_flow_tbl_lookup(struct flow_table *table, | ||||
| 				    struct sw_flow_key *key, int len); | ||||
| void ovs_flow_tbl_destroy(struct flow_table *table); | ||||
| void ovs_flow_tbl_deferred_destroy(struct flow_table *table); | ||||
| struct sw_flow *ovs_flow_lookup(struct flow_table *, | ||||
| 				const struct sw_flow_key *); | ||||
| struct sw_flow *ovs_flow_lookup_unmasked_key(struct flow_table *table, | ||||
| 				    struct sw_flow_match *match); | ||||
|  | ||||
| void ovs_flow_tbl_destroy(struct flow_table *table, bool deferred); | ||||
| struct flow_table *ovs_flow_tbl_alloc(int new_size); | ||||
| struct flow_table *ovs_flow_tbl_expand(struct flow_table *table); | ||||
| struct flow_table *ovs_flow_tbl_rehash(struct flow_table *table); | ||||
| void ovs_flow_tbl_insert(struct flow_table *table, struct sw_flow *flow, | ||||
| 			 struct sw_flow_key *key, int key_len); | ||||
| void ovs_flow_tbl_remove(struct flow_table *table, struct sw_flow *flow); | ||||
| void ovs_flow_insert(struct flow_table *table, struct sw_flow *flow, | ||||
| 		const struct sw_flow_key *key, int key_len); | ||||
|  | ||||
| struct sw_flow *ovs_flow_tbl_next(struct flow_table *table, u32 *bucket, u32 *idx); | ||||
| void ovs_flow_remove(struct flow_table *table, struct sw_flow *flow); | ||||
|  | ||||
| struct sw_flow *ovs_flow_dump_next(struct flow_table *table, u32 *bucket, u32 *idx); | ||||
| extern const int ovs_key_lens[OVS_KEY_ATTR_MAX + 1]; | ||||
| int ipv4_tun_from_nlattr(const struct nlattr *attr, | ||||
| 			 struct ovs_key_ipv4_tunnel *tun_key); | ||||
| 			 struct sw_flow_match *match, bool is_mask); | ||||
| int ipv4_tun_to_nlattr(struct sk_buff *skb, | ||||
| 			const struct ovs_key_ipv4_tunnel *tun_key); | ||||
| 			const struct ovs_key_ipv4_tunnel *tun_key, | ||||
| 			const struct ovs_key_ipv4_tunnel *output); | ||||
|  | ||||
| bool ovs_flow_cmp_unmasked_key(const struct sw_flow *flow, | ||||
| 		const struct sw_flow_key *key, int key_len); | ||||
|  | ||||
| struct sw_flow_mask { | ||||
| 	int ref_count; | ||||
| 	struct rcu_head rcu; | ||||
| 	struct list_head list; | ||||
| 	struct sw_flow_key_range range; | ||||
| 	struct sw_flow_key key; | ||||
| }; | ||||
|  | ||||
| static inline u16 | ||||
| ovs_sw_flow_mask_actual_size(const struct sw_flow_mask *mask) | ||||
| { | ||||
| 	return ovs_sw_flow_key_range_actual_size(&mask->range); | ||||
| } | ||||
|  | ||||
| static inline u16 | ||||
| ovs_sw_flow_mask_size_roundup(const struct sw_flow_mask *mask) | ||||
| { | ||||
| 	return roundup(ovs_sw_flow_mask_actual_size(mask), sizeof(u32)); | ||||
| } | ||||
|  | ||||
| struct sw_flow_mask *ovs_sw_flow_mask_alloc(void); | ||||
| void ovs_sw_flow_mask_add_ref(struct sw_flow_mask *); | ||||
| void ovs_sw_flow_mask_del_ref(struct sw_flow_mask *, bool deferred); | ||||
| void ovs_sw_flow_mask_insert(struct flow_table *, struct sw_flow_mask *); | ||||
| struct sw_flow_mask *ovs_sw_flow_mask_find(const struct flow_table *, | ||||
| 		const struct sw_flow_mask *); | ||||
| #endif /* flow.h */ | ||||
|   | ||||
| @@ -1,5 +1,5 @@ | ||||
| /* | ||||
|  * Copyright (c) 2007-2011 Nicira, Inc. | ||||
|  * Copyright (c) 2007-2013 Nicira, Inc. | ||||
|  * | ||||
|  * This file is offered under your choice of two licenses: Apache 2.0 or GNU | ||||
|  * GPL 2.0 or later.  The permission statements for each of these licenses is | ||||
| @@ -410,6 +410,12 @@ struct ovs_key_nd { | ||||
|  * @OVS_FLOW_ATTR_CLEAR: If present in a %OVS_FLOW_CMD_SET request, clears the | ||||
|  * last-used time, accumulated TCP flags, and statistics for this flow. | ||||
|  * Otherwise ignored in requests.  Never present in notifications. | ||||
|  * @OVS_FLOW_ATTR_MASK: Nested %OVS_KEY_ATTR_* attributes specifying the | ||||
|  * mask bits for wildcarded flow match. Mask bit value '1' specifies exact | ||||
|  * match with corresponding flow key bit, while mask bit value '0' specifies | ||||
|  * a wildcarded match. Omitting an attribute within the mask is treated as | ||||
|  * wildcarding all corresponding fields. The mask itself is optional for all | ||||
|  * requests; if it is not present, all flow key bits are exact match bits. | ||||
|  * | ||||
|  * These attributes follow the &struct ovs_header within the Generic Netlink | ||||
|  * payload for %OVS_FLOW_* commands. | ||||
| @@ -422,6 +428,7 @@ enum ovs_flow_attr { | ||||
| 	OVS_FLOW_ATTR_TCP_FLAGS, /* 8-bit OR'd TCP flags. */ | ||||
| 	OVS_FLOW_ATTR_USED,      /* u64 msecs last used in monotonic time. */ | ||||
| 	OVS_FLOW_ATTR_CLEAR,     /* Flag to clear stats, tcp_flags, used. */ | ||||
| 	OVS_FLOW_ATTR_MASK,      /* Sequence of OVS_KEY_ATTR_* attributes. */ | ||||
| 	__OVS_FLOW_ATTR_MAX | ||||
| }; | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user