1 /*
2  * Copyright (c) 2015, Mellanox Technologies. All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  */
32 
33 #ifndef _MLX5_FS_CORE_
34 #define _MLX5_FS_CORE_
35 
36 #include <linux/refcount.h>
37 #include <linux/mlx5/fs.h>
38 #include <linux/rhashtable.h>
39 #include <linux/llist.h>
40 #include <steering/fs_dr.h>
41 
/* FDB chain indices: FDB_TC_MAX_CHAIN is followed by the FT chain, which in
 * turn is followed by the slow path chain.
 */
#define FDB_TC_MAX_CHAIN	3
#define FDB_FT_CHAIN		(FDB_TC_MAX_CHAIN + 1)
#define FDB_TC_SLOW_PATH_CHAIN	(FDB_FT_CHAIN + 1)

/* Chain zero is a valid chain as well, so the number of chains is the index
 * of the last real chain (the FT chain) plus one.
 */
#define FDB_NUM_CHAINS		(FDB_FT_CHAIN + 1)

#define FDB_TC_MAX_PRIO		16
#define FDB_TC_LEVELS_PER_PRIO	2
51 
52 struct mlx5_flow_definer {
53 	enum mlx5_flow_namespace_type ns_type;
54 	u32 id;
55 };
56 
/* Owner tag stored in the 'owner' field of struct mlx5_modify_hdr and
 * struct mlx5_pkt_reformat.
 */
enum mlx5_flow_resource_owner {
	MLX5_FLOW_RESOURCE_OWNER_FW = 0,
	MLX5_FLOW_RESOURCE_OWNER_SW = 1,
};
61 
62 struct mlx5_modify_hdr {
63 	enum mlx5_flow_namespace_type ns_type;
64 	enum mlx5_flow_resource_owner owner;
65 	union {
66 		struct mlx5_fs_dr_action action;
67 		u32 id;
68 	};
69 };
70 
71 struct mlx5_pkt_reformat {
72 	enum mlx5_flow_namespace_type ns_type;
73 	int reformat_type; /* from mlx5_ifc */
74 	enum mlx5_flow_resource_owner owner;
75 	union {
76 		struct mlx5_fs_dr_action action;
77 		u32 id;
78 	};
79 };
80 
/* Kind of object a struct fs_node represents.
 *
 * FS_TYPE_PRIO_CHAINS is a prio that holds namespaces only. Those namespaces
 * are parallel to one another when they are walked to connect a new flow
 * table: the last flow table of a TYPE_PRIO prio in one parallel namespace is
 * not automatically connected to the first flow table found in any prio of
 * any following namespace; instead the entire containing TYPE_PRIO_CHAINS
 * prio is skipped.
 *
 * This is how tc chains are implemented: each chain of prios is a separate
 * namespace inside a containing TYPE_PRIO_CHAINS prio.
 */
enum fs_node_type {
	FS_TYPE_NAMESPACE	= 0,
	FS_TYPE_PRIO		= 1,
	FS_TYPE_PRIO_CHAINS	= 2,
	FS_TYPE_FLOW_TABLE	= 3,
	FS_TYPE_FLOW_GROUP	= 4,
	FS_TYPE_FLOW_ENTRY	= 5,
	FS_TYPE_FLOW_DEST	= 6,
};
101 
/* Flow table types. FS_FT_MAX_TYPE aliases the highest value; the
 * MLX5_CAP_FLOWTABLE_TYPE() macro in this file has a build-time check tied
 * to it, so keep both in sync when appending a type.
 */
enum fs_flow_table_type {
	FS_FT_NIC_RX		= 0x0,
	FS_FT_NIC_TX		= 0x1,
	FS_FT_ESW_EGRESS_ACL	= 0x2,
	FS_FT_ESW_INGRESS_ACL	= 0x3,
	FS_FT_FDB		= 0x4,
	FS_FT_SNIFFER_RX	= 0x5,
	FS_FT_SNIFFER_TX	= 0x6,
	FS_FT_RDMA_RX		= 0x7,
	FS_FT_RDMA_TX		= 0x8,
	FS_FT_PORT_SEL		= 0x9,
	FS_FT_FDB_RX		= 0xa,
	FS_FT_FDB_TX		= 0xb,
	FS_FT_MAX_TYPE		= FS_FT_FDB_TX,
};
117 
/* Value type of the 'op_mod' field of struct mlx5_flow_table. */
enum fs_flow_table_op_mod {
	FS_FT_OP_MOD_NORMAL	= 0,
	FS_FT_OP_MOD_LAG_DEMUX	= 1,
};
122 
/* Bit flags for the 'status' field of struct fs_fte. */
enum fs_fte_status {
	FS_FTE_STATUS_EXISTING	= 1UL << 0,	/* bit 0 */
};
126 
/* Steering mode, stored per struct mlx5_flow_steering and per
 * struct mlx5_flow_root_namespace.
 */
enum mlx5_flow_steering_mode {
	MLX5_FLOW_STEERING_MODE_DMFS = 0,
	MLX5_FLOW_STEERING_MODE_SMFS = 1,
};
131 
/* Flow steering capability bits; each enumerator occupies its own bit.
 * NOTE(review): the tag is spelled "capabilty"; it is left untouched here
 * because renaming it would affect every user of the tag.
 */
enum mlx5_flow_steering_capabilty {
	MLX5_FLOW_STEERING_CAP_VLAN_PUSH_ON_RX	= 1UL << 0,
	MLX5_FLOW_STEERING_CAP_VLAN_POP_ON_TX	= 1UL << 1,
	MLX5_FLOW_STEERING_CAP_MATCH_RANGES	= 1UL << 2,
	MLX5_FLOW_STEERING_CAP_DUPLICATE_MATCH	= 1UL << 3,
};
138 
139 struct mlx5_flow_steering {
140 	struct mlx5_core_dev *dev;
141 	enum   mlx5_flow_steering_mode	mode;
142 	struct kmem_cache		*fgs_cache;
143 	struct kmem_cache               *ftes_cache;
144 	struct mlx5_flow_root_namespace *root_ns;
145 	struct mlx5_flow_root_namespace *fdb_root_ns;
146 	struct mlx5_flow_namespace	**fdb_sub_ns;
147 	struct mlx5_flow_root_namespace **esw_egress_root_ns;
148 	struct mlx5_flow_root_namespace **esw_ingress_root_ns;
149 	struct mlx5_flow_root_namespace	*sniffer_tx_root_ns;
150 	struct mlx5_flow_root_namespace	*sniffer_rx_root_ns;
151 	struct mlx5_flow_root_namespace	*rdma_rx_root_ns;
152 	struct mlx5_flow_root_namespace	*rdma_tx_root_ns;
153 	struct mlx5_flow_root_namespace	*egress_root_ns;
154 	struct mlx5_flow_root_namespace	*port_sel_root_ns;
155 	int esw_egress_acl_vports;
156 	int esw_ingress_acl_vports;
157 };
158 
159 struct fs_node {
160 	struct list_head	list;
161 	struct list_head	children;
162 	enum fs_node_type	type;
163 	struct fs_node		*parent;
164 	struct fs_node		*root;
165 	/* lock the node for writing and traversing */
166 	struct rw_semaphore	lock;
167 	refcount_t		refcount;
168 	bool			active;
169 	void			(*del_hw_func)(struct fs_node *);
170 	void			(*del_sw_func)(struct fs_node *);
171 	atomic_t		version;
172 };
173 
174 struct mlx5_flow_rule {
175 	struct fs_node				node;
176 	struct mlx5_flow_table			*ft;
177 	struct mlx5_flow_destination		dest_attr;
178 	/* next_ft should be accessed under chain_lock and only of
179 	 * destination type is FWD_NEXT_fT.
180 	 */
181 	struct list_head			next_ft;
182 	u32					sw_action;
183 };
184 
185 struct mlx5_flow_handle {
186 	int num_rules;
187 	struct mlx5_flow_rule *rule[] __counted_by(num_rules);
188 };
189 
190 /* Type of children is mlx5_flow_group */
191 struct mlx5_flow_table {
192 	struct fs_node			node;
193 	struct mlx5_fs_dr_table		fs_dr_table;
194 	u32				id;
195 	u16				vport;
196 	unsigned int			max_fte;
197 	unsigned int			level;
198 	enum fs_flow_table_type		type;
199 	enum fs_flow_table_op_mod	op_mod;
200 	struct {
201 		bool			active;
202 		unsigned int		required_groups;
203 		unsigned int		group_size;
204 		unsigned int		num_groups;
205 		unsigned int		max_fte;
206 	} autogroup;
207 	/* Protect fwd_rules */
208 	struct mutex			lock;
209 	/* FWD rules that point on this flow table */
210 	struct list_head		fwd_rules;
211 	u32				flags;
212 	struct rhltable			fgs_hash;
213 	enum mlx5_flow_table_miss_action def_miss_action;
214 	struct mlx5_flow_namespace	*ns;
215 };
216 
217 struct mlx5_ft_underlay_qp {
218 	struct list_head list;
219 	u32 qpn;
220 };
221 
#define MLX5_FTE_MATCH_PARAM_RESERVED	reserved_at_e00
/* Length of fte_match_param in dwords, excluding the reserved field.
 *
 * The BUILD_BUG_ON_ZERO() term only serves as a build-time check that the
 * reserved field is the last one: its byte offset plus its size must equal
 * the size of the whole structure.
 */
#define MLX5_ST_SZ_DW_MATCH_PARAM					\
	((MLX5_BYTE_OFF(fte_match_param,				\
			MLX5_FTE_MATCH_PARAM_RESERVED) / sizeof(u32)) +	\
	 BUILD_BUG_ON_ZERO(MLX5_ST_SZ_BYTES(fte_match_param) !=		\
			   MLX5_BYTE_OFF(fte_match_param,		\
					 MLX5_FTE_MATCH_PARAM_RESERVED) + \
			   MLX5_FLD_SZ_BYTES(fte_match_param,		\
					     MLX5_FTE_MATCH_PARAM_RESERVED)))
233 
234 struct fs_fte_action {
235 	int				modify_mask;
236 	u32				dests_size;
237 	u32				fwd_dests;
238 	struct mlx5_flow_context	flow_context;
239 	struct mlx5_flow_act		action;
240 };
241 
242 struct fs_fte_dup {
243 	struct list_head children;
244 	struct fs_fte_action act_dests;
245 };
246 
247 /* Type of children is mlx5_flow_rule */
248 struct fs_fte {
249 	struct fs_node			node;
250 	struct mlx5_fs_dr_rule		fs_dr_rule;
251 	u32				val[MLX5_ST_SZ_DW_MATCH_PARAM];
252 	struct fs_fte_action		act_dests;
253 	struct fs_fte_dup		*dup;
254 	u32				index;
255 	enum fs_fte_status		status;
256 	struct rhash_head		hash;
257 };
258 
259 /* Type of children is mlx5_flow_table/namespace */
260 struct fs_prio {
261 	struct fs_node			node;
262 	unsigned int			num_levels;
263 	unsigned int			start_level;
264 	unsigned int			prio;
265 	unsigned int			num_ft;
266 };
267 
268 /* Type of children is fs_prio */
269 struct mlx5_flow_namespace {
270 	/* parent == NULL => root ns */
271 	struct	fs_node			node;
272 	enum mlx5_flow_table_miss_action def_miss_action;
273 };
274 
275 struct mlx5_flow_group_mask {
276 	u8	match_criteria_enable;
277 	u32	match_criteria[MLX5_ST_SZ_DW_MATCH_PARAM];
278 };
279 
280 /* Type of children is fs_fte */
281 struct mlx5_flow_group {
282 	struct fs_node			node;
283 	struct mlx5_fs_dr_matcher	fs_dr_matcher;
284 	struct mlx5_flow_group_mask	mask;
285 	u32				start_index;
286 	u32				max_ftes;
287 	struct ida			fte_allocator;
288 	u32				id;
289 	struct rhashtable		ftes_hash;
290 	struct rhlist_head		hash;
291 };
292 
293 struct mlx5_flow_root_namespace {
294 	struct mlx5_flow_namespace	ns;
295 	enum   mlx5_flow_steering_mode	mode;
296 	struct mlx5_fs_dr_domain	fs_dr_domain;
297 	enum   fs_flow_table_type	table_type;
298 	struct mlx5_core_dev		*dev;
299 	struct mlx5_flow_table		*root_ft;
300 	/* Should be held when chaining flow tables */
301 	struct mutex			chain_lock;
302 	struct list_head		underlay_qpns;
303 	const struct mlx5_flow_cmds	*cmds;
304 };
305 
306 int mlx5_init_fc_stats(struct mlx5_core_dev *dev);
307 void mlx5_cleanup_fc_stats(struct mlx5_core_dev *dev);
308 void mlx5_fc_queue_stats_work(struct mlx5_core_dev *dev,
309 			      struct delayed_work *dwork,
310 			      unsigned long delay);
311 void mlx5_fc_update_sampling_interval(struct mlx5_core_dev *dev,
312 				      unsigned long interval);
313 
314 const struct mlx5_flow_cmds *mlx5_fs_cmd_get_fw_cmds(void);
315 
316 int mlx5_flow_namespace_set_peer(struct mlx5_flow_root_namespace *ns,
317 				 struct mlx5_flow_root_namespace *peer_ns,
318 				 u16 peer_vhca_id);
319 
320 int mlx5_flow_namespace_set_mode(struct mlx5_flow_namespace *ns,
321 				 enum mlx5_flow_steering_mode mode);
322 
323 int mlx5_fs_core_alloc(struct mlx5_core_dev *dev);
324 void mlx5_fs_core_free(struct mlx5_core_dev *dev);
325 int mlx5_fs_core_init(struct mlx5_core_dev *dev);
326 void mlx5_fs_core_cleanup(struct mlx5_core_dev *dev);
327 
328 int mlx5_fs_egress_acls_init(struct mlx5_core_dev *dev, int total_vports);
329 void mlx5_fs_egress_acls_cleanup(struct mlx5_core_dev *dev);
330 int mlx5_fs_ingress_acls_init(struct mlx5_core_dev *dev, int total_vports);
331 void mlx5_fs_ingress_acls_cleanup(struct mlx5_core_dev *dev);
332 
333 u32 mlx5_fs_get_capabilities(struct mlx5_core_dev *dev, enum mlx5_flow_namespace_type type);
334 
335 struct mlx5_flow_root_namespace *find_root(struct fs_node *node);
336 
/* fs_get_obj - set @v to the object that embeds the fs_node @_node
 * @v:     pointer lvalue to assign; its pointee type must embed the fs_node
 *         as a member named 'node'
 * @_node: pointer to that embedded fs_node
 *
 * Wrapped in do { } while (0) so that the expansion is one statement and
 * "if (cond) fs_get_obj(a, b); else ..." parses as intended. @v is only
 * evaluated once at run time (the typeof() operand is not evaluated).
 */
#define fs_get_obj(v, _node)						\
	do {								\
		(v) = container_of((_node), typeof(*(v)), node);	\
	} while (0)
338 
/* Iterators over the fs_node hierarchy.
 *
 * The two fs_list_* forms walk an explicit list head whose entries embed
 * their fs_node as the member 'node'. The fs_for_each_* forms take a parent
 * object and walk its node.children list.
 */
#define fs_list_for_each_entry(pos, head) \
	list_for_each_entry(pos, head, node.list)

/* Same walk through list_for_each_entry_safe(), with @tmp as its cursor. */
#define fs_list_for_each_entry_safe(pos, tmp, head) \
	list_for_each_entry_safe(pos, tmp, head, node.list)

/* Children of @prio as bare fs_nodes (linked through their own 'list'
 * member), last to first.
 */
#define fs_for_each_ns_or_ft_reverse(pos, prio) \
	list_for_each_entry_reverse(pos, &(prio)->node.children, list)

/* Children of @prio as bare fs_nodes, first to last. */
#define fs_for_each_ns_or_ft(pos, prio) \
	list_for_each_entry(pos, (&(prio)->node.children), list)

/* Typed walks: @pos is a pointer to the child type, which embeds 'node'. */
#define fs_for_each_prio(pos, ns) \
	fs_list_for_each_entry(pos, &(ns)->node.children)

#define fs_for_each_ns(pos, prio) \
	fs_list_for_each_entry(pos, &(prio)->node.children)

#define fs_for_each_ft(pos, prio) \
	fs_list_for_each_entry(pos, &(prio)->node.children)

#define fs_for_each_ft_safe(pos, tmp, prio) \
	fs_list_for_each_entry_safe(pos, tmp, &(prio)->node.children)

#define fs_for_each_fg(pos, ft) \
	fs_list_for_each_entry(pos, &(ft)->node.children)

#define fs_for_each_fte(pos, fg) \
	fs_list_for_each_entry(pos, &(fg)->node.children)

#define fs_for_each_dst(pos, fte) \
	fs_list_for_each_entry(pos, &(fte)->node.children)
371 
/* MLX5_CAP_FLOWTABLE_TYPE - read capability @cap of @mdev through the
 * capability macro that matches flow table type @type.
 *
 * FS_FT_FDB, FS_FT_FDB_RX and FS_FT_FDB_TX all go through
 * MLX5_CAP_ESW_FLOWTABLE_FDB(). A @type that matches none of the listed
 * values falls through to the BUILD_BUG_ON_ZERO() term; that term also
 * breaks the build once FS_FT_FDB_TX is no longer FS_FT_MAX_TYPE, i.e. when
 * a type is appended to enum fs_flow_table_type without extending this chain.
 *
 * @type is parenthesized in every comparison so that an argument containing
 * a lower-precedence operator (e.g. a conditional expression) is compared as
 * a whole. It is still expanded once per comparison, so it must be free of
 * side effects.
 */
#define MLX5_CAP_FLOWTABLE_TYPE(mdev, cap, type) (				\
	((type) == FS_FT_NIC_RX) ? MLX5_CAP_FLOWTABLE_NIC_RX(mdev, cap) :	\
	((type) == FS_FT_NIC_TX) ? MLX5_CAP_FLOWTABLE_NIC_TX(mdev, cap) :	\
	((type) == FS_FT_ESW_EGRESS_ACL) ? MLX5_CAP_ESW_EGRESS_ACL(mdev, cap) : \
	((type) == FS_FT_ESW_INGRESS_ACL) ? MLX5_CAP_ESW_INGRESS_ACL(mdev, cap) : \
	((type) == FS_FT_FDB) ? MLX5_CAP_ESW_FLOWTABLE_FDB(mdev, cap) :		\
	((type) == FS_FT_SNIFFER_RX) ? MLX5_CAP_FLOWTABLE_SNIFFER_RX(mdev, cap) : \
	((type) == FS_FT_SNIFFER_TX) ? MLX5_CAP_FLOWTABLE_SNIFFER_TX(mdev, cap) : \
	((type) == FS_FT_RDMA_RX) ? MLX5_CAP_FLOWTABLE_RDMA_RX(mdev, cap) :	\
	((type) == FS_FT_RDMA_TX) ? MLX5_CAP_FLOWTABLE_RDMA_TX(mdev, cap) :	\
	((type) == FS_FT_PORT_SEL) ? MLX5_CAP_FLOWTABLE_PORT_SELECTION(mdev, cap) : \
	((type) == FS_FT_FDB_RX) ? MLX5_CAP_ESW_FLOWTABLE_FDB(mdev, cap) :	\
	((type) == FS_FT_FDB_TX) ? MLX5_CAP_ESW_FLOWTABLE_FDB(mdev, cap) :	\
	(BUILD_BUG_ON_ZERO(FS_FT_FDB_TX != FS_FT_MAX_TYPE))			\
	)
387 
388 #endif
389