1 /* 2 * Copyright (c) 2015, Mellanox Technologies. All rights reserved. 3 * 4 * This software is available to you under a choice of one of two 5 * licenses. You may choose to be licensed under the terms of the GNU 6 * General Public License (GPL) Version 2, available from the file 7 * COPYING in the main directory of this source tree, or the 8 * OpenIB.org BSD license below: 9 * 10 * Redistribution and use in source and binary forms, with or 11 * without modification, are permitted provided that the following 12 * conditions are met: 13 * 14 * - Redistributions of source code must retain the above 15 * copyright notice, this list of conditions and the following 16 * disclaimer. 17 * 18 * - Redistributions in binary form must reproduce the above 19 * copyright notice, this list of conditions and the following 20 * disclaimer in the documentation and/or other materials 21 * provided with the distribution. 22 * 23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30 * SOFTWARE. 31 */ 32 33 #ifndef _MLX5_FS_CORE_ 34 #define _MLX5_FS_CORE_ 35 36 #include <linux/refcount.h> 37 #include <linux/mlx5/fs.h> 38 #include <linux/rhashtable.h> 39 #include <linux/llist.h> 40 #include <steering/sws/fs_dr.h> 41 #include <steering/hws/fs_hws.h> 42 43 #define FDB_TC_MAX_CHAIN 3 44 #define FDB_FT_CHAIN (FDB_TC_MAX_CHAIN + 1) 45 #define FDB_TC_SLOW_PATH_CHAIN (FDB_FT_CHAIN + 1) 46 47 /* The index of the last real chain (FT) + 1 as chain zero is valid as well */ 48 #define FDB_NUM_CHAINS (FDB_FT_CHAIN + 1) 49 50 #define FDB_TC_MAX_PRIO 16 51 #define FDB_TC_LEVELS_PER_PRIO 2 52 53 struct mlx5_flow_definer { 54 enum mlx5_flow_namespace_type ns_type; 55 u32 id; 56 }; 57 58 enum mlx5_flow_resource_owner { 59 MLX5_FLOW_RESOURCE_OWNER_FW, 60 MLX5_FLOW_RESOURCE_OWNER_SW, 61 MLX5_FLOW_RESOURCE_OWNER_HWS, 62 }; 63 64 struct mlx5_modify_hdr { 65 enum mlx5_flow_namespace_type ns_type; 66 enum mlx5_flow_resource_owner owner; 67 union { 68 struct mlx5_fs_dr_action fs_dr_action; 69 struct mlx5_fs_hws_action fs_hws_action; 70 u32 id; 71 }; 72 }; 73 74 struct mlx5_pkt_reformat { 75 enum mlx5_flow_namespace_type ns_type; 76 int reformat_type; /* from mlx5_ifc */ 77 enum mlx5_flow_resource_owner owner; 78 union { 79 struct mlx5_fs_dr_action fs_dr_action; 80 struct mlx5_fs_hws_action fs_hws_action; 81 u32 id; 82 }; 83 }; 84 85 /* FS_TYPE_PRIO_CHAINS is a PRIO that will have namespaces only, 86 * and those are in parallel to one another when going over them to connect 87 * a new flow table. Meaning the last flow table in a TYPE_PRIO prio in one 88 * parallel namespace will not automatically connect to the first flow table 89 * found in any prio in any next namespace, but skip the entire containing 90 * TYPE_PRIO_CHAINS prio. 91 * 92 * This is used to implement tc chains, each chain of prios is a different 93 * namespace inside a containing TYPE_PRIO_CHAINS prio. 94 */ 95 96 enum fs_node_type { 97 FS_TYPE_NAMESPACE, 98 FS_TYPE_PRIO, 99 FS_TYPE_PRIO_CHAINS, 100 FS_TYPE_FLOW_TABLE, 101 FS_TYPE_FLOW_GROUP, 102 FS_TYPE_FLOW_ENTRY, 103 FS_TYPE_FLOW_DEST 104 }; 105 106 enum fs_flow_table_type { 107 FS_FT_NIC_RX = 0x0, 108 FS_FT_NIC_TX = 0x1, 109 FS_FT_ESW_EGRESS_ACL = 0x2, 110 FS_FT_ESW_INGRESS_ACL = 0x3, 111 FS_FT_FDB = 0X4, 112 FS_FT_SNIFFER_RX = 0X5, 113 FS_FT_SNIFFER_TX = 0X6, 114 FS_FT_RDMA_RX = 0X7, 115 FS_FT_RDMA_TX = 0X8, 116 FS_FT_PORT_SEL = 0X9, 117 FS_FT_FDB_RX = 0xa, 118 FS_FT_FDB_TX = 0xb, 119 FS_FT_RDMA_TRANSPORT_RX = 0xd, 120 FS_FT_RDMA_TRANSPORT_TX = 0xe, 121 FS_FT_MAX_TYPE = FS_FT_RDMA_TRANSPORT_TX, 122 }; 123 124 enum fs_flow_table_op_mod { 125 FS_FT_OP_MOD_NORMAL, 126 FS_FT_OP_MOD_LAG_DEMUX, 127 }; 128 129 enum fs_fte_status { 130 FS_FTE_STATUS_EXISTING = 1UL << 0, 131 }; 132 133 enum mlx5_flow_steering_mode { 134 MLX5_FLOW_STEERING_MODE_DMFS, 135 MLX5_FLOW_STEERING_MODE_SMFS, 136 MLX5_FLOW_STEERING_MODE_HMFS, 137 }; 138 139 enum mlx5_flow_steering_capabilty { 140 MLX5_FLOW_STEERING_CAP_VLAN_PUSH_ON_RX = 1UL << 0, 141 MLX5_FLOW_STEERING_CAP_VLAN_POP_ON_TX = 1UL << 1, 142 MLX5_FLOW_STEERING_CAP_MATCH_RANGES = 1UL << 2, 143 MLX5_FLOW_STEERING_CAP_DUPLICATE_MATCH = 1UL << 3, 144 }; 145 146 struct mlx5_flow_steering { 147 struct mlx5_core_dev *dev; 148 enum mlx5_flow_steering_mode mode; 149 struct kmem_cache *fgs_cache; 150 struct kmem_cache *ftes_cache; 151 struct mlx5_flow_root_namespace *root_ns; 152 struct mlx5_flow_root_namespace *fdb_root_ns; 153 struct mlx5_flow_namespace **fdb_sub_ns; 154 struct mlx5_flow_root_namespace **esw_egress_root_ns; 155 struct mlx5_flow_root_namespace **esw_ingress_root_ns; 156 struct mlx5_flow_root_namespace *sniffer_tx_root_ns; 157 struct mlx5_flow_root_namespace *sniffer_rx_root_ns; 158 struct mlx5_flow_root_namespace *rdma_rx_root_ns; 159 struct mlx5_flow_root_namespace *rdma_tx_root_ns; 160 struct mlx5_flow_root_namespace *egress_root_ns; 161 struct mlx5_flow_root_namespace *port_sel_root_ns; 162 int esw_egress_acl_vports; 163 int esw_ingress_acl_vports; 164 struct mlx5_flow_root_namespace **rdma_transport_rx_root_ns; 165 struct mlx5_flow_root_namespace **rdma_transport_tx_root_ns; 166 int rdma_transport_rx_vports; 167 int rdma_transport_tx_vports; 168 }; 169 170 struct fs_node { 171 struct list_head list; 172 struct list_head children; 173 enum fs_node_type type; 174 struct fs_node *parent; 175 struct fs_node *root; 176 /* lock the node for writing and traversing */ 177 struct rw_semaphore lock; 178 refcount_t refcount; 179 bool active; 180 void (*del_hw_func)(struct fs_node *); 181 void (*del_sw_func)(struct fs_node *); 182 atomic_t version; 183 }; 184 185 struct mlx5_flow_rule { 186 struct fs_node node; 187 struct mlx5_flow_table *ft; 188 struct mlx5_flow_destination dest_attr; 189 /* next_ft should be accessed under chain_lock and only of 190 * destination type is FWD_NEXT_fT. 191 */ 192 struct list_head next_ft; 193 u32 sw_action; 194 }; 195 196 struct mlx5_flow_handle { 197 int num_rules; 198 struct mlx5_flow_rule *rule[] __counted_by(num_rules); 199 }; 200 201 /* Type of children is mlx5_flow_group */ 202 struct mlx5_flow_table { 203 struct fs_node node; 204 union { 205 struct mlx5_fs_dr_table fs_dr_table; 206 struct mlx5_fs_hws_table fs_hws_table; 207 }; 208 u32 id; 209 u16 vport; 210 unsigned int max_fte; 211 unsigned int level; 212 enum fs_flow_table_type type; 213 enum fs_flow_table_op_mod op_mod; 214 struct { 215 bool active; 216 unsigned int required_groups; 217 unsigned int group_size; 218 unsigned int num_groups; 219 unsigned int max_fte; 220 } autogroup; 221 /* Protect fwd_rules */ 222 struct mutex lock; 223 /* FWD rules that point on this flow table */ 224 struct list_head fwd_rules; 225 u32 flags; 226 struct rhltable fgs_hash; 227 enum mlx5_flow_table_miss_action def_miss_action; 228 struct mlx5_flow_namespace *ns; 229 }; 230 231 struct mlx5_ft_underlay_qp { 232 struct list_head list; 233 u32 qpn; 234 }; 235 236 #define MLX5_FTE_MATCH_PARAM_RESERVED reserved_at_e00 237 /* Calculate the fte_match_param length and without the reserved length. 238 * Make sure the reserved field is the last. 239 */ 240 #define MLX5_ST_SZ_DW_MATCH_PARAM \ 241 ((MLX5_BYTE_OFF(fte_match_param, MLX5_FTE_MATCH_PARAM_RESERVED) / sizeof(u32)) + \ 242 BUILD_BUG_ON_ZERO(MLX5_ST_SZ_BYTES(fte_match_param) != \ 243 MLX5_FLD_SZ_BYTES(fte_match_param, \ 244 MLX5_FTE_MATCH_PARAM_RESERVED) +\ 245 MLX5_BYTE_OFF(fte_match_param, \ 246 MLX5_FTE_MATCH_PARAM_RESERVED))) 247 248 struct fs_fte_action { 249 int modify_mask; 250 u32 dests_size; 251 u32 fwd_dests; 252 struct mlx5_flow_context flow_context; 253 struct mlx5_flow_act action; 254 }; 255 256 struct fs_fte_dup { 257 struct list_head children; 258 struct fs_fte_action act_dests; 259 }; 260 261 /* Type of children is mlx5_flow_rule */ 262 struct fs_fte { 263 struct fs_node node; 264 union { 265 struct mlx5_fs_dr_rule fs_dr_rule; 266 struct mlx5_fs_hws_rule fs_hws_rule; 267 }; 268 u32 val[MLX5_ST_SZ_DW_MATCH_PARAM]; 269 struct fs_fte_action act_dests; 270 struct fs_fte_dup *dup; 271 u32 index; 272 enum fs_fte_status status; 273 struct rhash_head hash; 274 }; 275 276 /* Type of children is mlx5_flow_table/namespace */ 277 struct fs_prio { 278 struct fs_node node; 279 unsigned int num_levels; 280 unsigned int start_level; 281 unsigned int prio; 282 unsigned int num_ft; 283 }; 284 285 /* Type of children is fs_prio */ 286 struct mlx5_flow_namespace { 287 /* parent == NULL => root ns */ 288 struct fs_node node; 289 enum mlx5_flow_table_miss_action def_miss_action; 290 }; 291 292 struct mlx5_flow_group_mask { 293 u8 match_criteria_enable; 294 u32 match_criteria[MLX5_ST_SZ_DW_MATCH_PARAM]; 295 }; 296 297 /* Type of children is fs_fte */ 298 struct mlx5_flow_group { 299 struct fs_node node; 300 union { 301 struct mlx5_fs_dr_matcher fs_dr_matcher; 302 struct mlx5_fs_hws_matcher fs_hws_matcher; 303 }; 304 struct mlx5_flow_group_mask mask; 305 u32 start_index; 306 u32 max_ftes; 307 struct ida fte_allocator; 308 u32 id; 309 struct rhashtable ftes_hash; 310 struct rhlist_head hash; 311 }; 312 313 struct mlx5_flow_root_namespace { 314 struct mlx5_flow_namespace ns; 315 enum mlx5_flow_steering_mode mode; 316 union { 317 struct mlx5_fs_dr_domain fs_dr_domain; 318 struct mlx5_fs_hws_context fs_hws_context; 319 }; 320 enum fs_flow_table_type table_type; 321 struct mlx5_core_dev *dev; 322 struct mlx5_flow_table *root_ft; 323 /* Should be held when chaining flow tables */ 324 struct mutex chain_lock; 325 struct list_head underlay_qpns; 326 const struct mlx5_flow_cmds *cmds; 327 }; 328 329 enum mlx5_fc_type { 330 MLX5_FC_TYPE_ACQUIRED = 0, 331 MLX5_FC_TYPE_LOCAL, 332 }; 333 334 struct mlx5_fc_cache { 335 u64 packets; 336 u64 bytes; 337 u64 lastuse; 338 }; 339 340 struct mlx5_fc { 341 u32 id; 342 bool aging; 343 enum mlx5_fc_type type; 344 struct mlx5_fc_bulk *bulk; 345 struct mlx5_fc_cache cache; 346 /* last{packets,bytes} are used for calculating deltas since last reading. */ 347 u64 lastpackets; 348 u64 lastbytes; 349 }; 350 351 struct mlx5_fc_bulk { 352 struct mlx5_fs_bulk fs_bulk; 353 u32 base_id; 354 struct mlx5_fs_hws_data hws_data; 355 struct mlx5_fc fcs[]; 356 }; 357 358 u32 mlx5_fc_get_base_id(struct mlx5_fc *counter); 359 int mlx5_init_fc_stats(struct mlx5_core_dev *dev); 360 void mlx5_cleanup_fc_stats(struct mlx5_core_dev *dev); 361 void mlx5_fc_queue_stats_work(struct mlx5_core_dev *dev, 362 struct delayed_work *dwork, 363 unsigned long delay); 364 void mlx5_fc_update_sampling_interval(struct mlx5_core_dev *dev, 365 unsigned long interval); 366 367 const struct mlx5_flow_cmds *mlx5_fs_cmd_get_fw_cmds(void); 368 369 int mlx5_flow_namespace_set_peer(struct mlx5_flow_root_namespace *ns, 370 struct mlx5_flow_root_namespace *peer_ns, 371 u16 peer_vhca_id); 372 373 int mlx5_flow_namespace_set_mode(struct mlx5_flow_namespace *ns, 374 enum mlx5_flow_steering_mode mode); 375 376 int mlx5_fs_core_alloc(struct mlx5_core_dev *dev); 377 void mlx5_fs_core_free(struct mlx5_core_dev *dev); 378 int mlx5_fs_core_init(struct mlx5_core_dev *dev); 379 void mlx5_fs_core_cleanup(struct mlx5_core_dev *dev); 380 381 int mlx5_fs_egress_acls_init(struct mlx5_core_dev *dev, int total_vports); 382 void mlx5_fs_egress_acls_cleanup(struct mlx5_core_dev *dev); 383 int mlx5_fs_ingress_acls_init(struct mlx5_core_dev *dev, int total_vports); 384 void mlx5_fs_ingress_acls_cleanup(struct mlx5_core_dev *dev); 385 386 u32 mlx5_fs_get_capabilities(struct mlx5_core_dev *dev, enum mlx5_flow_namespace_type type); 387 388 struct mlx5_flow_root_namespace *find_root(struct fs_node *node); 389 390 int mlx5_fs_get_packet_reformat_id(struct mlx5_pkt_reformat *pkt_reformat, 391 u32 *id); 392 393 #define fs_get_obj(v, _node) {v = container_of((_node), typeof(*v), node); } 394 395 #define fs_list_for_each_entry(pos, root) \ 396 list_for_each_entry(pos, root, node.list) 397 398 #define fs_list_for_each_entry_safe(pos, tmp, root) \ 399 list_for_each_entry_safe(pos, tmp, root, node.list) 400 401 #define fs_for_each_ns_or_ft_reverse(pos, prio) \ 402 list_for_each_entry_reverse(pos, &(prio)->node.children, list) 403 404 #define fs_for_each_ns_or_ft(pos, prio) \ 405 list_for_each_entry(pos, (&(prio)->node.children), list) 406 407 #define fs_for_each_prio(pos, ns) \ 408 fs_list_for_each_entry(pos, &(ns)->node.children) 409 410 #define fs_for_each_ns(pos, prio) \ 411 fs_list_for_each_entry(pos, &(prio)->node.children) 412 413 #define fs_for_each_ft(pos, prio) \ 414 fs_list_for_each_entry(pos, &(prio)->node.children) 415 416 #define fs_for_each_ft_safe(pos, tmp, prio) \ 417 fs_list_for_each_entry_safe(pos, tmp, &(prio)->node.children) 418 419 #define fs_for_each_fg(pos, ft) \ 420 fs_list_for_each_entry(pos, &(ft)->node.children) 421 422 #define fs_for_each_fte(pos, fg) \ 423 fs_list_for_each_entry(pos, &(fg)->node.children) 424 425 #define fs_for_each_dst(pos, fte) \ 426 fs_list_for_each_entry(pos, &(fte)->node.children) 427 428 #define MLX5_CAP_FLOWTABLE_TYPE(mdev, cap, type) ( \ 429 (type == FS_FT_NIC_RX) ? MLX5_CAP_FLOWTABLE_NIC_RX(mdev, cap) : \ 430 (type == FS_FT_NIC_TX) ? MLX5_CAP_FLOWTABLE_NIC_TX(mdev, cap) : \ 431 (type == FS_FT_ESW_EGRESS_ACL) ? MLX5_CAP_ESW_EGRESS_ACL(mdev, cap) : \ 432 (type == FS_FT_ESW_INGRESS_ACL) ? MLX5_CAP_ESW_INGRESS_ACL(mdev, cap) : \ 433 (type == FS_FT_FDB) ? MLX5_CAP_ESW_FLOWTABLE_FDB(mdev, cap) : \ 434 (type == FS_FT_SNIFFER_RX) ? MLX5_CAP_FLOWTABLE_SNIFFER_RX(mdev, cap) : \ 435 (type == FS_FT_SNIFFER_TX) ? MLX5_CAP_FLOWTABLE_SNIFFER_TX(mdev, cap) : \ 436 (type == FS_FT_RDMA_RX) ? MLX5_CAP_FLOWTABLE_RDMA_RX(mdev, cap) : \ 437 (type == FS_FT_RDMA_TX) ? MLX5_CAP_FLOWTABLE_RDMA_TX(mdev, cap) : \ 438 (type == FS_FT_PORT_SEL) ? MLX5_CAP_FLOWTABLE_PORT_SELECTION(mdev, cap) : \ 439 (type == FS_FT_FDB_RX) ? MLX5_CAP_ESW_FLOWTABLE_FDB(mdev, cap) : \ 440 (type == FS_FT_FDB_TX) ? MLX5_CAP_ESW_FLOWTABLE_FDB(mdev, cap) : \ 441 (type == FS_FT_RDMA_TRANSPORT_RX) ? MLX5_CAP_FLOWTABLE_RDMA_TRANSPORT_RX(mdev, cap) : \ 442 (type == FS_FT_RDMA_TRANSPORT_TX) ? MLX5_CAP_FLOWTABLE_RDMA_TRANSPORT_TX(mdev, cap) : \ 443 (BUILD_BUG_ON_ZERO(FS_FT_RDMA_TRANSPORT_TX != FS_FT_MAX_TYPE))\ 444 ) 445 446 #endif 447