cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

cxgb4_tc_flower.c (30179B)


      1/*
      2 * This file is part of the Chelsio T4/T5/T6 Ethernet driver for Linux.
      3 *
      4 * Copyright (c) 2017 Chelsio Communications, Inc. All rights reserved.
      5 *
      6 * This software is available to you under a choice of one of two
      7 * licenses.  You may choose to be licensed under the terms of the GNU
      8 * General Public License (GPL) Version 2, available from the file
      9 * COPYING in the main directory of this source tree, or the
     10 * OpenIB.org BSD license below:
     11 *
     12 *     Redistribution and use in source and binary forms, with or
     13 *     without modification, are permitted provided that the following
     14 *     conditions are met:
     15 *
     16 *      - Redistributions of source code must retain the above
     17 *        copyright notice, this list of conditions and the following
     18 *        disclaimer.
     19 *
     20 *      - Redistributions in binary form must reproduce the above
     21 *        copyright notice, this list of conditions and the following
     22 *        disclaimer in the documentation and/or other materials
     23 *        provided with the distribution.
     24 *
     25 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
     26 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
     27 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
     28 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
     29 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
     30 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
     31 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
     32 * SOFTWARE.
     33 */
     34
     35#include <net/tc_act/tc_mirred.h>
     36#include <net/tc_act/tc_pedit.h>
     37#include <net/tc_act/tc_gact.h>
     38#include <net/tc_act/tc_vlan.h>
     39
     40#include "cxgb4.h"
     41#include "cxgb4_filter.h"
     42#include "cxgb4_tc_flower.h"
     43
     44#define STATS_CHECK_PERIOD (HZ / 2)
     45
     46static struct ch_tc_pedit_fields pedits[] = {
     47	PEDIT_FIELDS(ETH_, DMAC_31_0, 4, dmac, 0),
     48	PEDIT_FIELDS(ETH_, DMAC_47_32, 2, dmac, 4),
     49	PEDIT_FIELDS(ETH_, SMAC_15_0, 2, smac, 0),
     50	PEDIT_FIELDS(ETH_, SMAC_47_16, 4, smac, 2),
     51	PEDIT_FIELDS(IP4_, SRC, 4, nat_fip, 0),
     52	PEDIT_FIELDS(IP4_, DST, 4, nat_lip, 0),
     53	PEDIT_FIELDS(IP6_, SRC_31_0, 4, nat_fip, 0),
     54	PEDIT_FIELDS(IP6_, SRC_63_32, 4, nat_fip, 4),
     55	PEDIT_FIELDS(IP6_, SRC_95_64, 4, nat_fip, 8),
     56	PEDIT_FIELDS(IP6_, SRC_127_96, 4, nat_fip, 12),
     57	PEDIT_FIELDS(IP6_, DST_31_0, 4, nat_lip, 0),
     58	PEDIT_FIELDS(IP6_, DST_63_32, 4, nat_lip, 4),
     59	PEDIT_FIELDS(IP6_, DST_95_64, 4, nat_lip, 8),
     60	PEDIT_FIELDS(IP6_, DST_127_96, 4, nat_lip, 12),
     61};
     62
     63static const struct cxgb4_natmode_config cxgb4_natmode_config_array[] = {
     64	/* Default supported NAT modes */
     65	{
     66		.chip = CHELSIO_T5,
     67		.flags = CXGB4_ACTION_NATMODE_NONE,
     68		.natmode = NAT_MODE_NONE,
     69	},
     70	{
     71		.chip = CHELSIO_T5,
     72		.flags = CXGB4_ACTION_NATMODE_DIP,
     73		.natmode = NAT_MODE_DIP,
     74	},
     75	{
     76		.chip = CHELSIO_T5,
     77		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_DPORT,
     78		.natmode = NAT_MODE_DIP_DP,
     79	},
     80	{
     81		.chip = CHELSIO_T5,
     82		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_DPORT |
     83			 CXGB4_ACTION_NATMODE_SIP,
     84		.natmode = NAT_MODE_DIP_DP_SIP,
     85	},
     86	{
     87		.chip = CHELSIO_T5,
     88		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_DPORT |
     89			 CXGB4_ACTION_NATMODE_SPORT,
     90		.natmode = NAT_MODE_DIP_DP_SP,
     91	},
     92	{
     93		.chip = CHELSIO_T5,
     94		.flags = CXGB4_ACTION_NATMODE_SIP | CXGB4_ACTION_NATMODE_SPORT,
     95		.natmode = NAT_MODE_SIP_SP,
     96	},
     97	{
     98		.chip = CHELSIO_T5,
     99		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SIP |
    100			 CXGB4_ACTION_NATMODE_SPORT,
    101		.natmode = NAT_MODE_DIP_SIP_SP,
    102	},
    103	{
    104		.chip = CHELSIO_T5,
    105		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SIP |
    106			 CXGB4_ACTION_NATMODE_DPORT |
    107			 CXGB4_ACTION_NATMODE_SPORT,
    108		.natmode = NAT_MODE_ALL,
    109	},
    110	/* T6+ can ignore L4 ports when they're disabled. */
    111	{
    112		.chip = CHELSIO_T6,
    113		.flags = CXGB4_ACTION_NATMODE_SIP,
    114		.natmode = NAT_MODE_SIP_SP,
    115	},
    116	{
    117		.chip = CHELSIO_T6,
    118		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SPORT,
    119		.natmode = NAT_MODE_DIP_DP_SP,
    120	},
    121	{
    122		.chip = CHELSIO_T6,
    123		.flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SIP,
    124		.natmode = NAT_MODE_ALL,
    125	},
    126};
    127
    128static void cxgb4_action_natmode_tweak(struct ch_filter_specification *fs,
    129				       u8 natmode_flags)
    130{
    131	u8 i = 0;
    132
    133	/* Translate the enabled NAT 4-tuple fields to one of the
    134	 * hardware supported NAT mode configurations. This ensures
    135	 * that we pick a valid combination, where the disabled fields
    136	 * do not get overwritten to 0.
    137	 */
    138	for (i = 0; i < ARRAY_SIZE(cxgb4_natmode_config_array); i++) {
    139		if (cxgb4_natmode_config_array[i].flags == natmode_flags) {
    140			fs->nat_mode = cxgb4_natmode_config_array[i].natmode;
    141			return;
    142		}
    143	}
    144}
    145
    146static struct ch_tc_flower_entry *allocate_flower_entry(void)
    147{
    148	struct ch_tc_flower_entry *new = kzalloc(sizeof(*new), GFP_KERNEL);
    149	if (new)
    150		spin_lock_init(&new->lock);
    151	return new;
    152}
    153
    154/* Must be called with either RTNL or rcu_read_lock */
    155static struct ch_tc_flower_entry *ch_flower_lookup(struct adapter *adap,
    156						   unsigned long flower_cookie)
    157{
    158	return rhashtable_lookup_fast(&adap->flower_tbl, &flower_cookie,
    159				      adap->flower_ht_params);
    160}
    161
    162static void cxgb4_process_flow_match(struct net_device *dev,
    163				     struct flow_rule *rule,
    164				     struct ch_filter_specification *fs)
    165{
    166	u16 addr_type = 0;
    167
    168	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_CONTROL)) {
    169		struct flow_match_control match;
    170
    171		flow_rule_match_control(rule, &match);
    172		addr_type = match.key->addr_type;
    173	} else if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IPV4_ADDRS)) {
    174		addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
    175	} else if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IPV6_ADDRS)) {
    176		addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
    177	}
    178
    179	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_BASIC)) {
    180		struct flow_match_basic match;
    181		u16 ethtype_key, ethtype_mask;
    182
    183		flow_rule_match_basic(rule, &match);
    184		ethtype_key = ntohs(match.key->n_proto);
    185		ethtype_mask = ntohs(match.mask->n_proto);
    186
    187		if (ethtype_key == ETH_P_ALL) {
    188			ethtype_key = 0;
    189			ethtype_mask = 0;
    190		}
    191
    192		if (ethtype_key == ETH_P_IPV6)
    193			fs->type = 1;
    194
    195		fs->val.ethtype = ethtype_key;
    196		fs->mask.ethtype = ethtype_mask;
    197		fs->val.proto = match.key->ip_proto;
    198		fs->mask.proto = match.mask->ip_proto;
    199	}
    200
    201	if (addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS) {
    202		struct flow_match_ipv4_addrs match;
    203
    204		flow_rule_match_ipv4_addrs(rule, &match);
    205		fs->type = 0;
    206		memcpy(&fs->val.lip[0], &match.key->dst, sizeof(match.key->dst));
    207		memcpy(&fs->val.fip[0], &match.key->src, sizeof(match.key->src));
    208		memcpy(&fs->mask.lip[0], &match.mask->dst, sizeof(match.mask->dst));
    209		memcpy(&fs->mask.fip[0], &match.mask->src, sizeof(match.mask->src));
    210
    211		/* also initialize nat_lip/fip to same values */
    212		memcpy(&fs->nat_lip[0], &match.key->dst, sizeof(match.key->dst));
    213		memcpy(&fs->nat_fip[0], &match.key->src, sizeof(match.key->src));
    214	}
    215
    216	if (addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS) {
    217		struct flow_match_ipv6_addrs match;
    218
    219		flow_rule_match_ipv6_addrs(rule, &match);
    220		fs->type = 1;
    221		memcpy(&fs->val.lip[0], match.key->dst.s6_addr,
    222		       sizeof(match.key->dst));
    223		memcpy(&fs->val.fip[0], match.key->src.s6_addr,
    224		       sizeof(match.key->src));
    225		memcpy(&fs->mask.lip[0], match.mask->dst.s6_addr,
    226		       sizeof(match.mask->dst));
    227		memcpy(&fs->mask.fip[0], match.mask->src.s6_addr,
    228		       sizeof(match.mask->src));
    229
    230		/* also initialize nat_lip/fip to same values */
    231		memcpy(&fs->nat_lip[0], match.key->dst.s6_addr,
    232		       sizeof(match.key->dst));
    233		memcpy(&fs->nat_fip[0], match.key->src.s6_addr,
    234		       sizeof(match.key->src));
    235	}
    236
    237	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_PORTS)) {
    238		struct flow_match_ports match;
    239
    240		flow_rule_match_ports(rule, &match);
    241		fs->val.lport = be16_to_cpu(match.key->dst);
    242		fs->mask.lport = be16_to_cpu(match.mask->dst);
    243		fs->val.fport = be16_to_cpu(match.key->src);
    244		fs->mask.fport = be16_to_cpu(match.mask->src);
    245
    246		/* also initialize nat_lport/fport to same values */
    247		fs->nat_lport = fs->val.lport;
    248		fs->nat_fport = fs->val.fport;
    249	}
    250
    251	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IP)) {
    252		struct flow_match_ip match;
    253
    254		flow_rule_match_ip(rule, &match);
    255		fs->val.tos = match.key->tos;
    256		fs->mask.tos = match.mask->tos;
    257	}
    258
    259	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ENC_KEYID)) {
    260		struct flow_match_enc_keyid match;
    261
    262		flow_rule_match_enc_keyid(rule, &match);
    263		fs->val.vni = be32_to_cpu(match.key->keyid);
    264		fs->mask.vni = be32_to_cpu(match.mask->keyid);
    265		if (fs->mask.vni) {
    266			fs->val.encap_vld = 1;
    267			fs->mask.encap_vld = 1;
    268		}
    269	}
    270
    271	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_VLAN)) {
    272		struct flow_match_vlan match;
    273		u16 vlan_tci, vlan_tci_mask;
    274
    275		flow_rule_match_vlan(rule, &match);
    276		vlan_tci = match.key->vlan_id | (match.key->vlan_priority <<
    277					       VLAN_PRIO_SHIFT);
    278		vlan_tci_mask = match.mask->vlan_id | (match.mask->vlan_priority <<
    279						     VLAN_PRIO_SHIFT);
    280		fs->val.ivlan = vlan_tci;
    281		fs->mask.ivlan = vlan_tci_mask;
    282
    283		fs->val.ivlan_vld = 1;
    284		fs->mask.ivlan_vld = 1;
    285
    286		/* Chelsio adapters use ivlan_vld bit to match vlan packets
    287		 * as 802.1Q. Also, when vlan tag is present in packets,
    288		 * ethtype match is used then to match on ethtype of inner
    289		 * header ie. the header following the vlan header.
    290		 * So, set the ivlan_vld based on ethtype info supplied by
    291		 * TC for vlan packets if its 802.1Q. And then reset the
    292		 * ethtype value else, hw will try to match the supplied
    293		 * ethtype value with ethtype of inner header.
    294		 */
    295		if (fs->val.ethtype == ETH_P_8021Q) {
    296			fs->val.ethtype = 0;
    297			fs->mask.ethtype = 0;
    298		}
    299	}
    300
    301	/* Match only packets coming from the ingress port where this
    302	 * filter will be created.
    303	 */
    304	fs->val.iport = netdev2pinfo(dev)->port_id;
    305	fs->mask.iport = ~0;
    306}
    307
    308static int cxgb4_validate_flow_match(struct net_device *dev,
    309				     struct flow_rule *rule)
    310{
    311	struct flow_dissector *dissector = rule->match.dissector;
    312	u16 ethtype_mask = 0;
    313	u16 ethtype_key = 0;
    314
    315	if (dissector->used_keys &
    316	    ~(BIT(FLOW_DISSECTOR_KEY_CONTROL) |
    317	      BIT(FLOW_DISSECTOR_KEY_BASIC) |
    318	      BIT(FLOW_DISSECTOR_KEY_IPV4_ADDRS) |
    319	      BIT(FLOW_DISSECTOR_KEY_IPV6_ADDRS) |
    320	      BIT(FLOW_DISSECTOR_KEY_PORTS) |
    321	      BIT(FLOW_DISSECTOR_KEY_ENC_KEYID) |
    322	      BIT(FLOW_DISSECTOR_KEY_VLAN) |
    323	      BIT(FLOW_DISSECTOR_KEY_IP))) {
    324		netdev_warn(dev, "Unsupported key used: 0x%x\n",
    325			    dissector->used_keys);
    326		return -EOPNOTSUPP;
    327	}
    328
    329	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_BASIC)) {
    330		struct flow_match_basic match;
    331
    332		flow_rule_match_basic(rule, &match);
    333		ethtype_key = ntohs(match.key->n_proto);
    334		ethtype_mask = ntohs(match.mask->n_proto);
    335	}
    336
    337	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IP)) {
    338		u16 eth_ip_type = ethtype_key & ethtype_mask;
    339		struct flow_match_ip match;
    340
    341		if (eth_ip_type != ETH_P_IP && eth_ip_type != ETH_P_IPV6) {
    342			netdev_err(dev, "IP Key supported only with IPv4/v6");
    343			return -EINVAL;
    344		}
    345
    346		flow_rule_match_ip(rule, &match);
    347		if (match.mask->ttl) {
    348			netdev_warn(dev, "ttl match unsupported for offload");
    349			return -EOPNOTSUPP;
    350		}
    351	}
    352
    353	return 0;
    354}
    355
    356static void offload_pedit(struct ch_filter_specification *fs, u32 val, u32 mask,
    357			  u8 field)
    358{
    359	u32 set_val = val & ~mask;
    360	u32 offset = 0;
    361	u8 size = 1;
    362	int i;
    363
    364	for (i = 0; i < ARRAY_SIZE(pedits); i++) {
    365		if (pedits[i].field == field) {
    366			offset = pedits[i].offset;
    367			size = pedits[i].size;
    368			break;
    369		}
    370	}
    371	memcpy((u8 *)fs + offset, &set_val, size);
    372}
    373
    374static void process_pedit_field(struct ch_filter_specification *fs, u32 val,
    375				u32 mask, u32 offset, u8 htype,
    376				u8 *natmode_flags)
    377{
    378	switch (htype) {
    379	case FLOW_ACT_MANGLE_HDR_TYPE_ETH:
    380		switch (offset) {
    381		case PEDIT_ETH_DMAC_31_0:
    382			fs->newdmac = 1;
    383			offload_pedit(fs, val, mask, ETH_DMAC_31_0);
    384			break;
    385		case PEDIT_ETH_DMAC_47_32_SMAC_15_0:
    386			if (~mask & PEDIT_ETH_DMAC_MASK)
    387				offload_pedit(fs, val, mask, ETH_DMAC_47_32);
    388			else
    389				offload_pedit(fs, val >> 16, mask >> 16,
    390					      ETH_SMAC_15_0);
    391			break;
    392		case PEDIT_ETH_SMAC_47_16:
    393			fs->newsmac = 1;
    394			offload_pedit(fs, val, mask, ETH_SMAC_47_16);
    395		}
    396		break;
    397	case FLOW_ACT_MANGLE_HDR_TYPE_IP4:
    398		switch (offset) {
    399		case PEDIT_IP4_SRC:
    400			offload_pedit(fs, val, mask, IP4_SRC);
    401			*natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
    402			break;
    403		case PEDIT_IP4_DST:
    404			offload_pedit(fs, val, mask, IP4_DST);
    405			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    406		}
    407		break;
    408	case FLOW_ACT_MANGLE_HDR_TYPE_IP6:
    409		switch (offset) {
    410		case PEDIT_IP6_SRC_31_0:
    411			offload_pedit(fs, val, mask, IP6_SRC_31_0);
    412			*natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
    413			break;
    414		case PEDIT_IP6_SRC_63_32:
    415			offload_pedit(fs, val, mask, IP6_SRC_63_32);
    416			*natmode_flags |=  CXGB4_ACTION_NATMODE_SIP;
    417			break;
    418		case PEDIT_IP6_SRC_95_64:
    419			offload_pedit(fs, val, mask, IP6_SRC_95_64);
    420			*natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
    421			break;
    422		case PEDIT_IP6_SRC_127_96:
    423			offload_pedit(fs, val, mask, IP6_SRC_127_96);
    424			*natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
    425			break;
    426		case PEDIT_IP6_DST_31_0:
    427			offload_pedit(fs, val, mask, IP6_DST_31_0);
    428			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    429			break;
    430		case PEDIT_IP6_DST_63_32:
    431			offload_pedit(fs, val, mask, IP6_DST_63_32);
    432			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    433			break;
    434		case PEDIT_IP6_DST_95_64:
    435			offload_pedit(fs, val, mask, IP6_DST_95_64);
    436			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    437			break;
    438		case PEDIT_IP6_DST_127_96:
    439			offload_pedit(fs, val, mask, IP6_DST_127_96);
    440			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    441		}
    442		break;
    443	case FLOW_ACT_MANGLE_HDR_TYPE_TCP:
    444		switch (offset) {
    445		case PEDIT_TCP_SPORT_DPORT:
    446			if (~mask & PEDIT_TCP_UDP_SPORT_MASK) {
    447				fs->nat_fport = val;
    448				*natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
    449			} else {
    450				fs->nat_lport = val >> 16;
    451				*natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
    452			}
    453		}
    454		break;
    455	case FLOW_ACT_MANGLE_HDR_TYPE_UDP:
    456		switch (offset) {
    457		case PEDIT_UDP_SPORT_DPORT:
    458			if (~mask & PEDIT_TCP_UDP_SPORT_MASK) {
    459				fs->nat_fport = val;
    460				*natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
    461			} else {
    462				fs->nat_lport = val >> 16;
    463				*natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
    464			}
    465		}
    466		break;
    467	}
    468}
    469
    470static int cxgb4_action_natmode_validate(struct adapter *adap, u8 natmode_flags,
    471					 struct netlink_ext_ack *extack)
    472{
    473	u8 i = 0;
    474
    475	/* Extract the NAT mode to enable based on what 4-tuple fields
    476	 * are enabled to be overwritten. This ensures that the
    477	 * disabled fields don't get overwritten to 0.
    478	 */
    479	for (i = 0; i < ARRAY_SIZE(cxgb4_natmode_config_array); i++) {
    480		const struct cxgb4_natmode_config *c;
    481
    482		c = &cxgb4_natmode_config_array[i];
    483		if (CHELSIO_CHIP_VERSION(adap->params.chip) >= c->chip &&
    484		    natmode_flags == c->flags)
    485			return 0;
    486	}
    487	NL_SET_ERR_MSG_MOD(extack, "Unsupported NAT mode 4-tuple combination");
    488	return -EOPNOTSUPP;
    489}
    490
    491void cxgb4_process_flow_actions(struct net_device *in,
    492				struct flow_action *actions,
    493				struct ch_filter_specification *fs)
    494{
    495	struct flow_action_entry *act;
    496	u8 natmode_flags = 0;
    497	int i;
    498
    499	flow_action_for_each(i, act, actions) {
    500		switch (act->id) {
    501		case FLOW_ACTION_ACCEPT:
    502			fs->action = FILTER_PASS;
    503			break;
    504		case FLOW_ACTION_DROP:
    505			fs->action = FILTER_DROP;
    506			break;
    507		case FLOW_ACTION_MIRRED:
    508		case FLOW_ACTION_REDIRECT: {
    509			struct net_device *out = act->dev;
    510			struct port_info *pi = netdev_priv(out);
    511
    512			fs->action = FILTER_SWITCH;
    513			fs->eport = pi->port_id;
    514			}
    515			break;
    516		case FLOW_ACTION_VLAN_POP:
    517		case FLOW_ACTION_VLAN_PUSH:
    518		case FLOW_ACTION_VLAN_MANGLE: {
    519			u8 prio = act->vlan.prio;
    520			u16 vid = act->vlan.vid;
    521			u16 vlan_tci = (prio << VLAN_PRIO_SHIFT) | vid;
    522			switch (act->id) {
    523			case FLOW_ACTION_VLAN_POP:
    524				fs->newvlan |= VLAN_REMOVE;
    525				break;
    526			case FLOW_ACTION_VLAN_PUSH:
    527				fs->newvlan |= VLAN_INSERT;
    528				fs->vlan = vlan_tci;
    529				break;
    530			case FLOW_ACTION_VLAN_MANGLE:
    531				fs->newvlan |= VLAN_REWRITE;
    532				fs->vlan = vlan_tci;
    533				break;
    534			default:
    535				break;
    536			}
    537			}
    538			break;
    539		case FLOW_ACTION_MANGLE: {
    540			u32 mask, val, offset;
    541			u8 htype;
    542
    543			htype = act->mangle.htype;
    544			mask = act->mangle.mask;
    545			val = act->mangle.val;
    546			offset = act->mangle.offset;
    547
    548			process_pedit_field(fs, val, mask, offset, htype,
    549					    &natmode_flags);
    550			}
    551			break;
    552		case FLOW_ACTION_QUEUE:
    553			fs->action = FILTER_PASS;
    554			fs->dirsteer = 1;
    555			fs->iq = act->queue.index;
    556			break;
    557		default:
    558			break;
    559		}
    560	}
    561	if (natmode_flags)
    562		cxgb4_action_natmode_tweak(fs, natmode_flags);
    563
    564}
    565
    566static bool valid_l4_mask(u32 mask)
    567{
    568	u16 hi, lo;
    569
    570	/* Either the upper 16-bits (SPORT) OR the lower
    571	 * 16-bits (DPORT) can be set, but NOT BOTH.
    572	 */
    573	hi = (mask >> 16) & 0xFFFF;
    574	lo = mask & 0xFFFF;
    575
    576	return hi && lo ? false : true;
    577}
    578
    579static bool valid_pedit_action(struct net_device *dev,
    580			       const struct flow_action_entry *act,
    581			       u8 *natmode_flags)
    582{
    583	u32 mask, offset;
    584	u8 htype;
    585
    586	htype = act->mangle.htype;
    587	mask = act->mangle.mask;
    588	offset = act->mangle.offset;
    589
    590	switch (htype) {
    591	case FLOW_ACT_MANGLE_HDR_TYPE_ETH:
    592		switch (offset) {
    593		case PEDIT_ETH_DMAC_31_0:
    594		case PEDIT_ETH_DMAC_47_32_SMAC_15_0:
    595		case PEDIT_ETH_SMAC_47_16:
    596			break;
    597		default:
    598			netdev_err(dev, "%s: Unsupported pedit field\n",
    599				   __func__);
    600			return false;
    601		}
    602		break;
    603	case FLOW_ACT_MANGLE_HDR_TYPE_IP4:
    604		switch (offset) {
    605		case PEDIT_IP4_SRC:
    606			*natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
    607			break;
    608		case PEDIT_IP4_DST:
    609			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    610			break;
    611		default:
    612			netdev_err(dev, "%s: Unsupported pedit field\n",
    613				   __func__);
    614			return false;
    615		}
    616		break;
    617	case FLOW_ACT_MANGLE_HDR_TYPE_IP6:
    618		switch (offset) {
    619		case PEDIT_IP6_SRC_31_0:
    620		case PEDIT_IP6_SRC_63_32:
    621		case PEDIT_IP6_SRC_95_64:
    622		case PEDIT_IP6_SRC_127_96:
    623			*natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
    624			break;
    625		case PEDIT_IP6_DST_31_0:
    626		case PEDIT_IP6_DST_63_32:
    627		case PEDIT_IP6_DST_95_64:
    628		case PEDIT_IP6_DST_127_96:
    629			*natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
    630			break;
    631		default:
    632			netdev_err(dev, "%s: Unsupported pedit field\n",
    633				   __func__);
    634			return false;
    635		}
    636		break;
    637	case FLOW_ACT_MANGLE_HDR_TYPE_TCP:
    638		switch (offset) {
    639		case PEDIT_TCP_SPORT_DPORT:
    640			if (!valid_l4_mask(~mask)) {
    641				netdev_err(dev, "%s: Unsupported mask for TCP L4 ports\n",
    642					   __func__);
    643				return false;
    644			}
    645			if (~mask & PEDIT_TCP_UDP_SPORT_MASK)
    646				*natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
    647			else
    648				*natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
    649			break;
    650		default:
    651			netdev_err(dev, "%s: Unsupported pedit field\n",
    652				   __func__);
    653			return false;
    654		}
    655		break;
    656	case FLOW_ACT_MANGLE_HDR_TYPE_UDP:
    657		switch (offset) {
    658		case PEDIT_UDP_SPORT_DPORT:
    659			if (!valid_l4_mask(~mask)) {
    660				netdev_err(dev, "%s: Unsupported mask for UDP L4 ports\n",
    661					   __func__);
    662				return false;
    663			}
    664			if (~mask & PEDIT_TCP_UDP_SPORT_MASK)
    665				*natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
    666			else
    667				*natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
    668			break;
    669		default:
    670			netdev_err(dev, "%s: Unsupported pedit field\n",
    671				   __func__);
    672			return false;
    673		}
    674		break;
    675	default:
    676		netdev_err(dev, "%s: Unsupported pedit type\n", __func__);
    677		return false;
    678	}
    679	return true;
    680}
    681
    682int cxgb4_validate_flow_actions(struct net_device *dev,
    683				struct flow_action *actions,
    684				struct netlink_ext_ack *extack,
    685				u8 matchall_filter)
    686{
    687	struct adapter *adap = netdev2adap(dev);
    688	struct flow_action_entry *act;
    689	bool act_redir = false;
    690	bool act_pedit = false;
    691	bool act_vlan = false;
    692	u8 natmode_flags = 0;
    693	int i;
    694
    695	if (!flow_action_basic_hw_stats_check(actions, extack))
    696		return -EOPNOTSUPP;
    697
    698	flow_action_for_each(i, act, actions) {
    699		switch (act->id) {
    700		case FLOW_ACTION_ACCEPT:
    701		case FLOW_ACTION_DROP:
    702			/* Do nothing */
    703			break;
    704		case FLOW_ACTION_MIRRED:
    705		case FLOW_ACTION_REDIRECT: {
    706			struct net_device *n_dev, *target_dev;
    707			bool found = false;
    708			unsigned int i;
    709
    710			if (act->id == FLOW_ACTION_MIRRED &&
    711			    !matchall_filter) {
    712				NL_SET_ERR_MSG_MOD(extack,
    713						   "Egress mirror action is only supported for tc-matchall");
    714				return -EOPNOTSUPP;
    715			}
    716
    717			target_dev = act->dev;
    718			for_each_port(adap, i) {
    719				n_dev = adap->port[i];
    720				if (target_dev == n_dev) {
    721					found = true;
    722					break;
    723				}
    724			}
    725
    726			/* If interface doesn't belong to our hw, then
    727			 * the provided output port is not valid
    728			 */
    729			if (!found) {
    730				netdev_err(dev, "%s: Out port invalid\n",
    731					   __func__);
    732				return -EINVAL;
    733			}
    734			act_redir = true;
    735			}
    736			break;
    737		case FLOW_ACTION_VLAN_POP:
    738		case FLOW_ACTION_VLAN_PUSH:
    739		case FLOW_ACTION_VLAN_MANGLE: {
    740			u16 proto = be16_to_cpu(act->vlan.proto);
    741
    742			switch (act->id) {
    743			case FLOW_ACTION_VLAN_POP:
    744				break;
    745			case FLOW_ACTION_VLAN_PUSH:
    746			case FLOW_ACTION_VLAN_MANGLE:
    747				if (proto != ETH_P_8021Q) {
    748					netdev_err(dev, "%s: Unsupported vlan proto\n",
    749						   __func__);
    750					return -EOPNOTSUPP;
    751				}
    752				break;
    753			default:
    754				netdev_err(dev, "%s: Unsupported vlan action\n",
    755					   __func__);
    756				return -EOPNOTSUPP;
    757			}
    758			act_vlan = true;
    759			}
    760			break;
    761		case FLOW_ACTION_MANGLE: {
    762			bool pedit_valid = valid_pedit_action(dev, act,
    763							      &natmode_flags);
    764
    765			if (!pedit_valid)
    766				return -EOPNOTSUPP;
    767			act_pedit = true;
    768			}
    769			break;
    770		case FLOW_ACTION_QUEUE:
    771			/* Do nothing. cxgb4_set_filter will validate */
    772			break;
    773		default:
    774			netdev_err(dev, "%s: Unsupported action\n", __func__);
    775			return -EOPNOTSUPP;
    776		}
    777	}
    778
    779	if ((act_pedit || act_vlan) && !act_redir) {
    780		netdev_err(dev, "%s: pedit/vlan rewrite invalid without egress redirect\n",
    781			   __func__);
    782		return -EINVAL;
    783	}
    784
    785	if (act_pedit) {
    786		int ret;
    787
    788		ret = cxgb4_action_natmode_validate(adap, natmode_flags,
    789						    extack);
    790		if (ret)
    791			return ret;
    792	}
    793
    794	return 0;
    795}
    796
    797static void cxgb4_tc_flower_hash_prio_add(struct adapter *adap, u32 tc_prio)
    798{
    799	spin_lock_bh(&adap->tids.ftid_lock);
    800	if (adap->tids.tc_hash_tids_max_prio < tc_prio)
    801		adap->tids.tc_hash_tids_max_prio = tc_prio;
    802	spin_unlock_bh(&adap->tids.ftid_lock);
    803}
    804
    805static void cxgb4_tc_flower_hash_prio_del(struct adapter *adap, u32 tc_prio)
    806{
    807	struct tid_info *t = &adap->tids;
    808	struct ch_tc_flower_entry *fe;
    809	struct rhashtable_iter iter;
    810	u32 found = 0;
    811
    812	spin_lock_bh(&t->ftid_lock);
    813	/* Bail if the current rule is not the one with the max
    814	 * prio.
    815	 */
    816	if (t->tc_hash_tids_max_prio != tc_prio)
    817		goto out_unlock;
    818
    819	/* Search for the next rule having the same or next lower
    820	 * max prio.
    821	 */
    822	rhashtable_walk_enter(&adap->flower_tbl, &iter);
    823	do {
    824		rhashtable_walk_start(&iter);
    825
    826		fe = rhashtable_walk_next(&iter);
    827		while (!IS_ERR_OR_NULL(fe)) {
    828			if (fe->fs.hash &&
    829			    fe->fs.tc_prio <= t->tc_hash_tids_max_prio) {
    830				t->tc_hash_tids_max_prio = fe->fs.tc_prio;
    831				found++;
    832
    833				/* Bail if we found another rule
    834				 * having the same prio as the
    835				 * current max one.
    836				 */
    837				if (fe->fs.tc_prio == tc_prio)
    838					break;
    839			}
    840
    841			fe = rhashtable_walk_next(&iter);
    842		}
    843
    844		rhashtable_walk_stop(&iter);
    845	} while (fe == ERR_PTR(-EAGAIN));
    846	rhashtable_walk_exit(&iter);
    847
    848	if (!found)
    849		t->tc_hash_tids_max_prio = 0;
    850
    851out_unlock:
    852	spin_unlock_bh(&t->ftid_lock);
    853}
    854
    855int cxgb4_flow_rule_replace(struct net_device *dev, struct flow_rule *rule,
    856			    u32 tc_prio, struct netlink_ext_ack *extack,
    857			    struct ch_filter_specification *fs, u32 *tid)
    858{
    859	struct adapter *adap = netdev2adap(dev);
    860	struct filter_ctx ctx;
    861	u8 inet_family;
    862	int fidx, ret;
    863
    864	if (cxgb4_validate_flow_actions(dev, &rule->action, extack, 0))
    865		return -EOPNOTSUPP;
    866
    867	if (cxgb4_validate_flow_match(dev, rule))
    868		return -EOPNOTSUPP;
    869
    870	cxgb4_process_flow_match(dev, rule, fs);
    871	cxgb4_process_flow_actions(dev, &rule->action, fs);
    872
    873	fs->hash = is_filter_exact_match(adap, fs);
    874	inet_family = fs->type ? PF_INET6 : PF_INET;
    875
    876	/* Get a free filter entry TID, where we can insert this new
    877	 * rule. Only insert rule if its prio doesn't conflict with
    878	 * existing rules.
    879	 */
    880	fidx = cxgb4_get_free_ftid(dev, inet_family, fs->hash,
    881				   tc_prio);
    882	if (fidx < 0) {
    883		NL_SET_ERR_MSG_MOD(extack,
    884				   "No free LETCAM index available");
    885		return -ENOMEM;
    886	}
    887
    888	if (fidx < adap->tids.nhpftids) {
    889		fs->prio = 1;
    890		fs->hash = 0;
    891	}
    892
    893	/* If the rule can be inserted into HASH region, then ignore
    894	 * the index to normal FILTER region.
    895	 */
    896	if (fs->hash)
    897		fidx = 0;
    898
    899	fs->tc_prio = tc_prio;
    900
    901	init_completion(&ctx.completion);
    902	ret = __cxgb4_set_filter(dev, fidx, fs, &ctx);
    903	if (ret) {
    904		netdev_err(dev, "%s: filter creation err %d\n",
    905			   __func__, ret);
    906		return ret;
    907	}
    908
    909	/* Wait for reply */
    910	ret = wait_for_completion_timeout(&ctx.completion, 10 * HZ);
    911	if (!ret)
    912		return -ETIMEDOUT;
    913
    914	/* Check if hw returned error for filter creation */
    915	if (ctx.result)
    916		return ctx.result;
    917
    918	*tid = ctx.tid;
    919
    920	if (fs->hash)
    921		cxgb4_tc_flower_hash_prio_add(adap, tc_prio);
    922
    923	return 0;
    924}
    925
    926int cxgb4_tc_flower_replace(struct net_device *dev,
    927			    struct flow_cls_offload *cls)
    928{
    929	struct flow_rule *rule = flow_cls_offload_flow_rule(cls);
    930	struct netlink_ext_ack *extack = cls->common.extack;
    931	struct adapter *adap = netdev2adap(dev);
    932	struct ch_tc_flower_entry *ch_flower;
    933	struct ch_filter_specification *fs;
    934	int ret;
    935
    936	ch_flower = allocate_flower_entry();
    937	if (!ch_flower) {
    938		netdev_err(dev, "%s: ch_flower alloc failed.\n", __func__);
    939		return -ENOMEM;
    940	}
    941
    942	fs = &ch_flower->fs;
    943	fs->hitcnts = 1;
    944	fs->tc_cookie = cls->cookie;
    945
    946	ret = cxgb4_flow_rule_replace(dev, rule, cls->common.prio, extack, fs,
    947				      &ch_flower->filter_id);
    948	if (ret)
    949		goto free_entry;
    950
    951	ch_flower->tc_flower_cookie = cls->cookie;
    952	ret = rhashtable_insert_fast(&adap->flower_tbl, &ch_flower->node,
    953				     adap->flower_ht_params);
    954	if (ret)
    955		goto del_filter;
    956
    957	return 0;
    958
    959del_filter:
    960	if (fs->hash)
    961		cxgb4_tc_flower_hash_prio_del(adap, cls->common.prio);
    962
    963	cxgb4_del_filter(dev, ch_flower->filter_id, &ch_flower->fs);
    964
    965free_entry:
    966	kfree(ch_flower);
    967	return ret;
    968}
    969
    970int cxgb4_flow_rule_destroy(struct net_device *dev, u32 tc_prio,
    971			    struct ch_filter_specification *fs, int tid)
    972{
    973	struct adapter *adap = netdev2adap(dev);
    974	u8 hash;
    975	int ret;
    976
    977	hash = fs->hash;
    978
    979	ret = cxgb4_del_filter(dev, tid, fs);
    980	if (ret)
    981		return ret;
    982
    983	if (hash)
    984		cxgb4_tc_flower_hash_prio_del(adap, tc_prio);
    985
    986	return ret;
    987}
    988
    989int cxgb4_tc_flower_destroy(struct net_device *dev,
    990			    struct flow_cls_offload *cls)
    991{
    992	struct adapter *adap = netdev2adap(dev);
    993	struct ch_tc_flower_entry *ch_flower;
    994	int ret;
    995
    996	ch_flower = ch_flower_lookup(adap, cls->cookie);
    997	if (!ch_flower)
    998		return -ENOENT;
    999
   1000	rhashtable_remove_fast(&adap->flower_tbl, &ch_flower->node,
   1001			       adap->flower_ht_params);
   1002
   1003	ret = cxgb4_flow_rule_destroy(dev, ch_flower->fs.tc_prio,
   1004				      &ch_flower->fs, ch_flower->filter_id);
   1005	if (ret)
   1006		netdev_err(dev, "Flow rule destroy failed for tid: %u, ret: %d",
   1007			   ch_flower->filter_id, ret);
   1008
   1009	kfree_rcu(ch_flower, rcu);
   1010	return ret;
   1011}
   1012
   1013static void ch_flower_stats_handler(struct work_struct *work)
   1014{
   1015	struct adapter *adap = container_of(work, struct adapter,
   1016					    flower_stats_work);
   1017	struct ch_tc_flower_entry *flower_entry;
   1018	struct ch_tc_flower_stats *ofld_stats;
   1019	struct rhashtable_iter iter;
   1020	u64 packets;
   1021	u64 bytes;
   1022	int ret;
   1023
   1024	rhashtable_walk_enter(&adap->flower_tbl, &iter);
   1025	do {
   1026		rhashtable_walk_start(&iter);
   1027
   1028		while ((flower_entry = rhashtable_walk_next(&iter)) &&
   1029		       !IS_ERR(flower_entry)) {
   1030			ret = cxgb4_get_filter_counters(adap->port[0],
   1031							flower_entry->filter_id,
   1032							&packets, &bytes,
   1033							flower_entry->fs.hash);
   1034			if (!ret) {
   1035				spin_lock(&flower_entry->lock);
   1036				ofld_stats = &flower_entry->stats;
   1037
   1038				if (ofld_stats->prev_packet_count != packets) {
   1039					ofld_stats->prev_packet_count = packets;
   1040					ofld_stats->last_used = jiffies;
   1041				}
   1042				spin_unlock(&flower_entry->lock);
   1043			}
   1044		}
   1045
   1046		rhashtable_walk_stop(&iter);
   1047
   1048	} while (flower_entry == ERR_PTR(-EAGAIN));
   1049	rhashtable_walk_exit(&iter);
   1050	mod_timer(&adap->flower_stats_timer, jiffies + STATS_CHECK_PERIOD);
   1051}
   1052
   1053static void ch_flower_stats_cb(struct timer_list *t)
   1054{
   1055	struct adapter *adap = from_timer(adap, t, flower_stats_timer);
   1056
   1057	schedule_work(&adap->flower_stats_work);
   1058}
   1059
   1060int cxgb4_tc_flower_stats(struct net_device *dev,
   1061			  struct flow_cls_offload *cls)
   1062{
   1063	struct adapter *adap = netdev2adap(dev);
   1064	struct ch_tc_flower_stats *ofld_stats;
   1065	struct ch_tc_flower_entry *ch_flower;
   1066	u64 packets;
   1067	u64 bytes;
   1068	int ret;
   1069
   1070	ch_flower = ch_flower_lookup(adap, cls->cookie);
   1071	if (!ch_flower) {
   1072		ret = -ENOENT;
   1073		goto err;
   1074	}
   1075
   1076	ret = cxgb4_get_filter_counters(dev, ch_flower->filter_id,
   1077					&packets, &bytes,
   1078					ch_flower->fs.hash);
   1079	if (ret < 0)
   1080		goto err;
   1081
   1082	spin_lock_bh(&ch_flower->lock);
   1083	ofld_stats = &ch_flower->stats;
   1084	if (ofld_stats->packet_count != packets) {
   1085		if (ofld_stats->prev_packet_count != packets)
   1086			ofld_stats->last_used = jiffies;
   1087		flow_stats_update(&cls->stats, bytes - ofld_stats->byte_count,
   1088				  packets - ofld_stats->packet_count, 0,
   1089				  ofld_stats->last_used,
   1090				  FLOW_ACTION_HW_STATS_IMMEDIATE);
   1091
   1092		ofld_stats->packet_count = packets;
   1093		ofld_stats->byte_count = bytes;
   1094		ofld_stats->prev_packet_count = packets;
   1095	}
   1096	spin_unlock_bh(&ch_flower->lock);
   1097	return 0;
   1098
   1099err:
   1100	return ret;
   1101}
   1102
   1103static const struct rhashtable_params cxgb4_tc_flower_ht_params = {
   1104	.nelem_hint = 384,
   1105	.head_offset = offsetof(struct ch_tc_flower_entry, node),
   1106	.key_offset = offsetof(struct ch_tc_flower_entry, tc_flower_cookie),
   1107	.key_len = sizeof(((struct ch_tc_flower_entry *)0)->tc_flower_cookie),
   1108	.max_size = 524288,
   1109	.min_size = 512,
   1110	.automatic_shrinking = true
   1111};
   1112
   1113int cxgb4_init_tc_flower(struct adapter *adap)
   1114{
   1115	int ret;
   1116
   1117	if (adap->tc_flower_initialized)
   1118		return -EEXIST;
   1119
   1120	adap->flower_ht_params = cxgb4_tc_flower_ht_params;
   1121	ret = rhashtable_init(&adap->flower_tbl, &adap->flower_ht_params);
   1122	if (ret)
   1123		return ret;
   1124
   1125	INIT_WORK(&adap->flower_stats_work, ch_flower_stats_handler);
   1126	timer_setup(&adap->flower_stats_timer, ch_flower_stats_cb, 0);
   1127	mod_timer(&adap->flower_stats_timer, jiffies + STATS_CHECK_PERIOD);
   1128	adap->tc_flower_initialized = true;
   1129	return 0;
   1130}
   1131
   1132void cxgb4_cleanup_tc_flower(struct adapter *adap)
   1133{
   1134	if (!adap->tc_flower_initialized)
   1135		return;
   1136
   1137	if (adap->flower_stats_timer.function)
   1138		del_timer_sync(&adap->flower_stats_timer);
   1139	cancel_work_sync(&adap->flower_stats_work);
   1140	rhashtable_destroy(&adap->flower_tbl);
   1141	adap->tc_flower_initialized = false;
   1142}