linux/drivers/net/ethernet/chelsio/cxgb4/cxgb4_tc_flower.c
<<
>>
Prefs
   1/*
   2 * This file is part of the Chelsio T4/T5/T6 Ethernet driver for Linux.
   3 *
   4 * Copyright (c) 2017 Chelsio Communications, Inc. All rights reserved.
   5 *
   6 * This software is available to you under a choice of one of two
   7 * licenses.  You may choose to be licensed under the terms of the GNU
   8 * General Public License (GPL) Version 2, available from the file
   9 * COPYING in the main directory of this source tree, or the
  10 * OpenIB.org BSD license below:
  11 *
  12 *     Redistribution and use in source and binary forms, with or
  13 *     without modification, are permitted provided that the following
  14 *     conditions are met:
  15 *
  16 *      - Redistributions of source code must retain the above
  17 *        copyright notice, this list of conditions and the following
  18 *        disclaimer.
  19 *
  20 *      - Redistributions in binary form must reproduce the above
  21 *        copyright notice, this list of conditions and the following
  22 *        disclaimer in the documentation and/or other materials
  23 *        provided with the distribution.
  24 *
  25 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  26 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  27 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  28 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  29 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  30 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  31 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  32 * SOFTWARE.
  33 */
  34
  35#include <net/tc_act/tc_mirred.h>
  36#include <net/tc_act/tc_pedit.h>
  37#include <net/tc_act/tc_gact.h>
  38#include <net/tc_act/tc_vlan.h>
  39
  40#include "cxgb4.h"
  41#include "cxgb4_filter.h"
  42#include "cxgb4_tc_flower.h"
  43
  44#define STATS_CHECK_PERIOD (HZ / 2)
  45
  46static struct ch_tc_pedit_fields pedits[] = {
  47        PEDIT_FIELDS(ETH_, DMAC_31_0, 4, dmac, 0),
  48        PEDIT_FIELDS(ETH_, DMAC_47_32, 2, dmac, 4),
  49        PEDIT_FIELDS(ETH_, SMAC_15_0, 2, smac, 0),
  50        PEDIT_FIELDS(ETH_, SMAC_47_16, 4, smac, 2),
  51        PEDIT_FIELDS(IP4_, SRC, 4, nat_fip, 0),
  52        PEDIT_FIELDS(IP4_, DST, 4, nat_lip, 0),
  53        PEDIT_FIELDS(IP6_, SRC_31_0, 4, nat_fip, 0),
  54        PEDIT_FIELDS(IP6_, SRC_63_32, 4, nat_fip, 4),
  55        PEDIT_FIELDS(IP6_, SRC_95_64, 4, nat_fip, 8),
  56        PEDIT_FIELDS(IP6_, SRC_127_96, 4, nat_fip, 12),
  57        PEDIT_FIELDS(IP6_, DST_31_0, 4, nat_lip, 0),
  58        PEDIT_FIELDS(IP6_, DST_63_32, 4, nat_lip, 4),
  59        PEDIT_FIELDS(IP6_, DST_95_64, 4, nat_lip, 8),
  60        PEDIT_FIELDS(IP6_, DST_127_96, 4, nat_lip, 12),
  61};
  62
  63static const struct cxgb4_natmode_config cxgb4_natmode_config_array[] = {
  64        /* Default supported NAT modes */
  65        {
  66                .chip = CHELSIO_T5,
  67                .flags = CXGB4_ACTION_NATMODE_NONE,
  68                .natmode = NAT_MODE_NONE,
  69        },
  70        {
  71                .chip = CHELSIO_T5,
  72                .flags = CXGB4_ACTION_NATMODE_DIP,
  73                .natmode = NAT_MODE_DIP,
  74        },
  75        {
  76                .chip = CHELSIO_T5,
  77                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_DPORT,
  78                .natmode = NAT_MODE_DIP_DP,
  79        },
  80        {
  81                .chip = CHELSIO_T5,
  82                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_DPORT |
  83                         CXGB4_ACTION_NATMODE_SIP,
  84                .natmode = NAT_MODE_DIP_DP_SIP,
  85        },
  86        {
  87                .chip = CHELSIO_T5,
  88                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_DPORT |
  89                         CXGB4_ACTION_NATMODE_SPORT,
  90                .natmode = NAT_MODE_DIP_DP_SP,
  91        },
  92        {
  93                .chip = CHELSIO_T5,
  94                .flags = CXGB4_ACTION_NATMODE_SIP | CXGB4_ACTION_NATMODE_SPORT,
  95                .natmode = NAT_MODE_SIP_SP,
  96        },
  97        {
  98                .chip = CHELSIO_T5,
  99                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SIP |
 100                         CXGB4_ACTION_NATMODE_SPORT,
 101                .natmode = NAT_MODE_DIP_SIP_SP,
 102        },
 103        {
 104                .chip = CHELSIO_T5,
 105                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SIP |
 106                         CXGB4_ACTION_NATMODE_DPORT |
 107                         CXGB4_ACTION_NATMODE_SPORT,
 108                .natmode = NAT_MODE_ALL,
 109        },
 110        /* T6+ can ignore L4 ports when they're disabled. */
 111        {
 112                .chip = CHELSIO_T6,
 113                .flags = CXGB4_ACTION_NATMODE_SIP,
 114                .natmode = NAT_MODE_SIP_SP,
 115        },
 116        {
 117                .chip = CHELSIO_T6,
 118                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SPORT,
 119                .natmode = NAT_MODE_DIP_DP_SP,
 120        },
 121        {
 122                .chip = CHELSIO_T6,
 123                .flags = CXGB4_ACTION_NATMODE_DIP | CXGB4_ACTION_NATMODE_SIP,
 124                .natmode = NAT_MODE_ALL,
 125        },
 126};
 127
 128static void cxgb4_action_natmode_tweak(struct ch_filter_specification *fs,
 129                                       u8 natmode_flags)
 130{
 131        u8 i = 0;
 132
 133        /* Translate the enabled NAT 4-tuple fields to one of the
 134         * hardware supported NAT mode configurations. This ensures
 135         * that we pick a valid combination, where the disabled fields
 136         * do not get overwritten to 0.
 137         */
 138        for (i = 0; i < ARRAY_SIZE(cxgb4_natmode_config_array); i++) {
 139                if (cxgb4_natmode_config_array[i].flags == natmode_flags) {
 140                        fs->nat_mode = cxgb4_natmode_config_array[i].natmode;
 141                        return;
 142                }
 143        }
 144}
 145
 146static struct ch_tc_flower_entry *allocate_flower_entry(void)
 147{
 148        struct ch_tc_flower_entry *new = kzalloc(sizeof(*new), GFP_KERNEL);
 149        if (new)
 150                spin_lock_init(&new->lock);
 151        return new;
 152}
 153
 154/* Must be called with either RTNL or rcu_read_lock */
 155static struct ch_tc_flower_entry *ch_flower_lookup(struct adapter *adap,
 156                                                   unsigned long flower_cookie)
 157{
 158        return rhashtable_lookup_fast(&adap->flower_tbl, &flower_cookie,
 159                                      adap->flower_ht_params);
 160}
 161
 162static void cxgb4_process_flow_match(struct net_device *dev,
 163                                     struct flow_rule *rule,
 164                                     struct ch_filter_specification *fs)
 165{
 166        u16 addr_type = 0;
 167
 168        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_CONTROL)) {
 169                struct flow_match_control match;
 170
 171                flow_rule_match_control(rule, &match);
 172                addr_type = match.key->addr_type;
 173        } else if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IPV4_ADDRS)) {
 174                addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
 175        } else if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IPV6_ADDRS)) {
 176                addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
 177        }
 178
 179        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_BASIC)) {
 180                struct flow_match_basic match;
 181                u16 ethtype_key, ethtype_mask;
 182
 183                flow_rule_match_basic(rule, &match);
 184                ethtype_key = ntohs(match.key->n_proto);
 185                ethtype_mask = ntohs(match.mask->n_proto);
 186
 187                if (ethtype_key == ETH_P_ALL) {
 188                        ethtype_key = 0;
 189                        ethtype_mask = 0;
 190                }
 191
 192                if (ethtype_key == ETH_P_IPV6)
 193                        fs->type = 1;
 194
 195                fs->val.ethtype = ethtype_key;
 196                fs->mask.ethtype = ethtype_mask;
 197                fs->val.proto = match.key->ip_proto;
 198                fs->mask.proto = match.mask->ip_proto;
 199        }
 200
 201        if (addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS) {
 202                struct flow_match_ipv4_addrs match;
 203
 204                flow_rule_match_ipv4_addrs(rule, &match);
 205                fs->type = 0;
 206                memcpy(&fs->val.lip[0], &match.key->dst, sizeof(match.key->dst));
 207                memcpy(&fs->val.fip[0], &match.key->src, sizeof(match.key->src));
 208                memcpy(&fs->mask.lip[0], &match.mask->dst, sizeof(match.mask->dst));
 209                memcpy(&fs->mask.fip[0], &match.mask->src, sizeof(match.mask->src));
 210
 211                /* also initialize nat_lip/fip to same values */
 212                memcpy(&fs->nat_lip[0], &match.key->dst, sizeof(match.key->dst));
 213                memcpy(&fs->nat_fip[0], &match.key->src, sizeof(match.key->src));
 214        }
 215
 216        if (addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS) {
 217                struct flow_match_ipv6_addrs match;
 218
 219                flow_rule_match_ipv6_addrs(rule, &match);
 220                fs->type = 1;
 221                memcpy(&fs->val.lip[0], match.key->dst.s6_addr,
 222                       sizeof(match.key->dst));
 223                memcpy(&fs->val.fip[0], match.key->src.s6_addr,
 224                       sizeof(match.key->src));
 225                memcpy(&fs->mask.lip[0], match.mask->dst.s6_addr,
 226                       sizeof(match.mask->dst));
 227                memcpy(&fs->mask.fip[0], match.mask->src.s6_addr,
 228                       sizeof(match.mask->src));
 229
 230                /* also initialize nat_lip/fip to same values */
 231                memcpy(&fs->nat_lip[0], match.key->dst.s6_addr,
 232                       sizeof(match.key->dst));
 233                memcpy(&fs->nat_fip[0], match.key->src.s6_addr,
 234                       sizeof(match.key->src));
 235        }
 236
 237        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_PORTS)) {
 238                struct flow_match_ports match;
 239
 240                flow_rule_match_ports(rule, &match);
 241                fs->val.lport = be16_to_cpu(match.key->dst);
 242                fs->mask.lport = be16_to_cpu(match.mask->dst);
 243                fs->val.fport = be16_to_cpu(match.key->src);
 244                fs->mask.fport = be16_to_cpu(match.mask->src);
 245
 246                /* also initialize nat_lport/fport to same values */
 247                fs->nat_lport = fs->val.lport;
 248                fs->nat_fport = fs->val.fport;
 249        }
 250
 251        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IP)) {
 252                struct flow_match_ip match;
 253
 254                flow_rule_match_ip(rule, &match);
 255                fs->val.tos = match.key->tos;
 256                fs->mask.tos = match.mask->tos;
 257        }
 258
 259        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ENC_KEYID)) {
 260                struct flow_match_enc_keyid match;
 261
 262                flow_rule_match_enc_keyid(rule, &match);
 263                fs->val.vni = be32_to_cpu(match.key->keyid);
 264                fs->mask.vni = be32_to_cpu(match.mask->keyid);
 265                if (fs->mask.vni) {
 266                        fs->val.encap_vld = 1;
 267                        fs->mask.encap_vld = 1;
 268                }
 269        }
 270
 271        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_VLAN)) {
 272                struct flow_match_vlan match;
 273                u16 vlan_tci, vlan_tci_mask;
 274
 275                flow_rule_match_vlan(rule, &match);
 276                vlan_tci = match.key->vlan_id | (match.key->vlan_priority <<
 277                                               VLAN_PRIO_SHIFT);
 278                vlan_tci_mask = match.mask->vlan_id | (match.mask->vlan_priority <<
 279                                                     VLAN_PRIO_SHIFT);
 280                fs->val.ivlan = vlan_tci;
 281                fs->mask.ivlan = vlan_tci_mask;
 282
 283                fs->val.ivlan_vld = 1;
 284                fs->mask.ivlan_vld = 1;
 285
 286                /* Chelsio adapters use ivlan_vld bit to match vlan packets
 287                 * as 802.1Q. Also, when vlan tag is present in packets,
 288                 * ethtype match is used then to match on ethtype of inner
 289                 * header ie. the header following the vlan header.
 290                 * So, set the ivlan_vld based on ethtype info supplied by
 291                 * TC for vlan packets if its 802.1Q. And then reset the
 292                 * ethtype value else, hw will try to match the supplied
 293                 * ethtype value with ethtype of inner header.
 294                 */
 295                if (fs->val.ethtype == ETH_P_8021Q) {
 296                        fs->val.ethtype = 0;
 297                        fs->mask.ethtype = 0;
 298                }
 299        }
 300
 301        /* Match only packets coming from the ingress port where this
 302         * filter will be created.
 303         */
 304        fs->val.iport = netdev2pinfo(dev)->port_id;
 305        fs->mask.iport = ~0;
 306}
 307
 308static int cxgb4_validate_flow_match(struct net_device *dev,
 309                                     struct flow_rule *rule)
 310{
 311        struct flow_dissector *dissector = rule->match.dissector;
 312        u16 ethtype_mask = 0;
 313        u16 ethtype_key = 0;
 314
 315        if (dissector->used_keys &
 316            ~(BIT(FLOW_DISSECTOR_KEY_CONTROL) |
 317              BIT(FLOW_DISSECTOR_KEY_BASIC) |
 318              BIT(FLOW_DISSECTOR_KEY_IPV4_ADDRS) |
 319              BIT(FLOW_DISSECTOR_KEY_IPV6_ADDRS) |
 320              BIT(FLOW_DISSECTOR_KEY_PORTS) |
 321              BIT(FLOW_DISSECTOR_KEY_ENC_KEYID) |
 322              BIT(FLOW_DISSECTOR_KEY_VLAN) |
 323              BIT(FLOW_DISSECTOR_KEY_IP))) {
 324                netdev_warn(dev, "Unsupported key used: 0x%x\n",
 325                            dissector->used_keys);
 326                return -EOPNOTSUPP;
 327        }
 328
 329        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_BASIC)) {
 330                struct flow_match_basic match;
 331
 332                flow_rule_match_basic(rule, &match);
 333                ethtype_key = ntohs(match.key->n_proto);
 334                ethtype_mask = ntohs(match.mask->n_proto);
 335        }
 336
 337        if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IP)) {
 338                u16 eth_ip_type = ethtype_key & ethtype_mask;
 339                struct flow_match_ip match;
 340
 341                if (eth_ip_type != ETH_P_IP && eth_ip_type != ETH_P_IPV6) {
 342                        netdev_err(dev, "IP Key supported only with IPv4/v6");
 343                        return -EINVAL;
 344                }
 345
 346                flow_rule_match_ip(rule, &match);
 347                if (match.mask->ttl) {
 348                        netdev_warn(dev, "ttl match unsupported for offload");
 349                        return -EOPNOTSUPP;
 350                }
 351        }
 352
 353        return 0;
 354}
 355
 356static void offload_pedit(struct ch_filter_specification *fs, u32 val, u32 mask,
 357                          u8 field)
 358{
 359        u32 set_val = val & ~mask;
 360        u32 offset = 0;
 361        u8 size = 1;
 362        int i;
 363
 364        for (i = 0; i < ARRAY_SIZE(pedits); i++) {
 365                if (pedits[i].field == field) {
 366                        offset = pedits[i].offset;
 367                        size = pedits[i].size;
 368                        break;
 369                }
 370        }
 371        memcpy((u8 *)fs + offset, &set_val, size);
 372}
 373
 374static void process_pedit_field(struct ch_filter_specification *fs, u32 val,
 375                                u32 mask, u32 offset, u8 htype,
 376                                u8 *natmode_flags)
 377{
 378        switch (htype) {
 379        case FLOW_ACT_MANGLE_HDR_TYPE_ETH:
 380                switch (offset) {
 381                case PEDIT_ETH_DMAC_31_0:
 382                        fs->newdmac = 1;
 383                        offload_pedit(fs, val, mask, ETH_DMAC_31_0);
 384                        break;
 385                case PEDIT_ETH_DMAC_47_32_SMAC_15_0:
 386                        if (~mask & PEDIT_ETH_DMAC_MASK)
 387                                offload_pedit(fs, val, mask, ETH_DMAC_47_32);
 388                        else
 389                                offload_pedit(fs, val >> 16, mask >> 16,
 390                                              ETH_SMAC_15_0);
 391                        break;
 392                case PEDIT_ETH_SMAC_47_16:
 393                        fs->newsmac = 1;
 394                        offload_pedit(fs, val, mask, ETH_SMAC_47_16);
 395                }
 396                break;
 397        case FLOW_ACT_MANGLE_HDR_TYPE_IP4:
 398                switch (offset) {
 399                case PEDIT_IP4_SRC:
 400                        offload_pedit(fs, val, mask, IP4_SRC);
 401                        *natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
 402                        break;
 403                case PEDIT_IP4_DST:
 404                        offload_pedit(fs, val, mask, IP4_DST);
 405                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 406                }
 407                break;
 408        case FLOW_ACT_MANGLE_HDR_TYPE_IP6:
 409                switch (offset) {
 410                case PEDIT_IP6_SRC_31_0:
 411                        offload_pedit(fs, val, mask, IP6_SRC_31_0);
 412                        *natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
 413                        break;
 414                case PEDIT_IP6_SRC_63_32:
 415                        offload_pedit(fs, val, mask, IP6_SRC_63_32);
 416                        *natmode_flags |=  CXGB4_ACTION_NATMODE_SIP;
 417                        break;
 418                case PEDIT_IP6_SRC_95_64:
 419                        offload_pedit(fs, val, mask, IP6_SRC_95_64);
 420                        *natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
 421                        break;
 422                case PEDIT_IP6_SRC_127_96:
 423                        offload_pedit(fs, val, mask, IP6_SRC_127_96);
 424                        *natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
 425                        break;
 426                case PEDIT_IP6_DST_31_0:
 427                        offload_pedit(fs, val, mask, IP6_DST_31_0);
 428                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 429                        break;
 430                case PEDIT_IP6_DST_63_32:
 431                        offload_pedit(fs, val, mask, IP6_DST_63_32);
 432                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 433                        break;
 434                case PEDIT_IP6_DST_95_64:
 435                        offload_pedit(fs, val, mask, IP6_DST_95_64);
 436                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 437                        break;
 438                case PEDIT_IP6_DST_127_96:
 439                        offload_pedit(fs, val, mask, IP6_DST_127_96);
 440                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 441                }
 442                break;
 443        case FLOW_ACT_MANGLE_HDR_TYPE_TCP:
 444                switch (offset) {
 445                case PEDIT_TCP_SPORT_DPORT:
 446                        if (~mask & PEDIT_TCP_UDP_SPORT_MASK) {
 447                                fs->nat_fport = val;
 448                                *natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
 449                        } else {
 450                                fs->nat_lport = val >> 16;
 451                                *natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
 452                        }
 453                }
 454                break;
 455        case FLOW_ACT_MANGLE_HDR_TYPE_UDP:
 456                switch (offset) {
 457                case PEDIT_UDP_SPORT_DPORT:
 458                        if (~mask & PEDIT_TCP_UDP_SPORT_MASK) {
 459                                fs->nat_fport = val;
 460                                *natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
 461                        } else {
 462                                fs->nat_lport = val >> 16;
 463                                *natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
 464                        }
 465                }
 466                break;
 467        }
 468}
 469
 470static int cxgb4_action_natmode_validate(struct adapter *adap, u8 natmode_flags,
 471                                         struct netlink_ext_ack *extack)
 472{
 473        u8 i = 0;
 474
 475        /* Extract the NAT mode to enable based on what 4-tuple fields
 476         * are enabled to be overwritten. This ensures that the
 477         * disabled fields don't get overwritten to 0.
 478         */
 479        for (i = 0; i < ARRAY_SIZE(cxgb4_natmode_config_array); i++) {
 480                const struct cxgb4_natmode_config *c;
 481
 482                c = &cxgb4_natmode_config_array[i];
 483                if (CHELSIO_CHIP_VERSION(adap->params.chip) >= c->chip &&
 484                    natmode_flags == c->flags)
 485                        return 0;
 486        }
 487        NL_SET_ERR_MSG_MOD(extack, "Unsupported NAT mode 4-tuple combination");
 488        return -EOPNOTSUPP;
 489}
 490
 491void cxgb4_process_flow_actions(struct net_device *in,
 492                                struct flow_action *actions,
 493                                struct ch_filter_specification *fs)
 494{
 495        struct flow_action_entry *act;
 496        u8 natmode_flags = 0;
 497        int i;
 498
 499        flow_action_for_each(i, act, actions) {
 500                switch (act->id) {
 501                case FLOW_ACTION_ACCEPT:
 502                        fs->action = FILTER_PASS;
 503                        break;
 504                case FLOW_ACTION_DROP:
 505                        fs->action = FILTER_DROP;
 506                        break;
 507                case FLOW_ACTION_MIRRED:
 508                case FLOW_ACTION_REDIRECT: {
 509                        struct net_device *out = act->dev;
 510                        struct port_info *pi = netdev_priv(out);
 511
 512                        fs->action = FILTER_SWITCH;
 513                        fs->eport = pi->port_id;
 514                        }
 515                        break;
 516                case FLOW_ACTION_VLAN_POP:
 517                case FLOW_ACTION_VLAN_PUSH:
 518                case FLOW_ACTION_VLAN_MANGLE: {
 519                        u8 prio = act->vlan.prio;
 520                        u16 vid = act->vlan.vid;
 521                        u16 vlan_tci = (prio << VLAN_PRIO_SHIFT) | vid;
 522                        switch (act->id) {
 523                        case FLOW_ACTION_VLAN_POP:
 524                                fs->newvlan |= VLAN_REMOVE;
 525                                break;
 526                        case FLOW_ACTION_VLAN_PUSH:
 527                                fs->newvlan |= VLAN_INSERT;
 528                                fs->vlan = vlan_tci;
 529                                break;
 530                        case FLOW_ACTION_VLAN_MANGLE:
 531                                fs->newvlan |= VLAN_REWRITE;
 532                                fs->vlan = vlan_tci;
 533                                break;
 534                        default:
 535                                break;
 536                        }
 537                        }
 538                        break;
 539                case FLOW_ACTION_MANGLE: {
 540                        u32 mask, val, offset;
 541                        u8 htype;
 542
 543                        htype = act->mangle.htype;
 544                        mask = act->mangle.mask;
 545                        val = act->mangle.val;
 546                        offset = act->mangle.offset;
 547
 548                        process_pedit_field(fs, val, mask, offset, htype,
 549                                            &natmode_flags);
 550                        }
 551                        break;
 552                case FLOW_ACTION_QUEUE:
 553                        fs->action = FILTER_PASS;
 554                        fs->dirsteer = 1;
 555                        fs->iq = act->queue.index;
 556                        break;
 557                default:
 558                        break;
 559                }
 560        }
 561        if (natmode_flags)
 562                cxgb4_action_natmode_tweak(fs, natmode_flags);
 563
 564}
 565
 566static bool valid_l4_mask(u32 mask)
 567{
 568        u16 hi, lo;
 569
 570        /* Either the upper 16-bits (SPORT) OR the lower
 571         * 16-bits (DPORT) can be set, but NOT BOTH.
 572         */
 573        hi = (mask >> 16) & 0xFFFF;
 574        lo = mask & 0xFFFF;
 575
 576        return hi && lo ? false : true;
 577}
 578
 579static bool valid_pedit_action(struct net_device *dev,
 580                               const struct flow_action_entry *act,
 581                               u8 *natmode_flags)
 582{
 583        u32 mask, offset;
 584        u8 htype;
 585
 586        htype = act->mangle.htype;
 587        mask = act->mangle.mask;
 588        offset = act->mangle.offset;
 589
 590        switch (htype) {
 591        case FLOW_ACT_MANGLE_HDR_TYPE_ETH:
 592                switch (offset) {
 593                case PEDIT_ETH_DMAC_31_0:
 594                case PEDIT_ETH_DMAC_47_32_SMAC_15_0:
 595                case PEDIT_ETH_SMAC_47_16:
 596                        break;
 597                default:
 598                        netdev_err(dev, "%s: Unsupported pedit field\n",
 599                                   __func__);
 600                        return false;
 601                }
 602                break;
 603        case FLOW_ACT_MANGLE_HDR_TYPE_IP4:
 604                switch (offset) {
 605                case PEDIT_IP4_SRC:
 606                        *natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
 607                        break;
 608                case PEDIT_IP4_DST:
 609                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 610                        break;
 611                default:
 612                        netdev_err(dev, "%s: Unsupported pedit field\n",
 613                                   __func__);
 614                        return false;
 615                }
 616                break;
 617        case FLOW_ACT_MANGLE_HDR_TYPE_IP6:
 618                switch (offset) {
 619                case PEDIT_IP6_SRC_31_0:
 620                case PEDIT_IP6_SRC_63_32:
 621                case PEDIT_IP6_SRC_95_64:
 622                case PEDIT_IP6_SRC_127_96:
 623                        *natmode_flags |= CXGB4_ACTION_NATMODE_SIP;
 624                        break;
 625                case PEDIT_IP6_DST_31_0:
 626                case PEDIT_IP6_DST_63_32:
 627                case PEDIT_IP6_DST_95_64:
 628                case PEDIT_IP6_DST_127_96:
 629                        *natmode_flags |= CXGB4_ACTION_NATMODE_DIP;
 630                        break;
 631                default:
 632                        netdev_err(dev, "%s: Unsupported pedit field\n",
 633                                   __func__);
 634                        return false;
 635                }
 636                break;
 637        case FLOW_ACT_MANGLE_HDR_TYPE_TCP:
 638                switch (offset) {
 639                case PEDIT_TCP_SPORT_DPORT:
 640                        if (!valid_l4_mask(~mask)) {
 641                                netdev_err(dev, "%s: Unsupported mask for TCP L4 ports\n",
 642                                           __func__);
 643                                return false;
 644                        }
 645                        if (~mask & PEDIT_TCP_UDP_SPORT_MASK)
 646                                *natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
 647                        else
 648                                *natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
 649                        break;
 650                default:
 651                        netdev_err(dev, "%s: Unsupported pedit field\n",
 652                                   __func__);
 653                        return false;
 654                }
 655                break;
 656        case FLOW_ACT_MANGLE_HDR_TYPE_UDP:
 657                switch (offset) {
 658                case PEDIT_UDP_SPORT_DPORT:
 659                        if (!valid_l4_mask(~mask)) {
 660                                netdev_err(dev, "%s: Unsupported mask for UDP L4 ports\n",
 661                                           __func__);
 662                                return false;
 663                        }
 664                        if (~mask & PEDIT_TCP_UDP_SPORT_MASK)
 665                                *natmode_flags |= CXGB4_ACTION_NATMODE_SPORT;
 666                        else
 667                                *natmode_flags |= CXGB4_ACTION_NATMODE_DPORT;
 668                        break;
 669                default:
 670                        netdev_err(dev, "%s: Unsupported pedit field\n",
 671                                   __func__);
 672                        return false;
 673                }
 674                break;
 675        default:
 676                netdev_err(dev, "%s: Unsupported pedit type\n", __func__);
 677                return false;
 678        }
 679        return true;
 680}
 681
 682int cxgb4_validate_flow_actions(struct net_device *dev,
 683                                struct flow_action *actions,
 684                                struct netlink_ext_ack *extack,
 685                                u8 matchall_filter)
 686{
 687        struct adapter *adap = netdev2adap(dev);
 688        struct flow_action_entry *act;
 689        bool act_redir = false;
 690        bool act_pedit = false;
 691        bool act_vlan = false;
 692        u8 natmode_flags = 0;
 693        int i;
 694
 695        if (!flow_action_basic_hw_stats_check(actions, extack))
 696                return -EOPNOTSUPP;
 697
 698        flow_action_for_each(i, act, actions) {
 699                switch (act->id) {
 700                case FLOW_ACTION_ACCEPT:
 701                case FLOW_ACTION_DROP:
 702                        /* Do nothing */
 703                        break;
 704                case FLOW_ACTION_MIRRED:
 705                case FLOW_ACTION_REDIRECT: {
 706                        struct net_device *n_dev, *target_dev;
 707                        bool found = false;
 708                        unsigned int i;
 709
 710                        if (act->id == FLOW_ACTION_MIRRED &&
 711                            !matchall_filter) {
 712                                NL_SET_ERR_MSG_MOD(extack,
 713                                                   "Egress mirror action is only supported for tc-matchall");
 714                                return -EOPNOTSUPP;
 715                        }
 716
 717                        target_dev = act->dev;
 718                        for_each_port(adap, i) {
 719                                n_dev = adap->port[i];
 720                                if (target_dev == n_dev) {
 721                                        found = true;
 722                                        break;
 723                                }
 724                        }
 725
 726                        /* If interface doesn't belong to our hw, then
 727                         * the provided output port is not valid
 728                         */
 729                        if (!found) {
 730                                netdev_err(dev, "%s: Out port invalid\n",
 731                                           __func__);
 732                                return -EINVAL;
 733                        }
 734                        act_redir = true;
 735                        }
 736                        break;
 737                case FLOW_ACTION_VLAN_POP:
 738                case FLOW_ACTION_VLAN_PUSH:
 739                case FLOW_ACTION_VLAN_MANGLE: {
 740                        u16 proto = be16_to_cpu(act->vlan.proto);
 741
 742                        switch (act->id) {
 743                        case FLOW_ACTION_VLAN_POP:
 744                                break;
 745                        case FLOW_ACTION_VLAN_PUSH:
 746                        case FLOW_ACTION_VLAN_MANGLE:
 747                                if (proto != ETH_P_8021Q) {
 748                                        netdev_err(dev, "%s: Unsupported vlan proto\n",
 749                                                   __func__);
 750                                        return -EOPNOTSUPP;
 751                                }
 752                                break;
 753                        default:
 754                                netdev_err(dev, "%s: Unsupported vlan action\n",
 755                                           __func__);
 756                                return -EOPNOTSUPP;
 757                        }
 758                        act_vlan = true;
 759                        }
 760                        break;
 761                case FLOW_ACTION_MANGLE: {
 762                        bool pedit_valid = valid_pedit_action(dev, act,
 763                                                              &natmode_flags);
 764
 765                        if (!pedit_valid)
 766                                return -EOPNOTSUPP;
 767                        act_pedit = true;
 768                        }
 769                        break;
 770                case FLOW_ACTION_QUEUE:
 771                        /* Do nothing. cxgb4_set_filter will validate */
 772                        break;
 773                default:
 774                        netdev_err(dev, "%s: Unsupported action\n", __func__);
 775                        return -EOPNOTSUPP;
 776                }
 777        }
 778
 779        if ((act_pedit || act_vlan) && !act_redir) {
 780                netdev_err(dev, "%s: pedit/vlan rewrite invalid without egress redirect\n",
 781                           __func__);
 782                return -EINVAL;
 783        }
 784
 785        if (act_pedit) {
 786                int ret;
 787
 788                ret = cxgb4_action_natmode_validate(adap, natmode_flags,
 789                                                    extack);
 790                if (ret)
 791                        return ret;
 792        }
 793
 794        return 0;
 795}
 796
 797static void cxgb4_tc_flower_hash_prio_add(struct adapter *adap, u32 tc_prio)
 798{
 799        spin_lock_bh(&adap->tids.ftid_lock);
 800        if (adap->tids.tc_hash_tids_max_prio < tc_prio)
 801                adap->tids.tc_hash_tids_max_prio = tc_prio;
 802        spin_unlock_bh(&adap->tids.ftid_lock);
 803}
 804
 805static void cxgb4_tc_flower_hash_prio_del(struct adapter *adap, u32 tc_prio)
 806{
 807        struct tid_info *t = &adap->tids;
 808        struct ch_tc_flower_entry *fe;
 809        struct rhashtable_iter iter;
 810        u32 found = 0;
 811
 812        spin_lock_bh(&t->ftid_lock);
 813        /* Bail if the current rule is not the one with the max
 814         * prio.
 815         */
 816        if (t->tc_hash_tids_max_prio != tc_prio)
 817                goto out_unlock;
 818
 819        /* Search for the next rule having the same or next lower
 820         * max prio.
 821         */
 822        rhashtable_walk_enter(&adap->flower_tbl, &iter);
 823        do {
 824                rhashtable_walk_start(&iter);
 825
 826                fe = rhashtable_walk_next(&iter);
 827                while (!IS_ERR_OR_NULL(fe)) {
 828                        if (fe->fs.hash &&
 829                            fe->fs.tc_prio <= t->tc_hash_tids_max_prio) {
 830                                t->tc_hash_tids_max_prio = fe->fs.tc_prio;
 831                                found++;
 832
 833                                /* Bail if we found another rule
 834                                 * having the same prio as the
 835                                 * current max one.
 836                                 */
 837                                if (fe->fs.tc_prio == tc_prio)
 838                                        break;
 839                        }
 840
 841                        fe = rhashtable_walk_next(&iter);
 842                }
 843
 844                rhashtable_walk_stop(&iter);
 845        } while (fe == ERR_PTR(-EAGAIN));
 846        rhashtable_walk_exit(&iter);
 847
 848        if (!found)
 849                t->tc_hash_tids_max_prio = 0;
 850
 851out_unlock:
 852        spin_unlock_bh(&t->ftid_lock);
 853}
 854
 855int cxgb4_flow_rule_replace(struct net_device *dev, struct flow_rule *rule,
 856                            u32 tc_prio, struct netlink_ext_ack *extack,
 857                            struct ch_filter_specification *fs, u32 *tid)
 858{
 859        struct adapter *adap = netdev2adap(dev);
 860        struct filter_ctx ctx;
 861        u8 inet_family;
 862        int fidx, ret;
 863
 864        if (cxgb4_validate_flow_actions(dev, &rule->action, extack, 0))
 865                return -EOPNOTSUPP;
 866
 867        if (cxgb4_validate_flow_match(dev, rule))
 868                return -EOPNOTSUPP;
 869
 870        cxgb4_process_flow_match(dev, rule, fs);
 871        cxgb4_process_flow_actions(dev, &rule->action, fs);
 872
 873        fs->hash = is_filter_exact_match(adap, fs);
 874        inet_family = fs->type ? PF_INET6 : PF_INET;
 875
 876        /* Get a free filter entry TID, where we can insert this new
 877         * rule. Only insert rule if its prio doesn't conflict with
 878         * existing rules.
 879         */
 880        fidx = cxgb4_get_free_ftid(dev, inet_family, fs->hash,
 881                                   tc_prio);
 882        if (fidx < 0) {
 883                NL_SET_ERR_MSG_MOD(extack,
 884                                   "No free LETCAM index available");
 885                return -ENOMEM;
 886        }
 887
 888        if (fidx < adap->tids.nhpftids) {
 889                fs->prio = 1;
 890                fs->hash = 0;
 891        }
 892
 893        /* If the rule can be inserted into HASH region, then ignore
 894         * the index to normal FILTER region.
 895         */
 896        if (fs->hash)
 897                fidx = 0;
 898
 899        fs->tc_prio = tc_prio;
 900
 901        init_completion(&ctx.completion);
 902        ret = __cxgb4_set_filter(dev, fidx, fs, &ctx);
 903        if (ret) {
 904                netdev_err(dev, "%s: filter creation err %d\n",
 905                           __func__, ret);
 906                return ret;
 907        }
 908
 909        /* Wait for reply */
 910        ret = wait_for_completion_timeout(&ctx.completion, 10 * HZ);
 911        if (!ret)
 912                return -ETIMEDOUT;
 913
 914        /* Check if hw returned error for filter creation */
 915        if (ctx.result)
 916                return ctx.result;
 917
 918        *tid = ctx.tid;
 919
 920        if (fs->hash)
 921                cxgb4_tc_flower_hash_prio_add(adap, tc_prio);
 922
 923        return 0;
 924}
 925
 926int cxgb4_tc_flower_replace(struct net_device *dev,
 927                            struct flow_cls_offload *cls)
 928{
 929        struct flow_rule *rule = flow_cls_offload_flow_rule(cls);
 930        struct netlink_ext_ack *extack = cls->common.extack;
 931        struct adapter *adap = netdev2adap(dev);
 932        struct ch_tc_flower_entry *ch_flower;
 933        struct ch_filter_specification *fs;
 934        int ret;
 935
 936        ch_flower = allocate_flower_entry();
 937        if (!ch_flower) {
 938                netdev_err(dev, "%s: ch_flower alloc failed.\n", __func__);
 939                return -ENOMEM;
 940        }
 941
 942        fs = &ch_flower->fs;
 943        fs->hitcnts = 1;
 944        fs->tc_cookie = cls->cookie;
 945
 946        ret = cxgb4_flow_rule_replace(dev, rule, cls->common.prio, extack, fs,
 947                                      &ch_flower->filter_id);
 948        if (ret)
 949                goto free_entry;
 950
 951        ch_flower->tc_flower_cookie = cls->cookie;
 952        ret = rhashtable_insert_fast(&adap->flower_tbl, &ch_flower->node,
 953                                     adap->flower_ht_params);
 954        if (ret)
 955                goto del_filter;
 956
 957        return 0;
 958
 959del_filter:
 960        if (fs->hash)
 961                cxgb4_tc_flower_hash_prio_del(adap, cls->common.prio);
 962
 963        cxgb4_del_filter(dev, ch_flower->filter_id, &ch_flower->fs);
 964
 965free_entry:
 966        kfree(ch_flower);
 967        return ret;
 968}
 969
 970int cxgb4_flow_rule_destroy(struct net_device *dev, u32 tc_prio,
 971                            struct ch_filter_specification *fs, int tid)
 972{
 973        struct adapter *adap = netdev2adap(dev);
 974        u8 hash;
 975        int ret;
 976
 977        hash = fs->hash;
 978
 979        ret = cxgb4_del_filter(dev, tid, fs);
 980        if (ret)
 981                return ret;
 982
 983        if (hash)
 984                cxgb4_tc_flower_hash_prio_del(adap, tc_prio);
 985
 986        return ret;
 987}
 988
 989int cxgb4_tc_flower_destroy(struct net_device *dev,
 990                            struct flow_cls_offload *cls)
 991{
 992        struct adapter *adap = netdev2adap(dev);
 993        struct ch_tc_flower_entry *ch_flower;
 994        int ret;
 995
 996        ch_flower = ch_flower_lookup(adap, cls->cookie);
 997        if (!ch_flower)
 998                return -ENOENT;
 999
1000        rhashtable_remove_fast(&adap->flower_tbl, &ch_flower->node,
1001                               adap->flower_ht_params);
1002
1003        ret = cxgb4_flow_rule_destroy(dev, ch_flower->fs.tc_prio,
1004                                      &ch_flower->fs, ch_flower->filter_id);
1005        if (ret)
1006                netdev_err(dev, "Flow rule destroy failed for tid: %u, ret: %d",
1007                           ch_flower->filter_id, ret);
1008
1009        kfree_rcu(ch_flower, rcu);
1010        return ret;
1011}
1012
1013static void ch_flower_stats_handler(struct work_struct *work)
1014{
1015        struct adapter *adap = container_of(work, struct adapter,
1016                                            flower_stats_work);
1017        struct ch_tc_flower_entry *flower_entry;
1018        struct ch_tc_flower_stats *ofld_stats;
1019        struct rhashtable_iter iter;
1020        u64 packets;
1021        u64 bytes;
1022        int ret;
1023
1024        rhashtable_walk_enter(&adap->flower_tbl, &iter);
1025        do {
1026                rhashtable_walk_start(&iter);
1027
1028                while ((flower_entry = rhashtable_walk_next(&iter)) &&
1029                       !IS_ERR(flower_entry)) {
1030                        ret = cxgb4_get_filter_counters(adap->port[0],
1031                                                        flower_entry->filter_id,
1032                                                        &packets, &bytes,
1033                                                        flower_entry->fs.hash);
1034                        if (!ret) {
1035                                spin_lock(&flower_entry->lock);
1036                                ofld_stats = &flower_entry->stats;
1037
1038                                if (ofld_stats->prev_packet_count != packets) {
1039                                        ofld_stats->prev_packet_count = packets;
1040                                        ofld_stats->last_used = jiffies;
1041                                }
1042                                spin_unlock(&flower_entry->lock);
1043                        }
1044                }
1045
1046                rhashtable_walk_stop(&iter);
1047
1048        } while (flower_entry == ERR_PTR(-EAGAIN));
1049        rhashtable_walk_exit(&iter);
1050        mod_timer(&adap->flower_stats_timer, jiffies + STATS_CHECK_PERIOD);
1051}
1052
1053static void ch_flower_stats_cb(struct timer_list *t)
1054{
1055        struct adapter *adap = from_timer(adap, t, flower_stats_timer);
1056
1057        schedule_work(&adap->flower_stats_work);
1058}
1059
1060int cxgb4_tc_flower_stats(struct net_device *dev,
1061                          struct flow_cls_offload *cls)
1062{
1063        struct adapter *adap = netdev2adap(dev);
1064        struct ch_tc_flower_stats *ofld_stats;
1065        struct ch_tc_flower_entry *ch_flower;
1066        u64 packets;
1067        u64 bytes;
1068        int ret;
1069
1070        ch_flower = ch_flower_lookup(adap, cls->cookie);
1071        if (!ch_flower) {
1072                ret = -ENOENT;
1073                goto err;
1074        }
1075
1076        ret = cxgb4_get_filter_counters(dev, ch_flower->filter_id,
1077                                        &packets, &bytes,
1078                                        ch_flower->fs.hash);
1079        if (ret < 0)
1080                goto err;
1081
1082        spin_lock_bh(&ch_flower->lock);
1083        ofld_stats = &ch_flower->stats;
1084        if (ofld_stats->packet_count != packets) {
1085                if (ofld_stats->prev_packet_count != packets)
1086                        ofld_stats->last_used = jiffies;
1087                flow_stats_update(&cls->stats, bytes - ofld_stats->byte_count,
1088                                  packets - ofld_stats->packet_count, 0,
1089                                  ofld_stats->last_used,
1090                                  FLOW_ACTION_HW_STATS_IMMEDIATE);
1091
1092                ofld_stats->packet_count = packets;
1093                ofld_stats->byte_count = bytes;
1094                ofld_stats->prev_packet_count = packets;
1095        }
1096        spin_unlock_bh(&ch_flower->lock);
1097        return 0;
1098
1099err:
1100        return ret;
1101}
1102
1103static const struct rhashtable_params cxgb4_tc_flower_ht_params = {
1104        .nelem_hint = 384,
1105        .head_offset = offsetof(struct ch_tc_flower_entry, node),
1106        .key_offset = offsetof(struct ch_tc_flower_entry, tc_flower_cookie),
1107        .key_len = sizeof(((struct ch_tc_flower_entry *)0)->tc_flower_cookie),
1108        .max_size = 524288,
1109        .min_size = 512,
1110        .automatic_shrinking = true
1111};
1112
1113int cxgb4_init_tc_flower(struct adapter *adap)
1114{
1115        int ret;
1116
1117        if (adap->tc_flower_initialized)
1118                return -EEXIST;
1119
1120        adap->flower_ht_params = cxgb4_tc_flower_ht_params;
1121        ret = rhashtable_init(&adap->flower_tbl, &adap->flower_ht_params);
1122        if (ret)
1123                return ret;
1124
1125        INIT_WORK(&adap->flower_stats_work, ch_flower_stats_handler);
1126        timer_setup(&adap->flower_stats_timer, ch_flower_stats_cb, 0);
1127        mod_timer(&adap->flower_stats_timer, jiffies + STATS_CHECK_PERIOD);
1128        adap->tc_flower_initialized = true;
1129        return 0;
1130}
1131
1132void cxgb4_cleanup_tc_flower(struct adapter *adap)
1133{
1134        if (!adap->tc_flower_initialized)
1135                return;
1136
1137        if (adap->flower_stats_timer.function)
1138                del_timer_sync(&adap->flower_stats_timer);
1139        cancel_work_sync(&adap->flower_stats_work);
1140        rhashtable_destroy(&adap->flower_tbl);
1141        adap->tc_flower_initialized = false;
1142}
1143