/* SPDX-License-Identifier: BSD-3-Clause * * Copyright(c) 2019-2021 Xilinx, Inc. * Copyright(c) 2019 Solarflare Communications Inc. * * This software was jointly developed between OKTET Labs (under contract * for Solarflare) and Solarflare Communications, Inc. */ #include #include #include #include #include #include "efx.h" #include "sfc.h" #include "sfc_flow_tunnel.h" #include "sfc_mae_counter.h" #include "sfc_mae_ct.h" #include "sfc_log.h" #include "sfc_switch.h" #include "sfc_service.h" static int sfc_mae_assign_ethdev_mport(struct sfc_adapter *sa, efx_mport_sel_t *mportp) { const efx_nic_cfg_t *encp = efx_nic_cfg_get(sa->nic); return efx_mae_mport_by_pcie_function(encp->enc_pf, encp->enc_vf, mportp); } static int sfc_mae_assign_entity_mport(struct sfc_adapter *sa, efx_mport_sel_t *mportp) { const efx_nic_cfg_t *encp = efx_nic_cfg_get(sa->nic); int rc = 0; if (encp->enc_mae_admin) { /* * This ethdev sits on MAE admin PF. The represented * entity is the network port assigned to that PF. */ rc = efx_mae_mport_by_phy_port(encp->enc_assigned_port, mportp); } else { /* * This ethdev sits on unprivileged PF / VF. The entity * represented by the ethdev can change dynamically * as MAE admin changes default traffic rules. * * For the sake of simplicity, do not fill in the m-port * and assume that flow rules should not be allowed to * reference the entity represented by this ethdev. */ efx_mae_mport_invalid(mportp); } return rc; } static int sfc_mae_counter_registry_init(struct sfc_mae_counter_registry *registry, uint32_t nb_action_counters_max, uint32_t nb_conntrack_counters_max) { int ret; ret = sfc_mae_counters_init(®istry->action_counters, nb_action_counters_max); if (ret != 0) return ret; registry->action_counters.type = EFX_COUNTER_TYPE_ACTION; ret = sfc_mae_counters_init(®istry->conntrack_counters, nb_conntrack_counters_max); if (ret != 0) return ret; registry->conntrack_counters.type = EFX_COUNTER_TYPE_CONNTRACK; return 0; } static void sfc_mae_counter_registry_fini(struct sfc_mae_counter_registry *registry) { sfc_mae_counters_fini(®istry->conntrack_counters); sfc_mae_counters_fini(®istry->action_counters); } struct rte_flow * sfc_mae_repr_flow_create(struct sfc_adapter *sa, int prio, uint16_t port_id, enum rte_flow_action_type dst_type, enum rte_flow_item_type src_type) { const struct rte_flow_item_ethdev item_spec = { .port_id = port_id }; const struct rte_flow_action_ethdev action = { .port_id = port_id }; const void *item_mask = &rte_flow_item_ethdev_mask; struct rte_flow_attr attr = { .transfer = 1 }; const struct rte_flow_action actions[] = { { .type = dst_type, .conf = &action }, { .type = RTE_FLOW_ACTION_TYPE_END } }; const struct rte_flow_item items[] = { { .type = src_type, .mask = item_mask, .spec = &item_spec }, { .type = RTE_FLOW_ITEM_TYPE_END } }; struct sfc_mae *mae = &sa->mae; struct rte_flow_error error; if (prio > 0 && (unsigned int)prio >= mae->nb_action_rule_prios_max) { sfc_err(sa, "failed: invalid priority %d (max %u)", prio, mae->nb_action_rule_prios_max); return NULL; } if (prio < 0) prio = mae->nb_action_rule_prios_max - 1; attr.priority = prio; return sfc_flow_create_locked(sa, true, &attr, items, actions, &error); } void sfc_mae_repr_flow_destroy(struct sfc_adapter *sa, struct rte_flow *flow) { struct rte_flow_error error; int rc; rc = sfc_flow_destroy_locked(sa, flow, &error); if (rc != 0) sfc_err(sa, "failed to destroy the internal flow"); } int sfc_mae_attach(struct sfc_adapter *sa) { struct sfc_adapter_shared * const sas = sfc_sa2shared(sa); struct sfc_mae_switch_port_request switch_port_request = {0}; const efx_nic_cfg_t *encp = efx_nic_cfg_get(sa->nic); efx_mport_sel_t ethdev_mport; efx_mport_sel_t entity_mport; struct sfc_mae *mae = &sa->mae; struct sfc_mae_bounce_eh *bounce_eh = &mae->bounce_eh; efx_mae_limits_t limits; int rc; sfc_log_init(sa, "entry"); if (!encp->enc_mae_supported) { mae->status = SFC_MAE_STATUS_UNSUPPORTED; return 0; } if (encp->enc_mae_admin) { sfc_log_init(sa, "init MAE"); rc = efx_mae_init(sa->nic); if (rc != 0) goto fail_mae_init; sfc_log_init(sa, "get MAE limits"); rc = efx_mae_get_limits(sa->nic, &limits); if (rc != 0) goto fail_mae_get_limits; sfc_log_init(sa, "init MAE counter record registry"); rc = sfc_mae_counter_registry_init(&mae->counter_registry, limits.eml_max_n_action_counters, limits.eml_max_n_conntrack_counters); if (rc != 0) { sfc_err(sa, "failed to init record registry for %u AR and %u CT counters: %s", limits.eml_max_n_action_counters, limits.eml_max_n_conntrack_counters, rte_strerror(rc)); goto fail_counter_registry_init; } } sfc_log_init(sa, "assign ethdev MPORT"); rc = sfc_mae_assign_ethdev_mport(sa, ðdev_mport); if (rc != 0) goto fail_mae_assign_ethdev_mport; sfc_log_init(sa, "assign entity MPORT"); rc = sfc_mae_assign_entity_mport(sa, &entity_mport); if (rc != 0) goto fail_mae_assign_entity_mport; sfc_log_init(sa, "assign RTE switch domain"); rc = sfc_mae_assign_switch_domain(sa, &mae->switch_domain_id); if (rc != 0) goto fail_mae_assign_switch_domain; sfc_log_init(sa, "assign RTE switch port"); switch_port_request.type = SFC_MAE_SWITCH_PORT_INDEPENDENT; switch_port_request.ethdev_mportp = ðdev_mport; switch_port_request.entity_mportp = &entity_mport; switch_port_request.ethdev_port_id = sas->port_id; switch_port_request.port_data.indep.mae_admin = encp->enc_mae_admin == B_TRUE; rc = sfc_mae_assign_switch_port(mae->switch_domain_id, &switch_port_request, &mae->switch_port_id); if (rc != 0) goto fail_mae_assign_switch_port; if (encp->enc_mae_admin) { sfc_log_init(sa, "allocate encap. header bounce buffer"); bounce_eh->buf_size = limits.eml_encap_header_size_limit; bounce_eh->buf = rte_malloc("sfc_mae_bounce_eh", bounce_eh->buf_size, 0); if (bounce_eh->buf == NULL) { rc = ENOMEM; goto fail_mae_alloc_bounce_eh; } sfc_log_init(sa, "allocate bounce action set pointer array"); mae->bounce_aset_ptrs = rte_calloc("sfc_mae_bounce_aset_ptrs", EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES, sizeof(*mae->bounce_aset_ptrs), 0); if (mae->bounce_aset_ptrs == NULL) { rc = ENOMEM; goto fail_mae_alloc_bounce_aset_ptrs; } sfc_log_init(sa, "allocate bounce action set contexts"); mae->bounce_aset_ctxs = rte_calloc("sfc_mae_bounce_aset_ctxs", EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES, sizeof(*mae->bounce_aset_ctxs), 0); if (mae->bounce_aset_ctxs == NULL) { rc = ENOMEM; goto fail_mae_alloc_bounce_aset_ctxs; } sfc_log_init(sa, "allocate bounce action set ID array"); mae->bounce_aset_ids = rte_calloc("sfc_mae_bounce_aset_ids", EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES, sizeof(*mae->bounce_aset_ids), 0); if (mae->bounce_aset_ids == NULL) { rc = ENOMEM; goto fail_mae_alloc_bounce_aset_ids; } mae->nb_outer_rule_prios_max = limits.eml_max_n_outer_prios; mae->nb_action_rule_prios_max = limits.eml_max_n_action_prios; mae->encap_types_supported = limits.eml_encap_types_supported; } TAILQ_INIT(&mae->outer_rules); TAILQ_INIT(&mae->mac_addrs); TAILQ_INIT(&mae->encap_headers); TAILQ_INIT(&mae->counters); TAILQ_INIT(&mae->action_sets); TAILQ_INIT(&mae->action_set_lists); TAILQ_INIT(&mae->action_rules); if (encp->enc_mae_admin) mae->status = SFC_MAE_STATUS_ADMIN; else mae->status = SFC_MAE_STATUS_SUPPORTED; sfc_log_init(sa, "done"); return 0; fail_mae_alloc_bounce_aset_ids: rte_free(mae->bounce_aset_ctxs); fail_mae_alloc_bounce_aset_ctxs: rte_free(mae->bounce_aset_ptrs); fail_mae_alloc_bounce_aset_ptrs: rte_free(mae->bounce_eh.buf); fail_mae_alloc_bounce_eh: fail_mae_assign_switch_port: fail_mae_assign_switch_domain: fail_mae_assign_entity_mport: fail_mae_assign_ethdev_mport: if (encp->enc_mae_admin) sfc_mae_counter_registry_fini(&mae->counter_registry); fail_counter_registry_init: fail_mae_get_limits: if (encp->enc_mae_admin) efx_mae_fini(sa->nic); fail_mae_init: sfc_log_init(sa, "failed %d", rc); return rc; } void sfc_mae_detach(struct sfc_adapter *sa) { struct sfc_mae *mae = &sa->mae; enum sfc_mae_status status_prev = mae->status; sfc_log_init(sa, "entry"); mae->nb_action_rule_prios_max = 0; mae->status = SFC_MAE_STATUS_UNKNOWN; if (status_prev != SFC_MAE_STATUS_ADMIN) return; rte_free(mae->bounce_aset_ids); rte_free(mae->bounce_aset_ctxs); rte_free(mae->bounce_aset_ptrs); rte_free(mae->bounce_eh.buf); sfc_mae_counter_registry_fini(&mae->counter_registry); efx_mae_fini(sa->nic); sfc_log_init(sa, "done"); } static struct sfc_mae_outer_rule * sfc_mae_outer_rule_attach(struct sfc_adapter *sa, const efx_mae_match_spec_t *match_spec, efx_tunnel_protocol_t encap_type) { struct sfc_mae_outer_rule *rule; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); TAILQ_FOREACH(rule, &mae->outer_rules, entries) { if (efx_mae_match_specs_equal(rule->match_spec, match_spec) && rule->encap_type == encap_type) { sfc_dbg(sa, "attaching to outer_rule=%p", rule); ++(rule->refcnt); return rule; } } return NULL; } static int sfc_mae_outer_rule_add(struct sfc_adapter *sa, efx_mae_match_spec_t *match_spec, efx_tunnel_protocol_t encap_type, struct sfc_mae_outer_rule **rulep) { struct sfc_mae_outer_rule *rule; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); rule = rte_zmalloc("sfc_mae_outer_rule", sizeof(*rule), 0); if (rule == NULL) return ENOMEM; rule->refcnt = 1; rule->match_spec = match_spec; rule->encap_type = encap_type; rule->fw_rsrc.rule_id.id = EFX_MAE_RSRC_ID_INVALID; TAILQ_INSERT_TAIL(&mae->outer_rules, rule, entries); *rulep = rule; sfc_dbg(sa, "added outer_rule=%p", rule); return 0; } static void sfc_mae_outer_rule_del(struct sfc_adapter *sa, struct sfc_mae_outer_rule *rule) { struct sfc_mae *mae = &sa->mae; if (rule == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(rule->refcnt != 0); --(rule->refcnt); if (rule->refcnt != 0) return; if (rule->fw_rsrc.rule_id.id != EFX_MAE_RSRC_ID_INVALID || rule->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting outer_rule=%p abandons its FW resource: OR_ID=0x%08x, refcnt=%u", rule, rule->fw_rsrc.rule_id.id, rule->fw_rsrc.refcnt); } efx_mae_match_spec_fini(sa->nic, rule->match_spec); TAILQ_REMOVE(&mae->outer_rules, rule, entries); sfc_dbg(sa, "deleted outer_rule=%p", rule); rte_free(rule); } static int sfc_mae_outer_rule_enable(struct sfc_adapter *sa, struct sfc_mae_outer_rule *rule, efx_mae_match_spec_t *match_spec_action) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (rule == NULL) return 0; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &rule->fw_rsrc; if (fw_rsrc->refcnt == 0) { SFC_ASSERT(fw_rsrc->rule_id.id == EFX_MAE_RSRC_ID_INVALID); SFC_ASSERT(rule->match_spec != NULL); rc = efx_mae_outer_rule_insert(sa->nic, rule->match_spec, rule->encap_type, &fw_rsrc->rule_id); if (rc != 0) { sfc_err(sa, "failed to enable outer_rule=%p: %s", rule, strerror(rc)); return rc; } } if (match_spec_action == NULL) goto skip_action_rule; rc = efx_mae_match_spec_outer_rule_id_set(match_spec_action, &fw_rsrc->rule_id); if (rc != 0) { if (fw_rsrc->refcnt == 0) { (void)efx_mae_outer_rule_remove(sa->nic, &fw_rsrc->rule_id); fw_rsrc->rule_id.id = EFX_MAE_RSRC_ID_INVALID; } sfc_err(sa, "can't match on outer rule ID: %s", strerror(rc)); return rc; } skip_action_rule: if (fw_rsrc->refcnt == 0) { sfc_dbg(sa, "enabled outer_rule=%p: OR_ID=0x%08x", rule, fw_rsrc->rule_id.id); } ++(fw_rsrc->refcnt); return 0; } static void sfc_mae_outer_rule_disable(struct sfc_adapter *sa, struct sfc_mae_outer_rule *rule, efx_mae_match_spec_t *match_spec_action) { efx_mae_rule_id_t invalid_rule_id = { .id = EFX_MAE_RSRC_ID_INVALID }; struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (rule == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &rule->fw_rsrc; if (match_spec_action == NULL) goto skip_action_rule; rc = efx_mae_match_spec_outer_rule_id_set(match_spec_action, &invalid_rule_id); if (rc != 0) { sfc_err(sa, "cannot restore match on invalid outer rule ID: %s", strerror(rc)); return; } skip_action_rule: if (fw_rsrc->rule_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable outer_rule=%p: already disabled; OR_ID=0x%08x, refcnt=%u", rule, fw_rsrc->rule_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { rc = efx_mae_outer_rule_remove(sa->nic, &fw_rsrc->rule_id); if (rc == 0) { sfc_dbg(sa, "disabled outer_rule=%p with OR_ID=0x%08x", rule, fw_rsrc->rule_id.id); } else { sfc_err(sa, "failed to disable outer_rule=%p with OR_ID=0x%08x: %s", rule, fw_rsrc->rule_id.id, strerror(rc)); } fw_rsrc->rule_id.id = EFX_MAE_RSRC_ID_INVALID; } --(fw_rsrc->refcnt); } static struct sfc_mae_mac_addr * sfc_mae_mac_addr_attach(struct sfc_adapter *sa, const uint8_t addr_bytes[EFX_MAC_ADDR_LEN]) { struct sfc_mae_mac_addr *mac_addr; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); TAILQ_FOREACH(mac_addr, &mae->mac_addrs, entries) { if (memcmp(mac_addr->addr_bytes, addr_bytes, EFX_MAC_ADDR_LEN) == 0) { sfc_dbg(sa, "attaching to mac_addr=%p", mac_addr); ++(mac_addr->refcnt); return mac_addr; } } return NULL; } static int sfc_mae_mac_addr_add(struct sfc_adapter *sa, const uint8_t addr_bytes[EFX_MAC_ADDR_LEN], struct sfc_mae_mac_addr **mac_addrp) { struct sfc_mae_mac_addr *mac_addr; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); mac_addr = rte_zmalloc("sfc_mae_mac_addr", sizeof(*mac_addr), 0); if (mac_addr == NULL) return ENOMEM; rte_memcpy(mac_addr->addr_bytes, addr_bytes, EFX_MAC_ADDR_LEN); mac_addr->refcnt = 1; mac_addr->fw_rsrc.mac_id.id = EFX_MAE_RSRC_ID_INVALID; TAILQ_INSERT_TAIL(&mae->mac_addrs, mac_addr, entries); *mac_addrp = mac_addr; sfc_dbg(sa, "added mac_addr=%p", mac_addr); return 0; } static void sfc_mae_mac_addr_del(struct sfc_adapter *sa, struct sfc_mae_mac_addr *mac_addr) { struct sfc_mae *mae = &sa->mae; if (mac_addr == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(mac_addr->refcnt != 0); --(mac_addr->refcnt); if (mac_addr->refcnt != 0) return; if (mac_addr->fw_rsrc.mac_id.id != EFX_MAE_RSRC_ID_INVALID || mac_addr->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting mac_addr=%p abandons its FW resource: MAC_ID=0x%08x, refcnt=%u", mac_addr, mac_addr->fw_rsrc.mac_id.id, mac_addr->fw_rsrc.refcnt); } TAILQ_REMOVE(&mae->mac_addrs, mac_addr, entries); sfc_dbg(sa, "deleted mac_addr=%p", mac_addr); rte_free(mac_addr); } enum sfc_mae_mac_addr_type { SFC_MAE_MAC_ADDR_DST, SFC_MAE_MAC_ADDR_SRC }; static int sfc_mae_mac_addr_enable(struct sfc_adapter *sa, struct sfc_mae_mac_addr *mac_addr, enum sfc_mae_mac_addr_type type, efx_mae_actions_t *aset_spec) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc = 0; if (mac_addr == NULL) return 0; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &mac_addr->fw_rsrc; if (fw_rsrc->refcnt == 0) { SFC_ASSERT(fw_rsrc->mac_id.id == EFX_MAE_RSRC_ID_INVALID); rc = efx_mae_mac_addr_alloc(sa->nic, mac_addr->addr_bytes, &fw_rsrc->mac_id); if (rc != 0) { sfc_err(sa, "failed to enable mac_addr=%p: %s", mac_addr, strerror(rc)); return rc; } } switch (type) { case SFC_MAE_MAC_ADDR_DST: rc = efx_mae_action_set_fill_in_dst_mac_id(aset_spec, &fw_rsrc->mac_id); break; case SFC_MAE_MAC_ADDR_SRC: rc = efx_mae_action_set_fill_in_src_mac_id(aset_spec, &fw_rsrc->mac_id); break; default: rc = EINVAL; break; } if (rc != 0) { if (fw_rsrc->refcnt == 0) { (void)efx_mae_mac_addr_free(sa->nic, &fw_rsrc->mac_id); fw_rsrc->mac_id.id = EFX_MAE_RSRC_ID_INVALID; } sfc_err(sa, "cannot fill in MAC address entry ID: %s", strerror(rc)); return rc; } if (fw_rsrc->refcnt == 0) { sfc_dbg(sa, "enabled mac_addr=%p: MAC_ID=0x%08x", mac_addr, fw_rsrc->mac_id.id); } ++(fw_rsrc->refcnt); return 0; } static void sfc_mae_mac_addr_disable(struct sfc_adapter *sa, struct sfc_mae_mac_addr *mac_addr) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (mac_addr == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &mac_addr->fw_rsrc; if (fw_rsrc->mac_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable mac_addr=%p: already disabled; MAC_ID=0x%08x, refcnt=%u", mac_addr, fw_rsrc->mac_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { rc = efx_mae_mac_addr_free(sa->nic, &fw_rsrc->mac_id); if (rc == 0) { sfc_dbg(sa, "disabled mac_addr=%p with MAC_ID=0x%08x", mac_addr, fw_rsrc->mac_id.id); } else { sfc_err(sa, "failed to disable mac_addr=%p with MAC_ID=0x%08x: %s", mac_addr, fw_rsrc->mac_id.id, strerror(rc)); } fw_rsrc->mac_id.id = EFX_MAE_RSRC_ID_INVALID; } --(fw_rsrc->refcnt); } static struct sfc_mae_encap_header * sfc_mae_encap_header_attach(struct sfc_adapter *sa, const struct sfc_mae_bounce_eh *bounce_eh) { struct sfc_mae_encap_header *encap_header; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); TAILQ_FOREACH(encap_header, &mae->encap_headers, entries) { if (encap_header->indirect) continue; if (encap_header->size == bounce_eh->size && memcmp(encap_header->buf, bounce_eh->buf, bounce_eh->size) == 0) { sfc_dbg(sa, "attaching to encap_header=%p", encap_header); ++(encap_header->refcnt); return encap_header; } } return NULL; } static int sfc_mae_encap_header_add(struct sfc_adapter *sa, const struct sfc_mae_bounce_eh *bounce_eh, struct sfc_mae_encap_header **encap_headerp) { struct sfc_mae_encap_header *encap_header; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); encap_header = rte_zmalloc("sfc_mae_encap_header", sizeof(*encap_header), 0); if (encap_header == NULL) return ENOMEM; encap_header->size = bounce_eh->size; encap_header->buf = rte_malloc("sfc_mae_encap_header_buf", encap_header->size, 0); if (encap_header->buf == NULL) { rte_free(encap_header); return ENOMEM; } rte_memcpy(encap_header->buf, bounce_eh->buf, bounce_eh->size); encap_header->refcnt = 1; encap_header->type = bounce_eh->type; encap_header->fw_rsrc.eh_id.id = EFX_MAE_RSRC_ID_INVALID; TAILQ_INSERT_TAIL(&mae->encap_headers, encap_header, entries); *encap_headerp = encap_header; sfc_dbg(sa, "added encap_header=%p", encap_header); return 0; } static void sfc_mae_encap_header_del(struct sfc_adapter *sa, struct sfc_mae_encap_header *encap_header) { struct sfc_mae *mae = &sa->mae; if (encap_header == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(encap_header->refcnt != 0); --(encap_header->refcnt); if (encap_header->refcnt != 0) return; if (encap_header->fw_rsrc.eh_id.id != EFX_MAE_RSRC_ID_INVALID || encap_header->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting encap_header=%p abandons its FW resource: EH_ID=0x%08x, refcnt=%u", encap_header, encap_header->fw_rsrc.eh_id.id, encap_header->fw_rsrc.refcnt); } TAILQ_REMOVE(&mae->encap_headers, encap_header, entries); sfc_dbg(sa, "deleted encap_header=%p", encap_header); rte_free(encap_header->buf); rte_free(encap_header); } static int sfc_mae_encap_header_update(struct sfc_adapter *sa, struct sfc_mae_encap_header *encap_header) { const struct sfc_mae_bounce_eh *bounce_eh = &sa->mae.bounce_eh; struct sfc_mae_fw_rsrc *fw_rsrc; uint8_t *buf; int ret; if (bounce_eh->type != encap_header->type || bounce_eh->size == 0) return EINVAL; buf = rte_malloc("sfc_mae_encap_header_buf", bounce_eh->size, 0); if (buf == NULL) return ENOMEM; rte_memcpy(buf, bounce_eh->buf, bounce_eh->size); fw_rsrc = &encap_header->fw_rsrc; if (fw_rsrc->refcnt > 0) { SFC_ASSERT(fw_rsrc->eh_id.id != EFX_MAE_RSRC_ID_INVALID); ret = efx_mae_encap_header_update(sa->nic, &fw_rsrc->eh_id, encap_header->type, buf, bounce_eh->size); if (ret != 0) { sfc_err(sa, "failed to update encap_header=%p: %s", encap_header, strerror(ret)); rte_free(buf); return ret; } } encap_header->size = bounce_eh->size; rte_free(encap_header->buf); encap_header->buf = buf; sfc_dbg(sa, "updated encap_header=%p", encap_header); return 0; } static int sfc_mae_encap_header_enable(struct sfc_adapter *sa, struct sfc_mae_encap_header *encap_header, efx_mae_actions_t *action_set_spec) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (encap_header == NULL) return 0; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &encap_header->fw_rsrc; if (fw_rsrc->refcnt == 0) { SFC_ASSERT(fw_rsrc->eh_id.id == EFX_MAE_RSRC_ID_INVALID); SFC_ASSERT(encap_header->buf != NULL); SFC_ASSERT(encap_header->size != 0); rc = efx_mae_encap_header_alloc(sa->nic, encap_header->type, encap_header->buf, encap_header->size, &fw_rsrc->eh_id); if (rc != 0) { sfc_err(sa, "failed to enable encap_header=%p: %s", encap_header, strerror(rc)); return rc; } } rc = efx_mae_action_set_fill_in_eh_id(action_set_spec, &fw_rsrc->eh_id); if (rc != 0) { if (fw_rsrc->refcnt == 0) { (void)efx_mae_encap_header_free(sa->nic, &fw_rsrc->eh_id); fw_rsrc->eh_id.id = EFX_MAE_RSRC_ID_INVALID; } sfc_err(sa, "can't fill in encap. header ID: %s", strerror(rc)); return rc; } if (fw_rsrc->refcnt == 0) { sfc_dbg(sa, "enabled encap_header=%p: EH_ID=0x%08x", encap_header, fw_rsrc->eh_id.id); } ++(fw_rsrc->refcnt); return 0; } static void sfc_mae_encap_header_disable(struct sfc_adapter *sa, struct sfc_mae_encap_header *encap_header) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (encap_header == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &encap_header->fw_rsrc; if (fw_rsrc->eh_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable encap_header=%p: already disabled; EH_ID=0x%08x, refcnt=%u", encap_header, fw_rsrc->eh_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { rc = efx_mae_encap_header_free(sa->nic, &fw_rsrc->eh_id); if (rc == 0) { sfc_dbg(sa, "disabled encap_header=%p with EH_ID=0x%08x", encap_header, fw_rsrc->eh_id.id); } else { sfc_err(sa, "failed to disable encap_header=%p with EH_ID=0x%08x: %s", encap_header, fw_rsrc->eh_id.id, strerror(rc)); } fw_rsrc->eh_id.id = EFX_MAE_RSRC_ID_INVALID; } --(fw_rsrc->refcnt); } static int sfc_mae_counter_add(struct sfc_adapter *sa, const struct sfc_mae_counter *counter_tmp, struct sfc_mae_counter **counterp) { struct sfc_mae_counter *counter; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); counter = rte_zmalloc("sfc_mae_counter", sizeof(*counter), 0); if (counter == NULL) return ENOMEM; if (counter_tmp != NULL) { counter->rte_id_valid = counter_tmp->rte_id_valid; counter->rte_id = counter_tmp->rte_id; counter->type = counter_tmp->type; } else { counter->type = EFX_COUNTER_TYPE_ACTION; } counter->fw_rsrc.counter_id.id = EFX_MAE_RSRC_ID_INVALID; counter->refcnt = 1; TAILQ_INSERT_TAIL(&mae->counters, counter, entries); *counterp = counter; sfc_dbg(sa, "added counter=%p", counter); return 0; } static void sfc_mae_counter_del(struct sfc_adapter *sa, struct sfc_mae_counter *counter) { struct sfc_mae *mae = &sa->mae; if (counter == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(counter->refcnt != 0); --(counter->refcnt); if (counter->refcnt != 0) return; if (counter->fw_rsrc.counter_id.id != EFX_MAE_RSRC_ID_INVALID || counter->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting counter=%p abandons its FW resource: COUNTER_ID=0x%x-#%u, refcnt=%u", counter, counter->type, counter->fw_rsrc.counter_id.id, counter->fw_rsrc.refcnt); } TAILQ_REMOVE(&mae->counters, counter, entries); sfc_dbg(sa, "deleted counter=%p", counter); rte_free(counter); } static int sfc_mae_counter_enable(struct sfc_adapter *sa, struct sfc_mae_counter *counter, efx_mae_actions_t *action_set_spec) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (counter == NULL) return 0; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &counter->fw_rsrc; if (fw_rsrc->refcnt == 0) { SFC_ASSERT(fw_rsrc->counter_id.id == EFX_MAE_RSRC_ID_INVALID); rc = sfc_mae_counter_fw_rsrc_enable(sa, counter); if (rc != 0) { sfc_err(sa, "failed to enable counter=%p: %s", counter, rte_strerror(rc)); return rc; } } if (action_set_spec != NULL) { rc = efx_mae_action_set_fill_in_counter_id( action_set_spec, &fw_rsrc->counter_id); if (rc != 0) { if (fw_rsrc->refcnt == 0) { (void)sfc_mae_counter_fw_rsrc_disable(sa, counter); fw_rsrc->counter_id.id = EFX_MAE_RSRC_ID_INVALID; } sfc_err(sa, "cannot fill in counter ID: %s", strerror(rc)); return rc; } } if (fw_rsrc->refcnt == 0) { sfc_dbg(sa, "enabled counter=%p: COUNTER_ID=0x%x-#%u", counter, counter->type, fw_rsrc->counter_id.id); } ++(fw_rsrc->refcnt); return 0; } static void sfc_mae_counter_disable(struct sfc_adapter *sa, struct sfc_mae_counter *counter) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (counter == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &counter->fw_rsrc; if (fw_rsrc->counter_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable counter=%p: already disabled; COUNTER_ID=0x%x-#%u, refcnt=%u", counter, counter->type, fw_rsrc->counter_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { uint32_t counter_id = fw_rsrc->counter_id.id; rc = sfc_mae_counter_fw_rsrc_disable(sa, counter); if (rc == 0) { sfc_dbg(sa, "disabled counter=%p with COUNTER_ID=0x%x-#%u", counter, counter->type, counter_id); } else { sfc_err(sa, "failed to disable counter=%p with COUNTER_ID=0x%x-#%u: %s", counter, counter->type, counter_id, strerror(rc)); } fw_rsrc->counter_id.id = EFX_MAE_RSRC_ID_INVALID; } --(fw_rsrc->refcnt); } static struct sfc_mae_action_set * sfc_mae_action_set_attach(struct sfc_adapter *sa, const struct sfc_mae_aset_ctx *ctx) { struct sfc_mae_action_set *action_set; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); TAILQ_FOREACH(action_set, &mae->action_sets, entries) { if (action_set->encap_header == ctx->encap_header && action_set->dst_mac_addr == ctx->dst_mac && action_set->src_mac_addr == ctx->src_mac && action_set->counter == ctx->counter && efx_mae_action_set_specs_equal(action_set->spec, ctx->spec)) { sfc_dbg(sa, "attaching to action_set=%p", action_set); ++(action_set->refcnt); return action_set; } } return NULL; } static int sfc_mae_action_set_add(struct sfc_adapter *sa, const struct sfc_mae_aset_ctx *ctx, struct sfc_mae_action_set **action_setp) { struct sfc_mae_action_set *action_set; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); action_set = rte_zmalloc("sfc_mae_action_set", sizeof(*action_set), 0); if (action_set == NULL) { sfc_err(sa, "failed to alloc action set"); return ENOMEM; } action_set->refcnt = 1; action_set->spec = ctx->spec; action_set->encap_header = ctx->encap_header; action_set->dst_mac_addr = ctx->dst_mac; action_set->src_mac_addr = ctx->src_mac; action_set->counter = ctx->counter; action_set->fw_rsrc.aset_id.id = EFX_MAE_RSRC_ID_INVALID; TAILQ_INSERT_TAIL(&mae->action_sets, action_set, entries); *action_setp = action_set; sfc_dbg(sa, "added action_set=%p", action_set); return 0; } static void sfc_mae_action_set_del(struct sfc_adapter *sa, struct sfc_mae_action_set *action_set) { struct sfc_mae *mae = &sa->mae; if (action_set == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(action_set->refcnt != 0); --(action_set->refcnt); if (action_set->refcnt != 0) return; if (action_set->fw_rsrc.aset_id.id != EFX_MAE_RSRC_ID_INVALID || action_set->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting action_set=%p abandons its FW resource: AS_ID=0x%08x, refcnt=%u", action_set, action_set->fw_rsrc.aset_id.id, action_set->fw_rsrc.refcnt); } efx_mae_action_set_spec_fini(sa->nic, action_set->spec); sfc_mae_encap_header_del(sa, action_set->encap_header); sfc_mae_mac_addr_del(sa, action_set->dst_mac_addr); sfc_mae_mac_addr_del(sa, action_set->src_mac_addr); sfc_mae_counter_del(sa, action_set->counter); TAILQ_REMOVE(&mae->action_sets, action_set, entries); sfc_dbg(sa, "deleted action_set=%p", action_set); rte_free(action_set); } static int sfc_mae_action_set_enable(struct sfc_adapter *sa, struct sfc_mae_action_set *action_set) { struct sfc_mae_encap_header *encap_header; struct sfc_mae_mac_addr *dst_mac_addr; struct sfc_mae_mac_addr *src_mac_addr; struct sfc_mae_counter *counter; struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (action_set == NULL) return 0; SFC_ASSERT(sfc_adapter_is_locked(sa)); encap_header = action_set->encap_header; dst_mac_addr = action_set->dst_mac_addr; src_mac_addr = action_set->src_mac_addr; fw_rsrc = &action_set->fw_rsrc; counter = action_set->counter; if (fw_rsrc->refcnt == 0) { SFC_ASSERT(fw_rsrc->aset_id.id == EFX_MAE_RSRC_ID_INVALID); SFC_ASSERT(action_set->spec != NULL); rc = sfc_mae_mac_addr_enable(sa, dst_mac_addr, SFC_MAE_MAC_ADDR_DST, action_set->spec); if (rc != 0) return rc; rc = sfc_mae_mac_addr_enable(sa, src_mac_addr, SFC_MAE_MAC_ADDR_SRC, action_set->spec); if (rc != 0) { sfc_mae_mac_addr_disable(sa, dst_mac_addr); return rc; } rc = sfc_mae_encap_header_enable(sa, encap_header, action_set->spec); if (rc != 0) { sfc_mae_mac_addr_disable(sa, src_mac_addr); sfc_mae_mac_addr_disable(sa, dst_mac_addr); return rc; } if (counter != NULL) { rc = sfc_mae_counter_start(sa); if (rc != 0) { sfc_err(sa, "failed to start MAE counters support: %s", rte_strerror(rc)); sfc_mae_encap_header_disable(sa, encap_header); sfc_mae_mac_addr_disable(sa, src_mac_addr); sfc_mae_mac_addr_disable(sa, dst_mac_addr); return rc; } } rc = sfc_mae_counter_enable(sa, counter, action_set->spec); if (rc != 0) { sfc_mae_encap_header_disable(sa, encap_header); sfc_mae_mac_addr_disable(sa, src_mac_addr); sfc_mae_mac_addr_disable(sa, dst_mac_addr); return rc; } rc = efx_mae_action_set_alloc(sa->nic, action_set->spec, &fw_rsrc->aset_id); if (rc != 0) { sfc_err(sa, "failed to enable action_set=%p: %s", action_set, strerror(rc)); sfc_mae_encap_header_disable(sa, encap_header); sfc_mae_mac_addr_disable(sa, src_mac_addr); sfc_mae_mac_addr_disable(sa, dst_mac_addr); sfc_mae_counter_disable(sa, counter); return rc; } sfc_dbg(sa, "enabled action_set=%p: AS_ID=0x%08x", action_set, fw_rsrc->aset_id.id); } ++(fw_rsrc->refcnt); return 0; } static void sfc_mae_action_set_disable(struct sfc_adapter *sa, struct sfc_mae_action_set *action_set) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (action_set == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &action_set->fw_rsrc; if (fw_rsrc->aset_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable action_set=%p: already disabled; AS_ID=0x%08x, refcnt=%u", action_set, fw_rsrc->aset_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { efx_mae_action_set_clear_fw_rsrc_ids(action_set->spec); rc = efx_mae_action_set_free(sa->nic, &fw_rsrc->aset_id); if (rc == 0) { sfc_dbg(sa, "disabled action_set=%p with AS_ID=0x%08x", action_set, fw_rsrc->aset_id.id); } else { sfc_err(sa, "failed to disable action_set=%p with AS_ID=0x%08x: %s", action_set, fw_rsrc->aset_id.id, strerror(rc)); } fw_rsrc->aset_id.id = EFX_MAE_RSRC_ID_INVALID; sfc_mae_encap_header_disable(sa, action_set->encap_header); sfc_mae_mac_addr_disable(sa, action_set->src_mac_addr); sfc_mae_mac_addr_disable(sa, action_set->dst_mac_addr); sfc_mae_counter_disable(sa, action_set->counter); } --(fw_rsrc->refcnt); } static struct sfc_mae_action_set_list * sfc_mae_action_set_list_attach(struct sfc_adapter *sa) { struct sfc_mae_action_set_list *action_set_list; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); TAILQ_FOREACH(action_set_list, &mae->action_set_lists, entries) { if (action_set_list->nb_action_sets != mae->nb_bounce_asets) continue; if (memcmp(action_set_list->action_sets, mae->bounce_aset_ptrs, sizeof(struct sfc_mae_action_set *) * mae->nb_bounce_asets) == 0) { sfc_dbg(sa, "attaching to action_set_list=%p", action_set_list); ++(action_set_list->refcnt); return action_set_list; } } return NULL; } static int sfc_mae_action_set_list_add(struct sfc_adapter *sa, struct sfc_mae_action_set_list **action_set_listp) { struct sfc_mae_action_set_list *action_set_list; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); action_set_list = rte_zmalloc("sfc_mae_action_set_list", sizeof(*action_set_list), 0); if (action_set_list == NULL) { sfc_err(sa, "failed to allocate action set list"); return ENOMEM; } action_set_list->refcnt = 1; action_set_list->nb_action_sets = mae->nb_bounce_asets; action_set_list->fw_rsrc.aset_list_id.id = EFX_MAE_RSRC_ID_INVALID; action_set_list->action_sets = rte_calloc("sfc_mae_action_set_list_action_sets", action_set_list->nb_action_sets, sizeof(struct sfc_mae_action_set *), 0); if (action_set_list->action_sets == NULL) { sfc_err(sa, "failed to allocate action set list"); rte_free(action_set_list); return ENOMEM; } rte_memcpy(action_set_list->action_sets, mae->bounce_aset_ptrs, sizeof(struct sfc_mae_action_set *) * action_set_list->nb_action_sets); TAILQ_INSERT_TAIL(&mae->action_set_lists, action_set_list, entries); *action_set_listp = action_set_list; sfc_dbg(sa, "added action_set_list=%p", action_set_list); return 0; } static void sfc_mae_action_set_list_del(struct sfc_adapter *sa, struct sfc_mae_action_set_list *action_set_list) { struct sfc_mae *mae = &sa->mae; unsigned int i; if (action_set_list == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(action_set_list->refcnt != 0); --(action_set_list->refcnt); if (action_set_list->refcnt != 0) return; if (action_set_list->fw_rsrc.aset_list_id.id != EFX_MAE_RSRC_ID_INVALID || action_set_list->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting action_set_list=%p abandons its FW resource: ASL_ID=0x%08x, refcnt=%u", action_set_list, action_set_list->fw_rsrc.aset_list_id.id, action_set_list->fw_rsrc.refcnt); } for (i = 0; i < action_set_list->nb_action_sets; ++i) sfc_mae_action_set_del(sa, action_set_list->action_sets[i]); TAILQ_REMOVE(&mae->action_set_lists, action_set_list, entries); sfc_dbg(sa, "deleted action_set_list=%p", action_set_list); rte_free(action_set_list->action_sets); rte_free(action_set_list); } static int sfc_mae_action_set_list_enable(struct sfc_adapter *sa, struct sfc_mae_action_set_list *action_set_list) { struct sfc_mae_fw_rsrc *fw_rsrc; unsigned int i; unsigned int j; int rc; if (action_set_list == NULL) return 0; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &action_set_list->fw_rsrc; if (fw_rsrc->refcnt == 0) { struct sfc_mae *mae = &sa->mae; SFC_ASSERT(fw_rsrc->aset_list_id.id == EFX_MAE_RSRC_ID_INVALID); for (i = 0; i < action_set_list->nb_action_sets; ++i) { const struct sfc_mae_fw_rsrc *as_fw_rsrc; rc = sfc_mae_action_set_enable(sa, action_set_list->action_sets[i]); if (rc != 0) goto fail_action_set_enable; as_fw_rsrc = &action_set_list->action_sets[i]->fw_rsrc; mae->bounce_aset_ids[i].id = as_fw_rsrc->aset_id.id; } rc = efx_mae_action_set_list_alloc(sa->nic, action_set_list->nb_action_sets, mae->bounce_aset_ids, &fw_rsrc->aset_list_id); if (rc != 0) { sfc_err(sa, "failed to enable action_set_list=%p: %s", action_set_list, strerror(rc)); goto fail_action_set_list_alloc; } sfc_dbg(sa, "enabled action_set_list=%p: ASL_ID=0x%08x", action_set_list, fw_rsrc->aset_list_id.id); } ++(fw_rsrc->refcnt); return 0; fail_action_set_list_alloc: fail_action_set_enable: for (j = 0; j < i; ++j) sfc_mae_action_set_disable(sa, action_set_list->action_sets[j]); return rc; } static void sfc_mae_action_set_list_disable(struct sfc_adapter *sa, struct sfc_mae_action_set_list *action_set_list) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; if (action_set_list == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &action_set_list->fw_rsrc; if (fw_rsrc->aset_list_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable action_set_list=%p: already disabled; ASL_ID=0x%08x, refcnt=%u", action_set_list, fw_rsrc->aset_list_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { unsigned int i; rc = efx_mae_action_set_list_free(sa->nic, &fw_rsrc->aset_list_id); if (rc == 0) { sfc_dbg(sa, "disabled action_set_list=%p with ASL_ID=0x%08x", action_set_list, fw_rsrc->aset_list_id.id); } else { sfc_err(sa, "failed to disable action_set_list=%p with ASL_ID=0x%08x: %s", action_set_list, fw_rsrc->aset_list_id.id, strerror(rc)); } fw_rsrc->aset_list_id.id = EFX_MAE_RSRC_ID_INVALID; for (i = 0; i < action_set_list->nb_action_sets; ++i) { sfc_mae_action_set_disable(sa, action_set_list->action_sets[i]); } } --(fw_rsrc->refcnt); } struct sfc_mae_action_rule_ctx { struct sfc_mae_outer_rule *outer_rule; /* * When action_set_list != NULL, action_set is NULL, and vice versa. */ struct sfc_mae_action_set *action_set; struct sfc_mae_action_set_list *action_set_list; efx_mae_match_spec_t *match_spec; uint32_t ct_mark; }; static int sfc_mae_action_rule_attach(struct sfc_adapter *sa, struct sfc_mae_action_rule_ctx *ctx, struct sfc_mae_action_rule **rulep, struct rte_flow_error *error) { uint32_t new_ct_mark = ctx->ct_mark; struct sfc_mae_action_rule *rule; int rc; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(ctx->ct_mark <= 1); /* * It is assumed that the caller of this helper has already properly * tailored ctx->match_spec to match on OR_ID / 0xffffffff (when * ctx->outer_rule refers to a currently active outer rule) or * on 0xffffffff / 0xffffffff, so that specs compare correctly. */ TAILQ_FOREACH(rule, &sa->mae.action_rules, entries) { if (rule->ct_mark == new_ct_mark) ++new_ct_mark; if (rule->outer_rule != ctx->outer_rule || rule->action_set != ctx->action_set || rule->action_set_list != ctx->action_set_list || !!rule->ct_mark != !!ctx->ct_mark) continue; if (ctx->ct_mark != 0) { rc = efx_mae_match_spec_ct_mark_set(ctx->match_spec, rule->ct_mark); if (rc != 0) { return rte_flow_error_set(error, EFAULT, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to set CT mark for comparison"); } } if (efx_mae_match_specs_equal(rule->match_spec, ctx->match_spec)) { sfc_dbg(sa, "attaching to action_rule=%p", rule); ++(rule->refcnt); *rulep = rule; return 0; } } if (ctx->ct_mark != 0) { if (new_ct_mark == UINT32_MAX) { return rte_flow_error_set(error, ERANGE, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to allocate CT mark"); } rc = efx_mae_match_spec_ct_mark_set(ctx->match_spec, new_ct_mark); if (rc != 0) { return rte_flow_error_set(error, EFAULT, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to set CT mark"); } ctx->ct_mark = new_ct_mark; } /* * No need to set RTE error, as this * code should be handled gracefully. */ return -ENOENT; } static int sfc_mae_action_rule_add(struct sfc_adapter *sa, const struct sfc_mae_action_rule_ctx *ctx, struct sfc_mae_action_rule **rulep) { struct sfc_mae_action_rule *rule; struct sfc_mae *mae = &sa->mae; SFC_ASSERT(sfc_adapter_is_locked(sa)); rule = rte_zmalloc("sfc_mae_action_rule", sizeof(*rule), 0); if (rule == NULL) return ENOMEM; rule->refcnt = 1; /* * It is assumed that the caller invoked sfc_mae_action_rule_attach() * and got (-ENOENT) before getting here. That ensures a unique CT * mark value or, if no CT is involved at all, simply zero. * * It is also assumed that match on the mark (if non-zero) * is already set in the action rule match specification. */ rule->ct_mark = ctx->ct_mark; rule->outer_rule = ctx->outer_rule; rule->action_set = ctx->action_set; rule->action_set_list = ctx->action_set_list; rule->match_spec = ctx->match_spec; rule->fw_rsrc.rule_id.id = EFX_MAE_RSRC_ID_INVALID; TAILQ_INSERT_TAIL(&mae->action_rules, rule, entries); *rulep = rule; sfc_dbg(sa, "added action_rule=%p", rule); return 0; } static void sfc_mae_action_rule_del(struct sfc_adapter *sa, struct sfc_mae_action_rule *rule) { struct sfc_mae *mae = &sa->mae; if (rule == NULL) return; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(rule->refcnt != 0); --(rule->refcnt); if (rule->refcnt != 0) return; if (rule->fw_rsrc.rule_id.id != EFX_MAE_RSRC_ID_INVALID || rule->fw_rsrc.refcnt != 0) { sfc_err(sa, "deleting action_rule=%p abandons its FW resource: AR_ID=0x%08x, refcnt=%u", rule, rule->fw_rsrc.rule_id.id, rule->fw_rsrc.refcnt); } efx_mae_match_spec_fini(sa->nic, rule->match_spec); sfc_mae_action_set_list_del(sa, rule->action_set_list); sfc_mae_action_set_del(sa, rule->action_set); sfc_mae_outer_rule_del(sa, rule->outer_rule); TAILQ_REMOVE(&mae->action_rules, rule, entries); sfc_dbg(sa, "deleted action_rule=%p", rule); rte_free(rule); } static int sfc_mae_action_rule_enable(struct sfc_adapter *sa, struct sfc_mae_action_rule *rule) { const efx_mae_aset_list_id_t *asl_idp = NULL; const efx_mae_aset_id_t *as_idp = NULL; struct sfc_mae_fw_rsrc *fw_rsrc; int rc; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &rule->fw_rsrc; if (fw_rsrc->refcnt != 0) goto success; rc = sfc_mae_outer_rule_enable(sa, rule->outer_rule, rule->match_spec); if (rc != 0) goto fail_outer_rule_enable; rc = sfc_mae_action_set_enable(sa, rule->action_set); if (rc != 0) goto fail_action_set_enable; rc = sfc_mae_action_set_list_enable(sa, rule->action_set_list); if (rc != 0) goto fail_action_set_list_enable; if (rule->action_set_list != NULL) asl_idp = &rule->action_set_list->fw_rsrc.aset_list_id; if (rule->action_set != NULL) as_idp = &rule->action_set->fw_rsrc.aset_id; rc = efx_mae_action_rule_insert(sa->nic, rule->match_spec, asl_idp, as_idp, &fw_rsrc->rule_id); if (rc != 0) { sfc_err(sa, "failed to enable action_rule=%p: %s", rule, strerror(rc)); goto fail_action_rule_insert; } success: if (fw_rsrc->refcnt == 0) { sfc_dbg(sa, "enabled action_rule=%p: AR_ID=0x%08x", rule, fw_rsrc->rule_id.id); } ++(fw_rsrc->refcnt); return 0; fail_action_rule_insert: sfc_mae_action_set_list_disable(sa, rule->action_set_list); fail_action_set_list_enable: sfc_mae_action_set_disable(sa, rule->action_set); fail_action_set_enable: sfc_mae_outer_rule_disable(sa, rule->outer_rule, rule->match_spec); fail_outer_rule_enable: return rc; } static void sfc_mae_action_rule_disable(struct sfc_adapter *sa, struct sfc_mae_action_rule *rule) { struct sfc_mae_fw_rsrc *fw_rsrc; int rc; SFC_ASSERT(sfc_adapter_is_locked(sa)); fw_rsrc = &rule->fw_rsrc; if (fw_rsrc->rule_id.id == EFX_MAE_RSRC_ID_INVALID || fw_rsrc->refcnt == 0) { sfc_err(sa, "failed to disable action_rule=%p: already disabled; AR_ID=0x%08x, refcnt=%u", rule, fw_rsrc->rule_id.id, fw_rsrc->refcnt); return; } if (fw_rsrc->refcnt == 1) { rc = efx_mae_action_rule_remove(sa->nic, &fw_rsrc->rule_id); if (rc == 0) { sfc_dbg(sa, "disabled action_rule=%p with AR_ID=0x%08x", rule, fw_rsrc->rule_id.id); } else { sfc_err(sa, "failed to disable action_rule=%p with AR_ID=0x%08x: %s", rule, fw_rsrc->rule_id.id, strerror(rc)); } fw_rsrc->rule_id.id = EFX_MAE_RSRC_ID_INVALID; sfc_mae_action_set_list_disable(sa, rule->action_set_list); sfc_mae_action_set_disable(sa, rule->action_set); sfc_mae_outer_rule_disable(sa, rule->outer_rule, rule->match_spec); } --(fw_rsrc->refcnt); } void sfc_mae_flow_cleanup(struct sfc_adapter *sa, struct rte_flow *flow) { struct sfc_flow_spec_mae *spec_mae; if (flow == NULL) return; spec_mae = &flow->spec.mae; if (spec_mae->ft_ctx != NULL) { if (spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) spec_mae->ft_ctx->tunnel_rule_is_set = B_FALSE; SFC_ASSERT(spec_mae->ft_ctx->refcnt != 0); --(spec_mae->ft_ctx->refcnt); } sfc_mae_action_rule_del(sa, spec_mae->action_rule); sfc_mae_counter_del(sa, spec_mae->ct_counter); } static int sfc_mae_set_ethertypes(struct sfc_mae_parse_ctx *ctx) { struct sfc_mae_pattern_data *pdata = &ctx->pattern_data; const efx_mae_field_id_t *fremap = ctx->field_ids_remap; const efx_mae_field_id_t field_ids[] = { EFX_MAE_FIELD_VLAN0_PROTO_BE, EFX_MAE_FIELD_VLAN1_PROTO_BE, }; const struct sfc_mae_ethertype *et; unsigned int i; int rc; /* * In accordance with RTE flow API convention, the innermost L2 * item's "type" ("inner_type") is a L3 EtherType. If there is * no L3 item, it's 0x0000/0x0000. */ et = &pdata->ethertypes[pdata->nb_vlan_tags]; rc = efx_mae_match_spec_field_set(ctx->match_spec, fremap[EFX_MAE_FIELD_ETHER_TYPE_BE], sizeof(et->value), (const uint8_t *)&et->value, sizeof(et->mask), (const uint8_t *)&et->mask); if (rc != 0) return rc; /* * sfc_mae_rule_parse_item_vlan() has already made sure * that pdata->nb_vlan_tags does not exceed this figure. */ RTE_BUILD_BUG_ON(SFC_MAE_MATCH_VLAN_MAX_NTAGS != 2); for (i = 0; i < pdata->nb_vlan_tags; ++i) { et = &pdata->ethertypes[i]; rc = efx_mae_match_spec_field_set(ctx->match_spec, fremap[field_ids[i]], sizeof(et->value), (const uint8_t *)&et->value, sizeof(et->mask), (const uint8_t *)&et->mask); if (rc != 0) return rc; } return 0; } static int sfc_mae_rule_process_pattern_data(struct sfc_mae_parse_ctx *ctx, struct rte_flow_error *error) { const efx_mae_field_id_t *fremap = ctx->field_ids_remap; struct sfc_mae_pattern_data *pdata = &ctx->pattern_data; struct sfc_mae_ethertype *ethertypes = pdata->ethertypes; const rte_be16_t supported_tpids[] = { /* VLAN standard TPID (always the first element) */ RTE_BE16(RTE_ETHER_TYPE_VLAN), /* Double-tagging TPIDs */ RTE_BE16(RTE_ETHER_TYPE_QINQ), RTE_BE16(RTE_ETHER_TYPE_QINQ1), RTE_BE16(RTE_ETHER_TYPE_QINQ2), RTE_BE16(RTE_ETHER_TYPE_QINQ3), }; bool enforce_tag_presence[SFC_MAE_MATCH_VLAN_MAX_NTAGS] = {0}; unsigned int nb_supported_tpids = RTE_DIM(supported_tpids); unsigned int ethertype_idx; const uint8_t *valuep; const uint8_t *maskp; int rc; if (pdata->innermost_ethertype_restriction.mask != 0 && pdata->nb_vlan_tags < SFC_MAE_MATCH_VLAN_MAX_NTAGS) { /* * If a single item VLAN is followed by a L3 item, value * of "type" in item ETH can't be a double-tagging TPID. */ nb_supported_tpids = 1; } /* * sfc_mae_rule_parse_item_vlan() has already made sure * that pdata->nb_vlan_tags does not exceed this figure. */ RTE_BUILD_BUG_ON(SFC_MAE_MATCH_VLAN_MAX_NTAGS != 2); for (ethertype_idx = 0; ethertype_idx < pdata->nb_vlan_tags; ++ethertype_idx) { rte_be16_t tpid_v = ethertypes[ethertype_idx].value; rte_be16_t tpid_m = ethertypes[ethertype_idx].mask; unsigned int tpid_idx; /* * This loop can have only two iterations. On the second one, * drop outer tag presence enforcement bit because the inner * tag presence automatically assumes that for the outer tag. */ enforce_tag_presence[0] = B_FALSE; if (tpid_m == RTE_BE16(0)) { if (pdata->tci_masks[ethertype_idx] == RTE_BE16(0)) enforce_tag_presence[ethertype_idx] = B_TRUE; /* No match on this field, and no value check. */ nb_supported_tpids = 1; continue; } /* Exact match is supported only. */ if (tpid_m != RTE_BE16(0xffff)) { sfc_err(ctx->sa, "TPID mask must be 0x0 or 0xffff; got 0x%04x", rte_be_to_cpu_16(tpid_m)); rc = EINVAL; goto fail; } for (tpid_idx = pdata->nb_vlan_tags - ethertype_idx - 1; tpid_idx < nb_supported_tpids; ++tpid_idx) { if (tpid_v == supported_tpids[tpid_idx]) break; } if (tpid_idx == nb_supported_tpids) { sfc_err(ctx->sa, "TPID 0x%04x is unsupported", rte_be_to_cpu_16(tpid_v)); rc = EINVAL; goto fail; } nb_supported_tpids = 1; } if (pdata->innermost_ethertype_restriction.mask == RTE_BE16(0xffff)) { struct sfc_mae_ethertype *et = ðertypes[ethertype_idx]; rte_be16_t enforced_et; enforced_et = pdata->innermost_ethertype_restriction.value; if (et->mask == 0) { et->mask = RTE_BE16(0xffff); et->value = enforced_et; } else if (et->mask != RTE_BE16(0xffff) || et->value != enforced_et) { sfc_err(ctx->sa, "L3 EtherType must be 0x0/0x0 or 0x%04x/0xffff; got 0x%04x/0x%04x", rte_be_to_cpu_16(enforced_et), rte_be_to_cpu_16(et->value), rte_be_to_cpu_16(et->mask)); rc = EINVAL; goto fail; } } /* * Now, when the number of VLAN tags is known, set fields * ETHER_TYPE, VLAN0_PROTO and VLAN1_PROTO so that the first * one is either a valid L3 EtherType (or 0x0000/0x0000), * and the last two are valid TPIDs (or 0x0000/0x0000). */ rc = sfc_mae_set_ethertypes(ctx); if (rc != 0) goto fail; if (pdata->l3_next_proto_restriction_mask == 0xff) { if (pdata->l3_next_proto_mask == 0) { pdata->l3_next_proto_mask = 0xff; pdata->l3_next_proto_value = pdata->l3_next_proto_restriction_value; } else if (pdata->l3_next_proto_mask != 0xff || pdata->l3_next_proto_value != pdata->l3_next_proto_restriction_value) { sfc_err(ctx->sa, "L3 next protocol must be 0x0/0x0 or 0x%02x/0xff; got 0x%02x/0x%02x", pdata->l3_next_proto_restriction_value, pdata->l3_next_proto_value, pdata->l3_next_proto_mask); rc = EINVAL; goto fail; } } if (enforce_tag_presence[0] || pdata->has_ovlan_mask) { rc = efx_mae_match_spec_bit_set(ctx->match_spec, fremap[EFX_MAE_FIELD_HAS_OVLAN], enforce_tag_presence[0] || pdata->has_ovlan_value); if (rc != 0) goto fail; } if (enforce_tag_presence[1] || pdata->has_ivlan_mask) { rc = efx_mae_match_spec_bit_set(ctx->match_spec, fremap[EFX_MAE_FIELD_HAS_IVLAN], enforce_tag_presence[1] || pdata->has_ivlan_value); if (rc != 0) goto fail; } valuep = (const uint8_t *)&pdata->l3_next_proto_value; maskp = (const uint8_t *)&pdata->l3_next_proto_mask; rc = efx_mae_match_spec_field_set(ctx->match_spec, fremap[EFX_MAE_FIELD_IP_PROTO], sizeof(pdata->l3_next_proto_value), valuep, sizeof(pdata->l3_next_proto_mask), maskp); if (rc != 0) goto fail; if (pdata->l3_frag_ofst_mask != 0) { const rte_be16_t hdr_mask = RTE_BE16(RTE_IPV4_HDR_OFFSET_MASK); rte_be16_t value; rte_be16_t last; boolean_t first_frag; boolean_t is_ip_frag; boolean_t any_frag; if (pdata->l3_frag_ofst_mask & RTE_BE16(RTE_IPV4_HDR_DF_FLAG)) { sfc_err(ctx->sa, "Don't fragment flag is not supported."); rc = ENOTSUP; goto fail; } if ((pdata->l3_frag_ofst_mask & hdr_mask) != hdr_mask) { sfc_err(ctx->sa, "Invalid value for fragment offset mask."); rc = EINVAL; goto fail; } value = pdata->l3_frag_ofst_mask & pdata->l3_frag_ofst_value; last = pdata->l3_frag_ofst_mask & pdata->l3_frag_ofst_last; /* * value: last: matches: * 0 0 Non-fragmented packet * 1 0x1fff Non-first fragment * 1 0x1fff+MF Any fragment * MF 0 First fragment */ if (last == 0 && (pdata->l3_frag_ofst_value & hdr_mask) != 0) { sfc_err(ctx->sa, "Exact matching is prohibited for non-zero offsets, but ranges are allowed."); rc = EINVAL; goto fail; } if (value == 0 && last == 0) { is_ip_frag = false; any_frag = true; } else if (value == RTE_BE16(1) && (last & hdr_mask) == hdr_mask) { if (last & RTE_BE16(RTE_IPV4_HDR_MF_FLAG)) { is_ip_frag = true; any_frag = true; } else { is_ip_frag = true; any_frag = false; first_frag = false; } } else if (value == RTE_BE16(RTE_IPV4_HDR_MF_FLAG) && last == 0) { is_ip_frag = true; any_frag = false; first_frag = true; } else { sfc_err(ctx->sa, "Invalid value for fragment offset."); rc = EINVAL; goto fail; } rc = efx_mae_match_spec_bit_set(ctx->match_spec, fremap[EFX_MAE_FIELD_IS_IP_FRAG], is_ip_frag); if (rc != 0) goto fail; if (!any_frag) { rc = efx_mae_match_spec_bit_set(ctx->match_spec, fremap[EFX_MAE_FIELD_IP_FIRST_FRAG], first_frag); if (rc != 0) goto fail; } } return 0; fail: return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Failed to process pattern data"); } static int sfc_mae_rule_parse_item_mark(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { const struct rte_flow_item_mark *spec = item->spec; struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; struct sfc_ft_ctx *ft_ctx = ctx_mae->ft_ctx; if (spec == NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "NULL spec in item MARK"); } /* * This item is used in tunnel offload support only. * It must go before any network header items. This * way, sfc_mae_rule_preparse_item_mark() must have * already parsed it. Only one item MARK is allowed. */ if (ctx_mae->ft_rule_type != SFC_FT_RULE_SWITCH || spec->id != (uint32_t)SFC_FT_CTX_ID_TO_FLOW_MARK(ft_ctx->id)) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "invalid item MARK"); } return 0; } static int sfc_mae_rule_parse_item_port_id(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; const struct rte_flow_item_port_id supp_mask = { .id = 0xffffffff, }; const void *def_mask = &rte_flow_item_port_id_mask; const struct rte_flow_item_port_id *spec = NULL; const struct rte_flow_item_port_id *mask = NULL; efx_mport_sel_t mport_sel; unsigned int type_mask; int rc; if (ctx_mae->match_mport_set) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't handle multiple traffic source items"); } rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, def_mask, sizeof(struct rte_flow_item_port_id), error); if (rc != 0) return rc; if (mask->id != supp_mask.id) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "Bad mask in the PORT_ID pattern item"); } /* If "spec" is not set, could be any port ID */ if (spec == NULL) return 0; if (spec->id > UINT16_MAX) { return rte_flow_error_set(error, EOVERFLOW, RTE_FLOW_ERROR_TYPE_ITEM, item, "The port ID is too large"); } type_mask = 1U << SFC_MAE_SWITCH_PORT_INDEPENDENT; rc = sfc_mae_switch_get_ethdev_mport(ctx_mae->sa->mae.switch_domain_id, spec->id, type_mask, &mport_sel); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't get m-port for the given ethdev"); } rc = efx_mae_match_spec_mport_set(ctx_mae->match_spec, &mport_sel, NULL); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, item, "Failed to set MPORT for the port ID"); } ctx_mae->match_mport_set = B_TRUE; return 0; } static int sfc_mae_rule_parse_item_ethdev_based(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; const struct rte_flow_item_ethdev supp_mask = { .port_id = 0xffff, }; const void *def_mask = &rte_flow_item_ethdev_mask; const struct rte_flow_item_ethdev *spec = NULL; const struct rte_flow_item_ethdev *mask = NULL; efx_mport_sel_t mport_sel; unsigned int type_mask; int rc; if (ctx_mae->match_mport_set) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't handle multiple traffic source items"); } rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, def_mask, sizeof(struct rte_flow_item_ethdev), error); if (rc != 0) return rc; if (mask->port_id != supp_mask.port_id) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "Bad mask in the ethdev-based pattern item"); } /* If "spec" is not set, could be any port ID */ if (spec == NULL) return 0; switch (item->type) { case RTE_FLOW_ITEM_TYPE_PORT_REPRESENTOR: type_mask = 1U << SFC_MAE_SWITCH_PORT_INDEPENDENT; rc = sfc_mae_switch_get_ethdev_mport( ctx_mae->sa->mae.switch_domain_id, spec->port_id, type_mask, &mport_sel); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't get m-port for the given ethdev"); } break; case RTE_FLOW_ITEM_TYPE_REPRESENTED_PORT: rc = sfc_mae_switch_get_entity_mport( ctx_mae->sa->mae.switch_domain_id, spec->port_id, &mport_sel); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't get m-port for the given ethdev"); } break; default: return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "Unsupported ethdev-based flow item"); } rc = efx_mae_match_spec_mport_set(ctx_mae->match_spec, &mport_sel, NULL); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, item, "Failed to set MPORT for the port ID"); } ctx_mae->match_mport_set = B_TRUE; return 0; } /* * Having this field ID in a field locator means that this * locator cannot be used to actually set the field at the * time when the corresponding item gets encountered. Such * fields get stashed in the parsing context instead. This * is required to resolve dependencies between the stashed * fields. See sfc_mae_rule_process_pattern_data(). */ #define SFC_MAE_FIELD_HANDLING_DEFERRED EFX_MAE_FIELD_NIDS struct sfc_mae_field_locator { efx_mae_field_id_t field_id; size_t size; /* Field offset in the corresponding rte_flow_item_ struct */ size_t ofst; uint8_t ct_key_field; }; static void sfc_mae_item_build_supp_mask(const struct sfc_mae_field_locator *field_locators, unsigned int nb_field_locators, void *mask_ptr, size_t mask_size) { unsigned int i; memset(mask_ptr, 0, mask_size); for (i = 0; i < nb_field_locators; ++i) { const struct sfc_mae_field_locator *fl = &field_locators[i]; SFC_ASSERT(fl->ofst + fl->size <= mask_size); memset(RTE_PTR_ADD(mask_ptr, fl->ofst), 0xff, fl->size); } } static int sfc_mae_parse_item(const struct sfc_mae_field_locator *field_locators, unsigned int nb_field_locators, const uint8_t *spec, const uint8_t *mask, struct sfc_mae_parse_ctx *ctx, struct rte_flow_error *error) { const efx_mae_field_id_t *fremap = ctx->field_ids_remap; unsigned int i; int rc = 0; for (i = 0; i < nb_field_locators; ++i) { const struct sfc_mae_field_locator *fl = &field_locators[i]; if (fl->field_id == SFC_MAE_FIELD_HANDLING_DEFERRED) continue; rc = efx_mae_match_spec_field_set(ctx->match_spec, fremap[fl->field_id], fl->size, spec + fl->ofst, fl->size, mask + fl->ofst); if (rc != 0) break; } if (rc != 0) { rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Failed to process item fields"); } return rc; } static const struct sfc_mae_field_locator flocs_eth[] = { { /* * This locator is used only for building supported fields mask. * The field is handled by sfc_mae_rule_process_pattern_data(). */ SFC_MAE_FIELD_HANDLING_DEFERRED, RTE_SIZEOF_FIELD(struct rte_flow_item_eth, hdr.ether_type), offsetof(struct rte_flow_item_eth, hdr.ether_type), }, { EFX_MAE_FIELD_ETH_DADDR_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_eth, hdr.dst_addr), offsetof(struct rte_flow_item_eth, hdr.dst_addr), }, { EFX_MAE_FIELD_ETH_SADDR_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_eth, hdr.src_addr), offsetof(struct rte_flow_item_eth, hdr.src_addr), }, }; static int sfc_mae_rule_parse_item_eth(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; struct rte_flow_item_eth override_mask; struct rte_flow_item_eth supp_mask; const uint8_t *spec = NULL; const uint8_t *mask = NULL; int rc; sfc_mae_item_build_supp_mask(flocs_eth, RTE_DIM(flocs_eth), &supp_mask, sizeof(supp_mask)); supp_mask.has_vlan = 1; rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, &rte_flow_item_eth_mask, sizeof(struct rte_flow_item_eth), error); if (rc != 0) return rc; if (ctx_mae->ft_rule_type == SFC_FT_RULE_TUNNEL && mask != NULL) { /* * The HW/FW hasn't got support for match on MAC addresses in * outer rules yet (this will change). Match on VLAN presence * isn't supported either. Ignore these match criteria. */ memcpy(&override_mask, mask, sizeof(override_mask)); memset(&override_mask.hdr.dst_addr, 0, sizeof(override_mask.hdr.dst_addr)); memset(&override_mask.hdr.src_addr, 0, sizeof(override_mask.hdr.src_addr)); override_mask.has_vlan = 0; mask = (const uint8_t *)&override_mask; } if (spec != NULL) { struct sfc_mae_pattern_data *pdata = &ctx_mae->pattern_data; struct sfc_mae_ethertype *ethertypes = pdata->ethertypes; const struct rte_flow_item_eth *item_spec; const struct rte_flow_item_eth *item_mask; item_spec = (const struct rte_flow_item_eth *)spec; item_mask = (const struct rte_flow_item_eth *)mask; /* * Remember various match criteria in the parsing context. * sfc_mae_rule_process_pattern_data() will consider them * altogether when the rest of the items have been parsed. */ ethertypes[0].value = item_spec->hdr.ether_type; ethertypes[0].mask = item_mask->hdr.ether_type; if (item_mask->has_vlan) { pdata->has_ovlan_mask = B_TRUE; if (item_spec->has_vlan) pdata->has_ovlan_value = B_TRUE; } } else { /* * The specification is empty. The overall pattern * validity will be enforced at the end of parsing. * See sfc_mae_rule_process_pattern_data(). */ return 0; } return sfc_mae_parse_item(flocs_eth, RTE_DIM(flocs_eth), spec, mask, ctx_mae, error); } static const struct sfc_mae_field_locator flocs_vlan[] = { /* Outermost tag */ { EFX_MAE_FIELD_VLAN0_TCI_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_vlan, hdr.vlan_tci), offsetof(struct rte_flow_item_vlan, hdr.vlan_tci), }, { /* * This locator is used only for building supported fields mask. * The field is handled by sfc_mae_rule_process_pattern_data(). */ SFC_MAE_FIELD_HANDLING_DEFERRED, RTE_SIZEOF_FIELD(struct rte_flow_item_vlan, hdr.eth_proto), offsetof(struct rte_flow_item_vlan, hdr.eth_proto), }, /* Innermost tag */ { EFX_MAE_FIELD_VLAN1_TCI_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_vlan, hdr.vlan_tci), offsetof(struct rte_flow_item_vlan, hdr.vlan_tci), }, { /* * This locator is used only for building supported fields mask. * The field is handled by sfc_mae_rule_process_pattern_data(). */ SFC_MAE_FIELD_HANDLING_DEFERRED, RTE_SIZEOF_FIELD(struct rte_flow_item_vlan, hdr.eth_proto), offsetof(struct rte_flow_item_vlan, hdr.eth_proto), }, }; static int sfc_mae_rule_parse_item_vlan(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; struct sfc_mae_pattern_data *pdata = &ctx_mae->pattern_data; boolean_t *has_vlan_mp_by_nb_tags[SFC_MAE_MATCH_VLAN_MAX_NTAGS] = { &pdata->has_ovlan_mask, &pdata->has_ivlan_mask, }; boolean_t *has_vlan_vp_by_nb_tags[SFC_MAE_MATCH_VLAN_MAX_NTAGS] = { &pdata->has_ovlan_value, &pdata->has_ivlan_value, }; boolean_t *cur_tag_presence_bit_mp; boolean_t *cur_tag_presence_bit_vp; const struct sfc_mae_field_locator *flocs; struct rte_flow_item_vlan supp_mask; const uint8_t *spec = NULL; const uint8_t *mask = NULL; unsigned int nb_flocs; int rc; RTE_BUILD_BUG_ON(SFC_MAE_MATCH_VLAN_MAX_NTAGS != 2); if (pdata->nb_vlan_tags == SFC_MAE_MATCH_VLAN_MAX_NTAGS) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't match that many VLAN tags"); } cur_tag_presence_bit_mp = has_vlan_mp_by_nb_tags[pdata->nb_vlan_tags]; cur_tag_presence_bit_vp = has_vlan_vp_by_nb_tags[pdata->nb_vlan_tags]; if (*cur_tag_presence_bit_mp == B_TRUE && *cur_tag_presence_bit_vp == B_FALSE) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "The previous item enforces no (more) VLAN, " "so the current item (VLAN) must not exist"); } nb_flocs = RTE_DIM(flocs_vlan) / SFC_MAE_MATCH_VLAN_MAX_NTAGS; flocs = flocs_vlan + pdata->nb_vlan_tags * nb_flocs; sfc_mae_item_build_supp_mask(flocs, nb_flocs, &supp_mask, sizeof(supp_mask)); /* * This only means that the field is supported by the driver and libefx. * Support on NIC level will be checked when all items have been parsed. */ supp_mask.has_more_vlan = 1; rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, &rte_flow_item_vlan_mask, sizeof(struct rte_flow_item_vlan), error); if (rc != 0) return rc; if (spec != NULL) { struct sfc_mae_ethertype *et = pdata->ethertypes; const struct rte_flow_item_vlan *item_spec; const struct rte_flow_item_vlan *item_mask; item_spec = (const struct rte_flow_item_vlan *)spec; item_mask = (const struct rte_flow_item_vlan *)mask; /* * Remember various match criteria in the parsing context. * sfc_mae_rule_process_pattern_data() will consider them * altogether when the rest of the items have been parsed. */ et[pdata->nb_vlan_tags + 1].value = item_spec->hdr.eth_proto; et[pdata->nb_vlan_tags + 1].mask = item_mask->hdr.eth_proto; pdata->tci_masks[pdata->nb_vlan_tags] = item_mask->hdr.vlan_tci; if (item_mask->has_more_vlan) { if (pdata->nb_vlan_tags == SFC_MAE_MATCH_VLAN_MAX_NTAGS) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, item, "Can't use 'has_more_vlan' in " "the second item VLAN"); } pdata->has_ivlan_mask = B_TRUE; if (item_spec->has_more_vlan) pdata->has_ivlan_value = B_TRUE; } /* Convert TCI to MAE representation right now. */ rc = sfc_mae_parse_item(flocs, nb_flocs, spec, mask, ctx_mae, error); if (rc != 0) return rc; } ++(pdata->nb_vlan_tags); return 0; } static const struct sfc_mae_field_locator flocs_ipv4[] = { { EFX_MAE_FIELD_SRC_IP4_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.src_addr), offsetof(struct rte_flow_item_ipv4, hdr.src_addr), }, { EFX_MAE_FIELD_DST_IP4_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.dst_addr), offsetof(struct rte_flow_item_ipv4, hdr.dst_addr), }, { /* * This locator is used only for building supported fields mask. * The field is handled by sfc_mae_rule_process_pattern_data(). */ SFC_MAE_FIELD_HANDLING_DEFERRED, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.next_proto_id), offsetof(struct rte_flow_item_ipv4, hdr.next_proto_id), }, { /* * This locator is used only for building supported fields mask. * The field is handled by sfc_mae_rule_process_pattern_data(). */ SFC_MAE_FIELD_HANDLING_DEFERRED, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.fragment_offset), offsetof(struct rte_flow_item_ipv4, hdr.fragment_offset), }, { EFX_MAE_FIELD_IP_TOS, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.type_of_service), offsetof(struct rte_flow_item_ipv4, hdr.type_of_service), }, { EFX_MAE_FIELD_IP_TTL, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.time_to_live), offsetof(struct rte_flow_item_ipv4, hdr.time_to_live), }, }; static int sfc_mae_rule_parse_item_ipv4(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { rte_be16_t ethertype_ipv4_be = RTE_BE16(RTE_ETHER_TYPE_IPV4); struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; struct sfc_mae_pattern_data *pdata = &ctx_mae->pattern_data; struct rte_flow_item_ipv4 supp_mask; struct rte_flow_item item_dup; const uint8_t *spec = NULL; const uint8_t *mask = NULL; const uint8_t *last = NULL; int rc; item_dup.spec = item->spec; item_dup.mask = item->mask; item_dup.last = item->last; item_dup.type = item->type; sfc_mae_item_build_supp_mask(flocs_ipv4, RTE_DIM(flocs_ipv4), &supp_mask, sizeof(supp_mask)); /* We don't support IPv4 fragmentation in the outer frames. */ if (ctx_mae->match_spec != ctx_mae->match_spec_action) supp_mask.hdr.fragment_offset = 0; if (item->last != NULL) { last = item->last; item_dup.last = NULL; } rc = sfc_flow_parse_init(&item_dup, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, &rte_flow_item_ipv4_mask, sizeof(struct rte_flow_item_ipv4), error); if (rc != 0) return rc; pdata->innermost_ethertype_restriction.value = ethertype_ipv4_be; pdata->innermost_ethertype_restriction.mask = RTE_BE16(0xffff); if (spec != NULL) { const struct rte_flow_item_ipv4 *item_spec; const struct rte_flow_item_ipv4 *item_mask; const struct rte_flow_item_ipv4 *item_last; item_spec = (const struct rte_flow_item_ipv4 *)spec; item_mask = (const struct rte_flow_item_ipv4 *)mask; if (last != NULL) item_last = (const struct rte_flow_item_ipv4 *)last; pdata->l3_next_proto_value = item_spec->hdr.next_proto_id; pdata->l3_next_proto_mask = item_mask->hdr.next_proto_id; pdata->l3_frag_ofst_mask = item_mask->hdr.fragment_offset; pdata->l3_frag_ofst_value = item_spec->hdr.fragment_offset; if (last != NULL) pdata->l3_frag_ofst_last = item_last->hdr.fragment_offset; } else { return 0; } return sfc_mae_parse_item(flocs_ipv4, RTE_DIM(flocs_ipv4), spec, mask, ctx_mae, error); } static const struct sfc_mae_field_locator flocs_ipv6[] = { { EFX_MAE_FIELD_SRC_IP6_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.src_addr), offsetof(struct rte_flow_item_ipv6, hdr.src_addr), }, { EFX_MAE_FIELD_DST_IP6_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.dst_addr), offsetof(struct rte_flow_item_ipv6, hdr.dst_addr), }, { /* * This locator is used only for building supported fields mask. * The field is handled by sfc_mae_rule_process_pattern_data(). */ SFC_MAE_FIELD_HANDLING_DEFERRED, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.proto), offsetof(struct rte_flow_item_ipv6, hdr.proto), }, { EFX_MAE_FIELD_IP_TTL, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.hop_limits), offsetof(struct rte_flow_item_ipv6, hdr.hop_limits), }, }; static int sfc_mae_rule_parse_item_ipv6(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { rte_be16_t ethertype_ipv6_be = RTE_BE16(RTE_ETHER_TYPE_IPV6); struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; const efx_mae_field_id_t *fremap = ctx_mae->field_ids_remap; struct sfc_mae_pattern_data *pdata = &ctx_mae->pattern_data; struct rte_flow_item_ipv6 supp_mask; const uint8_t *spec = NULL; const uint8_t *mask = NULL; rte_be32_t vtc_flow_be; uint32_t vtc_flow; uint8_t tc_value; uint8_t tc_mask; int rc; sfc_mae_item_build_supp_mask(flocs_ipv6, RTE_DIM(flocs_ipv6), &supp_mask, sizeof(supp_mask)); vtc_flow_be = RTE_BE32(RTE_IPV6_HDR_TC_MASK); memcpy(&supp_mask, &vtc_flow_be, sizeof(vtc_flow_be)); rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, &rte_flow_item_ipv6_mask, sizeof(struct rte_flow_item_ipv6), error); if (rc != 0) return rc; pdata->innermost_ethertype_restriction.value = ethertype_ipv6_be; pdata->innermost_ethertype_restriction.mask = RTE_BE16(0xffff); if (spec != NULL) { const struct rte_flow_item_ipv6 *item_spec; const struct rte_flow_item_ipv6 *item_mask; item_spec = (const struct rte_flow_item_ipv6 *)spec; item_mask = (const struct rte_flow_item_ipv6 *)mask; pdata->l3_next_proto_value = item_spec->hdr.proto; pdata->l3_next_proto_mask = item_mask->hdr.proto; } else { return 0; } rc = sfc_mae_parse_item(flocs_ipv6, RTE_DIM(flocs_ipv6), spec, mask, ctx_mae, error); if (rc != 0) return rc; memcpy(&vtc_flow_be, spec, sizeof(vtc_flow_be)); vtc_flow = rte_be_to_cpu_32(vtc_flow_be); tc_value = (vtc_flow & RTE_IPV6_HDR_TC_MASK) >> RTE_IPV6_HDR_TC_SHIFT; memcpy(&vtc_flow_be, mask, sizeof(vtc_flow_be)); vtc_flow = rte_be_to_cpu_32(vtc_flow_be); tc_mask = (vtc_flow & RTE_IPV6_HDR_TC_MASK) >> RTE_IPV6_HDR_TC_SHIFT; rc = efx_mae_match_spec_field_set(ctx_mae->match_spec, fremap[EFX_MAE_FIELD_IP_TOS], sizeof(tc_value), &tc_value, sizeof(tc_mask), &tc_mask); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Failed to process item fields"); } return 0; } static const struct sfc_mae_field_locator flocs_tcp[] = { { EFX_MAE_FIELD_L4_SPORT_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_tcp, hdr.src_port), offsetof(struct rte_flow_item_tcp, hdr.src_port), }, { EFX_MAE_FIELD_L4_DPORT_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_tcp, hdr.dst_port), offsetof(struct rte_flow_item_tcp, hdr.dst_port), }, { EFX_MAE_FIELD_TCP_FLAGS_BE, /* * The values have been picked intentionally since the * target MAE field is oversize (16 bit). This mapping * relies on the fact that the MAE field is big-endian. */ RTE_SIZEOF_FIELD(struct rte_flow_item_tcp, hdr.data_off) + RTE_SIZEOF_FIELD(struct rte_flow_item_tcp, hdr.tcp_flags), offsetof(struct rte_flow_item_tcp, hdr.data_off), }, }; static int sfc_mae_rule_parse_item_tcp(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; struct sfc_mae_pattern_data *pdata = &ctx_mae->pattern_data; struct rte_flow_item_tcp supp_mask; const uint8_t *spec = NULL; const uint8_t *mask = NULL; int rc; /* * When encountered among outermost items, item TCP is invalid. * Check which match specification is being constructed now. */ if (ctx_mae->match_spec != ctx_mae->match_spec_action) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, item, "TCP in outer frame is invalid"); } sfc_mae_item_build_supp_mask(flocs_tcp, RTE_DIM(flocs_tcp), &supp_mask, sizeof(supp_mask)); rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, &rte_flow_item_tcp_mask, sizeof(struct rte_flow_item_tcp), error); if (rc != 0) return rc; pdata->l3_next_proto_restriction_value = IPPROTO_TCP; pdata->l3_next_proto_restriction_mask = 0xff; if (spec == NULL) return 0; return sfc_mae_parse_item(flocs_tcp, RTE_DIM(flocs_tcp), spec, mask, ctx_mae, error); } static const struct sfc_mae_field_locator flocs_udp[] = { { EFX_MAE_FIELD_L4_SPORT_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_udp, hdr.src_port), offsetof(struct rte_flow_item_udp, hdr.src_port), }, { EFX_MAE_FIELD_L4_DPORT_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_udp, hdr.dst_port), offsetof(struct rte_flow_item_udp, hdr.dst_port), }, }; static int sfc_mae_rule_parse_item_udp(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; struct sfc_mae_pattern_data *pdata = &ctx_mae->pattern_data; struct rte_flow_item_udp supp_mask; const uint8_t *spec = NULL; const uint8_t *mask = NULL; int rc; sfc_mae_item_build_supp_mask(flocs_udp, RTE_DIM(flocs_udp), &supp_mask, sizeof(supp_mask)); rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, &rte_flow_item_udp_mask, sizeof(struct rte_flow_item_udp), error); if (rc != 0) return rc; pdata->l3_next_proto_restriction_value = IPPROTO_UDP; pdata->l3_next_proto_restriction_mask = 0xff; if (spec == NULL) return 0; return sfc_mae_parse_item(flocs_udp, RTE_DIM(flocs_udp), spec, mask, ctx_mae, error); } static const struct sfc_mae_field_locator flocs_tunnel[] = { { /* * The size and offset values are relevant * for Geneve and NVGRE, too. */ .size = RTE_SIZEOF_FIELD(struct rte_flow_item_vxlan, hdr.vni), .ofst = offsetof(struct rte_flow_item_vxlan, hdr.vni), }, }; /* * An auxiliary registry which allows using non-encap. field IDs * directly when building a match specification of type ACTION. * * See sfc_mae_rule_parse_pattern() and sfc_mae_rule_parse_item_tunnel(). */ static const efx_mae_field_id_t field_ids_no_remap[] = { #define FIELD_ID_NO_REMAP(_field) \ [EFX_MAE_FIELD_##_field] = EFX_MAE_FIELD_##_field FIELD_ID_NO_REMAP(ETHER_TYPE_BE), FIELD_ID_NO_REMAP(ETH_SADDR_BE), FIELD_ID_NO_REMAP(ETH_DADDR_BE), FIELD_ID_NO_REMAP(VLAN0_TCI_BE), FIELD_ID_NO_REMAP(VLAN0_PROTO_BE), FIELD_ID_NO_REMAP(VLAN1_TCI_BE), FIELD_ID_NO_REMAP(VLAN1_PROTO_BE), FIELD_ID_NO_REMAP(SRC_IP4_BE), FIELD_ID_NO_REMAP(DST_IP4_BE), FIELD_ID_NO_REMAP(IP_PROTO), FIELD_ID_NO_REMAP(IP_TOS), FIELD_ID_NO_REMAP(IP_TTL), FIELD_ID_NO_REMAP(SRC_IP6_BE), FIELD_ID_NO_REMAP(DST_IP6_BE), FIELD_ID_NO_REMAP(L4_SPORT_BE), FIELD_ID_NO_REMAP(L4_DPORT_BE), FIELD_ID_NO_REMAP(TCP_FLAGS_BE), FIELD_ID_NO_REMAP(HAS_OVLAN), FIELD_ID_NO_REMAP(HAS_IVLAN), FIELD_ID_NO_REMAP(IS_IP_FRAG), FIELD_ID_NO_REMAP(IP_FIRST_FRAG), #undef FIELD_ID_NO_REMAP }; /* * An auxiliary registry which allows using "ENC" field IDs * when building a match specification of type OUTER. * * See sfc_mae_rule_encap_parse_init(). */ static const efx_mae_field_id_t field_ids_remap_to_encap[] = { #define FIELD_ID_REMAP_TO_ENCAP(_field) \ [EFX_MAE_FIELD_##_field] = EFX_MAE_FIELD_ENC_##_field FIELD_ID_REMAP_TO_ENCAP(ETHER_TYPE_BE), FIELD_ID_REMAP_TO_ENCAP(ETH_SADDR_BE), FIELD_ID_REMAP_TO_ENCAP(ETH_DADDR_BE), FIELD_ID_REMAP_TO_ENCAP(VLAN0_TCI_BE), FIELD_ID_REMAP_TO_ENCAP(VLAN0_PROTO_BE), FIELD_ID_REMAP_TO_ENCAP(VLAN1_TCI_BE), FIELD_ID_REMAP_TO_ENCAP(VLAN1_PROTO_BE), FIELD_ID_REMAP_TO_ENCAP(SRC_IP4_BE), FIELD_ID_REMAP_TO_ENCAP(DST_IP4_BE), FIELD_ID_REMAP_TO_ENCAP(IP_PROTO), FIELD_ID_REMAP_TO_ENCAP(IP_TOS), FIELD_ID_REMAP_TO_ENCAP(IP_TTL), FIELD_ID_REMAP_TO_ENCAP(SRC_IP6_BE), FIELD_ID_REMAP_TO_ENCAP(DST_IP6_BE), FIELD_ID_REMAP_TO_ENCAP(L4_SPORT_BE), FIELD_ID_REMAP_TO_ENCAP(L4_DPORT_BE), FIELD_ID_REMAP_TO_ENCAP(HAS_OVLAN), FIELD_ID_REMAP_TO_ENCAP(HAS_IVLAN), #undef FIELD_ID_REMAP_TO_ENCAP }; static int sfc_mae_rule_parse_item_tunnel(const struct rte_flow_item *item, struct sfc_flow_parse_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_parse_ctx *ctx_mae = ctx->mae; uint8_t vnet_id_v[sizeof(uint32_t)] = {0}; uint8_t vnet_id_m[sizeof(uint32_t)] = {0}; const struct rte_flow_item_vxlan *vxp; uint8_t supp_mask[sizeof(uint64_t)]; const uint8_t *spec = NULL; const uint8_t *mask = NULL; int rc; if (ctx_mae->ft_rule_type == SFC_FT_RULE_SWITCH) { /* * As a workaround, pattern processing has started from * this (tunnel) item. No pattern data to process yet. */ } else { /* * We're about to start processing inner frame items. * Process pattern data that has been deferred so far * and reset pattern data storage. */ rc = sfc_mae_rule_process_pattern_data(ctx_mae, error); if (rc != 0) return rc; } memset(&ctx_mae->pattern_data, 0, sizeof(ctx_mae->pattern_data)); sfc_mae_item_build_supp_mask(flocs_tunnel, RTE_DIM(flocs_tunnel), &supp_mask, sizeof(supp_mask)); /* * This tunnel item was preliminarily detected by * sfc_mae_rule_encap_parse_init(). Default mask * was also picked by that helper. Use it here. */ rc = sfc_flow_parse_init(item, (const void **)&spec, (const void **)&mask, (const void *)&supp_mask, ctx_mae->tunnel_def_mask, ctx_mae->tunnel_def_mask_size, error); if (rc != 0) return rc; /* * This item and later ones comprise a * match specification of type ACTION. */ ctx_mae->match_spec = ctx_mae->match_spec_action; /* This item and later ones use non-encap. EFX MAE field IDs. */ ctx_mae->field_ids_remap = field_ids_no_remap; if (spec == NULL) return 0; /* * Field EFX_MAE_FIELD_ENC_VNET_ID_BE is a 32-bit one. * Copy 24-bit VNI, which is BE, at offset 1 in it. * The extra byte is 0 both in the mask and in the value. */ vxp = (const struct rte_flow_item_vxlan *)spec; memcpy(vnet_id_v + 1, &vxp->hdr.vni, sizeof(vxp->hdr.vni)); vxp = (const struct rte_flow_item_vxlan *)mask; memcpy(vnet_id_m + 1, &vxp->hdr.vni, sizeof(vxp->hdr.vni)); rc = efx_mae_match_spec_field_set(ctx_mae->match_spec, EFX_MAE_FIELD_ENC_VNET_ID_BE, sizeof(vnet_id_v), vnet_id_v, sizeof(vnet_id_m), vnet_id_m); if (rc != 0) { rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, item, "Failed to set VXLAN VNI"); } return rc; } static const struct sfc_flow_item sfc_flow_items[] = { { .type = RTE_FLOW_ITEM_TYPE_MARK, .name = "MARK", .prev_layer = SFC_FLOW_ITEM_ANY_LAYER, .layer = SFC_FLOW_ITEM_ANY_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_mark, }, { .type = RTE_FLOW_ITEM_TYPE_PORT_ID, .name = "PORT_ID", /* * In terms of RTE flow, this item is a META one, * and its position in the pattern is don't care. */ .prev_layer = SFC_FLOW_ITEM_ANY_LAYER, .layer = SFC_FLOW_ITEM_ANY_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_port_id, }, { .type = RTE_FLOW_ITEM_TYPE_PORT_REPRESENTOR, .name = "PORT_REPRESENTOR", /* * In terms of RTE flow, this item is a META one, * and its position in the pattern is don't care. */ .prev_layer = SFC_FLOW_ITEM_ANY_LAYER, .layer = SFC_FLOW_ITEM_ANY_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_ethdev_based, }, { .type = RTE_FLOW_ITEM_TYPE_REPRESENTED_PORT, .name = "REPRESENTED_PORT", /* * In terms of RTE flow, this item is a META one, * and its position in the pattern is don't care. */ .prev_layer = SFC_FLOW_ITEM_ANY_LAYER, .layer = SFC_FLOW_ITEM_ANY_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_ethdev_based, }, { .type = RTE_FLOW_ITEM_TYPE_ETH, .name = "ETH", .prev_layer = SFC_FLOW_ITEM_START_LAYER, .layer = SFC_FLOW_ITEM_L2, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_eth, }, { .type = RTE_FLOW_ITEM_TYPE_VLAN, .name = "VLAN", .prev_layer = SFC_FLOW_ITEM_L2, .layer = SFC_FLOW_ITEM_L2, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_vlan, }, { .type = RTE_FLOW_ITEM_TYPE_IPV4, .name = "IPV4", .prev_layer = SFC_FLOW_ITEM_L2, .layer = SFC_FLOW_ITEM_L3, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_ipv4, }, { .type = RTE_FLOW_ITEM_TYPE_IPV6, .name = "IPV6", .prev_layer = SFC_FLOW_ITEM_L2, .layer = SFC_FLOW_ITEM_L3, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_ipv6, }, { .type = RTE_FLOW_ITEM_TYPE_TCP, .name = "TCP", .prev_layer = SFC_FLOW_ITEM_L3, .layer = SFC_FLOW_ITEM_L4, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_tcp, }, { .type = RTE_FLOW_ITEM_TYPE_UDP, .name = "UDP", .prev_layer = SFC_FLOW_ITEM_L3, .layer = SFC_FLOW_ITEM_L4, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_udp, }, { .type = RTE_FLOW_ITEM_TYPE_VXLAN, .name = "VXLAN", .prev_layer = SFC_FLOW_ITEM_L4, .layer = SFC_FLOW_ITEM_START_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_tunnel, }, { .type = RTE_FLOW_ITEM_TYPE_GENEVE, .name = "GENEVE", .prev_layer = SFC_FLOW_ITEM_L4, .layer = SFC_FLOW_ITEM_START_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_tunnel, }, { .type = RTE_FLOW_ITEM_TYPE_NVGRE, .name = "NVGRE", .prev_layer = SFC_FLOW_ITEM_L3, .layer = SFC_FLOW_ITEM_START_LAYER, .ctx_type = SFC_FLOW_PARSE_CTX_MAE, .parse = sfc_mae_rule_parse_item_tunnel, }, }; #define SFC_MAE_CT_KEY_ET 0x01 /* EtherType */ #define SFC_MAE_CT_KEY_DA 0x02 /* IPv4/IPv6 destination address */ #define SFC_MAE_CT_KEY_SA 0x04 /* IPv4/IPv6 source address */ #define SFC_MAE_CT_KEY_L4 0x08 /* IPv4/IPv6 L4 protocol ID */ #define SFC_MAE_CT_KEY_DP 0x10 /* L4 destination port */ #define SFC_MAE_CT_KEY_SP 0x20 /* L4 source port */ #define SFC_MAE_CT_KEY_FIELD_SIZE_MAX sizeof(sfc_mae_conntrack_key_t) static const struct sfc_mae_field_locator flocs_ct[] = { { EFX_MAE_FIELD_ETHER_TYPE_BE, RTE_SIZEOF_FIELD(sfc_mae_conntrack_key_t, ether_type_le), offsetof(sfc_mae_conntrack_key_t, ether_type_le), SFC_MAE_CT_KEY_ET, }, { EFX_MAE_FIELD_DST_IP4_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.dst_addr), offsetof(sfc_mae_conntrack_key_t, dst_addr_le) + RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.dst_addr) - RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.dst_addr), SFC_MAE_CT_KEY_DA, }, { EFX_MAE_FIELD_SRC_IP4_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.src_addr), offsetof(sfc_mae_conntrack_key_t, src_addr_le) + RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.src_addr) - RTE_SIZEOF_FIELD(struct rte_flow_item_ipv4, hdr.src_addr), SFC_MAE_CT_KEY_SA, }, { EFX_MAE_FIELD_DST_IP6_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.dst_addr), offsetof(sfc_mae_conntrack_key_t, dst_addr_le), SFC_MAE_CT_KEY_DA, }, { EFX_MAE_FIELD_SRC_IP6_BE, RTE_SIZEOF_FIELD(struct rte_flow_item_ipv6, hdr.src_addr), offsetof(sfc_mae_conntrack_key_t, src_addr_le), SFC_MAE_CT_KEY_SA, }, { EFX_MAE_FIELD_IP_PROTO, RTE_SIZEOF_FIELD(sfc_mae_conntrack_key_t, ip_proto), offsetof(sfc_mae_conntrack_key_t, ip_proto), SFC_MAE_CT_KEY_L4, }, { EFX_MAE_FIELD_L4_DPORT_BE, RTE_SIZEOF_FIELD(sfc_mae_conntrack_key_t, dst_port_le), offsetof(sfc_mae_conntrack_key_t, dst_port_le), SFC_MAE_CT_KEY_DP, }, { EFX_MAE_FIELD_L4_SPORT_BE, RTE_SIZEOF_FIELD(sfc_mae_conntrack_key_t, src_port_le), offsetof(sfc_mae_conntrack_key_t, src_port_le), SFC_MAE_CT_KEY_SP, }, }; static int sfc_mae_rule_process_ct(struct sfc_adapter *sa, struct sfc_mae_parse_ctx *pctx, struct sfc_mae_action_rule_ctx *action_rule_ctx, struct sfc_flow_spec_mae *spec, struct rte_flow_error *error) { efx_mae_match_spec_t *match_spec_tmp; uint8_t ct_key_missing_fields = SFC_MAE_CT_KEY_ET | SFC_MAE_CT_KEY_DA | SFC_MAE_CT_KEY_SA | SFC_MAE_CT_KEY_L4 | SFC_MAE_CT_KEY_DP | SFC_MAE_CT_KEY_SP; unsigned int i; int rc; if (pctx->ft_rule_type == SFC_FT_RULE_TUNNEL) { /* * TUNNEL rules have no network match fields that belong * in an action rule match specification, so nothing can * be possibly utilised for conntrack assistance offload. */ return 0; } if (!sfc_mae_conntrack_is_supported(sa)) return 0; rc = efx_mae_match_spec_clone(sa->nic, pctx->match_spec_action, &match_spec_tmp); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to clone the match specification"); } for (i = 0; i < RTE_DIM(flocs_ct); ++i) { const struct sfc_mae_field_locator *fl = &flocs_ct[i]; uint8_t mask_full[SFC_MAE_CT_KEY_FIELD_SIZE_MAX]; uint8_t mask_zero[SFC_MAE_CT_KEY_FIELD_SIZE_MAX]; uint8_t value[SFC_MAE_CT_KEY_FIELD_SIZE_MAX]; uint8_t mask[SFC_MAE_CT_KEY_FIELD_SIZE_MAX]; uint8_t *ct_key = (uint8_t *)&spec->ct_key; efx_mae_field_id_t fid = fl->field_id; unsigned int j; rc = efx_mae_match_spec_field_get(match_spec_tmp, fid, fl->size, value, fl->size, mask); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to extract match field"); } memset(mask_full, 0xff, fl->size); if (memcmp(mask, mask_full, fl->size) != 0) continue; memset(mask_zero, 0, fl->size); rc = efx_mae_match_spec_field_set(match_spec_tmp, fid, fl->size, mask_zero, fl->size, mask_zero); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to erase match field"); } for (j = 0; j < fl->size; ++j) { uint8_t *byte_dst = ct_key + fl->ofst + fl->size - 1 - j; const uint8_t *byte_src = value + j; *byte_dst = *byte_src; } ct_key_missing_fields &= ~(fl->ct_key_field); } if (ct_key_missing_fields != 0) { efx_mae_match_spec_fini(sa->nic, match_spec_tmp); return 0; } efx_mae_match_spec_fini(sa->nic, pctx->match_spec_action); pctx->match_spec_action = match_spec_tmp; if (pctx->ft_rule_type == SFC_FT_RULE_SWITCH) { /* * A SWITCH rule re-uses the corresponding TUNNEL rule's * outer rule, where conntrack request should have been * configured already, so skip outer rule processing. */ goto skip_outer_rule; } if (pctx->match_spec_outer == NULL) { const struct sfc_mae_pattern_data *pdata = &pctx->pattern_data; const struct sfc_mae_ethertype *et; struct sfc_mae *mae = &sa->mae; rc = efx_mae_match_spec_init(sa->nic, EFX_MAE_RULE_OUTER, mae->nb_outer_rule_prios_max - 1, &pctx->match_spec_outer); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: failed to initialise the match specification"); } /* Match on EtherType appears to be compulsory in outer rules */ et = &pdata->ethertypes[pdata->nb_vlan_tags]; rc = efx_mae_match_spec_field_set(pctx->match_spec_outer, EFX_MAE_FIELD_ENC_ETHER_TYPE_BE, sizeof(et->value), (const uint8_t *)&et->value, sizeof(et->mask), (const uint8_t *)&et->mask); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: failed to set match on EtherType"); } } rc = efx_mae_outer_rule_do_ct_set(pctx->match_spec_outer); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: failed to request CT lookup"); } skip_outer_rule: /* Initial/dummy CT mark value */ action_rule_ctx->ct_mark = 1; return 0; } #undef SFC_MAE_CT_KEY_ET #undef SFC_MAE_CT_KEY_DA #undef SFC_MAE_CT_KEY_SA #undef SFC_MAE_CT_KEY_L4 #undef SFC_MAE_CT_KEY_DP #undef SFC_MAE_CT_KEY_SP static int sfc_mae_rule_process_outer(struct sfc_adapter *sa, struct sfc_mae_parse_ctx *ctx, struct sfc_mae_outer_rule **rulep, struct rte_flow_error *error) { efx_mae_rule_id_t or_id = { .id = EFX_MAE_RSRC_ID_INVALID }; int rc; if (ctx->internal) { /* * A driver-internal flow may not comprise an outer rule, * but it must not match on invalid outer rule ID since * it must catch all missed packets, including those * that hit an outer rule of another flow entry but * do not hit a higher-priority action rule later. * So do not set match on outer rule ID here. */ SFC_ASSERT(ctx->match_spec_outer == NULL); *rulep = NULL; return 0; } if (ctx->match_spec_outer == NULL) { *rulep = NULL; goto no_or_id; } if (!efx_mae_match_spec_is_valid(sa->nic, ctx->match_spec_outer)) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Inconsistent pattern (outer)"); } *rulep = sfc_mae_outer_rule_attach(sa, ctx->match_spec_outer, ctx->encap_type); if (*rulep != NULL) { efx_mae_match_spec_fini(sa->nic, ctx->match_spec_outer); } else { rc = sfc_mae_outer_rule_add(sa, ctx->match_spec_outer, ctx->encap_type, rulep); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Failed to process the pattern"); } } /* The spec has now been tracked by the outer rule entry. */ ctx->match_spec_outer = NULL; or_id.id = (*rulep)->fw_rsrc.rule_id.id; no_or_id: switch (ctx->ft_rule_type) { case SFC_FT_RULE_NONE: break; case SFC_FT_RULE_TUNNEL: /* * Workaround. TUNNEL flows are not supposed to involve * MAE action rules, but, due to the currently limited * HW/FW implementation, action rules are still needed. * See sfc_mae_rule_parse_pattern(). */ break; case SFC_FT_RULE_SWITCH: /* * Match on recirculation ID rather than * on the outer rule allocation handle. */ rc = efx_mae_match_spec_recirc_id_set(ctx->match_spec_action, SFC_FT_CTX_ID_TO_CTX_MARK(ctx->ft_ctx->id)); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "FT: SWITCH: AR: failed to request match on RECIRC_ID"); } return 0; default: SFC_ASSERT(B_FALSE); } /* * In MAE, lookup sequence comprises outer parse, outer rule lookup, * inner parse (when some outer rule is hit) and action rule lookup. * If the currently processed flow does not come with an outer rule, * its action rule must be available only for packets which miss in * outer rule table. Set OR_ID match field to 0xffffffff/0xffffffff * in the action rule specification; this ensures correct behaviour. * * If, however, this flow does have an outer rule, OR_ID match must * be set to the currently known value for that outer rule. It will * be either 0xffffffff or some valid ID, depending on whether this * outer rule is currently active (adapter state is STARTED) or not. */ rc = efx_mae_match_spec_outer_rule_id_set(ctx->match_spec_action, &or_id); if (rc != 0) { sfc_mae_outer_rule_del(sa, *rulep); *rulep = NULL; return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Failed to process the pattern"); } return 0; } static int sfc_mae_rule_preparse_item_mark(const struct rte_flow_item_mark *spec, struct sfc_mae_parse_ctx *ctx) { struct sfc_ft_ctx *ft_ctx; uint32_t user_mark; if (spec == NULL) { sfc_err(ctx->sa, "FT: SWITCH: NULL spec in item MARK"); return EINVAL; } ft_ctx = sfc_ft_ctx_pick(ctx->sa, spec->id); if (ft_ctx == NULL) { sfc_err(ctx->sa, "FT: SWITCH: invalid context"); return EINVAL; } if (ft_ctx->refcnt == 0) { sfc_err(ctx->sa, "FT: SWITCH: inactive context (ID=%u)", ft_ctx->id); return ENOENT; } user_mark = SFC_FT_FLOW_MARK_TO_USER_MARK(spec->id); if (user_mark != 0) { sfc_err(ctx->sa, "FT: SWITCH: invalid item MARK"); return EINVAL; } sfc_dbg(ctx->sa, "FT: SWITCH: detected"); ctx->ft_rule_type = SFC_FT_RULE_SWITCH; ctx->ft_ctx = ft_ctx; return 0; } static int sfc_mae_rule_encap_parse_init(struct sfc_adapter *sa, struct sfc_mae_parse_ctx *ctx, struct rte_flow_error *error) { const struct rte_flow_item *pattern = ctx->pattern; struct sfc_mae *mae = &sa->mae; bool request_ct = false; uint8_t recirc_id = 0; int rc; if (pattern == NULL) { rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM_NUM, NULL, "NULL pattern"); return -rte_errno; } for (;;) { switch (pattern->type) { case RTE_FLOW_ITEM_TYPE_MARK: rc = sfc_mae_rule_preparse_item_mark(pattern->spec, ctx); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ITEM, pattern, "FT: SWITCH: invalid item MARK"); } ++pattern; continue; case RTE_FLOW_ITEM_TYPE_VXLAN: ctx->encap_type = EFX_TUNNEL_PROTOCOL_VXLAN; ctx->tunnel_def_mask = &rte_flow_item_vxlan_mask; ctx->tunnel_def_mask_size = sizeof(rte_flow_item_vxlan_mask); break; case RTE_FLOW_ITEM_TYPE_GENEVE: ctx->encap_type = EFX_TUNNEL_PROTOCOL_GENEVE; ctx->tunnel_def_mask = &rte_flow_item_geneve_mask; ctx->tunnel_def_mask_size = sizeof(rte_flow_item_geneve_mask); break; case RTE_FLOW_ITEM_TYPE_NVGRE: ctx->encap_type = EFX_TUNNEL_PROTOCOL_NVGRE; ctx->tunnel_def_mask = &rte_flow_item_nvgre_mask; ctx->tunnel_def_mask_size = sizeof(rte_flow_item_nvgre_mask); break; case RTE_FLOW_ITEM_TYPE_END: break; default: ++pattern; continue; }; break; } switch (ctx->ft_rule_type) { case SFC_FT_RULE_NONE: if (pattern->type == RTE_FLOW_ITEM_TYPE_END) return 0; break; case SFC_FT_RULE_TUNNEL: if (pattern->type != RTE_FLOW_ITEM_TYPE_END) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, pattern, "FT: TUNNEL: invalid item"); } ctx->encap_type = ctx->ft_ctx->encap_type; break; case SFC_FT_RULE_SWITCH: if (pattern->type == RTE_FLOW_ITEM_TYPE_END) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "FT: SWITCH: missing tunnel item"); } else if (ctx->encap_type != ctx->ft_ctx->encap_type) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ITEM, pattern, "FT: SWITCH: tunnel type mismatch"); } /* * The HW/FW hasn't got support for the use of "ENC" fields in * action rules (except the VNET_ID one) yet. As a workaround, * start parsing the pattern from the tunnel item. */ ctx->pattern = pattern; break; default: SFC_ASSERT(B_FALSE); break; } if ((mae->encap_types_supported & (1U << ctx->encap_type)) == 0) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: unsupported tunnel type"); } switch (ctx->ft_rule_type) { case SFC_FT_RULE_TUNNEL: recirc_id = SFC_FT_CTX_ID_TO_CTX_MARK(ctx->ft_ctx->id); if (sfc_mae_conntrack_is_supported(sa)) { /* * Request lookup in conntrack table since SWITCH rules * are eligible to utilise this type of assistance. */ request_ct = true; } /* FALLTHROUGH */ case SFC_FT_RULE_NONE: if (ctx->priority >= mae->nb_outer_rule_prios_max) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ATTR_PRIORITY, NULL, "OR: unsupported priority level"); } rc = efx_mae_match_spec_init(sa->nic, EFX_MAE_RULE_OUTER, ctx->priority, &ctx->match_spec_outer); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: failed to initialise the match specification"); } /* * Outermost items comprise a match * specification of type OUTER. */ ctx->match_spec = ctx->match_spec_outer; /* Outermost items use "ENC" EFX MAE field IDs. */ ctx->field_ids_remap = field_ids_remap_to_encap; rc = efx_mae_outer_rule_recirc_id_set(ctx->match_spec, recirc_id); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: failed to initialise RECIRC_ID"); } if (!request_ct) break; rc = efx_mae_outer_rule_do_ct_set(ctx->match_spec_outer); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "OR: failed to request CT lookup"); } break; case SFC_FT_RULE_SWITCH: /* Outermost items -> "ENC" match fields in the action rule. */ ctx->field_ids_remap = field_ids_remap_to_encap; ctx->match_spec = ctx->match_spec_action; /* No own outer rule; match on TUNNEL OR's RECIRC_ID is used. */ ctx->encap_type = EFX_TUNNEL_PROTOCOL_NONE; break; default: SFC_ASSERT(B_FALSE); break; } return 0; } static void sfc_mae_rule_encap_parse_fini(struct sfc_adapter *sa, struct sfc_mae_parse_ctx *ctx) { if (ctx->match_spec_outer != NULL) efx_mae_match_spec_fini(sa->nic, ctx->match_spec_outer); } static int sfc_mae_rule_parse_pattern(struct sfc_adapter *sa, const struct rte_flow_item pattern[], struct rte_flow *flow, struct sfc_mae_action_rule_ctx *action_rule_ctx, struct rte_flow_error *error) { struct sfc_flow_spec_mae *spec = &flow->spec.mae; struct sfc_mae_outer_rule **outer_rulep; struct sfc_mae_parse_ctx ctx_mae; unsigned int priority_shift = 0; struct sfc_flow_parse_ctx ctx; int rc; memset(&ctx_mae, 0, sizeof(ctx_mae)); ctx_mae.ft_rule_type = spec->ft_rule_type; ctx_mae.internal = flow->internal; ctx_mae.priority = spec->priority; ctx_mae.ft_ctx = spec->ft_ctx; ctx_mae.sa = sa; outer_rulep = &action_rule_ctx->outer_rule; switch (ctx_mae.ft_rule_type) { case SFC_FT_RULE_TUNNEL: /* * By design, this flow should be represented solely by the * outer rule. But the HW/FW hasn't got support for setting * Rx mark from RECIRC_ID on outer rule lookup yet. Neither * does it support outer rule counters. As a workaround, an * action rule of lower priority is used to do the job. */ priority_shift = 1; /* FALLTHROUGH */ case SFC_FT_RULE_SWITCH: if (ctx_mae.priority != 0) { /* * Because of the above workaround, deny the use * of priorities to TUNNEL and SWITCH rules. */ rc = rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ATTR_PRIORITY, NULL, "FT: priorities are not supported"); goto fail_priority_check; } /* FALLTHROUGH */ case SFC_FT_RULE_NONE: rc = efx_mae_match_spec_init(sa->nic, EFX_MAE_RULE_ACTION, spec->priority + priority_shift, &ctx_mae.match_spec_action); if (rc != 0) { rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to initialise the match specification"); goto fail_init_match_spec_action; } break; default: rc = rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "FT: unexpected rule type"); goto fail_unexpected_ft_rule_type; } /* * As a preliminary setting, assume that there is no encapsulation * in the pattern. That is, pattern items are about to comprise a * match specification of type ACTION and use non-encap. field IDs. * * sfc_mae_rule_encap_parse_init() below may override this. */ ctx_mae.encap_type = EFX_TUNNEL_PROTOCOL_NONE; ctx_mae.match_spec = ctx_mae.match_spec_action; ctx_mae.field_ids_remap = field_ids_no_remap; ctx_mae.pattern = pattern; ctx.type = SFC_FLOW_PARSE_CTX_MAE; ctx.mae = &ctx_mae; rc = sfc_mae_rule_encap_parse_init(sa, &ctx_mae, error); if (rc != 0) goto fail_encap_parse_init; /* * sfc_mae_rule_encap_parse_init() may have detected tunnel offload * SWITCH rule. Remember its properties for later use. */ spec->ft_rule_type = ctx_mae.ft_rule_type; spec->ft_ctx = ctx_mae.ft_ctx; rc = sfc_flow_parse_pattern(sa, sfc_flow_items, RTE_DIM(sfc_flow_items), ctx_mae.pattern, &ctx, error); if (rc != 0) goto fail_parse_pattern; rc = sfc_mae_rule_process_pattern_data(&ctx_mae, error); if (rc != 0) goto fail_process_pattern_data; rc = sfc_mae_rule_process_ct(sa, &ctx_mae, action_rule_ctx, spec, error); if (rc != 0) goto fail_process_ct; rc = sfc_mae_rule_process_outer(sa, &ctx_mae, outer_rulep, error); if (rc != 0) goto fail_process_outer; if (ctx_mae.match_spec_action != NULL && !efx_mae_match_spec_is_valid(sa->nic, ctx_mae.match_spec_action)) { rc = rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM, NULL, "Inconsistent pattern"); goto fail_validate_match_spec_action; } action_rule_ctx->match_spec = ctx_mae.match_spec_action; return 0; fail_validate_match_spec_action: fail_process_outer: fail_process_ct: fail_process_pattern_data: fail_parse_pattern: sfc_mae_rule_encap_parse_fini(sa, &ctx_mae); fail_encap_parse_init: if (ctx_mae.match_spec_action != NULL) efx_mae_match_spec_fini(sa->nic, ctx_mae.match_spec_action); fail_unexpected_ft_rule_type: fail_init_match_spec_action: fail_priority_check: return rc; } static int sfc_mae_rule_parse_action_set_mac(struct sfc_adapter *sa, enum sfc_mae_mac_addr_type type, const struct rte_flow_action_set_mac *conf, struct sfc_mae_aset_ctx *ctx, struct rte_flow_error *error) { struct sfc_mae_mac_addr **mac_addrp; int rc; if (conf == NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "the MAC address entry definition is NULL"); } switch (type) { case SFC_MAE_MAC_ADDR_DST: rc = efx_mae_action_set_populate_set_dst_mac(ctx->spec); mac_addrp = &ctx->dst_mac; break; case SFC_MAE_MAC_ADDR_SRC: rc = efx_mae_action_set_populate_set_src_mac(ctx->spec); mac_addrp = &ctx->src_mac; break; default: rc = EINVAL; break; } if (rc != 0) goto error; *mac_addrp = sfc_mae_mac_addr_attach(sa, conf->mac_addr); if (*mac_addrp != NULL) return 0; rc = sfc_mae_mac_addr_add(sa, conf->mac_addr, mac_addrp); if (rc != 0) goto error; return 0; error: return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "failed to request set MAC action"); } /* * An action supported by MAE may correspond to a bundle of RTE flow actions, * in example, VLAN_PUSH = OF_PUSH_VLAN + OF_VLAN_SET_VID + OF_VLAN_SET_PCP. * That is, related RTE flow actions need to be tracked as parts of a whole * so that they can be combined into a single action and submitted to MAE * representation of a given rule's action set. * * Each RTE flow action provided by an application gets classified as * one belonging to some bundle type. If an action is not supposed to * belong to any bundle, or if this action is END, it is described as * one belonging to a dummy bundle of type EMPTY. * * A currently tracked bundle will be submitted if a repeating * action or an action of different bundle type follows. */ enum sfc_mae_actions_bundle_type { SFC_MAE_ACTIONS_BUNDLE_EMPTY = 0, SFC_MAE_ACTIONS_BUNDLE_VLAN_PUSH, SFC_MAE_ACTIONS_BUNDLE_NAT_DST, SFC_MAE_ACTIONS_BUNDLE_NAT_SRC, }; struct sfc_mae_actions_bundle { enum sfc_mae_actions_bundle_type type; /* Indicates actions already tracked by the current bundle */ uint64_t actions_mask; /* Parameters used by SFC_MAE_ACTIONS_BUNDLE_VLAN_PUSH */ rte_be16_t vlan_push_tpid; rte_be16_t vlan_push_tci; }; /* * Combine configuration of RTE flow actions tracked by the bundle into a * single action and submit the result to MAE action set specification. * Do nothing in the case of dummy action bundle. */ static int sfc_mae_actions_bundle_submit(const struct sfc_mae_actions_bundle *bundle, struct sfc_flow_spec_mae *flow_spec, bool ct, efx_mae_actions_t *spec) { int rc = 0; switch (bundle->type) { case SFC_MAE_ACTIONS_BUNDLE_EMPTY: break; case SFC_MAE_ACTIONS_BUNDLE_VLAN_PUSH: rc = efx_mae_action_set_populate_vlan_push( spec, bundle->vlan_push_tpid, bundle->vlan_push_tci); break; case SFC_MAE_ACTIONS_BUNDLE_NAT_DST: flow_spec->ct_resp.nat.dir_is_dst = true; /* FALLTHROUGH */ case SFC_MAE_ACTIONS_BUNDLE_NAT_SRC: if (ct && flow_spec->ct_resp.nat.ip_le != 0 && flow_spec->ct_resp.nat.port_le != 0) rc = efx_mae_action_set_populate_nat(spec); else rc = EINVAL; break; default: SFC_ASSERT(B_FALSE); break; } return rc; } /* * Given the type of the next RTE flow action in the line, decide * whether a new bundle is about to start, and, if this is the case, * submit and reset the current bundle. */ static int sfc_mae_actions_bundle_sync(const struct rte_flow_action *action, struct sfc_mae_actions_bundle *bundle, struct sfc_flow_spec_mae *flow_spec, efx_mae_actions_t *spec, bool ct, struct rte_flow_error *error) { enum sfc_mae_actions_bundle_type bundle_type_new; int rc; switch (action->type) { case RTE_FLOW_ACTION_TYPE_OF_PUSH_VLAN: case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_VID: case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_PCP: bundle_type_new = SFC_MAE_ACTIONS_BUNDLE_VLAN_PUSH; break; case RTE_FLOW_ACTION_TYPE_SET_IPV4_DST: case RTE_FLOW_ACTION_TYPE_SET_TP_DST: bundle_type_new = SFC_MAE_ACTIONS_BUNDLE_NAT_DST; break; case RTE_FLOW_ACTION_TYPE_SET_IPV4_SRC: case RTE_FLOW_ACTION_TYPE_SET_TP_SRC: bundle_type_new = SFC_MAE_ACTIONS_BUNDLE_NAT_SRC; break; default: /* * Self-sufficient actions, including END, are handled in this * case. No checks for unsupported actions are needed here * because parsing doesn't occur at this point. */ bundle_type_new = SFC_MAE_ACTIONS_BUNDLE_EMPTY; break; } if (bundle_type_new != bundle->type || (bundle->actions_mask & (1ULL << action->type)) != 0) { rc = sfc_mae_actions_bundle_submit(bundle, flow_spec, ct, spec); if (rc != 0) goto fail_submit; memset(bundle, 0, sizeof(*bundle)); } bundle->type = bundle_type_new; return 0; fail_submit: return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "Failed to request the (group of) action(s)"); } static void sfc_mae_rule_parse_action_nat_addr(const struct rte_flow_action_set_ipv4 *conf, uint32_t *nat_addr_le) { *nat_addr_le = rte_bswap32(conf->ipv4_addr); } static void sfc_mae_rule_parse_action_nat_port(const struct rte_flow_action_set_tp *conf, uint16_t *nat_port_le) { *nat_port_le = rte_bswap16(conf->port); } static void sfc_mae_rule_parse_action_of_push_vlan( const struct rte_flow_action_of_push_vlan *conf, struct sfc_mae_actions_bundle *bundle) { bundle->vlan_push_tpid = conf->ethertype; } static void sfc_mae_rule_parse_action_of_set_vlan_vid( const struct rte_flow_action_of_set_vlan_vid *conf, struct sfc_mae_actions_bundle *bundle) { bundle->vlan_push_tci |= (conf->vlan_vid & rte_cpu_to_be_16(RTE_LEN2MASK(12, uint16_t))); } static void sfc_mae_rule_parse_action_of_set_vlan_pcp( const struct rte_flow_action_of_set_vlan_pcp *conf, struct sfc_mae_actions_bundle *bundle) { uint16_t vlan_tci_pcp = (uint16_t)(conf->vlan_pcp & RTE_LEN2MASK(3, uint8_t)) << 13; bundle->vlan_push_tci |= rte_cpu_to_be_16(vlan_tci_pcp); } struct sfc_mae_parsed_item { const struct rte_flow_item *item; size_t proto_header_ofst; size_t proto_header_size; }; /* * For each 16-bit word of the given header, override * bits enforced by the corresponding 16-bit mask. */ static void sfc_mae_header_force_item_masks(uint8_t *header_buf, const struct sfc_mae_parsed_item *parsed_items, unsigned int nb_parsed_items) { unsigned int item_idx; for (item_idx = 0; item_idx < nb_parsed_items; ++item_idx) { const struct sfc_mae_parsed_item *parsed_item; const struct rte_flow_item *item; size_t proto_header_size; size_t ofst; parsed_item = &parsed_items[item_idx]; proto_header_size = parsed_item->proto_header_size; item = parsed_item->item; for (ofst = 0; ofst < proto_header_size; ofst += sizeof(rte_be16_t)) { rte_be16_t *wp = RTE_PTR_ADD(header_buf, ofst); const rte_be16_t *w_maskp; const rte_be16_t *w_specp; w_maskp = RTE_PTR_ADD(item->mask, ofst); w_specp = RTE_PTR_ADD(item->spec, ofst); *wp &= ~(*w_maskp); *wp |= (*w_specp & *w_maskp); } header_buf += proto_header_size; } } #define SFC_IPV4_TTL_DEF 0x40 #define SFC_IPV6_VTC_FLOW_DEF 0x60000000 #define SFC_IPV6_HOP_LIMITS_DEF 0xff #define SFC_VXLAN_FLAGS_DEF 0x08000000 static int sfc_mae_rule_parse_action_vxlan_encap( struct sfc_mae *mae, const struct rte_flow_action_vxlan_encap *conf, efx_mae_actions_t *spec, struct rte_flow_error *error) { struct sfc_mae_bounce_eh *bounce_eh = &mae->bounce_eh; struct rte_flow_item *pattern = conf->definition; uint8_t *buf = bounce_eh->buf; /* This array will keep track of non-VOID pattern items. */ struct sfc_mae_parsed_item parsed_items[1 /* Ethernet */ + 2 /* VLAN tags */ + 1 /* IPv4 or IPv6 */ + 1 /* UDP */ + 1 /* VXLAN */]; unsigned int nb_parsed_items = 0; size_t eth_ethertype_ofst = offsetof(struct rte_ether_hdr, ether_type); uint8_t dummy_buf[RTE_MAX(sizeof(struct rte_ipv4_hdr), sizeof(struct rte_ipv6_hdr))]; struct rte_ipv4_hdr *ipv4 = (void *)dummy_buf; struct rte_ipv6_hdr *ipv6 = (void *)dummy_buf; struct rte_vxlan_hdr *vxlan = NULL; struct rte_udp_hdr *udp = NULL; unsigned int nb_vlan_tags = 0; size_t next_proto_ofst = 0; size_t ethertype_ofst = 0; uint64_t exp_items; int rc; if (pattern == NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "The encap. header definition is NULL"); } bounce_eh->type = EFX_TUNNEL_PROTOCOL_VXLAN; bounce_eh->size = 0; /* * Process pattern items and remember non-VOID ones. * Defer applying masks until after the complete header * has been built from the pattern items. */ exp_items = RTE_BIT64(RTE_FLOW_ITEM_TYPE_ETH); for (; pattern->type != RTE_FLOW_ITEM_TYPE_END; ++pattern) { struct sfc_mae_parsed_item *parsed_item; const uint64_t exp_items_extra_vlan[] = { RTE_BIT64(RTE_FLOW_ITEM_TYPE_VLAN), 0 }; size_t proto_header_size; rte_be16_t *ethertypep; uint8_t *next_protop; uint8_t *buf_cur; if (pattern->spec == NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "NULL item spec in the encap. header"); } if (pattern->mask == NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "NULL item mask in the encap. header"); } if (pattern->last != NULL) { /* This is not a match pattern, so disallow range. */ return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "Range item in the encap. header"); } if (pattern->type == RTE_FLOW_ITEM_TYPE_VOID) { /* Handle VOID separately, for clarity. */ continue; } if ((exp_items & RTE_BIT64(pattern->type)) == 0) { return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "Unexpected item in the encap. header"); } parsed_item = &parsed_items[nb_parsed_items]; buf_cur = buf + bounce_eh->size; switch (pattern->type) { case RTE_FLOW_ITEM_TYPE_ETH: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ITEM_TYPE_ETH, exp_items); RTE_BUILD_BUG_ON(offsetof(struct rte_flow_item_eth, hdr) != 0); proto_header_size = sizeof(struct rte_ether_hdr); ethertype_ofst = eth_ethertype_ofst; exp_items = RTE_BIT64(RTE_FLOW_ITEM_TYPE_VLAN) | RTE_BIT64(RTE_FLOW_ITEM_TYPE_IPV4) | RTE_BIT64(RTE_FLOW_ITEM_TYPE_IPV6); break; case RTE_FLOW_ITEM_TYPE_VLAN: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ITEM_TYPE_VLAN, exp_items); RTE_BUILD_BUG_ON(offsetof(struct rte_flow_item_vlan, hdr) != 0); proto_header_size = sizeof(struct rte_vlan_hdr); ethertypep = RTE_PTR_ADD(buf, eth_ethertype_ofst); *ethertypep = RTE_BE16(RTE_ETHER_TYPE_QINQ); ethertypep = RTE_PTR_ADD(buf, ethertype_ofst); *ethertypep = RTE_BE16(RTE_ETHER_TYPE_VLAN); ethertype_ofst = bounce_eh->size + offsetof(struct rte_vlan_hdr, eth_proto); exp_items = RTE_BIT64(RTE_FLOW_ITEM_TYPE_IPV4) | RTE_BIT64(RTE_FLOW_ITEM_TYPE_IPV6); exp_items |= exp_items_extra_vlan[nb_vlan_tags]; ++nb_vlan_tags; break; case RTE_FLOW_ITEM_TYPE_IPV4: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ITEM_TYPE_IPV4, exp_items); RTE_BUILD_BUG_ON(offsetof(struct rte_flow_item_ipv4, hdr) != 0); proto_header_size = sizeof(struct rte_ipv4_hdr); ethertypep = RTE_PTR_ADD(buf, ethertype_ofst); *ethertypep = RTE_BE16(RTE_ETHER_TYPE_IPV4); next_proto_ofst = bounce_eh->size + offsetof(struct rte_ipv4_hdr, next_proto_id); ipv4 = (struct rte_ipv4_hdr *)buf_cur; exp_items = RTE_BIT64(RTE_FLOW_ITEM_TYPE_UDP); break; case RTE_FLOW_ITEM_TYPE_IPV6: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ITEM_TYPE_IPV6, exp_items); RTE_BUILD_BUG_ON(offsetof(struct rte_flow_item_ipv6, hdr) != 0); proto_header_size = sizeof(struct rte_ipv6_hdr); ethertypep = RTE_PTR_ADD(buf, ethertype_ofst); *ethertypep = RTE_BE16(RTE_ETHER_TYPE_IPV6); next_proto_ofst = bounce_eh->size + offsetof(struct rte_ipv6_hdr, proto); ipv6 = (struct rte_ipv6_hdr *)buf_cur; exp_items = RTE_BIT64(RTE_FLOW_ITEM_TYPE_UDP); break; case RTE_FLOW_ITEM_TYPE_UDP: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ITEM_TYPE_UDP, exp_items); RTE_BUILD_BUG_ON(offsetof(struct rte_flow_item_udp, hdr) != 0); proto_header_size = sizeof(struct rte_udp_hdr); next_protop = RTE_PTR_ADD(buf, next_proto_ofst); *next_protop = IPPROTO_UDP; udp = (struct rte_udp_hdr *)buf_cur; exp_items = RTE_BIT64(RTE_FLOW_ITEM_TYPE_VXLAN); break; case RTE_FLOW_ITEM_TYPE_VXLAN: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ITEM_TYPE_VXLAN, exp_items); RTE_BUILD_BUG_ON(offsetof(struct rte_flow_item_vxlan, hdr) != 0); proto_header_size = sizeof(struct rte_vxlan_hdr); vxlan = (struct rte_vxlan_hdr *)buf_cur; udp->dst_port = RTE_BE16(RTE_VXLAN_DEFAULT_PORT); udp->dgram_len = RTE_BE16(sizeof(*udp) + sizeof(*vxlan)); udp->dgram_cksum = 0; exp_items = 0; break; default: return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "Unknown item in the encap. header"); } if (bounce_eh->size + proto_header_size > bounce_eh->buf_size) { return rte_flow_error_set(error, E2BIG, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "The encap. header is too big"); } if ((proto_header_size & 1) != 0) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "Odd layer size in the encap. header"); } rte_memcpy(buf_cur, pattern->spec, proto_header_size); bounce_eh->size += proto_header_size; parsed_item->item = pattern; parsed_item->proto_header_size = proto_header_size; ++nb_parsed_items; } if (exp_items != 0) { /* Parsing item VXLAN would have reset exp_items to 0. */ return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION_CONF, NULL, "No item VXLAN in the encap. header"); } /* One of the pointers (ipv4, ipv6) refers to a dummy area. */ ipv4->version_ihl = RTE_IPV4_VHL_DEF; ipv4->time_to_live = SFC_IPV4_TTL_DEF; ipv4->total_length = RTE_BE16(sizeof(*ipv4) + sizeof(*udp) + sizeof(*vxlan)); /* The HW cannot compute this checksum. */ ipv4->hdr_checksum = 0; ipv4->hdr_checksum = rte_ipv4_cksum(ipv4); ipv6->vtc_flow = RTE_BE32(SFC_IPV6_VTC_FLOW_DEF); ipv6->hop_limits = SFC_IPV6_HOP_LIMITS_DEF; ipv6->payload_len = udp->dgram_len; vxlan->vx_flags = RTE_BE32(SFC_VXLAN_FLAGS_DEF); /* Take care of the masks. */ sfc_mae_header_force_item_masks(buf, parsed_items, nb_parsed_items); if (spec == NULL) return 0; rc = efx_mae_action_set_populate_encap(spec); if (rc != 0) { rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "failed to request action ENCAP"); } return rc; } static int sfc_mae_rule_parse_action_mark(struct sfc_adapter *sa, const struct rte_flow_action_mark *conf, const struct sfc_flow_spec_mae *spec_mae, efx_mae_actions_t *spec) { int rc; if (spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) { /* Workaround. See sfc_flow_parse_rte_to_mae() */ } else if (conf->id > SFC_FT_USER_MARK_MASK) { sfc_err(sa, "the mark value is too large"); return EINVAL; } rc = efx_mae_action_set_populate_mark(spec, conf->id); if (rc != 0) sfc_err(sa, "failed to request action MARK: %s", strerror(rc)); return rc; } static int sfc_mae_rule_parse_action_count(struct sfc_adapter *sa, const struct rte_flow_action_count *conf, efx_counter_type_t mae_counter_type, struct sfc_mae_counter **counterp, efx_mae_actions_t *spec) { struct sfc_mae_counter counter_tmp = {}; int rc; if ((sa->counter_rxq.state & SFC_COUNTER_RXQ_INITIALIZED) == 0) { sfc_err(sa, "counter queue is not configured for COUNT action"); rc = EINVAL; goto fail_counter_queue_uninit; } if (sfc_get_service_lcore(SOCKET_ID_ANY) == RTE_MAX_LCORE) { rc = EINVAL; goto fail_no_service_core; } if (*counterp != NULL) { sfc_err(sa, "cannot request more than 1 action COUNT per flow"); rc = EINVAL; goto fail_more_than_one; } if (spec != NULL) { rc = efx_mae_action_set_populate_count(spec); if (rc != 0) { sfc_err(sa, "failed to populate counters in MAE action set: %s", rte_strerror(rc)); goto fail_populate_count; } } if (conf != NULL) { counter_tmp.rte_id_valid = true; counter_tmp.rte_id = conf->id; } counter_tmp.type = mae_counter_type; return sfc_mae_counter_add(sa, &counter_tmp, counterp); return 0; fail_populate_count: fail_more_than_one: fail_no_service_core: fail_counter_queue_uninit: return rc; } static int sfc_mae_rule_parse_action_indirect(struct sfc_adapter *sa, bool replayable_only, const struct rte_flow_action_handle *handle, enum sfc_ft_rule_type ft_rule_type, struct sfc_mae_aset_ctx *ctx, struct rte_flow_error *error) { struct rte_flow_action_handle *entry; int rc; TAILQ_FOREACH(entry, &sa->flow_indir_actions, entries) { if (entry == handle) { bool replayable = false; sfc_dbg(sa, "attaching to indirect_action=%p", entry); switch (entry->type) { case RTE_FLOW_ACTION_TYPE_COUNT: replayable = true; break; default: break; } if (replayable_only && !replayable) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "the indirect action handle cannot be used"); } switch (entry->type) { case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP: if (ctx->encap_header != NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "cannot have multiple actions VXLAN_ENCAP in one flow"); } rc = efx_mae_action_set_populate_encap(ctx->spec); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "failed to add ENCAP to MAE action set"); } ctx->encap_header = entry->encap_header; ++(ctx->encap_header->refcnt); break; case RTE_FLOW_ACTION_TYPE_COUNT: if (!replayable_only && ctx->counter != NULL) { /* * Signal the caller to "replay" the action * set context and re-invoke this function. */ return EEXIST; } if (ft_rule_type != SFC_FT_RULE_NONE) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "cannot use indirect count action in tunnel model"); } SFC_ASSERT(ctx->counter == NULL); rc = efx_mae_action_set_populate_count(ctx->spec); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "failed to add COUNT to MAE action set"); } ctx->counter = entry->counter; ++(ctx->counter->refcnt); break; default: SFC_ASSERT(B_FALSE); break; } return 0; } } return rte_flow_error_set(error, ENOENT, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "indirect action handle not found"); } static int sfc_mae_rule_parse_action_pf_vf(struct sfc_adapter *sa, const struct rte_flow_action_vf *vf_conf, efx_mae_actions_t *spec) { const efx_nic_cfg_t *encp = efx_nic_cfg_get(sa->nic); efx_mport_sel_t mport; uint32_t vf; int rc; if (vf_conf == NULL) vf = EFX_PCI_VF_INVALID; else if (vf_conf->original != 0) vf = encp->enc_vf; else vf = vf_conf->id; rc = efx_mae_mport_by_pcie_function(encp->enc_pf, vf, &mport); if (rc != 0) { sfc_err(sa, "failed to convert PF %u VF %d to m-port: %s", encp->enc_pf, (vf != EFX_PCI_VF_INVALID) ? (int)vf : -1, strerror(rc)); return rc; } rc = efx_mae_action_set_populate_deliver(spec, &mport); if (rc != 0) { sfc_err(sa, "failed to request action DELIVER with m-port selector 0x%08x: %s", mport.sel, strerror(rc)); } return rc; } static int sfc_mae_rule_parse_action_port_id(struct sfc_adapter *sa, const struct rte_flow_action_port_id *conf, efx_mae_actions_t *spec) { struct sfc_adapter_shared * const sas = sfc_sa2shared(sa); struct sfc_mae *mae = &sa->mae; unsigned int type_mask; efx_mport_sel_t mport; uint16_t port_id; int rc; if (conf->id > UINT16_MAX) return EOVERFLOW; port_id = (conf->original != 0) ? sas->port_id : conf->id; type_mask = 1U << SFC_MAE_SWITCH_PORT_INDEPENDENT; rc = sfc_mae_switch_get_ethdev_mport(mae->switch_domain_id, port_id, type_mask, &mport); if (rc != 0) { sfc_err(sa, "failed to get m-port for the given ethdev (port_id=%u): %s", port_id, strerror(rc)); return rc; } rc = efx_mae_action_set_populate_deliver(spec, &mport); if (rc != 0) { sfc_err(sa, "failed to request action DELIVER with m-port selector 0x%08x: %s", mport.sel, strerror(rc)); } return rc; } static int sfc_mae_rule_parse_action_port_representor(struct sfc_adapter *sa, const struct rte_flow_action_ethdev *conf, unsigned int type_mask, efx_mae_actions_t *spec) { struct sfc_mae *mae = &sa->mae; efx_mport_sel_t mport; int rc; rc = sfc_mae_switch_get_ethdev_mport(mae->switch_domain_id, conf->port_id, type_mask, &mport); if (rc != 0) { sfc_err(sa, "failed to get m-port for the given ethdev (port_id=%u): %s", conf->port_id, strerror(rc)); return rc; } rc = efx_mae_action_set_populate_deliver(spec, &mport); if (rc != 0) { sfc_err(sa, "failed to request action DELIVER with m-port selector 0x%08x: %s", mport.sel, strerror(rc)); } return rc; } static int sfc_mae_rule_parse_action_represented_port(struct sfc_adapter *sa, const struct rte_flow_action_ethdev *conf, efx_mae_actions_t *spec) { struct sfc_mae *mae = &sa->mae; efx_mport_sel_t mport; int rc; rc = sfc_mae_switch_get_entity_mport(mae->switch_domain_id, conf->port_id, &mport); if (rc != 0) { sfc_err(sa, "failed to get m-port for the given ethdev (port_id=%u): %s", conf->port_id, strerror(rc)); return rc; } rc = efx_mae_action_set_populate_deliver(spec, &mport); if (rc != 0) { sfc_err(sa, "failed to request action DELIVER with m-port selector 0x%08x: %s", mport.sel, strerror(rc)); } return rc; } static const char * const action_names[] = { [RTE_FLOW_ACTION_TYPE_VXLAN_DECAP] = "VXLAN_DECAP", [RTE_FLOW_ACTION_TYPE_OF_POP_VLAN] = "OF_POP_VLAN", [RTE_FLOW_ACTION_TYPE_SET_MAC_DST] = "SET_MAC_DST", [RTE_FLOW_ACTION_TYPE_SET_MAC_SRC] = "SET_MAC_SRC", [RTE_FLOW_ACTION_TYPE_OF_DEC_NW_TTL] = "OF_DEC_NW_TTL", [RTE_FLOW_ACTION_TYPE_DEC_TTL] = "DEC_TTL", [RTE_FLOW_ACTION_TYPE_SET_IPV4_DST] = "SET_IPV4_DST", [RTE_FLOW_ACTION_TYPE_SET_IPV4_SRC] = "SET_IPV4_SRC", [RTE_FLOW_ACTION_TYPE_SET_TP_DST] = "SET_TP_DST", [RTE_FLOW_ACTION_TYPE_SET_TP_SRC] = "SET_TP_SRC", [RTE_FLOW_ACTION_TYPE_OF_PUSH_VLAN] = "OF_PUSH_VLAN", [RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_VID] = "OF_SET_VLAN_VID", [RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_PCP] = "OF_SET_VLAN_PCP", [RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP] = "VXLAN_ENCAP", [RTE_FLOW_ACTION_TYPE_COUNT] = "COUNT", [RTE_FLOW_ACTION_TYPE_INDIRECT] = "INDIRECT", [RTE_FLOW_ACTION_TYPE_FLAG] = "FLAG", [RTE_FLOW_ACTION_TYPE_MARK] = "MARK", [RTE_FLOW_ACTION_TYPE_PF] = "PF", [RTE_FLOW_ACTION_TYPE_VF] = "VF", [RTE_FLOW_ACTION_TYPE_PORT_ID] = "PORT_ID", [RTE_FLOW_ACTION_TYPE_PORT_REPRESENTOR] = "PORT_REPRESENTOR", [RTE_FLOW_ACTION_TYPE_REPRESENTED_PORT] = "REPRESENTED_PORT", [RTE_FLOW_ACTION_TYPE_DROP] = "DROP", [RTE_FLOW_ACTION_TYPE_JUMP] = "JUMP", }; static void sfc_mae_bounce_eh_invalidate(struct sfc_mae_bounce_eh *bounce_eh); static int sfc_mae_process_encap_header(struct sfc_adapter *sa, const struct sfc_mae_bounce_eh *bounce_eh, struct sfc_mae_encap_header **encap_headerp); static int sfc_mae_aset_ctx_replay(struct sfc_adapter *sa, struct sfc_mae_aset_ctx **ctxp) { const struct sfc_mae_aset_ctx *ctx_cur; struct sfc_mae_aset_ctx *ctx_new; struct sfc_mae *mae = &sa->mae; int rc; RTE_BUILD_BUG_ON(EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES == 0); /* Check the number of complete action set contexts. */ if (mae->nb_bounce_asets >= (EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES - 1)) return ENOSPC; ctx_cur = &mae->bounce_aset_ctxs[mae->nb_bounce_asets]; ++(mae->nb_bounce_asets); ctx_new = &mae->bounce_aset_ctxs[mae->nb_bounce_asets]; *ctx_new = *ctx_cur; ctx_new->counter = NULL; ctx_new->fate_set = false; /* * This clones the action set specification and drops * actions COUNT and DELIVER from the clone so that * such can be added to it by later action parsing. */ rc = efx_mae_action_set_replay(sa->nic, ctx_cur->spec, &ctx_new->spec); if (rc != 0) return rc; *ctxp = ctx_new; return 0; } static int sfc_mae_rule_parse_action_rc(struct sfc_adapter *sa, struct sfc_mae_actions_bundle *bundle, const struct rte_flow_action *action, struct rte_flow_error *error, int rc, bool custom_error) { if (rc == 0) { bundle->actions_mask |= (1ULL << action->type); } else if (!custom_error) { if (action->type < RTE_DIM(action_names)) { const char *action_name = action_names[action->type]; if (action_name != NULL) { sfc_err(sa, "action %s was rejected: %s", action_name, strerror(rc)); } } rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "Failed to request the action"); } return rc; } static int sfc_mae_rule_parse_action_replayable(struct sfc_adapter *sa, const struct rte_flow *flow, struct sfc_mae_actions_bundle *bundle, const struct rte_flow_action *action, struct sfc_mae_aset_ctx *ctx, struct rte_flow_error *error) { const struct sfc_flow_spec_mae *spec_mae = &flow->spec.mae; efx_mae_actions_t *spec = ctx->spec; unsigned int switch_port_type_mask; bool custom_error = false; bool new_fate_set = false; bool need_replay = false; int rc; /* * Decide whether the current action set context is * complete. If yes, "replay" it = go to a new one. */ switch (action->type) { case RTE_FLOW_ACTION_TYPE_INDIRECT: if (ctx->fate_set || ctx->counter != NULL) need_replay = true; break; case RTE_FLOW_ACTION_TYPE_PF: case RTE_FLOW_ACTION_TYPE_VF: case RTE_FLOW_ACTION_TYPE_PORT_ID: case RTE_FLOW_ACTION_TYPE_PORT_REPRESENTOR: case RTE_FLOW_ACTION_TYPE_REPRESENTED_PORT: /* FALLTHROUGH */ case RTE_FLOW_ACTION_TYPE_DROP: if (ctx->fate_set) need_replay = true; new_fate_set = true; break; default: return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "Unsupported action"); } if (need_replay) { if (spec_mae->ft_rule_type != SFC_FT_RULE_NONE) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "no support for packet replay in tunnel offload"); } if (!ctx->fate_set) { /* * With regard to replayable actions, the current action * set is only needed to hold one of the counters. * That is, it does not have a fate action, so * add one to suppress undesired delivery. */ rc = efx_mae_action_set_populate_drop(spec); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "failed to auto-add action DROP"); } } rc = sfc_mae_aset_ctx_replay(sa, &ctx); if (rc != 0) { return rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "failed to replay the action set"); } spec = ctx->spec; } ctx->fate_set = new_fate_set; switch (action->type) { case RTE_FLOW_ACTION_TYPE_INDIRECT: rc = sfc_mae_rule_parse_action_indirect(sa, true, action->conf, spec_mae->ft_rule_type, ctx, error); custom_error = true; break; case RTE_FLOW_ACTION_TYPE_PF: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_PF, bundle->actions_mask); rc = sfc_mae_rule_parse_action_pf_vf(sa, NULL, spec); break; case RTE_FLOW_ACTION_TYPE_VF: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_VF, bundle->actions_mask); rc = sfc_mae_rule_parse_action_pf_vf(sa, action->conf, spec); break; case RTE_FLOW_ACTION_TYPE_PORT_ID: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_PORT_ID, bundle->actions_mask); rc = sfc_mae_rule_parse_action_port_id(sa, action->conf, spec); break; case RTE_FLOW_ACTION_TYPE_PORT_REPRESENTOR: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_PORT_REPRESENTOR, bundle->actions_mask); switch_port_type_mask = 1U << SFC_MAE_SWITCH_PORT_INDEPENDENT; if (flow->internal) { switch_port_type_mask |= 1U << SFC_MAE_SWITCH_PORT_REPRESENTOR; } rc = sfc_mae_rule_parse_action_port_representor(sa, action->conf, switch_port_type_mask, spec); break; case RTE_FLOW_ACTION_TYPE_REPRESENTED_PORT: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_REPRESENTED_PORT, bundle->actions_mask); rc = sfc_mae_rule_parse_action_represented_port(sa, action->conf, spec); break; case RTE_FLOW_ACTION_TYPE_DROP: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_DROP, bundle->actions_mask); rc = efx_mae_action_set_populate_drop(spec); break; default: SFC_ASSERT(B_FALSE); break; } return sfc_mae_rule_parse_action_rc(sa, bundle, action, error, rc, custom_error); } static int sfc_mae_rule_parse_action(struct sfc_adapter *sa, const struct rte_flow_action *action, struct rte_flow *flow, bool ct, struct sfc_mae_actions_bundle *bundle, struct rte_flow_error *error) { struct sfc_flow_spec_mae *spec_mae = &flow->spec.mae; const struct sfc_mae_outer_rule *outer_rule = spec_mae->outer_rule; efx_counter_type_t mae_counter_type = EFX_COUNTER_TYPE_ACTION; const uint64_t rx_metadata = sa->negotiated_rx_metadata; struct sfc_mae_counter **counterp; bool non_replayable_found = true; struct sfc_mae *mae = &sa->mae; struct sfc_mae_aset_ctx *ctx; efx_mae_actions_t *spec_ptr; bool custom_error = B_FALSE; efx_mae_actions_t *spec; int rc = 0; /* Check the number of complete action set contexts. */ if (mae->nb_bounce_asets > (EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES - 1)) { return sfc_mae_rule_parse_action_rc(sa, bundle, action, error, ENOSPC, custom_error); } ctx = &mae->bounce_aset_ctxs[mae->nb_bounce_asets]; counterp = &ctx->counter; spec = ctx->spec; spec_ptr = spec; if (ct) { mae_counter_type = EFX_COUNTER_TYPE_CONNTRACK; counterp = &spec_mae->ct_counter; spec_ptr = NULL; } if (mae->nb_bounce_asets != 0 || ctx->fate_set) { /* * When at least one delivery action has been encountered, * non-replayable actions (packet edits, for instance) * will be turned down. */ return sfc_mae_rule_parse_action_replayable(sa, flow, bundle, action, ctx, error); } switch (action->type) { case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_VXLAN_DECAP, bundle->actions_mask); if (outer_rule == NULL || outer_rule->encap_type != EFX_TUNNEL_PROTOCOL_VXLAN) rc = EINVAL; else rc = efx_mae_action_set_populate_decap(spec); break; case RTE_FLOW_ACTION_TYPE_OF_POP_VLAN: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_OF_POP_VLAN, bundle->actions_mask); rc = efx_mae_action_set_populate_vlan_pop(spec); break; case RTE_FLOW_ACTION_TYPE_SET_MAC_DST: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_SET_MAC_DST, bundle->actions_mask); rc = sfc_mae_rule_parse_action_set_mac(sa, SFC_MAE_MAC_ADDR_DST, action->conf, ctx, error); custom_error = B_TRUE; break; case RTE_FLOW_ACTION_TYPE_SET_MAC_SRC: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_SET_MAC_SRC, bundle->actions_mask); rc = sfc_mae_rule_parse_action_set_mac(sa, SFC_MAE_MAC_ADDR_SRC, action->conf, ctx, error); custom_error = B_TRUE; break; case RTE_FLOW_ACTION_TYPE_OF_DEC_NW_TTL: case RTE_FLOW_ACTION_TYPE_DEC_TTL: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_OF_DEC_NW_TTL, bundle->actions_mask); SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_DEC_TTL, bundle->actions_mask); rc = efx_mae_action_set_populate_decr_ip_ttl(spec); break; case RTE_FLOW_ACTION_TYPE_SET_IPV4_DST: case RTE_FLOW_ACTION_TYPE_SET_IPV4_SRC: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_SET_IPV4_DST, bundle->actions_mask); SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_SET_IPV4_SRC, bundle->actions_mask); sfc_mae_rule_parse_action_nat_addr(action->conf, &spec_mae->ct_resp.nat.ip_le); break; case RTE_FLOW_ACTION_TYPE_SET_TP_DST: case RTE_FLOW_ACTION_TYPE_SET_TP_SRC: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_SET_TP_DST, bundle->actions_mask); SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_SET_TP_SRC, bundle->actions_mask); sfc_mae_rule_parse_action_nat_port(action->conf, &spec_mae->ct_resp.nat.port_le); break; case RTE_FLOW_ACTION_TYPE_OF_PUSH_VLAN: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_OF_PUSH_VLAN, bundle->actions_mask); sfc_mae_rule_parse_action_of_push_vlan(action->conf, bundle); break; case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_VID: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_VID, bundle->actions_mask); sfc_mae_rule_parse_action_of_set_vlan_vid(action->conf, bundle); break; case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_PCP: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_PCP, bundle->actions_mask); sfc_mae_rule_parse_action_of_set_vlan_pcp(action->conf, bundle); break; case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP, bundle->actions_mask); /* Cleanup after previous encap. header bounce buffer usage. */ sfc_mae_bounce_eh_invalidate(&mae->bounce_eh); rc = sfc_mae_rule_parse_action_vxlan_encap(mae, action->conf, spec, error); if (rc == 0) { rc = sfc_mae_process_encap_header(sa, &mae->bounce_eh, &ctx->encap_header); } else { custom_error = true; } break; case RTE_FLOW_ACTION_TYPE_COUNT: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_COUNT, bundle->actions_mask); rc = sfc_mae_rule_parse_action_count(sa, action->conf, mae_counter_type, counterp, spec_ptr); break; case RTE_FLOW_ACTION_TYPE_INDIRECT: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_INDIRECT, bundle->actions_mask); rc = sfc_mae_rule_parse_action_indirect(sa, false, action->conf, spec_mae->ft_rule_type, ctx, error); if (rc == EEXIST) { /* Handle the action as a replayable one below. */ non_replayable_found = false; } custom_error = B_TRUE; break; case RTE_FLOW_ACTION_TYPE_FLAG: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_FLAG, bundle->actions_mask); if ((rx_metadata & RTE_ETH_RX_METADATA_USER_FLAG) != 0) { rc = efx_mae_action_set_populate_flag(spec); } else { rc = rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION, action, "flag delivery has not been negotiated"); custom_error = B_TRUE; } break; case RTE_FLOW_ACTION_TYPE_MARK: SFC_BUILD_SET_OVERFLOW(RTE_FLOW_ACTION_TYPE_MARK, bundle->actions_mask); if ((rx_metadata & RTE_ETH_RX_METADATA_USER_MARK) != 0 || spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) { rc = sfc_mae_rule_parse_action_mark(sa, action->conf, spec_mae, spec); } else { rc = rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION, action, "mark delivery has not been negotiated"); custom_error = B_TRUE; } break; case RTE_FLOW_ACTION_TYPE_JUMP: if (spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) { /* Workaround. See sfc_flow_parse_rte_to_mae() */ break; } /* FALLTHROUGH */ default: non_replayable_found = false; } if (non_replayable_found) { return sfc_mae_rule_parse_action_rc(sa, bundle, action, error, rc, custom_error); } return sfc_mae_rule_parse_action_replayable(sa, flow, bundle, action, ctx, error); } static void sfc_mae_bounce_eh_invalidate(struct sfc_mae_bounce_eh *bounce_eh) { bounce_eh->type = EFX_TUNNEL_PROTOCOL_NONE; } static int sfc_mae_process_encap_header(struct sfc_adapter *sa, const struct sfc_mae_bounce_eh *bounce_eh, struct sfc_mae_encap_header **encap_headerp) { if (bounce_eh->type == EFX_TUNNEL_PROTOCOL_NONE) { encap_headerp = NULL; return 0; } *encap_headerp = sfc_mae_encap_header_attach(sa, bounce_eh); if (*encap_headerp != NULL) return 0; return sfc_mae_encap_header_add(sa, bounce_eh, encap_headerp); } static int sfc_mae_rule_process_replay(struct sfc_adapter *sa, struct sfc_mae_action_rule_ctx *action_rule_ctx) { struct sfc_mae_action_set *base_aset; struct sfc_mae_action_set **asetp; struct sfc_mae *mae = &sa->mae; struct sfc_mae_aset_ctx *ctx; unsigned int i; unsigned int j; int rc; if (mae->nb_bounce_asets == 1) return 0; mae->bounce_aset_ptrs[0] = action_rule_ctx->action_set; base_aset = mae->bounce_aset_ptrs[0]; for (i = 1; i < mae->nb_bounce_asets; ++i) { asetp = &mae->bounce_aset_ptrs[i]; ctx = &mae->bounce_aset_ctxs[i]; *asetp = sfc_mae_action_set_attach(sa, ctx); if (*asetp != NULL) { efx_mae_action_set_spec_fini(sa->nic, ctx->spec); sfc_mae_counter_del(sa, ctx->counter); continue; } rc = sfc_mae_action_set_add(sa, ctx, asetp); if (rc != 0) goto fail_action_set_add; if (base_aset->encap_header != NULL) ++(base_aset->encap_header->refcnt); if (base_aset->dst_mac_addr != NULL) ++(base_aset->dst_mac_addr->refcnt); if (base_aset->src_mac_addr != NULL) ++(base_aset->src_mac_addr->refcnt); } action_rule_ctx->action_set_list = sfc_mae_action_set_list_attach(sa); if (action_rule_ctx->action_set_list != NULL) { for (i = 0; i < mae->nb_bounce_asets; ++i) sfc_mae_action_set_del(sa, mae->bounce_aset_ptrs[i]); } else { rc = sfc_mae_action_set_list_add(sa, &action_rule_ctx->action_set_list); if (rc != 0) goto fail_action_set_list_add; } action_rule_ctx->action_set = NULL; return 0; fail_action_set_list_add: fail_action_set_add: for (j = i; j < mae->nb_bounce_asets; ++j) { ctx = &mae->bounce_aset_ctxs[j]; efx_mae_action_set_spec_fini(sa->nic, ctx->spec); sfc_mae_counter_del(sa, ctx->counter); } while (--i > 0) sfc_mae_action_set_del(sa, mae->bounce_aset_ptrs[i]); return rc; } static int sfc_mae_rule_parse_actions(struct sfc_adapter *sa, const struct rte_flow_action actions[], struct rte_flow *flow, struct sfc_mae_action_rule_ctx *action_rule_ctx, struct rte_flow_error *error) { struct sfc_flow_spec_mae *spec_mae = &flow->spec.mae; struct sfc_mae_actions_bundle bundle = {0}; bool ct = (action_rule_ctx->ct_mark != 0); const struct rte_flow_action *action; struct sfc_mae_aset_ctx *last_ctx; struct sfc_mae *mae = &sa->mae; struct sfc_mae_aset_ctx *ctx; int rc; rte_errno = 0; if (actions == NULL) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION_NUM, NULL, "NULL actions"); } /* * Cleanup after action parsing of the previous flow. * * This particular variable always points at the * 1st (base) action set context, which can hold * both non-replayable and replayable actions. */ ctx = &mae->bounce_aset_ctxs[0]; memset(ctx, 0, sizeof(*ctx)); mae->nb_bounce_asets = 0; rc = efx_mae_action_set_spec_init(sa->nic, &ctx->spec); if (rc != 0) goto fail_action_set_spec_init; if (spec_mae->ft_rule_type == SFC_FT_RULE_SWITCH) { bool have_user_action_count = false; /* TUNNEL rules don't decapsulate packets. SWITCH rules do. */ rc = efx_mae_action_set_populate_decap(ctx->spec); if (rc != 0) goto fail_enforce_ft_decap; for (action = actions; action->type != RTE_FLOW_ACTION_TYPE_END; ++action) { if (action->type == RTE_FLOW_ACTION_TYPE_COUNT) { have_user_action_count = true; break; } } if (!have_user_action_count && sfc_mae_counter_stream_enabled(sa)) { /* * The user opted not to use action COUNT in this rule, * but the counter should be enabled implicitly because * packets hitting this rule contribute to the tunnel's * total number of hits. See sfc_mae_counter_get(). */ rc = efx_mae_action_set_populate_count(ctx->spec); if (rc != 0) goto fail_enforce_ft_count; rc = sfc_mae_counter_add(sa, NULL, &ctx->counter); if (rc != 0) goto fail_enforce_ft_count; } } for (action = actions; action->type != RTE_FLOW_ACTION_TYPE_END; ++action) { if (mae->nb_bounce_asets == 0) { rc = sfc_mae_actions_bundle_sync(action, &bundle, spec_mae, ctx->spec, ct, error); if (rc != 0) goto fail_rule_parse_action; } rc = sfc_mae_rule_parse_action(sa, action, flow, ct, &bundle, error); if (rc != 0) goto fail_rule_parse_action; } if (mae->nb_bounce_asets == 0) { rc = sfc_mae_actions_bundle_sync(action, &bundle, spec_mae, ctx->spec, ct, error); if (rc != 0) goto fail_rule_parse_action; } switch (spec_mae->ft_rule_type) { case SFC_FT_RULE_NONE: break; case SFC_FT_RULE_TUNNEL: /* Workaround. See sfc_flow_parse_rte_to_mae() */ rc = sfc_mae_rule_parse_action_pf_vf(sa, NULL, ctx->spec); if (rc != 0) goto fail_workaround_tunnel_delivery; if (ctx->counter != NULL) (ctx->counter)->ft_ctx = spec_mae->ft_ctx; ctx->fate_set = true; break; case SFC_FT_RULE_SWITCH: /* * Packets that go to the rule's AR have FT mark set (from * the TUNNEL rule OR's RECIRC_ID). Reset the mark to zero. */ efx_mae_action_set_populate_mark_reset(ctx->spec); if (ctx->counter != NULL) { (ctx->counter)->ft_switch_hit_counter = &spec_mae->ft_ctx->switch_hit_counter; } else if (sfc_mae_counter_stream_enabled(sa)) { SFC_ASSERT(ct); spec_mae->ct_counter->ft_switch_hit_counter = &spec_mae->ft_ctx->switch_hit_counter; } break; default: SFC_ASSERT(B_FALSE); } SFC_ASSERT(mae->nb_bounce_asets < EFX_MAE_ACTION_SET_LIST_MAX_NENTRIES); last_ctx = &mae->bounce_aset_ctxs[mae->nb_bounce_asets]; ++(mae->nb_bounce_asets); if (!last_ctx->fate_set) { rc = rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "no fate action found"); goto fail_check_fate_action; } action_rule_ctx->action_set = sfc_mae_action_set_attach(sa, ctx); if (action_rule_ctx->action_set != NULL) { sfc_mae_counter_del(sa, ctx->counter); sfc_mae_mac_addr_del(sa, ctx->src_mac); sfc_mae_mac_addr_del(sa, ctx->dst_mac); sfc_mae_encap_header_del(sa, ctx->encap_header); efx_mae_action_set_spec_fini(sa->nic, ctx->spec); } else { rc = sfc_mae_action_set_add(sa, ctx, &action_rule_ctx->action_set); if (rc != 0) goto fail_action_set_add; } memset(ctx, 0, sizeof(*ctx)); rc = sfc_mae_rule_process_replay(sa, action_rule_ctx); if (rc != 0) goto fail_rule_parse_replay; return 0; fail_rule_parse_replay: sfc_mae_action_set_del(sa, action_rule_ctx->action_set); fail_action_set_add: fail_check_fate_action: fail_workaround_tunnel_delivery: fail_rule_parse_action: sfc_mae_encap_header_del(sa, ctx->encap_header); sfc_mae_counter_del(sa, ctx->counter); sfc_mae_mac_addr_del(sa, ctx->src_mac); sfc_mae_mac_addr_del(sa, ctx->dst_mac); if (ctx->spec != NULL) efx_mae_action_set_spec_fini(sa->nic, ctx->spec); fail_enforce_ft_count: fail_enforce_ft_decap: fail_action_set_spec_init: if (rc > 0 && rte_errno == 0) { rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "Failed to process the action"); } return rc; } int sfc_mae_rule_parse(struct sfc_adapter *sa, const struct rte_flow_item pattern[], const struct rte_flow_action actions[], struct rte_flow *flow, struct rte_flow_error *error) { struct sfc_flow_spec *spec = &flow->spec; struct sfc_flow_spec_mae *spec_mae = &spec->mae; struct sfc_mae_action_rule_ctx ctx = {}; int rc; /* * If the flow is meant to be a TUNNEL rule in a FT context, * preparse its actions and save its properties in spec_mae. */ rc = sfc_ft_tunnel_rule_detect(sa, actions, spec_mae, error); if (rc != 0) goto fail; rc = sfc_mae_rule_parse_pattern(sa, pattern, flow, &ctx, error); if (rc != 0) goto fail; if (spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) { /* * By design, this flow should be represented solely by the * outer rule. But the HW/FW hasn't got support for setting * Rx mark from RECIRC_ID on outer rule lookup yet. Neither * does it support outer rule counters. As a workaround, an * action rule of lower priority is used to do the job. * * So don't skip sfc_mae_rule_parse_actions() below. */ } spec_mae->outer_rule = ctx.outer_rule; rc = sfc_mae_rule_parse_actions(sa, actions, flow, &ctx, error); if (rc != 0) goto fail; rc = sfc_mae_action_rule_attach(sa, &ctx, &spec_mae->action_rule, error); if (rc == 0) { efx_mae_match_spec_fini(sa->nic, ctx.match_spec); sfc_mae_action_set_list_del(sa, ctx.action_set_list); sfc_mae_action_set_del(sa, ctx.action_set); sfc_mae_outer_rule_del(sa, ctx.outer_rule); } else if (rc == -ENOENT) { rc = sfc_mae_action_rule_add(sa, &ctx, &spec_mae->action_rule); if (rc != 0) { rc = rte_flow_error_set(error, rc, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "AR: failed to add the entry"); goto fail; } } else { goto fail; } if (spec_mae->ft_ctx != NULL) { if (spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) spec_mae->ft_ctx->tunnel_rule_is_set = B_TRUE; ++(spec_mae->ft_ctx->refcnt); } return 0; fail: if (ctx.match_spec != NULL) efx_mae_match_spec_fini(sa->nic, ctx.match_spec); sfc_mae_action_set_list_del(sa, ctx.action_set_list); sfc_mae_action_set_del(sa, ctx.action_set); sfc_mae_outer_rule_del(sa, ctx.outer_rule); /* Reset these values to avoid confusing sfc_mae_flow_cleanup(). */ spec_mae->ft_rule_type = SFC_FT_RULE_NONE; spec_mae->ft_ctx = NULL; return rc; } static bool sfc_mae_rules_class_cmp(struct sfc_adapter *sa, const efx_mae_match_spec_t *left, const efx_mae_match_spec_t *right) { bool have_same_class; int rc; rc = efx_mae_match_specs_class_cmp(sa->nic, left, right, &have_same_class); return (rc == 0) ? have_same_class : false; } static int sfc_mae_outer_rule_class_verify(struct sfc_adapter *sa, struct sfc_mae_outer_rule *rule) { struct sfc_mae_outer_rule *entry; struct sfc_mae_fw_rsrc *fw_rsrc; struct sfc_mae *mae = &sa->mae; if (rule == NULL) return 0; fw_rsrc = &rule->fw_rsrc; if (fw_rsrc->rule_id.id != EFX_MAE_RSRC_ID_INVALID) { /* An active rule is reused. It's class is wittingly valid. */ return 0; } TAILQ_FOREACH_REVERSE(entry, &mae->outer_rules, sfc_mae_outer_rules, entries) { const efx_mae_match_spec_t *left = entry->match_spec; const efx_mae_match_spec_t *right = rule->match_spec; if (entry == rule) continue; if (sfc_mae_rules_class_cmp(sa, left, right)) return 0; } sfc_info(sa, "for now, the HW doesn't support rule validation, and HW " "support for outer frame pattern items is not guaranteed; " "other than that, the items are valid from SW standpoint"); return 0; } static int sfc_mae_action_rule_class_verify(struct sfc_adapter *sa, struct sfc_mae_action_rule *rule) { struct sfc_mae_fw_rsrc *fw_rsrc = &rule->fw_rsrc; const struct sfc_mae_action_rule *entry; struct sfc_mae *mae = &sa->mae; if (fw_rsrc->rule_id.id != EFX_MAE_RSRC_ID_INVALID) { /* An active rule is reused. Its class is known to be valid. */ return 0; } TAILQ_FOREACH_REVERSE(entry, &mae->action_rules, sfc_mae_action_rules, entries) { const efx_mae_match_spec_t *left = entry->match_spec; const efx_mae_match_spec_t *right = rule->match_spec; if (entry == rule) continue; if (sfc_mae_rules_class_cmp(sa, left, right)) return 0; } sfc_info(sa, "for now, the HW doesn't support rule validation, and HW " "support for inner frame pattern items is not guaranteed; " "other than that, the items are valid from SW standpoint"); return 0; } /** * Confirm that a given flow can be accepted by the FW. * * @param sa * Software adapter context * @param flow * Flow to be verified * @return * Zero on success and non-zero in the case of error. * A special value of EAGAIN indicates that the adapter is * not in started state. This state is compulsory because * it only makes sense to compare the rule class of the flow * being validated with classes of the active rules. * Such classes are wittingly supported by the FW. */ int sfc_mae_flow_verify(struct sfc_adapter *sa, struct rte_flow *flow) { struct sfc_flow_spec *spec = &flow->spec; struct sfc_flow_spec_mae *spec_mae = &spec->mae; struct sfc_mae_action_rule *action_rule = spec_mae->action_rule; struct sfc_mae_outer_rule *outer_rule = spec_mae->outer_rule; int rc; SFC_ASSERT(sfc_adapter_is_locked(sa)); if (sa->state != SFC_ETHDEV_STARTED) return EAGAIN; rc = sfc_mae_outer_rule_class_verify(sa, outer_rule); if (rc != 0) return rc; return sfc_mae_action_rule_class_verify(sa, action_rule); } int sfc_mae_flow_insert(struct sfc_adapter *sa, struct rte_flow *flow) { struct sfc_flow_spec *spec = &flow->spec; struct sfc_flow_spec_mae *spec_mae = &spec->mae; struct sfc_mae_action_rule *action_rule = spec_mae->action_rule; int rc; if (spec_mae->ft_rule_type == SFC_FT_RULE_TUNNEL) { spec_mae->ft_ctx->reset_tunnel_hit_counter = spec_mae->ft_ctx->switch_hit_counter; } if (action_rule == NULL) return 0; rc = sfc_mae_action_rule_enable(sa, action_rule); if (rc != 0) return rc; if (spec_mae->action_rule->ct_mark != 0) { struct sfc_mae_counter *counter = spec_mae->ct_counter; rc = sfc_mae_counter_enable(sa, counter, NULL); if (rc != 0) { sfc_mae_action_rule_disable(sa, action_rule); return rc; } if (counter != NULL) { struct sfc_mae_fw_rsrc *fw_rsrc = &counter->fw_rsrc; spec_mae->ct_resp.counter_id = fw_rsrc->counter_id.id; rc = sfc_mae_counter_start(sa); if (rc != 0) { sfc_mae_action_rule_disable(sa, action_rule); return rc; } } else { spec_mae->ct_resp.counter_id = EFX_MAE_RSRC_ID_INVALID; } spec_mae->ct_resp.ct_mark = spec_mae->action_rule->ct_mark; rc = sfc_mae_conntrack_insert(sa, &spec_mae->ct_key, &spec_mae->ct_resp); if (rc != 0) { sfc_mae_counter_disable(sa, counter); sfc_mae_action_rule_disable(sa, action_rule); return rc; } } return 0; } int sfc_mae_flow_remove(struct sfc_adapter *sa, struct rte_flow *flow) { struct sfc_flow_spec *spec = &flow->spec; struct sfc_flow_spec_mae *spec_mae = &spec->mae; struct sfc_mae_action_rule *action_rule = spec_mae->action_rule; if (action_rule == NULL) return 0; if (action_rule->ct_mark != 0) (void)sfc_mae_conntrack_delete(sa, &spec_mae->ct_key); sfc_mae_counter_disable(sa, spec_mae->ct_counter); sfc_mae_action_rule_disable(sa, action_rule); return 0; } static int sfc_mae_query_counter(struct sfc_adapter *sa, struct sfc_flow_spec_mae *spec, const struct rte_flow_action *action, struct rte_flow_query_count *data, struct rte_flow_error *error) { const struct sfc_mae_action_rule *action_rule = spec->action_rule; const struct rte_flow_action_count *conf = action->conf; struct sfc_mae_counter *counters[1 /* action rule counter */ + 1 /* conntrack counter */]; struct sfc_mae_counter *counter; unsigned int i; int rc; /* * The check for counter unavailability is done based * on counter traversal results. See error set below. */ if (action_rule != NULL && action_rule->action_set != NULL && action_rule->action_set->counter != NULL && !action_rule->action_set->counter->indirect) counters[0] = action_rule->action_set->counter; else counters[0] = NULL; counters[1] = spec->ct_counter; for (i = 0; i < RTE_DIM(counters); ++i) { counter = counters[i]; if (counter == NULL) continue; if (conf == NULL || (counter->rte_id_valid && conf->id == counter->rte_id)) { rc = sfc_mae_counter_get(sa, counter, data); if (rc != 0) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION, action, "Queried flow rule counter action is invalid"); } return 0; } } if (action_rule == NULL || action_rule->action_set_list == NULL) goto exit; for (i = 0; i < action_rule->action_set_list->nb_action_sets; ++i) { counter = action_rule->action_set_list->action_sets[i]->counter; if (counter == NULL || counter->indirect) continue; if (conf == NULL || (counter->rte_id_valid && conf->id == counter->rte_id)) { rc = sfc_mae_counter_get(sa, counter, data); if (rc != 0) { return rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION, action, "Queried flow rule counter action is invalid"); } return 0; } } exit: return rte_flow_error_set(error, ENOENT, RTE_FLOW_ERROR_TYPE_ACTION, action, "no such flow rule action or such count ID"); } int sfc_mae_flow_query(struct rte_eth_dev *dev, struct rte_flow *flow, const struct rte_flow_action *action, void *data, struct rte_flow_error *error) { struct sfc_adapter *sa = sfc_adapter_by_eth_dev(dev); struct sfc_flow_spec *spec = &flow->spec; struct sfc_flow_spec_mae *spec_mae = &spec->mae; switch (action->type) { case RTE_FLOW_ACTION_TYPE_COUNT: return sfc_mae_query_counter(sa, spec_mae, action, data, error); default: return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION, NULL, "Query for action of this type is not supported"); } } int sfc_mae_switchdev_init(struct sfc_adapter *sa) { struct sfc_adapter_shared *sas = sfc_sa2shared(sa); struct sfc_mae *mae = &sa->mae; int rc = EINVAL; sfc_log_init(sa, "entry"); if (!sa->switchdev) { sfc_log_init(sa, "switchdev is not enabled - skip"); return 0; } if (mae->status != SFC_MAE_STATUS_ADMIN) { rc = ENOTSUP; sfc_err(sa, "failed to init switchdev - no admin MAE privilege"); goto fail_no_mae; } mae->switchdev_rule_pf_to_ext = sfc_mae_repr_flow_create(sa, SFC_MAE_RULE_PRIO_LOWEST, sas->port_id, RTE_FLOW_ACTION_TYPE_REPRESENTED_PORT, RTE_FLOW_ITEM_TYPE_PORT_REPRESENTOR); if (mae->switchdev_rule_pf_to_ext == NULL) { sfc_err(sa, "failed add MAE rule to forward from PF to PHY"); goto fail_pf_add; } mae->switchdev_rule_ext_to_pf = sfc_mae_repr_flow_create(sa, SFC_MAE_RULE_PRIO_LOWEST, sas->port_id, RTE_FLOW_ACTION_TYPE_PORT_REPRESENTOR, RTE_FLOW_ITEM_TYPE_REPRESENTED_PORT); if (mae->switchdev_rule_ext_to_pf == NULL) { sfc_err(sa, "failed add MAE rule to forward from PHY to PF"); goto fail_phy_add; } sfc_log_init(sa, "done"); return 0; fail_phy_add: sfc_mae_repr_flow_destroy(sa, mae->switchdev_rule_pf_to_ext); fail_pf_add: fail_no_mae: sfc_log_init(sa, "failed: %s", rte_strerror(rc)); return rc; } void sfc_mae_switchdev_fini(struct sfc_adapter *sa) { struct sfc_mae *mae = &sa->mae; if (!sa->switchdev) return; sfc_mae_repr_flow_destroy(sa, mae->switchdev_rule_pf_to_ext); sfc_mae_repr_flow_destroy(sa, mae->switchdev_rule_ext_to_pf); } int sfc_mae_indir_action_create(struct sfc_adapter *sa, const struct rte_flow_action *action, struct rte_flow_action_handle *handle, struct rte_flow_error *error) { struct sfc_mae *mae = &sa->mae; bool custom_error = false; int ret; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(handle != NULL); switch (action->type) { case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP: /* Cleanup after previous encap. header bounce buffer usage. */ sfc_mae_bounce_eh_invalidate(&mae->bounce_eh); ret = sfc_mae_rule_parse_action_vxlan_encap(mae, action->conf, NULL, error); if (ret != 0) { custom_error = true; break; } ret = sfc_mae_encap_header_add(sa, &mae->bounce_eh, &handle->encap_header); if (ret == 0) handle->encap_header->indirect = true; break; case RTE_FLOW_ACTION_TYPE_COUNT: ret = sfc_mae_rule_parse_action_count(sa, action->conf, EFX_COUNTER_TYPE_ACTION, &handle->counter, NULL); if (ret == 0) handle->counter->indirect = true; break; default: ret = ENOTSUP; } if (custom_error) return ret; if (ret != 0) { return rte_flow_error_set(error, ret, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "failed to parse indirect action to mae object"); } handle->type = action->type; return 0; } int sfc_mae_indir_action_destroy(struct sfc_adapter *sa, const struct rte_flow_action_handle *handle, struct rte_flow_error *error) { SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(handle != NULL); switch (handle->type) { case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP: if (handle->encap_header->refcnt != 1) goto fail; sfc_mae_encap_header_del(sa, handle->encap_header); break; case RTE_FLOW_ACTION_TYPE_COUNT: if (handle->counter->refcnt != 1) goto fail; sfc_mae_counter_del(sa, handle->counter); break; default: SFC_ASSERT(B_FALSE); break; } return 0; fail: return rte_flow_error_set(error, EIO, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "indirect action is still in use"); } int sfc_mae_indir_action_update(struct sfc_adapter *sa, struct rte_flow_action_handle *handle, const void *update, struct rte_flow_error *error) { const struct rte_flow_action *action = update; struct sfc_mae *mae = &sa->mae; bool custom_error = false; int ret; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(action != NULL); SFC_ASSERT(handle != NULL); switch (handle->type) { case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP: /* Cleanup after previous encap. header bounce buffer usage. */ sfc_mae_bounce_eh_invalidate(&mae->bounce_eh); ret = sfc_mae_rule_parse_action_vxlan_encap(mae, action->conf, NULL, error); if (ret != 0) { custom_error = true; break; } ret = sfc_mae_encap_header_update(sa, handle->encap_header); break; default: ret = ENOTSUP; } if (custom_error) return ret; if (ret != 0) { return rte_flow_error_set(error, ret, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "failed to parse indirect action to mae object"); } return 0; } int sfc_mae_indir_action_query(struct sfc_adapter *sa, const struct rte_flow_action_handle *handle, void *data, struct rte_flow_error *error) { int ret; SFC_ASSERT(sfc_adapter_is_locked(sa)); SFC_ASSERT(handle != NULL); switch (handle->type) { case RTE_FLOW_ACTION_TYPE_COUNT: SFC_ASSERT(handle->counter != NULL); if (handle->counter->fw_rsrc.refcnt == 0) goto fail_not_in_use; ret = sfc_mae_counter_get(sa, handle->counter, data); if (ret != 0) goto fail_counter_get; break; default: goto fail_unsup; } return 0; fail_not_in_use: return rte_flow_error_set(error, EIO, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "indirect action is not in use"); fail_counter_get: return rte_flow_error_set(error, ret, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "failed to collect indirect action COUNT data"); fail_unsup: return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL, "indirect action of this type cannot be queried"); }