mirror of
https://github.com/ukui/kernel.git
synced 2026-03-09 10:07:04 -07:00
ice: Implement aRFS
Enable accelerated Receive Flow Steering (aRFS). It is used to steer Rx
flows to a specific queue. This functionality is triggered by the network
stack through ndo_rx_flow_steer and requires Flow Director (ntuple on) to
function.
The fltr_info is used to add/remove/update flow rules in the HW, the
fltr_state is used to determine what to do with the filter with respect
to HW and/or SW, and the flow_id is used in co-ordination with the
network stack.
The work for aRFS is split into two paths: the ndo_rx_flow_steer
operation and the ice_service_task. The former is where the kernel hands
us an Rx SKB among other items to setup aRFS and the latter is where
the driver adds/updates/removes filter rules from HW and updates filter
state.
In the Rx path the following things can happen:
1. New aRFS entries are added to the hash table and the state is
set to ICE_ARFS_INACTIVE so the filter can be updated in HW
by the ice_service_task path.
2. aRFS entries have their Rx Queue updated if we receive a
pre-existing flow_id and the filter state is ICE_ARFS_ACTIVE.
The state is set to ICE_ARFS_INACTIVE so the filter can be
updated in HW by the ice_service_task path.
3. aRFS entries marked as ICE_ARFS_TODEL are deleted
In the ice_service_task path the following things can happen:
1. New aRFS entries marked as ICE_ARFS_INACTIVE are added or
updated in HW.
and their state is updated to ICE_ARFS_ACTIVE.
2. aRFS entries are deleted from HW and their state is updated
to ICE_ARFS_TODEL.
Signed-off-by: Brett Creeley <brett.creeley@intel.com>
Signed-off-by: Madhu Chittim <madhu.chittim@intel.com>
Signed-off-by: Tony Nguyen <anthony.l.nguyen@intel.com>
Tested-by: Andrew Bowers <andrewx.bowers@intel.com>
Signed-off-by: Jeff Kirsher <jeffrey.t.kirsher@intel.com>
This commit is contained in:
committed by
Jeff Kirsher
parent
83af003951
commit
28bf26724f
@@ -26,4 +26,5 @@ ice-y := ice_main.o \
|
||||
ice_ethtool.o
|
||||
ice-$(CONFIG_PCI_IOV) += ice_virtchnl_pf.o ice_sriov.o
|
||||
ice-$(CONFIG_DCB) += ice_dcb.o ice_dcb_nl.o ice_dcb_lib.o
|
||||
ice-$(CONFIG_RFS_ACCEL) += ice_arfs.o
|
||||
ice-$(CONFIG_XDP_SOCKETS) += ice_xsk.o
|
||||
|
||||
@@ -34,6 +34,7 @@
|
||||
#include <linux/ctype.h>
|
||||
#include <linux/bpf.h>
|
||||
#include <linux/avf/virtchnl.h>
|
||||
#include <linux/cpu_rmap.h>
|
||||
#include <net/devlink.h>
|
||||
#include <net/ipv6.h>
|
||||
#include <net/xdp_sock.h>
|
||||
@@ -52,6 +53,7 @@
|
||||
#include "ice_sriov.h"
|
||||
#include "ice_fdir.h"
|
||||
#include "ice_xsk.h"
|
||||
#include "ice_arfs.h"
|
||||
|
||||
extern const char ice_drv_ver[];
|
||||
#define ICE_BAR0 0
|
||||
@@ -271,6 +273,14 @@ struct ice_vsi {
|
||||
u8 *rss_lut_user; /* User configured lookup table entries */
|
||||
u8 rss_lut_type; /* used to configure Get/Set RSS LUT AQ call */
|
||||
|
||||
/* aRFS members only allocated for the PF VSI */
|
||||
#define ICE_MAX_ARFS_LIST 1024
|
||||
#define ICE_ARFS_LST_MASK (ICE_MAX_ARFS_LIST - 1)
|
||||
struct hlist_head *arfs_fltr_list;
|
||||
struct ice_arfs_active_fltr_cntrs *arfs_fltr_cntrs;
|
||||
spinlock_t arfs_lock; /* protects aRFS hash table and filter state */
|
||||
atomic_t *arfs_last_fltr_id;
|
||||
|
||||
u16 max_frame;
|
||||
u16 rx_buf_len;
|
||||
|
||||
@@ -558,6 +568,9 @@ int ice_schedule_reset(struct ice_pf *pf, enum ice_reset_req reset);
|
||||
void ice_print_link_msg(struct ice_vsi *vsi, bool isup);
|
||||
const char *ice_stat_str(enum ice_status stat_err);
|
||||
const char *ice_aq_str(enum ice_aq_err aq_err);
|
||||
int
|
||||
ice_fdir_write_fltr(struct ice_pf *pf, struct ice_fdir_fltr *input, bool add,
|
||||
bool is_tun);
|
||||
void ice_vsi_manage_fdir(struct ice_vsi *vsi, bool ena);
|
||||
int ice_add_fdir_ethtool(struct ice_vsi *vsi, struct ethtool_rxnfc *cmd);
|
||||
int ice_del_fdir_ethtool(struct ice_vsi *vsi, struct ethtool_rxnfc *cmd);
|
||||
@@ -571,5 +584,6 @@ void ice_fdir_replay_fltrs(struct ice_pf *pf);
|
||||
int ice_fdir_create_dflt_rules(struct ice_pf *pf);
|
||||
int ice_open(struct net_device *netdev);
|
||||
int ice_stop(struct net_device *netdev);
|
||||
void ice_service_task_schedule(struct ice_pf *pf);
|
||||
|
||||
#endif /* _ICE_H_ */
|
||||
|
||||
File diff suppressed because it is too large
Load Diff
@@ -0,0 +1,82 @@
|
||||
/* SPDX-License-Identifier: GPL-2.0 */
|
||||
/* Copyright (C) 2018-2020, Intel Corporation. */
|
||||
|
||||
#ifndef _ICE_ARFS_H_
|
||||
#define _ICE_ARFS_H_
|
||||
enum ice_arfs_fltr_state {
|
||||
ICE_ARFS_INACTIVE,
|
||||
ICE_ARFS_ACTIVE,
|
||||
ICE_ARFS_TODEL,
|
||||
};
|
||||
|
||||
struct ice_arfs_entry {
|
||||
struct ice_fdir_fltr fltr_info;
|
||||
struct hlist_node list_entry;
|
||||
u64 time_activated; /* only valid for UDP flows */
|
||||
u32 flow_id;
|
||||
/* fltr_state = 0 - ICE_ARFS_INACTIVE:
|
||||
* filter needs to be updated or programmed in HW.
|
||||
* fltr_state = 1 - ICE_ARFS_ACTIVE:
|
||||
* filter is active and programmed in HW.
|
||||
* fltr_state = 2 - ICE_ARFS_TODEL:
|
||||
* filter has been deleted from HW and needs to be removed from
|
||||
* the aRFS hash table.
|
||||
*/
|
||||
u8 fltr_state;
|
||||
};
|
||||
|
||||
struct ice_arfs_entry_ptr {
|
||||
struct ice_arfs_entry *arfs_entry;
|
||||
struct hlist_node list_entry;
|
||||
};
|
||||
|
||||
struct ice_arfs_active_fltr_cntrs {
|
||||
atomic_t active_tcpv4_cnt;
|
||||
atomic_t active_tcpv6_cnt;
|
||||
atomic_t active_udpv4_cnt;
|
||||
atomic_t active_udpv6_cnt;
|
||||
};
|
||||
|
||||
#ifdef CONFIG_RFS_ACCEL
|
||||
int
|
||||
ice_rx_flow_steer(struct net_device *netdev, const struct sk_buff *skb,
|
||||
u16 rxq_idx, u32 flow_id);
|
||||
void ice_clear_arfs(struct ice_vsi *vsi);
|
||||
void ice_free_cpu_rx_rmap(struct ice_vsi *vsi);
|
||||
void ice_init_arfs(struct ice_vsi *vsi);
|
||||
void ice_sync_arfs_fltrs(struct ice_pf *pf);
|
||||
int ice_set_cpu_rx_rmap(struct ice_vsi *vsi);
|
||||
void ice_remove_arfs(struct ice_pf *pf);
|
||||
void ice_rebuild_arfs(struct ice_pf *pf);
|
||||
bool
|
||||
ice_is_arfs_using_perfect_flow(struct ice_hw *hw,
|
||||
enum ice_fltr_ptype flow_type);
|
||||
#else
|
||||
#define ice_sync_arfs_fltrs(pf) do {} while (0)
|
||||
#define ice_init_arfs(vsi) do {} while (0)
|
||||
#define ice_clear_arfs(vsi) do {} while (0)
|
||||
#define ice_remove_arfs(pf) do {} while (0)
|
||||
#define ice_free_cpu_rx_rmap(vsi) do {} while (0)
|
||||
#define ice_rebuild_arfs(pf) do {} while (0)
|
||||
|
||||
static inline int ice_set_cpu_rx_rmap(struct ice_vsi __always_unused *vsi)
|
||||
{
|
||||
return 0;
|
||||
}
|
||||
|
||||
static inline int
|
||||
ice_rx_flow_steer(struct net_device __always_unused *netdev,
|
||||
const struct sk_buff __always_unused *skb,
|
||||
u16 __always_unused rxq_idx, u32 __always_unused flow_id)
|
||||
{
|
||||
return -EOPNOTSUPP;
|
||||
}
|
||||
|
||||
static inline bool
|
||||
ice_is_arfs_using_perfect_flow(struct ice_hw __always_unused *hw,
|
||||
enum ice_fltr_ptype __always_unused flow_type)
|
||||
{
|
||||
return false;
|
||||
}
|
||||
#endif /* CONFIG_RFS_ACCEL */
|
||||
#endif /* _ICE_ARFS_H_ */
|
||||
@@ -566,6 +566,12 @@ ice_fdir_set_hw_fltr_rule(struct ice_pf *pf, struct ice_flow_seg_info *seg,
|
||||
return -EINVAL;
|
||||
}
|
||||
|
||||
if (ice_is_arfs_using_perfect_flow(hw, flow)) {
|
||||
dev_err(dev, "aRFS using perfect flow type %d, cannot change input set\n",
|
||||
flow);
|
||||
return -EINVAL;
|
||||
}
|
||||
|
||||
/* remove HW filter definition */
|
||||
ice_fdir_rem_flow(hw, ICE_BLK_FD, flow);
|
||||
}
|
||||
@@ -1176,7 +1182,7 @@ err_exit:
|
||||
*
|
||||
* returns 0 on success and negative value on error
|
||||
*/
|
||||
static int
|
||||
int
|
||||
ice_fdir_write_fltr(struct ice_pf *pf, struct ice_fdir_fltr *input, bool add,
|
||||
bool is_tun)
|
||||
{
|
||||
|
||||
@@ -2175,6 +2175,7 @@ ice_vsi_setup(struct ice_pf *pf, struct ice_port_info *pi,
|
||||
ice_vsi_cfg_rss_lut_key(vsi);
|
||||
ice_vsi_set_rss_flow_fld(vsi);
|
||||
}
|
||||
ice_init_arfs(vsi);
|
||||
break;
|
||||
case ICE_VSI_VF:
|
||||
/* VF driver will take care of creating netdev for this type and
|
||||
|
||||
@@ -1113,7 +1113,7 @@ static void ice_clean_mailboxq_subtask(struct ice_pf *pf)
|
||||
*
|
||||
* If not already scheduled, this puts the task into the work queue.
|
||||
*/
|
||||
static void ice_service_task_schedule(struct ice_pf *pf)
|
||||
void ice_service_task_schedule(struct ice_pf *pf)
|
||||
{
|
||||
if (!test_bit(__ICE_SERVICE_DIS, pf->state) &&
|
||||
!test_and_set_bit(__ICE_SERVICE_SCHED, pf->state) &&
|
||||
@@ -1483,7 +1483,7 @@ static void ice_service_task(struct work_struct *work)
|
||||
|
||||
ice_process_vflr_event(pf);
|
||||
ice_clean_mailboxq_subtask(pf);
|
||||
|
||||
ice_sync_arfs_fltrs(pf);
|
||||
/* Clear __ICE_SERVICE_SCHED flag to allow scheduling next event */
|
||||
ice_service_task_complete(pf);
|
||||
|
||||
@@ -1642,9 +1642,14 @@ static int ice_vsi_req_irq_msix(struct ice_vsi *vsi, char *basename)
|
||||
}
|
||||
|
||||
/* register for affinity change notifications */
|
||||
q_vector->affinity_notify.notify = ice_irq_affinity_notify;
|
||||
q_vector->affinity_notify.release = ice_irq_affinity_release;
|
||||
irq_set_affinity_notifier(irq_num, &q_vector->affinity_notify);
|
||||
if (!IS_ENABLED(CONFIG_RFS_ACCEL)) {
|
||||
struct irq_affinity_notify *affinity_notify;
|
||||
|
||||
affinity_notify = &q_vector->affinity_notify;
|
||||
affinity_notify->notify = ice_irq_affinity_notify;
|
||||
affinity_notify->release = ice_irq_affinity_release;
|
||||
irq_set_affinity_notifier(irq_num, affinity_notify);
|
||||
}
|
||||
|
||||
/* assign the mask for this irq */
|
||||
irq_set_affinity_hint(irq_num, &q_vector->affinity_mask);
|
||||
@@ -1656,8 +1661,9 @@ static int ice_vsi_req_irq_msix(struct ice_vsi *vsi, char *basename)
|
||||
free_q_irqs:
|
||||
while (vector) {
|
||||
vector--;
|
||||
irq_num = pf->msix_entries[base + vector].vector,
|
||||
irq_set_affinity_notifier(irq_num, NULL);
|
||||
irq_num = pf->msix_entries[base + vector].vector;
|
||||
if (!IS_ENABLED(CONFIG_RFS_ACCEL))
|
||||
irq_set_affinity_notifier(irq_num, NULL);
|
||||
irq_set_affinity_hint(irq_num, NULL);
|
||||
devm_free_irq(dev, irq_num, &vsi->q_vectors[vector]);
|
||||
}
|
||||
@@ -2611,12 +2617,22 @@ static int ice_setup_pf_sw(struct ice_pf *pf)
|
||||
*/
|
||||
ice_napi_add(vsi);
|
||||
|
||||
status = ice_set_cpu_rx_rmap(vsi);
|
||||
if (status) {
|
||||
dev_err(ice_pf_to_dev(pf), "Failed to set CPU Rx map VSI %d error %d\n",
|
||||
vsi->vsi_num, status);
|
||||
status = -EINVAL;
|
||||
goto unroll_napi_add;
|
||||
}
|
||||
status = ice_init_mac_fltr(pf);
|
||||
if (status)
|
||||
goto unroll_napi_add;
|
||||
goto free_cpu_rx_map;
|
||||
|
||||
return status;
|
||||
|
||||
free_cpu_rx_map:
|
||||
ice_free_cpu_rx_rmap(vsi);
|
||||
|
||||
unroll_napi_add:
|
||||
if (vsi) {
|
||||
ice_napi_del(vsi);
|
||||
@@ -3519,6 +3535,8 @@ static void ice_remove(struct pci_dev *pdev)
|
||||
ice_service_task_stop(pf);
|
||||
|
||||
mutex_destroy(&(&pf->hw)->fdir_fltr_lock);
|
||||
if (!ice_is_safe_mode(pf))
|
||||
ice_remove_arfs(pf);
|
||||
ice_devlink_destroy_port(pf);
|
||||
ice_vsi_release_all(pf);
|
||||
ice_free_irq_msix_misc(pf);
|
||||
@@ -4036,11 +4054,14 @@ ice_set_features(struct net_device *netdev, netdev_features_t features)
|
||||
ret = ice_cfg_vlan_pruning(vsi, false, false);
|
||||
|
||||
if ((features & NETIF_F_NTUPLE) &&
|
||||
!(netdev->features & NETIF_F_NTUPLE))
|
||||
!(netdev->features & NETIF_F_NTUPLE)) {
|
||||
ice_vsi_manage_fdir(vsi, true);
|
||||
else if (!(features & NETIF_F_NTUPLE) &&
|
||||
(netdev->features & NETIF_F_NTUPLE))
|
||||
ice_init_arfs(vsi);
|
||||
} else if (!(features & NETIF_F_NTUPLE) &&
|
||||
(netdev->features & NETIF_F_NTUPLE)) {
|
||||
ice_vsi_manage_fdir(vsi, false);
|
||||
ice_clear_arfs(vsi);
|
||||
}
|
||||
|
||||
return ret;
|
||||
}
|
||||
@@ -4942,6 +4963,8 @@ static void ice_rebuild(struct ice_pf *pf, enum ice_reset_req reset_type)
|
||||
|
||||
/* replay Flow Director filters */
|
||||
ice_fdir_replay_fltrs(pf);
|
||||
|
||||
ice_rebuild_arfs(pf);
|
||||
}
|
||||
|
||||
ice_update_pf_netdev_link(pf);
|
||||
@@ -5721,6 +5744,9 @@ static const struct net_device_ops ice_netdev_ops = {
|
||||
.ndo_bridge_setlink = ice_bridge_setlink,
|
||||
.ndo_fdb_add = ice_fdb_add,
|
||||
.ndo_fdb_del = ice_fdb_del,
|
||||
#ifdef CONFIG_RFS_ACCEL
|
||||
.ndo_rx_flow_steer = ice_rx_flow_steer,
|
||||
#endif
|
||||
.ndo_tx_timeout = ice_tx_timeout,
|
||||
.ndo_bpf = ice_xdp,
|
||||
.ndo_xdp_xmit = ice_xdp_xmit,
|
||||
|
||||
Reference in New Issue
Block a user