|
|
d8f823 |
From 5d039200e42b7e170778424514d9d02cbf9fc8e6 Mon Sep 17 00:00:00 2001
|
|
|
d8f823 |
From: Alaa Hleihel <ahleihel@redhat.com>
|
|
|
d8f823 |
Date: Sun, 10 May 2020 15:04:45 -0400
|
|
|
d8f823 |
Subject: [PATCH 120/312] [netdrv] Revert "net/mlx5: Support lockless FTE read
|
|
|
d8f823 |
lookups"
|
|
|
d8f823 |
|
|
|
d8f823 |
Message-id: <20200510150452.10307-81-ahleihel@redhat.com>
|
|
|
d8f823 |
Patchwork-id: 306704
|
|
|
d8f823 |
Patchwork-instance: patchwork
|
|
|
d8f823 |
O-Subject: [RHEL8.3 BZ 1789380 v2 80/87] Revert "net/mlx5: Support lockless FTE read lookups"
|
|
|
d8f823 |
Bugzilla: 1789380
|
|
|
d8f823 |
RH-Acked-by: Kamal Heib <kheib@redhat.com>
|
|
|
d8f823 |
RH-Acked-by: Jarod Wilson <jarod@redhat.com>
|
|
|
d8f823 |
RH-Acked-by: Tony Camuso <tcamuso@redhat.com>
|
|
|
d8f823 |
RH-Acked-by: Jonathan Toppins <jtoppins@redhat.com>
|
|
|
d8f823 |
|
|
|
d8f823 |
Bugzilla: http://bugzilla.redhat.com/1789380
|
|
|
d8f823 |
Upstream: v5.5-rc6
|
|
|
d8f823 |
|
|
|
d8f823 |
commit 1f0593e791ed3fb4074d4470a261cde62d806ed5
|
|
|
d8f823 |
Author: Parav Pandit <parav@mellanox.com>
|
|
|
d8f823 |
Date: Wed Dec 11 00:35:18 2019 -0600
|
|
|
d8f823 |
|
|
|
d8f823 |
Revert "net/mlx5: Support lockless FTE read lookups"
|
|
|
d8f823 |
|
|
|
d8f823 |
This reverts commit 7dee607ed0e04500459db53001d8e02f8831f084.
|
|
|
d8f823 |
|
|
|
d8f823 |
During cleanup path, FTE's parent node group is removed which is
|
|
|
d8f823 |
referenced by the FTE while freeing the FTE.
|
|
|
d8f823 |
Hence FTE's lockless read lookup optimization done in cited commit is
|
|
|
d8f823 |
not possible at the moment.
|
|
|
d8f823 |
|
|
|
d8f823 |
Hence, revert the commit.
|
|
|
d8f823 |
|
|
|
d8f823 |
This avoid below KAZAN call trace.
|
|
|
d8f823 |
|
|
|
d8f823 |
[ 110.390896] BUG: KASAN: use-after-free in find_root.isra.14+0x56/0x60
|
|
|
d8f823 |
[mlx5_core]
|
|
|
d8f823 |
[ 110.391048] Read of size 4 at addr ffff888c19e6d220 by task
|
|
|
d8f823 |
swapper/12/0
|
|
|
d8f823 |
|
|
|
d8f823 |
[ 110.391219] CPU: 12 PID: 0 Comm: swapper/12 Not tainted 5.5.0-rc1+
|
|
|
d8f823 |
[ 110.391222] Hardware name: HP ProLiant DL380p Gen8, BIOS P70
|
|
|
d8f823 |
08/02/2014
|
|
|
d8f823 |
[ 110.391225] Call Trace:
|
|
|
d8f823 |
[ 110.391229] <IRQ>
|
|
|
d8f823 |
[ 110.391246] dump_stack+0x95/0xd5
|
|
|
d8f823 |
[ 110.391307] ? find_root.isra.14+0x56/0x60 [mlx5_core]
|
|
|
d8f823 |
[ 110.391320] print_address_description.constprop.5+0x20/0x320
|
|
|
d8f823 |
[ 110.391379] ? find_root.isra.14+0x56/0x60 [mlx5_core]
|
|
|
d8f823 |
[ 110.391435] ? find_root.isra.14+0x56/0x60 [mlx5_core]
|
|
|
d8f823 |
[ 110.391441] __kasan_report+0x149/0x18c
|
|
|
d8f823 |
[ 110.391499] ? find_root.isra.14+0x56/0x60 [mlx5_core]
|
|
|
d8f823 |
[ 110.391504] kasan_report+0x12/0x20
|
|
|
d8f823 |
[ 110.391511] __asan_report_load4_noabort+0x14/0x20
|
|
|
d8f823 |
[ 110.391567] find_root.isra.14+0x56/0x60 [mlx5_core]
|
|
|
d8f823 |
[ 110.391625] del_sw_fte_rcu+0x4a/0x100 [mlx5_core]
|
|
|
d8f823 |
[ 110.391633] rcu_core+0x404/0x1950
|
|
|
d8f823 |
[ 110.391640] ? rcu_accelerate_cbs_unlocked+0x100/0x100
|
|
|
d8f823 |
[ 110.391649] ? run_rebalance_domains+0x201/0x280
|
|
|
d8f823 |
[ 110.391654] rcu_core_si+0xe/0x10
|
|
|
d8f823 |
[ 110.391661] __do_softirq+0x181/0x66c
|
|
|
d8f823 |
[ 110.391670] irq_exit+0x12c/0x150
|
|
|
d8f823 |
[ 110.391675] smp_apic_timer_interrupt+0xf0/0x370
|
|
|
d8f823 |
[ 110.391681] apic_timer_interrupt+0xf/0x20
|
|
|
d8f823 |
[ 110.391684] </IRQ>
|
|
|
d8f823 |
[ 110.391695] RIP: 0010:cpuidle_enter_state+0xfa/0xba0
|
|
|
d8f823 |
[ 110.391703] Code: 3d c3 9b b5 50 e8 56 75 6e fe 48 89 45 c8 0f 1f 44
|
|
|
d8f823 |
00 00 31 ff e8 a6 94 6e fe 45 84 ff 0f 85 f6 02 00 00 fb 66 0f 1f 44 00
|
|
|
d8f823 |
00 <45> 85 f6 0f 88 db 06 00 00 4d 63 fe 4b 8d 04 7f 49 8d 04 87 49 8d
|
|
|
d8f823 |
[ 110.391706] RSP: 0018:ffff888c23a6fce8 EFLAGS: 00000246 ORIG_RAX:
|
|
|
d8f823 |
ffffffffffffff13
|
|
|
d8f823 |
[ 110.391712] RAX: dffffc0000000000 RBX: ffffe8ffff7002f8 RCX:
|
|
|
d8f823 |
000000000000001f
|
|
|
d8f823 |
[ 110.391715] RDX: 1ffff11184ee6cb5 RSI: 0000000040277d83 RDI:
|
|
|
d8f823 |
ffff888c277365a8
|
|
|
d8f823 |
[ 110.391718] RBP: ffff888c23a6fd40 R08: 0000000000000002 R09:
|
|
|
d8f823 |
0000000000035280
|
|
|
d8f823 |
[ 110.391721] R10: ffff888c23a6fc80 R11: ffffed11847485d0 R12:
|
|
|
d8f823 |
ffffffffb1017740
|
|
|
d8f823 |
[ 110.391723] R13: 0000000000000003 R14: 0000000000000003 R15:
|
|
|
d8f823 |
0000000000000000
|
|
|
d8f823 |
[ 110.391732] ? cpuidle_enter_state+0xea/0xba0
|
|
|
d8f823 |
[ 110.391738] cpuidle_enter+0x4f/0xa0
|
|
|
d8f823 |
[ 110.391747] call_cpuidle+0x6d/0xc0
|
|
|
d8f823 |
[ 110.391752] do_idle+0x360/0x430
|
|
|
d8f823 |
[ 110.391758] ? arch_cpu_idle_exit+0x40/0x40
|
|
|
d8f823 |
[ 110.391765] ? complete+0x67/0x80
|
|
|
d8f823 |
[ 110.391771] cpu_startup_entry+0x1d/0x20
|
|
|
d8f823 |
[ 110.391779] start_secondary+0x2f3/0x3c0
|
|
|
d8f823 |
[ 110.391784] ? set_cpu_sibling_map+0x2500/0x2500
|
|
|
d8f823 |
[ 110.391795] secondary_startup_64+0xa4/0xb0
|
|
|
d8f823 |
|
|
|
d8f823 |
[ 110.391841] Allocated by task 290:
|
|
|
d8f823 |
[ 110.391917] save_stack+0x21/0x90
|
|
|
d8f823 |
[ 110.391921] __kasan_kmalloc.constprop.8+0xa7/0xd0
|
|
|
d8f823 |
[ 110.391925] kasan_kmalloc+0x9/0x10
|
|
|
d8f823 |
[ 110.391929] kmem_cache_alloc_trace+0xf6/0x270
|
|
|
d8f823 |
[ 110.391987] create_root_ns.isra.36+0x58/0x260 [mlx5_core]
|
|
|
d8f823 |
[ 110.392044] mlx5_init_fs+0x5fd/0x1ee0 [mlx5_core]
|
|
|
d8f823 |
[ 110.392092] mlx5_load_one+0xc7a/0x3860 [mlx5_core]
|
|
|
d8f823 |
[ 110.392139] init_one+0x6ff/0xf90 [mlx5_core]
|
|
|
d8f823 |
[ 110.392145] local_pci_probe+0xde/0x190
|
|
|
d8f823 |
[ 110.392150] work_for_cpu_fn+0x56/0xa0
|
|
|
d8f823 |
[ 110.392153] process_one_work+0x678/0x1140
|
|
|
d8f823 |
[ 110.392157] worker_thread+0x573/0xba0
|
|
|
d8f823 |
[ 110.392162] kthread+0x341/0x400
|
|
|
d8f823 |
[ 110.392166] ret_from_fork+0x1f/0x40
|
|
|
d8f823 |
|
|
|
d8f823 |
[ 110.392218] Freed by task 2742:
|
|
|
d8f823 |
[ 110.392288] save_stack+0x21/0x90
|
|
|
d8f823 |
[ 110.392292] __kasan_slab_free+0x137/0x190
|
|
|
d8f823 |
[ 110.392296] kasan_slab_free+0xe/0x10
|
|
|
d8f823 |
[ 110.392299] kfree+0x94/0x250
|
|
|
d8f823 |
[ 110.392357] tree_put_node+0x257/0x360 [mlx5_core]
|
|
|
d8f823 |
[ 110.392413] tree_remove_node+0x63/0xb0 [mlx5_core]
|
|
|
d8f823 |
[ 110.392469] clean_tree+0x199/0x240 [mlx5_core]
|
|
|
d8f823 |
[ 110.392525] mlx5_cleanup_fs+0x76/0x580 [mlx5_core]
|
|
|
d8f823 |
[ 110.392572] mlx5_unload+0x22/0xc0 [mlx5_core]
|
|
|
d8f823 |
[ 110.392619] mlx5_unload_one+0x99/0x260 [mlx5_core]
|
|
|
d8f823 |
[ 110.392666] remove_one+0x61/0x160 [mlx5_core]
|
|
|
d8f823 |
[ 110.392671] pci_device_remove+0x10b/0x2c0
|
|
|
d8f823 |
[ 110.392677] device_release_driver_internal+0x1e4/0x490
|
|
|
d8f823 |
[ 110.392681] device_driver_detach+0x36/0x40
|
|
|
d8f823 |
[ 110.392685] unbind_store+0x147/0x200
|
|
|
d8f823 |
[ 110.392688] drv_attr_store+0x6f/0xb0
|
|
|
d8f823 |
[ 110.392693] sysfs_kf_write+0x127/0x1d0
|
|
|
d8f823 |
[ 110.392697] kernfs_fop_write+0x296/0x420
|
|
|
d8f823 |
[ 110.392702] __vfs_write+0x66/0x110
|
|
|
d8f823 |
[ 110.392707] vfs_write+0x1a0/0x500
|
|
|
d8f823 |
[ 110.392711] ksys_write+0x164/0x250
|
|
|
d8f823 |
[ 110.392715] __x64_sys_write+0x73/0xb0
|
|
|
d8f823 |
[ 110.392720] do_syscall_64+0x9f/0x3a0
|
|
|
d8f823 |
[ 110.392725] entry_SYSCALL_64_after_hwframe+0x44/0xa9
|
|
|
d8f823 |
|
|
|
d8f823 |
Fixes: 7dee607ed0e0 ("net/mlx5: Support lockless FTE read lookups")
|
|
|
d8f823 |
Signed-off-by: Parav Pandit <parav@mellanox.com>
|
|
|
d8f823 |
Signed-off-by: Saeed Mahameed <saeedm@mellanox.com>
|
|
|
d8f823 |
|
|
|
d8f823 |
Signed-off-by: Alaa Hleihel <ahleihel@redhat.com>
|
|
|
d8f823 |
Signed-off-by: Frantisek Hrbata <fhrbata@redhat.com>
|
|
|
d8f823 |
---
|
|
|
d8f823 |
drivers/net/ethernet/mellanox/mlx5/core/fs_core.c | 70 +++++------------------
|
|
|
d8f823 |
drivers/net/ethernet/mellanox/mlx5/core/fs_core.h | 1 -
|
|
|
d8f823 |
2 files changed, 15 insertions(+), 56 deletions(-)
|
|
|
d8f823 |
|
|
|
d8f823 |
diff --git a/drivers/net/ethernet/mellanox/mlx5/core/fs_core.c b/drivers/net/ethernet/mellanox/mlx5/core/fs_core.c
|
|
|
d8f823 |
index 7138dcf2e538..0e6a89b81972 100644
|
|
|
d8f823 |
--- a/drivers/net/ethernet/mellanox/mlx5/core/fs_core.c
|
|
|
d8f823 |
+++ b/drivers/net/ethernet/mellanox/mlx5/core/fs_core.c
|
|
|
d8f823 |
@@ -531,16 +531,9 @@ static void del_hw_fte(struct fs_node *node)
|
|
|
d8f823 |
}
|
|
|
d8f823 |
}
|
|
|
d8f823 |
|
|
|
d8f823 |
-static void del_sw_fte_rcu(struct rcu_head *head)
|
|
|
d8f823 |
-{
|
|
|
d8f823 |
- struct fs_fte *fte = container_of(head, struct fs_fte, rcu);
|
|
|
d8f823 |
- struct mlx5_flow_steering *steering = get_steering(&fte->node);
|
|
|
d8f823 |
-
|
|
|
d8f823 |
- kmem_cache_free(steering->ftes_cache, fte);
|
|
|
d8f823 |
-}
|
|
|
d8f823 |
-
|
|
|
d8f823 |
static void del_sw_fte(struct fs_node *node)
|
|
|
d8f823 |
{
|
|
|
d8f823 |
+ struct mlx5_flow_steering *steering = get_steering(node);
|
|
|
d8f823 |
struct mlx5_flow_group *fg;
|
|
|
d8f823 |
struct fs_fte *fte;
|
|
|
d8f823 |
int err;
|
|
|
d8f823 |
@@ -553,8 +546,7 @@ static void del_sw_fte(struct fs_node *node)
|
|
|
d8f823 |
rhash_fte);
|
|
|
d8f823 |
WARN_ON(err);
|
|
|
d8f823 |
ida_simple_remove(&fg->fte_allocator, fte->index - fg->start_index);
|
|
|
d8f823 |
-
|
|
|
d8f823 |
- call_rcu(&fte->rcu, del_sw_fte_rcu);
|
|
|
d8f823 |
+ kmem_cache_free(steering->ftes_cache, fte);
|
|
|
d8f823 |
}
|
|
|
d8f823 |
|
|
|
d8f823 |
static void del_hw_flow_group(struct fs_node *node)
|
|
|
d8f823 |
@@ -1634,47 +1626,22 @@ static u64 matched_fgs_get_version(struct list_head *match_head)
|
|
|
d8f823 |
}
|
|
|
d8f823 |
|
|
|
d8f823 |
static struct fs_fte *
|
|
|
d8f823 |
-lookup_fte_for_write_locked(struct mlx5_flow_group *g, const u32 *match_value)
|
|
|
d8f823 |
+lookup_fte_locked(struct mlx5_flow_group *g,
|
|
|
d8f823 |
+ const u32 *match_value,
|
|
|
d8f823 |
+ bool take_write)
|
|
|
d8f823 |
{
|
|
|
d8f823 |
struct fs_fte *fte_tmp;
|
|
|
d8f823 |
|
|
|
d8f823 |
- nested_down_write_ref_node(&g->node, FS_LOCK_PARENT);
|
|
|
d8f823 |
-
|
|
|
d8f823 |
- fte_tmp = rhashtable_lookup_fast(&g->ftes_hash, match_value, rhash_fte);
|
|
|
d8f823 |
- if (!fte_tmp || !tree_get_node(&fte_tmp->node)) {
|
|
|
d8f823 |
- fte_tmp = NULL;
|
|
|
d8f823 |
- goto out;
|
|
|
d8f823 |
- }
|
|
|
d8f823 |
-
|
|
|
d8f823 |
- if (!fte_tmp->node.active) {
|
|
|
d8f823 |
- tree_put_node(&fte_tmp->node, false);
|
|
|
d8f823 |
- fte_tmp = NULL;
|
|
|
d8f823 |
- goto out;
|
|
|
d8f823 |
- }
|
|
|
d8f823 |
- nested_down_write_ref_node(&fte_tmp->node, FS_LOCK_CHILD);
|
|
|
d8f823 |
-
|
|
|
d8f823 |
-out:
|
|
|
d8f823 |
- up_write_ref_node(&g->node, false);
|
|
|
d8f823 |
- return fte_tmp;
|
|
|
d8f823 |
-}
|
|
|
d8f823 |
-
|
|
|
d8f823 |
-static struct fs_fte *
|
|
|
d8f823 |
-lookup_fte_for_read_locked(struct mlx5_flow_group *g, const u32 *match_value)
|
|
|
d8f823 |
-{
|
|
|
d8f823 |
- struct fs_fte *fte_tmp;
|
|
|
d8f823 |
-
|
|
|
d8f823 |
- if (!tree_get_node(&g->node))
|
|
|
d8f823 |
- return NULL;
|
|
|
d8f823 |
-
|
|
|
d8f823 |
- rcu_read_lock();
|
|
|
d8f823 |
- fte_tmp = rhashtable_lookup(&g->ftes_hash, match_value, rhash_fte);
|
|
|
d8f823 |
+ if (take_write)
|
|
|
d8f823 |
+ nested_down_write_ref_node(&g->node, FS_LOCK_PARENT);
|
|
|
d8f823 |
+ else
|
|
|
d8f823 |
+ nested_down_read_ref_node(&g->node, FS_LOCK_PARENT);
|
|
|
d8f823 |
+ fte_tmp = rhashtable_lookup_fast(&g->ftes_hash, match_value,
|
|
|
d8f823 |
+ rhash_fte);
|
|
|
d8f823 |
if (!fte_tmp || !tree_get_node(&fte_tmp->node)) {
|
|
|
d8f823 |
- rcu_read_unlock();
|
|
|
d8f823 |
fte_tmp = NULL;
|
|
|
d8f823 |
goto out;
|
|
|
d8f823 |
}
|
|
|
d8f823 |
- rcu_read_unlock();
|
|
|
d8f823 |
-
|
|
|
d8f823 |
if (!fte_tmp->node.active) {
|
|
|
d8f823 |
tree_put_node(&fte_tmp->node, false);
|
|
|
d8f823 |
fte_tmp = NULL;
|
|
|
d8f823 |
@@ -1682,19 +1649,12 @@ lookup_fte_for_read_locked(struct mlx5_flow_group *g, const u32 *match_value)
|
|
|
d8f823 |
}
|
|
|
d8f823 |
|
|
|
d8f823 |
nested_down_write_ref_node(&fte_tmp->node, FS_LOCK_CHILD);
|
|
|
d8f823 |
-
|
|
|
d8f823 |
out:
|
|
|
d8f823 |
- tree_put_node(&g->node, false);
|
|
|
d8f823 |
- return fte_tmp;
|
|
|
d8f823 |
-}
|
|
|
d8f823 |
-
|
|
|
d8f823 |
-static struct fs_fte *
|
|
|
d8f823 |
-lookup_fte_locked(struct mlx5_flow_group *g, const u32 *match_value, bool write)
|
|
|
d8f823 |
-{
|
|
|
d8f823 |
- if (write)
|
|
|
d8f823 |
- return lookup_fte_for_write_locked(g, match_value);
|
|
|
d8f823 |
+ if (take_write)
|
|
|
d8f823 |
+ up_write_ref_node(&g->node, false);
|
|
|
d8f823 |
else
|
|
|
d8f823 |
- return lookup_fte_for_read_locked(g, match_value);
|
|
|
d8f823 |
+ up_read_ref_node(&g->node);
|
|
|
d8f823 |
+ return fte_tmp;
|
|
|
d8f823 |
}
|
|
|
d8f823 |
|
|
|
d8f823 |
static struct mlx5_flow_handle *
|
|
|
d8f823 |
diff --git a/drivers/net/ethernet/mellanox/mlx5/core/fs_core.h b/drivers/net/ethernet/mellanox/mlx5/core/fs_core.h
|
|
|
d8f823 |
index 8e4ca13f4d74..c6221ccbdddf 100644
|
|
|
d8f823 |
--- a/drivers/net/ethernet/mellanox/mlx5/core/fs_core.h
|
|
|
d8f823 |
+++ b/drivers/net/ethernet/mellanox/mlx5/core/fs_core.h
|
|
|
d8f823 |
@@ -205,7 +205,6 @@ struct fs_fte {
|
|
|
d8f823 |
enum fs_fte_status status;
|
|
|
d8f823 |
struct mlx5_fc *counter;
|
|
|
d8f823 |
struct rhash_head hash;
|
|
|
d8f823 |
- struct rcu_head rcu;
|
|
|
d8f823 |
int modify_mask;
|
|
|
d8f823 |
};
|
|
|
d8f823 |
|
|
|
d8f823 |
--
|
|
|
d8f823 |
2.13.6
|
|
|
d8f823 |
|