-
Bug
-
Resolution: Done
-
Undefined
-
None
-
rhel-9.4
-
None
-
None
-
None
-
rhel-sst-network-fastdatapath
-
ssg_networking
-
None
-
False
-
-
None
-
None
-
None
-
None
-
None
What were you trying to do that didn't work?
Kernel panic when running the bbdev test on an ACC100 card with dpdk-22.11-4.el9
Please provide the package NVR for which the bug is seen:
[root@dell-per750-37 ~]# rpm -qa|grep dpdk
dpdk-22.11-4.el9.x86_64
dpdk-tools-22.11-4.el9.x86_64
[root@dell-per750-37 ~]# uname -r
5.14.0-427.13.1.el9_4.x86_64
How reproducible:
Steps to reproduce
[root@dell-per750-37 ~]# lspci|grep accelerators
b2:00.0 Processing accelerators: Intel Corporation Device 0d5c
- modprobe vfio-pci enable_sriov=1
- dpdk-devbind.py -b vfio-pci 0000:b2:00.0
- pf_bb_config acc100 -p 0000:b2:00.0 -v b99fb1ff-7e65-43d6-9e3f-c1fc341ba4a6 -c /usr/share/pf-bb-config/acc100/acc100_config_vf.cfg
- echo 16 > /sys/bus/pci/devices/0000:b2:00.0/sriov_numvfs
Expected results
There is no kernel panic
Actual results
Job link: https://beaker.engineering.redhat.com/jobs/9461861
There is a kernel panic. The console log shows the following blocked-task call traces:
[ 738.703182] task:runtest.sh state stack:0 pid:2571 ppid:2545 flags:0x00004002
[ 738.703662] Call Trace:
[ 738.704110] <TASK>
[ 738.704582] __schedule+0x21b/0x550
[ 738.705094] schedule+0x2d/0x70
[ 738.705571] schedule_preempt_disabled+0x11/0x20
[ 738.706029] rwsem_down_write_slowpath+0x23d/0x500
[ 738.706475] down_write+0x58/0x60
[ 738.706922] pci_add_new_bus+0x2b/0x90
[ 738.707360] pci_iov_add_virtfn+0x2d3/0x330
[ 738.707804] sriov_enable+0x212/0x3e0
[ 738.708235] vfio_pci_core_sriov_configure+0x144/0x1b0 [vfio_pci_core]
[ 738.708691] sriov_numvfs_store+0xb7/0x140
[ 738.709120] kernfs_fop_write_iter+0x121/0x1b0
[ 738.709566] vfs_write+0x2cb/0x410
[ 738.710014] ksys_write+0x5f/0xe0
[ 738.710444] do_syscall_64+0x59/0x90
[ 738.710865] ? handle_mm_fault+0xcd/0x290
[ 738.711282] ? do_user_addr_fault+0x1d6/0x6a0
[ 738.711712] ? exc_page_fault+0x62/0x150
[ 738.712105] entry_SYSCALL_64_after_hwframe+0x72/0xdc
[ 738.712518] RIP: 0033:0x7f52918fda57
[ 738.712942] RSP: 002b:00007ffcaf999768 EFLAGS: 00000246 ORIG_RAX: 0000000000000001
[ 738.713341] RAX: ffffffffffffffda RBX: 0000000000000003 RCX: 00007f52918fda57
[ 738.713748] RDX: 0000000000000003 RSI: 000056048ea4ccb0 RDI: 0000000000000001
[ 738.714134] RBP: 000056048ea4ccb0 R08: 0000000000000000 R09: 00007f52919b14e0
[ 738.714548] R10: 00007f52919b13e0 R11: 0000000000000246 R12: 0000000000000003
[ 738.714976] R13: 00007f52919fb780 R14: 0000000000000003 R15: 00007f52919f69e0
[ 738.715390] </TASK>
[ 861.568571] INFO: task kworker/0:3:614 blocked for more than 245 seconds.
[ 861.569002] Not tainted 5.14.0-427.13.1.el9_4.x86_64 #1
[ 861.569428] "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message.
[ 861.569884] task:kworker/0:3 state stack:0 pid:614 ppid:2 flags:0x00004000
[ 861.570377] Workqueue: events aer_recover_work_func
[ 861.570852] Call Trace:
[ 861.571316] <TASK>
[ 861.571774] __schedule+0x21b/0x550
[ 861.572237] schedule+0x2d/0x70
[ 861.572688] schedule_preempt_disabled+0x11/0x20
[ 861.573148] __mutex_lock.constprop.0+0x433/0x6a0
[ 861.573600] ? __pfx_aer_root_reset+0x10/0x10
[ 861.574063] report_error_detected+0x25/0x150
[ 861.574507] ? __pfx_report_frozen_detected+0x10/0x10
[ 861.574514] pci_walk_bus+0x6f/0x90
[ 861.574518] pcie_do_recovery+0x222/0x310
[ 861.574522] aer_recover_work_func.cold+0x8d/0x8f
[ 861.574526] process_one_work+0x1e2/0x3b0
[ 861.574530] ? __pfx_worker_thread+0x10/0x10
[ 861.574532] worker_thread+0x50/0x3a0
[ 861.574535] ? __pfx_worker_thread+0x10/0x10
[ 861.574536] kthread+0xdd/0x100
[ 861.574539] ? __pfx_kthread+0x10/0x10
[ 861.574543] ret_from_fork+0x29/0x50
[ 861.574548] </TASK>