The system crashes, which makes running apport-collect after the fact impossible, but I can confirm this is a bug. As the upstream nvme driver maintainer, I can recommend either which driver commits need to be reverted or which kernel commit needs to be cherry-picked (preferring the latter :)).
Here is a snippet of the stack trace:
<3>[51827.132142] BUG: scheduling while atomic: swapper/19/0/0x00000100
<4>[51827.242686] Modules linked in: nvme binfmt_misc PlxSvc(OE) ipmi_devintf intel_rapl x86_pkg_temp_thermal intel_powerclamp coretemp kvm irqbypass input_leds joydev sb_edac ipmi_ssif edac_core mei_me mei lpc_ich ioatdma shpchp ipmi_si ipmi_msghandler 8250_fintek acpi_pad acpi_power_meter mac_hid ib_iser rdma_cm iw_cm ib_cm ib_sa ib_mad ib_core ib_addr iscsi_tcp libiscsi_tcp libiscsi scsi_transport_iscsi autofs4 btrfs raid10 raid456 async_raid6_recov async_memcpy async_pq async_xor async_tx xor raid6_pq libcrc32c raid1 raid0 multipath linear igb dca ptp ahci crct10dif_pclmul crc32_pclmul hid_generic mxm_wmi aesni_intel aes_x86_64 lrw gf128mul usbhid glue_helper ablk_helper pps_core cryptd hid libahci i2c_algo_bit fjes wmi
<4>[51827.242743] CPU: 19 PID: 0 Comm: swapper/19 Tainted: G W OE 4.4.0-24-generic #43-Ubuntu
<4>[51827.242746] Hardware name: Intel Corporation S2600WT2/S2600WT2, BIOS SE5C610.86B.11.01.0132.060620160917 06/06/2016
<4>[51827.242748] 0000000000000286 374975818f2884ca ffff88105de43a98 ffffffff813eab23
<4>[51827.242752] ffff88105de56d00 0000000000000000 ffff88105de43aa8 ffffffff810a5ceb
<4>[51827.242762] ffff88105de43af8 ffffffff818217d6 ffff88105de43ac8 3749758100000013
<4>[51827.242765] Call Trace:
<4>[51827.242768] <IRQ> [<ffffffff813eab23>] dump_stack+0x63/0x90
<4>[51827.242781] [<ffffffff810a5ceb>] __schedule_bug+0x4b/0x60
<4>[51827.242788] [<ffffffff818217d6>] __schedule+0x726/0xa30
<4>[51827.242792] [<ffffffff81821b15>] schedule+0x35/0x80
<4>[51827.242797] [<ffffffff81824ba9>] schedule_timeout+0x129/0x270
<4>[51827.242802] [<ffffffff810ec480>] ? trace_event_raw_event_tick_stop+0x120/0x120
<4>[51827.242807] [<ffffffff810ec89d>] msleep+0x2d/0x40
<4>[51827.242813] [<ffffffffc02cd470>] nvme_wait_ready+0x90/0x100 [nvme]
<4>[51827.242818] [<ffffffffc02cee70>] nvme_disable_ctrl+0x40/0x50 [nvme]
<4>[51827.242823] [<ffffffffc02d1b3d>] nvme_disable_admin_queue+0x8d/0x90 [nvme]
<4>[51827.242828] [<ffffffffc02d1dde>] nvme_dev_disable+0x29e/0x2c0 [nvme]
<4>[51827.242833] [<ffffffffc02d03a0>] ? __nvme_process_cq+0x200/0x200 [nvme]
<4>[51827.242838] [<ffffffff8154955c>] ? dev_warn+0x6c/0x90
<4>[51827.242843] [<ffffffffc02d1ff0>] nvme_timeout+0x110/0x1d0 [nvme]
<4>[51827.242847] [<ffffffff813ea92f>] ? cpumask_next_and+0x2f/0x40
<4>[51827.242850] [<ffffffff810bd4bc>] ? load_balance+0x18c/0x980
<4>[51827.242854] [<ffffffff813c5cdf>] blk_mq_rq_timed_out+0x2f/0x70
<4>[51827.242857] [<ffffffff813c5d6e>] blk_mq_check_expired+0x4e/0x80
<4>[51827.242861] [<ffffffff813c86c8>] bt_for_each+0xd8/0xe0
<4>[51827.242864] [<ffffffff813c5d20>] ? blk_mq_rq_timed_out+0x70/0x70
<4>[51827.242868] [<ffffffff813c5d20>] ? blk_mq_rq_timed_out+0x70/0x70
<4>[51827.242871] [<ffffffff813c8ed7>] blk_mq_queue_tag_busy_iter+0x47/0xc0
<4>[51827.242875] [<ffffffff813c4a80>] ? blk_mq_attempt_merge+0xb0/0xb0
<4>[51827.242878] [<ffffffff813c4ac1>] blk_mq_rq_timer+0x41/0xf0
<4>[51827.242882] [<ffffffff810ec4c5>] call_timer_fn+0x35/0x120
<4>[51827.242885] [<ffffffff813c4a80>] ? blk_mq_attempt_merge+0xb0/0xb0
<4>[51827.242890] [<ffffffff810ece7a>] run_timer_softirq+0x23a/0x2f0
<4>[51827.242894] [<ffffffff81085b11>] __do_softirq+0x101/0x290
<4>[51827.242899] [<ffffffff81085e13>] irq_exit+0xa3/0xb0
<4>[51827.242902] [<ffffffff818286a2>] smp_apic_timer_interrupt+0x42/0x50
<4>[51827.242905] [<ffffffff81826962>] apic_timer_interrupt+0x82/0x90
<4>[51827.242907] <EOI> [<ffffffff816bcd21>] ? cpuidle_enter_state+0x111/0x2b0
<4>[51827.242914] [<ffffffff816bcef7>] cpuidle_enter+0x17/0x20
<4>[51827.242918] [<ffffffff810c3ec2>] call_cpuidle+0x32/0x60
<4>[51827.242921] [<ffffffff816bced3>] ? cpuidle_select+0x13/0x20
<4>[51827.242925] [<ffffffff810c4180>] cpu_startup_entry+0x290/0x350
<4>[51827.242929] [<ffffffff81051714>] start_secondary+0x154/0x190
<3>[51827.242934] bad: scheduling from the idle thread!