Oops#2 Part17 <7>[ 439.558042] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[3] 0x400c 0x13c <7>[ 439.558156] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[4] 0x4010 0x100 <7>[ 439.558260] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[5] 0x4014 0x100 <7>[ 439.558362] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[6] 0x4018 0x100 <7>[ 439.558463] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[7] 0x401c 0x100 <7>[ 439.558534] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[8] 0x4020 0x100 <7>[ 439.558604] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[9] 0x4024 0x100 <7>[ 439.558674] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[10] 0x4028 0x100 <7>[ 439.558743] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[11] 0x402c 0x100 <7>[ 439.558811] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[12] 0x4030 0x100 <7>[ 439.558892] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[13] 0x4034 0x100 <7>[ 439.558993] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[14] 0x4038 0x100 <7>[ 439.559091] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[15] 0x403c 0x100 <7>[ 439.559224] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying rcs0 save-restore MMIOs <7>[ 439.559337] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x2050] = 0x10001000 <7>[ 439.559446] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x20c4] = 0x3f7e0306 <7>[ 439.559547] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x20d4] = 0xc080c080 Oops#2 Part16 <7>[ 439.559625] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24d0] = 0x00006210 <7>[ 439.559697] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24d4] = 0x000062a8 <7>[ 439.559768] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24d8] = 0x1000dafc <7>[ 439.559836] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24dc] = 0x1000db01 <7>[ 439.559905] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24e0] = 0x0000db1c <7>[ 439.559990] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe194] = 0x00400040 <7>[ 439.560097] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe48c] = 0x02000200 <7>[ 439.560231] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe49c] = 0x40004000 <7>[ 439.560338] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe4c4] = 0x10401040 <7>[ 439.560446] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe4f0] = 0x00020002 <7>[ 439.560560] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe530] = 0x00000400 <7>[ 439.560654] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe7c8] = 0x04002000 <7>[ 439.560733] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe7cc] = 0x00009000 <7>[ 439.560809] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x14800] = 0x00020002 <7>[ 439.560956] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying bcs0 save-restore MMIOs <7>[ 439.561052] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x22050] = 0x10001000 Oops#2 Part15 <7>[ 439.561178] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x220c4] = 0x3f7e0306 <7>[ 439.561282] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x220d4] = 0xc080c080 <7>[ 439.561508] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying bcs8 save-restore MMIOs <7>[ 439.561619] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x3ee050] = 0x10001000 <7>[ 439.561693] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x3ee0c4] = 0x3f7e0306 <7>[ 439.561767] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x3ee0d4] = 0xc080c080 <7>[ 439.561912] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying ccs0 save-restore MMIOs <7>[ 439.561983] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a050] = 0x10001000 <7>[ 439.562086] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a0c4] = 0x3f7e0308 <7>[ 439.562218] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a0d4] = 0xc080c080 <7>[ 439.562332] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a4d0] = 0x1000dafc <7>[ 439.562434] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a4d4] = 0x1000db01 <7>[ 439.562538] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a4d8] = 0x0000db1c <7>[ 439.562734] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying ccs1 save-restore MMIOs <7>[ 439.562807] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c050] = 0x10001000 Oops#2 Part14 <7>[ 439.562879] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c0c4] = 0x3f7e0308 <7>[ 439.562951] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c0d4] = 0xc080c080 <7>[ 439.563022] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c4d0] = 0x1000dafc <7>[ 439.563114] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c4d4] = 0x1000db01 <7>[ 439.563255] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c4d8] = 0x0000db1c <7>[ 439.563788] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 439.567418] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 0] = 0x0196f1cf <7>[ 439.567493] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 1] = 0x00000800 <7>[ 439.567556] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 2] = 0x00000014 <7>[ 439.567616] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 3] = 0x00000001 <7>[ 439.567677] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 4] = 0x00000c00 <7>[ 439.567736] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 5] = 0xe20b0000 <7>[ 439.567796] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 6] = 0x00000000 <7>[ 439.567855] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 7] = 0x00000000 <7>[ 439.567914] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 8] = 0x00000000 <7>[ 439.567973] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 9] = 0x00000000 Oops#2 Part13 <7>[ 439.568032] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[10] = 0x00000000 <7>[ 439.568090] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[11] = 0x00000000 <7>[ 439.568164] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[12] = 0x00000000 <7>[ 439.568228] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[13] = 0x00000000 <7>[ 439.568320] xe 0000:03:00.0: [drm:xe_guc_id_mgr_init [xe]] Tile0: GT0: using 65535 GuC IDs <7>[ 439.568414] xe 0000:03:00.0: [drm:xe_guc_db_mgr_init [xe]] Tile0: GT0: using 256 doorbells <7>[ 439.569615] xe 0000:03:00.0: [drm:guc_buf_cache_init [xe]] Tile0: GT0: reusable buffer with 2097152 dwords at 0xe8c000 for xe_guc_buf_cache_init_with_size [xe] <7>[ 439.570596] xe 0000:03:00.0: [drm:xe_migrate_init [xe]] Migrate min chunk size is 0x00010000 <7>[ 439.571589] xe 0000:03:00.0: [drm:xe_guc_capture_steered_list_init [xe]] Tile0: GT0: capture found 120 ext-regs. <7>[ 439.593667] xe 0000:03:00.0: [drm:xe_guc_ads_populate [xe]] Tile0: GT0: Updated ADS capture size 20480 (was 49152) <7>[ 439.604458] xe 0000:03:00.0: [drm:guc_wait_ucode [xe]] Tile0: GT0: GuC load: init took 10ms, freq = 2150MHz (req = 2133MHz), before = 2150MHz, status = 0x8002F034 <7>[ 439.604731] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel enabled <7>[ 439.605370] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC rcs0 WA job: 4146 dwords <7>[ 439.605454] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x5588] = 0x04000400 Oops#2 Part12 <7>[ 439.605524] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6204] = 0x00400040 <7>[ 439.605588] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6208] = 0x00200020 <7>[ 439.605655] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x62a8] = 0x02400240 <7>[ 439.605720] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7010] = 0x40004000 <7>[ 439.605784] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7044] = 0x04200420 <7>[ 439.605848] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7300] = 0x10001000 <7>[ 439.605915] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x83a8] = 0x20002000 <7>[ 439.605986] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6210] = ~0x3f18000|0x3f18000 (MCR) <7>[ 439.607712] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC bcs0 WA job: 27 dwords <7>[ 439.607792] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x22204] = ~0x7e7e|0x606 <7>[ 439.607860] xe 0000:03:00.0: [drm:xe_lrc_emit_hwe_state_instructions [xe]] Tile0: GT0: No non-register state to emit on graphics ver 20.01 <7>[ 439.609689] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC ccs0 WA job: 0 dwords <7>[ 439.609767] xe 0000:03:00.0: [drm:xe_lrc_emit_hwe_state_instructions [xe]] Tile0: GT0: No non-register state to emit on graphics ver 20.01 <5>[ 439.612486] FAULT_INJECTION: forcing a failure. <5>[ 439.612486] name fail_function, interval 0, probability 100, space 1, times 100 Oops#2 Part11 <3>[ 439.612490] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC PC query task state failed: -ENOMEM <4>[ 439.612506] ------------[ cut here ]------------ <4>[ 439.612507] xe 0000:03:00.0: [drm] Assertion `ct->g2h_outstanding == 0 || state == XE_GUC_CT_STATE_STOPPED` failed! <4>[ 439.612507] platform: BATTLEMAGE subplatform: 7 <4>[ 439.612507] graphics: Xe2_HPG 20.01 step A0 <4>[ 439.612507] media: Xe2_HPM 13.01 step A1 <4>[ 439.612507] tile: 0 VRAM 12.0 GiB <4>[ 439.612507] GT: 0 type 1 <4>[ 439.612510] WARNING: drivers/gpu/drm/xe/xe_guc_ct.c:541 at guc_ct_change_state+0x264/0x330 [xe], CPU#5: xe_fault_inject/6223 <4>[ 439.612589] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_gsc_proxy mei_lb mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp cmdlinepart hid_generic spi_nor coretemp eeepc_wmi mtd asus_wmi mei_hdcp mei_pxp sparse_keymap platform_profile wmi_bmof kvm_intel kvm irqbypass ghash_clmulni_intel usbhid aesni_intel hid rapl r8169 snd_intel_dspcfg snd_hda_codec intel_cstate snd_hda_core realtek snd_hwdep snd_pcm video binfmt_misc snd_timer i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 spi_intel soundcore i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry acpi_tad acpi_pad pinctrl_alderlake wmi intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part10 <4>[ 439.612641] autofs4 [last unloaded: snd_hda_intel] <4>[ 439.612645] CPU: 5 UID: 0 PID: 6223 Comm: xe_fault_inject Tainted: G S U W L 7.0.0-rc2-lgci-xe-xe-4676-986ab51c0937c489d-debug+ #1 PREEMPT(lazy) <4>[ 439.612648] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN, [L]=SOFTLOCKUP <4>[ 439.612649] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 439.612650] RIP: 0010:guc_ct_change_state+0x2d8/0x330 [xe] <4>[ 439.612724] Code: 51 48 c1 ea 25 44 6b ca 64 44 29 c9 51 48 c7 c1 a0 7e 18 a1 52 4c 8b 55 88 41 52 44 8b 4d 9c 4c 8b 45 90 48 8b 95 78 ff ff ff <67> 48 0f b9 3a 8b 8b 50 01 00 00 48 83 c4 60 85 c9 75 13 44 89 bb <4>[ 439.612726] RSP: 0018:ffffc90007fdb668 EFLAGS: 00010002 <4>[ 439.612728] RAX: ffffffffa11fd6f9 RBX: ffff888250f68738 RCX: ffffffffa1187ea0 <4>[ 439.612729] RDX: ffff88810469c690 RSI: ffffffffa11fd6f9 RDI: ffffffffa1002f00 <4>[ 439.612730] RBP: ffffc90007fdb750 R08: ffffffffa11fd749 R09: 0000000000000007 <4>[ 439.612731] R10: ffffffffa11fd7fa R11: 0000000000000514 R12: ffff888250f687c8 <4>[ 439.612732] R13: 0000000000000001 R14: 0000000000000000 R15: 0000000000000001 Oops#2 Part9 <4>[ 439.612733] FS: 000073b6fac08980(0000) GS:ffff8888daf19000(0000) knlGS:0000000000000000 <4>[ 439.612735] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 439.612736] CR2: 00005ca49aee69f0 CR3: 0000000177ecf005 CR4: 0000000000f72ef0 <4>[ 439.612737] PKRU: 55555554 <4>[ 439.612738] Call Trace: <4>[ 439.612739] <4>[ 439.612747] ? xe_guc_submit_enable+0xa8/0xf0 [xe] <4>[ 439.612825] xe_guc_ct_disable+0x17/0x80 [xe] <4>[ 439.612896] xe_guc_sanitize+0x2a/0x50 [xe] <4>[ 439.612963] xe_uc_load_hw+0x19a/0x2b0 [xe] <4>[ 439.613060] ? xe_migrate_init+0x277/0x2d0 [xe] <4>[ 439.613143] xe_gt_init+0x35d/0xab0 [xe] <4>[ 439.613221] ? _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 439.613227] ? __devm_add_action+0x70/0xa0 <4>[ 439.613231] ? xe_irq_install+0x11a/0x490 [xe] <4>[ 439.613321] xe_device_probe+0x32c/0xbe0 [xe] <4>[ 439.613396] ? __drm_dev_dbg+0x7d/0xb0 <4>[ 439.613401] ? __drmm_add_action_or_reset+0x1e/0x50 <4>[ 439.613407] xe_pci_probe+0x39b/0x620 [xe] <4>[ 439.613498] ? trace_hardirqs_on+0x22/0x100 <4>[ 439.613506] local_pci_probe+0x47/0xb0 <4>[ 439.613511] pci_call_probe+0x6c/0x360 <4>[ 439.613516] ? _raw_spin_unlock+0x22/0x50 <4>[ 439.613521] pci_device_probe+0xae/0x110 <4>[ 439.613525] really_probe+0xf1/0x410 <4>[ 439.613529] __driver_probe_device+0x8c/0x190 <4>[ 439.613532] device_driver_attach+0x57/0xd0 <4>[ 439.613535] bind_store+0x142/0x150 <4>[ 439.613539] drv_attr_store+0x24/0x50 <4>[ 439.613542] sysfs_kf_write+0x4d/0x80 <4>[ 439.613547] kernfs_fop_write_iter+0x188/0x240 <4>[ 439.613551] vfs_write+0x283/0x540 <4>[ 439.613559] ksys_write+0x6f/0xf0 Oops#2 Part8 <4>[ 439.613562] __x64_sys_write+0x19/0x30 <4>[ 439.613564] x64_sys_call+0x259/0x26e0 <4>[ 439.613568] do_syscall_64+0xdd/0x1470 <4>[ 439.613573] ? putname+0x41/0x90 <4>[ 439.613575] ? do_sys_openat2+0x85/0xd0 <4>[ 439.613581] ? __x64_sys_openat+0x54/0xa0 <4>[ 439.613583] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 439.613587] ? do_syscall_64+0x22e/0x1470 <4>[ 439.613590] ? ksys_write+0x6f/0xf0 <4>[ 439.613593] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 439.613597] ? do_syscall_64+0x22e/0x1470 <4>[ 439.613599] ? do_syscall_64+0x22e/0x1470 <4>[ 439.613603] entry_SYSCALL_64_after_hwframe+0x76/0x7e <4>[ 439.613605] RIP: 0033:0x73b6fcd1c5a4 <4>[ 439.613609] Code: c7 00 16 00 00 00 b8 ff ff ff ff c3 66 2e 0f 1f 84 00 00 00 00 00 f3 0f 1e fa 80 3d a5 ea 0e 00 00 74 13 b8 01 00 00 00 0f 05 <48> 3d 00 f0 ff ff 77 54 c3 0f 1f 00 55 48 89 e5 48 83 ec 20 48 89 <4>[ 439.613610] RSP: 002b:00007fff26146558 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 439.613612] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 000073b6fcd1c5a4 <4>[ 439.613613] RDX: 000000000000000c RSI: 00007fff26146a20 RDI: 0000000000000007 <4>[ 439.613614] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 439.613616] R10: 0000000000000000 R11: 0000000000000202 R12: 00007fff26146a20 <4>[ 439.613617] R13: 0000000000000007 R14: 0000000000000006 R15: 00007fff261466d0 <4>[ 439.613624] <4>[ 439.613626] irq event stamp: 1493636 <4>[ 439.613627] hardirqs last enabled at (1493635): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 439.613630] hardirqs last disabled at (1493636): [] _raw_spin_lock_irq+0x6f/0x80 Oops#2 Part7 <4>[ 439.613632] softirqs last enabled at (1491412): [] __irq_exit_rcu+0x13f/0x160 <4>[ 439.613635] softirqs last disabled at (1491405): [] __irq_exit_rcu+0x13f/0x160 <4>[ 439.613637] ---[ end trace 0000000000000000 ]--- <7>[ 439.613639] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 439.613736] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 439.614317] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 439.614681] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 439.616013] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 439.686033] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 439.687848] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <6>[ 440.023783] pcieport 0000:00:06.0: AER: Multiple Correctable error message received from 0000:05:00.0 <4>[ 440.023791] nvme 0000:05:00.0: PCIe Bus Error: severity=Correctable, type=Physical Layer, (Receiver ID) <4>[ 440.023794] nvme 0000:05:00.0: device [15b7:5017] error status/mask=00000001/0000e000 <4>[ 440.023797] nvme 0000:05:00.0: [ 0] RxErr (First) <3>[ 441.879902] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=53 recv=52 <1>[ 441.881804] BUG: unable to handle page fault for address: ffffc9002238a188 Oops#2 Part6 <1>[ 441.881833] #PF: supervisor write access in kernel mode <1>[ 441.881852] #PF: error_code(0x0002) - not-present page <6>[ 441.881866] PGD 100000067 P4D 100000067 PUD 100ab7067 PMD 0 <4>[ 441.881891] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 441.881910] CPU: 12 UID: 0 PID: 2410 Comm: kworker/12:3 Tainted: G S U W L 7.0.0-rc2-lgci-xe-xe-4676-986ab51c0937c489d-debug+ #1 PREEMPT(lazy) <4>[ 441.881946] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN, [L]=SOFTLOCKUP <4>[ 441.881961] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 441.881983] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 441.882504] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 441.883000] Code: 24 66 90 65 8b 05 2c 6c 2e e3 48 0f a3 05 d0 d1 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 441.883036] RSP: 0018:ffffc90003ee37e0 EFLAGS: 00010086 <4>[ 441.883054] RAX: 0000000000000002 RBX: ffffc9002238a188 RCX: 0000000000000000 <4>[ 441.883072] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888124dd8060 <4>[ 441.883089] RBP: ffffc90003ee3858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 441.883106] R10: ffff888275ca8000 R11: 0000000000000001 R12: ffff888124dd8060 <4>[ 441.883123] R13: 000000000000a188 R14: ffff888275ca8000 R15: 0000000000010001 <4>[ 441.883140] FS: 0000000000000000(0000) GS:ffff8888db299000(0000) knlGS:0000000000000000 <4>[ 441.883161] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 441.883176] CR2: ffffc9002238a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 Oops#2 Part5 <4>[ 441.883194] PKRU: 55555554 <4>[ 441.883205] Call Trace: <4>[ 441.883214] <4>[ 441.883232] xe_force_wake_get+0x2a5/0x940 [xe] <4>[ 441.883653] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 441.883682] ? mark_held_locks+0x46/0x90 <4>[ 441.883704] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 441.884161] ? trace_hardirqs_on+0x22/0x100 <4>[ 441.884183] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 441.884201] ? xe_tlb_inval_fence_prep+0xce/0x1e0 [xe] <4>[ 441.884727] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 441.885246] ? xelpg_ggtt_pte_flags+0x27/0x1a0 [xe] <4>[ 441.885669] ? find_held_lock+0x31/0x90 <4>[ 441.885685] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 441.886108] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 441.886524] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 441.886938] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 441.887127] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 441.887228] ? _raw_write_unlock+0x22/0x50 <4>[ 441.887232] ? drm_vma_offset_remove+0x65/0x80 <4>[ 441.887238] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 441.887335] ? lock_is_held_type+0xa3/0x130 <4>[ 441.887342] ttm_bo_release+0x70/0x310 [ttm] <4>[ 441.887352] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 441.887452] ? lock_release+0xd0/0x2b0 <4>[ 441.887456] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 441.887465] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 441.887560] drm_gem_object_free+0x1d/0x40 <4>[ 441.887564] xe_bo_put+0x12a/0x190 [xe] <4>[ 441.887661] xe_lrc_destroy+0x74/0x90 [xe] <4>[ 441.887775] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 441.887874] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 441.887974] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] Oops#2 Part4 <4>[ 441.888084] process_one_work+0x22e/0x740 <4>[ 441.888090] worker_thread+0x1e8/0x3d0 <4>[ 441.888093] ? __pfx_worker_thread+0x10/0x10 <4>[ 441.888097] kthread+0x10d/0x150 <4>[ 441.888101] ? __pfx_kthread+0x10/0x10 <4>[ 441.888106] ret_from_fork+0x3d4/0x480 <4>[ 441.888110] ? __pfx_kthread+0x10/0x10 <4>[ 441.888114] ret_from_fork_asm+0x1a/0x30 <4>[ 441.888121] <4>[ 441.888123] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_gsc_proxy mei_lb mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp cmdlinepart hid_generic spi_nor coretemp eeepc_wmi mtd asus_wmi mei_hdcp mei_pxp sparse_keymap platform_profile wmi_bmof kvm_intel kvm irqbypass ghash_clmulni_intel usbhid aesni_intel hid rapl r8169 snd_intel_dspcfg snd_hda_codec intel_cstate snd_hda_core realtek snd_hwdep snd_pcm video binfmt_misc snd_timer i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 spi_intel soundcore i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry acpi_tad acpi_pad pinctrl_alderlake wmi intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 441.888168] autofs4 [last unloaded: snd_hda_intel] <4>[ 441.888203] CR2: ffffc9002238a188 <4>[ 441.888207] ---[ end trace 0000000000000000 ]--- <6>[ 441.992538] pcieport 0000:00:06.0: AER: Multiple Correctable error message received from 0000:05:00.0 Oops#2 Part3 <4>[ 441.992547] nvme 0000:05:00.0: PCIe Bus Error: severity=Correctable, type=Physical Layer, (Receiver ID) <4>[ 441.992551] nvme 0000:05:00.0: device [15b7:5017] error status/mask=00000001/0000e000 <4>[ 441.992554] nvme 0000:05:00.0: [ 0] RxErr (First) <4>[ 442.071637] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 442.071767] Code: 24 66 90 65 8b 05 2c 6c 2e e3 48 0f a3 05 d0 d1 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 442.071776] RSP: 0018:ffffc90003ee37e0 EFLAGS: 00010086 <4>[ 442.071780] RAX: 0000000000000002 RBX: ffffc9002238a188 RCX: 0000000000000000 <4>[ 442.071784] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888124dd8060 <4>[ 442.071788] RBP: ffffc90003ee3858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 442.071792] R10: ffff888275ca8000 R11: 0000000000000001 R12: ffff888124dd8060 <4>[ 442.071795] R13: 000000000000a188 R14: ffff888275ca8000 R15: 0000000000010001 <4>[ 442.071799] FS: 0000000000000000(0000) GS:ffff8888db299000(0000) knlGS:0000000000000000 <4>[ 442.071804] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 442.071808] CR2: ffffc9002238a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 442.071811] PKRU: 55555554 <6>[ 442.071814] note: kworker/12:3[2410] exited with irqs disabled <6>[ 442.071838] note: kworker/12:3[2410] exited with preempt_count 1 <1>[ 444.182409] BUG: unable to handle page fault for address: ffffc90003ee3a90 <1>[ 444.182439] #PF: supervisor read access in kernel mode Oops#2 Part2 <1>[ 444.182452] #PF: error_code(0x0000) - not-present page <6>[ 444.182464] PGD 100000067 P4D 100000067 PUD 100ab7067 PMD 12cf34067 PTE 0 <4>[ 444.182486] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 444.182503] CPU: 4 UID: 0 PID: 3858 Comm: kworker/u64:56 Tainted: G S UD W L 7.0.0-rc2-lgci-xe-xe-4676-986ab51c0937c489d-debug+ #1 PREEMPT(lazy) <4>[ 444.182532] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN, [L]=SOFTLOCKUP <4>[ 444.182546] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 444.182561] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 444.183098] RIP: 0010:xe_tlb_inval_fence_timeout+0x65/0x220 [xe] <4>[ 444.183608] Code: 89 df 48 89 45 d0 49 8b 85 08 ff ff ff 48 8b 40 20 2e 2e 2e ff d0 49 8d 45 c0 48 89 c7 48 89 45 b8 e8 1f d2 c7 e1 49 8b 45 b0 <48> 8b 30 4c 8d 78 80 48 8d 5e 80 49 8d 75 b0 48 89 75 c8 48 39 c6 <4>[ 444.183643] RSP: 0018:ffffc9000a6d7db0 EFLAGS: 00010046 <4>[ 444.183660] RAX: ffffc90003ee3a90 RBX: ffff888124dd8458 RCX: 0000000000000000 <4>[ 444.183676] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000000 <4>[ 444.183692] RBP: ffffc9000a6d7df8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 444.183707] R10: 0000000000000000 R11: 0000000000000000 R12: ffff888275ca8000 <4>[ 444.183722] R13: ffff888124dd8560 R14: ffff888124dd8560 R15: ffff888271436ec0 <4>[ 444.183738] FS: 0000000000000000(0000) GS:ffff8888dae99000(0000) knlGS:0000000000000000 <4>[ 444.183758] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 444.183772] CR2: ffffc90003ee3a90 CR3: 000000000344c004 CR4: 0000000000f72ef0 Oops#2 Part1 <4>[ 444.183789] PKRU: 55555554 <4>[ 444.183798] Call Trace: <4>[ 444.183807] <4>[ 444.183823] process_one_work+0x22e/0x740 <4>[ 444.183851] worker_thread+0x1e8/0x3d0 <4>[ 444.183866] ? __pfx_worker_thread+0x10/0x10 <4>[ 444.183881] kthread+0x10d/0x150 <4>[ 444.183899] ? __pfx_kthread+0x10/0x10 <4>[ 444.183917] ret_from_fork+0x3d4/0x480 <4>[ 444.183931] ? __pfx_kthread+0x10/0x10 <4>[ 444.183949] ret_from_fork_asm+0x1a/0x30 <4>[ 444.183975] <4>[ 444.183983] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_gsc_proxy mei_lb mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp cmdlinepart hid_generic spi_nor coretemp eeepc_wmi mtd asus_wmi mei_hdcp mei_pxp sparse_keymap platform_profile wmi_bmof kvm_intel kvm irqbypass ghash_clmulni_intel usbhid aesni_intel hid rapl r8169 snd_intel_dspcfg snd_hda_codec intel_cstate snd_hda_core realtek snd_hwdep snd_pcm video binfmt_misc snd_timer i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 spi_intel soundcore i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry acpi_tad acpi_pad pinctrl_alderlake wmi intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 444.184168] autofs4 [last unloaded: snd_hda_intel] <4>[ 444.184318] CR2: ffffc90003ee3a90 <4>[ 444.184331] ---[ end trace 0000000000000000 ]---