Oops#2 Part15 <7>[ 403.712946] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7300] = 0x10001000 <7>[ 403.713046] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x83a8] = 0x20002000 <7>[ 403.713181] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6210] = ~0x3f18000|0x3f18000 (MCR) <7>[ 403.715080] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC bcs0 WA job: 27 dwords <7>[ 403.715147] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x22204] = ~0x7e7e|0x606 <7>[ 403.715206] xe 0000:03:00.0: [drm:xe_lrc_emit_hwe_state_instructions [xe]] Tile0: GT0: No non-register state to emit on graphics ver 20.01 <7>[ 403.717345] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC ccs0 WA job: 0 dwords <7>[ 403.717410] xe 0000:03:00.0: [drm:xe_lrc_emit_hwe_state_instructions [xe]] Tile0: GT0: No non-register state to emit on graphics ver 20.01 <5>[ 403.719599] FAULT_INJECTION: forcing a failure. <5>[ 403.719599] name fail_function, interval 0, probability 100, space 1, times 100 <3>[ 403.719603] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC PC query task state failed: -ENOMEM <4>[ 403.719617] ------------[ cut here ]------------ <4>[ 403.719619] xe 0000:03:00.0: [drm] Assertion `ct->g2h_outstanding == 0 || state == XE_GUC_CT_STATE_STOPPED` failed! <4>[ 403.719619] platform: BATTLEMAGE subplatform: 7 <4>[ 403.719619] graphics: Xe2_HPG 20.01 step A0 <4>[ 403.719619] media: Xe2_HPM 13.01 step A1 <4>[ 403.719619] tile: 0 VRAM 12.0 GiB <4>[ 403.719619] GT: 0 type 1 Oops#2 Part14 <4>[ 403.719621] WARNING: drivers/gpu/drm/xe/xe_guc_ct.c:541 at guc_ct_change_state+0x264/0x330 [xe], CPU#4: xe_fault_inject/7193 <4>[ 403.719687] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic cmdlinepart coretemp mei_hdcp spi_nor eeepc_wmi mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid kvm irqbypass ghash_clmulni_intel aesni_intel rapl snd_intel_dspcfg snd_hda_codec snd_hda_core intel_cstate snd_hwdep snd_pcm video r8169 realtek snd_timer binfmt_misc i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 soundcore spi_intel i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry wmi acpi_pad intel_vsec pinctrl_alderlake acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 403.719736] autofs4 [last unloaded: snd_hda_intel] <4>[ 403.719739] CPU: 4 UID: 0 PID: 7193 Comm: xe_fault_inject Tainted: G S U W N 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) Oops#2 Part13 <4>[ 403.719742] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN, [N]=TEST <4>[ 403.719743] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 403.719744] RIP: 0010:guc_ct_change_state+0x2d8/0x330 [xe] <4>[ 403.719804] Code: 51 48 c1 ea 25 44 6b ca 64 44 29 c9 51 48 c7 c1 a0 7e 18 a1 52 4c 8b 55 88 41 52 44 8b 4d 9c 4c 8b 45 90 48 8b 95 78 ff ff ff <67> 48 0f b9 3a 8b 8b 50 01 00 00 48 83 c4 60 85 c9 75 13 44 89 bb <4>[ 403.719806] RSP: 0018:ffffc9000a3774c8 EFLAGS: 00010002 <4>[ 403.719808] RAX: ffffffffa11fd5d1 RBX: ffff88812c6e8738 RCX: ffffffffa1187ea0 <4>[ 403.719809] RDX: ffff888103cca010 RSI: ffffffffa11fd5d1 RDI: ffffffffa1002f00 <4>[ 403.719810] RBP: ffffc9000a3775b0 R08: ffffffffa11fd621 R09: 0000000000000007 <4>[ 403.719811] R10: ffffffffa11fd6d2 R11: 0000000000000514 R12: ffff88812c6e87c8 <4>[ 403.719812] R13: 0000000000000001 R14: 0000000000000000 R15: 0000000000000001 <4>[ 403.719813] FS: 00007f9a987e4980(0000) GS:ffff8888dae9b000(0000) knlGS:0000000000000000 <4>[ 403.719814] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 403.719815] CR2: 00005d42c52e1b80 CR3: 00000001188fb001 CR4: 0000000000f72ef0 <4>[ 403.719816] PKRU: 55555554 <4>[ 403.719817] Call Trace: <4>[ 403.719818] <4>[ 403.719825] ? xe_guc_submit_enable+0xa8/0xf0 [xe] <4>[ 403.719889] xe_guc_ct_disable+0x17/0x80 [xe] <4>[ 403.719947] xe_guc_sanitize+0x2a/0x50 [xe] <4>[ 403.720004] xe_uc_load_hw+0x19a/0x2b0 [xe] <4>[ 403.720094] ? xe_migrate_init+0x277/0x2d0 [xe] <4>[ 403.720178] xe_gt_init+0x35d/0xab0 [xe] Oops#2 Part12 <4>[ 403.720247] ? _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 403.720252] ? __devm_add_action+0x70/0xa0 <4>[ 403.720256] ? xe_irq_install+0x11a/0x490 [xe] <4>[ 403.720332] xe_device_probe+0x32c/0xbe0 [xe] <4>[ 403.720400] ? __drm_dev_dbg+0x7d/0xb0 <4>[ 403.720405] ? __drmm_add_action_or_reset+0x1e/0x50 <4>[ 403.720411] xe_pci_probe+0x39b/0x620 [xe] <4>[ 403.720487] ? trace_hardirqs_on+0x22/0x100 <4>[ 403.720494] local_pci_probe+0x47/0xb0 <4>[ 403.720498] pci_call_probe+0x6c/0x360 <4>[ 403.720503] ? _raw_spin_unlock+0x22/0x50 <4>[ 403.720507] pci_device_probe+0xae/0x110 <4>[ 403.720511] really_probe+0xf1/0x410 <4>[ 403.720514] __driver_probe_device+0x8c/0x190 <4>[ 403.720517] device_driver_attach+0x57/0xd0 <4>[ 403.720520] bind_store+0x77/0xd0 <4>[ 403.720523] drv_attr_store+0x24/0x50 <4>[ 403.720526] sysfs_kf_write+0x4d/0x80 <4>[ 403.720530] kernfs_fop_write_iter+0x188/0x240 <4>[ 403.720534] vfs_write+0x283/0x540 <4>[ 403.720541] ksys_write+0x6f/0xf0 <4>[ 403.720544] __x64_sys_write+0x19/0x30 <4>[ 403.720546] x64_sys_call+0x259/0x26e0 <4>[ 403.720549] do_syscall_64+0xdd/0x1470 <4>[ 403.720552] ? putname+0x41/0x90 <4>[ 403.720557] ? __slab_free+0x129/0x2b0 <4>[ 403.720561] ? __pcs_replace_full_main+0x2ad/0x710 <4>[ 403.720564] ? putname+0x41/0x90 <4>[ 403.720566] ? kmem_cache_free+0x165/0x510 <4>[ 403.720570] ? putname+0x41/0x90 <4>[ 403.720572] ? do_sys_openat2+0x85/0xd0 <4>[ 403.720577] ? __x64_sys_openat+0x54/0xa0 <4>[ 403.720579] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 403.720583] ? do_syscall_64+0x22e/0x1470 <4>[ 403.720585] ? fput_close_sync+0x3d/0xa0 Oops#2 Part11 <4>[ 403.720587] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 403.720591] ? do_syscall_64+0x22e/0x1470 <4>[ 403.720593] ? fput_close_sync+0x3d/0xa0 <4>[ 403.720595] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 403.720599] ? do_syscall_64+0x22e/0x1470 <4>[ 403.720603] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 403.720606] ? do_syscall_64+0x22e/0x1470 <4>[ 403.720608] ? do_syscall_64+0x22e/0x1470 <4>[ 403.720610] ? exc_page_fault+0xbd/0x2c0 <4>[ 403.720614] entry_SYSCALL_64_after_hwframe+0x76/0x7e <4>[ 403.720615] RIP: 0033:0x7f9a9a91c5a4 <4>[ 403.720618] Code: c7 00 16 00 00 00 b8 ff ff ff ff c3 66 2e 0f 1f 84 00 00 00 00 00 f3 0f 1e fa 80 3d a5 ea 0e 00 00 74 13 b8 01 00 00 00 0f 05 <48> 3d 00 f0 ff ff 77 54 c3 0f 1f 00 55 48 89 e5 48 83 ec 20 48 89 <4>[ 403.720619] RSP: 002b:00007ffda02a08d8 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 403.720621] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 00007f9a9a91c5a4 <4>[ 403.720622] RDX: 000000000000000c RSI: 00007ffda02a0da0 RDI: 0000000000000007 <4>[ 403.720623] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 403.720624] R10: 0000000000000000 R11: 0000000000000202 R12: 00007ffda02a0da0 <4>[ 403.720625] R13: 0000000000000007 R14: 0000000000000006 R15: 00007ffda02a0a50 <4>[ 403.720632] <4>[ 403.720634] irq event stamp: 1667336 <4>[ 403.720635] hardirqs last enabled at (1667335): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 403.720637] hardirqs last disabled at (1667336): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 403.720639] softirqs last enabled at (1665856): [] __irq_exit_rcu+0x13f/0x160 Oops#2 Part10 <4>[ 403.720642] softirqs last disabled at (1665851): [] __irq_exit_rcu+0x13f/0x160 <4>[ 403.720644] ---[ end trace 0000000000000000 ]--- <7>[ 403.720646] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <4>[ 403.720731] ------------[ cut here ]------------ <3>[ 403.720739] xe 0000:03:00.0: probe with driver xe failed with error -12 <4>[ 403.720837] xe 0000:03:00.0: [drm] Tile0: GT0: Failed to invalidate GGTT (-ENODEV) <4>[ 403.720840] WARNING: drivers/gpu/drm/xe/xe_ggtt.c:576 at ggtt_invalidate_gt_tlb.part.0+0x76/0xb0 [xe], CPU#12: kworker/12:7/4000 <4>[ 403.720950] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic cmdlinepart coretemp mei_hdcp spi_nor eeepc_wmi mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid kvm irqbypass ghash_clmulni_intel aesni_intel rapl snd_intel_dspcfg snd_hda_codec snd_hda_core intel_cstate snd_hwdep snd_pcm video r8169 realtek snd_timer binfmt_misc i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 soundcore spi_intel i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry wmi acpi_pad intel_vsec pinctrl_alderlake acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part9 <4>[ 403.721058] autofs4 [last unloaded: snd_hda_intel] <4>[ 403.721063] CPU: 12 UID: 0 PID: 4000 Comm: kworker/12:7 Tainted: G S U W N 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) <4>[ 403.721067] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN, [N]=TEST <4>[ 403.721069] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 403.721071] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 403.721187] RIP: 0010:ggtt_invalidate_gt_tlb.part.0+0x81/0xb0 [xe] <4>[ 403.721288] Code: 48 8b 7f 08 4c 8b 77 50 4d 85 f6 75 03 4c 8b 37 e8 64 97 62 e1 48 89 c6 48 8d 3d ca c7 3d 00 4d 89 e1 45 89 e8 89 d9 4c 89 f2 <67> 48 0f b9 3a 5b 41 5c 41 5d 41 5e 5d 31 c0 31 d2 31 c9 31 f6 31 <4>[ 403.721290] RSP: 0018:ffffc9000bcffaf0 EFLAGS: 00010246 Oops#2 Part8 <4>[ 403.721293] RAX: ffffffffa11fd5d1 RBX: 0000000000000000 RCX: 0000000000000000 <4>[ 403.721295] RDX: ffff888103cca010 RSI: ffffffffa11fd5d1 RDI: ffffffffa1001fe0 <4>[ 403.721297] RBP: ffffc9000bcffb10 R08: 0000000000000000 R09: ffffffffffffffed <4>[ 403.721299] R10: 0000000000000000 R11: 0000000000000000 R12: ffffffffffffffed <4>[ 403.721301] R13: 0000000000000000 R14: ffff888103cca010 R15: 0000000000000000 <4>[ 403.721303] FS: 0000000000000000(0000) GS:ffff8888db29b000(0000) knlGS:0000000000000000 <4>[ 403.721305] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 403.721307] CR2: 00005d42c52e1b80 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 403.721309] PKRU: 55555554 <4>[ 403.721310] Call Trace: <4>[ 403.721312] <4>[ 403.721316] ggtt_node_remove+0x11a/0x140 [xe] <3>[ 403.721371] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <4>[ 403.721437] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 403.721539] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 403.721641] ? _raw_write_unlock+0x22/0x50 <4>[ 403.721647] ? drm_vma_offset_remove+0x65/0x80 <4>[ 403.721654] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 403.721752] ? lock_is_held_type+0xa3/0x130 <7>[ 403.721724] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <4>[ 403.721761] ttm_bo_release+0x70/0x310 [ttm] <4>[ 403.721770] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 403.721871] ? lock_release+0xd0/0x2b0 <4>[ 403.721878] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 403.721887] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 403.721982] drm_gem_object_free+0x1d/0x40 Oops#2 Part7 <4>[ 403.721986] xe_bo_put+0x12a/0x190 [xe] <4>[ 403.722122] xe_lrc_destroy+0x49/0x90 [xe] <4>[ 403.722241] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 403.722340] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 403.722441] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 403.722552] process_one_work+0x22e/0x740 <4>[ 403.722563] worker_thread+0x1e8/0x3d0 <4>[ 403.722567] ? __pfx_worker_thread+0x10/0x10 <4>[ 403.722570] kthread+0x10d/0x150 <4>[ 403.722574] ? __pfx_kthread+0x10/0x10 <4>[ 403.722579] ret_from_fork+0x3d4/0x480 <4>[ 403.722582] ? __pfx_kthread+0x10/0x10 <4>[ 403.722587] ret_from_fork_asm+0x1a/0x30 <4>[ 403.722600] <4>[ 403.722601] irq event stamp: 8421 <4>[ 403.722603] hardirqs last enabled at (8427): [] __up_console_sem+0x79/0xa0 <4>[ 403.722607] hardirqs last disabled at (8432): [] __up_console_sem+0x5e/0xa0 <4>[ 403.722610] softirqs last enabled at (8338): [] __irq_exit_rcu+0x13f/0x160 <4>[ 403.722613] softirqs last disabled at (8251): [] __irq_exit_rcu+0x13f/0x160 <4>[ 403.722616] ---[ end trace 0000000000000000 ]--- <7>[ 403.723043] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 403.799403] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 403.803554] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 405.979929] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=50 recv=0 <1>[ 405.981921] BUG: unable to handle page fault for address: ffffc9000838a188 Oops#2 Part6 <1>[ 405.981950] #PF: supervisor write access in kernel mode <1>[ 405.981968] #PF: error_code(0x0002) - not-present page <6>[ 405.981983] PGD 100000067 P4D 100000067 PUD 100abd067 PMD 0 <4>[ 405.982007] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 405.982027] CPU: 12 UID: 0 PID: 132 Comm: kworker/12:1 Tainted: G S U W N 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) <4>[ 405.982062] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN, [N]=TEST <4>[ 405.982076] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 405.982094] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 405.982617] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 405.983132] Code: 24 66 90 65 8b 05 1c 4c 2e e3 48 0f a3 05 c0 b2 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 405.983168] RSP: 0018:ffffc900005c37e0 EFLAGS: 00010086 <4>[ 405.983186] RAX: 0000000000000002 RBX: ffffc9000838a188 RCX: 0000000000000000 <4>[ 405.983203] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff8881341e0060 <4>[ 405.983219] RBP: ffffc900005c3858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 405.983235] R10: ffff8881803d8000 R11: 0000000000000001 R12: ffff8881341e0060 <4>[ 405.983250] R13: 000000000000a188 R14: ffff8881803d8000 R15: 0000000000010001 <4>[ 405.983266] FS: 0000000000000000(0000) GS:ffff8888db29b000(0000) knlGS:0000000000000000 <4>[ 405.983286] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 405.983300] CR2: ffffc9000838a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 Oops#2 Part5 <4>[ 405.983317] PKRU: 55555554 <4>[ 405.983326] Call Trace: <4>[ 405.983336] <4>[ 405.983356] xe_force_wake_get+0x2a5/0x940 [xe] <4>[ 405.983804] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 405.983834] ? mark_held_locks+0x46/0x90 <4>[ 405.983858] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 405.984339] ? trace_hardirqs_on+0x22/0x100 <4>[ 405.984362] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 405.984382] ? xe_tlb_inval_fence_prep+0xce/0x1e0 [xe] <4>[ 405.984909] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 405.985435] ? xelpg_ggtt_pte_flags+0x27/0x1a0 [xe] <4>[ 405.985847] ? find_held_lock+0x31/0x90 <4>[ 405.985863] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 405.986284] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 405.986698] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 405.986949] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 405.987049] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 405.987150] ? _raw_write_unlock+0x22/0x50 <4>[ 405.987154] ? drm_vma_offset_remove+0x65/0x80 <4>[ 405.987160] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 405.987256] ? lock_is_held_type+0xa3/0x130 <4>[ 405.987263] ttm_bo_release+0x70/0x310 [ttm] <4>[ 405.987277] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 405.987376] ? lock_release+0xd0/0x2b0 <4>[ 405.987381] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 405.987390] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 405.987484] drm_gem_object_free+0x1d/0x40 <4>[ 405.987489] xe_bo_put+0x12a/0x190 [xe] <4>[ 405.987585] xe_lrc_destroy+0x49/0x90 [xe] <4>[ 405.987698] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 405.987796] xe_exec_queue_fini+0x2b/0x60 [xe] Oops#2 Part4 <4>[ 405.987895] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 405.988004] process_one_work+0x22e/0x740 <4>[ 405.988010] worker_thread+0x1e8/0x3d0 <4>[ 405.988013] ? __pfx_worker_thread+0x10/0x10 <4>[ 405.988017] kthread+0x10d/0x150 <4>[ 405.988022] ? __pfx_kthread+0x10/0x10 <4>[ 405.988026] ret_from_fork+0x3d4/0x480 <4>[ 405.988030] ? __pfx_kthread+0x10/0x10 <4>[ 405.988034] ret_from_fork_asm+0x1a/0x30 <4>[ 405.988041] <4>[ 405.988043] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic cmdlinepart coretemp mei_hdcp spi_nor eeepc_wmi mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid kvm irqbypass ghash_clmulni_intel aesni_intel rapl snd_intel_dspcfg snd_hda_codec snd_hda_core intel_cstate snd_hwdep snd_pcm video r8169 realtek snd_timer binfmt_misc i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 soundcore spi_intel i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry wmi acpi_pad intel_vsec pinctrl_alderlake acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 405.988086] autofs4 [last unloaded: snd_hda_intel] <4>[ 405.988121] CR2: ffffc9000838a188 <4>[ 405.988124] ---[ end trace 0000000000000000 ]--- Oops#2 Part3 <4>[ 406.140273] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 406.140402] Code: 24 66 90 65 8b 05 1c 4c 2e e3 48 0f a3 05 c0 b2 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 406.140411] RSP: 0018:ffffc900005c37e0 EFLAGS: 00010086 <4>[ 406.140415] RAX: 0000000000000002 RBX: ffffc9000838a188 RCX: 0000000000000000 <4>[ 406.140418] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff8881341e0060 <4>[ 406.140422] RBP: ffffc900005c3858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 406.140426] R10: ffff8881803d8000 R11: 0000000000000001 R12: ffff8881341e0060 <4>[ 406.140429] R13: 000000000000a188 R14: ffff8881803d8000 R15: 0000000000010001 <4>[ 406.140433] FS: 0000000000000000(0000) GS:ffff8888db29b000(0000) knlGS:0000000000000000 <4>[ 406.140438] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 406.140441] CR2: ffffc9000838a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 406.140445] PKRU: 55555554 <6>[ 406.140447] note: kworker/12:1[132] exited with irqs disabled <6>[ 406.140462] note: kworker/12:1[132] exited with preempt_count 1 <6>[ 406.246053] pcieport 0000:00:06.0: AER: Multiple Correctable error message received from 0000:05:00.0 <4>[ 406.246095] nvme 0000:05:00.0: PCIe Bus Error: severity=Correctable, type=Physical Layer, (Receiver ID) <4>[ 406.246114] nvme 0000:05:00.0: device [15b7:5017] error status/mask=00000001/0000e000 <4>[ 406.246132] nvme 0000:05:00.0: [ 0] RxErr (First) <1>[ 408.282535] BUG: unable to handle page fault for address: ffffc900005c3a90 Oops#2 Part2 <1>[ 408.282566] #PF: supervisor read access in kernel mode <1>[ 408.282579] #PF: error_code(0x0000) - not-present page <6>[ 408.282591] PGD 100000067 P4D 100000067 PUD 100abd067 PMD 101722067 PTE 0 <4>[ 408.282613] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 408.282630] CPU: 10 UID: 0 PID: 5659 Comm: kworker/u64:86 Tainted: G S UD W N 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) <4>[ 408.282658] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN, [N]=TEST <4>[ 408.282672] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 408.282687] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 408.283214] RIP: 0010:xe_tlb_inval_fence_timeout+0x65/0x220 [xe] <4>[ 408.283703] Code: 89 df 48 89 45 d0 49 8b 85 08 ff ff ff 48 8b 40 20 2e 2e 2e ff d0 49 8d 45 c0 48 89 c7 48 89 45 b8 e8 cf c1 c7 e1 49 8b 45 b0 <48> 8b 30 4c 8d 78 80 48 8d 5e 80 49 8d 75 b0 48 89 75 c8 48 39 c6 <4>[ 408.283738] RSP: 0018:ffffc9000739fdb0 EFLAGS: 00010046 <4>[ 408.283755] RAX: ffffc900005c3a90 RBX: ffff8881341e0458 RCX: 0000000000000000 <4>[ 408.283771] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000000 <4>[ 408.283787] RBP: ffffc9000739fdf8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 408.283802] R10: 0000000000000000 R11: 0000000000000000 R12: ffff8881803d8000 <4>[ 408.283817] R13: ffff8881341e0560 R14: ffff8881341e0560 R15: ffff8881f1a95cc0 <4>[ 408.283833] FS: 0000000000000000(0000) GS:ffff8888db19b000(0000) knlGS:0000000000000000 <4>[ 408.283852] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 408.283866] CR2: ffffc900005c3a90 CR3: 000000000344c002 CR4: 0000000000f72ef0 Oops#2 Part1 <4>[ 408.283883] PKRU: 55555554 <4>[ 408.283892] Call Trace: <4>[ 408.283901] <4>[ 408.283917] process_one_work+0x22e/0x740 <4>[ 408.283945] worker_thread+0x1e8/0x3d0 <4>[ 408.283960] ? __pfx_worker_thread+0x10/0x10 <4>[ 408.283976] kthread+0x10d/0x150 <4>[ 408.283993] ? __pfx_kthread+0x10/0x10 <4>[ 408.284012] ret_from_fork+0x3d4/0x480 <4>[ 408.284027] ? __pfx_kthread+0x10/0x10 <4>[ 408.284044] ret_from_fork_asm+0x1a/0x30 <4>[ 408.284071] <4>[ 408.284079] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic cmdlinepart coretemp mei_hdcp spi_nor eeepc_wmi mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid kvm irqbypass ghash_clmulni_intel aesni_intel rapl snd_intel_dspcfg snd_hda_codec snd_hda_core intel_cstate snd_hwdep snd_pcm video r8169 realtek snd_timer binfmt_misc i2c_i801 snd spi_intel_pci mei_me i2c_mux idma64 soundcore spi_intel i2c_smbus mei intel_pmc_core pmt_telemetry pmt_discovery nls_iso8859_1 pmt_class intel_pmc_ssram_telemetry wmi acpi_pad intel_vsec pinctrl_alderlake acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 408.284266] autofs4 [last unloaded: snd_hda_intel] <4>[ 408.284415] CR2: ffffc900005c3a90 <4>[ 408.284429] ---[ end trace 0000000000000000 ]---