Oops#2 Part10 <4>[ 213.534875] RSP: 002b:00007fffd6b50568 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 213.534878] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 0000756ef251c5a4 <4>[ 213.534880] RDX: 000000000000000c RSI: 00007fffd6b50a30 RDI: 0000000000000007 <4>[ 213.534882] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 213.534884] R10: 0000000000000000 R11: 0000000000000202 R12: 00007fffd6b50a30 <4>[ 213.534886] R13: 0000000000000007 R14: 0000000000000006 R15: 00007fffd6b506e0 <4>[ 213.534899] <4>[ 213.534900] irq event stamp: 1564554 <4>[ 213.534902] hardirqs last enabled at (1564553): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 213.534906] hardirqs last disabled at (1564554): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 213.534909] softirqs last enabled at (1564548): [] __irq_exit_rcu+0x13f/0x160 <4>[ 213.534913] softirqs last disabled at (1564535): [] __irq_exit_rcu+0x13f/0x160 <4>[ 213.534916] ---[ end trace 0000000000000000 ]--- <7>[ 213.534919] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <4>[ 213.535055] ------------[ cut here ]------------ <4>[ 213.535066] xe 0000:03:00.0: [drm] Tile0: GT0: Failed to invalidate GGTT (-ENODEV) <4>[ 213.535069] WARNING: drivers/gpu/drm/xe/xe_ggtt.c:576 at ggtt_invalidate_gt_tlb.part.0+0x76/0xb0 [xe], CPU#12: kworker/12:8/4575 <4>[ 213.535186] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper Oops#2 Part9 <3>[ 213.535211] xe 0000:03:00.0: probe with driver xe failed with error -12 <4>[ 213.535212] drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp coretemp cmdlinepart hid_generic spi_nor asus_nb_wmi mei_hdcp mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel kvm irqbypass usbhid ghash_clmulni_intel aesni_intel hid binfmt_misc rapl video intel_cstate r8169 snd_intel_dspcfg snd_hda_codec snd_hda_core realtek snd_hwdep snd_pcm i2c_i801 snd_timer mei_me i2c_mux snd idma64 spi_intel_pci soundcore i2c_smbus spi_intel mei intel_pmc_core nls_iso8859_1 pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry acpi_pad acpi_tad pinctrl_alderlake wmi intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink autofs4 [last unloaded: snd_hda_intel] <4>[ 213.535393] CPU: 12 UID: 0 PID: 4575 Comm: kworker/12:8 Tainted: G S U W 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) <4>[ 213.535397] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 213.535399] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 213.535401] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 213.535517] RIP: 0010:ggtt_invalidate_gt_tlb.part.0+0x81/0xb0 [xe] <4>[ 213.535618] Code: 48 8b 7f 08 4c 8b 77 50 4d 85 f6 75 03 4c 8b 37 e8 64 97 62 e1 48 89 c6 48 8d 3d ca c7 3d 00 4d 89 e1 45 89 e8 89 d9 4c 89 f2 <67> 48 0f b9 3a 5b 41 5c 41 5d 41 5e 5d 31 c0 31 d2 31 c9 31 f6 31 Oops#2 Part8 <4>[ 213.535621] RSP: 0018:ffffc9000badfaf0 EFLAGS: 00010246 <4>[ 213.535624] RAX: ffffffffa11fd5d1 RBX: 0000000000000000 RCX: 0000000000000000 <4>[ 213.535626] RDX: ffff888103bfc210 RSI: ffffffffa11fd5d1 RDI: ffffffffa1001fe0 <4>[ 213.535628] RBP: ffffc9000badfb10 R08: 0000000000000000 R09: ffffffffffffffed <4>[ 213.535629] R10: 0000000000000000 R11: 0000000000000000 R12: ffffffffffffffed <4>[ 213.535631] R13: 0000000000000000 R14: ffff888103bfc210 R15: 0000000000000000 <4>[ 213.535633] FS: 0000000000000000(0000) GS:ffff8888db29b000(0000) knlGS:0000000000000000 <4>[ 213.535635] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 213.535637] CR2: 0000618d5f017e70 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 213.535639] PKRU: 55555554 <4>[ 213.535641] Call Trace: <4>[ 213.535642] <4>[ 213.535647] ggtt_node_remove+0x11a/0x140 [xe] <4>[ 213.535750] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 213.535850] xe_ggtt_remove_bo+0x87/0x250 [xe] <3>[ 213.535948] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <4>[ 213.535952] ? _raw_write_unlock+0x22/0x50 <4>[ 213.535968] ? drm_vma_offset_remove+0x65/0x80 <4>[ 213.535976] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 213.536071] ? lock_is_held_type+0xa3/0x130 <4>[ 213.536080] ttm_bo_release+0x70/0x310 [ttm] <4>[ 213.536090] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 213.536189] ? lock_release+0xd0/0x2b0 <4>[ 213.536196] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 213.536205] xe_gem_object_free+0x1a/0x30 [xe] Oops#2 Part7 <4>[ 213.536299] drm_gem_object_free+0x1d/0x40 <4>[ 213.536303] xe_bo_put+0x12a/0x190 [xe] <7>[ 213.536343] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <4>[ 213.536407] xe_lrc_destroy+0x74/0x90 [xe] <4>[ 213.536524] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 213.536623] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 213.536722] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 213.536832] process_one_work+0x22e/0x740 <4>[ 213.536843] worker_thread+0x1e8/0x3d0 <4>[ 213.536847] ? __pfx_worker_thread+0x10/0x10 <4>[ 213.536850] kthread+0x10d/0x150 <4>[ 213.536854] ? __pfx_kthread+0x10/0x10 <4>[ 213.536859] ret_from_fork+0x3d4/0x480 <4>[ 213.536862] ? __pfx_kthread+0x10/0x10 <4>[ 213.536867] ret_from_fork_asm+0x1a/0x30 <4>[ 213.536880] <4>[ 213.536881] irq event stamp: 149581 <4>[ 213.536883] hardirqs last enabled at (149587): [] __up_console_sem+0x79/0xa0 <4>[ 213.536887] hardirqs last disabled at (149592): [] __up_console_sem+0x5e/0xa0 <4>[ 213.536890] softirqs last enabled at (149024): [] __irq_exit_rcu+0x13f/0x160 <4>[ 213.536893] softirqs last disabled at (149019): [] __irq_exit_rcu+0x13f/0x160 <4>[ 213.536896] ---[ end trace 0000000000000000 ]--- <7>[ 213.538189] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 213.614878] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 213.617474] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. Oops#2 Part6 <3>[ 215.802727] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=51 recv=50 <1>[ 215.803732] BUG: unable to handle page fault for address: ffffc9000838a188 <1>[ 215.803763] #PF: supervisor write access in kernel mode <1>[ 215.803779] #PF: error_code(0x0002) - not-present page <6>[ 215.803793] PGD 100000067 P4D 100000067 PUD 100aca067 PMD 0 <4>[ 215.803816] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 215.803836] CPU: 12 UID: 0 PID: 2847 Comm: kworker/12:3 Tainted: G S U W 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) <4>[ 215.803871] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 215.803885] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 215.803906] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 215.804398] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 215.804888] Code: 24 66 90 65 8b 05 1c 4c 2e e3 48 0f a3 05 c0 b2 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 215.804924] RSP: 0018:ffffc90004e0b7e0 EFLAGS: 00010086 <4>[ 215.804941] RAX: 0000000000000002 RBX: ffffc9000838a188 RCX: 0000000000000000 <4>[ 215.804959] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88812e460060 <4>[ 215.804977] RBP: ffffc90004e0b858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 215.804993] R10: ffff888168fb0000 R11: 0000000000000001 R12: ffff88812e460060 <4>[ 215.805010] R13: 000000000000a188 R14: ffff888168fb0000 R15: 0000000000010001 <4>[ 215.805027] FS: 0000000000000000(0000) GS:ffff8888db29b000(0000) knlGS:0000000000000000 Oops#2 Part5 <4>[ 215.805047] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 215.805063] CR2: ffffc9000838a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 215.805081] PKRU: 55555554 <4>[ 215.805091] Call Trace: <4>[ 215.805101] <4>[ 215.805121] xe_force_wake_get+0x2a5/0x940 [xe] <4>[ 215.805541] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 215.805569] ? mark_held_locks+0x46/0x90 <4>[ 215.805592] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 215.806051] ? trace_hardirqs_on+0x22/0x100 <4>[ 215.806073] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 215.806091] ? xe_tlb_inval_fence_prep+0xce/0x1e0 [xe] <4>[ 215.806616] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 215.807132] ? xelpg_ggtt_pte_flags+0x27/0x1a0 [xe] <4>[ 215.807545] ? find_held_lock+0x31/0x90 <4>[ 215.807561] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 215.807983] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 215.808398] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 215.808788] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 215.808888] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 215.808989] ? _raw_write_unlock+0x22/0x50 <4>[ 215.808993] ? drm_vma_offset_remove+0x65/0x80 <4>[ 215.809000] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 215.809096] ? lock_is_held_type+0xa3/0x130 <4>[ 215.809102] ttm_bo_release+0x70/0x310 [ttm] <4>[ 215.809112] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 215.809212] ? lock_release+0xd0/0x2b0 <4>[ 215.809217] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 215.809225] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 215.809320] drm_gem_object_free+0x1d/0x40 <4>[ 215.809325] xe_bo_put+0x12a/0x190 [xe] Oops#2 Part4 <4>[ 215.809421] xe_lrc_destroy+0x49/0x90 [xe] <4>[ 215.809535] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 215.809634] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 215.809733] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 215.809843] process_one_work+0x22e/0x740 <4>[ 215.809849] worker_thread+0x1e8/0x3d0 <4>[ 215.809852] ? __pfx_worker_thread+0x10/0x10 <4>[ 215.809856] kthread+0x10d/0x150 <4>[ 215.809860] ? __pfx_kthread+0x10/0x10 <4>[ 215.809865] ret_from_fork+0x3d4/0x480 <4>[ 215.809869] ? __pfx_kthread+0x10/0x10 <4>[ 215.809873] ret_from_fork_asm+0x1a/0x30 <4>[ 215.809879] <4>[ 215.809881] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp coretemp cmdlinepart hid_generic spi_nor asus_nb_wmi mei_hdcp mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel kvm irqbypass usbhid ghash_clmulni_intel aesni_intel hid binfmt_misc rapl video intel_cstate r8169 snd_intel_dspcfg snd_hda_codec snd_hda_core realtek snd_hwdep snd_pcm i2c_i801 snd_timer mei_me i2c_mux snd idma64 spi_intel_pci soundcore i2c_smbus spi_intel mei intel_pmc_core nls_iso8859_1 pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry acpi_pad acpi_tad pinctrl_alderlake wmi intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part3 <4>[ 215.809924] autofs4 [last unloaded: snd_hda_intel] <4>[ 215.809959] CR2: ffffc9000838a188 <4>[ 215.809963] ---[ end trace 0000000000000000 ]--- <4>[ 215.969272] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 215.969398] Code: 24 66 90 65 8b 05 1c 4c 2e e3 48 0f a3 05 c0 b2 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 215.969407] RSP: 0018:ffffc90004e0b7e0 EFLAGS: 00010086 <4>[ 215.969411] RAX: 0000000000000002 RBX: ffffc9000838a188 RCX: 0000000000000000 <4>[ 215.969415] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88812e460060 <4>[ 215.969419] RBP: ffffc90004e0b858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 215.969422] R10: ffff888168fb0000 R11: 0000000000000001 R12: ffff88812e460060 <4>[ 215.969426] R13: 000000000000a188 R14: ffff888168fb0000 R15: 0000000000010001 <4>[ 215.969430] FS: 0000000000000000(0000) GS:ffff8888db29b000(0000) knlGS:0000000000000000 <4>[ 215.969435] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 215.969438] CR2: ffffc9000838a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 215.969442] PKRU: 55555554 <6>[ 215.969444] note: kworker/12:3[2847] exited with irqs disabled <6>[ 215.969467] note: kworker/12:3[2847] exited with preempt_count 1 <1>[ 218.105608] BUG: unable to handle page fault for address: ffffc90004e0ba90 Oops#2 Part2 <1>[ 218.105639] #PF: supervisor read access in kernel mode <1>[ 218.105653] #PF: error_code(0x0000) - not-present page <6>[ 218.105664] PGD 100000067 P4D 100000067 PUD 100aca067 PMD 1297bd067 PTE 0 <4>[ 218.105688] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 218.105704] CPU: 10 UID: 0 PID: 8954 Comm: kworker/u64:519 Tainted: G S UD W 7.0.0-rc3-lgci-xe-xe-4686-77e176657e782bb81-debug+ #1 PREEMPT(lazy) <4>[ 218.105732] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 218.105743] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 218.105758] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 218.106283] RIP: 0010:xe_tlb_inval_fence_timeout+0x65/0x220 [xe] <4>[ 218.106769] Code: 89 df 48 89 45 d0 49 8b 85 08 ff ff ff 48 8b 40 20 2e 2e 2e ff d0 49 8d 45 c0 48 89 c7 48 89 45 b8 e8 cf c1 c7 e1 49 8b 45 b0 <48> 8b 30 4c 8d 78 80 48 8d 5e 80 49 8d 75 b0 48 89 75 c8 48 39 c6 <4>[ 218.106803] RSP: 0018:ffffc90023b97db0 EFLAGS: 00010046 <4>[ 218.106820] RAX: ffffc90004e0ba90 RBX: ffff88812e460458 RCX: 0000000000000000 <4>[ 218.106836] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000000 <4>[ 218.106851] RBP: ffffc90023b97df8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 218.106866] R10: 0000000000000000 R11: 0000000000000000 R12: ffff888168fb0000 <4>[ 218.106882] R13: ffff88812e460560 R14: ffff88812e460560 R15: ffff8881e5402140 <4>[ 218.106898] FS: 0000000000000000(0000) GS:ffff8888db19b000(0000) knlGS:0000000000000000 <4>[ 218.106917] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 218.106932] CR2: ffffc90004e0ba90 CR3: 000000000344c003 CR4: 0000000000f72ef0 Oops#2 Part1 <4>[ 218.106948] PKRU: 55555554 <4>[ 218.106957] Call Trace: <4>[ 218.106967] <4>[ 218.106982] process_one_work+0x22e/0x740 <4>[ 218.107010] worker_thread+0x1e8/0x3d0 <4>[ 218.107025] ? __pfx_worker_thread+0x10/0x10 <4>[ 218.107041] kthread+0x10d/0x150 <4>[ 218.107059] ? __pfx_kthread+0x10/0x10 <4>[ 218.107078] ret_from_fork+0x3d4/0x480 <4>[ 218.107092] ? __pfx_kthread+0x10/0x10 <4>[ 218.107109] ret_from_fork_asm+0x1a/0x30 <4>[ 218.107136] <4>[ 218.107144] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp coretemp cmdlinepart hid_generic spi_nor asus_nb_wmi mei_hdcp mei_pxp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel kvm irqbypass usbhid ghash_clmulni_intel aesni_intel hid binfmt_misc rapl video intel_cstate r8169 snd_intel_dspcfg snd_hda_codec snd_hda_core realtek snd_hwdep snd_pcm i2c_i801 snd_timer mei_me i2c_mux snd idma64 spi_intel_pci soundcore i2c_smbus spi_intel mei intel_pmc_core nls_iso8859_1 pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry acpi_pad acpi_tad pinctrl_alderlake wmi intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 218.107331] autofs4 [last unloaded: snd_hda_intel] <4>[ 218.107480] CR2: ffffc90004e0ba90 <4>[ 218.107493] ---[ end trace 0000000000000000 ]---