Oops#2 Part12 <4>[ 159.138629] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 159.138630] CR2: 00005dddaf91d7b8 CR3: 00000001c42dd005 CR4: 0000000000f72ef0 <4>[ 159.138631] PKRU: 55555554 <4>[ 159.138632] Call Trace: <4>[ 159.138633] <4>[ 159.138640] ? xe_guc_submit_enable+0xa8/0xf0 [xe] <4>[ 159.138719] xe_guc_ct_disable+0x17/0x80 [xe] <4>[ 159.138797] xe_guc_sanitize+0x2a/0x50 [xe] <4>[ 159.138874] xe_uc_load_hw+0x19a/0x2b0 [xe] <4>[ 159.138975] ? xe_migrate_init+0x277/0x2d0 [xe] <4>[ 159.139063] xe_gt_init+0x35d/0xab0 [xe] <4>[ 159.139139] ? _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 159.139144] ? __devm_add_action+0x70/0xa0 <4>[ 159.139148] ? xe_irq_install+0x11a/0x490 [xe] <4>[ 159.139234] xe_device_probe+0x32c/0xbe0 [xe] <4>[ 159.139309] ? __drm_dev_dbg+0x7d/0xb0 <4>[ 159.139314] ? __drmm_add_action_or_reset+0x1e/0x50 <4>[ 159.139320] xe_pci_probe+0x39b/0x620 [xe] <4>[ 159.139407] ? trace_hardirqs_on+0x22/0x100 <4>[ 159.139415] local_pci_probe+0x47/0xb0 <4>[ 159.139420] pci_call_probe+0x6c/0x360 <4>[ 159.139425] ? _raw_spin_unlock+0x22/0x50 <4>[ 159.139430] pci_device_probe+0xae/0x110 <4>[ 159.139434] really_probe+0xf1/0x410 <4>[ 159.139437] __driver_probe_device+0x8c/0x190 <4>[ 159.139440] device_driver_attach+0x57/0xd0 <4>[ 159.139444] bind_store+0x142/0x150 <4>[ 159.139448] drv_attr_store+0x24/0x50 <4>[ 159.139451] sysfs_kf_write+0x4d/0x80 <4>[ 159.139455] kernfs_fop_write_iter+0x188/0x240 <4>[ 159.139459] vfs_write+0x283/0x540 <4>[ 159.139467] ksys_write+0x6f/0xf0 <4>[ 159.139471] __x64_sys_write+0x19/0x30 <4>[ 159.139473] x64_sys_call+0x259/0x26e0 Oops#2 Part11 <4>[ 159.139476] do_syscall_64+0xdd/0x1470 <4>[ 159.139481] ? putname+0x41/0x90 <4>[ 159.139483] ? do_sys_openat2+0x85/0xd0 <4>[ 159.139488] ? __x64_sys_openat+0x54/0xa0 <4>[ 159.139491] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 159.139495] ? do_syscall_64+0x22e/0x1470 <4>[ 159.139498] ? fput_close_sync+0x3d/0xa0 <4>[ 159.139500] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 159.139504] ? do_syscall_64+0x22e/0x1470 <4>[ 159.139506] ? fput_close_sync+0x3d/0xa0 <4>[ 159.139508] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 159.139512] ? do_syscall_64+0x22e/0x1470 <4>[ 159.139515] ? putname+0x41/0x90 <4>[ 159.139517] ? kmem_cache_free+0x165/0x510 <4>[ 159.139522] ? putname+0x41/0x90 <4>[ 159.139524] ? do_sys_openat2+0x85/0xd0 <4>[ 159.139529] ? __x64_sys_openat+0x54/0xa0 <4>[ 159.139531] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 159.139535] ? do_syscall_64+0x22e/0x1470 <4>[ 159.139537] ? trace_hardirqs_on_prepare+0xe1/0x100 <4>[ 159.139540] ? do_syscall_64+0x22e/0x1470 <4>[ 159.139542] ? exc_page_fault+0xbd/0x2c0 <4>[ 159.139546] entry_SYSCALL_64_after_hwframe+0x76/0x7e <4>[ 159.139548] RIP: 0033:0x75f65db1c5a4 <4>[ 159.139551] Code: c7 00 16 00 00 00 b8 ff ff ff ff c3 66 2e 0f 1f 84 00 00 00 00 00 f3 0f 1e fa 80 3d a5 ea 0e 00 00 74 13 b8 01 00 00 00 0f 05 <48> 3d 00 f0 ff ff 77 54 c3 0f 1f 00 55 48 89 e5 48 83 ec 20 48 89 <4>[ 159.139553] RSP: 002b:00007ffc150df2f8 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 159.139555] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 000075f65db1c5a4 <4>[ 159.139556] RDX: 000000000000000c RSI: 00007ffc150df7c0 RDI: 0000000000000007 Oops#2 Part10 <4>[ 159.139557] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 159.139558] R10: 0000000000000000 R11: 0000000000000202 R12: 00007ffc150df7c0 <4>[ 159.139559] R13: 0000000000000007 R14: 0000000000000006 R15: 00007ffc150df470 <4>[ 159.139567] <4>[ 159.139568] irq event stamp: 1169428 <4>[ 159.139569] hardirqs last enabled at (1169427): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 159.139572] hardirqs last disabled at (1169428): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 159.139575] softirqs last enabled at (1169324): [] __irq_exit_rcu+0x13f/0x160 <4>[ 159.139577] softirqs last disabled at (1169319): [] __irq_exit_rcu+0x13f/0x160 <4>[ 159.139579] ---[ end trace 0000000000000000 ]--- <7>[ 159.139582] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 159.139686] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 159.140273] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 159.140637] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 159.141965] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 159.225014] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 159.226173] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 161.426132] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=51 recv=50 Oops#2 Part9 <3>[ 161.427050] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=52 recv=50 <1>[ 161.427192] BUG: unable to handle page fault for address: ffffc9000c38a188 <1>[ 161.427226] #PF: supervisor write access in kernel mode <1>[ 161.427240] #PF: error_code(0x0002) - not-present page <6>[ 161.427252] PGD 100000067 P4D 100000067 PUD 100abb067 PMD 0 <4>[ 161.427272] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 161.427288] CPU: 10 UID: 0 PID: 50 Comm: kworker/10:0 Tainted: G S U W 7.0.0-rc2-lgci-xe-xe-4655-cfc20c776480fda8c-debug+ #1 PREEMPT(lazy) <4>[ 161.427316] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 161.427328] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 161.427343] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 161.427821] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 161.428302] Code: 24 66 90 65 8b 05 0c 7e 2e e3 48 0f a3 05 b0 e3 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 161.428338] RSP: 0018:ffffc900002ff7e0 EFLAGS: 00010086 <4>[ 161.428355] RAX: 0000000000000002 RBX: ffffc9000c38a188 RCX: 0000000000000000 <4>[ 161.428372] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88811bd20060 <4>[ 161.428390] RBP: ffffc900002ff858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 161.428406] R10: ffff88816eb70000 R11: 0000000000000001 R12: ffff88811bd20060 <4>[ 161.428422] R13: 000000000000a188 R14: ffff88816eb70000 R15: 0000000000010001 <4>[ 161.428439] FS: 0000000000000000(0000) GS:ffff8888db199000(0000) knlGS:0000000000000000 Oops#2 Part8 <4>[ 161.428459] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 161.428475] CR2: ffffc9000c38a188 CR3: 000000000344c005 CR4: 0000000000f72ef0 <4>[ 161.428492] PKRU: 55555554 <4>[ 161.428502] Call Trace: <4>[ 161.428513] <4>[ 161.428531] xe_force_wake_get+0x2a5/0x940 [xe] <4>[ 161.428940] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 161.428969] ? mark_held_locks+0x46/0x90 <4>[ 161.428992] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 161.429430] ? trace_hardirqs_on+0x22/0x100 <4>[ 161.429451] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 161.429470] ? xe_tlb_inval_fence_prep+0xce/0x1e0 [xe] <4>[ 161.429973] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 161.430473] ? xelpg_ggtt_pte_flags+0x27/0x1a0 [xe] <4>[ 161.430872] ? find_held_lock+0x31/0x90 <4>[ 161.430888] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 161.431294] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 161.431690] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 161.432083] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 161.432477] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 161.432720] ? _raw_write_unlock+0x22/0x50 <4>[ 161.432724] ? drm_vma_offset_remove+0x65/0x80 <4>[ 161.432729] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 161.432806] ? lock_is_held_type+0xa3/0x130 <4>[ 161.432811] ttm_bo_release+0x70/0x330 [ttm] <4>[ 161.432818] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 161.432886] ? lock_release+0xd0/0x2b0 <4>[ 161.432890] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 161.432896] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 161.432963] drm_gem_object_free+0x1d/0x40 <4>[ 161.432966] xe_bo_put+0x12a/0x190 [xe] Oops#2 Part7 <4>[ 161.433034] xe_lrc_destroy+0x49/0x90 [xe] <4>[ 161.433113] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 161.433180] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 161.433248] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 161.433323] process_one_work+0x22e/0x740 <4>[ 161.433327] worker_thread+0x1e8/0x3d0 <4>[ 161.433330] ? __pfx_worker_thread+0x10/0x10 <4>[ 161.433332] kthread+0x10d/0x150 <4>[ 161.433336] ? __pfx_kthread+0x10/0x10 <4>[ 161.433339] ret_from_fork+0x3d4/0x480 <4>[ 161.433342] ? __pfx_kthread+0x10/0x10 <4>[ 161.433345] ret_from_fork_asm+0x1a/0x30 <4>[ 161.433350] <4>[ 161.433351] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit overlay intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal cmdlinepart hid_generic intel_powerclamp eeepc_wmi spi_nor asus_wmi mtd coretemp sparse_keymap mei_hdcp mei_pxp platform_profile wmi_bmof kvm_intel binfmt_misc kvm irqbypass ghash_clmulni_intel snd_intel_dspcfg aesni_intel snd_hda_codec r8169 rapl snd_hda_core usbhid snd_hwdep intel_cstate hid snd_pcm realtek snd_timer idma64 i2c_i801 snd i2c_mux nls_iso8859_1 spi_intel_pci i2c_smbus spi_intel soundcore video intel_pmc_core pmt_telemetry pmt_discovery mei_me pmt_class mei intel_pmc_ssram_telemetry wmi intel_vsec acpi_pad pinctrl_alderlake acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore Oops#2 Part6 <4>[ 161.433387] nfnetlink autofs4 [last unloaded: snd_hda_intel] <4>[ 161.433414] CR2: ffffc9000c38a188 <4>[ 161.433416] ---[ end trace 0000000000000000 ]--- <4>[ 161.574603] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 161.574702] Code: 24 66 90 65 8b 05 0c 7e 2e e3 48 0f a3 05 b0 e3 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 161.574708] RSP: 0018:ffffc900002ff7e0 EFLAGS: 00010086 <4>[ 161.574711] RAX: 0000000000000002 RBX: ffffc9000c38a188 RCX: 0000000000000000 <4>[ 161.574714] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88811bd20060 <4>[ 161.574717] RBP: ffffc900002ff858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 161.574720] R10: ffff88816eb70000 R11: 0000000000000001 R12: ffff88811bd20060 <4>[ 161.574722] R13: 000000000000a188 R14: ffff88816eb70000 R15: 0000000000010001 <4>[ 161.574725] FS: 0000000000000000(0000) GS:ffff8888db199000(0000) knlGS:0000000000000000 <4>[ 161.574728] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 161.574731] CR2: ffffc9000c38a188 CR3: 000000000344c005 CR4: 0000000000f72ef0 Oops#2 Part5 <4>[ 161.574734] PKRU: 55555554 <6>[ 161.574735] note: kworker/10:0[50] exited with irqs disabled <6>[ 161.574746] note: kworker/10:0[50] exited with preempt_count 1 <3>[ 163.728772] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=3144512 recv=0 <4>[ 163.728811] non-slab/vmalloc memory <4>[ 163.728826] ------------[ cut here ]------------ <4>[ 163.728836] list_del corruption. prev->next should be ffffc900002ffa90, but was 003d48d44db60f44. (prev=ffffffff813917fe) <4>[ 163.728855] WARNING: lib/list_debug.c:62 at __list_del_entry_valid_or_report+0xd9/0x120, CPU#6: kworker/u64:2/121 <4>[ 163.728887] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit overlay intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal cmdlinepart hid_generic intel_powerclamp eeepc_wmi spi_nor asus_wmi mtd coretemp sparse_keymap mei_hdcp mei_pxp platform_profile wmi_bmof kvm_intel binfmt_misc kvm irqbypass ghash_clmulni_intel snd_intel_dspcfg aesni_intel snd_hda_codec r8169 rapl snd_hda_core usbhid snd_hwdep intel_cstate hid snd_pcm realtek snd_timer idma64 i2c_i801 snd i2c_mux nls_iso8859_1 spi_intel_pci i2c_smbus spi_intel soundcore video intel_pmc_core pmt_telemetry pmt_discovery mei_me pmt_class mei intel_pmc_ssram_telemetry wmi intel_vsec acpi_pad pinctrl_alderlake acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore Oops#2 Part4 <4>[ 163.729047] nfnetlink autofs4 [last unloaded: snd_hda_intel] <4>[ 163.729161] CPU: 6 UID: 0 PID: 121 Comm: kworker/u64:2 Tainted: G S UD W 7.0.0-rc2-lgci-xe-xe-4655-cfc20c776480fda8c-debug+ #1 PREEMPT(lazy) <4>[ 163.729190] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 163.729201] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 163.729216] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 163.729770] RIP: 0010:__list_del_entry_valid_or_report+0xe3/0x120 <4>[ 163.729792] Code: b5 01 4c 89 ea 48 89 de 67 48 0f b9 3a 31 c0 eb 8b 4c 89 ef e8 be e3 8e ff 48 8d 3d 17 4c b5 01 49 8b 55 00 4c 89 e9 48 89 de <67> 48 0f b9 3a 31 c0 e9 66 ff ff ff 4c 89 e7 e8 99 e3 8e ff 48 8d <4>[ 163.729826] RSP: 0018:ffffc90000563d58 EFLAGS: 00010046 <4>[ 163.729842] RAX: 0000000000000000 RBX: ffffc900002ffa90 RCX: ffffffff813917fe <4>[ 163.729859] RDX: 003d48d44db60f44 RSI: ffffc900002ffa90 RDI: ffffffff839e3330 <4>[ 163.729875] RBP: ffffc90000563d70 R08: 0000000000000000 R09: 0000000000000000 <4>[ 163.729890] R10: 0000000000000000 R11: 0000000000000000 R12: ffff88811bd20500 <4>[ 163.729906] R13: ffffffff813917fe R14: ffffffff814903c3 R15: ffff88811bd20480