Oops#2 Part7 <4>[ 89.560971] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 89.560972] R10: 0000000000000000 R11: 0000000000000202 R12: 00007fffc70128c0 <4>[ 89.560974] R13: 0000000000000007 R14: 0000000000000006 R15: 00007fffc7012570 <4>[ 89.560982] <4>[ 89.560983] irq event stamp: 1524330 <4>[ 89.560984] hardirqs last enabled at (1524329): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 89.560986] hardirqs last disabled at (1524330): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 89.560989] softirqs last enabled at (1524170): [] __irq_exit_rcu+0x13f/0x160 <4>[ 89.560992] softirqs last disabled at (1524161): [] __irq_exit_rcu+0x13f/0x160 <4>[ 89.560994] ---[ end trace 0000000000000000 ]--- <7>[ 89.560996] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 89.561092] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 89.561720] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 89.562081] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 89.563382] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 89.646689] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 89.647910] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 91.871329] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=51 recv=50 Oops#2 Part6 <3>[ 91.872176] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=52 recv=50 <1>[ 91.872314] BUG: unable to handle page fault for address: ffffc9000538a188 <1>[ 91.872346] #PF: supervisor write access in kernel mode <1>[ 91.872360] #PF: error_code(0x0002) - not-present page <6>[ 91.872372] PGD 100000067 P4D 100000067 PUD 100ab8067 PMD 0 <4>[ 91.872395] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 91.872412] CPU: 8 UID: 0 PID: 516 Comm: kworker/8:3 Tainted: G S U W 7.0.0-rc2-lgci-xe-xe-4655-cfc20c776480fda8c-debug+ #1 PREEMPT(lazy) <4>[ 91.872440] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 91.872450] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 91.872464] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 91.872936] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 91.873423] Code: 24 66 90 65 8b 05 0c 7e 2e e3 48 0f a3 05 b0 e3 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 91.873458] RSP: 0018:ffffc90001bd37e0 EFLAGS: 00010086 <4>[ 91.873474] RAX: 0000000000000002 RBX: ffffc9000538a188 RCX: 0000000000000000 <4>[ 91.873490] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888168750060 <4>[ 91.873507] RBP: ffffc90001bd3858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 91.873522] R10: ffff88817f640000 R11: 0000000000000001 R12: ffff888168750060 <4>[ 91.873537] R13: 000000000000a188 R14: ffff88817f640000 R15: 0000000000010001 <4>[ 91.873553] FS: 0000000000000000(0000) GS:ffff8888db099000(0000) knlGS:0000000000000000 Oops#2 Part5 <4>[ 91.873572] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 91.873586] CR2: ffffc9000538a188 CR3: 000000000344c003 CR4: 0000000000f72ef0 <4>[ 91.873603] PKRU: 55555554 <4>[ 91.873612] Call Trace: <4>[ 91.873621] <4>[ 91.873639] xe_force_wake_get+0x2a5/0x940 [xe] <4>[ 91.874046] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 91.874074] ? mark_held_locks+0x46/0x90 <4>[ 91.874097] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 91.874537] ? trace_hardirqs_on+0x22/0x100 <4>[ 91.874558] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 91.874577] ? xe_tlb_inval_fence_prep+0xce/0x1e0 [xe] <4>[ 91.875092] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 91.875583] ? xelpg_ggtt_pte_flags+0x27/0x1a0 [xe] <4>[ 91.875979] ? find_held_lock+0x31/0x90 <4>[ 91.875995] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 91.876399] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 91.876795] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 91.877189] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 91.877583] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 91.877791] ? _raw_write_unlock+0x22/0x50 <4>[ 91.877794] ? drm_vma_offset_remove+0x65/0x80 <4>[ 91.877799] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 91.877868] ? lock_is_held_type+0xa3/0x130 <4>[ 91.877873] ttm_bo_release+0x70/0x330 [ttm] <4>[ 91.877880] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 91.877950] ? lock_release+0xd0/0x2b0 <4>[ 91.877953] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 91.877959] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 91.878026] drm_gem_object_free+0x1d/0x40 <4>[ 91.878030] xe_bo_put+0x12a/0x190 [xe] Oops#2 Part4 <4>[ 91.878097] xe_lrc_destroy+0x49/0x90 [xe] <4>[ 91.878176] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 91.878244] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 91.878312] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 91.878386] process_one_work+0x22e/0x740 <4>[ 91.878390] worker_thread+0x1e8/0x3d0 <4>[ 91.878393] ? __pfx_worker_thread+0x10/0x10 <4>[ 91.878395] kthread+0x10d/0x150 <4>[ 91.878399] ? __pfx_kthread+0x10/0x10 <4>[ 91.878402] ret_from_fork+0x3d4/0x480 <4>[ 91.878405] ? __pfx_kthread+0x10/0x10 <4>[ 91.878408] ret_from_fork_asm+0x1a/0x30 <4>[ 91.878413] <4>[ 91.878414] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling cmdlinepart x86_pkg_temp_thermal hid_generic intel_powerclamp spi_nor mei_pxp eeepc_wmi mei_hdcp mtd asus_wmi sparse_keymap platform_profile wmi_bmof coretemp usbhid hid kvm_intel binfmt_misc r8169 kvm irqbypass ghash_clmulni_intel snd_intel_dspcfg snd_hda_codec aesni_intel rapl intel_cstate snd_hda_core snd_hwdep realtek video snd_pcm snd_timer i2c_i801 idma64 mei_me spi_intel_pci snd i2c_mux spi_intel soundcore i2c_smbus mei nls_iso8859_1 intel_pmc_core pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi pinctrl_alderlake intel_vsec acpi_tad acpi_pad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part3 <4>[ 91.878450] autofs4 [last unloaded: snd_hda_intel] <4>[ 91.878477] CR2: ffffc9000538a188 <4>[ 91.878480] ---[ end trace 0000000000000000 ]--- <4>[ 92.002808] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 92.002897] Code: 24 66 90 65 8b 05 0c 7e 2e e3 48 0f a3 05 b0 e3 d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 92.002904] RSP: 0018:ffffc90001bd37e0 EFLAGS: 00010086 <4>[ 92.002907] RAX: 0000000000000002 RBX: ffffc9000538a188 RCX: 0000000000000000 <4>[ 92.002910] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888168750060 <4>[ 92.002912] RBP: ffffc90001bd3858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 92.002915] R10: ffff88817f640000 R11: 0000000000000001 R12: ffff888168750060 <4>[ 92.002918] R13: 000000000000a188 R14: ffff88817f640000 R15: 0000000000010001 <4>[ 92.002921] FS: 0000000000000000(0000) GS:ffff8888db099000(0000) knlGS:0000000000000000 <4>[ 92.002924] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 92.002926] CR2: ffffc9000538a188 CR3: 000000000344c003 CR4: 0000000000f72ef0 <4>[ 92.002929] PKRU: 55555554 <6>[ 92.002931] note: kworker/8:3[516] exited with irqs disabled <6>[ 92.002946] note: kworker/8:3[516] exited with preempt_count 1 <1>[ 94.174071] BUG: unable to handle page fault for address: ffffc90001bd3a90 Oops#2 Part2 <1>[ 94.174101] #PF: supervisor read access in kernel mode <1>[ 94.174113] #PF: error_code(0x0000) - not-present page <6>[ 94.174125] PGD 100000067 P4D 100000067 PUD 100ab8067 PMD 11af45067 PTE 0 <4>[ 94.174147] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 94.174164] CPU: 1 UID: 0 PID: 204 Comm: kworker/u64:5 Tainted: G S UD W 7.0.0-rc2-lgci-xe-xe-4655-cfc20c776480fda8c-debug+ #1 PREEMPT(lazy) <4>[ 94.174193] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 94.174204] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 94.174219] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 94.174748] RIP: 0010:xe_tlb_inval_fence_timeout+0x65/0x220 [xe] <4>[ 94.175260] Code: 89 df 48 89 45 d0 49 8b 85 08 ff ff ff 48 8b 40 20 2e 2e 2e ff d0 49 8d 45 c0 48 89 c7 48 89 45 b8 e8 6f e3 c7 e1 49 8b 45 b0 <48> 8b 30 4c 8d 78 80 48 8d 5e 80 49 8d 75 b0 48 89 75 c8 48 39 c6 <4>[ 94.175295] RSP: 0018:ffffc900014cbdb0 EFLAGS: 00010046 <4>[ 94.175311] RAX: ffffc90001bd3a90 RBX: ffff888168750458 RCX: 0000000000000000 <4>[ 94.175327] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000000 <4>[ 94.175342] RBP: ffffc900014cbdf8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 94.175358] R10: 0000000000000000 R11: 0000000000000000 R12: ffff88817f640000 <4>[ 94.175373] R13: ffff888168750560 R14: ffff888168750560 R15: ffff8881074e28c0 <4>[ 94.175389] FS: 0000000000000000(0000) GS:ffff8888dad19000(0000) knlGS:0000000000000000 <4>[ 94.175408] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 94.175422] CR2: ffffc90001bd3a90 CR3: 000000000344c002 CR4: 0000000000f72ef0 Oops#2 Part1 <4>[ 94.175438] PKRU: 55555554 <4>[ 94.175448] Call Trace: <4>[ 94.175457] <4>[ 94.175473] process_one_work+0x22e/0x740 <4>[ 94.175500] worker_thread+0x1e8/0x3d0 <4>[ 94.175514] ? __pfx_worker_thread+0x10/0x10 <4>[ 94.175529] kthread+0x10d/0x150 <4>[ 94.175546] ? __pfx_kthread+0x10/0x10 <4>[ 94.175564] ret_from_fork+0x3d4/0x480 <4>[ 94.175578] ? __pfx_kthread+0x10/0x10 <4>[ 94.175596] ret_from_fork_asm+0x1a/0x30 <4>[ 94.175622] <4>[ 94.175630] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling cmdlinepart x86_pkg_temp_thermal hid_generic intel_powerclamp spi_nor mei_pxp eeepc_wmi mei_hdcp mtd asus_wmi sparse_keymap platform_profile wmi_bmof coretemp usbhid hid kvm_intel binfmt_misc r8169 kvm irqbypass ghash_clmulni_intel snd_intel_dspcfg snd_hda_codec aesni_intel rapl intel_cstate snd_hda_core snd_hwdep realtek video snd_pcm snd_timer i2c_i801 idma64 mei_me spi_intel_pci snd i2c_mux spi_intel soundcore i2c_smbus mei nls_iso8859_1 intel_pmc_core pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi pinctrl_alderlake intel_vsec acpi_tad acpi_pad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 94.175814] autofs4 [last unloaded: snd_hda_intel] <4>[ 94.175964] CR2: ffffc90001bd3a90 <4>[ 94.175977] ---[ end trace 0000000000000000 ]---