Oops#2 Part8 <4>[ 326.094002] ? xe_migrate_init+0x277/0x2d0 [xe] <4>[ 326.094118] xe_gt_init+0x35d/0xab0 [xe] <4>[ 326.094217] ? trace_hardirqs_on+0x63/0xd0 <4>[ 326.094222] ? _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 326.094227] ? __devm_add_action+0x70/0xa0 <4>[ 326.094233] ? xe_irq_install+0x11a/0x490 [xe] <4>[ 326.094350] xe_device_probe+0x3c5/0xc10 [xe] <4>[ 326.094445] ? __drm_dev_dbg+0x7d/0xb0 <4>[ 326.094451] ? __drmm_add_action_or_reset+0x1e/0x50 <4>[ 326.094459] xe_pci_probe+0x396/0x610 [xe] <4>[ 326.094581] local_pci_probe+0x47/0xb0 <4>[ 326.094587] pci_device_probe+0xf3/0x260 <4>[ 326.094594] really_probe+0xf1/0x410 <4>[ 326.094598] __driver_probe_device+0x8c/0x190 <4>[ 326.094602] device_driver_attach+0x57/0xd0 <4>[ 326.094606] bind_store+0x77/0xd0 <4>[ 326.094611] drv_attr_store+0x24/0x50 <4>[ 326.094614] sysfs_kf_write+0x4d/0x80 <4>[ 326.094619] kernfs_fop_write_iter+0x188/0x240 <4>[ 326.094624] vfs_write+0x283/0x540 <4>[ 326.094635] ksys_write+0x6f/0xf0 <4>[ 326.094641] __x64_sys_write+0x19/0x30 <4>[ 326.094643] x64_sys_call+0x79/0x26b0 <4>[ 326.094647] do_syscall_64+0x93/0x1470 <4>[ 326.094651] ? do_syscall_64+0x1e4/0x1470 <4>[ 326.094659] ? do_syscall_64+0x1e4/0x1470 <4>[ 326.094663] ? do_syscall_64+0x1e4/0x1470 <4>[ 326.094665] ? exc_page_fault+0xbb/0x260 <4>[ 326.094670] entry_SYSCALL_64_after_hwframe+0x76/0x7e <4>[ 326.094672] RIP: 0033:0x7de90a51c5a4 <4>[ 326.094675] Code: c7 00 16 00 00 00 b8 ff ff ff ff c3 66 2e 0f 1f 84 00 00 00 00 00 f3 0f 1e fa 80 3d a5 ea 0e 00 00 74 13 b8 01 00 00 00 0f 05 <48> 3d 00 f0 ff ff 77 54 c3 0f 1f 00 55 48 89 e5 48 83 ec 20 48 89 Oops#2 Part7 <4>[ 326.094677] RSP: 002b:00007ffd47bd9d68 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 326.094680] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 00007de90a51c5a4 <4>[ 326.094681] RDX: 000000000000000c RSI: 00007ffd47bda230 RDI: 0000000000000007 <4>[ 326.094683] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 326.094684] R10: 0000000000000000 R11: 0000000000000202 R12: 00007ffd47bda230 <4>[ 326.094686] R13: 0000000000000007 R14: 0000000000000006 R15: 00007ffd47bd9ee0 <4>[ 326.094697] <4>[ 326.094698] irq event stamp: 1218860 <4>[ 326.094699] hardirqs last enabled at (1218859): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 326.094702] hardirqs last disabled at (1218860): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 326.094705] softirqs last enabled at (1218028): [] __irq_exit_rcu+0x13f/0x160 <4>[ 326.094709] softirqs last disabled at (1218005): [] __irq_exit_rcu+0x13f/0x160 <4>[ 326.094711] ---[ end trace 0000000000000000 ]--- <7>[ 326.094714] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 326.094853] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 326.095531] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 326.095909] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 326.097356] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled Oops#2 Part6 <7>[ 326.201088] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 326.203143] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 328.356396] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=39 recv=38 <1>[ 328.357465] BUG: unable to handle page fault for address: ffffc9000c38a188 <1>[ 328.357495] #PF: supervisor write access in kernel mode <1>[ 328.357508] #PF: error_code(0x0002) - not-present page <6>[ 328.357520] PGD 100000067 P4D 100000067 PUD 100abd067 PMD 0 <4>[ 328.357539] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 328.357555] CPU: 10 UID: 0 PID: 2615 Comm: kworker/10:4 Tainted: G S U W 6.19.0-lgci-xe-xe-4574-e1032fc6a7b99e9b2-debug+ #1 PREEMPT(voluntary) <4>[ 328.357583] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 328.357593] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 328.357609] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 328.358083] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 328.358556] Code: 24 66 90 65 8b 05 4c 87 2a e3 48 0f a3 05 f0 a1 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 328.358592] RSP: 0018:ffffc90003fe7830 EFLAGS: 00010086 <4>[ 328.358610] RAX: 0000000000000002 RBX: ffffc9000c38a188 RCX: 0000000000000000 <4>[ 328.358628] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888141a68060 <4>[ 328.358646] RBP: ffffc90003fe78a8 R08: 0000000000000000 R09: 0000000000000000 Oops#2 Part5 <4>[ 328.358663] R10: ffff888154a28000 R11: 0000000000000001 R12: ffff888141a68060 <4>[ 328.358680] R13: 000000000000a188 R14: ffff888154a28000 R15: 0000000000010001 <4>[ 328.358697] FS: 0000000000000000(0000) GS:ffff8888db1da000(0000) knlGS:0000000000000000 <4>[ 328.358718] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 328.358732] CR2: ffffc9000c38a188 CR3: 0000000003448001 CR4: 0000000000f72ef0 <4>[ 328.358750] PKRU: 55555554 <4>[ 328.358760] Call Trace: <4>[ 328.358770] <4>[ 328.358788] xe_force_wake_get+0x415/0x950 [xe] <4>[ 328.359195] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 328.359225] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 328.359660] ? trace_hardirqs_on+0x63/0xd0 <4>[ 328.359682] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 328.359699] ? xe_tlb_inval_fence_prep+0xbf/0x1a0 [xe] <4>[ 328.360204] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 328.360691] ? find_held_lock+0x31/0x90 <4>[ 328.360709] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 328.361114] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 328.361504] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 328.361573] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 328.361641] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 328.361710] ? _raw_write_unlock+0x22/0x50 <4>[ 328.361713] ? drm_vma_offset_remove+0x65/0x80 <4>[ 328.361718] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 328.361785] ? lock_is_held_type+0xa3/0x130 <4>[ 328.361790] ttm_bo_release+0x70/0x330 [ttm] <4>[ 328.361797] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 328.361868] ? lock_release+0xce/0x280 <4>[ 328.361872] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 328.361879] xe_gem_object_free+0x1a/0x30 [xe] Oops#2 Part4 <4>[ 328.361954] drm_gem_object_free+0x1d/0x40 <4>[ 328.361958] xe_bo_put+0x12a/0x190 [xe] <4>[ 328.362029] xe_lrc_destroy+0x47/0x60 [xe] <4>[ 328.362106] xe_exec_queue_fini+0x85/0xd0 [xe] <4>[ 328.362174] __guc_exec_queue_destroy_async+0x6c/0x170 [xe] <4>[ 328.362247] process_one_work+0x22e/0x6b0 <4>[ 328.362252] worker_thread+0x1e8/0x3d0 <4>[ 328.362255] ? __pfx_worker_thread+0x10/0x10 <4>[ 328.362257] kthread+0x11f/0x250 <4>[ 328.362261] ? __pfx_kthread+0x10/0x10 <4>[ 328.362264] ret_from_fork+0x344/0x3a0 <4>[ 328.362268] ? __pfx_kthread+0x10/0x10 <4>[ 328.362271] ret_from_fork_asm+0x1a/0x30 <4>[ 328.362275] <4>[ 328.362277] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling cmdlinepart x86_pkg_temp_thermal intel_powerclamp spi_nor hid_generic coretemp mtd eeepc_wmi asus_wmi sparse_keymap mei_hdcp mei_pxp platform_profile kvm_intel wmi_bmof snd_intel_dspcfg kvm snd_hda_codec irqbypass usbhid snd_hda_core ghash_clmulni_intel aesni_intel snd_hwdep hid video snd_pcm rapl intel_cstate snd_timer i2c_i801 r8169 snd spi_intel_pci i2c_mux binfmt_misc spi_intel soundcore i2c_smbus mei_me idma64 realtek mei intel_pmc_core pmt_telemetry nls_iso8859_1 pmt_discovery pmt_class intel_pmc_ssram_telemetry intel_vsec pinctrl_alderlake acpi_pad wmi acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part3 <4>[ 328.362313] autofs4 [last unloaded: snd_hda_intel] <4>[ 328.362339] CR2: ffffc9000c38a188 <4>[ 328.362342] ---[ end trace 0000000000000000 ]--- <4>[ 328.510674] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 328.510771] Code: 24 66 90 65 8b 05 4c 87 2a e3 48 0f a3 05 f0 a1 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 328.510778] RSP: 0018:ffffc90003fe7830 EFLAGS: 00010086 <4>[ 328.510781] RAX: 0000000000000002 RBX: ffffc9000c38a188 RCX: 0000000000000000 <4>[ 328.510785] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888141a68060 <4>[ 328.510788] RBP: ffffc90003fe78a8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 328.510791] R10: ffff888154a28000 R11: 0000000000000001 R12: ffff888141a68060 <4>[ 328.510794] R13: 000000000000a188 R14: ffff888154a28000 R15: 0000000000010001 <4>[ 328.510797] FS: 0000000000000000(0000) GS:ffff8888db1da000(0000) knlGS:0000000000000000 <4>[ 328.510801] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 328.510803] CR2: ffffc9000c38a188 CR3: 0000000003448001 CR4: 0000000000f72ef0 <4>[ 328.510807] PKRU: 55555554 <6>[ 328.510809] note: kworker/10:4[2615] exited with irqs disabled <6>[ 328.510827] note: kworker/10:4[2615] exited with preempt_count 1 <1>[ 330.659045] BUG: unable to handle page fault for address: ffffc90003fe7aa8 Oops#2 Part2 <1>[ 330.659075] #PF: supervisor read access in kernel mode <1>[ 330.659087] #PF: error_code(0x0000) - not-present page <6>[ 330.659099] PGD 100000067 P4D 100000067 PUD 100abd067 PMD 130053067 PTE 0 <4>[ 330.659122] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 330.659139] CPU: 9 UID: 0 PID: 6653 Comm: kworker/u64:19 Tainted: G S UD W 6.19.0-lgci-xe-xe-4574-e1032fc6a7b99e9b2-debug+ #1 PREEMPT(voluntary) <4>[ 330.659167] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 330.659178] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 330.659192] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 330.659657] RIP: 0010:xe_tlb_inval_fence_timeout+0x65/0x1d0 [xe] <4>[ 330.660101] Code: 89 df 48 89 45 d0 49 8b 85 08 ff ff ff 48 8b 40 20 2e 2e 2e ff d0 49 8d 45 c0 48 89 c7 48 89 45 c0 e8 df e3 c2 e1 49 8b 45 b0 <48> 8b 30 4c 8d 78 b8 48 8d 5e b8 49 8d 75 b0 48 89 75 c8 48 39 c6 <4>[ 330.660135] RSP: 0018:ffffc90005d6fdb0 EFLAGS: 00010046 <4>[ 330.660151] RAX: ffffc90003fe7aa8 RBX: ffff888141a68458 RCX: 0000000000000000 <4>[ 330.660168] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000000 <4>[ 330.660182] RBP: ffffc90005d6fdf0 R08: 0000000000000000 R09: 0000000000000000 <4>[ 330.660197] R10: 0000000000000000 R11: 0000000000000000 R12: ffff888154a28000 <4>[ 330.660212] R13: ffff888141a68560 R14: ffff888141a68560 R15: ffff8881518c0940 <4>[ 330.660228] FS: 0000000000000000(0000) GS:ffff8888db15a000(0000) knlGS:0000000000000000 <4>[ 330.660247] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 330.660261] CR2: ffffc90003fe7aa8 CR3: 0000000003448001 CR4: 0000000000f72ef0 Oops#2 Part1 <4>[ 330.660278] PKRU: 55555554 <4>[ 330.660286] Call Trace: <4>[ 330.660296] <4>[ 330.660311] process_one_work+0x22e/0x6b0 <4>[ 330.660339] worker_thread+0x1e8/0x3d0 <4>[ 330.660354] ? __pfx_worker_thread+0x10/0x10 <4>[ 330.660371] kthread+0x11f/0x250 <4>[ 330.660389] ? __pfx_kthread+0x10/0x10 <4>[ 330.660407] ret_from_fork+0x344/0x3a0 <4>[ 330.660423] ? __pfx_kthread+0x10/0x10 <4>[ 330.660440] ret_from_fork_asm+0x1a/0x30 <4>[ 330.660464] <4>[ 330.660472] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling cmdlinepart x86_pkg_temp_thermal intel_powerclamp spi_nor hid_generic coretemp mtd eeepc_wmi asus_wmi sparse_keymap mei_hdcp mei_pxp platform_profile kvm_intel wmi_bmof snd_intel_dspcfg kvm snd_hda_codec irqbypass usbhid snd_hda_core ghash_clmulni_intel aesni_intel snd_hwdep hid video snd_pcm rapl intel_cstate snd_timer i2c_i801 r8169 snd spi_intel_pci i2c_mux binfmt_misc spi_intel soundcore i2c_smbus mei_me idma64 realtek mei intel_pmc_core pmt_telemetry nls_iso8859_1 pmt_discovery pmt_class intel_pmc_ssram_telemetry intel_vsec pinctrl_alderlake acpi_pad wmi acpi_tad dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 330.660657] autofs4 [last unloaded: snd_hda_intel] <4>[ 330.660806] CR2: ffffc90003fe7aa8 <4>[ 330.660819] ---[ end trace 0000000000000000 ]---