Oops#2 Part10 <4>[ 322.942267] RDX: 000000000000000c RSI: 00007ffca05a6d20 RDI: 0000000000000007 <4>[ 322.942269] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 322.942270] R10: 0000000000000000 R11: 0000000000000202 R12: 00007ffca05a6d20 <4>[ 322.942272] R13: 0000000000000007 R14: 0000000000000006 R15: 00007ffca05a69d0 <4>[ 322.942283] <4>[ 322.942284] irq event stamp: 1453474 <4>[ 322.942285] hardirqs last enabled at (1453473): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 322.942289] hardirqs last disabled at (1453474): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 322.942292] softirqs last enabled at (1452766): [] __irq_exit_rcu+0x13f/0x160 <4>[ 322.942296] softirqs last disabled at (1452759): [] __irq_exit_rcu+0x13f/0x160 <4>[ 322.942299] ---[ end trace 0000000000000000 ]--- <7>[ 322.942301] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 322.942439] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 322.943177] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 322.943566] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 322.945333] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 323.013678] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 323.015264] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. Oops#2 Part9 <3>[ 325.203641] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=52 recv=51 <1>[ 325.204738] BUG: unable to handle page fault for address: ffffc9000638a188 <1>[ 325.204769] #PF: supervisor write access in kernel mode <1>[ 325.204782] #PF: error_code(0x0002) - not-present page <6>[ 325.204793] PGD 100000067 P4D 100000067 PUD 100ac1067 PMD 0 <4>[ 325.204813] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 325.204830] CPU: 4 UID: 0 PID: 2442 Comm: kworker/4:3 Tainted: G S U W N 7.0.0-rc3-lgci-xe-xe-4697-c8f35befe90e623b4-debug+ #1 PREEMPT(lazy) <4>[ 325.204858] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN, [N]=TEST <4>[ 325.204870] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 325.204886] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 325.205361] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 325.205827] Code: 24 66 90 65 8b 05 2c 48 2e e3 48 0f a3 05 d0 ae d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 325.205862] RSP: 0018:ffffc9000276f7e0 EFLAGS: 00010086 <4>[ 325.205880] RAX: 0000000000000002 RBX: ffffc9000638a188 RCX: 0000000000000000 <4>[ 325.205898] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88812c5a8060 <4>[ 325.205915] RBP: ffffc9000276f858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 325.205931] R10: ffff888128310000 R11: 0000000000000001 R12: ffff88812c5a8060 <4>[ 325.205947] R13: 000000000000a188 R14: ffff888128310000 R15: 0000000000010001 <4>[ 325.205964] FS: 0000000000000000(0000) GS:ffff8888dae9b000(0000) knlGS:0000000000000000 Oops#2 Part8 <4>[ 325.205984] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 325.206000] CR2: ffffc9000638a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 325.206017] PKRU: 55555554 <4>[ 325.206027] Call Trace: <4>[ 325.206037] <4>[ 325.206056] xe_force_wake_get+0x2a5/0x940 [xe] <4>[ 325.206458] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 325.206487] ? mark_held_locks+0x46/0x90 <4>[ 325.206511] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 325.206937] ? trace_hardirqs_on+0x22/0x100 <4>[ 325.206959] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 325.206979] ? xe_tlb_inval_fence_prep+0xce/0x1e0 [xe] <4>[ 325.207476] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 325.207944] ? xelpg_ggtt_pte_flags+0x27/0x1a0 [xe] <4>[ 325.208338] ? find_held_lock+0x31/0x90 <4>[ 325.208354] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 325.208753] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 325.209149] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 325.209429] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 325.209497] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 325.209565] ? _raw_write_unlock+0x22/0x50 <4>[ 325.209568] ? drm_vma_offset_remove+0x65/0x80 <4>[ 325.209573] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 325.209640] ? lock_is_held_type+0xa3/0x130 <4>[ 325.209645] ttm_bo_release+0x70/0x310 [ttm] <4>[ 325.209652] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 325.209720] ? lock_release+0xd0/0x2b0 <4>[ 325.209723] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 325.209729] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 325.209796] drm_gem_object_free+0x1d/0x40 <4>[ 325.209799] xe_bo_put+0x12a/0x190 [xe] Oops#2 Part7 <4>[ 325.209867] xe_lrc_destroy+0x49/0x90 [xe] <4>[ 325.209943] __xe_exec_queue_fini+0x6b/0xa0 [xe] <4>[ 325.210010] xe_exec_queue_fini+0x2b/0x60 [xe] <4>[ 325.210080] __guc_exec_queue_destroy_async+0x6c/0x1a0 [xe] <4>[ 325.210155] process_one_work+0x22e/0x740 <4>[ 325.210162] worker_thread+0x1e8/0x3d0 <4>[ 325.210164] ? __pfx_worker_thread+0x10/0x10 <4>[ 325.210167] kthread+0x10d/0x150 <4>[ 325.210170] ? __pfx_kthread+0x10/0x10 <4>[ 325.210174] ret_from_fork+0x3d4/0x480 <4>[ 325.210177] ? __pfx_kthread+0x10/0x10 <4>[ 325.210180] ret_from_fork_asm+0x1a/0x30 <4>[ 325.210185] <4>[ 325.210186] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal cmdlinepart intel_powerclamp spi_nor hid_generic asus_nb_wmi coretemp mtd asus_wmi mei_pxp mei_hdcp sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid binfmt_misc kvm irqbypass ghash_clmulni_intel aesni_intel snd_intel_dspcfg rapl r8169 snd_hda_codec intel_cstate snd_hda_core snd_hwdep video snd_pcm spi_intel_pci realtek spi_intel snd_timer mei_me nls_iso8859_1 i2c_i801 snd i2c_mux idma64 mei soundcore i2c_smbus intel_pmc_core pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi acpi_tad pinctrl_alderlake acpi_pad intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part6 <4>[ 325.210222] autofs4 [last unloaded: snd_hda_intel] <4>[ 325.210248] CR2: ffffc9000638a188 <4>[ 325.210251] ---[ end trace 0000000000000000 ]--- <4>[ 325.354164] RIP: 0010:xe_mmio_write32+0x58/0x2b0 [xe] <4>[ 325.354253] Code: 24 66 90 65 8b 05 2c 48 2e e3 48 0f a3 05 d0 ae d0 e2 0f 82 1d 01 00 00 41 f7 c5 00 00 00 01 0f 84 b7 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 325.354259] RSP: 0018:ffffc9000276f7e0 EFLAGS: 00010086 <4>[ 325.354262] RAX: 0000000000000002 RBX: ffffc9000638a188 RCX: 0000000000000000 <4>[ 325.354265] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88812c5a8060 <4>[ 325.354268] RBP: ffffc9000276f858 R08: 0000000000000000 R09: 0000000000000000 <4>[ 325.354270] R10: ffff888128310000 R11: 0000000000000001 R12: ffff88812c5a8060 <4>[ 325.354273] R13: 000000000000a188 R14: ffff888128310000 R15: 0000000000010001 <4>[ 325.354276] FS: 0000000000000000(0000) GS:ffff8888dae9b000(0000) knlGS:0000000000000000 <4>[ 325.354279] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 325.354282] CR2: ffffc9000638a188 CR3: 000000000344c004 CR4: 0000000000f72ef0 Oops#2 Part5 <4>[ 325.354284] PKRU: 55555554 <6>[ 325.354286] note: kworker/4:3[2442] exited with irqs disabled <6>[ 325.354301] note: kworker/4:3[2442] exited with preempt_count 1 <3>[ 327.506297] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=41352000 recv=0 <4>[ 327.506338] non-slab/vmalloc memory <4>[ 327.506352] ------------[ cut here ]------------ <4>[ 327.506362] list_del corruption. prev->next should be ffffc9000276fa90, but was 103d48d44db60f44. (prev=ffffffff81391a0e) <4>[ 327.506381] WARNING: lib/list_debug.c:62 at __list_del_entry_valid_or_report+0xd9/0x120, CPU#3: kworker/u64:14/3232 <4>[ 327.506413] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal cmdlinepart intel_powerclamp spi_nor hid_generic asus_nb_wmi coretemp mtd asus_wmi mei_pxp mei_hdcp sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid binfmt_misc kvm irqbypass ghash_clmulni_intel aesni_intel snd_intel_dspcfg rapl r8169 snd_hda_codec intel_cstate snd_hda_core snd_hwdep video snd_pcm spi_intel_pci realtek spi_intel snd_timer mei_me nls_iso8859_1 i2c_i801 snd i2c_mux idma64 mei soundcore i2c_smbus intel_pmc_core pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi acpi_tad pinctrl_alderlake acpi_pad intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part4 <4>[ 327.506577] autofs4 [last unloaded: snd_hda_intel] <4>[ 327.506686] CPU: 3 UID: 0 PID: 3232 Comm: kworker/u64:14 Tainted: G S UD W N 7.0.0-rc3-lgci-xe-xe-4697-c8f35befe90e623b4-debug+ #1 PREEMPT(lazy) <4>[ 327.506715] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN, [N]=TEST <4>[ 327.506729] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 327.506744] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 327.507283] RIP: 0010:__list_del_entry_valid_or_report+0xe3/0x120 <4>[ 327.507306] Code: b5 01 4c 89 ea 48 89 de 67 48 0f b9 3a 31 c0 eb 8b 4c 89 ef e8 be de 8e ff 48 8d 3d a7 29 b5 01 49 8b 55 00 4c 89 e9 48 89 de <67> 48 0f b9 3a 31 c0 e9 66 ff ff ff 4c 89 e7 e8 99 de 8e ff 48 8d <4>[ 327.507341] RSP: 0018:ffffc90004eb7d58 EFLAGS: 00010046 <4>[ 327.507358] RAX: 0000000000000000 RBX: ffffc9000276fa90 RCX: ffffffff81391a0e <4>[ 327.507374] RDX: 103d48d44db60f44 RSI: ffffc9000276fa90 RDI: ffffffff839e1480 <4>[ 327.507390] RBP: ffffc90004eb7d70 R08: 0000000000000000 R09: 0000000000000000 <4>[ 327.507405] R10: 0000000000000000 R11: 0000000000000000 R12: ffff88812c5a8500 Oops#2 Part3 <4>[ 327.507420] R13: ffffffff81391a0e R14: ffffffff81490573 R15: ffff88812c5a8480 <4>[ 327.507436] FS: 0000000000000000(0000) GS:ffff8888dae1b000(0000) knlGS:0000000000000000 <4>[ 327.507455] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 327.507470] CR2: 000057dfb7c92920 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 327.507486] PKRU: 55555554 <4>[ 327.507495] Call Trace: <4>[ 327.507505] <4>[ 327.507520] xe_tlb_inval_fence_signal+0x40/0x200 [xe] <4>[ 327.508011] ? lock_acquire+0x2b3/0x2f0 <4>[ 327.508032] xe_tlb_inval_fence_timeout+0xb9/0x220 [xe] <4>[ 327.508501] process_one_work+0x22e/0x740 <4>[ 327.508526] worker_thread+0x1e8/0x3d0 <4>[ 327.508540] ? __pfx_worker_thread+0x10/0x10 <4>[ 327.508554] kthread+0x10d/0x150 <4>[ 327.508572] ? __pfx_kthread+0x10/0x10 <4>[ 327.508591] ret_from_fork+0x3d4/0x480 <4>[ 327.508605] ? __pfx_kthread+0x10/0x10 <4>[ 327.508623] ret_from_fork_asm+0x1a/0x30 <4>[ 327.508649] <4>[ 327.508658] irq event stamp: 180480 <4>[ 327.508668] hardirqs last enabled at (180479): [] _raw_spin_unlock_irq+0x27/0x70 <4>[ 327.508698] hardirqs last disabled at (180480): [] __schedule+0x11e7/0x1dd0 <4>[ 327.508724] softirqs last enabled at (177494): [] __irq_exit_rcu+0x13f/0x160 <4>[ 327.508748] softirqs last disabled at (177489): [] __irq_exit_rcu+0x13f/0x160 <4>[ 327.508770] ---[ end trace 0000000000000000 ]--- <1>[ 327.508793] BUG: unable to handle page fault for address: ffffffff0a5a8510 <1>[ 327.508808] #PF: supervisor read access in kernel mode Oops#2 Part2 <1>[ 327.508822] #PF: error_code(0x0000) - not-present page <6>[ 327.508835] PGD 344f067 P4D 344f067 PUD 0 <4>[ 327.508853] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 327.508868] CPU: 3 UID: 0 PID: 3232 Comm: kworker/u64:14 Tainted: G S UD W N 7.0.0-rc3-lgci-xe-xe-4697-c8f35befe90e623b4-debug+ #1 PREEMPT(lazy) <4>[ 327.508900] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN, [N]=TEST <4>[ 327.508916] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 327.508934] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 327.509383] RIP: 0010:xe_tlb_inval_fence_signal+0x75/0x200 [xe] <4>[ 327.509822] Code: 48 8b 83 88 00 00 00 48 89 42 08 48 89 10 48 b8 00 01 00 00 00 00 ad de 48 89 83 80 00 00 00 48 83 c0 22 48 89 83 88 00 00 00 <49> 8b 95 b8 00 00 00 49 8d 85 b8 00 00 00 48 39 c2 0f 84 53 01 00 <4>[ 327.509857] RSP: 0018:ffffc90004eb7d80 EFLAGS: 00010086 <4>[ 327.509872] RAX: dead000000000122 RBX: ffffc9000276fa10 RCX: 0000000000000000 <4>[ 327.509888] RDX: 0000000000000000 RSI: 0000000000000000 RDI: 0000000000000000 <4>[ 327.509903] RBP: ffffc90004eb7da0 R08: 0000000000000000 R09: 0000000000000000 <4>[ 327.509918] R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000000000 <4>[ 327.509933] R13: ffffffff0a5a8458 R14: ffffffff81490573 R15: ffff88812c5a8480 <4>[ 327.509949] FS: 0000000000000000(0000) GS:ffff8888dae1b000(0000) knlGS:0000000000000000 <4>[ 327.509967] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 327.509981] CR2: ffffffff0a5a8510 CR3: 000000000344c004 CR4: 0000000000f72ef0 <4>[ 327.509998] PKRU: 55555554 <4>[ 327.510006] Call Trace: <4>[ 327.510014] Oops#2 Part1 <4>[ 327.510024] ? lock_acquire+0x2b3/0x2f0 <4>[ 327.510043] xe_tlb_inval_fence_timeout+0xb9/0x220 [xe] <4>[ 327.510481] process_one_work+0x22e/0x740 <4>[ 327.510503] worker_thread+0x1e8/0x3d0 <4>[ 327.510517] ? __pfx_worker_thread+0x10/0x10 <4>[ 327.510531] kthread+0x10d/0x150 <4>[ 327.510548] ? __pfx_kthread+0x10/0x10 <4>[ 327.510566] ret_from_fork+0x3d4/0x480 <4>[ 327.510578] ? __pfx_kthread+0x10/0x10 <4>[ 327.510596] ret_from_fork_asm+0x1a/0x30 <4>[ 327.510622] <4>[ 327.510629] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal cmdlinepart intel_powerclamp spi_nor hid_generic asus_nb_wmi coretemp mtd asus_wmi mei_pxp mei_hdcp sparse_keymap platform_profile wmi_bmof kvm_intel usbhid hid binfmt_misc kvm irqbypass ghash_clmulni_intel aesni_intel snd_intel_dspcfg rapl r8169 snd_hda_codec intel_cstate snd_hda_core snd_hwdep video snd_pcm spi_intel_pci realtek spi_intel snd_timer mei_me nls_iso8859_1 i2c_i801 snd i2c_mux idma64 mei soundcore i2c_smbus intel_pmc_core pmt_telemetry pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi acpi_tad pinctrl_alderlake acpi_pad intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 327.510804] autofs4 [last unloaded: snd_hda_intel] <4>[ 327.510953] CR2: ffffffff0a5a8510 <4>[ 327.510966] ---[ end trace 0000000000000000 ]---