Oops#2 Part10 <4>[ 350.478429] RSP: 002b:00007ffdac5b4948 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 350.478431] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 0000701fb5f1c5a4 <4>[ 350.478432] RDX: 000000000000000c RSI: 00007ffdac5b4e10 RDI: 0000000000000007 <4>[ 350.478433] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 350.478435] R10: 0000000000000000 R11: 0000000000000202 R12: 00007ffdac5b4e10 <4>[ 350.478436] R13: 0000000000000007 R14: 0000000000000006 R15: 00007ffdac5b4ac0 <4>[ 350.478444] <4>[ 350.478445] irq event stamp: 1267876 <4>[ 350.478446] hardirqs last enabled at (1267875): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 350.478448] hardirqs last disabled at (1267876): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 350.478450] softirqs last enabled at (1267046): [] __irq_exit_rcu+0x13f/0x160 <4>[ 350.478453] softirqs last disabled at (1267039): [] __irq_exit_rcu+0x13f/0x160 <4>[ 350.478456] ---[ end trace 0000000000000000 ]--- <7>[ 350.478458] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 350.478561] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 350.479106] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 350.479364] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 350.480420] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled Oops#2 Part9 <7>[ 350.579976] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 350.583426] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 352.754624] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=38 recv=0 <1>[ 352.755639] BUG: unable to handle page fault for address: ffffc9000838a188 <1>[ 352.755669] #PF: supervisor write access in kernel mode <1>[ 352.755683] #PF: error_code(0x0002) - not-present page <6>[ 352.755694] PGD 100000067 P4D 100000067 PUD 100aaa067 PMD 0 <4>[ 352.755714] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 352.755730] CPU: 8 UID: 0 PID: 4116 Comm: kworker/8:9 Tainted: G S U W 6.19.0-lgci-xe-xe-4574-e1032fc6a7b99e9b2-debug+ #1 PREEMPT(voluntary) <4>[ 352.755758] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 352.755769] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1656 04/18/2024 <4>[ 352.755784] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 352.756232] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 352.756710] Code: 24 66 90 65 8b 05 4c 87 2a e3 48 0f a3 05 f0 a1 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 352.756747] RSP: 0018:ffffc9000aec7830 EFLAGS: 00010086 <4>[ 352.756765] RAX: 0000000000000002 RBX: ffffc9000838a188 RCX: 0000000000000000 <4>[ 352.756782] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888131810060 <4>[ 352.756799] RBP: ffffc9000aec78a8 R08: 0000000000000000 R09: 0000000000000000 Oops#2 Part8 <4>[ 352.756816] R10: ffff8882f0c30000 R11: 0000000000000001 R12: ffff888131810060 <4>[ 352.756832] R13: 000000000000a188 R14: ffff8882f0c30000 R15: 0000000000010001 <4>[ 352.756849] FS: 0000000000000000(0000) GS:ffff8888db0da000(0000) knlGS:0000000000000000 <4>[ 352.756869] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 352.756884] CR2: ffffc9000838a188 CR3: 0000000003448004 CR4: 0000000000f72ef0 <4>[ 352.756901] PKRU: 55555554 <4>[ 352.756912] Call Trace: <4>[ 352.756922] <4>[ 352.756941] xe_force_wake_get+0x415/0x950 [xe] <4>[ 352.757194] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 352.757200] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 352.757282] ? trace_hardirqs_on+0x63/0xd0 <4>[ 352.757287] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 352.757290] ? xe_tlb_inval_fence_prep+0xbf/0x1a0 [xe] <4>[ 352.757383] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 352.757467] ? find_held_lock+0x31/0x90 <4>[ 352.757471] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 352.757542] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 352.757611] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 352.757680] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 352.757748] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 352.757817] ? _raw_write_unlock+0x22/0x50 <4>[ 352.757820] ? drm_vma_offset_remove+0x65/0x80 <4>[ 352.757825] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 352.757892] ? lock_is_held_type+0xa3/0x130 <4>[ 352.757897] ttm_bo_release+0x70/0x330 [ttm] <4>[ 352.757904] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 352.757972] ? lock_release+0xce/0x280 <4>[ 352.757976] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 352.757982] xe_gem_object_free+0x1a/0x30 [xe] Oops#2 Part7 <4>[ 352.758050] drm_gem_object_free+0x1d/0x40 <4>[ 352.758053] xe_bo_put+0x12a/0x190 [xe] <4>[ 352.758121] xe_lrc_destroy+0x47/0x60 [xe] <4>[ 352.758199] xe_exec_queue_fini+0x85/0xd0 [xe] <4>[ 352.758273] __guc_exec_queue_destroy_async+0x6c/0x170 [xe] <4>[ 352.758348] process_one_work+0x22e/0x6b0 <4>[ 352.758353] worker_thread+0x1e8/0x3d0 <4>[ 352.758355] ? __pfx_worker_thread+0x10/0x10 <4>[ 352.758358] kthread+0x11f/0x250 <4>[ 352.758362] ? __pfx_kthread+0x10/0x10 <4>[ 352.758365] ret_from_fork+0x344/0x3a0 <4>[ 352.758375] ? __pfx_kthread+0x10/0x10 <4>[ 352.758392] ret_from_fork_asm+0x1a/0x30 <4>[ 352.758416] <4>[ 352.758424] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit overlay intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp cmdlinepart hid_generic coretemp spi_nor asus_nb_wmi mei_pxp mei_hdcp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid kvm irqbypass hid ghash_clmulni_intel aesni_intel snd_intel_dspcfg r8169 snd_hda_codec video rapl snd_hda_core intel_cstate snd_hwdep binfmt_misc realtek snd_pcm snd_timer i2c_i801 idma64 i2c_mux snd mei_me spi_intel_pci i2c_smbus spi_intel soundcore mei intel_pmc_core pmt_telemetry nls_iso8859_1 pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi intel_vsec acpi_tad pinctrl_alderlake acpi_pad dm_multipath msr nvme_fabrics fuse efi_pstore Oops#2 Part6 <4>[ 352.758605] nfnetlink autofs4 [last unloaded: snd_hda_intel] <4>[ 352.758757] CR2: ffffc9000838a188 <4>[ 352.758771] ---[ end trace 0000000000000000 ]--- <4>[ 352.902239] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 352.902337] Code: 24 66 90 65 8b 05 4c 87 2a e3 48 0f a3 05 f0 a1 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 352.902343] RSP: 0018:ffffc9000aec7830 EFLAGS: 00010086 <4>[ 352.902346] RAX: 0000000000000002 RBX: ffffc9000838a188 RCX: 0000000000000000 <4>[ 352.902349] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff888131810060 <4>[ 352.902352] RBP: ffffc9000aec78a8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 352.902355] R10: ffff8882f0c30000 R11: 0000000000000001 R12: ffff888131810060 <4>[ 352.902357] R13: 000000000000a188 R14: ffff8882f0c30000 R15: 0000000000010001 <4>[ 352.902360] FS: 0000000000000000(0000) GS:ffff8888db0da000(0000) knlGS:0000000000000000 <4>[ 352.902363] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 352.902366] CR2: ffffc9000838a188 CR3: 0000000003448004 CR4: 0000000000f72ef0 Oops#2 Part5 <4>[ 352.902369] PKRU: 55555554 <6>[ 352.902370] note: kworker/8:9[4116] exited with irqs disabled <6>[ 352.902384] note: kworker/8:9[4116] exited with preempt_count 1 <3>[ 355.056337] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=0 recv=0 <4>[ 355.056375] non-slab/vmalloc memory <4>[ 355.056388] ------------[ cut here ]------------ <4>[ 355.056397] list_del corruption. prev->next should be ffffc9000aec7aa8, but was 850fc084a0558b44. (prev=ffffffff814856ad) <4>[ 355.056416] WARNING: lib/list_debug.c:62 at __list_del_entry_valid_or_report+0xd9/0x120, CPU#7: kworker/u64:42/5969 <4>[ 355.056450] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit overlay intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp cmdlinepart hid_generic coretemp spi_nor asus_nb_wmi mei_pxp mei_hdcp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid kvm irqbypass hid ghash_clmulni_intel aesni_intel snd_intel_dspcfg r8169 snd_hda_codec video rapl snd_hda_core intel_cstate snd_hwdep binfmt_misc realtek snd_pcm snd_timer i2c_i801 idma64 i2c_mux snd mei_me spi_intel_pci i2c_smbus spi_intel soundcore mei intel_pmc_core pmt_telemetry nls_iso8859_1 pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi intel_vsec acpi_tad pinctrl_alderlake acpi_pad dm_multipath msr nvme_fabrics fuse efi_pstore Oops#2 Part4 <4>[ 355.056608] nfnetlink autofs4 [last unloaded: snd_hda_intel] <4>[ 355.056716] CPU: 7 UID: 0 PID: 5969 Comm: kworker/u64:42 Tainted: G S UD W 6.19.0-lgci-xe-xe-4574-e1032fc6a7b99e9b2-debug+ #1 PREEMPT(voluntary) <4>[ 355.056744] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 355.056755] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1656 04/18/2024 <4>[ 355.056770] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 355.057319] RIP: 0010:__list_del_entry_valid_or_report+0xe3/0x120 <4>[ 355.057344] Code: b5 01 4c 89 ea 48 89 de 67 48 0f b9 3a 31 c0 eb 8b 4c 89 ef e8 be 0d 91 ff 48 8d 3d 17 77 b5 01 49 8b 55 00 4c 89 e9 48 89 de <67> 48 0f b9 3a 31 c0 e9 66 ff ff ff 4c 89 e7 e8 99 0d 91 ff 48 8d <4>[ 355.057379] RSP: 0018:ffffc9000d9e3d60 EFLAGS: 00010046 <4>[ 355.057395] RAX: 0000000000000000 RBX: ffffc9000aec7aa8 RCX: ffffffff814856ad Oops#2 Part3 <4>[ 355.057411] RDX: 850fc084a0558b44 RSI: ffffc9000aec7aa8 RDI: ffffffff839acf60 <4>[ 355.057427] RBP: ffffc9000d9e3d78 R08: 0000000000000000 R09: 0000000000000000 <4>[ 355.057442] R10: 0000000000000000 R11: 0000000000000000 R12: ffffc9000aec7f20 <4>[ 355.057457] R13: ffffffff814856ad R14: ffffc9000aec7f38 R15: ffffc9000aec7ed8 <4>[ 355.057473] FS: 0000000000000000(0000) GS:ffff8888db05a000(0000) knlGS:0000000000000000 <4>[ 355.057492] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 355.057507] CR2: 00005c59731814a8 CR3: 0000000003448002 CR4: 0000000000f72ef0 <4>[ 355.057523] PKRU: 55555554 <4>[ 355.057532] Call Trace: <4>[ 355.057542] <4>[ 355.057554] ? update_stack_state+0x10e/0x1a0 <4>[ 355.057573] xe_tlb_inval_fence_signal+0x3b/0x1b0 [xe] <4>[ 355.058076] xe_tlb_inval_fence_timeout+0xb6/0x1d0 [xe] <4>[ 355.058554] process_one_work+0x22e/0x6b0 <4>[ 355.058580] worker_thread+0x1e8/0x3d0 <4>[ 355.058596] ? __pfx_worker_thread+0x10/0x10 <4>[ 355.058612] kthread+0x11f/0x250 <4>[ 355.058631] ? __pfx_kthread+0x10/0x10 <4>[ 355.058650] ret_from_fork+0x344/0x3a0 <4>[ 355.058666] ? __pfx_kthread+0x10/0x10 <4>[ 355.058684] ret_from_fork_asm+0x1a/0x30 <4>[ 355.058707] <4>[ 355.058716] irq event stamp: 12880 <4>[ 355.058726] hardirqs last enabled at (12879): [] _raw_spin_unlock_irq+0x27/0x70 <4>[ 355.058753] hardirqs last disabled at (12880): [] __schedule+0x11cf/0x1d20 <4>[ 355.058777] softirqs last enabled at (12746): [] kernel_fpu_end+0x53/0x70 <4>[ 355.058801] softirqs last disabled at (12744): [] kernel_fpu_begin_mask+0xc4/0x120 Oops#2 Part2 <4>[ 355.058827] ---[ end trace 0000000000000000 ]--- <4>[ 355.058856] Oops: general protection fault, probably for non-canonical address 0x468949677481675d: 0000 [#2] SMP NOPTI <4>[ 355.058881] CPU: 7 UID: 0 PID: 5969 Comm: kworker/u64:42 Tainted: G S UD W 6.19.0-lgci-xe-xe-4574-e1032fc6a7b99e9b2-debug+ #1 PREEMPT(voluntary) <4>[ 355.058913] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 355.058926] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1656 04/18/2024 <4>[ 355.058943] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 355.059421] RIP: 0010:xe_pm_runtime_put+0x30/0x110 [xe] <4>[ 355.059902] Code: 48 89 e5 41 54 53 48 89 fb 48 8b 55 08 66 90 65 8b 05 08 3e 29 e3 48 0f a3 05 ac 58 cc e2 0f 82 94 00 00 00 f0 83 44 24 fc 00 <48> 8b 83 b0 2f 00 00 65 48 39 05 c9 3d 29 e3 0f 84 97 00 00 00 4c <4>[ 355.059936] RSP: 0018:ffffc9000d9e3d68 EFLAGS: 00010086 <4>[ 355.059951] RAX: 0000000000000001 RBX: 46894967748137ad RCX: 0000000000000000 <4>[ 355.059966] RDX: ffffffffa0cc4220 RSI: 46894967748137ad RDI: 46894967748137ad <4>[ 355.059982] RBP: ffffc9000d9e3d78 R08: 0000000000000000 R09: 0000000000000000 <4>[ 355.059997] R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000000001 <4>[ 355.060012] R13: ffffffff8138b29e R14: ffffc9000aec7f38 R15: ffffc9000aec7ed8 <4>[ 355.060027] FS: 0000000000000000(0000) GS:ffff8888db05a000(0000) knlGS:0000000000000000 <4>[ 355.060046] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 355.060060] CR2: 00005c59731814a8 CR3: 0000000003448002 CR4: 0000000000f72ef0 <4>[ 355.060076] PKRU: 55555554 <4>[ 355.060085] Call Trace: <4>[ 355.060093] Oops#2 Part1 <4>[ 355.060103] xe_tlb_inval_fence_signal+0xb0/0x1b0 [xe] <4>[ 355.060577] xe_tlb_inval_fence_timeout+0xb6/0x1d0 [xe] <4>[ 355.061043] process_one_work+0x22e/0x6b0 <4>[ 355.061066] worker_thread+0x1e8/0x3d0 <4>[ 355.061081] ? __pfx_worker_thread+0x10/0x10 <4>[ 355.061097] kthread+0x11f/0x250 <4>[ 355.061115] ? __pfx_kthread+0x10/0x10 <4>[ 355.061125] ret_from_fork+0x344/0x3a0 <4>[ 355.061128] ? __pfx_kthread+0x10/0x10 <4>[ 355.061131] ret_from_fork_asm+0x1a/0x30 <4>[ 355.061135] <4>[ 355.061136] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit overlay intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp cmdlinepart hid_generic coretemp spi_nor asus_nb_wmi mei_pxp mei_hdcp asus_wmi mtd sparse_keymap platform_profile wmi_bmof kvm_intel usbhid kvm irqbypass hid ghash_clmulni_intel aesni_intel snd_intel_dspcfg r8169 snd_hda_codec video rapl snd_hda_core intel_cstate snd_hwdep binfmt_misc realtek snd_pcm snd_timer i2c_i801 idma64 i2c_mux snd mei_me spi_intel_pci i2c_smbus spi_intel soundcore mei intel_pmc_core pmt_telemetry nls_iso8859_1 pmt_discovery pmt_class intel_pmc_ssram_telemetry wmi intel_vsec acpi_tad pinctrl_alderlake acpi_pad dm_multipath msr nvme_fabrics fuse efi_pstore <4>[ 355.061166] nfnetlink autofs4 [last unloaded: snd_hda_intel] <4>[ 355.061193] ---[ end trace 0000000000000000 ]---