Oops#2 Part15 <4>[ 183.944259] autofs4 [last unloaded: snd_hda_intel] <4>[ 183.944263] CPU: 3 UID: 0 PID: 5355 Comm: xe_fault_inject Tainted: G S U W 6.19.0-lgci-xe-xe-4570-d9e4e8f5c4e7aa0d4-debug+ #1 PREEMPT(voluntary) <4>[ 183.944266] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 183.944267] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 183.944268] RIP: 0010:guc_ct_change_state+0x2ed/0x350 [xe] <4>[ 183.944343] Code: 1f 85 eb 51 48 c1 ea 25 44 6b ca 64 44 29 c9 51 48 c7 c1 d0 63 18 a1 52 ff 75 b0 44 8b 4d 94 4c 8b 45 88 48 8b 95 78 ff ff ff <67> 48 0f b9 3a 8b 8b 48 01 00 00 48 83 c4 60 85 c9 75 13 44 89 bb <4>[ 183.944344] RSP: 0018:ffffc9000d5f77b0 EFLAGS: 00010002 <4>[ 183.944346] RAX: ffffffffa11fa8f2 RBX: ffff888176a288a8 RCX: ffffffffa11863d0 <4>[ 183.944348] RDX: ffff888101bd3090 RSI: ffffffffa11fa8f2 RDI: ffffffffa1002ef0 <4>[ 183.944349] RBP: ffffc9000d5f7898 R08: ffffffffa11fa942 R09: 0000000000000007 <4>[ 183.944350] R10: 0000000000000001 R11: 0000000000000514 R12: ffff888176a288b0 <4>[ 183.944351] R13: ffff888176a28940 R14: 0000000000000515 R15: 0000000000000001 <4>[ 183.944352] FS: 000073aff6224980(0000) GS:ffff8888dae5a000(0000) knlGS:0000000000000000 <4>[ 183.944354] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 183.944355] CR2: 00007e9d84c0b048 CR3: 00000001b42eb004 CR4: 0000000000f72ef0 <4>[ 183.944356] PKRU: 55555554 <4>[ 183.944358] Call Trace: <4>[ 183.944359] <4>[ 183.944367] ? xe_guc_submit_enable+0xa8/0xf0 [xe] Oops#2 Part14 <4>[ 183.944454] xe_guc_ct_disable+0x17/0x80 [xe] <4>[ 183.944533] xe_guc_sanitize+0x2a/0x50 [xe] <4>[ 183.944612] xe_uc_load_hw+0x19a/0x2b0 [xe] <4>[ 183.944716] ? xe_migrate_init+0x277/0x2d0 [xe] <4>[ 183.944808] xe_gt_init+0x363/0xab0 [xe] <4>[ 183.944885] ? trace_hardirqs_on+0x63/0xd0 <4>[ 183.944889] ? _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 183.944893] ? __devm_add_action+0x70/0xa0 <4>[ 183.944898] ? xe_irq_install+0x11a/0x490 [xe] <4>[ 183.944988] xe_device_probe+0x3cc/0xc20 [xe] <4>[ 183.945064] ? __drm_dev_dbg+0x7d/0xb0 <4>[ 183.945068] ? __drmm_add_action_or_reset+0x1e/0x50 <4>[ 183.945075] xe_pci_probe+0x396/0x610 [xe] <4>[ 183.945170] local_pci_probe+0x47/0xb0 <4>[ 183.945175] pci_device_probe+0xf3/0x260 <4>[ 183.945180] really_probe+0xf1/0x410 <4>[ 183.945183] __driver_probe_device+0x8c/0x190 <4>[ 183.945186] device_driver_attach+0x57/0xd0 <4>[ 183.945189] bind_store+0x77/0xd0 <4>[ 183.945193] drv_attr_store+0x24/0x50 <4>[ 183.945195] sysfs_kf_write+0x4d/0x80 <4>[ 183.945199] kernfs_fop_write_iter+0x188/0x240 <4>[ 183.945204] vfs_write+0x283/0x540 <4>[ 183.945212] ksys_write+0x6f/0xf0 <4>[ 183.945216] __x64_sys_write+0x19/0x30 <4>[ 183.945219] x64_sys_call+0x79/0x26b0 <4>[ 183.945221] do_syscall_64+0x93/0x1470 <4>[ 183.945223] ? putname+0x3e/0x80 <4>[ 183.945226] ? do_sys_openat2+0x95/0xe0 <4>[ 183.945232] ? __x64_sys_openat+0x54/0xa0 <4>[ 183.945236] ? do_syscall_64+0x1e4/0x1470 <4>[ 183.945239] ? do_syscall_64+0x1e4/0x1470 <4>[ 183.945241] ? exc_page_fault+0xbb/0x260 <4>[ 183.945245] entry_SYSCALL_64_after_hwframe+0x76/0x7e <4>[ 183.945247] RIP: 0033:0x73aff851c5a4 Oops#2 Part13 <4>[ 183.945249] Code: c7 00 16 00 00 00 b8 ff ff ff ff c3 66 2e 0f 1f 84 00 00 00 00 00 f3 0f 1e fa 80 3d a5 ea 0e 00 00 74 13 b8 01 00 00 00 0f 05 <48> 3d 00 f0 ff ff 77 54 c3 0f 1f 00 55 48 89 e5 48 83 ec 20 48 89 <4>[ 183.945251] RSP: 002b:00007ffe4d37e148 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 183.945253] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 000073aff851c5a4 <4>[ 183.945254] RDX: 000000000000000c RSI: 00007ffe4d37e610 RDI: 000000000000000b <4>[ 183.945255] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 183.945256] R10: 0000000000000000 R11: 0000000000000202 R12: 00007ffe4d37e610 <4>[ 183.945257] R13: 000000000000000b R14: 00005cc0a365135b R15: 00007ffe4d37e2c0 <4>[ 183.945265] <4>[ 183.945266] irq event stamp: 1135818 <4>[ 183.945267] hardirqs last enabled at (1135817): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 183.945270] hardirqs last disabled at (1135818): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 183.945272] softirqs last enabled at (1134976): [] __irq_exit_rcu+0x13f/0x160 <4>[ 183.945275] softirqs last disabled at (1134967): [] __irq_exit_rcu+0x13f/0x160 <4>[ 183.945277] ---[ end trace 0000000000000000 ]--- <7>[ 183.945279] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <4>[ 183.945371] ------------[ cut here ]------------ <4>[ 183.945388] xe 0000:03:00.0: [drm] Tile0: GT0: Failed to invalidate GGTT (-ENODEV) <4>[ 183.945391] WARNING: drivers/gpu/drm/xe/xe_ggtt.c:576 at ggtt_invalidate_gt_tlb.part.0+0x76/0xb0 [xe], CPU#13: kworker/13:4/3440 Oops#2 Part12 <3>[ 183.945494] xe 0000:03:00.0: probe with driver xe failed with error -12 <4>[ 183.945618] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp coretemp cmdlinepart hid_generic spi_nor asus_nb_wmi mtd asus_wmi mei_pxp mei_hdcp sparse_keymap platform_profile wmi_bmof kvm_intel binfmt_misc kvm irqbypass snd_intel_dspcfg ghash_clmulni_intel aesni_intel snd_hda_codec rapl snd_hda_core r8169 usbhid snd_hwdep video intel_cstate snd_pcm hid realtek i2c_i801 snd_timer i2c_mux spi_intel_pci snd idma64 spi_intel i2c_smbus soundcore nls_iso8859_1 intel_pmc_core pmt_telemetry mei_me pmt_discovery pmt_class mei intel_pmc_ssram_telemetry wmi pinctrl_alderlake acpi_tad acpi_pad intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink <4>[ 183.945712] autofs4 [last unloaded: snd_hda_intel] <4>[ 183.945717] CPU: 13 UID: 0 PID: 3440 Comm: kworker/13:4 Tainted: G S U W 6.19.0-lgci-xe-xe-4570-d9e4e8f5c4e7aa0d4-debug+ #1 PREEMPT(voluntary) <4>[ 183.945721] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 183.945723] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 183.945725] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] Oops#2 Part11 <4>[ 183.945839] RIP: 0010:ggtt_invalidate_gt_tlb.part.0+0x81/0xb0 [xe] <4>[ 183.945938] Code: 48 8b 7f 08 4c 8b 77 50 4d 85 f6 75 03 4c 8b 37 e8 b4 7e 5e e1 48 89 c6 48 8d 3d ca d3 3d 00 4d 89 e1 45 89 e8 89 d9 4c 89 f2 <67> 48 0f b9 3a 5b 41 5c 41 5d 41 5e 5d 31 c0 31 d2 31 c9 31 f6 31 <4>[ 183.945941] RSP: 0018:ffffc90005e53b08 EFLAGS: 00010246 <4>[ 183.945944] RAX: ffffffffa11fa8f2 RBX: 0000000000000000 RCX: 0000000000000000 <4>[ 183.945946] RDX: ffff888101bd3090 RSI: ffffffffa11fa8f2 RDI: ffffffffa1001fc0 <4>[ 183.945947] RBP: ffffc90005e53b28 R08: 0000000000000000 R09: ffffffffffffffed <4>[ 183.945949] R10: 0000000000000000 R11: 0000000000000000 R12: ffffffffffffffed <4>[ 183.945951] R13: 0000000000000000 R14: ffff888101bd3090 R15: 0000000000000000 <4>[ 183.945953] FS: 0000000000000000(0000) GS:ffff8888db35a000(0000) knlGS:0000000000000000 <4>[ 183.945955] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 183.945957] CR2: 0000614f744e6188 CR3: 0000000003448006 CR4: 0000000000f72ef0 <4>[ 183.945959] PKRU: 55555554 <4>[ 183.945960] Call Trace: <4>[ 183.945962] <4>[ 183.945966] ggtt_node_remove+0x11a/0x140 [xe] <3>[ 183.946033] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <4>[ 183.946084] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 183.946185] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 183.946285] ? _raw_write_unlock+0x22/0x50 <4>[ 183.946290] ? drm_vma_offset_remove+0x65/0x80 <4>[ 183.946305] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <7>[ 183.946341] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled Oops#2 Part10 <4>[ 183.946404] ? lock_is_held_type+0xa3/0x130 <4>[ 183.946412] ttm_bo_release+0x70/0x330 [ttm] <4>[ 183.946421] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 183.946520] ? lock_release+0xce/0x280 <4>[ 183.946527] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 183.946535] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 183.946629] drm_gem_object_free+0x1d/0x40 <4>[ 183.946632] xe_bo_put+0x12a/0x190 [xe] <4>[ 183.946729] xe_lrc_destroy+0x47/0x60 [xe] <4>[ 183.946843] xe_exec_queue_fini+0x85/0xd0 [xe] <4>[ 183.946942] __guc_exec_queue_destroy_async+0x6c/0x170 [xe] <4>[ 183.947051] process_one_work+0x22e/0x6b0 <4>[ 183.947062] worker_thread+0x1e8/0x3d0 <4>[ 183.947066] ? __pfx_worker_thread+0x10/0x10 <4>[ 183.947069] kthread+0x11f/0x250 <4>[ 183.947074] ? __pfx_kthread+0x10/0x10 <4>[ 183.947078] ret_from_fork+0x344/0x3a0 <4>[ 183.947082] ? __pfx_kthread+0x10/0x10 <4>[ 183.947086] ret_from_fork_asm+0x1a/0x30 <4>[ 183.947097] <4>[ 183.947099] irq event stamp: 10317 <4>[ 183.947100] hardirqs last enabled at (10323): [] __up_console_sem+0x79/0xa0 <4>[ 183.947104] hardirqs last disabled at (10328): [] __up_console_sem+0x5e/0xa0 <4>[ 183.947107] softirqs last enabled at (10190): [] __irq_exit_rcu+0x13f/0x160 <4>[ 183.947110] softirqs last disabled at (10185): [] __irq_exit_rcu+0x13f/0x160 <4>[ 183.947113] ---[ end trace 0000000000000000 ]--- <7>[ 183.947440] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 184.029945] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. Oops#2 Part9 <7>[ 184.033517] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 186.227723] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=38 recv=0 <1>[ 186.228717] BUG: unable to handle page fault for address: ffffc9000e38a188 <1>[ 186.228749] #PF: supervisor write access in kernel mode <1>[ 186.228765] #PF: error_code(0x0002) - not-present page <6>[ 186.228779] PGD 100000067 P4D 100000067 PUD 100ad2067 PMD 0 <4>[ 186.228801] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 186.228820] CPU: 13 UID: 0 PID: 61 Comm: kworker/13:0 Tainted: G S U W 6.19.0-lgci-xe-xe-4570-d9e4e8f5c4e7aa0d4-debug+ #1 PREEMPT(voluntary) <4>[ 186.228854] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 186.228869] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 186.228890] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 186.229387] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 186.229876] Code: 24 66 90 65 8b 05 4c 86 2a e3 48 0f a3 05 f0 a0 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 186.229912] RSP: 0018:ffffc9000035f830 EFLAGS: 00010086 <4>[ 186.229929] RAX: 0000000000000002 RBX: ffffc9000e38a188 RCX: 0000000000000000 <4>[ 186.229946] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88812ed281d0 <4>[ 186.229964] RBP: ffffc9000035f8a8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 186.229980] R10: ffff888112e80000 R11: 0000000000000001 R12: ffff88812ed281d0 Oops#2 Part8 <4>[ 186.229996] R13: 000000000000a188 R14: ffff888112e80000 R15: 0000000000010001 <4>[ 186.230013] FS: 0000000000000000(0000) GS:ffff8888db35a000(0000) knlGS:0000000000000000 <4>[ 186.230033] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 186.230048] CR2: ffffc9000e38a188 CR3: 0000000003448006 CR4: 0000000000f72ef0 <4>[ 186.230064] PKRU: 55555554 <4>[ 186.230074] Call Trace: <4>[ 186.230084] <4>[ 186.230103] xe_force_wake_get+0x417/0x950 [xe] <4>[ 186.230521] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 186.230551] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 186.231005] ? trace_hardirqs_on+0x63/0xd0 <4>[ 186.231026] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 186.231042] ? xe_tlb_inval_fence_prep+0xbf/0x1a0 [xe] <4>[ 186.231560] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 186.232065] ? find_held_lock+0x31/0x90 <4>[ 186.232083] ? ggtt_node_remove+0xcb/0x140 [xe] <4>[ 186.232501] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 186.232665] ggtt_node_remove+0x12c/0x140 [xe] <4>[ 186.232764] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 186.232863] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 186.232962] ? _raw_write_unlock+0x22/0x50 <4>[ 186.232966] ? drm_vma_offset_remove+0x65/0x80 <4>[ 186.232972] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 186.233067] ? lock_is_held_type+0xa3/0x130 <4>[ 186.233074] ttm_bo_release+0x70/0x330 [ttm] <4>[ 186.233083] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 186.233182] ? lock_release+0xce/0x280 <4>[ 186.233187] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 186.233195] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 186.233289] drm_gem_object_free+0x1d/0x40 Oops#2 Part7 <4>[ 186.233294] xe_bo_put+0x12a/0x190 [xe] <4>[ 186.233389] xe_lrc_destroy+0x47/0x60 [xe] <4>[ 186.233502] xe_exec_queue_fini+0x85/0xd0 [xe] <4>[ 186.233600] __guc_exec_queue_destroy_async+0x6c/0x170 [xe] <4>[ 186.233708] process_one_work+0x22e/0x6b0 <4>[ 186.233714] worker_thread+0x1e8/0x3d0 <4>[ 186.233718] ? __pfx_worker_thread+0x10/0x10 <4>[ 186.233722] kthread+0x11f/0x250 <4>[ 186.233726] ? __pfx_kthread+0x10/0x10 <4>[ 186.233730] ret_from_fork+0x344/0x3a0 <4>[ 186.233735] ? __pfx_kthread+0x10/0x10 <4>[ 186.233739] ret_from_fork_asm+0x1a/0x30 <4>[ 186.233745] <4>[ 186.233747] Modules linked in: snd_hda_codec_intelhdmi snd_hda_codec_hdmi pmt_crashlog mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp coretemp cmdlinepart hid_generic spi_nor asus_nb_wmi mtd asus_wmi mei_pxp mei_hdcp sparse_keymap platform_profile wmi_bmof kvm_intel binfmt_misc kvm irqbypass snd_intel_dspcfg ghash_clmulni_intel aesni_intel snd_hda_codec rapl snd_hda_core r8169 usbhid snd_hwdep video intel_cstate snd_pcm hid realtek i2c_i801 snd_timer i2c_mux spi_intel_pci snd idma64 spi_intel i2c_smbus soundcore nls_iso8859_1 intel_pmc_core pmt_telemetry mei_me pmt_discovery pmt_class mei intel_pmc_ssram_telemetry wmi pinctrl_alderlake acpi_tad acpi_pad intel_vsec dm_multipath msr nvme_fabrics fuse efi_pstore nfnetlink Oops#2 Part6 <4>[ 186.233792] autofs4 [last unloaded: snd_hda_intel] <4>[ 186.233826] CR2: ffffc9000e38a188 <4>[ 186.233830] ---[ end trace 0000000000000000 ]--- <4>[ 186.392458] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 186.392584] Code: 24 66 90 65 8b 05 4c 86 2a e3 48 0f a3 05 f0 a0 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 186.392593] RSP: 0018:ffffc9000035f830 EFLAGS: 00010086 <4>[ 186.392597] RAX: 0000000000000002 RBX: ffffc9000e38a188 RCX: 0000000000000000 <4>[ 186.392600] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff88812ed281d0 <4>[ 186.392604] RBP: ffffc9000035f8a8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 186.392608] R10: ffff888112e80000 R11: 0000000000000001 R12: ffff88812ed281d0 <4>[ 186.392611] R13: 000000000000a188 R14: ffff888112e80000 R15: 0000000000010001 <4>[ 186.392615] FS: 0000000000000000(0000) GS:ffff8888db35a000(0000) knlGS:0000000000000000 <4>[ 186.392620] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 186.392623] CR2: ffffc9000e38a188 CR3: 0000000003448001 CR4: 0000000000f72ef0