Oops#2 Part18 <7>[ 310.435867] xe 0000:03:00.0: [drm:whitelist_apply_to_hwe [xe]] Tile0: GT0: REG[0xdb1c-0xdb1f]: allow rw access <7>[ 310.436033] xe 0000:03:00.0: [drm:whitelist_apply_to_hwe [xe]] Tile0: GT0: Add ccs1 whitelist to engine <7>[ 310.436103] xe 0000:03:00.0: [drm:whitelist_apply_to_hwe [xe]] Tile0: GT0: REG[0xdafc-0xdaff]: allow read access <7>[ 310.436175] xe 0000:03:00.0: [drm:whitelist_apply_to_hwe [xe]] Tile0: GT0: REG[0xdb00-0xdb1f]: allow read access <7>[ 310.436246] xe 0000:03:00.0: [drm:whitelist_apply_to_hwe [xe]] Tile0: GT0: REG[0xdb1c-0xdb1f]: allow rw access <7>[ 310.437147] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying GT save-restore MMIOs <7>[ 310.437226] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x4148] = 0x00000000 <7>[ 310.437302] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x8828] = 0x00800000 <7>[ 310.437374] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xb0c8] = 0x55555440 <7>[ 310.437446] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xb104] = 0x08104440 <7>[ 310.437518] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xb108] = 0x30200000 <7>[ 310.437591] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xb158] = 0x0000007f <7>[ 310.437665] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: flag:0x1 <7>[ 310.437730] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: mocs entries: 16 <7>[ 310.437794] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[0] 0x4000 0xc Oops#2 Part17 <7>[ 310.437859] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[1] 0x4004 0x10c <7>[ 310.437945] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[2] 0x4008 0x130 <7>[ 310.438020] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[3] 0x400c 0x13c <7>[ 310.438087] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[4] 0x4010 0x100 <7>[ 310.438152] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[5] 0x4014 0x100 <7>[ 310.438216] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[6] 0x4018 0x100 <7>[ 310.438280] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[7] 0x401c 0x100 <7>[ 310.438344] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[8] 0x4020 0x100 <7>[ 310.438409] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[9] 0x4024 0x100 <7>[ 310.438473] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[10] 0x4028 0x100 <7>[ 310.438538] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[11] 0x402c 0x100 <7>[ 310.438601] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[12] 0x4030 0x100 <7>[ 310.438664] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[13] 0x4034 0x100 <7>[ 310.438728] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[14] 0x4038 0x100 <7>[ 310.438792] xe 0000:03:00.0: [drm:xe_mocs_init [xe]] Tile0: GT0: GLOB_MOCS[15] 0x403c 0x100 <7>[ 310.438858] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying rcs0 save-restore MMIOs <7>[ 310.438946] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x2050] = 0x10001000 Oops#2 Part16 <7>[ 310.439041] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x20c4] = 0x3f7e0306 <7>[ 310.439110] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x20d4] = 0xc080c080 <7>[ 310.439180] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24d0] = 0x1000dafc <7>[ 310.439249] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24d4] = 0x1000db01 <7>[ 310.439317] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x24d8] = 0x0000db1c <7>[ 310.439389] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe194] = 0x00400040 <7>[ 310.439458] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe48c] = 0x02000200 <7>[ 310.439525] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe49c] = 0x40004000 <7>[ 310.439593] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe4c4] = 0x10401040 <7>[ 310.439662] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe4f0] = 0x00020002 <7>[ 310.439737] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe530] = 0x00000400 <7>[ 310.439813] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe7c8] = 0x04002000 <7>[ 310.439887] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0xe7cc] = 0x00009000 <7>[ 310.439975] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x14800] = 0x00020002 <7>[ 310.440128] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying bcs0 save-restore MMIOs <7>[ 310.440198] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x22050] = 0x10001000 Oops#2 Part15 <7>[ 310.440265] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x220c4] = 0x3f7e0306 <7>[ 310.440331] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x220d4] = 0xc080c080 <7>[ 310.440471] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying bcs8 save-restore MMIOs <7>[ 310.440540] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x3ee050] = 0x10001000 <7>[ 310.440607] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x3ee0c4] = 0x3f7e0306 <7>[ 310.440672] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x3ee0d4] = 0xc080c080 <7>[ 310.440801] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying ccs0 save-restore MMIOs <7>[ 310.440871] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a050] = 0x10001000 <7>[ 310.440956] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a0c4] = 0x3f7e0308 <7>[ 310.441034] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a0d4] = 0xc080c080 <7>[ 310.441111] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a4d0] = 0x1000dafc <7>[ 310.441182] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a4d4] = 0x1000db01 <7>[ 310.441248] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1a4d8] = 0x0000db1c <7>[ 310.441396] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: Applying ccs1 save-restore MMIOs <7>[ 310.441463] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c050] = 0x10001000 Oops#2 Part14 <7>[ 310.441530] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c0c4] = 0x3f7e0308 <7>[ 310.441596] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c0d4] = 0xc080c080 <7>[ 310.441662] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c4d0] = 0x1000dafc <7>[ 310.441728] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c4d4] = 0x1000db01 <7>[ 310.441793] xe 0000:03:00.0: [drm:xe_reg_sr_apply_mmio [xe]] Tile0: GT0: REG[0x1c4d8] = 0x0000db1c <7>[ 310.442182] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 310.444424] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 0] = 0x010823f7 <7>[ 310.444486] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 1] = 0x00000800 <7>[ 310.444544] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 2] = 0x00000014 <7>[ 310.444600] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 3] = 0x00000001 <7>[ 310.444655] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 4] = 0x0000232e <7>[ 310.444711] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 5] = 0xe20b0000 <7>[ 310.444766] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 6] = 0x00000000 <7>[ 310.444820] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 7] = 0x00000000 <7>[ 310.444875] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 8] = 0x00000000 <7>[ 310.444951] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[ 9] = 0x00000000 Oops#2 Part13 <7>[ 310.445013] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[10] = 0x00000000 <7>[ 310.445073] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[11] = 0x00000000 <7>[ 310.445132] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[12] = 0x00000000 <7>[ 310.445188] xe 0000:03:00.0: [drm:guc_print_params [xe]] Tile0: GT0: GuC param[13] = 0x00000000 <7>[ 310.445268] xe 0000:03:00.0: [drm:xe_guc_id_mgr_init [xe]] Tile0: GT0: using 65535 GuC IDs <7>[ 310.445346] xe 0000:03:00.0: [drm:xe_guc_db_mgr_init [xe]] Tile0: GT0: using 256 doorbells <7>[ 310.446546] xe 0000:03:00.0: [drm:guc_buf_cache_init [xe]] Tile0: GT0: reusable buffer with 2097152 dwords at 0x627000 for xe_guc_buf_cache_init_with_size [xe] <7>[ 310.447429] xe 0000:03:00.0: [drm:xe_migrate_init [xe]] Migrate min chunk size is 0x00010000 <7>[ 310.448434] xe 0000:03:00.0: [drm:xe_guc_capture_steered_list_init [xe]] Tile0: GT0: capture found 120 ext-regs. <7>[ 310.470860] xe 0000:03:00.0: [drm:xe_guc_ads_populate [xe]] Tile0: GT0: Updated ADS capture size 20480 (was 49152) <7>[ 310.481665] xe 0000:03:00.0: [drm:guc_wait_ucode [xe]] Tile0: GT0: GuC load: init took 10ms, freq = 2150MHz (req = 2133MHz), before = 2150MHz, status = 0x8002F034 <7>[ 310.481976] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel enabled <7>[ 310.482557] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC rcs0 WA job: 4140 dwords <7>[ 310.482638] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x5588] = 0x04000400 Oops#2 Part12 <7>[ 310.482707] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6204] = 0x01400140 <7>[ 310.482771] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6208] = 0x00200020 <7>[ 310.482837] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x62a8] = 0x02400240 <7>[ 310.482918] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7010] = 0x40004000 <7>[ 310.483002] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7044] = 0x04200420 <7>[ 310.483063] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x7300] = 0x10001000 <7>[ 310.483128] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x83a8] = 0x20002000 <7>[ 310.483195] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x6210] = ~0x3f18000|0x3f18000 <7>[ 310.484998] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC bcs0 WA job: 27 dwords <7>[ 310.485067] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: REG[0x22204] = ~0x7e7e|0x606 <7>[ 310.485132] xe 0000:03:00.0: [drm:xe_lrc_emit_hwe_state_instructions [xe]] Tile0: GT0: No non-register state to emit on graphics ver 20.01 <7>[ 310.486349] xe 0000:03:00.0: [drm:xe_gt_record_default_lrcs [xe]] Tile0: GT0: LRC ccs0 WA job: 0 dwords <7>[ 310.486418] xe 0000:03:00.0: [drm:xe_lrc_emit_hwe_state_instructions [xe]] Tile0: GT0: No non-register state to emit on graphics ver 20.01 <5>[ 310.489391] FAULT_INJECTION: forcing a failure. <5>[ 310.489391] name fail_function, interval 0, probability 100, space 1, times 100 Oops#2 Part11 <3>[ 310.489394] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC PC query task state failed: -ENOMEM <4>[ 310.489410] ------------[ cut here ]------------ <4>[ 310.489411] xe 0000:03:00.0: [drm] Assertion `ct->g2h_outstanding == 0 || state == XE_GUC_CT_STATE_STOPPED` failed! <4>[ 310.489411] platform: BATTLEMAGE subplatform: 7 <4>[ 310.489411] graphics: Xe2_HPG 20.01 step A0 <4>[ 310.489411] media: Xe2_HPM 13.01 step A1 <4>[ 310.489411] tile: 0 VRAM 12.0 GiB <4>[ 310.489411] GT: 0 type 1 <4>[ 310.489414] WARNING: drivers/gpu/drm/xe/xe_guc_ct.c:527 at guc_ct_change_state+0x279/0x350 [xe], CPU#0: xe_fault_inject/7023 <4>[ 310.489483] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic coretemp cmdlinepart spi_nor asus_nb_wmi mei_pxp mei_hdcp mtd asus_wmi sparse_keymap platform_profile wmi_bmof kvm_intel usbhid snd_hda_intel kvm hid irqbypass ghash_clmulni_intel snd_intel_dspcfg aesni_intel snd_hda_codec rapl video r8169 intel_cstate snd_hda_core snd_hwdep realtek snd_pcm i2c_i801 snd_timer binfmt_misc i2c_mux snd spi_intel_pci mei_me i2c_smbus soundcore spi_intel idma64 mei intel_pmc_core pmt_telemetry pmt_discovery pmt_class nls_iso8859_1 intel_pmc_ssram_telemetry wmi acpi_tad pinctrl_alderlake intel_vsec acpi_pad dm_multipath msr nvme_fabrics fuse Oops#2 Part10 <4>[ 310.489535] efi_pstore nfnetlink autofs4 <4>[ 310.489539] CPU: 0 UID: 0 PID: 7023 Comm: xe_fault_inject Tainted: G S U W 6.19.0-lgci-xe-xe-4551-8a3c5ed4673e2028f-debug+ #1 PREEMPT(voluntary) <4>[ 310.489542] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 310.489543] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 310.489544] RIP: 0010:guc_ct_change_state+0x2ed/0x350 [xe] <4>[ 310.489611] Code: 1f 85 eb 51 48 c1 ea 25 44 6b ca 64 44 29 c9 51 48 c7 c1 f0 63 18 a1 52 ff 75 b0 44 8b 4d 94 4c 8b 45 88 48 8b 95 78 ff ff ff <67> 48 0f b9 3a 8b 8b 48 01 00 00 48 83 c4 60 85 c9 75 13 44 89 bb <4>[ 310.489612] RSP: 0018:ffffc9000422f640 EFLAGS: 00010002 Oops#2 Part9 <4>[ 310.489614] RAX: ffffffffa11fa9f4 RBX: ffff888156f988a8 RCX: ffffffffa11863f0 <4>[ 310.489616] RDX: ffff888104119310 RSI: ffffffffa11fa9f4 RDI: ffffffffa1002f80 <4>[ 310.489617] RBP: ffffc9000422f728 R08: ffffffffa11faa44 R09: 0000000000000007 <4>[ 310.489618] R10: 0000000000000001 R11: 0000000000000514 R12: ffff888156f988b0 <4>[ 310.489619] R13: ffff888156f98940 R14: 0000000000000515 R15: 0000000000000001 <4>[ 310.489620] FS: 00007abb72aeb980(0000) GS:ffff8888dacda000(0000) knlGS:0000000000000000 <4>[ 310.489621] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 310.489622] CR2: 00005e3aacb11310 CR3: 00000003b6df8001 CR4: 0000000000f72ef0 <4>[ 310.489623] PKRU: 55555554 <4>[ 310.489624] Call Trace: <4>[ 310.489625] <4>[ 310.489633] ? xe_guc_submit_enable+0xa8/0xf0 [xe] <4>[ 310.489704] xe_guc_ct_disable+0x17/0x80 [xe] <4>[ 310.489768] xe_guc_sanitize+0x2a/0x50 [xe] <4>[ 310.489830] xe_uc_load_hw+0x19a/0x2b0 [xe] <4>[ 310.489922] ? xe_migrate_init+0x277/0x2d0 [xe] <4>[ 310.490007] xe_gt_init+0x363/0xab0 [xe] <4>[ 310.490083] ? trace_hardirqs_on+0x63/0xd0 <4>[ 310.490087] ? _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 310.490091] ? __devm_add_action+0x70/0xa0 <4>[ 310.490096] ? xe_irq_install+0x11a/0x490 [xe] <4>[ 310.490182] xe_device_probe+0x3cc/0xc20 [xe] <4>[ 310.490257] ? __drm_dev_dbg+0x7d/0xb0 <4>[ 310.490261] ? __drmm_add_action_or_reset+0x1e/0x50 <4>[ 310.490268] xe_pci_probe+0x396/0x610 [xe] <4>[ 310.490357] local_pci_probe+0x47/0xb0 <4>[ 310.490362] pci_device_probe+0xf3/0x260 <4>[ 310.490366] really_probe+0xf1/0x410 <4>[ 310.490370] __driver_probe_device+0x8c/0x190 Oops#2 Part8 <4>[ 310.490373] device_driver_attach+0x57/0xd0 <4>[ 310.490376] bind_store+0x77/0xd0 <4>[ 310.490380] drv_attr_store+0x24/0x50 <4>[ 310.490382] sysfs_kf_write+0x4d/0x80 <4>[ 310.490386] kernfs_fop_write_iter+0x188/0x240 <4>[ 310.490390] vfs_write+0x283/0x540 <4>[ 310.490398] ksys_write+0x6f/0xf0 <4>[ 310.490402] __x64_sys_write+0x19/0x30 <4>[ 310.490405] x64_sys_call+0x79/0x26b0 <4>[ 310.490407] do_syscall_64+0x93/0x1470 <4>[ 310.490410] ? __slab_free+0x15e/0x2c0 <4>[ 310.490414] ? call_rcu+0x34/0x50 <4>[ 310.490417] ? __delete_object+0x60/0xa0 <4>[ 310.490423] ? kmem_cache_free+0x49f/0x5c0 <4>[ 310.490424] ? putname+0x3e/0x80 <4>[ 310.490430] ? putname+0x3e/0x80 <4>[ 310.490432] ? putname+0x3e/0x80 <4>[ 310.490434] ? do_sys_openat2+0x95/0xe0 <4>[ 310.490439] ? __x64_sys_openat+0x54/0xa0 <4>[ 310.490444] ? do_syscall_64+0x1e4/0x1470 <4>[ 310.490446] ? do_syscall_64+0x1e4/0x1470 <4>[ 310.490450] ? do_syscall_64+0x1e4/0x1470 <4>[ 310.490452] ? do_syscall_64+0x1e4/0x1470 <4>[ 310.490454] ? do_syscall_64+0x1e4/0x1470 <4>[ 310.490457] entry_SYSCALL_64_after_hwframe+0x76/0x7e <4>[ 310.490459] RIP: 0033:0x7abb74d1c5a4 <4>[ 310.490462] Code: c7 00 16 00 00 00 b8 ff ff ff ff c3 66 2e 0f 1f 84 00 00 00 00 00 f3 0f 1e fa 80 3d a5 ea 0e 00 00 74 13 b8 01 00 00 00 0f 05 <48> 3d 00 f0 ff ff 77 54 c3 0f 1f 00 55 48 89 e5 48 83 ec 20 48 89 <4>[ 310.490463] RSP: 002b:00007fff997b7eb8 EFLAGS: 00000202 ORIG_RAX: 0000000000000001 <4>[ 310.490465] RAX: ffffffffffffffda RBX: 0000000000000000 RCX: 00007abb74d1c5a4 <4>[ 310.490466] RDX: 000000000000000c RSI: 00007fff997b9370 RDI: 000000000000000b Oops#2 Part7 <4>[ 310.490467] RBP: 000000000000000c R08: 0000000000000073 R09: 0000000000000000 <4>[ 310.490469] R10: 0000000000000000 R11: 0000000000000202 R12: 00007fff997b9370 <4>[ 310.490470] R13: 000000000000000b R14: 0000650e4c0f635b R15: 00007fff997b9020 <4>[ 310.490478] <4>[ 310.490479] irq event stamp: 1192914 <4>[ 310.490480] hardirqs last enabled at (1192913): [] _raw_spin_unlock_irqrestore+0x51/0x80 <4>[ 310.490483] hardirqs last disabled at (1192914): [] _raw_spin_lock_irq+0x6f/0x80 <4>[ 310.490484] softirqs last enabled at (1192022): [] __irq_exit_rcu+0x13f/0x160 <4>[ 310.490487] softirqs last disabled at (1192017): [] __irq_exit_rcu+0x13f/0x160 <4>[ 310.490490] ---[ end trace 0000000000000000 ]--- <7>[ 310.490492] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <3>[ 310.490587] xe 0000:03:00.0: probe with driver xe failed with error -12 <3>[ 310.491144] xe 0000:03:00.0: [drm] *ERROR* Tile0: GT0: GuC RC setup HOST_CONTROL(0) failed (-ENODEV) <7>[ 310.491506] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 310.492578] xe 0000:03:00.0: [drm:guc_ct_change_state [xe]] Tile0: GT0: GuC CT communication channel disabled <7>[ 310.594036] xe 0000:03:00.0: [drm:drm_pagemap_cache_fini [drm_gpusvm_helper]] Destroying dpagemap cache. <7>[ 310.595589] xe 0000:03:00.0: [drm:drm_pagemap_shrinker_fini [drm_gpusvm_helper]] Destroying dpagemap shrinker. <3>[ 312.775100] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=39 recv=38 Oops#2 Part6 <1>[ 312.777724] BUG: unable to handle page fault for address: ffffc9002338a188 <1>[ 312.777742] #PF: supervisor write access in kernel mode <1>[ 312.777754] #PF: error_code(0x0002) - not-present page <6>[ 312.777765] PGD 100000067 P4D 100000067 PUD 100ab3067 PMD 0 <4>[ 312.777787] Oops: Oops: 0002 [#1] SMP NOPTI <4>[ 312.777805] CPU: 8 UID: 0 PID: 206 Comm: kworker/8:1 Tainted: G S U W 6.19.0-lgci-xe-xe-4551-8a3c5ed4673e2028f-debug+ #1 PREEMPT(voluntary) <4>[ 312.777850] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [W]=WARN <4>[ 312.777867] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 312.777882] Workqueue: xe-destroy-wq __guc_exec_queue_destroy_async [xe] <4>[ 312.778183] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 312.778256] Code: 24 66 90 65 8b 05 5c 7a 2a e3 48 0f a3 05 00 95 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 <4>[ 312.778261] RSP: 0018:ffffc90001647830 EFLAGS: 00010086 <4>[ 312.778264] RAX: 0000000000000002 RBX: ffffc9002338a188 RCX: 0000000000000000 <4>[ 312.778266] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff8881802481d0 <4>[ 312.778269] RBP: ffffc900016478a8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 312.778271] R10: ffff8883d2ca0000 R11: 0000000000000001 R12: ffff8881802481d0 <4>[ 312.778273] R13: 000000000000a188 R14: ffff8883d2ca0000 R15: 0000000000010001 <4>[ 312.778276] FS: 0000000000000000(0000) GS:ffff8888db0da000(0000) knlGS:0000000000000000 <4>[ 312.778279] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 Oops#2 Part5 <4>[ 312.778281] CR2: ffffc9002338a188 CR3: 0000000003448006 CR4: 0000000000f72ef0 <4>[ 312.778284] PKRU: 55555554 <4>[ 312.778285] Call Trace: <4>[ 312.778287] <4>[ 312.778290] xe_force_wake_get+0x417/0x950 [xe] <4>[ 312.778347] ? _raw_spin_unlock_irqrestore+0x27/0x80 <4>[ 312.778353] send_tlb_inval_ggtt+0xfa/0x270 [xe] <4>[ 312.778418] ? trace_hardirqs_on+0x63/0xd0 <4>[ 312.778421] ? _raw_spin_unlock_irq+0x27/0x70 <4>[ 312.778424] ? xe_tlb_inval_fence_prep+0xbf/0x1a0 [xe] <4>[ 312.778500] xe_tlb_inval_ggtt+0x73/0x250 [xe] <4>[ 312.778576] ggtt_invalidate_gt_tlb.part.0+0x1f/0xb0 [xe] <4>[ 312.778646] ggtt_node_remove+0x122/0x140 [xe] <4>[ 312.778717] xe_ggtt_node_remove+0x40/0xa0 [xe] <4>[ 312.778784] xe_ggtt_remove_bo+0x87/0x250 [xe] <4>[ 312.778852] ? _raw_write_unlock+0x22/0x50 <4>[ 312.778855] ? drm_vma_offset_remove+0x65/0x80 <4>[ 312.778860] xe_ttm_bo_destroy+0xa2/0x2d0 [xe] <4>[ 312.778926] ? lock_is_held_type+0xa3/0x130 <4>[ 312.778931] ttm_bo_release+0x70/0x330 [ttm] <4>[ 312.778937] ? xe_ggtt_might_lock+0x29/0x60 [xe] <4>[ 312.779005] ? lock_release+0xce/0x280 <4>[ 312.779009] ttm_bo_fini+0x3c/0x70 [ttm] <4>[ 312.779015] xe_gem_object_free+0x1a/0x30 [xe] <4>[ 312.779082] drm_gem_object_free+0x1d/0x40 <4>[ 312.779085] xe_bo_put+0x12a/0x190 [xe] <4>[ 312.779152] xe_lrc_destroy+0x47/0x60 [xe] <4>[ 312.779226] xe_exec_queue_fini+0x85/0xd0 [xe] <4>[ 312.779294] __guc_exec_queue_destroy_async+0x6c/0x170 [xe] <4>[ 312.779365] process_one_work+0x22e/0x6b0 <4>[ 312.779369] worker_thread+0x1e8/0x3d0 <4>[ 312.779372] ? __pfx_worker_thread+0x10/0x10 <4>[ 312.779375] kthread+0x11f/0x250 Oops#2 Part4 <4>[ 312.779378] ? __pfx_kthread+0x10/0x10 <4>[ 312.779381] ret_from_fork+0x344/0x3a0 <4>[ 312.779385] ? __pfx_kthread+0x10/0x10 <4>[ 312.779388] ret_from_fork_asm+0x1a/0x30 <4>[ 312.779392] <4>[ 312.779394] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic coretemp cmdlinepart spi_nor asus_nb_wmi mei_pxp mei_hdcp mtd asus_wmi sparse_keymap platform_profile wmi_bmof kvm_intel usbhid snd_hda_intel kvm hid irqbypass ghash_clmulni_intel snd_intel_dspcfg aesni_intel snd_hda_codec rapl video r8169 intel_cstate snd_hda_core snd_hwdep realtek snd_pcm i2c_i801 snd_timer binfmt_misc i2c_mux snd spi_intel_pci mei_me i2c_smbus soundcore spi_intel idma64 mei intel_pmc_core pmt_telemetry pmt_discovery pmt_class nls_iso8859_1 intel_pmc_ssram_telemetry wmi acpi_tad pinctrl_alderlake intel_vsec acpi_pad dm_multipath msr nvme_fabrics fuse <4>[ 312.779426] efi_pstore nfnetlink autofs4 <4>[ 312.779453] CR2: ffffc9002338a188 <4>[ 312.779455] ---[ end trace 0000000000000000 ]--- <4>[ 312.919459] RIP: 0010:xe_mmio_write32+0x58/0x280 [xe] <4>[ 312.919561] Code: 24 66 90 65 8b 05 5c 7a 2a e3 48 0f a3 05 00 95 cd e2 0f 82 ee 00 00 00 41 f7 c5 00 00 00 01 0f 84 88 00 00 00 49 03 5c 24 08 <44> 89 3b 48 8d 65 d8 5b 41 5c 41 5d 41 5e 41 5f 5d 31 c0 31 d2 31 Oops#2 Part3 <4>[ 312.919568] RSP: 0018:ffffc90001647830 EFLAGS: 00010086 <4>[ 312.919572] RAX: 0000000000000002 RBX: ffffc9002338a188 RCX: 0000000000000000 <4>[ 312.919575] RDX: 0000000000010001 RSI: 000000000000a188 RDI: ffff8881802481d0 <4>[ 312.919578] RBP: ffffc900016478a8 R08: 0000000000000000 R09: 0000000000000000 <4>[ 312.919583] R10: ffff8883d2ca0000 R11: 0000000000000001 R12: ffff8881802481d0 <4>[ 312.919585] R13: 000000000000a188 R14: ffff8883d2ca0000 R15: 0000000000010001 <4>[ 312.919588] FS: 0000000000000000(0000) GS:ffff8888db0da000(0000) knlGS:0000000000000000 <4>[ 312.919591] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 312.919594] CR2: ffffc9002338a188 CR3: 0000000003448001 CR4: 0000000000f72ef0 <4>[ 312.919597] PKRU: 55555554 <6>[ 312.919599] note: kworker/8:1[206] exited with irqs disabled <6>[ 312.919613] note: kworker/8:1[206] exited with preempt_count 1 <6>[ 313.025710] pcieport 0000:00:06.0: AER: Multiple Correctable error message received from 0000:05:00.0 <4>[ 313.025751] nvme 0000:05:00.0: PCIe Bus Error: severity=Correctable, type=Physical Layer, (Receiver ID) <4>[ 313.025769] nvme 0000:05:00.0: device [15b7:5017] error status/mask=00000001/0000e000 <4>[ 313.025787] nvme 0000:05:00.0: [ 0] RxErr (First) <3>[ 315.076442] xe 0000:03:00.0: [drm] *ERROR* TLB invalidation fence timeout, seqno=23362336 recv=0 <1>[ 315.076482] BUG: unable to handle page fault for address: 00000001000a0ac0 <1>[ 315.076497] #PF: supervisor read access in kernel mode <1>[ 315.076508] #PF: error_code(0x0000) - not-present page Oops#2 Part2 <6>[ 315.076519] PGD 0 P4D 0 <4>[ 315.076532] Oops: Oops: 0000 [#2] SMP NOPTI <4>[ 315.076548] CPU: 3 UID: 0 PID: 6113 Comm: kworker/u64:54 Tainted: G S UD W 6.19.0-lgci-xe-xe-4551-8a3c5ed4673e2028f-debug+ #1 PREEMPT(voluntary) <4>[ 315.076576] Tainted: [S]=CPU_OUT_OF_SPEC, [U]=USER, [D]=DIE, [W]=WARN <4>[ 315.076586] Hardware name: ASUS System Product Name/PRIME Z790-P WIFI, BIOS 1645 03/15/2024 <4>[ 315.076601] Workqueue: gt-ordered-wq xe_tlb_inval_fence_timeout [xe] <4>[ 315.077080] RIP: 0010:__list_del_entry_valid_or_report+0x3b/0x120 <4>[ 315.077105] Code: 6f 08 4d 85 e4 74 50 4d 85 ed 74 5e 48 b8 00 01 00 00 00 00 ad de 49 39 c4 74 62 48 b8 22 01 00 00 00 00 ad de 49 39 c5 74 71 <49> 39 7d 00 0f 85 85 00 00 00 49 39 7c 24 08 0f 85 9f 00 00 00 b8 <4>[ 315.077132] RSP: 0018:ffffc9000afc3d60 EFLAGS: 00010013 <4>[ 315.077146] RAX: dead000000000122 RBX: ffffc90001647aa8 RCX: 0000000000000000 <4>[ 315.077159] RDX: 0000000000000000 RSI: 0000000000000000 RDI: ffffc90001647aa8 <4>[ 315.077172] RBP: ffffc9000afc3d78 R08: 0000000000000000 R09: 0000000000000000 <4>[ 315.077183] R10: 0000000000000000 R11: 0000000000000000 R12: ffffc90001647f20 <4>[ 315.077196] R13: 00000001000a0ac0 R14: ffffc90001647f38 R15: ffffc90001647ed8 <4>[ 315.077209] FS: 0000000000000000(0000) GS:ffff8888dae5a000(0000) knlGS:0000000000000000 <4>[ 315.077224] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 <4>[ 315.077238] CR2: 00000001000a0ac0 CR3: 0000000003448005 CR4: 0000000000f72ef0 <4>[ 315.077255] PKRU: 55555554 <4>[ 315.077264] Call Trace: <4>[ 315.077274] <4>[ 315.077286] ? update_stack_state+0x10e/0x1a0 Oops#2 Part1 <4>[ 315.077305] xe_tlb_inval_fence_signal+0x3b/0x1b0 [xe] <4>[ 315.077778] xe_tlb_inval_fence_timeout+0xb6/0x1d0 [xe] <4>[ 315.078235] process_one_work+0x22e/0x6b0 <4>[ 315.078260] worker_thread+0x1e8/0x3d0 <4>[ 315.078276] ? __pfx_worker_thread+0x10/0x10 <4>[ 315.078292] kthread+0x11f/0x250 <4>[ 315.078310] ? __pfx_kthread+0x10/0x10 <4>[ 315.078329] ret_from_fork+0x344/0x3a0 <4>[ 315.078344] ? __pfx_kthread+0x10/0x10 <4>[ 315.078362] ret_from_fork_asm+0x1a/0x30 <4>[ 315.078386] <4>[ 315.078393] Modules linked in: pmt_crashlog snd_hda_codec_intelhdmi snd_hda_codec_hdmi mei_lb mei_gsc_proxy mtd_intel_dg mei_gsc xe drm_gpuvm drm_gpusvm_helper drm_buddy drm_ttm_helper ttm gpu_sched drm_suballoc_helper drm_exec drm_display_helper cec rc_core drm_kunit_helpers i2c_algo_bit kunit intel_rapl_msr intel_rapl_common intel_uncore_frequency intel_uncore_frequency_common intel_tcc_cooling x86_pkg_temp_thermal intel_powerclamp hid_generic coretemp cmdlinepart spi_nor asus_nb_wmi mei_pxp mei_hdcp mtd asus_wmi sparse_keymap platform_profile wmi_bmof kvm_intel usbhid snd_hda_intel kvm hid irqbypass ghash_clmulni_intel snd_intel_dspcfg aesni_intel snd_hda_codec rapl video r8169 intel_cstate snd_hda_core snd_hwdep realtek snd_pcm i2c_i801 snd_timer binfmt_misc i2c_mux snd spi_intel_pci mei_me i2c_smbus soundcore spi_intel idma64 mei intel_pmc_core pmt_telemetry pmt_discovery pmt_class nls_iso8859_1 intel_pmc_ssram_telemetry wmi acpi_tad pinctrl_alderlake intel_vsec acpi_pad dm_multipath msr nvme_fabrics fuse <4>[ 315.078576] efi_pstore nfnetlink autofs4 <4>[ 315.078725] CR2: 00000001000a0ac0 <4>[ 315.078738] ---[ end trace 0000000000000000 ]---