Kernel BUG hit at drivers/gpu/drm/xe/xe_res_cursor.h:174 on ATS-M
Found this issue while running Neo with `./memory_benchmark_ocl --gtest_filter=RemoteAccess`, where fp64 is rejected, but the run still causes bad behavior that ends in this kernel BUG.
It was reproduced with this simple IGT test: xe_issue_res_cursor.c
[ 59.946245] ------------[ cut here ]------------
[ 59.946245] kernel BUG at drivers/gpu/drm/xe/xe_res_cursor.h:174!
[ 59.952398] invalid opcode: 0000 [#1] PREEMPT SMP NOPTI
[ 59.957674] CPU: 10 PID: 2855 Comm: xe_alloc Not tainted 6.1.0-rc1-0712+ #1
[ 59.964673] Hardware name: Gigabyte Technology Co., Ltd. H610M S2H DDR4/H610M S2H DDR4, BIOS F20 10/26/2022
[ 59.974465] RIP: 0010:emit_pte.constprop.0+0x216/0x240 [xe]
[ 59.980079] Code: ff 49 8b 07 4c 8d a8 00 10 00 00 4d 89 2f 8b 47 18 49 39 c5 72 16 49 29 c5 e8 d6 ca d4 d0 48 89 c7 48 85 c0 75 e8 0f 0b 0f 0b <0f> 0b 4d 89 2f 8b 47 18 49 89 7f 28 4c 29 e8 49 89 47 08 41 83 ec
[ 59.998925] RSP: 0018:ffffad93429f37b0 EFLAGS: 00010293
[ 60.004185] RAX: 0000000000000000 RBX: ffff9b300c3b68e0 RCX: 0000000000000001
[ 60.011365] RDX: ffff9b3050d00390 RSI: 0000000000008008 RDI: ffff9b3050d00390
[ 60.018537] RBP: ffffad93429f37e8 R08: 0000000000000029 R09: 0000000000000001
[ 60.025714] R10: ffff9b300a78c470 R11: 0000000000000478 R12: 0000000000000000
[ 60.032890] R13: ffff9b300c3b68e0 R14: 0000000000000001 R15: ffffad93429f38e0
[ 60.040068] FS: 00007feabc8959c0(0000) GS:ffff9b379f880000(0000) knlGS:0000000000000000
[ 60.048198] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[ 60.053983] CR2: 000056044c8a3dc0 CR3: 000000010ce08001 CR4: 0000000000770ee0
[ 60.061155] PKRU: 55555554
[ 60.063890] Call Trace:
[ 60.066362] <TASK>
[ 60.068493] xe_migrate_copy+0xb1f/0xf50 [xe]
[ 60.072908] xe_bo_move+0x3bf/0x6e0 [xe]
[ 60.076885] ? xe_ttm_tt_populate+0xb7/0xe0 [xe]
[ 60.081543] ttm_bo_handle_move_mem+0xbd/0x180 [ttm]
[ 60.086539] ttm_bo_bounce_temp_buffer.constprop.0+0x81/0xa0 [ttm]
[ 60.092758] ttm_bo_evict+0x94/0x170 [ttm]
[ 60.096886] ? dma_resv_list_alloc+0x1f/0x50
[ 60.101189] ? ttm_bo_eviction_valuable+0x37/0x40 [ttm]
[ 60.106457] ttm_mem_evict_first+0x144/0x360 [ttm]
[ 60.111288] ttm_bo_mem_space+0x1de/0x230 [ttm]
[ 60.115854] ttm_bo_validate+0xa7/0x120 [ttm]
[ 60.120244] ? _raw_write_unlock+0x16/0x40
[ 60.124368] ? drm_vma_offset_add+0x34/0x70 [drm]
[ 60.129123] ttm_bo_init_reserved+0x16d/0x1a0 [ttm]
[ 60.134033] __xe_bo_create_locked+0x154/0x240 [xe]
[ 60.138953] ? xe_ttm_io_mem_pfn+0xf0/0xf0 [xe]
[ 60.143526] xe_bo_create_locked+0xcd/0x160 [xe]
[ 60.148182] xe_gem_create_ioctl+0xb9/0x2a0 [xe]
[ 60.152839] ? xe_bo_vunmap+0x60/0x60 [xe]
[ 60.156972] drm_ioctl_kernel+0xb8/0x150 [drm]
[ 60.161470] drm_ioctl+0x24d/0x440 [drm]
[ 60.165443] ? xe_bo_vunmap+0x60/0x60 [xe]
[ 60.169583] ? arch_do_signal_or_restart+0x37/0x740
[ 60.174495] ? preempt_count_add+0x82/0xc0
[ 60.178621] ? _raw_spin_unlock_irq+0x1f/0x40
[ 60.183011] __x64_sys_ioctl+0x40c/0x930
[ 60.186968] ? debug_smp_processor_id+0x17/0x20
[ 60.191525] ? fpregs_assert_state_consistent+0x2a/0x50
[ 60.196786] ? exit_to_user_mode_prepare+0x45/0x1a0
[ 60.201700] do_syscall_64+0x38/0x90
[ 60.205306] entry_SYSCALL_64_after_hwframe+0x63/0xcd
[ 60.210392] RIP: 0033:0x7feabdf1aaff
[ 60.213996] Code: 00 48 89 44 24 18 31 c0 48 8d 44 24 60 c7 04 24 10 00 00 00 48 89 44 24 08 48 8d 44 24 20 48 89 44 24 10 b8 10 00 00 00 0f 05 <41> 89 c0 3d 00 f0 ff ff 77 1f 48 8b 44 24 18 64 48 2b 04 25 28 00
[ 60.232833] RSP: 002b:00007ffecee17aa0 EFLAGS: 00000246 ORIG_RAX: 0000000000000010
[ 60.240447] RAX: ffffffffffffffda RBX: 00007ffecee17b30 RCX: 00007feabdf1aaff
[ 60.247626] RDX: 00007ffecee17b30 RSI: 00000000c0306441 RDI: 0000000000000003
[ 60.254801] RBP: 00000000c0306441 R08: 00007ffecee17840 R09: 0000000000000000
[ 60.261974] R10: 0000000000000008 R11: 0000000000000246 R12: 00005578bc972008
[ 60.269145] R13: 0000000000000003 R14: 00005578bc973cf0 R15: 00007feabe18d040
[ 60.276318] </TASK>
[ 60.278526] Modules linked in: xe drm_ttm_helper drm_suballoc_helper gpu_sched drm_buddy ttm xt_conntrack xt_MASQUERADE nf_conntrack_netlink nfnetlink xfrm_user xfrm_algo xt_addrtype iptable_filter iptable_nat nf_nat nf_conntrack nf_defrag_ipv6 nf_defrag_ipv4 libcrc32c bpfilter br_netfilter bridge stp llc overlay binfmt_misc nls_iso8859_1 intel_rapl_msr intel_rapl_common x86_pkg_temp_thermal intel_powerclamp coretemp kvm_intel kvm mei_hdcp crct10dif_pclmul ghash_clmulni_intel input_leds sha512_ssse3 ee1004 aesni_intel mei_me crypto_simd cryptd mei rapl intel_hid wmi_bmof intel_cstate mac_hid efi_pstore sparse_keymap acpi_pad acpi_tad sch_fq_codel ipmi_devintf ipmi_msghandler msr parport_pc ppdev lp parport drm nfsd auth_rpcgss nfs_acl lockd grace sunrpc ip_tables x_tables autofs4 hid_generic usbhid hid nvme i2c_i801 crc32_pclmul nvme_core e1000e ahci intel_lpss_pci i2c_smbus intel_lpss libahci idma64 xhci_pci virt_dma xhci_pci_renesas video wmi pinctrl_alderlake
[ 60.364020] ---[ end trace 0000000000000000 ]---
[ 60.383366] RIP: 0010:emit_pte.constprop.0+0x216/0x240 [xe]
[ 60.388988] Code: ff 49 8b 07 4c 8d a8 00 10 00 00 4d 89 2f 8b 47 18 49 39 c5 72 16 49 29 c5 e8 d6 ca d4 d0 48 89 c7 48 85 c0 75 e8 0f 0b 0f 0b <0f> 0b 4d 89 2f 8b 47 18 49 89 7f 28 4c 29 e8 49 89 47 08 41 83 ec
[ 60.407827] RSP: 0018:ffffad93429f37b0 EFLAGS: 00010293
[ 60.413082] RAX: 0000000000000000 RBX: ffff9b300c3b68e0 RCX: 0000000000000001
[ 60.420256] RDX: ffff9b3050d00390 RSI: 0000000000008008 RDI: ffff9b3050d00390
[ 60.427428] RBP: ffffad93429f37e8 R08: 0000000000000029 R09: 0000000000000001
[ 60.434605] R10: ffff9b300a78c470 R11: 0000000000000478 R12: 0000000000000000
[ 60.441775] R13: ffff9b300c3b68e0 R14: 0000000000000001 R15: ffffad93429f38e0
[ 60.448952] FS: 00007feabc8959c0(0000) GS:ffff9b379f880000(0000) knlGS:0000000000000000
[ 60.457086] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[ 60.462863] CR2: 000056044c8a3dc0 CR3: 000000010ce08001 CR4: 0000000000770ee0
[ 60.470038] PKRU: 55555554