Another amdgpu bug: dc_validate_global_state+0x30a/0x3e0 (the WARNING itself is raised in dmub_psr_get_state+0xc6/0xd0, dmub_psr.c:126)
This happened after resuming from suspend on kernel 6.4.12 (6.4.12-arch1-1):
[53072.882164] [drm] DM_MST: starting TM on aconnector: 0000000055eb9bb7 [id: 99]
[53072.892882] [drm] DM_MST: DP14, 4-lane link detected
[53074.285873] ------------[ cut here ]------------
[53074.285878] WARNING: CPU: 4 PID: 724 at drivers/gpu/drm/amd/amdgpu/../display/dc/dce/dmub_psr.c:126 dmub_psr_get_state+0xc6/0xd0 [amdgpu]
[53074.286242] Modules linked in: hid_jabra uinput rfcomm snd_seq_dummy snd_hrtimer snd_seq uhid 8021q garp mrp stp llc ccm michael_mic cmac algif_hash algif_skcipher af_alg bnep snd_soc_acp6x_mach snd_soc_dmic snd_acp6x_pdm_dma snd_sof_amd_rembrandt snd_sof_amd_renoir snd_sof_amd_acp snd_sof_pci r8153_ecm snd_sof_xtensa_dsp cdc_ether qrtr_mhi usbnet snd_ctl_led snd_sof snd_sof_utils qrtr snd_soc_core snd_hda_codec_realtek ath11k_pci snd_hda_codec_generic snd_compress amdgpu snd_hda_codec_hdmi ledtrig_audio ac97_bus ath11k btusb btrtl snd_pcm_dmaengine snd_hda_intel snd_hda_scodec_cs35l41_spi btbcm snd_pci_ps snd_intel_dspcfg qmi_helpers drm_buddy btintel intel_rapl_msr gpu_sched snd_usb_audio snd_rpl_pci_acp6x hid_sensor_als snd_intel_sdw_acpi intel_rapl_common btmtk mac80211 i2c_algo_bit snd_acp_pci hid_sensor_trigger drm_suballoc_helper snd_hda_codec snd_usbmidi_lib uvcvideo bluetooth edac_mce_amd videobuf2_vmalloc snd_rawmidi snd_pci_acp6x libarc4 industrialio_triggered_buffer drm_ttm_helper snd_hda_core uvc
[53074.286313] snd_seq_device snd_hda_scodec_cs35l41_i2c hp_wmi videobuf2_memops kfifo_buf kvm_amd snd_pci_acp5x ttm snd_hda_scodec_cs35l41 hid_sensor_iio_common snd_hwdep videobuf2_v4l2 cfg80211 industrialio hid_multitouch ecdh_generic sparse_keymap videodev snd_rn_pci_acp3x snd_hda_cs_dsp_ctls drm_display_helper snd_pcm snd_acp_config kvm hid_sensor_hub ucsi_acpi cs_dsp snd_soc_acpi videobuf2_common r8152 cec rfkill sp5100_tco typec_ucsi snd_soc_cs35l41_lib snd_timer wmi_bmof irqbypass mc thunderbolt rapl mii typec pcspkr crc16 k10temp i2c_piix4 snd_pci_acp3x snd video amd_sfh soundcore mhi roles mousedev wmi amd_pmf i2c_hid_acpi joydev i2c_hid platform_profile serial_multi_instantiate wireless_hotkey amd_pmc acpi_tad mac_hid crypto_user loop fuse bpf_preload ip_tables x_tables btrfs blake2b_generic libcrc32c crc32c_generic xor raid6_pq vfat fat hid_logitech_hidpp hid_logitech_dj usbhid uas usb_storage dm_crypt cbc encrypted_keys trusted asn1_encoder tee dm_mod serio_raw atkbd libps2 crct10dif_pclmul crc32_pclmul
[53074.286388] crc32c_intel polyval_clmulni polyval_generic gf128mul vivaldi_fmap ghash_clmulni_intel sha512_ssse3 aesni_intel nvme crypto_simd nvme_core cryptd xhci_pci i8042 ccp nvme_common xhci_pci_renesas serio
[53074.286404] CPU: 4 PID: 724 Comm: Xorg Not tainted 6.4.12-arch1-1 #1 3e6fa2753a2d75925c34ecb78e22e85a65d083df
[53074.286407] Hardware name: HP HP EliteBook 845 14 inch G9 Notebook PC/8990, BIOS U82 Ver. 01.06.00 07/03/2023
[53074.286409] RIP: 0010:dmub_psr_get_state+0xc6/0xd0 [amdgpu]
[53074.286606] Code: 00 00 74 b4 48 8b 44 24 08 65 48 2b 04 25 28 00 00 00 75 1a 48 83 c4 10 5b 5d 41 5c 41 5d e9 d1 5d 2f f7 3d ff 00 00 00 75 da <0f> 0b eb d6 e8 41 d8 2d f7 90 90 90 90 90 90 90 90 90 90 90 90 90
[53074.286607] RSP: 0018:ffffc204021bb630 EFLAGS: 00010246
[53074.286609] RAX: 00000000000000ff RBX: 00000000000003e9 RCX: 0000000000000004
[53074.286611] RDX: 0000000000000000 RSI: 0000000000001681 RDI: ffff9cf095780000
[53074.286612] RBP: ffff9cf09ea3d400 R08: 0000000000000000 R09: ffffc204409e4000
[53074.286613] R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000000000
[53074.286614] R13: ffffc204021bb66c R14: ffff9cf08460a000 R15: 0000000000000000
[53074.286616] FS: 00007f657eb62480(0000) GS:ffff9cf3ce900000(0000) knlGS:0000000000000000
[53074.286617] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[53074.286618] CR2: 00007f656181c000 CR3: 000000010b036000 CR4: 0000000000750ee0
[53074.286620] PKRU: 55555554
[53074.286620] Call Trace:
[53074.286624] <TASK>
[53074.286626] ? dmub_psr_get_state+0xc6/0xd0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.286811] ? __warn+0x81/0x130
[53074.286817] ? dmub_psr_get_state+0xc6/0xd0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.287002] ? report_bug+0x171/0x1a0
[53074.287008] ? handle_bug+0x3c/0x80
[53074.287011] ? exc_invalid_op+0x17/0x70
[53074.287013] ? asm_exc_invalid_op+0x1a/0x20
[53074.287022] ? dmub_psr_get_state+0xc6/0xd0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.287210] dmub_psr_enable+0xde/0x120 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.287391] edp_set_psr_allow_active+0x27e/0x3b0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.287573] dc_set_psr_allow_active+0x91/0xf0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.287737] amdgpu_dm_atomic_commit_tail+0x5ad/0x3ab0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.287927] ? srso_alias_return_thunk+0x5/0x7f
[53074.287931] ? dcn31x_populate_dml_pipes_from_context+0x32/0x90 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.288098] ? srso_alias_return_thunk+0x5/0x7f
[53074.288101] ? dcn31_populate_dml_pipes_from_context+0x5c/0x320 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.288265] ? srso_alias_return_thunk+0x5/0x7f
[53074.288267] ? dcn30_internal_validate_bw+0xf1/0x9d0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.288430] ? srso_alias_return_thunk+0x5/0x7f
[53074.288432] ? dcn31_calculate_wm_and_dlg_fp+0x5b/0x650 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.288618] ? srso_alias_return_thunk+0x5/0x7f
[53074.288620] ? dcn31_validate_bandwidth+0x12f/0x2d0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.288787] ? srso_alias_return_thunk+0x5/0x7f
[53074.288789] ? dc_validate_global_state+0x30a/0x3e0 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.288949] ? srso_alias_return_thunk+0x5/0x7f
[53074.288951] ? dma_resv_iter_first_unlocked+0x66/0x70
[53074.288955] ? srso_alias_return_thunk+0x5/0x7f
[53074.288956] ? dma_resv_get_fences+0x61/0x220
[53074.288959] ? srso_alias_return_thunk+0x5/0x7f
[53074.288961] ? dma_resv_get_singleton+0x46/0x140
[53074.288963] ? srso_alias_return_thunk+0x5/0x7f
[53074.288964] ? wait_for_completion_timeout+0x13e/0x170
[53074.288967] ? wait_for_completion_interruptible+0x139/0x1e0
[53074.288971] commit_tail+0x94/0x130
[53074.288976] drm_atomic_helper_commit+0x11a/0x140
[53074.288979] drm_atomic_commit+0x9a/0xd0
[53074.288983] ? __pfx___drm_printfn_info+0x10/0x10
[53074.288988] drm_atomic_connector_commit_dpms+0xce/0xf0
[53074.288990] drm_mode_obj_set_property_ioctl+0x197/0x3d0
[53074.288995] ? __pfx_drm_connector_property_set_ioctl+0x10/0x10
[53074.288998] drm_connector_property_set_ioctl+0x3d/0x60
[53074.289001] drm_ioctl_kernel+0xcd/0x170
[53074.289004] drm_ioctl+0x26d/0x4b0
[53074.289006] ? __pfx_drm_connector_property_set_ioctl+0x10/0x10
[53074.289011] amdgpu_drm_ioctl+0x4e/0x90 [amdgpu ea9e65dd5e9c96aec8b9df1aea0447da7c31ea64]
[53074.289138] __x64_sys_ioctl+0x94/0xd0
[53074.289144] do_syscall_64+0x60/0x90
[53074.289147] ? srso_alias_return_thunk+0x5/0x7f
[53074.289149] ? do_writev+0x117/0x160
[53074.289152] ? srso_alias_return_thunk+0x5/0x7f
[53074.289154] ? syscall_exit_to_user_mode+0x2b/0x40
[53074.289157] ? srso_alias_return_thunk+0x5/0x7f
[53074.289159] ? do_syscall_64+0x6c/0x90
[53074.289160] ? do_syscall_64+0x6c/0x90
[53074.289161] ? syscall_exit_to_user_mode+0x2b/0x40
[53074.289163] ? srso_alias_return_thunk+0x5/0x7f
[53074.289165] ? do_syscall_64+0x6c/0x90
[53074.289166] ? srso_alias_return_thunk+0x5/0x7f
[53074.289168] ? syscall_exit_to_user_mode+0x2b/0x40
[53074.289169] ? srso_alias_return_thunk+0x5/0x7f
[53074.289171] ? do_syscall_64+0x6c/0x90
[53074.289172] ? srso_alias_return_thunk+0x5/0x7f
[53074.289174] ? do_syscall_64+0x6c/0x90
[53074.289176] entry_SYSCALL_64_after_hwframe+0x72/0xdc
[53074.289178] RIP: 0033:0x7f657f50c9df
[53074.289224] Code: 00 48 89 44 24 18 31 c0 48 8d 44 24 60 c7 04 24 10 00 00 00 48 89 44 24 08 48 8d 44 24 20 48 89 44 24 10 b8 10 00 00 00 0f 05 <89> c2 3d 00 f0 ff ff 77 18 48 8b 44 24 18 64 48 2b 04 25 28 00 00
[53074.289230] RSP: 002b:00007ffd2a6babf0 EFLAGS: 00000246 ORIG_RAX: 0000000000000010
[53074.289233] RAX: ffffffffffffffda RBX: 0000000000000003 RCX: 00007f657f50c9df
[53074.289234] RDX: 00007ffd2a6bac80 RSI: 00000000c01064ab RDI: 0000000000000012
[53074.289234] RBP: 00007ffd2a6bac80 R08: 0000000000000002 R09: 000055566ed84490
[53074.289236] R10: 0000000000000000 R11: 0000000000000246 R12: 00000000c01064ab
[53074.289237] R13: 0000000000000012 R14: 0000000000000000 R15: 0000000000000000
[53074.289240] </TASK>
[53074.289241] ---[ end trace 0000000000000000 ]---
[53074.675640] [drm] perform_link_training_with_retries: Link(3) training attempt 1 of 10 failed @ rate(30) x lane(4) @ spread = 10 : fail reason:(1)
[53074.920862] [drm] perform_link_training_with_retries: Link(3) training attempt 2 of 10 failed @ rate(30) x lane(4) @ spread = 10 : fail reason:(1)
[53075.215375] [drm] perform_link_training_with_retries: Link(3) training attempt 3 of 10 failed @ rate(30) x lane(4) @ spread = 10 : fail reason:(1)
[53076.614366] [drm] perform_link_training_with_retries: Link(3) training attempt 4 of 10 failed @ rate(30) x lane(4) @ spread = 10 : fail reason:(1)
[53078.102698] [drm] perform_link_training_with_retries: Link(3) training attempt 5 of 10 failed @ rate(30) x lane(4) @ spread = 10 : fail reason:(1)
[53079.630551] [drm] perform_link_training_with_retries: Link(3) training attempt 6 of 10 failed @ rate(30) x lane(4) @ spread = 10 : fail reason:(1)