On Fri, Sep 06, 2024 at 06:06:00AM +0000, Bunkmate wrote:
> >Synopsis:    kernel drm errors running latest snapshot
> >Category:    kernel drm
> >Environment:
>       System      : OpenBSD 7.6
>       Details     : OpenBSD 7.6-beta (GENERIC.MP) #311: Thu Sep  5 10:15:45 
> MDT 2024
>                        
> dera...@amd64.openbsd.org:/usr/src/sys/arch/amd64/compile/GENERIC.MP
> 
>       Architecture: OpenBSD.amd64
>       Machine     : amd64
> >Description:
>       The latest snapshot has introduced drm errors.
> >How-To-Repeat:
>       Reboot system and review dmesg output.
> >Fix:
>       Unknown.
> 
> dmesg:
> OpenBSD 7.6-beta (GENERIC.MP) #311: Thu Sep  5 10:15:45 MDT 2024
>     dera...@amd64.openbsd.org:/usr/src/sys/arch/amd64/compile/GENERIC.MP
> real mem = 16450445312 (15688MB)
> avail mem = 15928520704 (15190MB)
> random: good seed from bootblocks
> mpath0 at root
> scsibus0 at mpath0: 256 targets
> mainbus0 at root
> bios0 at mainbus0: SMBIOS rev. 3.3 @ 0xe8d60 (52 entries)
> bios0: vendor American Megatrends International, LLC. version "F18" date 
> 03/22/2024
> bios0: Gigabyte Technology Co., Ltd. A520M S2H
> acpi0 at bios0: ACPI 6.2
> acpi0: sleep states S0 S3 S4 S5
> acpi0: tables DSDT FACP SSDT IVRS SSDT SSDT SSDT FIDT MCFG HPET FPDT TPM2 
> SSDT CRAT CDIT WPBT SSDT SSDT SSDT WSMT APIC SSDT SSDT SSDT
> acpi0: wakeup devices GP17(S4) XHC0(S4) XHC1(S4) GPP0(S4) PTXH(S4) PT20(S4) 
> PT21(S4) PT22(S4) PT23(S4) PT24(S4) PT26(S4) PT27(S4) PT28(S4) PT29(S4)
> acpitimer0 at acpi0: 3579545 Hz, 32 bits
> acpimcfg0 at acpi0
> acpimcfg0: addr 0xf0000000, bus 0-127
> acpihpet0 at acpi0: 14318180 Hz
> acpimadt0 at acpi0 addr 0xfee00000: PC-AT compat
> cpu0 at mainbus0: apid 0 (boot processor)
> cpu0: AMD Ryzen 5 5600G with Radeon Graphics, 3900.01 MHz, 19-50-00, patch 
> 0a50000f
> cpu0: cpuid 1 
> edx=178bfbff<FPU,VME,DE,PSE,TSC,MSR,PAE,MCE,CX8,APIC,SEP,MTRR,PGE,MCA,CMOV,PAT,PSE36,CFLUSH,MMX,FXSR,SSE,SSE2,HTT>
>  
> ecx=76f8320b<SSE3,PCLMUL,MWAIT,SSSE3,FMA3,CX16,SSE4.1,SSE4.2,x2APIC,MOVBE,POPCNT,AES,XSAVE,AVX,F16C,RDRAND>
> cpu0: cpuid 6 eax=4<ARAT> ecx=1<EFFFREQ>
> cpu0: cpuid 7.0 
> ebx=219c97a9<FSGSBASE,BMI1,AVX2,SMEP,BMI2,ERMS,INVPCID,PQM,RDSEED,ADX,SMAP,CLFLUSHOPT,CLWB,SHA>
>  ecx=40068c<UMIP,PKU> edx=10
> cpu0: cpuid d.1 eax=f<XSAVEOPT,XSAVEC,XGETBV1,XSAVES>
> cpu0: cpuid 80000001 edx=2fd3fbff<NXE,MMXX,FFXSR,PAGE1GB,RDTSCP,LONG> 
> ecx=75c237ff<LAHF,CMPLEG,SVM,EAPICSP,AMCR8,ABM,SSE4A,MASSE,3DNOWP,OSVW,IBS,SKINIT,TCE,TOPEXT,CPCTR,DBKP,PCTRL3,MWAITX>
> cpu0: cpuid 80000007 edx=6799<HWPSTATE,ITSC>
> cpu0: cpuid 80000008 
> ebx=191ef657<IBPB,IBRS,STIBP,STIBP_ALL,IBRS_PREF,IBRS_SM,SSBD>
> cpu0: cpuid 8000001F 
> eax=1780f<SME,SEV,PFLUSH_MSR,SEVES,REQ64BITHOST,RESTINJ,ALTINJ,DBGSTSW,VTE> 
> edx=1
> cpu0: 32KB 64b/line 8-way D-cache, 32KB 64b/line 8-way I-cache, 512KB 
> 64b/line 8-way L2 cache, 16MB 64b/line 16-way L3 cache
> cpu0: smt 0, core 0, package 0
> mtrr: Pentium Pro MTRR support, 8 var ranges, 88 fixed ranges
> cpu0: apic clock running at 100MHz
> cpu0: mwait min=64, max=64, C-substates=1.1, IBE
> cpu1 at mainbus0: apid 2 (application processor)
> cpu1: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu1: smt 0, core 1, package 0
> cpu2 at mainbus0: apid 4 (application processor)
> cpu2: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu2: smt 0, core 2, package 0
> cpu3 at mainbus0: apid 6 (application processor)
> cpu3: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu3: smt 0, core 3, package 0
> cpu4 at mainbus0: apid 8 (application processor)
> cpu4: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu4: smt 0, core 4, package 0
> cpu5 at mainbus0: apid 10 (application processor)
> cpu5: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu5: smt 0, core 5, package 0
> cpu6 at mainbus0: apid 1 (application processor)
> cpu6: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu6: smt 1, core 0, package 0
> cpu7 at mainbus0: apid 3 (application processor)
> cpu7: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu7: smt 1, core 1, package 0
> cpu8 at mainbus0: apid 5 (application processor)
> cpu8: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu8: smt 1, core 2, package 0
> cpu9 at mainbus0: apid 7 (application processor)
> cpu9: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu9: smt 1, core 3, package 0
> cpu10 at mainbus0: apid 9 (application processor)
> cpu10: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu10: smt 1, core 4, package 0
> cpu11 at mainbus0: apid 11 (application processor)
> cpu11: AMD Ryzen 5 5600G with Radeon Graphics, 3900.00 MHz, 19-50-00, patch 
> 0a50000f
> cpu11: smt 1, core 5, package 0
> ioapic0 at mainbus0: apid 13 pa 0xfec00000, version 21, 24 pins
> ioapic1 at mainbus0: apid 14 pa 0xfec01000, version 21, 32 pins
> acpiprt0 at acpi0: bus 0 (PCI0)
> acpiprt1 at acpi0: bus -1 (GPP6)
> acpiprt2 at acpi0: bus -1 (GPP7)
> acpiprt3 at acpi0: bus -1 (GPP8)
> acpiprt4 at acpi0: bus -1 (GPP9)
> acpiprt5 at acpi0: bus 6 (GP17)
> acpiprt6 at acpi0: bus -1 (GPP0)
> acpiprt7 at acpi0: bus -1 (GP18)
> acpiprt8 at acpi0: bus 5 (GPP4)
> acpiprt9 at acpi0: bus -1 (GPP5)
> acpiprt10 at acpi0: bus 1 (GPP3)
> acpipci0 at acpi0 PCI0: 0x00000010 0x00000011 0x00000000
> acpicmos0 at acpi0
> com0 at acpi0 UAR1 addr 0x3f8/0x8 irq 4: ns16550a, 16 byte fifo
> acpibtn0 at acpi0: PWRB
> amdgpio0 at acpi0 GPIO uid 0 addr 0xfed81500/0x400 irq 7, 184 pins
> tpm0 at acpi0 TPM_: unsupported TPM2 start method 2
> "ACPI0010" at acpi0 not configured
> acpicpu0 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu1 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu2 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu3 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu4 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu5 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu6 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu7 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu8 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu9 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu10 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> acpicpu11 at acpi0: C3(0@350 io@0x415), C2(0@18 io@0x414), C1(0@1 mwait), PSS
> "AMDIF030" at acpi0 not configured
> "PNP0C14" at acpi0 not configured
> "PNP0C14" at acpi0 not configured
> acpitz0 at acpi0: critical temperature is 20 degC
> acpitz1 at acpi0: critical temperature is 20 degC
> acpivideo0 at acpi0: VGA_
> acpivout0 at acpivideo0: LCD_
> cpu0: 3900 MHz: speeds: 3900 1700 1400 MHz
> pci0 at mainbus0 bus 0
> ksmn0 at pci0 dev 0 function 0 "AMD 17h/6xh Root Complex" rev 0x00
> "AMD 17h/6xh IOMMU" rev 0x00 at pci0 dev 0 function 2 not configured
> pchb0 at pci0 dev 1 function 0 "AMD 17h/6xh Host" rev 0x00
> pchb1 at pci0 dev 2 function 0 "AMD 17h/6xh Host" rev 0x00
> ppb0 at pci0 dev 2 function 1 "AMD 17h/6xh PCIE" rev 0x00: msi
> pci1 at ppb0 bus 1
> xhci0 at pci1 dev 0 function 0 vendor "AMD", unknown product 0x43ec rev 0x00: 
> msix, xHCI 1.10
> usb0 at xhci0: USB revision 3.0
> uhub0 at usb0 configuration 1 interface 0 "AMD xHCI root hub" rev 3.00/1.00 
> addr 1
> ahci0 at pci1 dev 0 function 1 "AMD 500 Series AHCI" rev 0x00: msi, AHCI 1.3.1
> scsibus1 at ahci0: 32 targets
> ppb1 at pci1 dev 0 function 2 "AMD 500 Series PCIE" rev 0x00
> pci2 at ppb1 bus 2
> ppb2 at pci2 dev 1 function 0 "AMD 500 Series PCIE" rev 0x00: msi
> pci3 at ppb2 bus 3
> re0 at pci3 dev 0 function 0 "Realtek 8168" rev 0x06: RTL8168E/8111E-VL 
> (0x2c80), msi, address 00:13:3b:e4:03:c4
> rgephy0 at re0 phy 7: RTL8169S/8110S/8211, rev. 5
> ppb3 at pci2 dev 3 function 0 "AMD 500 Series PCIE" rev 0x00: msi
> pci4 at ppb3 bus 4
> re1 at pci4 dev 0 function 0 "Realtek 8168" rev 0x16: RTL8168H/8111H 
> (0x5400), msi, address 18:c0:4d:6e:31:49
> rgephy1 at re1 phy 7: RTL8251, rev. 0
> ppb4 at pci0 dev 2 function 2 "AMD 17h/6xh PCIE" rev 0x00: msi
> pci5 at ppb4 bus 5
> nvme0 at pci5 dev 0 function 0 "SanDisk SN750" rev 0x00: msix, NVMe 1.4
> nvme0: WD Blue SN570 1TB, firmware 234100WD, serial 21411U801035
> scsibus2 at nvme0: 2 targets, initiator 0
> sd0 at scsibus2 targ 1 lun 0: <NVMe, WD Blue SN570 1T, 2341>
> sd0: 953869MB, 512 bytes/sector, 1953525168 sectors
> pchb2 at pci0 dev 8 function 0 "AMD 17h/6xh Host" rev 0x00
> ppb5 at pci0 dev 8 function 1 "AMD 17h/6xh PCIE" rev 0x00
> pci6 at ppb5 bus 6
> amdgpu0 at pci6 dev 0 function 0 "ATI Cezanne" rev 0xc9
> drm0 at amdgpu0
> amdgpu0: msi
> azalia0 at pci6 dev 0 function 1 "ATI Renoir HD Audio" rev 0x00: msi
> azalia0: no supported codecs
> ccp0 at pci6 dev 0 function 2 "AMD 17h/1xh Crypto" rev 0x00: msix
> xhci1 at pci6 dev 0 function 3 "AMD 17h/6xh xHCI" rev 0x00: msix, xHCI 1.10
> usb1 at xhci1: USB revision 3.0
> uhub1 at usb1 configuration 1 interface 0 "AMD xHCI root hub" rev 3.00/1.00 
> addr 1
> xhci2 at pci6 dev 0 function 4 "AMD 17h/6xh xHCI" rev 0x00: msix, xHCI 1.10
> usb2 at xhci2: USB revision 3.0
> uhub2 at usb2 configuration 1 interface 0 "AMD xHCI root hub" rev 3.00/1.00 
> addr 1
> azalia1 at pci6 dev 0 function 6 "AMD 17h/1xh HD Audio" rev 0x00: msi
> azalia1: codecs: Realtek ALC887
> audio0 at azalia1
> piixpm0 at pci0 dev 20 function 0 "AMD FCH SMBus" rev 0x51: SMI
> iic0 at piixpm0
> spdmem0 at iic0 addr 0x52: 8GB DDR4 SDRAM PC4-17000
> spdmem1 at iic0 addr 0x53: 8GB DDR4 SDRAM PC4-17000
> iic1 at piixpm0
> pcib0 at pci0 dev 20 function 3 "AMD FCH LPC" rev 0x51
> pchb3 at pci0 dev 24 function 0 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb4 at pci0 dev 24 function 1 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb5 at pci0 dev 24 function 2 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb6 at pci0 dev 24 function 3 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb7 at pci0 dev 24 function 4 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb8 at pci0 dev 24 function 5 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb9 at pci0 dev 24 function 6 "AMD 19h/5xh Data Fabric" rev 0x00
> pchb10 at pci0 dev 24 function 7 "AMD 19h/5xh Data Fabric" rev 0x00
> isa0 at pcib0
> isadma0 at isa0
> pckbc0 at isa0 port 0x60/5 irq 1 irq 12
> pckbd0 at pckbc0 (kbd slot)
> wskbd0 at pckbd0: console keyboard
> pcppi0 at isa0 port 0x61
> spkr0 at pcppi0
> uhidev0 at uhub0 port 10 configuration 1 interface 0 "NOVATEK USB Keyboard" 
> rev 1.10/1.04 addr 2
> uhidev0: iclass 3/1
> ukbd0 at uhidev0: 8 variable keys, 6 key codes
> wskbd1 at ukbd0 mux 1
> uhidev1 at uhub0 port 10 configuration 1 interface 1 "NOVATEK USB Keyboard" 
> rev 1.10/1.04 addr 2
> uhidev1: iclass 3/0, 2 report ids
> uhid0 at uhidev1 reportid 1: input=1, output=0, feature=0
> ucc0 at uhidev1 reportid 2: 24 usages, 15 keys, enum
> wskbd2 at ucc0 mux 1
> uhidev2 at uhub0 port 11 configuration 1 interface 0 "Microsoft Microsoft 
> 3-Button Mouse with IntelliEye(TM)" rev 1.10/3.00 addr 3
> uhidev2: iclass 3/1
> ums0 at uhidev2: 3 buttons, Z dir
> wsmouse0 at ums0 mux 0
> uhidev3 at uhub0 port 12 configuration 1 interface 0 "ITE Tech. Inc. ITE 
> Device" rev 2.00/0.01 addr 4
> uhidev3: iclass 3/0, 204 report ids
> uhid1 at uhidev3 reportid 90: input=0, output=0, feature=16
> uhid2 at uhidev3 reportid 204: input=0, output=0, feature=63
> umass0 at uhub2 port 1 configuration 1 interface 0 "Lexar USB Flash Drive" 
> rev 2.00/11.00 addr 2
> umass0: using SCSI over Bulk-Only
> scsibus3 at umass0: 2 targets, initiator 0
> sd1 at scsibus3 targ 1 lun 0: <Lexar, USB Flash Drive, 1100> removable 
> serial.05dca8154UW4WBL5UG4T
> sd1: 59904MB, 512 bytes/sector, 122683392 sectors
> vscsi0 at root
> scsibus4 at vscsi0: 256 targets
> softraid0 at root
> scsibus5 at softraid0: 256 targets
> sd2 at scsibus5 targ 1 lun 0: <OPENBSD, SR CRYPTO, 006>
> sd2: 953869MB, 512 bytes/sector, 1953524576 sectors
> root on sd2a (f151aaf060fa90b5.a) swap on sd2b dump on sd2b
> amdgpu0: GREEN_SARDINE GC 9.3.0 7 CU rev 0x00
> drm:pid0:smu_adjust_power_state_dynamic *ERROR* Failed to set performance 
> level!drm:pid16547:smu_dpm_set_power_gate *ERROR* Failed to enable gfxoff!
> drm:pid51437:smu_dpm_set_power_gate *ERROR* Failed to power gate VCN!
> [drm] *ERROR* Dpm disable uvd failed, ret = -5. 
> drm:pid51437:smu_dpm_set_power_gate *ERROR* Failed to power gate JPEG!
> [drm] *ERROR* Dpm disable jpeg failed, ret = -5. 
> drm:pid16547:renoir_set_power_profile_mode *ERROR* Fail to set workload type 2
> amdgpu0: 1920x1080, 32bpp
> wsdisplay0 at amdgpu0 mux 1: console (std, vt100 emulation), using wskbd0
> wskbd1: connecting to wsdisplay0
> wskbd2: connecting to wsdisplay0
> wsdisplay0: screen 1-5 added (std, vt100 emulation)
> drm:pid17964:smu_dpm_set_power_gate *ERROR* Failed to power gate VCN!
> [drm] *ERROR* Dpm disable uvd failed, ret = -5. 
> drm:pid17964:smu_dpm_set_power_gate *ERROR* Failed to power gate JPEG!
> [drm] *ERROR* Dpm disable jpeg failed, ret = -5. 
> drm:pid41399:renoir_get_dpm_ultimate_freq *ERROR* Attempt to get max GX 
> frequency from SMC Failed !
> drm:pid41399:renoir_get_dpm_ultimate_freq *ERROR* Attempt to get min GX 
> frequency from SMC Failed !
> drm:pid17964:smu_dpm_set_power_gate *ERROR* Failed to enable gfxoff!
> drm:pid41399:renoir_get_dpm_ultimate_freq *ERROR* Attempt to get max GX 
> frequency from SMC Failed !
> drm:pid41399:renoir_get_dpm_ultimate_freq *ERROR* Attempt to get min GX 
> frequency from SMC Failed !

Do you still see this with the following diff to revert
'drm/amdgpu/swsmu: always force a state reprogram on init'?

Index: sys/dev/pci/drm/amd/pm/swsmu/amdgpu_smu.c
===================================================================
RCS file: /cvs/src/sys/dev/pci/drm/amd/pm/swsmu/amdgpu_smu.c,v
diff -u -p -r1.19 amdgpu_smu.c
--- sys/dev/pci/drm/amd/pm/swsmu/amdgpu_smu.c   5 Sep 2024 04:29:04 -0000       
1.19
+++ sys/dev/pci/drm/amd/pm/swsmu/amdgpu_smu.c   8 Sep 2024 07:21:27 -0000
@@ -1841,9 +1841,8 @@ static int smu_bump_power_profile_mode(s
 }
 
 static int smu_adjust_power_state_dynamic(struct smu_context *smu,
-                                         enum amd_dpm_forced_level level,
-                                         bool skip_display_settings,
-                                         bool force_update)
+                                  enum amd_dpm_forced_level level,
+                                  bool skip_display_settings)
 {
        int ret = 0;
        int index = 0;
@@ -1872,7 +1871,7 @@ static int smu_adjust_power_state_dynami
                }
        }
 
-       if (force_update || smu_dpm_ctx->dpm_level != level) {
+       if (smu_dpm_ctx->dpm_level != level) {
                ret = smu_asic_set_performance_level(smu, level);
                if (ret) {
                        dev_err(smu->adev->dev, "Failed to set performance 
level!");
@@ -1888,7 +1887,7 @@ static int smu_adjust_power_state_dynami
                index = index > 0 && index <= WORKLOAD_POLICY_MAX ? index - 1 : 
0;
                workload[0] = smu->workload_setting[index];
 
-               if (force_update || smu->power_profile_mode != workload[0])
+               if (smu->power_profile_mode != workload[0])
                        smu_bump_power_profile_mode(smu, workload, 0);
        }
 
@@ -1909,13 +1908,11 @@ static int smu_handle_task(struct smu_co
                ret = smu_pre_display_config_changed(smu);
                if (ret)
                        return ret;
-               ret = smu_adjust_power_state_dynamic(smu, level, false, false);
+               ret = smu_adjust_power_state_dynamic(smu, level, false);
                break;
        case AMD_PP_TASK_COMPLETE_INIT:
-               ret = smu_adjust_power_state_dynamic(smu, level, true, true);
-               break;
        case AMD_PP_TASK_READJUST_POWER_STATE:
-               ret = smu_adjust_power_state_dynamic(smu, level, true, false);
+               ret = smu_adjust_power_state_dynamic(smu, level, true);
                break;
        default:
                break;

Reply via email to