Hi
While loading the AMDGPU driver on a T1040 board, I am getting the following error. What could be the issue here?
root@t1042d4rdb:~# insmod /amdgpu.ko
[drm] amdgpu kernel modesetting enabled.
amdgpu 0001:01:00.0: enabling device (0006 -> 0007)
[drm] initializing kernel modesetting (POLARIS12 0x1002:0x6987 0x1787:0x2389 0x80).
amdgpu 0001:01:00.0: amdgpu: Trusted Memory Zone (TMZ) feature not supported
[drm] register mmio base: 0xA0000000
[drm] register mmio size: 262144
[drm] PCIE atomic ops is not supported
[drm] add ip block number 0 <vi_common>
[drm] add ip block number 1 <gmc_v8_0>
[drm] add ip block number 2 <tonga_ih>
[drm] add ip block number 3 <gfx_v8_0>
[drm] add ip block number 4 <sdma_v3_0>
[drm] add ip block number 5 <powerplay>
[drm] add ip block number 6 <dm>
[drm] add ip block number 7 <uvd_v6_0>
[drm] add ip block number 8 <vce_v3_0>
[drm:.check_atom_bios [amdgpu]] ATOMBIOS detected
amdgpu 0001:01:00.0: amdgpu: Fetched VBIOS from ROM BAR
amdgpu: ATOM BIOS: 113-ER16BFE-001
[drm:.amdgpu_atombios_init [amdgpu]] atom firmware requested 00000000 0kb
[drm] UVD is enabled in VM mode
[drm] UVD ENC is enabled in VM mode
[drm] VCE enabled in VM mode
[drm] GPU posting now...
[drm] vm size is 64 GB, 2 levels, block size is 10-bit, fragment size is 9-bit
[drm:.gmc_v8_0_sw_init [amdgpu]]
amdgpu 0001:01:00.0: BAR 2: releasing [mem 0xd10000000-0xd101fffff 64bit pref]
amdgpu 0001:01:00.0: BAR 0: releasing [mem 0xd00000000-0xd0fffffff 64bit pref]
pcieport 0001:00:00.0: BAR 9: releasing [mem 0xd00000000-0xeffffffff 64bit pref]
pcieport 0001:00:00.0: BAR 9: assigned [mem 0xd00000000-0xe7fffffff 64bit pref]
amdgpu 0001:01:00.0: BAR 0: assigned [mem 0xd00000000-0xdffffffff 64bit pref]
amdgpu 0001:01:00.0: BAR 2: assigned [mem 0xe00000000-0xe001fffff 64bit pref]
pcieport 0001:00:00.0: PCI bridge to [bus 01]
pcieport 0001:00:00.0: bridge window [io 0x8000080000010000-0x800008000001ffff]
pcieport 0001:00:00.0: bridge window [mem 0xa0000000-0xafffffff]
pcieport 0001:00:00.0: bridge window [mem 0xd00000000-0xe7fffffff 64bit pref]
amdgpu 0001:01:00.0: amdgpu: VRAM: 4096M 0x000000F400000000 - 0x000000F4FFFFFFFF (4096M used)
amdgpu 0001:01:00.0: amdgpu: GART: 256M 0x000000FF00000000 - 0x000000FF0FFFFFFF
[drm] Detected VRAM RAM=4096M, BAR=4096M
[drm] RAM width 128bits GDDR5
[drm] amdgpu: 4096M of VRAM memory ready
[drm] amdgpu: 1457M of GTT memory ready.
[drm] GART: num cpu pages 65536, num gpu pages 65536
[drm:.amdgpu_ucode_print_mc_hdr [amdgpu]] MC
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] size_bytes: 32608
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] header_size_bytes: 40
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] header_version_major: 1
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] header_version_minor: 0
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ip_version_major: 8
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ip_version_minor: 1
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ucode_version: 0x00b4dc50
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ucode_size_bytes: 32160
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ucode_array_offset_bytes: 448
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] crc32: 0x9b1e395c
[drm:.amdgpu_ucode_print_mc_hdr [amdgpu]] io_debug_size_bytes: 192
[drm:.amdgpu_ucode_print_mc_hdr [amdgpu]] io_debug_array_offset_bytes: 256
[drm] PCIE GART of 256M enabled (table at 0x000000F400000000).
[drm:.amdgpu_irq_init [amdgpu]] amdgpu: irq initialized.
[drm:.gfx_v8_0_sw_init [amdgpu]]
[drm] Chained IB support enabled!
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring gfx use gpu addr 0x000000ff00400040
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.0.0 use gpu addr 0x000000ff004000e0
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.1.0 use gpu addr 0x000000ff00400180
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.2.0 use gpu addr 0x000000ff00400220
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.3.0 use gpu addr 0x000000ff004002c0
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.0.1 use gpu addr 0x000000ff00400360
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.1.1 use gpu addr 0x000000ff00400400
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.2.1 use gpu addr 0x000000ff004004a0
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring comp_1.3.1 use gpu addr 0x000000ff00400540
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring kiq_2.1.0 use gpu addr 0x000000ff004005e0
[drm:.sdma_v3_0_sw_init [amdgpu]]
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring sdma0 use gpu addr 0x000000ff00400680
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring sdma1 use gpu addr 0x000000ff00400720
amdgpu: hwmgr_sw_init smu backed is polaris10_smu
[drm] Found UVD firmware Version: 1.130 Family ID: 16
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring uvd use gpu addr 0x000000f4001afa80
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring uvd_enc0 use gpu addr 0x000000ff00400860
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring uvd_enc1 use gpu addr 0x000000ff00400900
[drm] Found VCE firmware Version: 53.26 Binary ID: 3
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring vce0 use gpu addr 0x000000ff004009a0
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring vce1 use gpu addr 0x000000ff00400a40
amdgpu 0001:01:00.0: [drm:.amdgpu_fence_driver_start_ring [amdgpu]] fence driver on ring vce2 use gpu addr 0x000000ff00400ae0
[drm:.amdgpu_ucode_print_smc_hdr [amdgpu]] SMC
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] size_bytes: 130388
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] header_size_bytes: 36
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] header_version_major: 1
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] header_version_minor: 0
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ip_version_major: 7
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ip_version_minor: 2
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ucode_version: 0x00221700
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ucode_size_bytes: 130132
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] ucode_array_offset_bytes: 256
[drm:.amdgpu_ucode_print_common_hdr [amdgpu]] crc32: 0xae2b3b78
[drm:.amdgpu_ucode_print_smc_hdr [amdgpu]] ucode_start_addr: 131072
amdgpu:
failed to send message 100 ret is 0
amdgpu: SMU Firmware start failed!
amdgpu: Failed to load SMU ucode.
amdgpu: fw load failed
amdgpu: smu firmware loading failed
amdgpu 0001:01:00.0: amdgpu: amdgpu_device_ip_init failed
amdgpu 0001:01:00.0: amdgpu: Fatal error during GPU init
amdgpu 0001:01:00.0: amdgpu: amdgpu: finishing device.
[drm:.gfx_v8_0_set_eop_interrupt_state [amdgpu]] invalid me 2
[drm:.gfx_v8_0_set_eop_interrupt_state [amdgpu]] invalid me 2
[drm:.gfx_v8_0_set_eop_interrupt_state [amdgpu]] invalid me 2
[drm:.gfx_v8_0_set_eop_interrupt_state [amdgpu]] invalid me 2
amdgpu: probe of 0001:01:00.0 failed with error -22
BUG: Unable to handle kernel data access on read at 0x8000080080954000
Faulting instruction address: 0xc000000000011870
Oops: Kernel access of bad area, sig: 11 [#1]
BE PAGE_SIZE=4K SMP NR_CPUS=24 CoreNet Generic
Modules linked in: amdgpu(+) backlight drm_ttm_helper ttm gpu_sched ucc_uart fsl_jr_uio
CPU: 2 PID: 816 Comm: insmod Not tainted 5.15.71+g95448dd0dc9b #1
NIP: c000000000011870 LR: 8000000000e0d120 CTR: 0000000000058400
REGS: c00000000a956d80 TRAP: 0300 Not tainted (5.15.71+g95448dd0dc9b)
MSR: 0000000080029002 <CE,EE,ME> CR: 22002228 XER: 00000000
DEAR: 8000080080954000 ESR: 0000000000000000 IRQMASK: 0
GPR00: 8000000000e0d100 c00000000a957020 c0000000013faa00 c00000000c000000
GPR04: 8000080080954000 00000000002c2000 00000000000b0800 000000007ecc9000
GPR08: 0000000000058400 8000080080954000 c00000000bfffffc 80000000010b76d8
GPR12: c0000000000117f4 c00000003ffff140 000000010b5456f0 000000010b4fa188
GPR16: 0000000000000000 000000010b545810 000000010b5202b0 0000000000000000
GPR20: 0000000000000000 0000000000000000 c00000000ae16a48 8000080080954000
GPR24: 00000000002c2000 0000000000000000 c00000000ae00010 0000000000000001
GPR28: c00000000ae00000 c00000000ae10000 0000000000000000 c00000000ae10000
NIP [c000000000011870] ._memcpy_fromio+0x7c/0x100
LR [8000000000e0d120] .amdgpu_uvd_suspend+0x1d4/0x268 [amdgpu]
Call Trace:
[c00000000a957020] [8000000000e0d100] .amdgpu_uvd_suspend+0x1b4/0x268 [amdgpu] (unreliable)
[c00000000a9570f0] [8000000000e1110c] .uvd_v6_0_sw_fini+0x1c/0xcc [amdgpu]
[c00000000a957180] [8000000000cf24b0] .amdgpu_device_fini_sw+0x124/0x378 [amdgpu]
[c00000000a957240] [8000000000cf9e0c] .amdgpu_driver_release_kms+0x1c/0x40 [amdgpu]
[c00000000a9572c0] [c000000000704380] .devm_drm_dev_init_release+0x78/0xcc
[c00000000a957340] [c000000000755248] .devm_action_release+0x28/0x3c
[c00000000a9573b0] [c00000000075576c] .release_nodes+0x78/0x108
[c00000000a957450] [c000000000757174] .devres_release_all+0xa8/0x11c
[c00000000a957510] [c00000000074f788] .really_probe.part.0+0x1b8/0x440
[c00000000a9575b0] [c00000000074fad8] .__driver_probe_device+0xc8/0x198
[c00000000a957640] [c00000000074fbf8] .driver_probe_device+0x50/0x16c
[c00000000a9576e0] [c00000000075055c] .__driver_attach+0xb4/0x200
[c00000000a957770] [c00000000074c518] .bus_for_each_dev+0x9c/0x110
[c00000000a957820] [c00000000074eca4] .driver_attach+0x24/0x38
[c00000000a957890] [c00000000074e4ec] .bus_add_driver+0x1d4/0x2a8
[c00000000a957940] [c00000000075107c] .driver_register+0xa4/0x194
[c00000000a9579c0] [c0000000006217ec] .__pci_register_driver+0x58/0x6c
[c00000000a957a30] [80000000010a9608] .amdgpu_init+0x74/0x94 [amdgpu]
[c00000000a957ab0] [c0000000000021cc] .do_one_initcall+0x6c/0x284
[c00000000a957b90] [c0000000001174a4] .do_init_module+0x5c/0x2bc
[c00000000a957c30] [c00000000011a980] .__do_sys_finit_module+0xc4/0x10c
[c00000000a957d60] [c000000000012454] .system_call_exception+0x11c/0x1c4
[c00000000a957e10] [c0000000000001f8] system_call_common+0xf0/0x210
--- interrupt: c00 at 0x3fffbe532ee4
NIP: 00003fffbe532ee4 LR: 00000001366cdbfc CTR: 0000000000000000
REGS: c00000000a957e80 TRAP: 0c00 Not tainted (5.15.71+g95448dd0dc9b)
MSR: 000000008002d002 <CE,EE,PR,ME> CR: 28002882 XER: 00000000
IRQMASK: 0
GPR00: 0000000000000161 00003fffd14f61a0 00003fffbe637200 0000000000000003
GPR04: 00000001366d9148 0000000000000000 0000000000000000 0000000000000000
GPR08: 0000000000000000 0000000000000000 0000000000000000 0000000000000000
GPR12: 0000000000000000 00003fffbe6cf810 000000010b5456f0 000000010b4fa188
GPR16: 0000000000000000 000000010b545810 000000010b5202b0 0000000000000000
GPR20: 0000000000000000 0000000000000000 0000000000000002 00003fffd14f6ee5
GPR24: 00003fffd14f6860 00000001366fd9e8 0000000000000000 00000001366fcbd0
GPR28: 00000001366d9148 0000000000000000 0000000000000000 0000000136701760
NIP [00003fffbe532ee4] 0x3fffbe532ee4
LR [00000001366cdbfc] 0x1366cdbfc
--- interrupt: c00
Instruction dump:
4e800020 28250003 40810068 3905fffc 7908f082 38c80001 70c90001 3943fffc
7c892378 40820070 78c8f842 7d0903a6 <80e90000> 390a0004 90ea0004 7c0006ac
---[ end trace e1f14bc598aaf8c6 ]---
Segmentation fault