// linux/drivers/gpu/drm/amd/amdgpu/amdgpu_discovery.c (mariux64/linux @ 5493ee1)
/*
 * Copyright 2018 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#include <linux/firmware.h>

#include "amdgpu.h"
#include "amdgpu_discovery.h"
#include "soc15_hw_ip.h"
#include "discovery.h"

#include "soc15.h"
#include "gfx_v9_0.h"
#include "gmc_v9_0.h"
#include "df_v1_7.h"
#include "df_v3_6.h"
#include "nbio_v6_1.h"
#include "nbio_v7_0.h"
#include "nbio_v7_4.h"
#include "hdp_v4_0.h"
#include "vega10_ih.h"
#include "vega20_ih.h"
#include "sdma_v4_0.h"
#include "uvd_v7_0.h"
#include "vce_v4_0.h"
#include "vcn_v1_0.h"
#include "vcn_v2_5.h"
#include "jpeg_v2_5.h"
#include "smuio_v9_0.h"
#include "gmc_v10_0.h"
#include "gmc_v11_0.h"
#include "gfxhub_v2_0.h"
#include "mmhub_v2_0.h"
#include "nbio_v2_3.h"
#include "nbio_v4_3.h"
#include "nbio_v7_2.h"
#include "nbio_v7_7.h"
#include "hdp_v5_0.h"
#include "hdp_v5_2.h"
#include "hdp_v6_0.h"
#include "nv.h"
#include "soc21.h"
#include "navi10_ih.h"
#include "ih_v6_0.h"
#include "gfx_v10_0.h"
#include "gfx_v11_0.h"
#include "sdma_v5_0.h"
#include "sdma_v5_2.h"
#include "sdma_v6_0.h"
#include "lsdma_v6_0.h"
#include "vcn_v2_0.h"
#include "jpeg_v2_0.h"
#include "vcn_v3_0.h"
#include "jpeg_v3_0.h"
#include "vcn_v4_0.h"
#include "jpeg_v4_0.h"
#include "amdgpu_vkms.h"
#include "mes_v10_1.h"
#include "mes_v11_0.h"
#include "smuio_v11_0.h"
#include "smuio_v11_0_6.h"
#include "smuio_v13_0.h"
#include "smuio_v13_0_6.h"

#define FIRMWARE_IP_DISCOVERY "amdgpu/ip_discovery.bin"
MODULE_FIRMWARE(FIRMWARE_IP_DISCOVERY);

#define mmRCC_CONFIG_MEMSIZE	0xde3
#define mmMM_INDEX		0x0
#define mmMM_INDEX_HI		0x6
#define mmMM_DATA		0x1

static const char *hw_id_names[HW_ID_MAX] = {
	[MP1_HWID]		= "MP1",
	[MP2_HWID]		= "MP2",
	[THM_HWID]		= "THM",
	[SMUIO_HWID]		= "SMUIO",
	[FUSE_HWID]		= "FUSE",
	[CLKA_HWID]		= "CLKA",
	[PWR_HWID]		= "PWR",
	[GC_HWID]		= "GC",
	[UVD_HWID]		= "UVD",
	[AUDIO_AZ_HWID]		= "AUDIO_AZ",
	[ACP_HWID]		= "ACP",
	[DCI_HWID]		= "DCI",
	[DMU_HWID]		= "DMU",
	[DCO_HWID]		= "DCO",
	[DIO_HWID]		= "DIO",
	[XDMA_HWID]		= "XDMA",
	[DCEAZ_HWID]		= "DCEAZ",
	[DAZ_HWID]		= "DAZ",
	[SDPMUX_HWID]		= "SDPMUX",
	[NTB_HWID]		= "NTB",
	[IOHC_HWID]		= "IOHC",
	[L2IMU_HWID]		= "L2IMU",
	[VCE_HWID]		= "VCE",
	[MMHUB_HWID]		= "MMHUB",
	[ATHUB_HWID]		= "ATHUB",
	[DBGU_NBIO_HWID]	= "DBGU_NBIO",
	[DFX_HWID]		= "DFX",
	[DBGU0_HWID]		= "DBGU0",
	[DBGU1_HWID]		= "DBGU1",
	[OSSSYS_HWID]		= "OSSSYS",
	[HDP_HWID]		= "HDP",
	[SDMA0_HWID]		= "SDMA0",
	[SDMA1_HWID]		= "SDMA1",
	[SDMA2_HWID]		= "SDMA2",
	[SDMA3_HWID]		= "SDMA3",
	[LSDMA_HWID]		= "LSDMA",
	[ISP_HWID]		= "ISP",
	[DBGU_IO_HWID]		= "DBGU_IO",
	[DF_HWID]		= "DF",
	[CLKB_HWID]		= "CLKB",
	[FCH_HWID]		= "FCH",
	[DFX_DAP_HWID]		= "DFX_DAP",
	[L1IMU_PCIE_HWID]	= "L1IMU_PCIE",
	[L1IMU_NBIF_HWID]	= "L1IMU_NBIF",
	[L1IMU_IOAGR_HWID]	= "L1IMU_IOAGR",
	[L1IMU3_HWID]		= "L1IMU3",
	[L1IMU4_HWID]		= "L1IMU4",
	[L1IMU5_HWID]		= "L1IMU5",
	[L1IMU6_HWID]		= "L1IMU6",
	[L1IMU7_HWID]		= "L1IMU7",
	[L1IMU8_HWID]		= "L1IMU8",
	[L1IMU9_HWID]		= "L1IMU9",
	[L1IMU10_HWID]		= "L1IMU10",
	[L1IMU11_HWID]		= "L1IMU11",
	[L1IMU12_HWID]		= "L1IMU12",
	[L1IMU13_HWID]		= "L1IMU13",
	[L1IMU14_HWID]		= "L1IMU14",
	[L1IMU15_HWID]		= "L1IMU15",
	[WAFLC_HWID]		= "WAFLC",
	[FCH_USB_PD_HWID]	= "FCH_USB_PD",
	[PCIE_HWID]		= "PCIE",
	[PCS_HWID]		= "PCS",
	[DDCL_HWID]		= "DDCL",
	[SST_HWID]		= "SST",
	[IOAGR_HWID]		= "IOAGR",
	[NBIF_HWID]		= "NBIF",
	[IOAPIC_HWID]		= "IOAPIC",
	[SYSTEMHUB_HWID]	= "SYSTEMHUB",
	[NTBCCP_HWID]		= "NTBCCP",
	[UMC_HWID]		= "UMC",
	[SATA_HWID]		= "SATA",
	[USB_HWID]		= "USB",
	[CCXSEC_HWID]		= "CCXSEC",
	[XGMI_HWID]		= "XGMI",
	[XGBE_HWID]		= "XGBE",
	[MP0_HWID]		= "MP0",
};

static int hw_id_map[MAX_HWIP] = {
	[GC_HWIP]	= GC_HWID,
	[HDP_HWIP]	= HDP_HWID,
	[SDMA0_HWIP]	= SDMA0_HWID,
	[SDMA1_HWIP]	= SDMA1_HWID,
	[SDMA2_HWIP]	= SDMA2_HWID,
	[SDMA3_HWIP]	= SDMA3_HWID,
	[LSDMA_HWIP]	= LSDMA_HWID,
	[MMHUB_HWIP]	= MMHUB_HWID,
	[ATHUB_HWIP]	= ATHUB_HWID,
	[NBIO_HWIP]	= NBIF_HWID,
	[MP0_HWIP]	= MP0_HWID,
	[MP1_HWIP]	= MP1_HWID,
	[UVD_HWIP]	= UVD_HWID,
	[VCE_HWIP]	= VCE_HWID,
	[DF_HWIP]	= DF_HWID,
	[DCE_HWIP]	= DMU_HWID,
	[OSSSYS_HWIP]	= OSSSYS_HWID,
	[SMUIO_HWIP]	= SMUIO_HWID,
	[PWR_HWIP]	= PWR_HWID,
	[NBIF_HWIP]	= NBIF_HWID,
	[THM_HWIP]	= THM_HWID,
	[CLK_HWIP]	= CLKA_HWID,
	[UMC_HWIP]	= UMC_HWID,
	[XGMI_HWIP]	= XGMI_HWID,
	[DCI_HWIP]	= DCI_HWID,
	[PCIE_HWIP]	= PCIE_HWID,
};

static int amdgpu_discovery_read_binary_from_vram(struct amdgpu_device *adev,
						  uint8_t *binary)
{
	uint64_t vram_size = (uint64_t)RREG32(mmRCC_CONFIG_MEMSIZE) << 20;
	uint64_t pos = vram_size - DISCOVERY_TMR_OFFSET;

	amdgpu_device_vram_access(adev, pos, (uint32_t *)binary,
				  adev->mman.discovery_tmr_size, false);
	return 0;
}

static int amdgpu_discovery_read_binary_from_file(struct amdgpu_device *adev,
						  uint8_t *binary)
{
	const struct firmware *fw;
	const char *fw_name;
	int r;

	switch (amdgpu_discovery) {
	case 2:
		fw_name = FIRMWARE_IP_DISCOVERY;
		break;
	default:
		dev_warn(adev->dev, "amdgpu_discovery is not set properly\n");
		return -EINVAL;
	}

	r = request_firmware(&fw, fw_name, adev->dev);
	if (r) {
		dev_err(adev->dev, "can't load firmware \"%s\"\n",
			fw_name);
		return r;
	}

	memcpy((u8 *)binary, (u8 *)fw->data, adev->mman.discovery_tmr_size);
	release_firmware(fw);

	return 0;
}

static uint16_t amdgpu_discovery_calculate_checksum(uint8_t *data, uint32_t size)
{
	uint16_t checksum = 0;
	int i;

	for (i = 0; i < size; i++)
		checksum += data[i];

	return checksum;
}

static inline bool amdgpu_discovery_verify_checksum(uint8_t *data, uint32_t size,
						    uint16_t expected)
{
	return !!(amdgpu_discovery_calculate_checksum(data, size) == expected);
}

static inline bool amdgpu_discovery_verify_binary_signature(uint8_t *binary)
{
	struct binary_header *bhdr;

	bhdr = (struct binary_header *)binary;
	return (le32_to_cpu(bhdr->binary_signature) == BINARY_SIGNATURE);
}
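/*
 * Worked example (illustrative, not part of the driver): the discovery
 * checksum above is a plain byte-wise sum truncated to 16 bits, so
 *
 *	uint8_t data[] = { 0xff, 0x01, 0x80 };
 *	amdgpu_discovery_calculate_checksum(data, 3);	// == 0x0180
 *
 * 0xff + 0x01 + 0x80 = 0x180 fits in 16 bits; larger sums simply wrap
 * modulo 0x10000 before being compared against the expected value.
 */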
static void amdgpu_discovery_harvest_config_quirk(struct amdgpu_device *adev)
{
	/*
	 * So far, apply this quirk only on those Navy Flounder boards which
	 * have a bad harvest table of VCN config.
	 */
	if ((adev->ip_versions[UVD_HWIP][1] == IP_VERSION(3, 0, 1)) &&
	    (adev->ip_versions[GC_HWIP][0] == IP_VERSION(10, 3, 2))) {
		switch (adev->pdev->revision) {
		case 0xC1:
		case 0xC2:
		case 0xC3:
		case 0xC5:
		case 0xC7:
		case 0xCF:
		case 0xDF:
			adev->vcn.harvest_config |= AMDGPU_VCN_HARVEST_VCN1;
			break;
		default:
			break;
		}
	}
}

static int amdgpu_discovery_init(struct amdgpu_device *adev)
{
	struct table_info *info;
	struct binary_header *bhdr;
	uint16_t offset;
	uint16_t size;
	uint16_t checksum;
	int r;

	adev->mman.discovery_tmr_size = DISCOVERY_TMR_SIZE;
	adev->mman.discovery_bin = kzalloc(adev->mman.discovery_tmr_size, GFP_KERNEL);
	if (!adev->mman.discovery_bin)
		return -ENOMEM;

	r = amdgpu_discovery_read_binary_from_vram(adev, adev->mman.discovery_bin);
	if (r) {
		dev_err(adev->dev, "failed to read ip discovery binary from vram\n");
		r = -EINVAL;
		goto out;
	}

	if (!amdgpu_discovery_verify_binary_signature(adev->mman.discovery_bin)) {
		dev_warn(adev->dev, "get invalid ip discovery binary signature from vram\n");
		/* retry read ip discovery binary from file */
		r = amdgpu_discovery_read_binary_from_file(adev, adev->mman.discovery_bin);
		if (r) {
			dev_err(adev->dev, "failed to read ip discovery binary from file\n");
			r = -EINVAL;
			goto out;
		}
		/* check the ip discovery binary signature */
		if (!amdgpu_discovery_verify_binary_signature(adev->mman.discovery_bin)) {
			dev_warn(adev->dev, "get invalid ip discovery binary signature from file\n");
			r = -EINVAL;
			goto out;
		}
	}

	bhdr = (struct binary_header *)adev->mman.discovery_bin;

	offset = offsetof(struct binary_header, binary_checksum) +
		sizeof(bhdr->binary_checksum);
	size = le16_to_cpu(bhdr->binary_size) - offset;
	checksum = le16_to_cpu(bhdr->binary_checksum);

	if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
					      size, checksum)) {
		dev_err(adev->dev, "invalid ip discovery binary checksum\n");
		r = -EINVAL;
		goto out;
	}

	info = &bhdr->table_list[IP_DISCOVERY];
	offset = le16_to_cpu(info->offset);
	checksum = le16_to_cpu(info->checksum);

	if (offset) {
		struct ip_discovery_header *ihdr =
			(struct ip_discovery_header *)(adev->mman.discovery_bin + offset);

		if (le32_to_cpu(ihdr->signature) != DISCOVERY_TABLE_SIGNATURE) {
			dev_err(adev->dev, "invalid ip discovery data table signature\n");
			r = -EINVAL;
			goto out;
		}

		if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
						      le16_to_cpu(ihdr->size), checksum)) {
			dev_err(adev->dev, "invalid ip discovery data table checksum\n");
			r = -EINVAL;
			goto out;
		}
	}

	info = &bhdr->table_list[GC];
	offset = le16_to_cpu(info->offset);
	checksum = le16_to_cpu(info->checksum);

	if (offset) {
		struct gpu_info_header *ghdr =
			(struct gpu_info_header *)(adev->mman.discovery_bin + offset);

		if (le32_to_cpu(ghdr->table_id) != GC_TABLE_ID) {
			dev_err(adev->dev, "invalid ip discovery gc table id\n");
			r = -EINVAL;
			goto out;
		}

		if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
						      le32_to_cpu(ghdr->size), checksum)) {
			dev_err(adev->dev, "invalid gc data table checksum\n");
			r = -EINVAL;
			goto out;
		}
	}

	info = &bhdr->table_list[HARVEST_INFO];
	offset = le16_to_cpu(info->offset);
	checksum = le16_to_cpu(info->checksum);

	if (offset) {
		struct harvest_info_header *hhdr =
			(struct harvest_info_header *)(adev->mman.discovery_bin + offset);

		if (le32_to_cpu(hhdr->signature) != HARVEST_TABLE_SIGNATURE) {
			dev_err(adev->dev, "invalid ip discovery harvest table signature\n");
			r = -EINVAL;
			goto out;
		}

		if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
						      sizeof(struct harvest_table), checksum)) {
			dev_err(adev->dev, "invalid harvest data table checksum\n");
			r = -EINVAL;
			goto out;
		}
	}

	info = &bhdr->table_list[VCN_INFO];
	offset = le16_to_cpu(info->offset);
	checksum = le16_to_cpu(info->checksum);

	if (offset) {
		struct vcn_info_header *vhdr =
			(struct vcn_info_header *)(adev->mman.discovery_bin + offset);

		if (le32_to_cpu(vhdr->table_id) != VCN_INFO_TABLE_ID) {
			dev_err(adev->dev, "invalid ip discovery vcn table id\n");
			r = -EINVAL;
			goto out;
		}

		if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
						      le32_to_cpu(vhdr->size_bytes), checksum)) {
			dev_err(adev->dev, "invalid vcn data table checksum\n");
			r = -EINVAL;
			goto out;
		}
	}

	info = &bhdr->table_list[MALL_INFO];
	offset = le16_to_cpu(info->offset);
	checksum = le16_to_cpu(info->checksum);

	if (0 && offset) {
		struct mall_info_header *mhdr =
			(struct mall_info_header *)(adev->mman.discovery_bin + offset);

		if (le32_to_cpu(mhdr->table_id) != MALL_INFO_TABLE_ID) {
			dev_err(adev->dev, "invalid ip discovery mall table id\n");
			r = -EINVAL;
			goto out;
		}

		if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
						      le32_to_cpu(mhdr->size_bytes), checksum)) {
			dev_err(adev->dev, "invalid mall data table checksum\n");
			r = -EINVAL;
			goto out;
		}
	}

	return 0;

out:
	kfree(adev->mman.discovery_bin);
	adev->mman.discovery_bin = NULL;

	return r;
}
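/*
 * Rough layout of the discovery blob as validated above (a sketch based
 * on the checks in amdgpu_discovery_init(); field definitions live in
 * discovery.h and are not repeated here):
 *
 *	+---------------------------------+  offset 0
 *	| struct binary_header            |  signature, size, checksum,
 *	|   table_list[IP_DISCOVERY]      |  per-table {offset, checksum}
 *	|   table_list[GC]                |
 *	|   table_list[HARVEST_INFO]      |
 *	|   table_list[VCN_INFO]          |
 *	|   table_list[MALL_INFO]         |
 *	+---------------------------------+
 *	| ip discovery table (dies, IPs)  |  own signature + checksum
 *	| gc / harvest / vcn / mall table |  each verified independently
 *	+---------------------------------+
 *
 * A table whose offset is 0 is treated as absent rather than as an error.
 */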
static void amdgpu_discovery_sysfs_fini(struct amdgpu_device *adev);

void amdgpu_discovery_fini(struct amdgpu_device *adev)
{
	amdgpu_discovery_sysfs_fini(adev);
	kfree(adev->mman.discovery_bin);
	adev->mman.discovery_bin = NULL;
}

static int amdgpu_discovery_validate_ip(const struct ip *ip)
{
	if (ip->number_instance >= HWIP_MAX_INSTANCE) {
		DRM_ERROR("Unexpected number_instance (%d) from ip discovery blob\n",
			  ip->number_instance);
		return -EINVAL;
	}
	if (le16_to_cpu(ip->hw_id) >= HW_ID_MAX) {
		DRM_ERROR("Unexpected hw_id (%d) from ip discovery blob\n",
			  le16_to_cpu(ip->hw_id));
		return -EINVAL;
	}

	return 0;
}

static void amdgpu_discovery_read_harvest_bit_per_ip(struct amdgpu_device *adev,
						     uint32_t *vcn_harvest_count)
{
	struct binary_header *bhdr;
	struct ip_discovery_header *ihdr;
	struct die_header *dhdr;
	struct ip *ip;
	uint16_t die_offset, ip_offset, num_dies, num_ips;
	int i, j;

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin +
			le16_to_cpu(bhdr->table_list[IP_DISCOVERY].offset));
	num_dies = le16_to_cpu(ihdr->num_dies);

	/* scan harvest bit of all IP data structures */
	for (i = 0; i < num_dies; i++) {
		die_offset = le16_to_cpu(ihdr->die_info[i].die_offset);
		dhdr = (struct die_header *)(adev->mman.discovery_bin + die_offset);
		num_ips = le16_to_cpu(dhdr->num_ips);
		ip_offset = die_offset + sizeof(*dhdr);

		for (j = 0; j < num_ips; j++) {
			ip = (struct ip *)(adev->mman.discovery_bin + ip_offset);

			if (amdgpu_discovery_validate_ip(ip))
				goto next_ip;

			if (le16_to_cpu(ip->harvest) == 1) {
				switch (le16_to_cpu(ip->hw_id)) {
				case VCN_HWID:
					(*vcn_harvest_count)++;
					if (ip->number_instance == 0)
						adev->vcn.harvest_config |= AMDGPU_VCN_HARVEST_VCN0;
					else
						adev->vcn.harvest_config |= AMDGPU_VCN_HARVEST_VCN1;
					break;
				case DMU_HWID:
					adev->harvest_ip_mask |= AMD_HARVEST_IP_DMU_MASK;
					break;
				default:
					break;
				}
			}
next_ip:
			ip_offset += struct_size(ip, base_address, ip->num_base_address);
		}
	}
}
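/*
 * Illustrative sketch (not part of the driver) of the IP-list walk used
 * above and in the code below: each struct ip is variable-length, ending
 * in a flexible base_address[] array, so the cursor advances by
 * struct_size() rather than a fixed sizeof():
 *
 *	ip_offset = die_offset + sizeof(struct die_header);
 *	for (j = 0; j < num_ips; j++) {
 *		ip = (struct ip *)(binary + ip_offset);
 *		// ... inspect ip->hw_id, ip->number_instance, ...
 *		ip_offset += struct_size(ip, base_address,
 *					 ip->num_base_address);
 *	}
 *
 * An entry carrying three base addresses is roughly sizeof(struct ip)
 * plus three u32s long, so a plain sizeof() stride would walk off the
 * record boundaries.
 */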
static void amdgpu_discovery_read_from_harvest_table(struct amdgpu_device *adev,
						     uint32_t *vcn_harvest_count,
						     uint32_t *umc_harvest_count)
{
	struct binary_header *bhdr;
	struct harvest_table *harvest_info;
	u16 offset;
	int i;

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	offset = le16_to_cpu(bhdr->table_list[HARVEST_INFO].offset);

	if (!offset) {
		dev_err(adev->dev, "invalid harvest table offset\n");
		return;
	}

	harvest_info = (struct harvest_table *)(adev->mman.discovery_bin + offset);

	for (i = 0; i < 32; i++) {
		if (le16_to_cpu(harvest_info->list[i].hw_id) == 0)
			break;

		switch (le16_to_cpu(harvest_info->list[i].hw_id)) {
		case VCN_HWID:
			(*vcn_harvest_count)++;
			if (harvest_info->list[i].number_instance == 0)
				adev->vcn.harvest_config |= AMDGPU_VCN_HARVEST_VCN0;
			else
				adev->vcn.harvest_config |= AMDGPU_VCN_HARVEST_VCN1;
			break;
		case DMU_HWID:
			adev->harvest_ip_mask |= AMD_HARVEST_IP_DMU_MASK;
			break;
		case UMC_HWID:
			(*umc_harvest_count)++;
			break;
		default:
			break;
		}
	}
}

/* ================================================== */

struct ip_hw_instance {
	struct kobject kobj; /* ip_discovery/die/#die/#hw_id/#instance/<attrs...> */

	int hw_id;
	u8 num_instance;
	u8 major, minor, revision;
	u8 harvest;

	int num_base_addresses;
	u32 base_addr[];
};

struct ip_hw_id {
	struct kset hw_id_kset;  /* ip_discovery/die/#die/#hw_id/, contains ip_hw_instance */
	int hw_id;
};

struct ip_die_entry {
	struct kset ip_kset;  /* ip_discovery/die/#die/, contains ip_hw_id */
	u16 num_ips;
};
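/*
 * The structures above back a sysfs hierarchy mirroring the discovery
 * table. For a single-die GPU exposed as card0, the resulting tree would
 * look roughly like this (illustrative paths; the exact prefix depends
 * on how the device is enumerated):
 *
 *	/sys/class/drm/card0/device/ip_discovery/die/0/
 *		num_ips
 *		GC -> <hw_id>			symlink from hw_id_names[]
 *		<hw_id>/<instance>/hw_id
 *		<hw_id>/<instance>/major ... base_addr
 *
 * i.e. die/#die/#hw_id/#instance/<attrs...>, as the comments in the
 * struct definitions describe.
 */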
/* -------------------------------------------------- */

struct ip_hw_instance_attr {
	struct attribute attr;
	ssize_t (*show)(struct ip_hw_instance *ip_hw_instance, char *buf);
};

static ssize_t hw_id_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_hw_instance->hw_id);
}

static ssize_t num_instance_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_hw_instance->num_instance);
}

static ssize_t major_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_hw_instance->major);
}

static ssize_t minor_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_hw_instance->minor);
}

static ssize_t revision_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_hw_instance->revision);
}

static ssize_t harvest_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "0x%01X\n", ip_hw_instance->harvest);
}

static ssize_t num_base_addresses_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_hw_instance->num_base_addresses);
}

static ssize_t base_addr_show(struct ip_hw_instance *ip_hw_instance, char *buf)
{
	ssize_t res, at;
	int ii;

	for (res = at = ii = 0; ii < ip_hw_instance->num_base_addresses; ii++) {
		/* Here we satisfy the condition that at + size <= PAGE_SIZE. */
		if (at + 12 > PAGE_SIZE)
			break;
		res = sysfs_emit_at(buf, at, "0x%08X\n",
				    ip_hw_instance->base_addr[ii]);
		if (res <= 0)
			break;
		at += res;
	}

	return res < 0 ? res : at;
}

static struct ip_hw_instance_attr ip_hw_attr[] = {
	__ATTR_RO(hw_id),
	__ATTR_RO(num_instance),
	__ATTR_RO(major),
	__ATTR_RO(minor),
	__ATTR_RO(revision),
	__ATTR_RO(harvest),
	__ATTR_RO(num_base_addresses),
	__ATTR_RO(base_addr),
};

static struct attribute *ip_hw_instance_attrs[ARRAY_SIZE(ip_hw_attr) + 1];
ATTRIBUTE_GROUPS(ip_hw_instance);

#define to_ip_hw_instance(x) container_of(x, struct ip_hw_instance, kobj)
#define to_ip_hw_instance_attr(x) container_of(x, struct ip_hw_instance_attr, attr)

static ssize_t ip_hw_instance_attr_show(struct kobject *kobj,
					struct attribute *attr,
					char *buf)
{
	struct ip_hw_instance *ip_hw_instance = to_ip_hw_instance(kobj);
	struct ip_hw_instance_attr *ip_hw_attr = to_ip_hw_instance_attr(attr);

	if (!ip_hw_attr->show)
		return -EIO;

	return ip_hw_attr->show(ip_hw_instance, buf);
}

static const struct sysfs_ops ip_hw_instance_sysfs_ops = {
	.show = ip_hw_instance_attr_show,
};

static void ip_hw_instance_release(struct kobject *kobj)
{
	struct ip_hw_instance *ip_hw_instance = to_ip_hw_instance(kobj);

	kfree(ip_hw_instance);
}

static struct kobj_type ip_hw_instance_ktype = {
	.release = ip_hw_instance_release,
	.sysfs_ops = &ip_hw_instance_sysfs_ops,
	.default_groups = ip_hw_instance_groups,
};

/* -------------------------------------------------- */

#define to_ip_hw_id(x)  container_of(to_kset(x), struct ip_hw_id, hw_id_kset)

static void ip_hw_id_release(struct kobject *kobj)
{
	struct ip_hw_id *ip_hw_id = to_ip_hw_id(kobj);

	if (!list_empty(&ip_hw_id->hw_id_kset.list))
		DRM_ERROR("ip_hw_id->hw_id_kset is not empty");
	kfree(ip_hw_id);
}

static struct kobj_type ip_hw_id_ktype = {
	.release = ip_hw_id_release,
	.sysfs_ops = &kobj_sysfs_ops,
};

/* -------------------------------------------------- */

static void die_kobj_release(struct kobject *kobj);
static void ip_disc_release(struct kobject *kobj);

struct ip_die_entry_attribute {
	struct attribute attr;
	ssize_t (*show)(struct ip_die_entry *ip_die_entry, char *buf);
};

#define to_ip_die_entry_attr(x)  container_of(x, struct ip_die_entry_attribute, attr)

static ssize_t num_ips_show(struct ip_die_entry *ip_die_entry, char *buf)
{
	return sysfs_emit(buf, "%d\n", ip_die_entry->num_ips);
}

/* If there are more ip_die_entry attrs, other than the number of IPs,
 * we can make this into an array of attrs, and then initialize
 * ip_die_entry_attrs in a loop.
 */
static struct ip_die_entry_attribute num_ips_attr =
	__ATTR_RO(num_ips);

static struct attribute *ip_die_entry_attrs[] = {
	&num_ips_attr.attr,
	NULL,
};
ATTRIBUTE_GROUPS(ip_die_entry); /* ip_die_entry_groups */

#define to_ip_die_entry(x) container_of(to_kset(x), struct ip_die_entry, ip_kset)

static ssize_t ip_die_entry_attr_show(struct kobject *kobj,
				      struct attribute *attr,
				      char *buf)
{
	struct ip_die_entry_attribute *ip_die_entry_attr = to_ip_die_entry_attr(attr);
	struct ip_die_entry *ip_die_entry = to_ip_die_entry(kobj);

	if (!ip_die_entry_attr->show)
		return -EIO;

	return ip_die_entry_attr->show(ip_die_entry, buf);
}

static void ip_die_entry_release(struct kobject *kobj)
{
	struct ip_die_entry *ip_die_entry = to_ip_die_entry(kobj);

	if (!list_empty(&ip_die_entry->ip_kset.list))
		DRM_ERROR("ip_die_entry->ip_kset is not empty");
	kfree(ip_die_entry);
}

static const struct sysfs_ops ip_die_entry_sysfs_ops = {
	.show = ip_die_entry_attr_show,
};

static struct kobj_type ip_die_entry_ktype = {
	.release = ip_die_entry_release,
	.sysfs_ops = &ip_die_entry_sysfs_ops,
	.default_groups = ip_die_entry_groups,
};

static struct kobj_type die_kobj_ktype = {
	.release = die_kobj_release,
	.sysfs_ops = &kobj_sysfs_ops,
};

static struct kobj_type ip_discovery_ktype = {
	.release = ip_disc_release,
	.sysfs_ops = &kobj_sysfs_ops,
};

struct ip_discovery_top {
	struct kobject kobj;    /* ip_discovery/ */
	struct kset die_kset;   /* ip_discovery/die/, contains ip_die_entry */
	struct amdgpu_device *adev;
};

static void die_kobj_release(struct kobject *kobj)
{
	struct ip_discovery_top *ip_top = container_of(to_kset(kobj),
						       struct ip_discovery_top,
						       die_kset);
	if (!list_empty(&ip_top->die_kset.list))
		DRM_ERROR("ip_top->die_kset is not empty");
}

static void ip_disc_release(struct kobject *kobj)
{
	struct ip_discovery_top *ip_top = container_of(kobj, struct ip_discovery_top,
						       kobj);
	struct amdgpu_device *adev = ip_top->adev;

	adev->ip_top = NULL;
	kfree(ip_top);
}
static int amdgpu_discovery_sysfs_ips(struct amdgpu_device *adev,
				      struct ip_die_entry *ip_die_entry,
				      const size_t _ip_offset, const int num_ips)
{
	int ii, jj, kk, res;

	DRM_DEBUG("num_ips:%d", num_ips);

	/* Find all IPs of a given HW ID, and add their instance to
	 * #die/#hw_id/#instance/<attributes>
	 */
	for (ii = 0; ii < HW_ID_MAX; ii++) {
		struct ip_hw_id *ip_hw_id = NULL;
		size_t ip_offset = _ip_offset;

		for (jj = 0; jj < num_ips; jj++) {
			struct ip *ip;
			struct ip_hw_instance *ip_hw_instance;

			ip = (struct ip *)(adev->mman.discovery_bin + ip_offset);
			if (amdgpu_discovery_validate_ip(ip) ||
			    le16_to_cpu(ip->hw_id) != ii)
				goto next_ip;

			DRM_DEBUG("match:%d @ ip_offset:%zu", ii, ip_offset);

			/* We have a hw_id match; register the hw
			 * block if not yet registered.
			 */
			if (!ip_hw_id) {
				ip_hw_id = kzalloc(sizeof(*ip_hw_id), GFP_KERNEL);
				if (!ip_hw_id)
					return -ENOMEM;
				ip_hw_id->hw_id = ii;

				kobject_set_name(&ip_hw_id->hw_id_kset.kobj, "%d", ii);
				ip_hw_id->hw_id_kset.kobj.kset = &ip_die_entry->ip_kset;
				ip_hw_id->hw_id_kset.kobj.ktype = &ip_hw_id_ktype;
				res = kset_register(&ip_hw_id->hw_id_kset);
				if (res) {
					DRM_ERROR("Couldn't register ip_hw_id kset");
					kfree(ip_hw_id);
					return res;
				}
				if (hw_id_names[ii]) {
					res = sysfs_create_link(&ip_die_entry->ip_kset.kobj,
								&ip_hw_id->hw_id_kset.kobj,
								hw_id_names[ii]);
					if (res) {
						DRM_ERROR("Couldn't create IP link %s in IP Die:%s\n",
							  hw_id_names[ii],
							  kobject_name(&ip_die_entry->ip_kset.kobj));
					}
				}
			}

			/* Now register its instance.
			 */
			ip_hw_instance = kzalloc(struct_size(ip_hw_instance,
							     base_addr,
							     ip->num_base_address),
						 GFP_KERNEL);
			if (!ip_hw_instance) {
				DRM_ERROR("no memory for ip_hw_instance");
				return -ENOMEM;
			}
			ip_hw_instance->hw_id = le16_to_cpu(ip->hw_id); /* == ii */
			ip_hw_instance->num_instance = ip->number_instance;
			ip_hw_instance->major = ip->major;
			ip_hw_instance->minor = ip->minor;
			ip_hw_instance->revision = ip->revision;
			ip_hw_instance->harvest = ip->harvest;
			ip_hw_instance->num_base_addresses = ip->num_base_address;

			for (kk = 0; kk < ip_hw_instance->num_base_addresses; kk++)
				ip_hw_instance->base_addr[kk] = ip->base_address[kk];

			kobject_init(&ip_hw_instance->kobj, &ip_hw_instance_ktype);
			ip_hw_instance->kobj.kset = &ip_hw_id->hw_id_kset;
			res = kobject_add(&ip_hw_instance->kobj, NULL,
					  "%d", ip_hw_instance->num_instance);
next_ip:
			ip_offset += struct_size(ip, base_address, ip->num_base_address);
		}
	}

	return 0;
}
static int amdgpu_discovery_sysfs_recurse(struct amdgpu_device *adev)
{
	struct binary_header *bhdr;
	struct ip_discovery_header *ihdr;
	struct die_header *dhdr;
	struct kset *die_kset = &adev->ip_top->die_kset;
	u16 num_dies, die_offset, num_ips;
	size_t ip_offset;
	int ii, res;

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin +
					      le16_to_cpu(bhdr->table_list[IP_DISCOVERY].offset));
	num_dies = le16_to_cpu(ihdr->num_dies);

	DRM_DEBUG("number of dies: %d\n", num_dies);

	for (ii = 0; ii < num_dies; ii++) {
		struct ip_die_entry *ip_die_entry;

		die_offset = le16_to_cpu(ihdr->die_info[ii].die_offset);
		dhdr = (struct die_header *)(adev->mman.discovery_bin + die_offset);
		num_ips = le16_to_cpu(dhdr->num_ips);
		ip_offset = die_offset + sizeof(*dhdr);

		/* Add the die to the kset.
		 *
		 * dhdr->die_id == ii, which was checked in
		 * amdgpu_discovery_reg_base_init().
		 */
		ip_die_entry = kzalloc(sizeof(*ip_die_entry), GFP_KERNEL);
		if (!ip_die_entry)
			return -ENOMEM;

		ip_die_entry->num_ips = num_ips;

		kobject_set_name(&ip_die_entry->ip_kset.kobj, "%d", le16_to_cpu(dhdr->die_id));
		ip_die_entry->ip_kset.kobj.kset = die_kset;
		ip_die_entry->ip_kset.kobj.ktype = &ip_die_entry_ktype;
		res = kset_register(&ip_die_entry->ip_kset);
		if (res) {
			DRM_ERROR("Couldn't register ip_die_entry kset");
			kfree(ip_die_entry);
			return res;
		}

		amdgpu_discovery_sysfs_ips(adev, ip_die_entry, ip_offset, num_ips);
	}

	return 0;
}

static int amdgpu_discovery_sysfs_init(struct amdgpu_device *adev)
{
	struct kset *die_kset;
	int res, ii;

	adev->ip_top = kzalloc(sizeof(*adev->ip_top), GFP_KERNEL);
	if (!adev->ip_top)
		return -ENOMEM;

	adev->ip_top->adev = adev;

	res = kobject_init_and_add(&adev->ip_top->kobj, &ip_discovery_ktype,
				   &adev->dev->kobj, "ip_discovery");
	if (res) {
		DRM_ERROR("Couldn't init and add ip_discovery/");
		goto Err;
	}

	die_kset = &adev->ip_top->die_kset;
	kobject_set_name(&die_kset->kobj, "%s", "die");
	die_kset->kobj.parent = &adev->ip_top->kobj;
	die_kset->kobj.ktype = &die_kobj_ktype;
	res = kset_register(&adev->ip_top->die_kset);
	if (res) {
		DRM_ERROR("Couldn't register die_kset");
		goto Err;
	}

	for (ii = 0; ii < ARRAY_SIZE(ip_hw_attr); ii++)
		ip_hw_instance_attrs[ii] = &ip_hw_attr[ii].attr;
	ip_hw_instance_attrs[ii] = NULL;

	res = amdgpu_discovery_sysfs_recurse(adev);

	return res;
Err:
	kobject_put(&adev->ip_top->kobj);
	return res;
}

/* -------------------------------------------------- */

#define list_to_kobj(el) container_of(el, struct kobject, entry)

static void amdgpu_discovery_sysfs_ip_hw_free(struct ip_hw_id *ip_hw_id)
{
	struct list_head *el, *tmp;
	struct kset *hw_id_kset;

	hw_id_kset = &ip_hw_id->hw_id_kset;
	spin_lock(&hw_id_kset->list_lock);
	list_for_each_prev_safe(el, tmp, &hw_id_kset->list) {
		list_del_init(el);
		spin_unlock(&hw_id_kset->list_lock);
		/* kobject is embedded in ip_hw_instance */
		kobject_put(list_to_kobj(el));
		spin_lock(&hw_id_kset->list_lock);
	}
	spin_unlock(&hw_id_kset->list_lock);
	kobject_put(&ip_hw_id->hw_id_kset.kobj);
}

static void amdgpu_discovery_sysfs_die_free(struct ip_die_entry *ip_die_entry)
{
	struct list_head *el, *tmp;
	struct kset *ip_kset;

	ip_kset = &ip_die_entry->ip_kset;
	spin_lock(&ip_kset->list_lock);
	list_for_each_prev_safe(el, tmp, &ip_kset->list) {
		list_del_init(el);
		spin_unlock(&ip_kset->list_lock);
		amdgpu_discovery_sysfs_ip_hw_free(to_ip_hw_id(list_to_kobj(el)));
		spin_lock(&ip_kset->list_lock);
	}
	spin_unlock(&ip_kset->list_lock);
	kobject_put(&ip_die_entry->ip_kset.kobj);
}

static void amdgpu_discovery_sysfs_fini(struct amdgpu_device *adev)
{
	struct list_head *el, *tmp;
	struct kset *die_kset;

	die_kset = &adev->ip_top->die_kset;
	spin_lock(&die_kset->list_lock);
	list_for_each_prev_safe(el, tmp, &die_kset->list) {
		list_del_init(el);
		spin_unlock(&die_kset->list_lock);
		amdgpu_discovery_sysfs_die_free(to_ip_die_entry(list_to_kobj(el)));
		spin_lock(&die_kset->list_lock);
	}
	spin_unlock(&die_kset->list_lock);
	kobject_put(&adev->ip_top->die_kset.kobj);
	kobject_put(&adev->ip_top->kobj);
}

/* ================================================== */
static int amdgpu_discovery_reg_base_init(struct amdgpu_device *adev)
{
	struct binary_header *bhdr;
	struct ip_discovery_header *ihdr;
	struct die_header *dhdr;
	struct ip *ip;
	uint16_t die_offset;
	uint16_t ip_offset;
	uint16_t num_dies;
	uint16_t num_ips;
	uint8_t num_base_address;
	int hw_ip;
	int i, j, k;
	int r;

	r = amdgpu_discovery_init(adev);
	if (r) {
		DRM_ERROR("amdgpu_discovery_init failed\n");
		return r;
	}

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin +
					      le16_to_cpu(bhdr->table_list[IP_DISCOVERY].offset));
	num_dies = le16_to_cpu(ihdr->num_dies);

	DRM_DEBUG("number of dies: %d\n", num_dies);

	for (i = 0; i < num_dies; i++) {
		die_offset = le16_to_cpu(ihdr->die_info[i].die_offset);
		dhdr = (struct die_header *)(adev->mman.discovery_bin + die_offset);
		num_ips = le16_to_cpu(dhdr->num_ips);
		ip_offset = die_offset + sizeof(*dhdr);

		if (le16_to_cpu(dhdr->die_id) != i) {
			DRM_ERROR("invalid die id %d, expected %d\n",
				  le16_to_cpu(dhdr->die_id), i);
			return -EINVAL;
		}

		DRM_DEBUG("number of hardware IPs on die%d: %d\n",
			  le16_to_cpu(dhdr->die_id), num_ips);

		for (j = 0; j < num_ips; j++) {
			ip = (struct ip *)(adev->mman.discovery_bin + ip_offset);

			if (amdgpu_discovery_validate_ip(ip))
				goto next_ip;

			num_base_address = ip->num_base_address;

			DRM_DEBUG("%s(%d) #%d v%d.%d.%d:\n",
				  hw_id_names[le16_to_cpu(ip->hw_id)],
				  le16_to_cpu(ip->hw_id),
				  ip->number_instance,
				  ip->major, ip->minor,
				  ip->revision);

			if (le16_to_cpu(ip->hw_id) == VCN_HWID) {
				/* Bit [5:0]: original revision value
				 * Bit [7:6]: en/decode capability:
				 *     0b00 : VCN functions normally
				 *     0b10 : encode is disabled
				 *     0b01 : decode is disabled
				 */
				adev->vcn.vcn_config[adev->vcn.num_vcn_inst] =
					ip->revision & 0xc0;
				ip->revision &= ~0xc0;
				if (adev->vcn.num_vcn_inst < AMDGPU_MAX_VCN_INSTANCES)
					adev->vcn.num_vcn_inst++;
				else
					dev_err(adev->dev, "Too many VCN instances: %d vs %d\n",
						adev->vcn.num_vcn_inst + 1,
						AMDGPU_MAX_VCN_INSTANCES);
			}
			if (le16_to_cpu(ip->hw_id) == SDMA0_HWID ||
			    le16_to_cpu(ip->hw_id) == SDMA1_HWID ||
			    le16_to_cpu(ip->hw_id) == SDMA2_HWID ||
			    le16_to_cpu(ip->hw_id) == SDMA3_HWID) {
				if (adev->sdma.num_instances < AMDGPU_MAX_SDMA_INSTANCES)
					adev->sdma.num_instances++;
				else
					dev_err(adev->dev, "Too many SDMA instances: %d vs %d\n",
						adev->sdma.num_instances + 1,
						AMDGPU_MAX_SDMA_INSTANCES);
			}

			if (le16_to_cpu(ip->hw_id) == UMC_HWID)
				adev->gmc.num_umc++;

			for (k = 0; k < num_base_address; k++) {
				/*
				 * convert the endianness of base addresses in place,
				 * so that we don't need to convert them when accessing adev->reg_offset.
				 */
				ip->base_address[k] = le32_to_cpu(ip->base_address[k]);
				DRM_DEBUG("\t0x%08x\n", ip->base_address[k]);
			}

			for (hw_ip = 0; hw_ip < MAX_HWIP; hw_ip++) {
				if (hw_id_map[hw_ip] == le16_to_cpu(ip->hw_id)) {
					DRM_DEBUG("set register base offset for %s\n",
						  hw_id_names[le16_to_cpu(ip->hw_id)]);
					adev->reg_offset[hw_ip][ip->number_instance] =
						ip->base_address;
					/* Instance support is somewhat inconsistent.
					 * SDMA is a good example. Sienna cichlid has 4 total
					 * SDMA instances, each enumerated separately (HWIDs
					 * 42, 43, 68, 69). Arcturus has 8 total SDMA instances,
					 * but they are enumerated as multiple instances of the
					 * same HWIDs (4x HWID 42, 4x HWID 43). UMC is another
					 * example. On most chips there are multiple instances
					 * with the same HWID.
					 */
					adev->ip_versions[hw_ip][ip->number_instance] =
						IP_VERSION(ip->major, ip->minor, ip->revision);
				}
			}

next_ip:
			ip_offset += struct_size(ip, base_address, ip->num_base_address);
		}
	}

	amdgpu_discovery_sysfs_init(adev);

	return 0;
}
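/*
 * Worked example for the VCN revision split done in
 * amdgpu_discovery_reg_base_init() above: a raw discovery revision of
 * 0x42 (0b01000010) is split as
 *
 *	vcn_config = 0x42 & 0xc0 = 0x40   bits [7:6] = 0b01, decode disabled
 *	ip->revision &= ~0xc0;            leaves 0x02, the real revision
 *
 * so IP_VERSION() is built from the low six bits only, while the fused
 * en/decode capability is kept separately in adev->vcn.vcn_config[].
 */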
int amdgpu_discovery_get_ip_version(struct amdgpu_device *adev, int hw_id,
				    int number_instance, int *major,
				    int *minor, int *revision)
{
	struct binary_header *bhdr;
	struct ip_discovery_header *ihdr;
	struct die_header *dhdr;
	struct ip *ip;
	uint16_t die_offset;
	uint16_t ip_offset;
	uint16_t num_dies;
	uint16_t num_ips;
	int i, j;

	if (!adev->mman.discovery_bin) {
		DRM_ERROR("ip discovery uninitialized\n");
		return -EINVAL;
	}

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin +
					      le16_to_cpu(bhdr->table_list[IP_DISCOVERY].offset));
	num_dies = le16_to_cpu(ihdr->num_dies);

	for (i = 0; i < num_dies; i++) {
		die_offset = le16_to_cpu(ihdr->die_info[i].die_offset);
		dhdr = (struct die_header *)(adev->mman.discovery_bin + die_offset);
		num_ips = le16_to_cpu(dhdr->num_ips);
		ip_offset = die_offset + sizeof(*dhdr);

		for (j = 0; j < num_ips; j++) {
			ip = (struct ip *)(adev->mman.discovery_bin + ip_offset);

			if ((le16_to_cpu(ip->hw_id) == hw_id) &&
			    (ip->number_instance == number_instance)) {
				if (major)
					*major = ip->major;
				if (minor)
					*minor = ip->minor;
				if (revision)
					*revision = ip->revision;
				return 0;
			}
			ip_offset += struct_size(ip, base_address, ip->num_base_address);
		}
	}

	return -EINVAL;
}

static void amdgpu_discovery_harvest_ip(struct amdgpu_device *adev)
{
	int vcn_harvest_count = 0;
	int umc_harvest_count = 0;

	/*
	 * Harvest table does not fit Navi1x and legacy GPUs,
	 * so read harvest bit per IP data structure to set
	 * harvest configuration.
	 */
	if (adev->ip_versions[GC_HWIP][0] < IP_VERSION(10, 2, 0)) {
		if ((adev->pdev->device == 0x731E &&
		     (adev->pdev->revision == 0xC6 ||
		      adev->pdev->revision == 0xC7)) ||
		    (adev->pdev->device == 0x7340 &&
		     adev->pdev->revision == 0xC9) ||
		    (adev->pdev->device == 0x7360 &&
		     adev->pdev->revision == 0xC7))
			amdgpu_discovery_read_harvest_bit_per_ip(adev,
								 &vcn_harvest_count);
	} else {
		amdgpu_discovery_read_from_harvest_table(adev,
							 &vcn_harvest_count,
							 &umc_harvest_count);
	}

	amdgpu_discovery_harvest_config_quirk(adev);

	if (vcn_harvest_count == adev->vcn.num_vcn_inst) {
		adev->harvest_ip_mask |= AMD_HARVEST_IP_VCN_MASK;
		adev->harvest_ip_mask |= AMD_HARVEST_IP_JPEG_MASK;
	}

	if (umc_harvest_count < adev->gmc.num_umc) {
		adev->gmc.num_umc -= umc_harvest_count;
	}
}

union gc_info {
	struct gc_info_v1_0 v1;
	struct gc_info_v1_1 v1_1;
	struct gc_info_v1_2 v1_2;
	struct gc_info_v2_0 v2;
};

static int amdgpu_discovery_get_gfx_info(struct amdgpu_device *adev)
{
	struct binary_header *bhdr;
	union gc_info *gc_info;
	u16 offset;

	if (!adev->mman.discovery_bin) {
		DRM_ERROR("ip discovery uninitialized\n");
		return -EINVAL;
	}

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	offset = le16_to_cpu(bhdr->table_list[GC].offset);
	if (!offset)
		return 0;

	gc_info = (union gc_info *)(adev->mman.discovery_bin + offset);

	switch (le16_to_cpu(gc_info->v1.header.version_major)) {
	case 1:
		adev->gfx.config.max_shader_engines = le32_to_cpu(gc_info->v1.gc_num_se);
		adev->gfx.config.max_cu_per_sh = 2 * (le32_to_cpu(gc_info->v1.gc_num_wgp0_per_sa) +
						      le32_to_cpu(gc_info->v1.gc_num_wgp1_per_sa));
		adev->gfx.config.max_sh_per_se = le32_to_cpu(gc_info->v1.gc_num_sa_per_se);
		adev->gfx.config.max_backends_per_se = le32_to_cpu(gc_info->v1.gc_num_rb_per_se);
		adev->gfx.config.max_texture_channel_caches = le32_to_cpu(gc_info->v1.gc_num_gl2c);
		adev->gfx.config.max_gprs = le32_to_cpu(gc_info->v1.gc_num_gprs);
		adev->gfx.config.max_gs_threads = le32_to_cpu(gc_info->v1.gc_num_max_gs_thds);
		adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gc_info->v1.gc_gs_table_depth);
		adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gc_info->v1.gc_gsprim_buff_depth);
		adev->gfx.config.double_offchip_lds_buf = le32_to_cpu(gc_info->v1.gc_double_offchip_lds_buffer);
		adev->gfx.cu_info.wave_front_size = le32_to_cpu(gc_info->v1.gc_wave_size);
		adev->gfx.cu_info.max_waves_per_simd = le32_to_cpu(gc_info->v1.gc_max_waves_per_simd);
		adev->gfx.cu_info.max_scratch_slots_per_cu = le32_to_cpu(gc_info->v1.gc_max_scratch_slots_per_cu);
		adev->gfx.cu_info.lds_size = le32_to_cpu(gc_info->v1.gc_lds_size);
		adev->gfx.config.num_sc_per_sh = le32_to_cpu(gc_info->v1.gc_num_sc_per_se) /
			le32_to_cpu(gc_info->v1.gc_num_sa_per_se);
		adev->gfx.config.num_packer_per_sc = le32_to_cpu(gc_info->v1.gc_num_packer_per_sc);
		if (gc_info->v1.header.version_minor >= 1) {
			adev->gfx.config.gc_num_tcp_per_sa = le32_to_cpu(gc_info->v1_1.gc_num_tcp_per_sa);
			adev->gfx.config.gc_num_sdp_interface = le32_to_cpu(gc_info->v1_1.gc_num_sdp_interface);
			adev->gfx.config.gc_num_tcps = le32_to_cpu(gc_info->v1_1.gc_num_tcps);
		}
		if (gc_info->v1.header.version_minor >= 2) {
			adev->gfx.config.gc_num_tcp_per_wpg = le32_to_cpu(gc_info->v1_2.gc_num_tcp_per_wpg);
			adev->gfx.config.gc_tcp_l1_size = le32_to_cpu(gc_info->v1_2.gc_tcp_l1_size);
			adev->gfx.config.gc_num_sqc_per_wgp = le32_to_cpu(gc_info->v1_2.gc_num_sqc_per_wgp);
			adev->gfx.config.gc_l1_instruction_cache_size_per_sqc = le32_to_cpu(gc_info->v1_2.gc_l1_instruction_cache_size_per_sqc);
			adev->gfx.config.gc_l1_data_cache_size_per_sqc = le32_to_cpu(gc_info->v1_2.gc_l1_data_cache_size_per_sqc);
			adev->gfx.config.gc_gl1c_per_sa = le32_to_cpu(gc_info->v1_2.gc_gl1c_per_sa);
			adev->gfx.config.gc_gl1c_size_per_instance = le32_to_cpu(gc_info->v1_2.gc_gl1c_size_per_instance);
			adev->gfx.config.gc_gl2c_per_gpu = le32_to_cpu(gc_info->v1_2.gc_gl2c_per_gpu);
		}
		break;
	case 2:
		adev->gfx.config.max_shader_engines = le32_to_cpu(gc_info->v2.gc_num_se);
		adev->gfx.config.max_cu_per_sh = le32_to_cpu(gc_info->v2.gc_num_cu_per_sh);
		adev->gfx.config.max_sh_per_se = le32_to_cpu(gc_info->v2.gc_num_sh_per_se);
		adev->gfx.config.max_backends_per_se = le32_to_cpu(gc_info->v2.gc_num_rb_per_se);
		adev->gfx.config.max_texture_channel_caches = le32_to_cpu(gc_info->v2.gc_num_tccs);
		adev->gfx.config.max_gprs = le32_to_cpu(gc_info->v2.gc_num_gprs);
		adev->gfx.config.max_gs_threads = le32_to_cpu(gc_info->v2.gc_num_max_gs_thds);
		adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gc_info->v2.gc_gs_table_depth);
		adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gc_info->v2.gc_gsprim_buff_depth);
		adev->gfx.config.double_offchip_lds_buf = le32_to_cpu(gc_info->v2.gc_double_offchip_lds_buffer);
		adev->gfx.cu_info.wave_front_size = le32_to_cpu(gc_info->v2.gc_wave_size);
		adev->gfx.cu_info.max_waves_per_simd = le32_to_cpu(gc_info->v2.gc_max_waves_per_simd);
		adev->gfx.cu_info.max_scratch_slots_per_cu = le32_to_cpu(gc_info->v2.gc_max_scratch_slots_per_cu);
		adev->gfx.cu_info.lds_size = le32_to_cpu(gc_info->v2.gc_lds_size);
		adev->gfx.config.num_sc_per_sh = le32_to_cpu(gc_info->v2.gc_num_sc_per_se) /
			le32_to_cpu(gc_info->v2.gc_num_sh_per_se);
		adev->gfx.config.num_packer_per_sc = le32_to_cpu(gc_info->v2.gc_num_packer_per_sc);
		break;
	default:
		dev_err(adev->dev,
			"Unhandled GC info table %d.%d\n",
			le16_to_cpu(gc_info->v1.header.version_major),
			le16_to_cpu(gc_info->v1.header.version_minor));
		return -EINVAL;
	}

	return 0;
}
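/*
 * Worked example for the v1 CU math above (illustrative numbers): a part
 * reporting gc_num_wgp0_per_sa = 4 and gc_num_wgp1_per_sa = 5 yields
 *
 *	max_cu_per_sh = 2 * (4 + 5) = 18
 *
 * because each WGP packs two CUs on gfx10+, whereas the v2 table layout
 * reports gc_num_cu_per_sh directly.
 */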
union mall_info {
	struct mall_info_v1_0 v1;
};

static int amdgpu_discovery_get_mall_info(struct amdgpu_device *adev)
{
	struct binary_header *bhdr;
	union mall_info *mall_info;
	u32 u, mall_size_per_umc, m_s_present, half_use;
	u64 mall_size;
	u16 offset;

	if (!adev->mman.discovery_bin) {
		DRM_ERROR("ip discovery uninitialized\n");
		return -EINVAL;
	}

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	offset = le16_to_cpu(bhdr->table_list[MALL_INFO].offset);
	if (!offset)
		return 0;

	mall_info = (union mall_info *)(adev->mman.discovery_bin + offset);

	switch (le16_to_cpu(mall_info->v1.header.version_major)) {
	case 1:
		mall_size = 0;
		mall_size_per_umc = le32_to_cpu(mall_info->v1.mall_size_per_m);
		m_s_present = le32_to_cpu(mall_info->v1.m_s_present);
		half_use = le32_to_cpu(mall_info->v1.m_half_use);
		for (u = 0; u < adev->gmc.num_umc; u++) {
			if (m_s_present & (1 << u))
				mall_size += mall_size_per_umc * 2;
			else if (half_use & (1 << u))
				mall_size += mall_size_per_umc / 2;
			else
				mall_size += mall_size_per_umc;
		}
		adev->gmc.mall_size = mall_size;
		break;
	default:
		dev_err(adev->dev,
			"Unhandled MALL info table %d.%d\n",
			le16_to_cpu(mall_info->v1.header.version_major),
			le16_to_cpu(mall_info->v1.header.version_minor));
		return -EINVAL;
	}
	return 0;
}
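/*
 * Worked example for the v1 MALL sizing above (illustrative numbers):
 * with mall_size_per_umc = 8 MiB, num_umc = 4, m_s_present = 0x1 and
 * m_half_use = 0x2, the per-UMC walk gives
 *
 *	UMC 0: bit set in m_s_present -> 2 * 8 MiB = 16 MiB
 *	UMC 1: bit set in m_half_use  -> 8 MiB / 2 =  4 MiB
 *	UMC 2: neither                ->              8 MiB
 *	UMC 3: neither                ->              8 MiB
 *	                                 total        36 MiB
 *
 * which is the value that lands in adev->gmc.mall_size.
 */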
union vcn_info {
	struct vcn_info_v1_0 v1;
};

static int amdgpu_discovery_get_vcn_info(struct amdgpu_device *adev)
{
	struct binary_header *bhdr;
	union vcn_info *vcn_info;
	u16 offset;
	int v;

	if (!adev->mman.discovery_bin) {
		DRM_ERROR("ip discovery uninitialized\n");
		return -EINVAL;
	}

	/* num_vcn_inst is currently limited to AMDGPU_MAX_VCN_INSTANCES
	 * which is smaller than VCN_INFO_TABLE_MAX_NUM_INSTANCES
	 * but that may change in the future with new GPUs so keep this
	 * check for defensive purposes.
	 */
	if (adev->vcn.num_vcn_inst > VCN_INFO_TABLE_MAX_NUM_INSTANCES) {
		dev_err(adev->dev, "invalid vcn instances\n");
		return -EINVAL;
	}

	bhdr = (struct binary_header *)adev->mman.discovery_bin;
	offset = le16_to_cpu(bhdr->table_list[VCN_INFO].offset);
	if (!offset)
		return 0;

	vcn_info = (union vcn_info *)(adev->mman.discovery_bin + offset);

	switch (le16_to_cpu(vcn_info->v1.header.version_major)) {
	case 1:
		/* num_vcn_inst is currently limited to AMDGPU_MAX_VCN_INSTANCES
		 * so this won't overflow.
		 */
		for (v = 0; v < adev->vcn.num_vcn_inst; v++) {
			adev->vcn.vcn_codec_disable_mask[v] =
				le32_to_cpu(vcn_info->v1.instance_info[v].fuse_data.all_bits);
		}
		break;
	default:
		dev_err(adev->dev,
			"Unhandled VCN info table %d.%d\n",
			le16_to_cpu(vcn_info->v1.header.version_major),
			le16_to_cpu(vcn_info->v1.header.version_minor));
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_common_ip_blocks(struct amdgpu_device *adev)
{
	/* what IP to use for this? */
	switch (adev->ip_versions[GC_HWIP][0]) {
	case IP_VERSION(9, 0, 1):
	case IP_VERSION(9, 1, 0):
	case IP_VERSION(9, 2, 1):
	case IP_VERSION(9, 2, 2):
	case IP_VERSION(9, 3, 0):
	case IP_VERSION(9, 4, 0):
	case IP_VERSION(9, 4, 1):
	case IP_VERSION(9, 4, 2):
		amdgpu_device_ip_block_add(adev, &vega10_common_ip_block);
		break;
	case IP_VERSION(10, 1, 10):
	case IP_VERSION(10, 1, 1):
	case IP_VERSION(10, 1, 2):
	case IP_VERSION(10, 1, 3):
	case IP_VERSION(10, 1, 4):
	case IP_VERSION(10, 3, 0):
	case IP_VERSION(10, 3, 1):
	case IP_VERSION(10, 3, 2):
	case IP_VERSION(10, 3, 3):
	case IP_VERSION(10, 3, 4):
	case IP_VERSION(10, 3, 5):
	case IP_VERSION(10, 3, 6):
	case IP_VERSION(10, 3, 7):
		amdgpu_device_ip_block_add(adev, &nv_common_ip_block);
		break;
	case IP_VERSION(11, 0, 0):
	case IP_VERSION(11, 0, 1):
	case IP_VERSION(11, 0, 2):
		amdgpu_device_ip_block_add(adev, &soc21_common_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add common ip block(GC_HWIP:0x%x)\n",
			adev->ip_versions[GC_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_gmc_ip_blocks(struct amdgpu_device *adev)
{
	/* use GC or MMHUB IP version */
	switch (adev->ip_versions[GC_HWIP][0]) {
	case IP_VERSION(9, 0, 1):
	case IP_VERSION(9, 1, 0):
	case IP_VERSION(9, 2, 1):
	case IP_VERSION(9, 2, 2):
	case IP_VERSION(9, 3, 0):
	case IP_VERSION(9, 4, 0):
	case IP_VERSION(9, 4, 1):
	case IP_VERSION(9, 4, 2):
		amdgpu_device_ip_block_add(adev, &gmc_v9_0_ip_block);
		break;
	case IP_VERSION(10, 1, 10):
	case IP_VERSION(10, 1, 1):
	case IP_VERSION(10, 1, 2):
	case IP_VERSION(10, 1, 3):
	case IP_VERSION(10, 1, 4):
	case IP_VERSION(10, 3, 0):
	case IP_VERSION(10, 3, 1):
	case IP_VERSION(10, 3, 2):
	case IP_VERSION(10, 3, 3):
	case IP_VERSION(10, 3, 4):
	case IP_VERSION(10, 3, 5):
	case IP_VERSION(10, 3, 6):
	case IP_VERSION(10, 3, 7):
		amdgpu_device_ip_block_add(adev, &gmc_v10_0_ip_block);
		break;
	case IP_VERSION(11, 0, 0):
	case IP_VERSION(11, 0, 1):
	case IP_VERSION(11, 0, 2):
		amdgpu_device_ip_block_add(adev, &gmc_v11_0_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add gmc ip block(GC_HWIP:0x%x)\n",
			adev->ip_versions[GC_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_ih_ip_blocks(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[OSSSYS_HWIP][0]) {
	case IP_VERSION(4, 0, 0):
	case IP_VERSION(4, 0, 1):
	case IP_VERSION(4, 1, 0):
	case IP_VERSION(4, 1, 1):
	case IP_VERSION(4, 3, 0):
		amdgpu_device_ip_block_add(adev, &vega10_ih_ip_block);
		break;
	case IP_VERSION(4, 2, 0):
	case IP_VERSION(4, 2, 1):
	case IP_VERSION(4, 4, 0):
		amdgpu_device_ip_block_add(adev, &vega20_ih_ip_block);
		break;
	case IP_VERSION(5, 0, 0):
	case IP_VERSION(5, 0, 1):
	case IP_VERSION(5, 0, 2):
	case IP_VERSION(5, 0, 3):
	case IP_VERSION(5, 2, 0):
	case IP_VERSION(5, 2, 1):
		amdgpu_device_ip_block_add(adev, &navi10_ih_ip_block);
		break;
	case IP_VERSION(6, 0, 0):
	case IP_VERSION(6, 0, 1):
	case IP_VERSION(6, 0, 2):
		amdgpu_device_ip_block_add(adev, &ih_v6_0_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add ih ip block(OSSSYS_HWIP:0x%x)\n",
			adev->ip_versions[OSSSYS_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_psp_ip_blocks(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[MP0_HWIP][0]) {
	case IP_VERSION(9, 0, 0):
		amdgpu_device_ip_block_add(adev, &psp_v3_1_ip_block);
		break;
	case IP_VERSION(10, 0, 0):
	case IP_VERSION(10, 0, 1):
		amdgpu_device_ip_block_add(adev, &psp_v10_0_ip_block);
		break;
	case IP_VERSION(11, 0, 0):
	case IP_VERSION(11, 0, 2):
	case IP_VERSION(11, 0, 4):
	case IP_VERSION(11, 0, 5):
	case IP_VERSION(11, 0, 9):
	case IP_VERSION(11, 0, 7):
	case IP_VERSION(11, 0, 11):
	case IP_VERSION(11, 0, 12):
	case IP_VERSION(11, 0, 13):
	case IP_VERSION(11, 5, 0):
		amdgpu_device_ip_block_add(adev, &psp_v11_0_ip_block);
		break;
	case IP_VERSION(11, 0, 8):
		amdgpu_device_ip_block_add(adev, &psp_v11_0_8_ip_block);
		break;
	case IP_VERSION(11, 0, 3):
	case IP_VERSION(12, 0, 1):
		amdgpu_device_ip_block_add(adev, &psp_v12_0_ip_block);
		break;
	case IP_VERSION(13, 0, 0):
	case IP_VERSION(13, 0, 1):
	case IP_VERSION(13, 0, 2):
	case IP_VERSION(13, 0, 3):
	case IP_VERSION(13, 0, 5):
	case IP_VERSION(13, 0, 7):
	case IP_VERSION(13, 0, 8):
		amdgpu_device_ip_block_add(adev, &psp_v13_0_ip_block);
		break;
	case IP_VERSION(13, 0, 4):
		amdgpu_device_ip_block_add(adev, &psp_v13_0_4_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add psp ip block(MP0_HWIP:0x%x)\n",
			adev->ip_versions[MP0_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_smu_ip_blocks(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[MP1_HWIP][0]) {
	case IP_VERSION(9, 0, 0):
	case IP_VERSION(10, 0, 0):
	case IP_VERSION(10, 0, 1):
	case IP_VERSION(11, 0, 2):
		if (adev->asic_type == CHIP_ARCTURUS)
			amdgpu_device_ip_block_add(adev, &smu_v11_0_ip_block);
		else
			amdgpu_device_ip_block_add(adev, &pp_smu_ip_block);
		break;
	case IP_VERSION(11, 0, 0):
	case IP_VERSION(11, 0, 5):
	case IP_VERSION(11, 0, 9):
	case IP_VERSION(11, 0, 7):
	case IP_VERSION(11, 0, 8):
	case IP_VERSION(11, 0, 11):
	case IP_VERSION(11, 0, 12):
	case IP_VERSION(11, 0, 13):
	case IP_VERSION(11, 5, 0):
		amdgpu_device_ip_block_add(adev, &smu_v11_0_ip_block);
		break;
	case IP_VERSION(12, 0, 0):
	case IP_VERSION(12, 0, 1):
		amdgpu_device_ip_block_add(adev, &smu_v12_0_ip_block);
		break;
	case IP_VERSION(13, 0, 0):
	case IP_VERSION(13, 0, 1):
	case IP_VERSION(13, 0, 2):
	case IP_VERSION(13, 0, 3):
	case IP_VERSION(13, 0, 4):
	case IP_VERSION(13, 0, 5):
	case IP_VERSION(13, 0, 7):
	case IP_VERSION(13, 0, 8):
		amdgpu_device_ip_block_add(adev, &smu_v13_0_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add smu ip block(MP1_HWIP:0x%x)\n",
			adev->ip_versions[MP1_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_display_ip_blocks(struct amdgpu_device *adev)
{
	if (adev->enable_virtual_display || amdgpu_sriov_vf(adev)) {
		amdgpu_device_ip_block_add(adev, &amdgpu_vkms_ip_block);
		return 0;
	}

	if (!amdgpu_device_has_dc_support(adev))
		return 0;

#if defined(CONFIG_DRM_AMD_DC)
	if (adev->ip_versions[DCE_HWIP][0]) {
		switch (adev->ip_versions[DCE_HWIP][0]) {
		case IP_VERSION(1, 0, 0):
		case IP_VERSION(1, 0, 1):
		case IP_VERSION(2, 0, 2):
		case IP_VERSION(2, 0, 0):
		case IP_VERSION(2, 0, 3):
		case IP_VERSION(2, 1, 0):
		case IP_VERSION(3, 0, 0):
		case IP_VERSION(3, 0, 2):
		case IP_VERSION(3, 0, 3):
		case IP_VERSION(3, 0, 1):
		case IP_VERSION(3, 1, 2):
		case IP_VERSION(3, 1, 3):
		case IP_VERSION(3, 1, 4):
		case IP_VERSION(3, 1, 5):
		case IP_VERSION(3, 1, 6):
		case IP_VERSION(3, 2, 0):
		case IP_VERSION(3, 2, 1):
			amdgpu_device_ip_block_add(adev, &dm_ip_block);
			break;
		default:
			dev_err(adev->dev,
				"Failed to add dm ip block(DCE_HWIP:0x%x)\n",
				adev->ip_versions[DCE_HWIP][0]);
			return -EINVAL;
		}
	} else if (adev->ip_versions[DCI_HWIP][0]) {
		switch (adev->ip_versions[DCI_HWIP][0]) {
		case IP_VERSION(12, 0, 0):
		case IP_VERSION(12, 0, 1):
		case IP_VERSION(12, 1, 0):
			amdgpu_device_ip_block_add(adev, &dm_ip_block);
			break;
		default:
			dev_err(adev->dev,
				"Failed to add dm ip block(DCI_HWIP:0x%x)\n",
				adev->ip_versions[DCI_HWIP][0]);
			return -EINVAL;
		}
	}
#endif
	return 0;
}
static int amdgpu_discovery_set_gc_ip_blocks(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[GC_HWIP][0]) {
	case IP_VERSION(9, 0, 1):
	case IP_VERSION(9, 1, 0):
	case IP_VERSION(9, 2, 1):
	case IP_VERSION(9, 2, 2):
	case IP_VERSION(9, 3, 0):
	case IP_VERSION(9, 4, 0):
	case IP_VERSION(9, 4, 1):
	case IP_VERSION(9, 4, 2):
		amdgpu_device_ip_block_add(adev, &gfx_v9_0_ip_block);
		break;
	case IP_VERSION(10, 1, 10):
	case IP_VERSION(10, 1, 2):
	case IP_VERSION(10, 1, 1):
	case IP_VERSION(10, 1, 3):
	case IP_VERSION(10, 1, 4):
	case IP_VERSION(10, 3, 0):
	case IP_VERSION(10, 3, 2):
	case IP_VERSION(10, 3, 1):
	case IP_VERSION(10, 3, 4):
	case IP_VERSION(10, 3, 5):
	case IP_VERSION(10, 3, 6):
	case IP_VERSION(10, 3, 3):
	case IP_VERSION(10, 3, 7):
		amdgpu_device_ip_block_add(adev, &gfx_v10_0_ip_block);
		break;
	case IP_VERSION(11, 0, 0):
	case IP_VERSION(11, 0, 1):
	case IP_VERSION(11, 0, 2):
		amdgpu_device_ip_block_add(adev, &gfx_v11_0_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add gfx ip block(GC_HWIP:0x%x)\n",
			adev->ip_versions[GC_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_sdma_ip_blocks(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[SDMA0_HWIP][0]) {
	case IP_VERSION(4, 0, 0):
	case IP_VERSION(4, 0, 1):
	case IP_VERSION(4, 1, 0):
	case IP_VERSION(4, 1, 1):
	case IP_VERSION(4, 1, 2):
	case IP_VERSION(4, 2, 0):
	case IP_VERSION(4, 2, 2):
	case IP_VERSION(4, 4, 0):
		amdgpu_device_ip_block_add(adev, &sdma_v4_0_ip_block);
		break;
	case IP_VERSION(5, 0, 0):
	case IP_VERSION(5, 0, 1):
	case IP_VERSION(5, 0, 2):
	case IP_VERSION(5, 0, 5):
		amdgpu_device_ip_block_add(adev, &sdma_v5_0_ip_block);
		break;
	case IP_VERSION(5, 2, 0):
	case IP_VERSION(5, 2, 2):
	case IP_VERSION(5, 2, 4):
	case IP_VERSION(5, 2, 5):
	case IP_VERSION(5, 2, 6):
	case IP_VERSION(5, 2, 3):
	case IP_VERSION(5, 2, 1):
	case IP_VERSION(5, 2, 7):
		amdgpu_device_ip_block_add(adev, &sdma_v5_2_ip_block);
		break;
	case IP_VERSION(6, 0, 0):
	case IP_VERSION(6, 0, 1):
	case IP_VERSION(6, 0, 2):
		amdgpu_device_ip_block_add(adev, &sdma_v6_0_ip_block);
		break;
	default:
		dev_err(adev->dev,
			"Failed to add sdma ip block(SDMA0_HWIP:0x%x)\n",
			adev->ip_versions[SDMA0_HWIP][0]);
		return -EINVAL;
	}
	return 0;
}

static int amdgpu_discovery_set_mm_ip_blocks(struct amdgpu_device *adev)
{
	if (adev->ip_versions[VCE_HWIP][0]) {
		switch (adev->ip_versions[UVD_HWIP][0]) {
		case IP_VERSION(7, 0, 0):
		case IP_VERSION(7, 2, 0):
			/* UVD is not supported on vega20 SR-IOV */
			if (!(adev->asic_type == CHIP_VEGA20 && amdgpu_sriov_vf(adev)))
				amdgpu_device_ip_block_add(adev, &uvd_v7_0_ip_block);
			break;
		default:
			dev_err(adev->dev,
				"Failed to add uvd v7 ip block(UVD_HWIP:0x%x)\n",
				adev->ip_versions[UVD_HWIP][0]);
			return -EINVAL;
		}
		switch (adev->ip_versions[VCE_HWIP][0]) {
		case IP_VERSION(4, 0, 0):
		case IP_VERSION(4, 1, 0):
			/* VCE is not supported on vega20 SR-IOV */
			if (!(adev->asic_type == CHIP_VEGA20 && amdgpu_sriov_vf(adev)))
				amdgpu_device_ip_block_add(adev, &vce_v4_0_ip_block);
			break;
		default:
			dev_err(adev->dev,
				"Failed to add VCE v4 ip block(VCE_HWIP:0x%x)\n",
				adev->ip_versions[VCE_HWIP][0]);
			return -EINVAL;
		}
	} else {
		switch (adev->ip_versions[UVD_HWIP][0]) {
		case IP_VERSION(1, 0, 0):
		case IP_VERSION(1, 0, 1):
			amdgpu_device_ip_block_add(adev, &vcn_v1_0_ip_block);
			break;
		case IP_VERSION(2, 0, 0):
		case IP_VERSION(2, 0, 2):
		case IP_VERSION(2, 2, 0):
			amdgpu_device_ip_block_add(adev, &vcn_v2_0_ip_block);
			if (!amdgpu_sriov_vf(adev))
				amdgpu_device_ip_block_add(adev, &jpeg_v2_0_ip_block);
			break;
		case IP_VERSION(2, 0, 3):
			break;
		case IP_VERSION(2, 5, 0):
			amdgpu_device_ip_block_add(adev, &vcn_v2_5_ip_block);
			amdgpu_device_ip_block_add(adev, &jpeg_v2_5_ip_block);
			break;
		case IP_VERSION(2, 6, 0):
			amdgpu_device_ip_block_add(adev, &vcn_v2_6_ip_block);
			amdgpu_device_ip_block_add(adev, &jpeg_v2_6_ip_block);
			break;
		case IP_VERSION(3, 0, 0):
		case IP_VERSION(3, 0, 16):
		case IP_VERSION(3, 1, 1):
		case IP_VERSION(3, 1, 2):
		case IP_VERSION(3, 0, 2):
		case IP_VERSION(3, 0, 192):
			amdgpu_device_ip_block_add(adev, &vcn_v3_0_ip_block);
			if (!amdgpu_sriov_vf(adev))
				amdgpu_device_ip_block_add(adev, &jpeg_v3_0_ip_block);
			break;
		case IP_VERSION(3, 0, 33):
			amdgpu_device_ip_block_add(adev, &vcn_v3_0_ip_block);
			break;
		case IP_VERSION(4, 0, 0):
		case IP_VERSION(4, 0, 2):
		case IP_VERSION(4, 0, 4):
			amdgpu_device_ip_block_add(adev, &vcn_v4_0_ip_block);
			amdgpu_device_ip_block_add(adev, &jpeg_v4_0_ip_block);
			break;
		default:
			dev_err(adev->dev,
				"Failed to add vcn/jpeg ip block(UVD_HWIP:0x%x)\n",
				adev->ip_versions[UVD_HWIP][0]);
			return -EINVAL;
		}
	}
	return 0;
}

static int amdgpu_discovery_set_mes_ip_blocks(struct amdgpu_device *adev)
{
	switch (adev->ip_versions[GC_HWIP][0]) {
	case IP_VERSION(10, 1, 10):
	case IP_VERSION(10, 1, 1):
	case IP_VERSION(10, 1, 2):
	case IP_VERSION(10, 1, 3):
	case IP_VERSION(10, 1, 4):
	case IP_VERSION(10, 3, 0):
	case IP_VERSION(10, 3, 1):
	case IP_VERSION(10, 3, 2):
	case IP_VERSION(10, 3, 3):
	case IP_VERSION(10, 3, 4):
	case IP_VERSION(10, 3, 5):
	case IP_VERSION(10, 3, 6):
		if (amdgpu_mes) {
			amdgpu_device_ip_block_add(adev, &mes_v10_1_ip_block);
			adev->enable_mes = true;
			if (amdgpu_mes_kiq)
				adev->enable_mes_kiq = true;
		}
		break;
	case IP_VERSION(11, 0, 0):
	case IP_VERSION(11, 0, 1):
	case IP_VERSION(11, 0, 2):
		amdgpu_device_ip_block_add(adev, &mes_v11_0_ip_block);
		adev->enable_mes = true;
		adev->enable_mes_kiq = true;
		break;
	default:
		break;
	}
	return 0;
}

int amdgpu_discovery_set_ip_blocks(struct amdgpu_device *adev)
{
	int r;

	switch (adev->asic_type) {
	case CHIP_VEGA10:
		vega10_reg_base_init(adev);
		adev->sdma.num_instances = 2;
		adev->gmc.num_umc = 4;
		adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 0, 0);
		adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 0, 0);
		adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 0, 0);
		adev->ip_versions[SDMA1_HWIP][0] = IP_VERSION(4, 0, 0);
		adev->ip_versions[DF_HWIP][0] = IP_VERSION(2, 1, 0);
		adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(6, 1, 0);
		adev->ip_versions[UMC_HWIP][0] = IP_VERSION(6, 0, 0);
		adev->ip_versions[MP0_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[MP1_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[THM_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 0, 1);
		adev->ip_versions[UVD_HWIP][0] = IP_VERSION(7, 0, 0);
		adev->ip_versions[VCE_HWIP][0] = IP_VERSION(4, 0, 0);
		adev->ip_versions[DCI_HWIP][0] = IP_VERSION(12, 0, 0);
		break;
	case CHIP_VEGA12:
		vega10_reg_base_init(adev);
		adev->sdma.num_instances = 2;
		adev->gmc.num_umc = 4;
		adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 3, 0);
		adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 3, 0);
		adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 0, 1);
		adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 0, 1);
		adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 0, 1);
		adev->ip_versions[SDMA1_HWIP][0] = IP_VERSION(4, 0, 1);
		adev->ip_versions[DF_HWIP][0] = IP_VERSION(2, 5, 0);
		adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(6, 2, 0);
		adev->ip_versions[UMC_HWIP][0] = IP_VERSION(6, 1, 0);
		adev->ip_versions[MP0_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[MP1_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[THM_HWIP][0] = IP_VERSION(9, 0, 0);
		adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(9, 0, 1);
		adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 2, 1);
		adev->ip_versions[UVD_HWIP][0] = IP_VERSION(7, 0, 0);
		adev->ip_versions[VCE_HWIP][0] = IP_VERSION(4, 0, 0);
		adev->ip_versions[DCI_HWIP][0] = IP_VERSION(12, 0, 1);
		break;
	case CHIP_RAVEN:
		vega10_reg_base_init(adev);
		adev->sdma.num_instances = 1;
		adev->vcn.num_vcn_inst = 1;
		adev->gmc.num_umc = 2;
		if (adev->apu_flags & AMD_APU_IS_RAVEN2) {
			adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 2, 0);
			adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 2, 0);
			adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 1, 1);
			adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 1, 1);
			adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 1, 1);
			adev->ip_versions[DF_HWIP][0] = IP_VERSION(2, 1, 1);
			adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(7, 0, 1);
			adev->ip_versions[UMC_HWIP][0] = IP_VERSION(7, 5, 0);
			adev->ip_versions[MP0_HWIP][0] = IP_VERSION(10, 0, 1);
			adev->ip_versions[MP1_HWIP][0] = IP_VERSION(10, 0, 1);
			adev->ip_versions[THM_HWIP][0] = IP_VERSION(10, 1, 0);
			adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(10, 0, 1);
			adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 2, 2);
			adev->ip_versions[UVD_HWIP][0] = IP_VERSION(1, 0, 1);
			adev->ip_versions[DCE_HWIP][0] = IP_VERSION(1, 0, 1);
		} else {
			adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 1, 0);
			adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 1, 0);
			adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 1, 0);
			adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 1, 0);
			adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 1, 0);
			adev->ip_versions[DF_HWIP][0] = IP_VERSION(2, 1, 0);
			adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(7, 0, 0);
			adev->ip_versions[UMC_HWIP][0] = IP_VERSION(7, 0, 0);
			adev->ip_versions[MP0_HWIP][0] = IP_VERSION(10, 0, 0);
			adev->ip_versions[MP1_HWIP][0] = IP_VERSION(10, 0, 0);
			adev->ip_versions[THM_HWIP][0] = IP_VERSION(10, 0, 0);
			adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(10, 0, 0);
			adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 1, 0);
			adev->ip_versions[UVD_HWIP][0] = IP_VERSION(1, 0, 0);
			adev->ip_versions[DCE_HWIP][0] = IP_VERSION(1, 0, 0);
		}
		break;
	case CHIP_VEGA20:
		vega20_reg_base_init(adev);
		adev->sdma.num_instances = 2;
		adev->gmc.num_umc = 8;
		adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 4, 0);
		adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 4, 0);
		adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 2, 0);
		adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 2, 0);
		adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 2, 0);
		adev->ip_versions[SDMA1_HWIP][0] = IP_VERSION(4, 2, 0);
		adev->ip_versions[DF_HWIP][0] = IP_VERSION(3, 6, 0);
		adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(7, 4, 0);
		adev->ip_versions[UMC_HWIP][0] = IP_VERSION(6, 1, 1);
		adev->ip_versions[MP0_HWIP][0] = IP_VERSION(11, 0, 2);
		adev->ip_versions[MP1_HWIP][0] = IP_VERSION(11, 0, 2);
		adev->ip_versions[THM_HWIP][0] = IP_VERSION(11, 0, 2);
		adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(11, 0, 2);
		adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 4, 0);
		adev->ip_versions[UVD_HWIP][0] = IP_VERSION(7, 2, 0);
		adev->ip_versions[UVD_HWIP][1] = IP_VERSION(7, 2, 0);
		adev->ip_versions[VCE_HWIP][0] = IP_VERSION(4, 1, 0);
		adev->ip_versions[DCI_HWIP][0] = IP_VERSION(12, 1, 0);
		break;
	case CHIP_ARCTURUS:
		arct_reg_base_init(adev);
		adev->sdma.num_instances = 8;
		adev->vcn.num_vcn_inst = 2;
		adev->gmc.num_umc = 8;
		adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 4, 1);
		adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 4, 1);
adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 2, 1); adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 2, 1); adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][0] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][1] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][2] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][3] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][4] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][5] = IP_VERSION(4, 2, 2); adev->ip_versions[SDMA1_HWIP][6] = IP_VERSION(4, 2, 2); adev->ip_versions[DF_HWIP][0] = IP_VERSION(3, 6, 1); adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(7, 4, 1); adev->ip_versions[UMC_HWIP][0] = IP_VERSION(6, 1, 2); adev->ip_versions[MP0_HWIP][0] = IP_VERSION(11, 0, 4); adev->ip_versions[MP1_HWIP][0] = IP_VERSION(11, 0, 2); adev->ip_versions[THM_HWIP][0] = IP_VERSION(11, 0, 3); adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(11, 0, 3); adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 4, 1); adev->ip_versions[UVD_HWIP][0] = IP_VERSION(2, 5, 0); adev->ip_versions[UVD_HWIP][1] = IP_VERSION(2, 5, 0); break; case CHIP_ALDEBARAN: aldebaran_reg_base_init(adev); adev->sdma.num_instances = 5; adev->vcn.num_vcn_inst = 2; adev->gmc.num_umc = 4; adev->ip_versions[MMHUB_HWIP][0] = IP_VERSION(9, 4, 2); adev->ip_versions[ATHUB_HWIP][0] = IP_VERSION(9, 4, 2); adev->ip_versions[OSSSYS_HWIP][0] = IP_VERSION(4, 4, 0); adev->ip_versions[HDP_HWIP][0] = IP_VERSION(4, 4, 0); adev->ip_versions[SDMA0_HWIP][0] = IP_VERSION(4, 4, 0); adev->ip_versions[SDMA0_HWIP][1] = IP_VERSION(4, 4, 0); adev->ip_versions[SDMA0_HWIP][2] = IP_VERSION(4, 4, 0); adev->ip_versions[SDMA0_HWIP][3] = IP_VERSION(4, 4, 0); adev->ip_versions[SDMA0_HWIP][4] = IP_VERSION(4, 4, 0); adev->ip_versions[DF_HWIP][0] = IP_VERSION(3, 6, 2); adev->ip_versions[NBIO_HWIP][0] = IP_VERSION(7, 4, 4); adev->ip_versions[UMC_HWIP][0] = IP_VERSION(6, 7, 0); adev->ip_versions[MP0_HWIP][0] = IP_VERSION(13, 0, 2); adev->ip_versions[MP1_HWIP][0] = IP_VERSION(13, 0, 2); adev->ip_versions[THM_HWIP][0] = IP_VERSION(13, 0, 2); adev->ip_versions[SMUIO_HWIP][0] = IP_VERSION(13, 0, 2); adev->ip_versions[GC_HWIP][0] = IP_VERSION(9, 4, 2); adev->ip_versions[UVD_HWIP][0] = IP_VERSION(2, 6, 0); adev->ip_versions[UVD_HWIP][1] = IP_VERSION(2, 6, 0); adev->ip_versions[XGMI_HWIP][0] = IP_VERSION(6, 1, 0); break; default: r = amdgpu_discovery_reg_base_init(adev); if (r) return -EINVAL; amdgpu_discovery_harvest_ip(adev); amdgpu_discovery_get_gfx_info(adev); amdgpu_discovery_get_mall_info(adev); amdgpu_discovery_get_vcn_info(adev); break; } switch (adev->ip_versions[GC_HWIP][0]) { case IP_VERSION(9, 0, 1): case IP_VERSION(9, 2, 1): case IP_VERSION(9, 4, 0): case IP_VERSION(9, 4, 1): case IP_VERSION(9, 4, 2): adev->family = AMDGPU_FAMILY_AI; break; case IP_VERSION(9, 1, 0): case IP_VERSION(9, 2, 2): case IP_VERSION(9, 3, 0): adev->family = AMDGPU_FAMILY_RV; break; case IP_VERSION(10, 1, 10): case IP_VERSION(10, 1, 1): case IP_VERSION(10, 1, 2): case IP_VERSION(10, 1, 3): case IP_VERSION(10, 1, 4): case IP_VERSION(10, 3, 0): case IP_VERSION(10, 3, 2): case IP_VERSION(10, 3, 4): case IP_VERSION(10, 3, 5): adev->family = AMDGPU_FAMILY_NV; break; case IP_VERSION(10, 3, 1): adev->family = AMDGPU_FAMILY_VGH; break; case IP_VERSION(10, 3, 3): adev->family = AMDGPU_FAMILY_YC; break; case IP_VERSION(10, 3, 6): adev->family = AMDGPU_FAMILY_GC_10_3_6; break; case IP_VERSION(10, 3, 7): adev->family = AMDGPU_FAMILY_GC_10_3_7; break; case IP_VERSION(11, 0, 0): case IP_VERSION(11, 0, 2): adev->family = 
AMDGPU_FAMILY_GC_11_0_0; break; case IP_VERSION(11, 0, 1): adev->family = AMDGPU_FAMILY_GC_11_0_1; break; default: return -EINVAL; } switch (adev->ip_versions[GC_HWIP][0]) { case IP_VERSION(9, 1, 0): case IP_VERSION(9, 2, 2): case IP_VERSION(9, 3, 0): case IP_VERSION(10, 1, 3): case IP_VERSION(10, 1, 4): case IP_VERSION(10, 3, 1): case IP_VERSION(10, 3, 3): case IP_VERSION(10, 3, 6): case IP_VERSION(10, 3, 7): case IP_VERSION(11, 0, 1): adev->flags |= AMD_IS_APU; break; default: break; } if (adev->ip_versions[XGMI_HWIP][0] == IP_VERSION(4, 8, 0)) adev->gmc.xgmi.supported = true; /* set NBIO version */ switch (adev->ip_versions[NBIO_HWIP][0]) { case IP_VERSION(6, 1, 0): case IP_VERSION(6, 2, 0): adev->nbio.funcs = &nbio_v6_1_funcs; adev->nbio.hdp_flush_reg = &nbio_v6_1_hdp_flush_reg; break; case IP_VERSION(7, 0, 0): case IP_VERSION(7, 0, 1): case IP_VERSION(2, 5, 0): adev->nbio.funcs = &nbio_v7_0_funcs; adev->nbio.hdp_flush_reg = &nbio_v7_0_hdp_flush_reg; break; case IP_VERSION(7, 4, 0): case IP_VERSION(7, 4, 1): case IP_VERSION(7, 4, 4): adev->nbio.funcs = &nbio_v7_4_funcs; adev->nbio.hdp_flush_reg = &nbio_v7_4_hdp_flush_reg; break; case IP_VERSION(7, 2, 0): case IP_VERSION(7, 2, 1): case IP_VERSION(7, 3, 0): case IP_VERSION(7, 5, 0): case IP_VERSION(7, 5, 1): adev->nbio.funcs = &nbio_v7_2_funcs; adev->nbio.hdp_flush_reg = &nbio_v7_2_hdp_flush_reg; break; case IP_VERSION(2, 1, 1): case IP_VERSION(2, 3, 0): case IP_VERSION(2, 3, 1): case IP_VERSION(2, 3, 2): case IP_VERSION(3, 3, 0): case IP_VERSION(3, 3, 1): case IP_VERSION(3, 3, 2): case IP_VERSION(3, 3, 3): adev->nbio.funcs = &nbio_v2_3_funcs; adev->nbio.hdp_flush_reg = &nbio_v2_3_hdp_flush_reg; break; case IP_VERSION(4, 3, 0): case IP_VERSION(4, 3, 1): adev->nbio.funcs = &nbio_v4_3_funcs; adev->nbio.hdp_flush_reg = &nbio_v4_3_hdp_flush_reg; break; case IP_VERSION(7, 7, 0): adev->nbio.funcs = &nbio_v7_7_funcs; adev->nbio.hdp_flush_reg = &nbio_v7_7_hdp_flush_reg; break; default: break; } switch (adev->ip_versions[HDP_HWIP][0]) { case IP_VERSION(4, 0, 0): case IP_VERSION(4, 0, 1): case IP_VERSION(4, 1, 0): case IP_VERSION(4, 1, 1): case IP_VERSION(4, 1, 2): case IP_VERSION(4, 2, 0): case IP_VERSION(4, 2, 1): case IP_VERSION(4, 4, 0): adev->hdp.funcs = &hdp_v4_0_funcs; break; case IP_VERSION(5, 0, 0): case IP_VERSION(5, 0, 1): case IP_VERSION(5, 0, 2): case IP_VERSION(5, 0, 3): case IP_VERSION(5, 0, 4): case IP_VERSION(5, 2, 0): adev->hdp.funcs = &hdp_v5_0_funcs; break; case IP_VERSION(5, 2, 1): adev->hdp.funcs = &hdp_v5_2_funcs; break; case IP_VERSION(6, 0, 0): case IP_VERSION(6, 0, 1): adev->hdp.funcs = &hdp_v6_0_funcs; break; default: break; } switch (adev->ip_versions[DF_HWIP][0]) { case IP_VERSION(3, 6, 0): case IP_VERSION(3, 6, 1): case IP_VERSION(3, 6, 2): adev->df.funcs = &df_v3_6_funcs; break; case IP_VERSION(2, 1, 0): case IP_VERSION(2, 1, 1): case IP_VERSION(2, 5, 0): case IP_VERSION(3, 5, 1): case IP_VERSION(3, 5, 2): adev->df.funcs = &df_v1_7_funcs; break; default: break; } switch (adev->ip_versions[SMUIO_HWIP][0]) { case IP_VERSION(9, 0, 0): case IP_VERSION(9, 0, 1): case IP_VERSION(10, 0, 0): case IP_VERSION(10, 0, 1): case IP_VERSION(10, 0, 2): adev->smuio.funcs = &smuio_v9_0_funcs; break; case IP_VERSION(11, 0, 0): case IP_VERSION(11, 0, 2): case IP_VERSION(11, 0, 3): case IP_VERSION(11, 0, 4): case IP_VERSION(11, 0, 7): case IP_VERSION(11, 0, 8): adev->smuio.funcs = &smuio_v11_0_funcs; break; case IP_VERSION(11, 0, 6): case IP_VERSION(11, 0, 10): case IP_VERSION(11, 0, 11): case IP_VERSION(11, 5, 0): case IP_VERSION(13, 0, 
1): case IP_VERSION(13, 0, 9): case IP_VERSION(13, 0, 10): adev->smuio.funcs = &smuio_v11_0_6_funcs; break; case IP_VERSION(13, 0, 2): adev->smuio.funcs = &smuio_v13_0_funcs; break; case IP_VERSION(13, 0, 6): case IP_VERSION(13, 0, 8): adev->smuio.funcs = &smuio_v13_0_6_funcs; break; default: break; } switch (adev->ip_versions[LSDMA_HWIP][0]) { case IP_VERSION(6, 0, 0): case IP_VERSION(6, 0, 1): case IP_VERSION(6, 0, 2): adev->lsdma.funcs = &lsdma_v6_0_funcs; break; default: break; } r = amdgpu_discovery_set_common_ip_blocks(adev); if (r) return r; r = amdgpu_discovery_set_gmc_ip_blocks(adev); if (r) return r; /* For SR-IOV, PSP needs to be initialized before IH */ if (amdgpu_sriov_vf(adev)) { r = amdgpu_discovery_set_psp_ip_blocks(adev); if (r) return r; r = amdgpu_discovery_set_ih_ip_blocks(adev); if (r) return r; } else { r = amdgpu_discovery_set_ih_ip_blocks(adev); if (r) return r; if (likely(adev->firmware.load_type == AMDGPU_FW_LOAD_PSP)) { r = amdgpu_discovery_set_psp_ip_blocks(adev); if (r) return r; } } if (likely(adev->firmware.load_type == AMDGPU_FW_LOAD_PSP)) { r = amdgpu_discovery_set_smu_ip_blocks(adev); if (r) return r; } r = amdgpu_discovery_set_display_ip_blocks(adev); if (r) return r; r = amdgpu_discovery_set_gc_ip_blocks(adev); if (r) return r; r = amdgpu_discovery_set_sdma_ip_blocks(adev); if (r) return r; if ((adev->firmware.load_type == AMDGPU_FW_LOAD_DIRECT && !amdgpu_sriov_vf(adev)) || (adev->firmware.load_type == AMDGPU_FW_LOAD_RLC_BACKDOOR_AUTO && amdgpu_dpm == 1)) { r = amdgpu_discovery_set_smu_ip_blocks(adev); if (r) return r; } r = amdgpu_discovery_set_mm_ip_blocks(adev); if (r) return r; r = amdgpu_discovery_set_mes_ip_blocks(adev); if (r) return r; return 0; }