mirror of
https://github.com/torvalds/linux.git
synced 2024-11-25 21:51:40 +00:00
Merge tag 'drm-next-5.3-2019-07-18' of git://people.freedesktop.org/~agd5f/linux into drm-next
drm-next-5.3-2019-07-18: amdgpu: - Navi DC fix for secondary adapters - Fix Navi flickering with high res panels - Navi SMU fixes - Vega20 SMU fixes - Fixes for audio hotplug on HG systems - Fix for potential integer overflows on large buffer migrations - debugfs fixes for umr - Various other small fixes amdkfd: - Apply noretry setting consistently - Fix hang in eviction - Properly clean up GWS on uninit UAPI: - clarify a comment on ctx priority Signed-off-by: Dave Airlie <airlied@redhat.com> From: Alex Deucher <alexdeucher@gmail.com> Link: https://patchwork.freedesktop.org/patch/msgid/20190718211525.3374-1-alexander.deucher@amd.com
This commit is contained in:
commit
9fb7dc73b9
@ -164,6 +164,7 @@ extern int amdgpu_async_gfx_ring;
|
||||
extern int amdgpu_mcbp;
|
||||
extern int amdgpu_discovery;
|
||||
extern int amdgpu_mes;
|
||||
extern int amdgpu_noretry;
|
||||
|
||||
#ifdef CONFIG_DRM_AMDGPU_SI
|
||||
extern int amdgpu_si_support;
|
||||
|
@ -106,10 +106,10 @@ static int amdgpu_debugfs_process_reg_op(bool read, struct file *f,
|
||||
ssize_t result = 0;
|
||||
int r;
|
||||
bool pm_pg_lock, use_bank, use_ring;
|
||||
unsigned instance_bank, sh_bank, se_bank, me, pipe, queue;
|
||||
unsigned instance_bank, sh_bank, se_bank, me, pipe, queue, vmid;
|
||||
|
||||
pm_pg_lock = use_bank = use_ring = false;
|
||||
instance_bank = sh_bank = se_bank = me = pipe = queue = 0;
|
||||
instance_bank = sh_bank = se_bank = me = pipe = queue = vmid = 0;
|
||||
|
||||
if (size & 0x3 || *pos & 0x3 ||
|
||||
((*pos & (1ULL << 62)) && (*pos & (1ULL << 61))))
|
||||
@ -135,6 +135,7 @@ static int amdgpu_debugfs_process_reg_op(bool read, struct file *f,
|
||||
me = (*pos & GENMASK_ULL(33, 24)) >> 24;
|
||||
pipe = (*pos & GENMASK_ULL(43, 34)) >> 34;
|
||||
queue = (*pos & GENMASK_ULL(53, 44)) >> 44;
|
||||
vmid = (*pos & GENMASK_ULL(58, 54)) >> 54;
|
||||
|
||||
use_ring = 1;
|
||||
} else {
|
||||
@ -152,7 +153,7 @@ static int amdgpu_debugfs_process_reg_op(bool read, struct file *f,
|
||||
sh_bank, instance_bank);
|
||||
} else if (use_ring) {
|
||||
mutex_lock(&adev->srbm_mutex);
|
||||
amdgpu_gfx_select_me_pipe_q(adev, me, pipe, queue);
|
||||
amdgpu_gfx_select_me_pipe_q(adev, me, pipe, queue, vmid);
|
||||
}
|
||||
|
||||
if (pm_pg_lock)
|
||||
@ -185,7 +186,7 @@ end:
|
||||
amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff);
|
||||
mutex_unlock(&adev->grbm_idx_mutex);
|
||||
} else if (use_ring) {
|
||||
amdgpu_gfx_select_me_pipe_q(adev, 0, 0, 0);
|
||||
amdgpu_gfx_select_me_pipe_q(adev, 0, 0, 0, 0);
|
||||
mutex_unlock(&adev->srbm_mutex);
|
||||
}
|
||||
|
||||
|
@ -2537,6 +2537,7 @@ int amdgpu_device_init(struct amdgpu_device *adev,
|
||||
hash_init(adev->mn_hash);
|
||||
mutex_init(&adev->lock_reset);
|
||||
mutex_init(&adev->virt.dpm_mutex);
|
||||
mutex_init(&adev->psp.mutex);
|
||||
|
||||
r = amdgpu_device_check_arguments(adev);
|
||||
if (r)
|
||||
|
@ -123,7 +123,7 @@ static int hw_id_map[MAX_HWIP] = {
|
||||
[UVD_HWIP] = UVD_HWID,
|
||||
[VCE_HWIP] = VCE_HWID,
|
||||
[DF_HWIP] = DF_HWID,
|
||||
[DCE_HWIP] = DCEAZ_HWID,
|
||||
[DCE_HWIP] = DMU_HWID,
|
||||
[OSSSYS_HWIP] = OSSSYS_HWID,
|
||||
[SMUIO_HWIP] = SMUIO_HWID,
|
||||
[PWR_HWIP] = PWR_HWID,
|
||||
|
@ -140,8 +140,9 @@ uint amdgpu_smu_memory_pool_size = 0;
|
||||
uint amdgpu_dc_feature_mask = 0;
|
||||
int amdgpu_async_gfx_ring = 1;
|
||||
int amdgpu_mcbp = 0;
|
||||
int amdgpu_discovery = 0;
|
||||
int amdgpu_discovery = -1;
|
||||
int amdgpu_mes = 0;
|
||||
int amdgpu_noretry;
|
||||
|
||||
struct amdgpu_mgpu_info mgpu_info = {
|
||||
.mutex = __MUTEX_INITIALIZER(mgpu_info.mutex),
|
||||
@ -593,6 +594,7 @@ module_param_named(mcbp, amdgpu_mcbp, int, 0444);
|
||||
/**
|
||||
* DOC: discovery (int)
|
||||
* Allow driver to discover hardware IP information from IP Discovery table at the top of VRAM.
|
||||
* (-1 = auto (default), 0 = disabled, 1 = enabled)
|
||||
*/
|
||||
MODULE_PARM_DESC(discovery,
|
||||
"Allow driver to discover hardware IPs from IP Discovery table at the top of VRAM");
|
||||
@ -607,6 +609,10 @@ MODULE_PARM_DESC(mes,
|
||||
"Enable Micro Engine Scheduler (0 = disabled (default), 1 = enabled)");
|
||||
module_param_named(mes, amdgpu_mes, int, 0444);
|
||||
|
||||
MODULE_PARM_DESC(noretry,
|
||||
"Disable retry faults (0 = retry enabled (default), 1 = retry disabled)");
|
||||
module_param_named(noretry, amdgpu_noretry, int, 0644);
|
||||
|
||||
#ifdef CONFIG_HSA_AMD
|
||||
/**
|
||||
* DOC: sched_policy (int)
|
||||
@ -682,17 +688,6 @@ module_param(ignore_crat, int, 0444);
|
||||
MODULE_PARM_DESC(ignore_crat,
|
||||
"Ignore CRAT table during KFD initialization (0 = use CRAT (default), 1 = ignore CRAT)");
|
||||
|
||||
/**
|
||||
* DOC: noretry (int)
|
||||
* This parameter sets sh_mem_config.retry_disable. Default value, 0, enables retry.
|
||||
* Setting 1 disables retry.
|
||||
* Retry is needed for recoverable page faults.
|
||||
*/
|
||||
int noretry;
|
||||
module_param(noretry, int, 0644);
|
||||
MODULE_PARM_DESC(noretry,
|
||||
"Set sh_mem_config.retry_disable on Vega10 (0 = retry enabled (default), 1 = retry disabled)");
|
||||
|
||||
/**
|
||||
* DOC: halt_if_hws_hang (int)
|
||||
* Halt if HWS hang is detected. Default value, 0, disables the halt on hang.
|
||||
|
@ -195,7 +195,7 @@ struct amdgpu_gfx_funcs {
|
||||
uint32_t wave, uint32_t start, uint32_t size,
|
||||
uint32_t *dst);
|
||||
void (*select_me_pipe_q)(struct amdgpu_device *adev, u32 me, u32 pipe,
|
||||
u32 queue);
|
||||
u32 queue, u32 vmid);
|
||||
};
|
||||
|
||||
struct amdgpu_ngg_buf {
|
||||
@ -327,7 +327,7 @@ struct amdgpu_gfx {
|
||||
|
||||
#define amdgpu_gfx_get_gpu_clock_counter(adev) (adev)->gfx.funcs->get_gpu_clock_counter((adev))
|
||||
#define amdgpu_gfx_select_se_sh(adev, se, sh, instance) (adev)->gfx.funcs->select_se_sh((adev), (se), (sh), (instance))
|
||||
#define amdgpu_gfx_select_me_pipe_q(adev, me, pipe, q) (adev)->gfx.funcs->select_me_pipe_q((adev), (me), (pipe), (q))
|
||||
#define amdgpu_gfx_select_me_pipe_q(adev, me, pipe, q, vmid) (adev)->gfx.funcs->select_me_pipe_q((adev), (me), (pipe), (q), (vmid))
|
||||
|
||||
/**
|
||||
* amdgpu_gfx_create_bitmask - create a bitmask
|
||||
|
@ -2077,11 +2077,6 @@ static ssize_t amdgpu_hwmon_show_sclk(struct device *dev,
|
||||
(ddev->switch_power_state != DRM_SWITCH_POWER_ON))
|
||||
return -EINVAL;
|
||||
|
||||
/* sanity check PP is enabled */
|
||||
if (!(adev->powerplay.pp_funcs &&
|
||||
adev->powerplay.pp_funcs->read_sensor))
|
||||
return -EINVAL;
|
||||
|
||||
/* get the sclk */
|
||||
r = amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GFX_SCLK,
|
||||
(void *)&sclk, &size);
|
||||
@ -2112,11 +2107,6 @@ static ssize_t amdgpu_hwmon_show_mclk(struct device *dev,
|
||||
(ddev->switch_power_state != DRM_SWITCH_POWER_ON))
|
||||
return -EINVAL;
|
||||
|
||||
/* sanity check PP is enabled */
|
||||
if (!(adev->powerplay.pp_funcs &&
|
||||
adev->powerplay.pp_funcs->read_sensor))
|
||||
return -EINVAL;
|
||||
|
||||
/* get the sclk */
|
||||
r = amdgpu_dpm_read_sensor(adev, AMDGPU_PP_SENSOR_GFX_MCLK,
|
||||
(void *)&mclk, &size);
|
||||
@ -2996,13 +2986,10 @@ void amdgpu_pm_compute_clocks(struct amdgpu_device *adev)
|
||||
}
|
||||
|
||||
if (is_support_sw_smu(adev)) {
|
||||
struct smu_context *smu = &adev->smu;
|
||||
struct smu_dpm_context *smu_dpm = &adev->smu.smu_dpm;
|
||||
mutex_lock(&(smu->mutex));
|
||||
smu_handle_task(&adev->smu,
|
||||
smu_dpm->dpm_level,
|
||||
AMD_PP_TASK_DISPLAY_CONFIG_CHANGE);
|
||||
mutex_unlock(&(smu->mutex));
|
||||
} else {
|
||||
if (adev->powerplay.pp_funcs->dispatch_tasks) {
|
||||
if (!amdgpu_device_has_dc_support(adev)) {
|
||||
|
@ -130,6 +130,8 @@ psp_cmd_submit_buf(struct psp_context *psp,
|
||||
int index;
|
||||
int timeout = 2000;
|
||||
|
||||
mutex_lock(&psp->mutex);
|
||||
|
||||
memset(psp->cmd_buf_mem, 0, PSP_CMD_BUFFER_SIZE);
|
||||
|
||||
memcpy(psp->cmd_buf_mem, cmd, sizeof(struct psp_gfx_cmd_resp));
|
||||
@ -139,6 +141,7 @@ psp_cmd_submit_buf(struct psp_context *psp,
|
||||
fence_mc_addr, index);
|
||||
if (ret) {
|
||||
atomic_dec(&psp->fence_value);
|
||||
mutex_unlock(&psp->mutex);
|
||||
return ret;
|
||||
}
|
||||
|
||||
@ -161,8 +164,10 @@ psp_cmd_submit_buf(struct psp_context *psp,
|
||||
ucode->ucode_id);
|
||||
DRM_WARN("psp command failed and response status is (%d)\n",
|
||||
psp->cmd_buf_mem->resp.status);
|
||||
if (!timeout)
|
||||
if (!timeout) {
|
||||
mutex_unlock(&psp->mutex);
|
||||
return -EINVAL;
|
||||
}
|
||||
}
|
||||
|
||||
/* get xGMI session id from response buffer */
|
||||
@ -172,6 +177,7 @@ psp_cmd_submit_buf(struct psp_context *psp,
|
||||
ucode->tmr_mc_addr_lo = psp->cmd_buf_mem->resp.fw_addr_lo;
|
||||
ucode->tmr_mc_addr_hi = psp->cmd_buf_mem->resp.fw_addr_hi;
|
||||
}
|
||||
mutex_unlock(&psp->mutex);
|
||||
|
||||
return ret;
|
||||
}
|
||||
@ -763,6 +769,15 @@ static int psp_hw_start(struct psp_context *psp)
|
||||
int ret;
|
||||
|
||||
if (!amdgpu_sriov_vf(adev) || !adev->in_gpu_reset) {
|
||||
if (psp->kdb_bin_size &&
|
||||
(psp->funcs->bootloader_load_kdb != NULL)) {
|
||||
ret = psp_bootloader_load_kdb(psp);
|
||||
if (ret) {
|
||||
DRM_ERROR("PSP load kdb failed!\n");
|
||||
return ret;
|
||||
}
|
||||
}
|
||||
|
||||
ret = psp_bootloader_load_sysdrv(psp);
|
||||
if (ret) {
|
||||
DRM_ERROR("PSP load sysdrv failed!\n");
|
||||
@ -1188,10 +1203,16 @@ failed:
|
||||
|
||||
int psp_gpu_reset(struct amdgpu_device *adev)
|
||||
{
|
||||
int ret;
|
||||
|
||||
if (adev->firmware.load_type != AMDGPU_FW_LOAD_PSP)
|
||||
return 0;
|
||||
|
||||
return psp_mode1_reset(&adev->psp);
|
||||
mutex_lock(&adev->psp.mutex);
|
||||
ret = psp_mode1_reset(&adev->psp);
|
||||
mutex_unlock(&adev->psp.mutex);
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
int psp_rlc_autoload_start(struct psp_context *psp)
|
||||
|
@ -42,6 +42,12 @@ struct psp_context;
|
||||
struct psp_xgmi_node_info;
|
||||
struct psp_xgmi_topology_info;
|
||||
|
||||
enum psp_bootloader_cmd {
|
||||
PSP_BL__LOAD_SYSDRV = 0x10000,
|
||||
PSP_BL__LOAD_SOSDRV = 0x20000,
|
||||
PSP_BL__LOAD_KEY_DATABASE = 0x80000,
|
||||
};
|
||||
|
||||
enum psp_ring_type
|
||||
{
|
||||
PSP_RING_TYPE__INVALID = 0,
|
||||
@ -73,6 +79,7 @@ enum psp_reg_prog_id {
|
||||
struct psp_funcs
|
||||
{
|
||||
int (*init_microcode)(struct psp_context *psp);
|
||||
int (*bootloader_load_kdb)(struct psp_context *psp);
|
||||
int (*bootloader_load_sysdrv)(struct psp_context *psp);
|
||||
int (*bootloader_load_sos)(struct psp_context *psp);
|
||||
int (*ring_init)(struct psp_context *psp, enum psp_ring_type ring_type);
|
||||
@ -156,9 +163,11 @@ struct psp_context
|
||||
uint32_t sys_bin_size;
|
||||
uint32_t sos_bin_size;
|
||||
uint32_t toc_bin_size;
|
||||
uint32_t kdb_bin_size;
|
||||
uint8_t *sys_start_addr;
|
||||
uint8_t *sos_start_addr;
|
||||
uint8_t *toc_start_addr;
|
||||
uint8_t *kdb_start_addr;
|
||||
|
||||
/* tmr buffer */
|
||||
struct amdgpu_bo *tmr_bo;
|
||||
@ -201,6 +210,7 @@ struct psp_context
|
||||
uint8_t *ta_ras_start_addr;
|
||||
struct psp_xgmi_context xgmi_context;
|
||||
struct psp_ras_context ras;
|
||||
struct mutex mutex;
|
||||
};
|
||||
|
||||
struct amdgpu_psp_funcs {
|
||||
@ -219,6 +229,8 @@ struct amdgpu_psp_funcs {
|
||||
(psp)->funcs->compare_sram_data((psp), (ucode), (type))
|
||||
#define psp_init_microcode(psp) \
|
||||
((psp)->funcs->init_microcode ? (psp)->funcs->init_microcode((psp)) : 0)
|
||||
#define psp_bootloader_load_kdb(psp) \
|
||||
((psp)->funcs->bootloader_load_kdb ? (psp)->funcs->bootloader_load_kdb((psp)) : 0)
|
||||
#define psp_bootloader_load_sysdrv(psp) \
|
||||
((psp)->funcs->bootloader_load_sysdrv ? (psp)->funcs->bootloader_load_sysdrv((psp)) : 0)
|
||||
#define psp_bootloader_load_sos(psp) \
|
||||
|
@ -391,6 +391,7 @@ int amdgpu_ttm_copy_mem_to_mem(struct amdgpu_device *adev,
|
||||
src_node_start = amdgpu_mm_node_addr(src->bo, ++src_mm,
|
||||
src->mem);
|
||||
src_node_size = (src_mm->size << PAGE_SHIFT);
|
||||
src_page_offset = 0;
|
||||
} else {
|
||||
src_node_start += cur_size;
|
||||
src_page_offset = src_node_start & (PAGE_SIZE - 1);
|
||||
@ -400,6 +401,7 @@ int amdgpu_ttm_copy_mem_to_mem(struct amdgpu_device *adev,
|
||||
dst_node_start = amdgpu_mm_node_addr(dst->bo, ++dst_mm,
|
||||
dst->mem);
|
||||
dst_node_size = (dst_mm->size << PAGE_SHIFT);
|
||||
dst_page_offset = 0;
|
||||
} else {
|
||||
dst_node_start += cur_size;
|
||||
dst_page_offset = dst_node_start & (PAGE_SIZE - 1);
|
||||
@ -487,6 +489,7 @@ static int amdgpu_move_vram_ram(struct ttm_buffer_object *bo, bool evict,
|
||||
placements.flags = TTM_PL_MASK_CACHING | TTM_PL_FLAG_TT;
|
||||
r = ttm_bo_mem_space(bo, &placement, &tmp_mem, ctx);
|
||||
if (unlikely(r)) {
|
||||
pr_err("Failed to find GTT space for blit from VRAM\n");
|
||||
return r;
|
||||
}
|
||||
|
||||
@ -545,6 +548,7 @@ static int amdgpu_move_ram_vram(struct ttm_buffer_object *bo, bool evict,
|
||||
placements.flags = TTM_PL_MASK_CACHING | TTM_PL_FLAG_TT;
|
||||
r = ttm_bo_mem_space(bo, &placement, &tmp_mem, ctx);
|
||||
if (unlikely(r)) {
|
||||
pr_err("Failed to find GTT space for blit to VRAM\n");
|
||||
return r;
|
||||
}
|
||||
|
||||
@ -564,6 +568,30 @@ out_cleanup:
|
||||
return r;
|
||||
}
|
||||
|
||||
/**
|
||||
* amdgpu_mem_visible - Check that memory can be accessed by ttm_bo_move_memcpy
|
||||
*
|
||||
* Called by amdgpu_bo_move()
|
||||
*/
|
||||
static bool amdgpu_mem_visible(struct amdgpu_device *adev,
|
||||
struct ttm_mem_reg *mem)
|
||||
{
|
||||
struct drm_mm_node *nodes = mem->mm_node;
|
||||
|
||||
if (mem->mem_type == TTM_PL_SYSTEM ||
|
||||
mem->mem_type == TTM_PL_TT)
|
||||
return true;
|
||||
if (mem->mem_type != TTM_PL_VRAM)
|
||||
return false;
|
||||
|
||||
/* ttm_mem_reg_ioremap only supports contiguous memory */
|
||||
if (nodes->size != mem->num_pages)
|
||||
return false;
|
||||
|
||||
return ((nodes->start + nodes->size) << PAGE_SHIFT)
|
||||
<= adev->gmc.visible_vram_size;
|
||||
}
|
||||
|
||||
/**
|
||||
* amdgpu_bo_move - Move a buffer object to a new memory location
|
||||
*
|
||||
@ -608,8 +636,10 @@ static int amdgpu_bo_move(struct ttm_buffer_object *bo, bool evict,
|
||||
return 0;
|
||||
}
|
||||
|
||||
if (!adev->mman.buffer_funcs_enabled)
|
||||
if (!adev->mman.buffer_funcs_enabled) {
|
||||
r = -ENODEV;
|
||||
goto memcpy;
|
||||
}
|
||||
|
||||
if (old_mem->mem_type == TTM_PL_VRAM &&
|
||||
new_mem->mem_type == TTM_PL_SYSTEM) {
|
||||
@ -624,10 +654,16 @@ static int amdgpu_bo_move(struct ttm_buffer_object *bo, bool evict,
|
||||
|
||||
if (r) {
|
||||
memcpy:
|
||||
r = ttm_bo_move_memcpy(bo, ctx, new_mem);
|
||||
if (r) {
|
||||
/* Check that all memory is CPU accessible */
|
||||
if (!amdgpu_mem_visible(adev, old_mem) ||
|
||||
!amdgpu_mem_visible(adev, new_mem)) {
|
||||
pr_err("Move buffer fallback to memcpy unavailable\n");
|
||||
return r;
|
||||
}
|
||||
|
||||
r = ttm_bo_move_memcpy(bo, ctx, new_mem);
|
||||
if (r)
|
||||
return r;
|
||||
}
|
||||
|
||||
if (bo->type == ttm_bo_type_device &&
|
||||
@ -2059,9 +2095,9 @@ int amdgpu_fill_buffer(struct amdgpu_bo *bo,
|
||||
mm_node = bo->tbo.mem.mm_node;
|
||||
num_loops = 0;
|
||||
while (num_pages) {
|
||||
uint32_t byte_count = mm_node->size << PAGE_SHIFT;
|
||||
uint64_t byte_count = mm_node->size << PAGE_SHIFT;
|
||||
|
||||
num_loops += DIV_ROUND_UP(byte_count, max_bytes);
|
||||
num_loops += DIV_ROUND_UP_ULL(byte_count, max_bytes);
|
||||
num_pages -= mm_node->size;
|
||||
++mm_node;
|
||||
}
|
||||
@ -2087,12 +2123,13 @@ int amdgpu_fill_buffer(struct amdgpu_bo *bo,
|
||||
mm_node = bo->tbo.mem.mm_node;
|
||||
|
||||
while (num_pages) {
|
||||
uint32_t byte_count = mm_node->size << PAGE_SHIFT;
|
||||
uint64_t byte_count = mm_node->size << PAGE_SHIFT;
|
||||
uint64_t dst_addr;
|
||||
|
||||
dst_addr = amdgpu_mm_node_addr(&bo->tbo, mm_node, &bo->tbo.mem);
|
||||
while (byte_count) {
|
||||
uint32_t cur_size_in_bytes = min(byte_count, max_bytes);
|
||||
uint32_t cur_size_in_bytes = min_t(uint64_t, byte_count,
|
||||
max_bytes);
|
||||
|
||||
amdgpu_emit_fill_buffer(adev, &job->ibs[0], src_data,
|
||||
dst_addr, cur_size_in_bytes);
|
||||
|
@ -262,6 +262,12 @@ void amdgpu_ucode_print_psp_hdr(const struct common_firmware_header *hdr)
|
||||
le32_to_cpu(psp_hdr_v1_1->toc_offset_bytes));
|
||||
DRM_DEBUG("toc_size_bytes: %u\n",
|
||||
le32_to_cpu(psp_hdr_v1_1->toc_size_bytes));
|
||||
DRM_DEBUG("kdb_header_version: %u\n",
|
||||
le32_to_cpu(psp_hdr_v1_1->kdb_header_version));
|
||||
DRM_DEBUG("kdb_offset_bytes: %u\n",
|
||||
le32_to_cpu(psp_hdr_v1_1->kdb_offset_bytes));
|
||||
DRM_DEBUG("kdb_size_bytes: %u\n",
|
||||
le32_to_cpu(psp_hdr_v1_1->kdb_size_bytes));
|
||||
}
|
||||
} else {
|
||||
DRM_ERROR("Unknown PSP ucode version: %u.%u\n",
|
||||
|
@ -85,6 +85,9 @@ struct psp_firmware_header_v1_1 {
|
||||
uint32_t toc_header_version;
|
||||
uint32_t toc_offset_bytes;
|
||||
uint32_t toc_size_bytes;
|
||||
uint32_t kdb_header_version;
|
||||
uint32_t kdb_offset_bytes;
|
||||
uint32_t kdb_size_bytes;
|
||||
};
|
||||
|
||||
/* version_major=1, version_minor=0 */
|
||||
|
@ -390,7 +390,8 @@ static uint32_t parse_clk(char *buf, bool min)
|
||||
if (!ptr)
|
||||
break;
|
||||
ptr+=2;
|
||||
clk = simple_strtoul(ptr, NULL, 10);
|
||||
if (kstrtou32(ptr, 10, &clk))
|
||||
return 0;
|
||||
} while (!min);
|
||||
|
||||
return clk * 100;
|
||||
|
@ -109,6 +109,13 @@ static const struct soc15_reg_golden golden_settings_gc_10_0_nv10[] =
|
||||
/* Pending on emulation bring up */
|
||||
};
|
||||
|
||||
#define DEFAULT_SH_MEM_CONFIG \
|
||||
((SH_MEM_ADDRESS_MODE_64 << SH_MEM_CONFIG__ADDRESS_MODE__SHIFT) | \
|
||||
(SH_MEM_ALIGNMENT_MODE_UNALIGNED << SH_MEM_CONFIG__ALIGNMENT_MODE__SHIFT) | \
|
||||
(SH_MEM_RETRY_MODE_ALL << SH_MEM_CONFIG__RETRY_MODE__SHIFT) | \
|
||||
(3 << SH_MEM_CONFIG__INITIAL_INST_PREFETCH__SHIFT))
|
||||
|
||||
|
||||
static void gfx_v10_0_set_ring_funcs(struct amdgpu_device *adev);
|
||||
static void gfx_v10_0_set_irq_funcs(struct amdgpu_device *adev);
|
||||
static void gfx_v10_0_set_gds_init(struct amdgpu_device *adev);
|
||||
@ -995,6 +1002,12 @@ static void gfx_v10_0_read_wave_vgprs(struct amdgpu_device *adev, uint32_t simd,
|
||||
start + SQIND_WAVE_VGPRS_OFFSET, size, dst);
|
||||
}
|
||||
|
||||
static void gfx_v10_0_select_me_pipe_q(struct amdgpu_device *adev,
|
||||
u32 me, u32 pipe, u32 q, u32 vm)
|
||||
{
|
||||
nv_grbm_select(adev, me, pipe, q, vm);
|
||||
}
|
||||
|
||||
|
||||
static const struct amdgpu_gfx_funcs gfx_v10_0_gfx_funcs = {
|
||||
.get_gpu_clock_counter = &gfx_v10_0_get_gpu_clock_counter,
|
||||
@ -1002,6 +1015,7 @@ static const struct amdgpu_gfx_funcs gfx_v10_0_gfx_funcs = {
|
||||
.read_wave_data = &gfx_v10_0_read_wave_data,
|
||||
.read_wave_sgprs = &gfx_v10_0_read_wave_sgprs,
|
||||
.read_wave_vgprs = &gfx_v10_0_read_wave_vgprs,
|
||||
.select_me_pipe_q = &gfx_v10_0_select_me_pipe_q,
|
||||
};
|
||||
|
||||
static void gfx_v10_0_gpu_early_init(struct amdgpu_device *adev)
|
||||
@ -1408,7 +1422,6 @@ static u32 gfx_v10_0_init_pa_sc_tile_steering_override(struct amdgpu_device *ade
|
||||
static void gfx_v10_0_init_compute_vmid(struct amdgpu_device *adev)
|
||||
{
|
||||
int i;
|
||||
uint32_t sh_mem_config;
|
||||
uint32_t sh_mem_bases;
|
||||
|
||||
/*
|
||||
@ -1419,15 +1432,11 @@ static void gfx_v10_0_init_compute_vmid(struct amdgpu_device *adev)
|
||||
*/
|
||||
sh_mem_bases = DEFAULT_SH_MEM_BASES | (DEFAULT_SH_MEM_BASES << 16);
|
||||
|
||||
sh_mem_config = SH_MEM_ADDRESS_MODE_64 |
|
||||
SH_MEM_ALIGNMENT_MODE_UNALIGNED <<
|
||||
SH_MEM_CONFIG__ALIGNMENT_MODE__SHIFT;
|
||||
|
||||
mutex_lock(&adev->srbm_mutex);
|
||||
for (i = FIRST_COMPUTE_VMID; i < LAST_COMPUTE_VMID; i++) {
|
||||
nv_grbm_select(adev, 0, 0, 0, i);
|
||||
/* CP and shaders */
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_CONFIG, sh_mem_config);
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_CONFIG, DEFAULT_SH_MEM_CONFIG);
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_BASES, sh_mem_bases);
|
||||
}
|
||||
nv_grbm_select(adev, 0, 0, 0, 0);
|
||||
@ -1520,17 +1529,8 @@ static void gfx_v10_0_constants_init(struct amdgpu_device *adev)
|
||||
for (i = 0; i < adev->vm_manager.id_mgr[AMDGPU_GFXHUB].num_ids; i++) {
|
||||
nv_grbm_select(adev, 0, 0, 0, i);
|
||||
/* CP and shaders */
|
||||
if (i == 0) {
|
||||
tmp = REG_SET_FIELD(0, SH_MEM_CONFIG, ALIGNMENT_MODE,
|
||||
SH_MEM_ALIGNMENT_MODE_UNALIGNED);
|
||||
tmp = REG_SET_FIELD(tmp, SH_MEM_CONFIG, RETRY_MODE, 0);
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_CONFIG, tmp);
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_BASES, 0);
|
||||
} else {
|
||||
tmp = REG_SET_FIELD(0, SH_MEM_CONFIG, ALIGNMENT_MODE,
|
||||
SH_MEM_ALIGNMENT_MODE_UNALIGNED);
|
||||
tmp = REG_SET_FIELD(tmp, SH_MEM_CONFIG, RETRY_MODE, 0);
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_CONFIG, tmp);
|
||||
WREG32_SOC15(GC, 0, mmSH_MEM_CONFIG, DEFAULT_SH_MEM_CONFIG);
|
||||
if (i != 0) {
|
||||
tmp = REG_SET_FIELD(0, SH_MEM_BASES, PRIVATE_BASE,
|
||||
(adev->gmc.private_aperture_start >> 48));
|
||||
tmp = REG_SET_FIELD(tmp, SH_MEM_BASES, SHARED_BASE,
|
||||
|
@ -3043,7 +3043,7 @@ static void gfx_v6_0_read_wave_sgprs(struct amdgpu_device *adev, uint32_t simd,
|
||||
}
|
||||
|
||||
static void gfx_v6_0_select_me_pipe_q(struct amdgpu_device *adev,
|
||||
u32 me, u32 pipe, u32 q)
|
||||
u32 me, u32 pipe, u32 q, u32 vm)
|
||||
{
|
||||
DRM_INFO("Not implemented\n");
|
||||
}
|
||||
|
@ -4169,9 +4169,9 @@ static void gfx_v7_0_read_wave_sgprs(struct amdgpu_device *adev, uint32_t simd,
|
||||
}
|
||||
|
||||
static void gfx_v7_0_select_me_pipe_q(struct amdgpu_device *adev,
|
||||
u32 me, u32 pipe, u32 q)
|
||||
u32 me, u32 pipe, u32 q, u32 vm)
|
||||
{
|
||||
cik_srbm_select(adev, me, pipe, q, 0);
|
||||
cik_srbm_select(adev, me, pipe, q, vm);
|
||||
}
|
||||
|
||||
static const struct amdgpu_gfx_funcs gfx_v7_0_gfx_funcs = {
|
||||
|
@ -3436,9 +3436,9 @@ static void gfx_v8_0_select_se_sh(struct amdgpu_device *adev,
|
||||
}
|
||||
|
||||
static void gfx_v8_0_select_me_pipe_q(struct amdgpu_device *adev,
|
||||
u32 me, u32 pipe, u32 q)
|
||||
u32 me, u32 pipe, u32 q, u32 vm)
|
||||
{
|
||||
vi_srbm_select(adev, me, pipe, q, 0);
|
||||
vi_srbm_select(adev, me, pipe, q, vm);
|
||||
}
|
||||
|
||||
static u32 gfx_v8_0_get_rb_active_bitmap(struct amdgpu_device *adev)
|
||||
|
@ -1313,9 +1313,9 @@ static void gfx_v9_0_read_wave_vgprs(struct amdgpu_device *adev, uint32_t simd,
|
||||
}
|
||||
|
||||
static void gfx_v9_0_select_me_pipe_q(struct amdgpu_device *adev,
|
||||
u32 me, u32 pipe, u32 q)
|
||||
u32 me, u32 pipe, u32 q, u32 vm)
|
||||
{
|
||||
soc15_grbm_select(adev, me, pipe, q, 0);
|
||||
soc15_grbm_select(adev, me, pipe, q, vm);
|
||||
}
|
||||
|
||||
static const struct amdgpu_gfx_funcs gfx_v9_0_gfx_funcs = {
|
||||
@ -1942,11 +1942,15 @@ static void gfx_v9_0_constants_init(struct amdgpu_device *adev)
|
||||
if (i == 0) {
|
||||
tmp = REG_SET_FIELD(0, SH_MEM_CONFIG, ALIGNMENT_MODE,
|
||||
SH_MEM_ALIGNMENT_MODE_UNALIGNED);
|
||||
tmp = REG_SET_FIELD(tmp, SH_MEM_CONFIG, RETRY_DISABLE,
|
||||
!!amdgpu_noretry);
|
||||
WREG32_SOC15_RLC(GC, 0, mmSH_MEM_CONFIG, tmp);
|
||||
WREG32_SOC15_RLC(GC, 0, mmSH_MEM_BASES, 0);
|
||||
} else {
|
||||
tmp = REG_SET_FIELD(0, SH_MEM_CONFIG, ALIGNMENT_MODE,
|
||||
SH_MEM_ALIGNMENT_MODE_UNALIGNED);
|
||||
tmp = REG_SET_FIELD(tmp, SH_MEM_CONFIG, RETRY_DISABLE,
|
||||
!!amdgpu_noretry);
|
||||
WREG32_SOC15_RLC(GC, 0, mmSH_MEM_CONFIG, tmp);
|
||||
tmp = REG_SET_FIELD(0, SH_MEM_BASES, PRIVATE_BASE,
|
||||
(adev->gmc.private_aperture_start >> 48));
|
||||
|
@ -236,7 +236,8 @@ static void gfxhub_v1_0_setup_vmid_config(struct amdgpu_device *adev)
|
||||
block_size);
|
||||
/* Send no-retry XNACK on fault to suppress VM fault storm. */
|
||||
tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 1);
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT,
|
||||
!amdgpu_noretry);
|
||||
WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_CNTL, i, tmp);
|
||||
WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_PAGE_TABLE_START_ADDR_LO32, i*2, 0);
|
||||
WREG32_SOC15_OFFSET(GC, 0, mmVM_CONTEXT1_PAGE_TABLE_START_ADDR_HI32, i*2, 0);
|
||||
|
@ -215,7 +215,8 @@ static void gfxhub_v2_0_setup_vmid_config(struct amdgpu_device *adev)
|
||||
adev->vm_manager.block_size - 9);
|
||||
/* Send no-retry XNACK on fault to suppress VM fault storm. */
|
||||
tmp = REG_SET_FIELD(tmp, GCVM_CONTEXT1_CNTL,
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 0);
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT,
|
||||
!amdgpu_noretry);
|
||||
WREG32_SOC15_OFFSET(GC, 0, mmGCVM_CONTEXT1_CNTL, i, tmp);
|
||||
WREG32_SOC15_OFFSET(GC, 0, mmGCVM_CONTEXT1_PAGE_TABLE_START_ADDR_LO32, i*2, 0);
|
||||
WREG32_SOC15_OFFSET(GC, 0, mmGCVM_CONTEXT1_PAGE_TABLE_START_ADDR_HI32, i*2, 0);
|
||||
|
@ -265,7 +265,8 @@ static void mmhub_v1_0_setup_vmid_config(struct amdgpu_device *adev)
|
||||
block_size);
|
||||
/* Send no-retry XNACK on fault to suppress VM fault storm. */
|
||||
tmp = REG_SET_FIELD(tmp, VM_CONTEXT1_CNTL,
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 1);
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT,
|
||||
!amdgpu_noretry);
|
||||
WREG32_SOC15_OFFSET(MMHUB, 0, mmVM_CONTEXT1_CNTL, i, tmp);
|
||||
WREG32_SOC15_OFFSET(MMHUB, 0, mmVM_CONTEXT1_PAGE_TABLE_START_ADDR_LO32, i*2, 0);
|
||||
WREG32_SOC15_OFFSET(MMHUB, 0, mmVM_CONTEXT1_PAGE_TABLE_START_ADDR_HI32, i*2, 0);
|
||||
|
@ -205,7 +205,8 @@ static void mmhub_v2_0_setup_vmid_config(struct amdgpu_device *adev)
|
||||
adev->vm_manager.block_size - 9);
|
||||
/* Send no-retry XNACK on fault to suppress VM fault storm. */
|
||||
tmp = REG_SET_FIELD(tmp, MMVM_CONTEXT1_CNTL,
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT, 0);
|
||||
RETRY_PERMISSION_OR_INVALID_PAGE_FAULT,
|
||||
!amdgpu_noretry);
|
||||
WREG32_SOC15_OFFSET(MMHUB, 0, mmMMVM_CONTEXT1_CNTL, i, tmp);
|
||||
WREG32_SOC15_OFFSET(MMHUB, 0, mmMMVM_CONTEXT1_PAGE_TABLE_START_ADDR_LO32, i*2, 0);
|
||||
WREG32_SOC15_OFFSET(MMHUB, 0, mmMMVM_CONTEXT1_PAGE_TABLE_START_ADDR_HI32, i*2, 0);
|
||||
|
@ -392,8 +392,6 @@ int nv_set_ip_blocks(struct amdgpu_device *adev)
|
||||
#if defined(CONFIG_DRM_AMD_DC)
|
||||
else if (amdgpu_device_has_dc_support(adev))
|
||||
amdgpu_device_ip_block_add(adev, &dm_ip_block);
|
||||
#else
|
||||
# warning "Enable CONFIG_DRM_AMD_DC for display support on navi."
|
||||
#endif
|
||||
amdgpu_device_ip_block_add(adev, &gfx_v10_0_ip_block);
|
||||
amdgpu_device_ip_block_add(adev, &sdma_v5_0_ip_block);
|
||||
|
@ -103,6 +103,9 @@ static int psp_v11_0_init_microcode(struct psp_context *psp)
|
||||
adev->psp.toc_bin_size = le32_to_cpu(sos_hdr_v1_1->toc_size_bytes);
|
||||
adev->psp.toc_start_addr = (uint8_t *)adev->psp.sys_start_addr +
|
||||
le32_to_cpu(sos_hdr_v1_1->toc_offset_bytes);
|
||||
adev->psp.kdb_bin_size = le32_to_cpu(sos_hdr_v1_1->kdb_size_bytes);
|
||||
adev->psp.kdb_start_addr = (uint8_t *)adev->psp.sys_start_addr +
|
||||
le32_to_cpu(sos_hdr_v1_1->kdb_offset_bytes);
|
||||
}
|
||||
break;
|
||||
default:
|
||||
@ -177,6 +180,48 @@ out:
|
||||
return err;
|
||||
}
|
||||
|
||||
static int psp_v11_0_bootloader_load_kdb(struct psp_context *psp)
|
||||
{
|
||||
int ret;
|
||||
uint32_t psp_gfxdrv_command_reg = 0;
|
||||
struct amdgpu_device *adev = psp->adev;
|
||||
uint32_t sol_reg;
|
||||
|
||||
/* Check tOS sign of life register to confirm sys driver and sOS
|
||||
* are already been loaded.
|
||||
*/
|
||||
sol_reg = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_81);
|
||||
if (sol_reg) {
|
||||
psp->sos_fw_version = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_58);
|
||||
dev_info(adev->dev, "sos fw version = 0x%x.\n", psp->sos_fw_version);
|
||||
return 0;
|
||||
}
|
||||
|
||||
/* Wait for bootloader to signify that is ready having bit 31 of C2PMSG_35 set to 1 */
|
||||
ret = psp_wait_for(psp, SOC15_REG_OFFSET(MP0, 0, mmMP0_SMN_C2PMSG_35),
|
||||
0x80000000, 0x80000000, false);
|
||||
if (ret)
|
||||
return ret;
|
||||
|
||||
memset(psp->fw_pri_buf, 0, PSP_1_MEG);
|
||||
|
||||
/* Copy PSP KDB binary to memory */
|
||||
memcpy(psp->fw_pri_buf, psp->kdb_start_addr, psp->kdb_bin_size);
|
||||
|
||||
/* Provide the sys driver to bootloader */
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_36,
|
||||
(uint32_t)(psp->fw_pri_mc_addr >> 20));
|
||||
psp_gfxdrv_command_reg = PSP_BL__LOAD_KEY_DATABASE;
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_35,
|
||||
psp_gfxdrv_command_reg);
|
||||
|
||||
/* Wait for bootloader to signify that is ready having bit 31 of C2PMSG_35 set to 1*/
|
||||
ret = psp_wait_for(psp, SOC15_REG_OFFSET(MP0, 0, mmMP0_SMN_C2PMSG_35),
|
||||
0x80000000, 0x80000000, false);
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
static int psp_v11_0_bootloader_load_sysdrv(struct psp_context *psp)
|
||||
{
|
||||
int ret;
|
||||
@ -190,7 +235,7 @@ static int psp_v11_0_bootloader_load_sysdrv(struct psp_context *psp)
|
||||
sol_reg = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_81);
|
||||
if (sol_reg) {
|
||||
psp->sos_fw_version = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_58);
|
||||
printk("sos fw version = 0x%x.\n", psp->sos_fw_version);
|
||||
dev_info(adev->dev, "sos fw version = 0x%x.\n", psp->sos_fw_version);
|
||||
return 0;
|
||||
}
|
||||
|
||||
@ -208,7 +253,7 @@ static int psp_v11_0_bootloader_load_sysdrv(struct psp_context *psp)
|
||||
/* Provide the sys driver to bootloader */
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_36,
|
||||
(uint32_t)(psp->fw_pri_mc_addr >> 20));
|
||||
psp_gfxdrv_command_reg = 1 << 16;
|
||||
psp_gfxdrv_command_reg = PSP_BL__LOAD_SYSDRV;
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_35,
|
||||
psp_gfxdrv_command_reg);
|
||||
|
||||
@ -249,7 +294,7 @@ static int psp_v11_0_bootloader_load_sos(struct psp_context *psp)
|
||||
/* Provide the PSP secure OS to bootloader */
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_36,
|
||||
(uint32_t)(psp->fw_pri_mc_addr >> 20));
|
||||
psp_gfxdrv_command_reg = 2 << 16;
|
||||
psp_gfxdrv_command_reg = PSP_BL__LOAD_SOSDRV;
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_35,
|
||||
psp_gfxdrv_command_reg);
|
||||
|
||||
@ -822,6 +867,7 @@ static int psp_v11_0_rlc_autoload_start(struct psp_context *psp)
|
||||
|
||||
static const struct psp_funcs psp_v11_0_funcs = {
|
||||
.init_microcode = psp_v11_0_init_microcode,
|
||||
.bootloader_load_kdb = psp_v11_0_bootloader_load_kdb,
|
||||
.bootloader_load_sysdrv = psp_v11_0_bootloader_load_sysdrv,
|
||||
.bootloader_load_sos = psp_v11_0_bootloader_load_sos,
|
||||
.ring_init = psp_v11_0_ring_init,
|
||||
|
@ -155,7 +155,7 @@ static int psp_v3_1_bootloader_load_sysdrv(struct psp_context *psp)
|
||||
/* Provide the sys driver to bootloader */
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_36,
|
||||
(uint32_t)(psp->fw_pri_mc_addr >> 20));
|
||||
psp_gfxdrv_command_reg = 1 << 16;
|
||||
psp_gfxdrv_command_reg = PSP_BL__LOAD_SYSDRV;
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_35,
|
||||
psp_gfxdrv_command_reg);
|
||||
|
||||
@ -218,7 +218,7 @@ static int psp_v3_1_bootloader_load_sos(struct psp_context *psp)
|
||||
/* Provide the PSP secure OS to bootloader */
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_36,
|
||||
(uint32_t)(psp->fw_pri_mc_addr >> 20));
|
||||
psp_gfxdrv_command_reg = 2 << 16;
|
||||
psp_gfxdrv_command_reg = PSP_BL__LOAD_SOSDRV;
|
||||
WREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_35,
|
||||
psp_gfxdrv_command_reg);
|
||||
|
||||
|
@ -649,8 +649,6 @@ int soc15_set_ip_blocks(struct amdgpu_device *adev)
|
||||
#if defined(CONFIG_DRM_AMD_DC)
|
||||
else if (amdgpu_device_has_dc_support(adev))
|
||||
amdgpu_device_ip_block_add(adev, &dm_ip_block);
|
||||
#else
|
||||
# warning "Enable CONFIG_DRM_AMD_DC for display support on SOC15."
|
||||
#endif
|
||||
if (!(adev->asic_type == CHIP_VEGA20 && amdgpu_sriov_vf(adev))) {
|
||||
amdgpu_device_ip_block_add(adev, &uvd_v7_0_ip_block);
|
||||
@ -671,8 +669,6 @@ int soc15_set_ip_blocks(struct amdgpu_device *adev)
|
||||
#if defined(CONFIG_DRM_AMD_DC)
|
||||
else if (amdgpu_device_has_dc_support(adev))
|
||||
amdgpu_device_ip_block_add(adev, &dm_ip_block);
|
||||
#else
|
||||
# warning "Enable CONFIG_DRM_AMD_DC for display support on SOC15."
|
||||
#endif
|
||||
amdgpu_device_ip_block_add(adev, &vcn_v1_0_ip_block);
|
||||
break;
|
||||
@ -717,9 +713,15 @@ static void soc15_get_pcie_usage(struct amdgpu_device *adev, uint64_t *count0,
|
||||
return;
|
||||
|
||||
/* Set the 2 events that we wish to watch, defined above */
|
||||
/* Reg 40 is # received msgs, Reg 104 is # of posted requests sent */
|
||||
/* Reg 40 is # received msgs */
|
||||
perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK, EVENT0_SEL, 40);
|
||||
perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK, EVENT1_SEL, 104);
|
||||
/* Pre-VG20, Reg 104 is # of posted requests sent. On VG20 it's 108 */
|
||||
if (adev->asic_type == CHIP_VEGA20)
|
||||
perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK,
|
||||
EVENT1_SEL, 108);
|
||||
else
|
||||
perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK,
|
||||
EVENT1_SEL, 104);
|
||||
|
||||
/* Write to enable desired perf counters */
|
||||
WREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK, perfctr);
|
||||
|
@ -59,7 +59,6 @@
|
||||
|
||||
#include "vid.h"
|
||||
#include "vi.h"
|
||||
#include "vi_dpm.h"
|
||||
#include "gmc_v8_0.h"
|
||||
#include "gmc_v7_0.h"
|
||||
#include "gfx_v8_0.h"
|
||||
|
@ -1,32 +0,0 @@
|
||||
/*
|
||||
* Copyright 2014 Advanced Micro Devices, Inc.
|
||||
*
|
||||
* Permission is hereby granted, free of charge, to any person obtaining a
|
||||
* copy of this software and associated documentation files (the "Software"),
|
||||
* to deal in the Software without restriction, including without limitation
|
||||
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
||||
* and/or sell copies of the Software, and to permit persons to whom the
|
||||
* Software is furnished to do so, subject to the following conditions:
|
||||
*
|
||||
* The above copyright notice and this permission notice shall be included in
|
||||
* all copies or substantial portions of the Software.
|
||||
*
|
||||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
||||
* THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
||||
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
||||
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
||||
* OTHER DEALINGS IN THE SOFTWARE.
|
||||
*
|
||||
*/
|
||||
|
||||
#ifndef __VI_DPM_H__
|
||||
#define __VI_DPM_H__
|
||||
|
||||
extern const struct amd_ip_funcs cz_dpm_ip_funcs;
|
||||
int cz_smu_init(struct amdgpu_device *adev);
|
||||
int cz_smu_start(struct amdgpu_device *adev);
|
||||
int cz_smu_fini(struct amdgpu_device *adev);
|
||||
|
||||
#endif
|
@ -1157,12 +1157,7 @@ static int create_queue_cpsch(struct device_queue_manager *dqm, struct queue *q,
|
||||
|
||||
mqd_mgr = dqm->mqd_mgrs[get_mqd_type_from_queue_type(
|
||||
q->properties.type)];
|
||||
/*
|
||||
* Eviction state logic: mark all queues as evicted, even ones
|
||||
* not currently active. Restoring inactive queues later only
|
||||
* updates the is_evicted flag but is a no-op otherwise.
|
||||
*/
|
||||
q->properties.is_evicted = !!qpd->evicted;
|
||||
|
||||
if (q->properties.type == KFD_QUEUE_TYPE_SDMA ||
|
||||
q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI)
|
||||
dqm->asic_ops.init_sdma_vm(dqm, q, qpd);
|
||||
@ -1173,9 +1168,16 @@ static int create_queue_cpsch(struct device_queue_manager *dqm, struct queue *q,
|
||||
retval = -ENOMEM;
|
||||
goto out_deallocate_doorbell;
|
||||
}
|
||||
|
||||
dqm_lock(dqm);
|
||||
/*
|
||||
* Eviction state logic: mark all queues as evicted, even ones
|
||||
* not currently active. Restoring inactive queues later only
|
||||
* updates the is_evicted flag but is a no-op otherwise.
|
||||
*/
|
||||
q->properties.is_evicted = !!qpd->evicted;
|
||||
mqd_mgr->init_mqd(mqd_mgr, &q->mqd, q->mqd_mem_obj,
|
||||
&q->gart_mqd_addr, &q->properties);
|
||||
dqm_lock(dqm);
|
||||
|
||||
list_add(&q->list, &qpd->queues_list);
|
||||
qpd->queue_count++;
|
||||
|
@ -61,7 +61,7 @@ static int update_qpd_v9(struct device_queue_manager *dqm,
|
||||
qpd->sh_mem_config =
|
||||
SH_MEM_ALIGNMENT_MODE_UNALIGNED <<
|
||||
SH_MEM_CONFIG__ALIGNMENT_MODE__SHIFT;
|
||||
if (noretry &&
|
||||
if (amdgpu_noretry &&
|
||||
!dqm->dev->device_info->needs_iommu_device)
|
||||
qpd->sh_mem_config |=
|
||||
1 << SH_MEM_CONFIG__RETRY_DISABLE__SHIFT;
|
||||
|
@ -157,7 +157,7 @@ extern int ignore_crat;
|
||||
/*
|
||||
* Set sh_mem_config.retry_disable on Vega10
|
||||
*/
|
||||
extern int noretry;
|
||||
extern int amdgpu_noretry;
|
||||
|
||||
/*
|
||||
* Halt if HWS hang is detected
|
||||
|
@ -150,6 +150,9 @@ void pqm_uninit(struct process_queue_manager *pqm)
|
||||
struct process_queue_node *pqn, *next;
|
||||
|
||||
list_for_each_entry_safe(pqn, next, &pqm->queues, process_queue_list) {
|
||||
if (pqn->q && pqn->q->gws)
|
||||
amdgpu_amdkfd_remove_gws_from_process(pqm->process->kgd_process_info,
|
||||
pqn->q->gws);
|
||||
uninit_queue(pqn->q);
|
||||
list_del(&pqn->process_queue_list);
|
||||
kfree(pqn);
|
||||
|
@ -5,6 +5,7 @@ menu "Display Engine Configuration"
|
||||
config DRM_AMD_DC
|
||||
bool "AMD DC - Enable new display engine"
|
||||
default y
|
||||
select SND_HDA_COMPONENT if SND_HDA_CORE
|
||||
select DRM_AMD_DC_DCN1_0 if X86 && !(KCOV_INSTRUMENT_ALL && KCOV_ENABLE_COMPARISONS)
|
||||
help
|
||||
Choose this option if you want to use the new display engine
|
||||
|
@ -56,6 +56,7 @@
|
||||
#include <linux/pm_runtime.h>
|
||||
#include <linux/pci.h>
|
||||
#include <linux/firmware.h>
|
||||
#include <linux/component.h>
|
||||
|
||||
#include <drm/drm_atomic.h>
|
||||
#include <drm/drm_atomic_uapi.h>
|
||||
@ -65,6 +66,7 @@
|
||||
#include <drm/drm_fourcc.h>
|
||||
#include <drm/drm_edid.h>
|
||||
#include <drm/drm_vblank.h>
|
||||
#include <drm/drm_audio_component.h>
|
||||
|
||||
#if defined(CONFIG_DRM_AMD_DC_DCN1_0)
|
||||
#include "ivsrcid/dcn/irqsrcs_dcn_1_0.h"
|
||||
@ -508,6 +510,139 @@ static void amdgpu_dm_fbc_init(struct drm_connector *connector)
|
||||
|
||||
}
|
||||
|
||||
static int amdgpu_dm_audio_component_get_eld(struct device *kdev, int port,
|
||||
int pipe, bool *enabled,
|
||||
unsigned char *buf, int max_bytes)
|
||||
{
|
||||
struct drm_device *dev = dev_get_drvdata(kdev);
|
||||
struct amdgpu_device *adev = dev->dev_private;
|
||||
struct drm_connector *connector;
|
||||
struct drm_connector_list_iter conn_iter;
|
||||
struct amdgpu_dm_connector *aconnector;
|
||||
int ret = 0;
|
||||
|
||||
*enabled = false;
|
||||
|
||||
mutex_lock(&adev->dm.audio_lock);
|
||||
|
||||
drm_connector_list_iter_begin(dev, &conn_iter);
|
||||
drm_for_each_connector_iter(connector, &conn_iter) {
|
||||
aconnector = to_amdgpu_dm_connector(connector);
|
||||
if (aconnector->audio_inst != port)
|
||||
continue;
|
||||
|
||||
*enabled = true;
|
||||
ret = drm_eld_size(connector->eld);
|
||||
memcpy(buf, connector->eld, min(max_bytes, ret));
|
||||
|
||||
break;
|
||||
}
|
||||
drm_connector_list_iter_end(&conn_iter);
|
||||
|
||||
mutex_unlock(&adev->dm.audio_lock);
|
||||
|
||||
DRM_DEBUG_KMS("Get ELD : idx=%d ret=%d en=%d\n", port, ret, *enabled);
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
static const struct drm_audio_component_ops amdgpu_dm_audio_component_ops = {
|
||||
.get_eld = amdgpu_dm_audio_component_get_eld,
|
||||
};
|
||||
|
||||
static int amdgpu_dm_audio_component_bind(struct device *kdev,
|
||||
struct device *hda_kdev, void *data)
|
||||
{
|
||||
struct drm_device *dev = dev_get_drvdata(kdev);
|
||||
struct amdgpu_device *adev = dev->dev_private;
|
||||
struct drm_audio_component *acomp = data;
|
||||
|
||||
acomp->ops = &amdgpu_dm_audio_component_ops;
|
||||
acomp->dev = kdev;
|
||||
adev->dm.audio_component = acomp;
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
static void amdgpu_dm_audio_component_unbind(struct device *kdev,
|
||||
struct device *hda_kdev, void *data)
|
||||
{
|
||||
struct drm_device *dev = dev_get_drvdata(kdev);
|
||||
struct amdgpu_device *adev = dev->dev_private;
|
||||
struct drm_audio_component *acomp = data;
|
||||
|
||||
acomp->ops = NULL;
|
||||
acomp->dev = NULL;
|
||||
adev->dm.audio_component = NULL;
|
||||
}
|
||||
|
||||
static const struct component_ops amdgpu_dm_audio_component_bind_ops = {
|
||||
.bind = amdgpu_dm_audio_component_bind,
|
||||
.unbind = amdgpu_dm_audio_component_unbind,
|
||||
};
|
||||
|
||||
static int amdgpu_dm_audio_init(struct amdgpu_device *adev)
|
||||
{
|
||||
int i, ret;
|
||||
|
||||
if (!amdgpu_audio)
|
||||
return 0;
|
||||
|
||||
adev->mode_info.audio.enabled = true;
|
||||
|
||||
adev->mode_info.audio.num_pins = adev->dm.dc->res_pool->audio_count;
|
||||
|
||||
for (i = 0; i < adev->mode_info.audio.num_pins; i++) {
|
||||
adev->mode_info.audio.pin[i].channels = -1;
|
||||
adev->mode_info.audio.pin[i].rate = -1;
|
||||
adev->mode_info.audio.pin[i].bits_per_sample = -1;
|
||||
adev->mode_info.audio.pin[i].status_bits = 0;
|
||||
adev->mode_info.audio.pin[i].category_code = 0;
|
||||
adev->mode_info.audio.pin[i].connected = false;
|
||||
adev->mode_info.audio.pin[i].id =
|
||||
adev->dm.dc->res_pool->audios[i]->inst;
|
||||
adev->mode_info.audio.pin[i].offset = 0;
|
||||
}
|
||||
|
||||
ret = component_add(adev->dev, &amdgpu_dm_audio_component_bind_ops);
|
||||
if (ret < 0)
|
||||
return ret;
|
||||
|
||||
adev->dm.audio_registered = true;
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
static void amdgpu_dm_audio_fini(struct amdgpu_device *adev)
|
||||
{
|
||||
if (!amdgpu_audio)
|
||||
return;
|
||||
|
||||
if (!adev->mode_info.audio.enabled)
|
||||
return;
|
||||
|
||||
if (adev->dm.audio_registered) {
|
||||
component_del(adev->dev, &amdgpu_dm_audio_component_bind_ops);
|
||||
adev->dm.audio_registered = false;
|
||||
}
|
||||
|
||||
/* TODO: Disable audio? */
|
||||
|
||||
adev->mode_info.audio.enabled = false;
|
||||
}
|
||||
|
||||
void amdgpu_dm_audio_eld_notify(struct amdgpu_device *adev, int pin)
|
||||
{
|
||||
struct drm_audio_component *acomp = adev->dm.audio_component;
|
||||
|
||||
if (acomp && acomp->audio_ops && acomp->audio_ops->pin_eld_notify) {
|
||||
DRM_DEBUG_KMS("Notify ELD: %d\n", pin);
|
||||
|
||||
acomp->audio_ops->pin_eld_notify(acomp->audio_ops->audio_ptr,
|
||||
pin, -1);
|
||||
}
|
||||
}
|
||||
|
||||
static int amdgpu_dm_init(struct amdgpu_device *adev)
|
||||
{
|
||||
struct dc_init_data init_data;
|
||||
@ -518,6 +653,7 @@ static int amdgpu_dm_init(struct amdgpu_device *adev)
|
||||
memset(&init_data, 0, sizeof(init_data));
|
||||
|
||||
mutex_init(&adev->dm.dc_lock);
|
||||
mutex_init(&adev->dm.audio_lock);
|
||||
|
||||
if(amdgpu_dm_irq_init(adev)) {
|
||||
DRM_ERROR("amdgpu: failed to initialize DM IRQ support.\n");
|
||||
@ -621,6 +757,8 @@ error:
|
||||
|
||||
static void amdgpu_dm_fini(struct amdgpu_device *adev)
|
||||
{
|
||||
amdgpu_dm_audio_fini(adev);
|
||||
|
||||
amdgpu_dm_destroy_drm_device(&adev->dm);
|
||||
|
||||
/* DC Destroy TODO: Replace destroy DAL */
|
||||
@ -641,6 +779,7 @@ static void amdgpu_dm_fini(struct amdgpu_device *adev)
|
||||
adev->dm.freesync_module = NULL;
|
||||
}
|
||||
|
||||
mutex_destroy(&adev->dm.audio_lock);
|
||||
mutex_destroy(&adev->dm.dc_lock);
|
||||
|
||||
return;
|
||||
@ -1888,6 +2027,10 @@ static int amdgpu_dm_mode_config_init(struct amdgpu_device *adev)
|
||||
if (r)
|
||||
return r;
|
||||
|
||||
r = amdgpu_dm_audio_init(adev);
|
||||
if (r)
|
||||
return r;
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
@ -4834,6 +4977,7 @@ void amdgpu_dm_connector_init_helper(struct amdgpu_display_manager *dm,
|
||||
aconnector->base.stereo_allowed = false;
|
||||
aconnector->base.dpms = DRM_MODE_DPMS_OFF;
|
||||
aconnector->hpd.hpd = AMDGPU_HPD_NONE; /* not used */
|
||||
aconnector->audio_inst = -1;
|
||||
mutex_init(&aconnector->hpd_lock);
|
||||
|
||||
/*
|
||||
@ -5728,6 +5872,81 @@ cleanup:
|
||||
kfree(bundle);
|
||||
}
|
||||
|
||||
static void amdgpu_dm_commit_audio(struct drm_device *dev,
|
||||
struct drm_atomic_state *state)
|
||||
{
|
||||
struct amdgpu_device *adev = dev->dev_private;
|
||||
struct amdgpu_dm_connector *aconnector;
|
||||
struct drm_connector *connector;
|
||||
struct drm_connector_state *old_con_state, *new_con_state;
|
||||
struct drm_crtc_state *new_crtc_state;
|
||||
struct dm_crtc_state *new_dm_crtc_state;
|
||||
const struct dc_stream_status *status;
|
||||
int i, inst;
|
||||
|
||||
/* Notify device removals. */
|
||||
for_each_oldnew_connector_in_state(state, connector, old_con_state, new_con_state, i) {
|
||||
if (old_con_state->crtc != new_con_state->crtc) {
|
||||
/* CRTC changes require notification. */
|
||||
goto notify;
|
||||
}
|
||||
|
||||
if (!new_con_state->crtc)
|
||||
continue;
|
||||
|
||||
new_crtc_state = drm_atomic_get_new_crtc_state(
|
||||
state, new_con_state->crtc);
|
||||
|
||||
if (!new_crtc_state)
|
||||
continue;
|
||||
|
||||
if (!drm_atomic_crtc_needs_modeset(new_crtc_state))
|
||||
continue;
|
||||
|
||||
notify:
|
||||
aconnector = to_amdgpu_dm_connector(connector);
|
||||
|
||||
mutex_lock(&adev->dm.audio_lock);
|
||||
inst = aconnector->audio_inst;
|
||||
aconnector->audio_inst = -1;
|
||||
mutex_unlock(&adev->dm.audio_lock);
|
||||
|
||||
amdgpu_dm_audio_eld_notify(adev, inst);
|
||||
}
|
||||
|
||||
/* Notify audio device additions. */
|
||||
for_each_new_connector_in_state(state, connector, new_con_state, i) {
|
||||
if (!new_con_state->crtc)
|
||||
continue;
|
||||
|
||||
new_crtc_state = drm_atomic_get_new_crtc_state(
|
||||
state, new_con_state->crtc);
|
||||
|
||||
if (!new_crtc_state)
|
||||
continue;
|
||||
|
||||
if (!drm_atomic_crtc_needs_modeset(new_crtc_state))
|
||||
continue;
|
||||
|
||||
new_dm_crtc_state = to_dm_crtc_state(new_crtc_state);
|
||||
if (!new_dm_crtc_state->stream)
|
||||
continue;
|
||||
|
||||
status = dc_stream_get_status(new_dm_crtc_state->stream);
|
||||
if (!status)
|
||||
continue;
|
||||
|
||||
aconnector = to_amdgpu_dm_connector(connector);
|
||||
|
||||
mutex_lock(&adev->dm.audio_lock);
|
||||
inst = status->audio_inst;
|
||||
aconnector->audio_inst = inst;
|
||||
mutex_unlock(&adev->dm.audio_lock);
|
||||
|
||||
amdgpu_dm_audio_eld_notify(adev, inst);
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
* Enable interrupts on CRTCs that are newly active, undergone
|
||||
* a modeset, or have active planes again.
|
||||
@ -6106,6 +6325,9 @@ static void amdgpu_dm_atomic_commit_tail(struct drm_atomic_state *state)
|
||||
/* Enable interrupts for CRTCs going from 0 to n active planes. */
|
||||
amdgpu_dm_enable_crtc_interrupts(dev, state, false);
|
||||
|
||||
/* Update audio instances for each connector. */
|
||||
amdgpu_dm_commit_audio(dev, state);
|
||||
|
||||
/*
|
||||
* send vblank event on all events not handled in flip and
|
||||
* mark consumed event for drm_atomic_helper_commit_hw_done
|
||||
|
@ -143,6 +143,28 @@ struct amdgpu_display_manager {
|
||||
*/
|
||||
struct mutex dc_lock;
|
||||
|
||||
/**
|
||||
* @audio_lock:
|
||||
*
|
||||
* Guards access to audio instance changes.
|
||||
*/
|
||||
struct mutex audio_lock;
|
||||
|
||||
/**
|
||||
* @audio_component:
|
||||
*
|
||||
* Used to notify ELD changes to sound driver.
|
||||
*/
|
||||
struct drm_audio_component *audio_component;
|
||||
|
||||
/**
|
||||
* @audio_registered:
|
||||
*
|
||||
* True if the audio component has been registered
|
||||
* successfully, false otherwise.
|
||||
*/
|
||||
bool audio_registered;
|
||||
|
||||
/**
|
||||
* @irq_handler_list_low_tab:
|
||||
*
|
||||
@ -254,6 +276,9 @@ struct amdgpu_dm_connector {
|
||||
int max_vfreq ;
|
||||
int pixel_clock_mhz;
|
||||
|
||||
/* Audio instance - protected by audio_lock. */
|
||||
int audio_inst;
|
||||
|
||||
struct mutex hpd_lock;
|
||||
|
||||
bool fake_enable;
|
||||
|
@ -308,7 +308,8 @@ static void pp_to_dc_clock_levels_with_voltage(
|
||||
DC_DECODE_PP_CLOCK_TYPE(dc_clk_type));
|
||||
|
||||
for (i = 0; i < clk_level_info->num_levels; i++) {
|
||||
DRM_INFO("DM_PPLIB:\t %d in kHz\n", pp_clks->data[i].clocks_in_khz);
|
||||
DRM_INFO("DM_PPLIB:\t %d in kHz, %d in mV\n", pp_clks->data[i].clocks_in_khz,
|
||||
pp_clks->data[i].voltage_in_mv);
|
||||
clk_level_info->data[i].clocks_in_khz = pp_clks->data[i].clocks_in_khz;
|
||||
clk_level_info->data[i].voltage_in_mv = pp_clks->data[i].voltage_in_mv;
|
||||
}
|
||||
@ -910,11 +911,11 @@ void dm_pp_get_funcs(
|
||||
/* todo set_pme_wa_enable cause 4k@6ohz display not light up */
|
||||
funcs->nv_funcs.set_pme_wa_enable = NULL;
|
||||
/* todo debug waring message */
|
||||
funcs->nv_funcs.set_hard_min_uclk_by_freq = NULL;
|
||||
funcs->nv_funcs.set_hard_min_uclk_by_freq = pp_nv_set_hard_min_uclk_by_freq;
|
||||
/* todo compare data with window driver*/
|
||||
funcs->nv_funcs.get_maximum_sustainable_clocks = NULL;
|
||||
funcs->nv_funcs.get_maximum_sustainable_clocks = pp_nv_get_maximum_sustainable_clocks;
|
||||
/*todo compare data with window driver */
|
||||
funcs->nv_funcs.get_uclk_dpm_states = NULL;
|
||||
funcs->nv_funcs.get_uclk_dpm_states = pp_nv_get_uclk_dpm_states;
|
||||
break;
|
||||
#endif
|
||||
default:
|
||||
|
@ -175,32 +175,22 @@ struct resource_pool *dc_create_resource_pool(struct dc *dc,
|
||||
if (res_pool != NULL) {
|
||||
struct dc_firmware_info fw_info = { { 0 } };
|
||||
|
||||
if (dc->ctx->dc_bios->funcs->get_firmware_info(
|
||||
dc->ctx->dc_bios, &fw_info) == BP_RESULT_OK) {
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz = fw_info.pll_info.crystal_frequency;
|
||||
|
||||
if (IS_FPGA_MAXIMUS_DC(dc->ctx->dce_environment)) {
|
||||
// On FPGA these dividers are currently not configured by GDB
|
||||
res_pool->ref_clocks.dccg_ref_clock_inKhz = res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
res_pool->ref_clocks.dchub_ref_clock_inKhz = res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
} else if (res_pool->dccg && res_pool->hubbub) {
|
||||
// If DCCG reference frequency cannot be determined (usually means not set to xtalin) then this is a critical error
|
||||
// as this value must be known for DCHUB programming
|
||||
(res_pool->dccg->funcs->get_dccg_ref_freq)(res_pool->dccg,
|
||||
fw_info.pll_info.crystal_frequency,
|
||||
&res_pool->ref_clocks.dccg_ref_clock_inKhz);
|
||||
|
||||
// Similarly, if DCHUB reference frequency cannot be determined, then it is also a critical error
|
||||
(res_pool->hubbub->funcs->get_dchub_ref_freq)(res_pool->hubbub,
|
||||
res_pool->ref_clocks.dccg_ref_clock_inKhz,
|
||||
&res_pool->ref_clocks.dchub_ref_clock_inKhz);
|
||||
} else {
|
||||
// Not all ASICs have DCCG sw component
|
||||
res_pool->ref_clocks.dccg_ref_clock_inKhz = res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
res_pool->ref_clocks.dchub_ref_clock_inKhz = res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
}
|
||||
} else
|
||||
ASSERT_CRITICAL(false);
|
||||
if (dc->ctx->dc_bios->funcs->get_firmware_info(dc->ctx->dc_bios,
|
||||
&fw_info) == BP_RESULT_OK) {
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz =
|
||||
fw_info.pll_info.crystal_frequency;
|
||||
/* initialize with firmware data first, no all
|
||||
* ASIC have DCCG SW component. FPGA or
|
||||
* simulation need initialization of
|
||||
* dccg_ref_clock_inKhz, dchub_ref_clock_inKhz
|
||||
* with xtalin_clock_inKhz
|
||||
*/
|
||||
res_pool->ref_clocks.dccg_ref_clock_inKhz =
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
res_pool->ref_clocks.dchub_ref_clock_inKhz =
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
} else
|
||||
ASSERT_CRITICAL(false);
|
||||
}
|
||||
|
||||
return res_pool;
|
||||
@ -2011,6 +2001,9 @@ enum dc_status resource_map_pool_resources(
|
||||
if (context->streams[i] == stream) {
|
||||
context->stream_status[i].primary_otg_inst = pipe_ctx->stream_res.tg->inst;
|
||||
context->stream_status[i].stream_enc_inst = pipe_ctx->stream_res.stream_enc->id;
|
||||
context->stream_status[i].audio_inst =
|
||||
pipe_ctx->stream_res.audio ? pipe_ctx->stream_res.audio->inst : -1;
|
||||
|
||||
return DC_OK;
|
||||
}
|
||||
|
||||
|
@ -42,6 +42,7 @@ struct dc_stream_status {
|
||||
int primary_otg_inst;
|
||||
int stream_enc_inst;
|
||||
int plane_count;
|
||||
int audio_inst;
|
||||
struct timing_sync_info timing_sync_info;
|
||||
struct dc_plane_state *plane_states[MAX_SURFACE_NUM];
|
||||
};
|
||||
|
@ -10,7 +10,13 @@ ifdef CONFIG_DRM_AMD_DC_DSC_SUPPORT
|
||||
DCN20 += dcn20_dsc.o
|
||||
endif
|
||||
|
||||
CFLAGS_dcn20_resource.o := -mhard-float -msse -mpreferred-stack-boundary=4
|
||||
ifneq ($(call cc-option, -mpreferred-stack-boundary=4),)
|
||||
cc_stack_align := -mpreferred-stack-boundary=4
|
||||
else ifneq ($(call cc-option, -mstack-alignment=16),)
|
||||
cc_stack_align := -mstack-alignment=16
|
||||
endif
|
||||
|
||||
CFLAGS_dcn20_resource.o := -mhard-float -msse $(cc_stack_align)
|
||||
|
||||
AMD_DAL_DCN20 = $(addprefix $(AMDDALPATH)/dc/dcn20/,$(DCN20))
|
||||
|
||||
|
@ -523,6 +523,7 @@ static void dcn20_init_hw(struct dc *dc)
|
||||
struct dc_bios *dcb = dc->ctx->dc_bios;
|
||||
struct resource_pool *res_pool = dc->res_pool;
|
||||
struct dc_state *context = dc->current_state;
|
||||
struct dc_firmware_info fw_info = { { 0 } };
|
||||
|
||||
if (dc->clk_mgr && dc->clk_mgr->funcs->init_clocks)
|
||||
dc->clk_mgr->funcs->init_clocks(dc->clk_mgr);
|
||||
@ -546,6 +547,30 @@ static void dcn20_init_hw(struct dc *dc)
|
||||
} else {
|
||||
if (!dcb->funcs->is_accelerated_mode(dcb)) {
|
||||
bios_golden_init(dc);
|
||||
if (dc->ctx->dc_bios->funcs->get_firmware_info(
|
||||
dc->ctx->dc_bios, &fw_info) == BP_RESULT_OK) {
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz = fw_info.pll_info.crystal_frequency;
|
||||
|
||||
if (!IS_FPGA_MAXIMUS_DC(dc->ctx->dce_environment)) {
|
||||
if (res_pool->dccg && res_pool->hubbub) {
|
||||
|
||||
(res_pool->dccg->funcs->get_dccg_ref_freq)(res_pool->dccg,
|
||||
fw_info.pll_info.crystal_frequency,
|
||||
&res_pool->ref_clocks.dccg_ref_clock_inKhz);
|
||||
|
||||
(res_pool->hubbub->funcs->get_dchub_ref_freq)(res_pool->hubbub,
|
||||
res_pool->ref_clocks.dccg_ref_clock_inKhz,
|
||||
&res_pool->ref_clocks.dchub_ref_clock_inKhz);
|
||||
} else {
|
||||
// Not all ASICs have DCCG sw component
|
||||
res_pool->ref_clocks.dccg_ref_clock_inKhz =
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
res_pool->ref_clocks.dchub_ref_clock_inKhz =
|
||||
res_pool->ref_clocks.xtalin_clock_inKhz;
|
||||
}
|
||||
}
|
||||
} else
|
||||
ASSERT_CRITICAL(false);
|
||||
disable_vga(dc->hwseq);
|
||||
}
|
||||
|
||||
|
@ -2415,7 +2415,7 @@ struct pipe_ctx *dcn20_acquire_idle_pipe_for_layer(
|
||||
ASSERT(0);
|
||||
|
||||
if (!idle_pipe)
|
||||
return false;
|
||||
return NULL;
|
||||
|
||||
idle_pipe->stream = head_pipe->stream;
|
||||
idle_pipe->stream_res.tg = head_pipe->stream_res.tg;
|
||||
@ -2576,6 +2576,9 @@ static void cap_soc_clocks(
|
||||
&& max_clocks.uClockInKhz != 0)
|
||||
bb->clock_limits[i].dram_speed_mts = (max_clocks.uClockInKhz / 1000) * 16;
|
||||
|
||||
// HACK: Force every uclk to max for now to "disable" uclk switching.
|
||||
bb->clock_limits[i].dram_speed_mts = (max_clocks.uClockInKhz / 1000) * 16;
|
||||
|
||||
if ((bb->clock_limits[i].fabricclk_mhz > (max_clocks.fabricClockInKhz / 1000))
|
||||
&& max_clocks.fabricClockInKhz != 0)
|
||||
bb->clock_limits[i].fabricclk_mhz = (max_clocks.fabricClockInKhz / 1000);
|
||||
@ -2783,6 +2786,8 @@ static bool init_soc_bounding_box(struct dc *dc,
|
||||
le32_to_cpu(bb->vmm_page_size_bytes);
|
||||
dcn2_0_soc.dram_clock_change_latency_us =
|
||||
fixed16_to_double_to_cpu(bb->dram_clock_change_latency_us);
|
||||
// HACK!! Lower uclock latency switch time so we don't switch
|
||||
dcn2_0_soc.dram_clock_change_latency_us = 10;
|
||||
dcn2_0_soc.writeback_dram_clock_change_latency_us =
|
||||
fixed16_to_double_to_cpu(bb->writeback_dram_clock_change_latency_us);
|
||||
dcn2_0_soc.return_bus_width_bytes =
|
||||
@ -2824,6 +2829,7 @@ static bool init_soc_bounding_box(struct dc *dc,
|
||||
struct pp_smu_nv_clock_table max_clocks = {0};
|
||||
unsigned int uclk_states[8] = {0};
|
||||
unsigned int num_states = 0;
|
||||
int i;
|
||||
enum pp_smu_status status;
|
||||
bool clock_limits_available = false;
|
||||
bool uclk_states_available = false;
|
||||
@ -2845,6 +2851,10 @@ static bool init_soc_bounding_box(struct dc *dc,
|
||||
clock_limits_available = (status == PP_SMU_RESULT_OK);
|
||||
}
|
||||
|
||||
// HACK: Use the max uclk_states value for all elements.
|
||||
for (i = 0; i < num_states; i++)
|
||||
uclk_states[i] = uclk_states[num_states - 1];
|
||||
|
||||
if (clock_limits_available && uclk_states_available && num_states)
|
||||
update_bounding_box(dc, &dcn2_0_soc, &max_clocks, uclk_states, num_states);
|
||||
else if (clock_limits_available)
|
||||
|
@ -1,10 +1,18 @@
|
||||
#
|
||||
# Makefile for the 'dsc' sub-component of DAL.
|
||||
|
||||
CFLAGS_rc_calc.o := -mhard-float -msse -mpreferred-stack-boundary=4
|
||||
CFLAGS_rc_calc_dpi.o := -mhard-float -msse -mpreferred-stack-boundary=4
|
||||
CFLAGS_codec_main_amd.o := -mhard-float -msse -mpreferred-stack-boundary=4
|
||||
CFLAGS_dc_dsc.o := -mhard-float -msse -mpreferred-stack-boundary=4
|
||||
ifneq ($(call cc-option, -mpreferred-stack-boundary=4),)
|
||||
cc_stack_align := -mpreferred-stack-boundary=4
|
||||
else ifneq ($(call cc-option, -mstack-alignment=16),)
|
||||
cc_stack_align := -mstack-alignment=16
|
||||
endif
|
||||
|
||||
dsc_ccflags := -mhard-float -msse $(cc_stack_align)
|
||||
|
||||
CFLAGS_rc_calc.o := $(dsc_ccflags)
|
||||
CFLAGS_rc_calc_dpi.o := $(dsc_ccflags)
|
||||
CFLAGS_codec_main_amd.o := $(dsc_ccflags)
|
||||
CFLAGS_dc_dsc.o := $(dsc_ccflags)
|
||||
|
||||
DSC = dc_dsc.o rc_calc.o rc_calc_dpi.o
|
||||
|
||||
|
@ -26,7 +26,7 @@
|
||||
#include <drm/amd_asic_type.h>
|
||||
|
||||
|
||||
#define AMD_MAX_USEC_TIMEOUT 200000 /* 200 ms */
|
||||
#define AMD_MAX_USEC_TIMEOUT 1000000 /* 1000 ms */
|
||||
|
||||
/*
|
||||
* Chip flags
|
||||
|
@ -69,6 +69,9 @@ int smu_set_soft_freq_range(struct smu_context *smu, enum smu_clk_type clk_type,
|
||||
if (min <= 0 && max <= 0)
|
||||
return -EINVAL;
|
||||
|
||||
if (!smu_clk_dpm_is_enabled(smu, clk_type))
|
||||
return 0;
|
||||
|
||||
clk_id = smu_clk_get_index(smu, clk_type);
|
||||
if (clk_id < 0)
|
||||
return clk_id;
|
||||
@ -102,6 +105,9 @@ int smu_set_hard_freq_range(struct smu_context *smu, enum smu_clk_type clk_type,
|
||||
if (min <= 0 && max <= 0)
|
||||
return -EINVAL;
|
||||
|
||||
if (!smu_clk_dpm_is_enabled(smu, clk_type))
|
||||
return 0;
|
||||
|
||||
clk_id = smu_clk_get_index(smu, clk_type);
|
||||
if (clk_id < 0)
|
||||
return clk_id;
|
||||
@ -135,23 +141,8 @@ int smu_get_dpm_freq_range(struct smu_context *smu, enum smu_clk_type clk_type,
|
||||
if (!min && !max)
|
||||
return -EINVAL;
|
||||
|
||||
switch (clk_type) {
|
||||
case SMU_UCLK:
|
||||
if (!smu_feature_is_enabled(smu, SMU_FEATURE_DPM_UCLK_BIT)) {
|
||||
pr_warn("uclk dpm is not enabled\n");
|
||||
return 0;
|
||||
}
|
||||
break;
|
||||
case SMU_GFXCLK:
|
||||
case SMU_SCLK:
|
||||
if (!smu_feature_is_enabled(smu, SMU_FEATURE_DPM_GFXCLK_BIT)) {
|
||||
pr_warn("gfxclk dpm is not enabled\n");
|
||||
return 0;
|
||||
}
|
||||
break;
|
||||
default:
|
||||
break;
|
||||
}
|
||||
if (!smu_clk_dpm_is_enabled(smu, clk_type))
|
||||
return 0;
|
||||
|
||||
mutex_lock(&smu->mutex);
|
||||
clk_id = smu_clk_get_index(smu, clk_type);
|
||||
@ -194,6 +185,9 @@ int smu_get_dpm_freq_by_index(struct smu_context *smu, enum smu_clk_type clk_typ
|
||||
if (!value)
|
||||
return -EINVAL;
|
||||
|
||||
if (!smu_clk_dpm_is_enabled(smu, clk_type))
|
||||
return 0;
|
||||
|
||||
clk_id = smu_clk_get_index(smu, clk_type);
|
||||
if (clk_id < 0)
|
||||
return clk_id;
|
||||
@ -222,6 +216,35 @@ int smu_get_dpm_level_count(struct smu_context *smu, enum smu_clk_type clk_type,
|
||||
return smu_get_dpm_freq_by_index(smu, clk_type, 0xff, value);
|
||||
}
|
||||
|
||||
bool smu_clk_dpm_is_enabled(struct smu_context *smu, enum smu_clk_type clk_type)
|
||||
{
|
||||
enum smu_feature_mask feature_id = 0;
|
||||
|
||||
switch (clk_type) {
|
||||
case SMU_MCLK:
|
||||
case SMU_UCLK:
|
||||
feature_id = SMU_FEATURE_DPM_UCLK_BIT;
|
||||
break;
|
||||
case SMU_GFXCLK:
|
||||
case SMU_SCLK:
|
||||
feature_id = SMU_FEATURE_DPM_GFXCLK_BIT;
|
||||
break;
|
||||
case SMU_SOCCLK:
|
||||
feature_id = SMU_FEATURE_DPM_SOCCLK_BIT;
|
||||
break;
|
||||
default:
|
||||
return true;
|
||||
}
|
||||
|
||||
if(!smu_feature_is_enabled(smu, feature_id)) {
|
||||
pr_warn("smu %d clk dpm feature %d is not enabled\n", clk_type, feature_id);
|
||||
return false;
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
|
||||
int smu_dpm_set_power_gate(struct smu_context *smu, uint32_t block_type,
|
||||
bool gate)
|
||||
{
|
||||
@ -300,7 +323,7 @@ int smu_common_read_sensor(struct smu_context *smu, enum amd_pp_sensors sensor,
|
||||
return ret;
|
||||
}
|
||||
|
||||
int smu_update_table(struct smu_context *smu, enum smu_table_id table_index,
|
||||
int smu_update_table(struct smu_context *smu, enum smu_table_id table_index, int argument,
|
||||
void *table_data, bool drv2smu)
|
||||
{
|
||||
struct smu_table_context *smu_table = &smu->smu_table;
|
||||
@ -327,7 +350,7 @@ int smu_update_table(struct smu_context *smu, enum smu_table_id table_index,
|
||||
ret = smu_send_smc_msg_with_param(smu, drv2smu ?
|
||||
SMU_MSG_TransferTableDram2Smu :
|
||||
SMU_MSG_TransferTableSmu2Dram,
|
||||
table_id);
|
||||
table_id | ((argument & 0xFFFF) << 16));
|
||||
if (ret)
|
||||
return ret;
|
||||
|
||||
@ -1372,10 +1395,10 @@ int smu_adjust_power_state_dynamic(struct smu_context *smu,
|
||||
break;
|
||||
|
||||
case AMD_DPM_FORCED_LEVEL_AUTO:
|
||||
case AMD_DPM_FORCED_LEVEL_PROFILE_STANDARD:
|
||||
ret = smu_unforce_dpm_levels(smu);
|
||||
break;
|
||||
|
||||
case AMD_DPM_FORCED_LEVEL_PROFILE_STANDARD:
|
||||
case AMD_DPM_FORCED_LEVEL_PROFILE_MIN_SCLK:
|
||||
case AMD_DPM_FORCED_LEVEL_PROFILE_MIN_MCLK:
|
||||
case AMD_DPM_FORCED_LEVEL_PROFILE_PEAK:
|
||||
@ -1385,8 +1408,9 @@ int smu_adjust_power_state_dynamic(struct smu_context *smu,
|
||||
&soc_mask);
|
||||
if (ret)
|
||||
return ret;
|
||||
smu_force_clk_levels(smu, PP_SCLK, 1 << sclk_mask);
|
||||
smu_force_clk_levels(smu, PP_MCLK, 1 << mclk_mask);
|
||||
smu_force_clk_levels(smu, SMU_SCLK, 1 << sclk_mask);
|
||||
smu_force_clk_levels(smu, SMU_MCLK, 1 << mclk_mask);
|
||||
smu_force_clk_levels(smu, SMU_SOCCLK, 1 << soc_mask);
|
||||
break;
|
||||
|
||||
case AMD_DPM_FORCED_LEVEL_MANUAL:
|
||||
@ -1441,17 +1465,16 @@ int smu_handle_task(struct smu_context *smu,
|
||||
enum amd_dpm_forced_level smu_get_performance_level(struct smu_context *smu)
|
||||
{
|
||||
struct smu_dpm_context *smu_dpm_ctx = &(smu->smu_dpm);
|
||||
enum amd_dpm_forced_level level;
|
||||
|
||||
if (!smu_dpm_ctx->dpm_context)
|
||||
return -EINVAL;
|
||||
|
||||
mutex_lock(&(smu->mutex));
|
||||
if (smu_dpm_ctx->dpm_level != smu_dpm_ctx->saved_dpm_level) {
|
||||
smu_dpm_ctx->saved_dpm_level = smu_dpm_ctx->dpm_level;
|
||||
}
|
||||
level = smu_dpm_ctx->dpm_level;
|
||||
mutex_unlock(&(smu->mutex));
|
||||
|
||||
return smu_dpm_ctx->dpm_level;
|
||||
return level;
|
||||
}
|
||||
|
||||
int smu_force_performance_level(struct smu_context *smu, enum amd_dpm_forced_level level)
|
||||
|
@ -1067,8 +1067,6 @@ static int pp_tables_v1_0_initialize(struct pp_hwmgr *hwmgr)
|
||||
PP_ASSERT_WITH_CODE((NULL != hwmgr->pptable),
|
||||
"Failed to allocate hwmgr->pptable!", return -ENOMEM);
|
||||
|
||||
memset(hwmgr->pptable, 0x00, sizeof(struct phm_ppt_v1_information));
|
||||
|
||||
powerplay_table = get_powerplay_table(hwmgr);
|
||||
|
||||
PP_ASSERT_WITH_CODE((NULL != powerplay_table),
|
||||
|
@ -937,7 +937,7 @@ extern int smu_feature_is_supported(struct smu_context *smu,
|
||||
extern int smu_feature_set_supported(struct smu_context *smu,
|
||||
enum smu_feature_mask mask, bool enable);
|
||||
|
||||
int smu_update_table(struct smu_context *smu, uint32_t table_index,
|
||||
int smu_update_table(struct smu_context *smu, enum smu_table_id table_index, int argument,
|
||||
void *table_data, bool drv2smu);
|
||||
|
||||
bool is_support_sw_smu(struct amdgpu_device *adev);
|
||||
@ -973,5 +973,6 @@ int smu_set_hard_freq_range(struct smu_context *smu, enum smu_clk_type clk_type,
|
||||
enum amd_dpm_forced_level smu_get_performance_level(struct smu_context *smu);
|
||||
int smu_force_performance_level(struct smu_context *smu, enum amd_dpm_forced_level level);
|
||||
int smu_set_display_count(struct smu_context *smu, uint32_t count);
|
||||
bool smu_clk_dpm_is_enabled(struct smu_context *smu, enum smu_clk_type clk_type);
|
||||
|
||||
#endif
|
||||
|
@ -27,7 +27,7 @@
|
||||
// *** IMPORTANT ***
|
||||
// SMU TEAM: Always increment the interface version if
|
||||
// any structure is changed in this file
|
||||
#define SMU11_DRIVER_IF_VERSION 0x12
|
||||
#define SMU11_DRIVER_IF_VERSION 0x13
|
||||
|
||||
#define PPTABLE_V20_SMU_VERSION 3
|
||||
|
||||
@ -615,6 +615,7 @@ typedef struct {
|
||||
uint16_t UclkAverageLpfTau;
|
||||
uint16_t GfxActivityLpfTau;
|
||||
uint16_t UclkActivityLpfTau;
|
||||
uint16_t SocketPowerLpfTau;
|
||||
|
||||
|
||||
uint32_t MmHubPadding[8];
|
||||
@ -665,7 +666,8 @@ typedef struct {
|
||||
uint32_t ThrottlerStatus ;
|
||||
|
||||
uint8_t LinkDpmLevel;
|
||||
uint8_t Padding[3];
|
||||
uint16_t AverageSocketPower;
|
||||
uint8_t Padding;
|
||||
|
||||
|
||||
uint32_t MmHubPadding[7];
|
||||
|
@ -331,7 +331,10 @@ navi10_get_allowed_feature_mask(struct smu_context *smu,
|
||||
| FEATURE_MASK(FEATURE_DS_DCEFCLK_BIT)
|
||||
| FEATURE_MASK(FEATURE_FW_DSTATE_BIT)
|
||||
| FEATURE_MASK(FEATURE_BACO_BIT)
|
||||
| FEATURE_MASK(FEATURE_ACDC_BIT);
|
||||
| FEATURE_MASK(FEATURE_ACDC_BIT)
|
||||
| FEATURE_MASK(FEATURE_GFX_SS_BIT)
|
||||
| FEATURE_MASK(FEATURE_APCC_DFLL_BIT)
|
||||
| FEATURE_MASK(FEATURE_FW_CTF_BIT);
|
||||
|
||||
if (adev->pm.pp_feature & PP_MCLK_DPM_MASK)
|
||||
*(uint64_t *)feature_mask |= FEATURE_MASK(FEATURE_DPM_UCLK_BIT)
|
||||
@ -339,8 +342,7 @@ navi10_get_allowed_feature_mask(struct smu_context *smu,
|
||||
| FEATURE_MASK(FEATURE_MEM_MVDD_SCALING_BIT);
|
||||
|
||||
if (adev->pm.pp_feature & PP_GFXOFF_MASK) {
|
||||
*(uint64_t *)feature_mask |= FEATURE_MASK(FEATURE_GFX_SS_BIT)
|
||||
| FEATURE_MASK(FEATURE_GFXOFF_BIT);
|
||||
*(uint64_t *)feature_mask |= FEATURE_MASK(FEATURE_GFXOFF_BIT);
|
||||
/* TODO: remove it once fw fix the bug */
|
||||
*(uint64_t *)feature_mask &= ~FEATURE_MASK(FEATURE_FW_DSTATE_BIT);
|
||||
}
|
||||
@ -465,9 +467,6 @@ static int navi10_append_powerplay_table(struct smu_context *smu)
|
||||
smc_pptable->MvddRatio = smc_dpm_table->MvddRatio;
|
||||
|
||||
if (adev->pm.pp_feature & PP_GFXOFF_MASK) {
|
||||
*(uint64_t *)smc_pptable->FeaturesToRun |= FEATURE_MASK(FEATURE_GFX_SS_BIT)
|
||||
| FEATURE_MASK(FEATURE_GFXOFF_BIT);
|
||||
|
||||
/* TODO: remove it once SMU fw fix it */
|
||||
smc_pptable->DebugOverrides |= DPM_OVERRIDE_DISABLE_DFLL_PLL_SHUTDOWN;
|
||||
}
|
||||
@ -614,7 +613,7 @@ static int navi10_get_current_clk_freq_by_table(struct smu_context *smu,
|
||||
|
||||
memset(&metrics, 0, sizeof(metrics));
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, (void *)&metrics, false);
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, 0, (void *)&metrics, false);
|
||||
if (ret)
|
||||
return ret;
|
||||
|
||||
@ -709,7 +708,7 @@ static int navi10_force_clk_levels(struct smu_context *smu,
|
||||
static int navi10_populate_umd_state_clk(struct smu_context *smu)
|
||||
{
|
||||
int ret = 0;
|
||||
uint32_t min_sclk_freq = 0;
|
||||
uint32_t min_sclk_freq = 0, min_mclk_freq = 0;
|
||||
|
||||
ret = smu_get_dpm_freq_range(smu, SMU_SCLK, &min_sclk_freq, NULL);
|
||||
if (ret)
|
||||
@ -717,6 +716,12 @@ static int navi10_populate_umd_state_clk(struct smu_context *smu)
|
||||
|
||||
smu->pstate_sclk = min_sclk_freq * 100;
|
||||
|
||||
ret = smu_get_dpm_freq_range(smu, SMU_MCLK, &min_mclk_freq, NULL);
|
||||
if (ret)
|
||||
return ret;
|
||||
|
||||
smu->pstate_mclk = min_mclk_freq * 100;
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
@ -827,27 +832,20 @@ static int navi10_force_dpm_limit_value(struct smu_context *smu, bool highest)
|
||||
return ret;
|
||||
}
|
||||
|
||||
static int navi10_unforce_dpm_levels(struct smu_context *smu) {
|
||||
|
||||
static int navi10_unforce_dpm_levels(struct smu_context *smu)
|
||||
{
|
||||
int ret = 0, i = 0;
|
||||
uint32_t min_freq, max_freq;
|
||||
enum smu_clk_type clk_type;
|
||||
|
||||
struct clk_feature_map {
|
||||
enum smu_clk_type clk_type;
|
||||
uint32_t feature;
|
||||
} clk_feature_map[] = {
|
||||
{SMU_GFXCLK, SMU_FEATURE_DPM_GFXCLK_BIT},
|
||||
{SMU_MCLK, SMU_FEATURE_DPM_UCLK_BIT},
|
||||
{SMU_SOCCLK, SMU_FEATURE_DPM_SOCCLK_BIT},
|
||||
enum smu_clk_type clks[] = {
|
||||
SMU_GFXCLK,
|
||||
SMU_MCLK,
|
||||
SMU_SOCCLK,
|
||||
};
|
||||
|
||||
for (i = 0; i < ARRAY_SIZE(clk_feature_map); i++) {
|
||||
if (!smu_feature_is_enabled(smu, clk_feature_map[i].feature))
|
||||
continue;
|
||||
|
||||
clk_type = clk_feature_map[i].clk_type;
|
||||
|
||||
for (i = 0; i < ARRAY_SIZE(clks); i++) {
|
||||
clk_type = clks[i];
|
||||
ret = smu_get_dpm_freq_range(smu, clk_type, &min_freq, &max_freq);
|
||||
if (ret)
|
||||
return ret;
|
||||
@ -868,7 +866,7 @@ static int navi10_get_gpu_power(struct smu_context *smu, uint32_t *value)
|
||||
if (!value)
|
||||
return -EINVAL;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, (void *)&metrics,
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, 0, (void *)&metrics,
|
||||
false);
|
||||
if (ret)
|
||||
return ret;
|
||||
@ -890,7 +888,7 @@ static int navi10_get_current_activity_percent(struct smu_context *smu,
|
||||
|
||||
msleep(1);
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS,
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, 0,
|
||||
(void *)&metrics, false);
|
||||
if (ret)
|
||||
return ret;
|
||||
@ -931,7 +929,7 @@ static int navi10_get_fan_speed(struct smu_context *smu, uint16_t *value)
|
||||
|
||||
memset(&metrics, 0, sizeof(metrics));
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS,
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, 0,
|
||||
(void *)&metrics, false);
|
||||
if (ret)
|
||||
return ret;
|
||||
@ -997,7 +995,7 @@ static int navi10_get_power_profile_mode(struct smu_context *smu, char *buf)
|
||||
/* conv PP_SMC_POWER_PROFILE* to WORKLOAD_PPLIB_*_BIT */
|
||||
workload_type = smu_workload_get_type(smu, i);
|
||||
result = smu_update_table(smu,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF | workload_type << 16,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF, workload_type,
|
||||
(void *)(&activity_monitor), false);
|
||||
if (result) {
|
||||
pr_err("[%s] Failed to get activity monitor!", __func__);
|
||||
@ -1070,7 +1068,7 @@ static int navi10_set_power_profile_mode(struct smu_context *smu, long *input, u
|
||||
return -EINVAL;
|
||||
|
||||
ret = smu_update_table(smu,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF | WORKLOAD_PPLIB_CUSTOM_BIT << 16,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF, WORKLOAD_PPLIB_CUSTOM_BIT,
|
||||
(void *)(&activity_monitor), false);
|
||||
if (ret) {
|
||||
pr_err("[%s] Failed to get activity monitor!", __func__);
|
||||
@ -1114,7 +1112,7 @@ static int navi10_set_power_profile_mode(struct smu_context *smu, long *input, u
|
||||
}
|
||||
|
||||
ret = smu_update_table(smu,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF | WORKLOAD_PPLIB_CUSTOM_BIT << 16,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF, WORKLOAD_PPLIB_CUSTOM_BIT,
|
||||
(void *)(&activity_monitor), true);
|
||||
if (ret) {
|
||||
pr_err("[%s] Failed to set activity monitor!", __func__);
|
||||
@ -1157,14 +1155,14 @@ static int navi10_get_profiling_clk_mask(struct smu_context *smu,
|
||||
ret = smu_get_dpm_level_count(smu, SMU_MCLK, &level_count);
|
||||
if (ret)
|
||||
return ret;
|
||||
*sclk_mask = level_count - 1;
|
||||
*mclk_mask = level_count - 1;
|
||||
}
|
||||
|
||||
if(soc_mask) {
|
||||
ret = smu_get_dpm_level_count(smu, SMU_SOCCLK, &level_count);
|
||||
if (ret)
|
||||
return ret;
|
||||
*sclk_mask = level_count - 1;
|
||||
*soc_mask = level_count - 1;
|
||||
}
|
||||
}
|
||||
|
||||
@ -1280,7 +1278,7 @@ static int navi10_thermal_get_temperature(struct smu_context *smu,
|
||||
if (!value)
|
||||
return -EINVAL;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, (void *)&metrics, false);
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, 0, (void *)&metrics, false);
|
||||
if (ret)
|
||||
return ret;
|
||||
|
||||
|
@ -261,14 +261,20 @@ static int smu_v11_0_check_fw_version(struct smu_context *smu)
|
||||
smu_minor = (smu_version >> 8) & 0xff;
|
||||
smu_debug = (smu_version >> 0) & 0xff;
|
||||
|
||||
|
||||
/*
|
||||
* 1. if_version mismatch is not critical as our fw is designed
|
||||
* to be backward compatible.
|
||||
* 2. New fw usually brings some optimizations. But that's visible
|
||||
* only on the paired driver.
|
||||
* Considering above, we just leave user a warning message instead
|
||||
* of halt driver loading.
|
||||
*/
|
||||
if (if_version != smu->smc_if_version) {
|
||||
pr_info("smu driver if version = 0x%08x, smu fw if version = 0x%08x, "
|
||||
"smu fw version = 0x%08x (%d.%d.%d)\n",
|
||||
smu->smc_if_version, if_version,
|
||||
smu_version, smu_major, smu_minor, smu_debug);
|
||||
pr_err("SMU driver if version not matched\n");
|
||||
ret = -EINVAL;
|
||||
pr_warn("SMU driver if version not matched\n");
|
||||
}
|
||||
|
||||
return ret;
|
||||
@ -703,7 +709,7 @@ static int smu_v11_0_write_pptable(struct smu_context *smu)
|
||||
struct smu_table_context *table_context = &smu->smu_table;
|
||||
int ret = 0;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_PPTABLE,
|
||||
ret = smu_update_table(smu, SMU_TABLE_PPTABLE, 0,
|
||||
table_context->driver_pptable, true);
|
||||
|
||||
return ret;
|
||||
@ -722,7 +728,7 @@ static int smu_v11_0_write_watermarks_table(struct smu_context *smu)
|
||||
if (!table->cpu_addr)
|
||||
return -EINVAL;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_WATERMARKS, table->cpu_addr,
|
||||
ret = smu_update_table(smu, SMU_TABLE_WATERMARKS, 0, table->cpu_addr,
|
||||
true);
|
||||
|
||||
return ret;
|
||||
|
@ -2705,8 +2705,6 @@ static int ci_initialize_mc_reg_table(struct pp_hwmgr *hwmgr)
|
||||
cgs_write_register(hwmgr->device, mmMC_SEQ_PMG_CMD_MRS2_LP, cgs_read_register(hwmgr->device, mmMC_PMG_CMD_MRS2));
|
||||
cgs_write_register(hwmgr->device, mmMC_SEQ_WR_CTL_2_LP, cgs_read_register(hwmgr->device, mmMC_SEQ_WR_CTL_2));
|
||||
|
||||
memset(table, 0x00, sizeof(pp_atomctrl_mc_reg_table));
|
||||
|
||||
result = atomctrl_initialize_mc_reg_table(hwmgr, module_index, table);
|
||||
|
||||
if (0 == result)
|
||||
|
@ -2634,8 +2634,6 @@ static int iceland_initialize_mc_reg_table(struct pp_hwmgr *hwmgr)
|
||||
cgs_write_register(hwmgr->device, mmMC_SEQ_PMG_CMD_MRS2_LP, cgs_read_register(hwmgr->device, mmMC_PMG_CMD_MRS2));
|
||||
cgs_write_register(hwmgr->device, mmMC_SEQ_WR_CTL_2_LP, cgs_read_register(hwmgr->device, mmMC_SEQ_WR_CTL_2));
|
||||
|
||||
memset(table, 0x00, sizeof(pp_atomctrl_mc_reg_table));
|
||||
|
||||
result = atomctrl_initialize_mc_reg_table(hwmgr, module_index, table);
|
||||
|
||||
if (0 == result)
|
||||
|
@ -3117,8 +3117,6 @@ static int tonga_initialize_mc_reg_table(struct pp_hwmgr *hwmgr)
|
||||
cgs_write_register(hwmgr->device, mmMC_SEQ_WR_CTL_2_LP,
|
||||
cgs_read_register(hwmgr->device, mmMC_SEQ_WR_CTL_2));
|
||||
|
||||
memset(table, 0x00, sizeof(pp_atomctrl_mc_reg_table));
|
||||
|
||||
result = atomctrl_initialize_mc_reg_table(hwmgr, module_index, table);
|
||||
|
||||
if (!result)
|
||||
|
@ -319,7 +319,7 @@ static int vega20_tables_init(struct smu_context *smu, struct smu_table *tables)
|
||||
AMDGPU_GEM_DOMAIN_VRAM);
|
||||
|
||||
smu_table->metrics_table = kzalloc(sizeof(SmuMetrics_t), GFP_KERNEL);
|
||||
if (smu_table->metrics_table)
|
||||
if (!smu_table->metrics_table)
|
||||
return -ENOMEM;
|
||||
smu_table->metrics_time = 0;
|
||||
|
||||
@ -441,7 +441,6 @@ static int vega20_store_powerplay_table(struct smu_context *smu)
|
||||
{
|
||||
ATOM_Vega20_POWERPLAYTABLE *powerplay_table = NULL;
|
||||
struct smu_table_context *table_context = &smu->smu_table;
|
||||
int ret;
|
||||
|
||||
if (!table_context->power_play_table)
|
||||
return -EINVAL;
|
||||
@ -455,9 +454,7 @@ static int vega20_store_powerplay_table(struct smu_context *smu)
|
||||
table_context->thermal_controller_type = powerplay_table->ucThermalControllerType;
|
||||
table_context->TDPODLimit = le32_to_cpu(powerplay_table->OverDrive8Table.ODSettingsMax[ATOM_VEGA20_ODSETTING_POWERPERCENTAGE]);
|
||||
|
||||
ret = vega20_setup_od8_information(smu);
|
||||
|
||||
return ret;
|
||||
return 0;
|
||||
}
|
||||
|
||||
static int vega20_append_powerplay_table(struct smu_context *smu)
|
||||
@ -992,7 +989,7 @@ static int vega20_print_clk_levels(struct smu_context *smu,
|
||||
break;
|
||||
|
||||
case SMU_SOCCLK:
|
||||
ret = smu_get_current_clk_freq(smu, PPCLK_SOCCLK, &now);
|
||||
ret = smu_get_current_clk_freq(smu, SMU_SOCCLK, &now);
|
||||
if (ret) {
|
||||
pr_err("Attempt to get current socclk Failed!");
|
||||
return ret;
|
||||
@ -1013,7 +1010,7 @@ static int vega20_print_clk_levels(struct smu_context *smu,
|
||||
break;
|
||||
|
||||
case SMU_FCLK:
|
||||
ret = smu_get_current_clk_freq(smu, PPCLK_FCLK, &now);
|
||||
ret = smu_get_current_clk_freq(smu, SMU_FCLK, &now);
|
||||
if (ret) {
|
||||
pr_err("Attempt to get current fclk Failed!");
|
||||
return ret;
|
||||
@ -1028,7 +1025,7 @@ static int vega20_print_clk_levels(struct smu_context *smu,
|
||||
break;
|
||||
|
||||
case SMU_DCEFCLK:
|
||||
ret = smu_get_current_clk_freq(smu, PPCLK_DCEFCLK, &now);
|
||||
ret = smu_get_current_clk_freq(smu, SMU_DCEFCLK, &now);
|
||||
if (ret) {
|
||||
pr_err("Attempt to get current dcefclk Failed!");
|
||||
return ret;
|
||||
@ -1502,11 +1499,17 @@ static int vega20_set_default_od8_setttings(struct smu_context *smu)
|
||||
|
||||
od8_settings = kzalloc(sizeof(struct vega20_od8_settings), GFP_KERNEL);
|
||||
|
||||
if (od8_settings)
|
||||
if (!od8_settings)
|
||||
return -ENOMEM;
|
||||
|
||||
smu->od_settings = (void *)od8_settings;
|
||||
|
||||
ret = vega20_setup_od8_information(smu);
|
||||
if (ret) {
|
||||
pr_err("Retrieve board OD limits failed!\n");
|
||||
return ret;
|
||||
}
|
||||
|
||||
if (smu_feature_is_enabled(smu, SMU_FEATURE_DPM_SOCCLK_BIT)) {
|
||||
if (od8_settings->od_feature_capabilities[ATOM_VEGA20_ODFEATURE_GFXCLK_LIMITS] &&
|
||||
od8_settings->od_settings_max[OD8_SETTING_GFXCLK_FMAX] > 0 &&
|
||||
@ -1677,7 +1680,7 @@ static int vega20_get_metrics_table(struct smu_context *smu,
|
||||
int ret = 0;
|
||||
|
||||
if (!smu_table->metrics_time || time_after(jiffies, smu_table->metrics_time + HZ / 1000)) {
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS,
|
||||
ret = smu_update_table(smu, SMU_TABLE_SMU_METRICS, 0,
|
||||
(void *)smu_table->metrics_table, false);
|
||||
if (ret) {
|
||||
pr_info("Failed to export SMU metrics table!\n");
|
||||
@ -1706,7 +1709,7 @@ static int vega20_set_default_od_settings(struct smu_context *smu,
|
||||
if (!table_context->overdrive_table)
|
||||
return -ENOMEM;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE,
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, 0,
|
||||
table_context->overdrive_table, false);
|
||||
if (ret) {
|
||||
pr_err("Failed to export over drive table!\n");
|
||||
@ -1718,7 +1721,7 @@ static int vega20_set_default_od_settings(struct smu_context *smu,
|
||||
return ret;
|
||||
}
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE,
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, 0,
|
||||
table_context->overdrive_table, true);
|
||||
if (ret) {
|
||||
pr_err("Failed to import over drive table!\n");
|
||||
@ -1802,7 +1805,7 @@ static int vega20_get_power_profile_mode(struct smu_context *smu, char *buf)
|
||||
/* conv PP_SMC_POWER_PROFILE* to WORKLOAD_PPLIB_*_BIT */
|
||||
workload_type = smu_workload_get_type(smu, i);
|
||||
result = smu_update_table(smu,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF | workload_type << 16,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF, workload_type,
|
||||
(void *)(&activity_monitor), false);
|
||||
if (result) {
|
||||
pr_err("[%s] Failed to get activity monitor!", __func__);
|
||||
@ -1888,7 +1891,7 @@ static int vega20_set_power_profile_mode(struct smu_context *smu, long *input, u
|
||||
|
||||
if (smu->power_profile_mode == PP_SMC_POWER_PROFILE_CUSTOM) {
|
||||
ret = smu_update_table(smu,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF | WORKLOAD_PPLIB_CUSTOM_BIT << 16,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF, WORKLOAD_PPLIB_CUSTOM_BIT,
|
||||
(void *)(&activity_monitor), false);
|
||||
if (ret) {
|
||||
pr_err("[%s] Failed to get activity monitor!", __func__);
|
||||
@ -1943,7 +1946,7 @@ static int vega20_set_power_profile_mode(struct smu_context *smu, long *input, u
|
||||
}
|
||||
|
||||
ret = smu_update_table(smu,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF | WORKLOAD_PPLIB_CUSTOM_BIT << 16,
|
||||
SMU_TABLE_ACTIVITY_MONITOR_COEFF, WORKLOAD_PPLIB_CUSTOM_BIT,
|
||||
(void *)(&activity_monitor), true);
|
||||
if (ret) {
|
||||
pr_err("[%s] Failed to set activity monitor!", __func__);
|
||||
@ -2492,7 +2495,7 @@ static int vega20_update_od8_settings(struct smu_context *smu,
|
||||
struct smu_table_context *table_context = &smu->smu_table;
|
||||
int ret;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE,
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, 0,
|
||||
table_context->overdrive_table, false);
|
||||
if (ret) {
|
||||
pr_err("Failed to export over drive table!\n");
|
||||
@ -2503,7 +2506,7 @@ static int vega20_update_od8_settings(struct smu_context *smu,
|
||||
if (ret)
|
||||
return ret;
|
||||
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE,
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, 0,
|
||||
table_context->overdrive_table, true);
|
||||
if (ret) {
|
||||
pr_err("Failed to import over drive table!\n");
|
||||
@ -2767,7 +2770,7 @@ static int vega20_odn_edit_dpm_table(struct smu_context *smu,
|
||||
break;
|
||||
|
||||
case PP_OD_RESTORE_DEFAULT_TABLE:
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, table_context->overdrive_table, false);
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, 0, table_context->overdrive_table, false);
|
||||
if (ret) {
|
||||
pr_err("Failed to export over drive table!\n");
|
||||
return ret;
|
||||
@ -2776,7 +2779,7 @@ static int vega20_odn_edit_dpm_table(struct smu_context *smu,
|
||||
break;
|
||||
|
||||
case PP_OD_COMMIT_DPM_TABLE:
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, table_context->overdrive_table, true);
|
||||
ret = smu_update_table(smu, SMU_TABLE_OVERDRIVE, 0, table_context->overdrive_table, true);
|
||||
if (ret) {
|
||||
pr_err("Failed to import over drive table!\n");
|
||||
return ret;
|
||||
|
@ -219,7 +219,10 @@ union drm_amdgpu_bo_list {
|
||||
#define AMDGPU_CTX_PRIORITY_VERY_LOW -1023
|
||||
#define AMDGPU_CTX_PRIORITY_LOW -512
|
||||
#define AMDGPU_CTX_PRIORITY_NORMAL 0
|
||||
/* Selecting a priority above NORMAL requires CAP_SYS_NICE or DRM_MASTER */
|
||||
/*
|
||||
* When used in struct drm_amdgpu_ctx_in, a priority above NORMAL requires
|
||||
* CAP_SYS_NICE or DRM_MASTER
|
||||
*/
|
||||
#define AMDGPU_CTX_PRIORITY_HIGH 512
|
||||
#define AMDGPU_CTX_PRIORITY_VERY_HIGH 1023
|
||||
|
||||
@ -229,6 +232,7 @@ struct drm_amdgpu_ctx_in {
|
||||
/** For future use, no flags defined so far */
|
||||
__u32 flags;
|
||||
__u32 ctx_id;
|
||||
/** AMDGPU_CTX_PRIORITY_* */
|
||||
__s32 priority;
|
||||
};
|
||||
|
||||
@ -281,6 +285,7 @@ struct drm_amdgpu_sched_in {
|
||||
/* AMDGPU_SCHED_OP_* */
|
||||
__u32 op;
|
||||
__u32 fd;
|
||||
/** AMDGPU_CTX_PRIORITY_* */
|
||||
__s32 priority;
|
||||
__u32 ctx_id;
|
||||
};
|
||||
|
Loading…
Reference in New Issue
Block a user