Vega20 arbitrates pstate at hive level and not device level. Last peer to remote buffer unmap could drop P-State while another process is still remote buffer mapped. With this fix, P-States still needs to be disabled for now as SMU bug was discovered on synchronous P2P transfers. This should be fixed in the next FW update. Signed-off-by: Jonathan Kim <Jonathan.Kim@amd.com> Reviewed-by: Felix Kuehling <Felix.Kuehling@amd.com> Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
		
			
				
	
	
		
			77 lines
		
	
	
		
			2.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			77 lines
		
	
	
		
			2.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Copyright 2016 Advanced Micro Devices, Inc.
 | |
|  *
 | |
|  * Permission is hereby granted, free of charge, to any person obtaining a
 | |
|  * copy of this software and associated documentation files (the "Software"),
 | |
|  * to deal in the Software without restriction, including without limitation
 | |
|  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 | |
|  * and/or sell copies of the Software, and to permit persons to whom the
 | |
|  * Software is furnished to do so, subject to the following conditions:
 | |
|  *
 | |
|  * The above copyright notice and this permission notice shall be included in
 | |
|  * all copies or substantial portions of the Software.
 | |
|  *
 | |
|  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 | |
|  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 | |
|  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 | |
|  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 | |
|  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 | |
|  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 | |
|  * OTHER DEALINGS IN THE SOFTWARE.
 | |
|  */
 | |
| #ifndef __AMDGPU_XGMI_H__
 | |
| #define __AMDGPU_XGMI_H__
 | |
| 
 | |
| #include <drm/task_barrier.h>
 | |
| #include "amdgpu_psp.h"
 | |
| 
 | |
| 
 | |
| struct amdgpu_hive_info {
 | |
| 	uint64_t		hive_id;
 | |
| 	struct list_head	device_list;
 | |
| 	int number_devices;
 | |
| 	struct mutex hive_lock, reset_lock;
 | |
| 	struct kobject *kobj;
 | |
| 	struct device_attribute dev_attr;
 | |
| 	struct amdgpu_device *adev;
 | |
| 	int hi_req_count;
 | |
| 	struct amdgpu_device *hi_req_gpu;
 | |
| 	struct task_barrier tb;
 | |
| 	enum {
 | |
| 		AMDGPU_XGMI_PSTATE_MIN,
 | |
| 		AMDGPU_XGMI_PSTATE_MAX_VEGA20,
 | |
| 		AMDGPU_XGMI_PSTATE_UNKNOWN
 | |
| 	} pstate;
 | |
| };
 | |
| 
 | |
| struct amdgpu_pcs_ras_field {
 | |
| 	const char *err_name;
 | |
| 	uint32_t pcs_err_mask;
 | |
| 	uint32_t pcs_err_shift;
 | |
| };
 | |
| 
 | |
| struct amdgpu_hive_info *amdgpu_get_xgmi_hive(struct amdgpu_device *adev, int lock);
 | |
| int amdgpu_xgmi_update_topology(struct amdgpu_hive_info *hive, struct amdgpu_device *adev);
 | |
| int amdgpu_xgmi_add_device(struct amdgpu_device *adev);
 | |
| int amdgpu_xgmi_remove_device(struct amdgpu_device *adev);
 | |
| int amdgpu_xgmi_set_pstate(struct amdgpu_device *adev, int pstate);
 | |
| int amdgpu_xgmi_get_hops_count(struct amdgpu_device *adev,
 | |
| 		struct amdgpu_device *peer_adev);
 | |
| int amdgpu_xgmi_ras_late_init(struct amdgpu_device *adev);
 | |
| void amdgpu_xgmi_ras_fini(struct amdgpu_device *adev);
 | |
| uint64_t amdgpu_xgmi_get_relative_phy_addr(struct amdgpu_device *adev,
 | |
| 					   uint64_t addr);
 | |
| int amdgpu_xgmi_query_ras_error_count(struct amdgpu_device *adev,
 | |
| 				      void *ras_error_status);
 | |
| void amdgpu_xgmi_reset_ras_error_count(struct amdgpu_device *adev);
 | |
| 
 | |
| static inline bool amdgpu_xgmi_same_hive(struct amdgpu_device *adev,
 | |
| 		struct amdgpu_device *bo_adev)
 | |
| {
 | |
| 	return (adev != bo_adev &&
 | |
| 		adev->gmc.xgmi.hive_id &&
 | |
| 		adev->gmc.xgmi.hive_id == bo_adev->gmc.xgmi.hive_id);
 | |
| }
 | |
| 
 | |
| #endif
 |