git.baikalelectronics.ru Git - kernel.git/commitdiff
drm/amdgpu: Aldebaran: MTYPE_NC for coarse-grain remote memory
author Felix Kuehling <Felix.Kuehling@amd.com>
Mon, 10 May 2021 22:50:11 +0000 (18:50 -0400)
committer Alex Deucher <alexander.deucher@amd.com>
Thu, 20 May 2021 02:29:56 +0000 (22:29 -0400)
MTYPE UC was used for a specific use case that ended up not being
implemented. Use NC for better performance for coarse-grained memory where
cache coherence during shader execution is not required.

Signed-off-by: Felix Kuehling <Felix.Kuehling@amd.com>
Reviewed-by: Oak Zeng <Oak.Zeng@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_gpuvm.c
drivers/gpu/drm/amd/amdkfd/kfd_svm.c

index 941a204d28f5af07f5cebb8770938860f511e126..93ee569f6a63e3e7bf78306dd9c8e041ccc18656 100644 (file)
@@ -453,7 +453,8 @@ static uint64_t get_pte_flags(struct amdgpu_device *adev, struct kgd_mem *mem)
                                if (adev->gmc.xgmi.connected_to_cpu)
                                        snoop = true;
                        } else {
-                               mapping_flags |= AMDGPU_VM_MTYPE_UC;
+                               mapping_flags |= coherent ?
+                                       AMDGPU_VM_MTYPE_UC : AMDGPU_VM_MTYPE_NC;
                                if (amdgpu_xgmi_same_hive(adev, bo_adev))
                                        snoop = true;
                        }
index 12c827854d1d22f0caac3ad37476bb8d5daecc67..3886c630286bf30f7ad3b31cac17934c28e6d857 100644 (file)
@@ -1040,7 +1040,8 @@ svm_range_get_pte_flags(struct amdgpu_device *adev, struct svm_range *prange)
                                if (adev->gmc.xgmi.connected_to_cpu)
                                        snoop = true;
                        } else {
-                               mapping_flags |= AMDGPU_VM_MTYPE_UC;
+                               mapping_flags |= coherent ?
+                                       AMDGPU_VM_MTYPE_UC : AMDGPU_VM_MTYPE_NC;
                                if (amdgpu_xgmi_same_hive(adev, bo_adev))
                                        snoop = true;
                        }