gpu: nvgpu: Fix IPA to PA translation

Background: In Hypervisor mode dGPU device is configured in pass through mode for the Guest (QNX/Linux). GMMU programming is handled by the guest which converts a mapped buffer's GVA into SGLes in IPA (Intermediate/Guest Physical address) which is then translated into PA (Acutual Physical address) and programs the GMMU PTEes with correct GVA to PA mapping. Incase of the vgpu this work is delegated to the RM server which takes care of the GMMU programming and IPA to PA conversion. Problem: The current GMMU mapping logic in the guest assumes that PA range is continuous over a given IPA range. Hence, it doesn't account for holes being present in the PA range. But this is not the case, a continous IPA range can be mapped to dis-contiguous PA ranges. In this situation the mapping logic sets up GMMU PTEes ignoring the holes in physical memory and creates GVA => PA mapping which intrudes into the PA ranges which are reserved. This results in memory being corrupted. This change takes into account holes being present in a given PA range and for a given IPA range it also identifies the discontiguous PA ranges and sets up the PTE's appropriately. Bug 200451447 Jira VQRM-5069 Change-Id: I354d984f6c44482e4576a173fce1e90ab52283ac Signed-off-by: aalex <aalex@nvidia.com> Signed-off-by: Antony Clince Alex <aalex@nvidia.com> Reviewed-on: https://git-master.nvidia.com/r/1850972 Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
2025-12-25 02:52:51 +03:00 · 2018-09-28 15:24:20 +05:30
parent 6c8be7cfe2
commit 80d03f34f7
8 changed files with 157 additions and 25 deletions
--- a/drivers/gpu/nvgpu/common/mm/gmmu.c
+++ b/drivers/gpu/nvgpu/common/mm/gmmu.c
@@ -537,8 +537,20 @@ static int __nvgpu_gmmu_do_update_page_table(struct vm_gk20a *vm,
 	 * we really are mapping physical pages directly.
 	 */
 	nvgpu_sgt_for_each_sgl(sgl, sgt) {
+		/*
+		 * ipa_addr == phys_addr for non virtualized OSes.
+		 */
 		u64 phys_addr;
-		u64 chunk_length;
+		u64 ipa_addr;
+		/*
+		 * For non virtualized OSes SGL entries are contiguous in
+		 * physical memory (sgl_length == phys_length). For virtualized
+		 * OSes SGL entries are mapped to intermediate physical memory
+		 * which may subsequently point to discontiguous physical
+		 * memory. Therefore phys_length may not be equal to sgl_length.
+		 */
+		u64 phys_length;
+		u64 sgl_length;

 		/*
 		 * Cut out sgl ents for space_to_skip.
@@ -549,31 +561,83 @@ static int __nvgpu_gmmu_do_update_page_table(struct vm_gk20a *vm,
 			continue;
 		}

-		phys_addr = g->ops.mm.gpu_phys_addr(g, attrs,
-			    nvgpu_sgt_get_phys(g, sgt, sgl)) + space_to_skip;
-		chunk_length = min(length,
-			nvgpu_sgt_get_length(sgt, sgl) - space_to_skip);
-
-		err = __set_pd_level(vm, &vm->pdb,
-				     0,
-				     phys_addr,
-				     virt_addr,
-				     chunk_length,
-				     attrs);
-		if (err != 0) {
-			break;
-		}
-
-		/* Space has been skipped so zero this for future chunks. */
-		space_to_skip = 0;
+		/*
+		 * IPA and PA have 1:1 mapping for non virtualized OSes.
+		 */
+		ipa_addr = nvgpu_sgt_get_ipa(g, sgt, sgl);

 		/*
-		 * Update the map pointer and the remaining length.
+		 * For non-virtualized OSes SGL entries are contiguous and hence
+		 * sgl_length == phys_length. For virtualized OSes the
+		 * phys_length will be updated by nvgpu_sgt_ipa_to_pa.
 		 */
-		virt_addr += chunk_length;
-		length    -= chunk_length;
+		sgl_length = nvgpu_sgt_get_length(sgt, sgl);
+		phys_length = sgl_length;

-		if (length == 0U) {
+		while (sgl_length > 0ULL && length > 0ULL) {
+			/*
+			 * Holds the size of the portion of SGL that is backed
+			 * with physically contiguous memory.
+			 */
+			u64 sgl_contiguous_length;
+			/*
+			 * Number of bytes of the SGL entry that is actually
+			 * mapped after accounting for space_to_skip.
+			 */
+			u64 mapped_sgl_length;
+
+			/*
+			 * For virtualized OSes translate IPA to PA. Retrieve
+			 * the size of the underlying physical memory chunk to
+			 * which SGL has been mapped.
+			 */
+			phys_addr = nvgpu_sgt_ipa_to_pa(g, sgt, sgl, ipa_addr,
+					&phys_length);
+			phys_addr = g->ops.mm.gpu_phys_addr(g, attrs, phys_addr)
+				+ space_to_skip;
+
+			/*
+			 * For virtualized OSes when phys_length is less than
+			 * sgl_length check if space_to_skip exceeds phys_length
+			 * if so skip this memory chunk
+			 */
+			if (space_to_skip >= phys_length) {
+				space_to_skip -= phys_length;
+				ipa_addr += phys_length;
+				sgl_length -= phys_length;
+				continue;
+			}
+
+			sgl_contiguous_length = min(phys_length, sgl_length);
+			mapped_sgl_length = min(length, sgl_contiguous_length -
+					space_to_skip);
+
+			err = __set_pd_level(vm, &vm->pdb,
+						 0,
+						 phys_addr,
+						 virt_addr,
+						 mapped_sgl_length,
+						 attrs);
+			if (err != 0) {
+				return err;
+			}
+
+			/*
+			 * Update the map pointer and the remaining length.
+			 */
+			virt_addr  += mapped_sgl_length;
+			length     -= mapped_sgl_length;
+			sgl_length -= mapped_sgl_length + space_to_skip;
+			ipa_addr   += mapped_sgl_length + space_to_skip;
+
+			/*
+			 * Space has been skipped so zero this for future
+			 * chunks.
+			 */
+			space_to_skip = 0;
+		}
+
+		if (length == 0ULL) {
 			break;
 		}
 	}
--- a/drivers/gpu/nvgpu/common/mm/nvgpu_mem.c
+++ b/drivers/gpu/nvgpu/common/mm/nvgpu_mem.c
@@ -99,6 +99,18 @@ u64 nvgpu_sgt_get_phys(struct gk20a *g, struct nvgpu_sgt *sgt,
 	return sgt->ops->sgl_phys(g, sgl);
 }

+u64 nvgpu_sgt_get_ipa(struct gk20a *g, struct nvgpu_sgt *sgt,
+		       struct nvgpu_sgl *sgl)
+{
+	return sgt->ops->sgl_ipa(g, sgl);
+}
+
+u64 nvgpu_sgt_ipa_to_pa(struct gk20a *g, struct nvgpu_sgt *sgt,
+		       struct nvgpu_sgl *sgl, u64 ipa, u64 *pa_len)
+{
+	return sgt->ops->sgl_ipa_to_pa(g, sgl, ipa, pa_len);
+}
+
 u64 nvgpu_sgt_get_dma(struct nvgpu_sgt *sgt, struct nvgpu_sgl *sgl)
 {
 	return sgt->ops->sgl_dma(sgl);
--- a/drivers/gpu/nvgpu/common/mm/page_allocator.c
+++ b/drivers/gpu/nvgpu/common/mm/page_allocator.c
@@ -167,6 +167,12 @@ static u64 nvgpu_page_alloc_sgl_phys(struct gk20a *g, struct nvgpu_sgl *sgl)
 	return sgl_impl->phys;
 }

+static u64 nvgpu_page_alloc_sgl_ipa_to_pa(struct gk20a *g,
+		struct nvgpu_sgl *sgl, u64 ipa, u64 *pa_len)
+{
+	return ipa;
+}
+
 static u64 nvgpu_page_alloc_sgl_dma(struct nvgpu_sgl *sgl)
 {
 	struct nvgpu_mem_sgl *sgl_impl = (struct nvgpu_mem_sgl *)sgl;
@@ -205,6 +211,8 @@ static void nvgpu_page_alloc_sgt_free(struct gk20a *g, struct nvgpu_sgt *sgt)
 static const struct nvgpu_sgt_ops page_alloc_sgl_ops = {
 	.sgl_next = nvgpu_page_alloc_sgl_next,
 	.sgl_phys = nvgpu_page_alloc_sgl_phys,
+	.sgl_ipa = nvgpu_page_alloc_sgl_phys,
+	.sgl_ipa_to_pa = nvgpu_page_alloc_sgl_ipa_to_pa,
 	.sgl_dma = nvgpu_page_alloc_sgl_dma,
 	.sgl_length = nvgpu_page_alloc_sgl_length,
 	.sgl_gpu_addr = nvgpu_page_alloc_sgl_gpu_addr,
--- a/drivers/gpu/nvgpu/include/nvgpu/nvgpu_mem.h
+++ b/drivers/gpu/nvgpu/include/nvgpu/nvgpu_mem.h
@@ -71,6 +71,9 @@ struct nvgpu_sgl;
 struct nvgpu_sgt_ops {
 	struct nvgpu_sgl *(*sgl_next)(struct nvgpu_sgl *sgl);
 	u64   (*sgl_phys)(struct gk20a *g, struct nvgpu_sgl *sgl);
+	u64   (*sgl_ipa)(struct gk20a *g, struct nvgpu_sgl *sgl);
+	u64   (*sgl_ipa_to_pa)(struct gk20a *g, struct nvgpu_sgl *sgl,
+			      u64 ipa, u64 *pa_len);
 	u64   (*sgl_dma)(struct nvgpu_sgl *sgl);
 	u64   (*sgl_length)(struct nvgpu_sgl *sgl);
 	u64   (*sgl_gpu_addr)(struct gk20a *g, struct nvgpu_sgl *sgl,
@@ -255,6 +258,10 @@ struct nvgpu_sgt *nvgpu_sgt_create_from_mem(struct gk20a *g,

 struct nvgpu_sgl *nvgpu_sgt_get_next(struct nvgpu_sgt *sgt,
 					  struct nvgpu_sgl *sgl);
+u64 nvgpu_sgt_get_ipa(struct gk20a *g, struct nvgpu_sgt *sgt,
+				struct nvgpu_sgl *sgl);
+u64 nvgpu_sgt_ipa_to_pa(struct gk20a *g, struct nvgpu_sgt *sgt,
+				struct nvgpu_sgl *sgl, u64 ipa, u64 *pa_len);
 u64 nvgpu_sgt_get_phys(struct gk20a *g, struct nvgpu_sgt *sgt,
 		       struct nvgpu_sgl *sgl);
 u64 nvgpu_sgt_get_dma(struct nvgpu_sgt *sgt, struct nvgpu_sgl *sgl);
--- a/drivers/gpu/nvgpu/os/linux/nvgpu_mem.c
+++ b/drivers/gpu/nvgpu/os/linux/nvgpu_mem.c
@@ -36,6 +36,11 @@
 #include "gk20a/mm_gk20a.h"
 #include "platform_gk20a.h"

+static u64 __nvgpu_sgl_ipa(struct gk20a *g, struct nvgpu_sgl *sgl)
+{
+	return sg_phys((struct scatterlist *)sgl);
+}
+
 static u64 __nvgpu_sgl_phys(struct gk20a *g, struct nvgpu_sgl *sgl)
 {
 	struct device *dev = dev_from_gk20a(g);
@@ -43,7 +48,7 @@ static u64 __nvgpu_sgl_phys(struct gk20a *g, struct nvgpu_sgl *sgl)
 	u64 ipa = sg_phys((struct scatterlist *)sgl);

 	if (platform->phys_addr)
-		return platform->phys_addr(g, ipa);
+		return platform->phys_addr(g, ipa, NULL);

 	return ipa;
 }
@@ -251,6 +256,23 @@ static struct nvgpu_sgl *nvgpu_mem_linux_sgl_next(struct nvgpu_sgl *sgl)
 	return (struct nvgpu_sgl *)sg_next((struct scatterlist *)sgl);
 }

+static u64 nvgpu_mem_linux_sgl_ipa(struct gk20a *g, struct nvgpu_sgl *sgl)
+{
+	return __nvgpu_sgl_ipa(g, sgl);
+}
+
+static u64 nvgpu_mem_linux_sgl_ipa_to_pa(struct gk20a *g,
+		struct nvgpu_sgl *sgl, u64 ipa, u64 *pa_len)
+{
+	struct device *dev = dev_from_gk20a(g);
+	struct gk20a_platform *platform = gk20a_get_platform(dev);
+
+	if (platform->phys_addr)
+		return platform->phys_addr(g, ipa, pa_len);
+
+	return ipa;
+}
+
 static u64 nvgpu_mem_linux_sgl_phys(struct gk20a *g, struct nvgpu_sgl *sgl)
 {
 	return (u64)__nvgpu_sgl_phys(g, sgl);
@@ -301,6 +323,8 @@ static void nvgpu_mem_linux_sgl_free(struct gk20a *g, struct nvgpu_sgt *sgt)
 static const struct nvgpu_sgt_ops nvgpu_linux_sgt_ops = {
 	.sgl_next      = nvgpu_mem_linux_sgl_next,
 	.sgl_phys      = nvgpu_mem_linux_sgl_phys,
+	.sgl_ipa       = nvgpu_mem_linux_sgl_ipa,
+	.sgl_ipa_to_pa = nvgpu_mem_linux_sgl_ipa_to_pa,
 	.sgl_dma       = nvgpu_mem_linux_sgl_dma,
 	.sgl_length    = nvgpu_mem_linux_sgl_length,
 	.sgl_gpu_addr  = nvgpu_mem_linux_sgl_gpu_addr,
--- a/drivers/gpu/nvgpu/os/linux/platform_gk20a.h
+++ b/drivers/gpu/nvgpu/os/linux/platform_gk20a.h
@@ -234,7 +234,7 @@ struct gk20a_platform {
 	 * addresses (not IPA). This is the case for GV100 nvlink in HV+L
 	 * configuration, when dGPU is in pass-through mode.
 	 */
-	u64 (*phys_addr)(struct gk20a *g, u64 ipa);
+	u64 (*phys_addr)(struct gk20a *g, u64 ipa, u64 *pa_len);

 	/* Callbacks to assert/deassert GPU reset */
 	int (*reset_assert)(struct device *dev);
--- a/drivers/gpu/nvgpu/os/linux/soc.c
+++ b/drivers/gpu/nvgpu/os/linux/soc.c
@@ -65,7 +65,7 @@ bool nvgpu_is_soc_t194_a01(struct gk20a *g)
 * is enabled), the addresses we get from dma_alloc are IPAs. We need to
 * convert them to PA.
 */
-static u64 nvgpu_tegra_hv_ipa_pa(struct gk20a *g, u64 ipa)
+static u64 nvgpu_tegra_hv_ipa_pa(struct gk20a *g, u64 ipa, u64 *pa_len)
 {
 	struct device *dev = dev_from_gk20a(g);
 	struct gk20a_platform *platform = gk20a_get_platform(dev);
@@ -92,6 +92,13 @@ static u64 nvgpu_tegra_hv_ipa_pa(struct gk20a *g, u64 ipa)
 		}
 	} else {
 		pa = info.base + info.offset;
+		if (pa_len != NULL) {
+			/*
+			 * Update the size of physical memory chunk after the
+			 * specified offset.
+			 */
+			*pa_len = info.size - info.offset;
+		}
 		nvgpu_log(g, gpu_dbg_map_v,
 				"ipa=%llx vmid=%d -> pa=%llx "
 				"base=%llx offset=%llx size=%llx\n",
--- a/drivers/gpu/nvgpu/os/posix/posix-nvgpu_mem.c
+++ b/drivers/gpu/nvgpu/os/posix/posix-nvgpu_mem.c
@@ -56,6 +56,14 @@ static u64 nvgpu_mem_sgl_phys(struct gk20a *g, struct nvgpu_sgl *sgl)
 	return (u64)(uintptr_t)mem->phys;
 }

+static u64 nvgpu_mem_sgl_ipa_to_pa(struct gk20a *g, struct nvgpu_sgl *sgl,
+		u64 ipa, u64 *pa_len)
+{
+	struct nvgpu_mem *mem = (struct nvgpu_mem *)sgl;
+
+	return (u64)(uintptr_t)mem->cpu_va;
+}
+
 static u64 nvgpu_mem_sgl_dma(struct nvgpu_sgl *sgl)
 {
 	struct nvgpu_mem_sgl *mem = (struct nvgpu_mem_sgl *)sgl;
@@ -99,6 +107,8 @@ static void nvgpu_mem_sgt_free(struct gk20a *g, struct nvgpu_sgt *sgt)
 static struct nvgpu_sgt_ops nvgpu_sgt_posix_ops = {
 	.sgl_next	= nvgpu_mem_sgl_next,
 	.sgl_phys	= nvgpu_mem_sgl_phys,
+	.sgl_ipa    = nvgpu_mem_sgl_phys,
+	.sgl_ipa_to_pa = nvgpu_mem_sgl_ipa_to_pa,
 	.sgl_dma	= nvgpu_mem_sgl_dma,
 	.sgl_length	= nvgpu_mem_sgl_length,
 	.sgl_gpu_addr	= nvgpu_mem_sgl_gpu_addr,