Mirror of git://nv-tegra.nvidia.com/linux-nvgpu.git
Synced 2025-12-24 02:22:34 +03:00
gpu: nvgpu: Remove buffer_attrs struct
Remove the buffer_attrs struct and replace it with a more streamlined
nvgpu_ctag_buffer_info struct. This struct lets several related fields be
passed together, by pointer, to the various kind/compression functions in
the VM map process. This patch also moves several comptag/kind related
functions to the core vm.c code, since these functions can be reused by
other OSes.

Change-Id: I2a0f0a1c4b554ce4c8f2acdbe3161392e717d3bf
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1583984
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Committed by: mobile promotions
Parent: a8bd154f79
Commit: 88ee812d56
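
For orientation before reading the diff: the Linux map path now gathers its
kind/compression inputs into a single nvgpu_ctag_buffer_info and hands it to
the two new common helpers. The sketch below is a simplified illustration,
not code from this patch; example_setup_kind() is a hypothetical wrapper, the
page-size choice is a placeholder, and error handling is reduced to comments.

/*
 * Simplified sketch of the reworked kind/compression setup in
 * nvgpu_vm_map_linux(). example_setup_kind() is hypothetical; the real
 * code inlines these steps and derives binfo.pgsz_idx via __get_pte_size().
 */
static int example_setup_kind(struct vm_gk20a *vm, struct dma_buf *dmabuf,
			      u32 flags, s16 compr_kind, s16 incompr_kind)
{
	struct nvgpu_ctag_buffer_info binfo = { 0 };
	int err;

	binfo.flags = flags;			/* NVGPU_AS_MAP_BUFFER_FLAGS_* */
	binfo.size = dmabuf->size;		/* buffer size drives ctag_lines */
	binfo.pgsz_idx = gmmu_page_size_small;	/* placeholder page size */

	/* Fill kind_v/uc_kind_v from the user-supplied kind arguments. */
	err = nvgpu_vm_init_kind_info(&binfo, compr_kind, incompr_kind);
	if (err)
		return err;

	/* Resolve the final kind and the number of comptag lines. */
	err = nvgpu_vm_compute_kind_and_compression(vm, &binfo);
	if (err)
		return err;

	/* binfo.kind_v and binfo.ctag_lines now feed the GMMU map call. */
	return 0;
}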
@@ -115,84 +115,6 @@ static u64 nvgpu_get_buffer_alignment(struct gk20a *g, struct scatterlist *sgl,
 	return align;
 }
 
-static int setup_kind_legacy(struct vm_gk20a *vm, struct buffer_attrs *bfr,
-			     bool *pkind_compressible)
-{
-	struct gk20a *g = gk20a_from_vm(vm);
-	bool kind_compressible;
-
-	if (unlikely(bfr->kind_v == g->ops.mm.get_kind_invalid()))
-		bfr->kind_v = g->ops.mm.get_kind_pitch();
-
-	if (unlikely(!gk20a_kind_is_supported(bfr->kind_v))) {
-		nvgpu_err(g, "kind 0x%x not supported", bfr->kind_v);
-		return -EINVAL;
-	}
-
-	bfr->uc_kind_v = g->ops.mm.get_kind_invalid();
-	/* find a suitable incompressible kind if it becomes necessary later */
-	kind_compressible = gk20a_kind_is_compressible(bfr->kind_v);
-	if (kind_compressible) {
-		bfr->uc_kind_v = gk20a_get_uncompressed_kind(bfr->kind_v);
-		if (unlikely(bfr->uc_kind_v == g->ops.mm.get_kind_invalid())) {
-			/* shouldn't happen, but it is worth cross-checking */
-			nvgpu_err(g, "comptag kind 0x%x can't be"
-				  " downgraded to uncompressed kind",
-				  bfr->kind_v);
-			return -EINVAL;
-		}
-	}
-
-	*pkind_compressible = kind_compressible;
-	return 0;
-}
-
-static int setup_buffer_kind_and_compression(struct vm_gk20a *vm,
-					     u32 flags,
-					     struct buffer_attrs *bfr,
-					     enum gmmu_pgsz_gk20a pgsz_idx)
-{
-	bool kind_compressible;
-	struct gk20a *g = gk20a_from_vm(vm);
-	int ctag_granularity = g->ops.fb.compression_page_size(g);
-
-	if (!bfr->use_kind_v)
-		bfr->kind_v = g->ops.mm.get_kind_invalid();
-	if (!bfr->use_uc_kind_v)
-		bfr->uc_kind_v = g->ops.mm.get_kind_invalid();
-
-	if (flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL) {
-		kind_compressible = (bfr->kind_v !=
-				     g->ops.mm.get_kind_invalid());
-		if (!kind_compressible)
-			bfr->kind_v = bfr->uc_kind_v;
-	} else {
-		int err = setup_kind_legacy(vm, bfr, &kind_compressible);
-
-		if (err)
-			return err;
-	}
-
-	/* comptags only supported for suitable kinds, 128KB pagesize */
-	if (kind_compressible &&
-	    vm->gmmu_page_sizes[pgsz_idx] <
-	    g->ops.fb.compressible_page_size(g)) {
-		/* it is safe to fall back to uncompressed as
-		   functionality is not harmed */
-		bfr->kind_v = bfr->uc_kind_v;
-		kind_compressible = false;
-	}
-	if (kind_compressible)
-		bfr->ctag_lines = DIV_ROUND_UP_ULL(bfr->size, ctag_granularity);
-	else
-		bfr->ctag_lines = 0;
-
-	bfr->use_kind_v = (bfr->kind_v != g->ops.mm.get_kind_invalid());
-	bfr->use_uc_kind_v = (bfr->uc_kind_v != g->ops.mm.get_kind_invalid());
-
-	return 0;
-}
-
 int nvgpu_vm_find_buf(struct vm_gk20a *vm, u64 gpu_va,
 		      struct dma_buf **dmabuf,
 		      u64 *offset)

@@ -279,40 +201,6 @@ static u64 __nvgpu_vm_find_mapping(struct vm_gk20a *vm,
 	return mapped_buffer->addr;
 }
 
-static int setup_bfr_kind_fields(struct buffer_attrs *bfr, s16 compr_kind,
-				 s16 incompr_kind, u32 flags)
-{
-	if (flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL) {
-		/* were we supplied with a kind in either parameter? */
-		if ((compr_kind < 0 || compr_kind >= NV_KIND_ATTR_SIZE) &&
-		    (incompr_kind < 0 || incompr_kind >= NV_KIND_ATTR_SIZE))
-			return -EINVAL;
-
-		if (compr_kind != NV_KIND_INVALID) {
-			bfr->use_kind_v = true;
-			bfr->kind_v = (u8)compr_kind;
-		}
-
-		if (incompr_kind != NV_KIND_INVALID) {
-			bfr->use_uc_kind_v = true;
-			bfr->uc_kind_v = (u8)incompr_kind;
-		}
-	} else {
-		if (compr_kind < 0 || compr_kind >= NV_KIND_ATTR_SIZE)
-			return -EINVAL;
-
-		bfr->use_kind_v = true;
-		bfr->kind_v = (u8)compr_kind;
-
-		/*
-		 * Note: setup_buffer_kind_and_compression() will
-		 * figure out uc_kind_v or return an error
-		 */
-	}
-
-	return 0;
-}
-
 u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 		       struct dma_buf *dmabuf,
 		       u64 offset_align,

@@ -326,19 +214,19 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 {
 	struct gk20a *g = gk20a_from_vm(vm);
 	struct device *dev = dev_from_gk20a(g);
-	struct gk20a_comptag_allocator *ctag_allocator = &g->gr.comp_tags;
-	struct nvgpu_mapped_buf *mapped_buffer = NULL;
-	bool va_allocated = false;
-	u64 map_offset = 0;
-	int err = 0;
-	struct buffer_attrs bfr = {NULL};
+	struct nvgpu_ctag_buffer_info binfo = { 0 };
 	struct gk20a_comptags comptags;
-	bool clear_ctags = false;
-	struct scatterlist *sgl;
 	struct nvgpu_vm_area *vm_area = NULL;
-	u32 ctag_offset;
-	enum nvgpu_aperture aperture;
 	struct nvgpu_sgt *nvgpu_sgt;
+	struct sg_table *sgt;
+	struct nvgpu_mapped_buf *mapped_buffer = NULL;
+	enum nvgpu_aperture aperture;
+	bool va_allocated = false;
+	bool clear_ctags = false;
+	u64 map_offset = 0;
+	u64 align;
+	u32 ctag_offset;
+	int err = 0;
 
 	/*
 	 * The kind used as part of the key for map caching. HW may

@@ -347,6 +235,9 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 	 */
 	s16 map_key_kind;
 
+	binfo.flags = flags;
+	binfo.size = dmabuf->size;
+
 	if (flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL) {
 		if (compr_kind != NV_KIND_INVALID)
 			map_key_kind = compr_kind;

@@ -376,28 +267,16 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 		}
 	}
 
-	/* pin buffer to get phys/iovmm addr */
-	bfr.sgt = gk20a_mm_pin(dev, dmabuf);
-	if (IS_ERR(bfr.sgt)) {
-		/* Falling back to physical is actually possible
-		 * here in many cases if we use 4K phys pages in the
-		 * gmmu. However we have some regions which require
-		 * contig regions to work properly (either phys-contig
-		 * or contig through smmu io_vaspace). Until we can
-		 * track the difference between those two cases we have
-		 * to fail the mapping when we run out of SMMU space.
-		 */
+	sgt = gk20a_mm_pin(dev, dmabuf);
+	if (IS_ERR(sgt)) {
 		nvgpu_warn(g, "oom allocating tracking buffer");
 		goto clean_up;
 	}
 
-	err = setup_bfr_kind_fields(&bfr, compr_kind, incompr_kind, flags);
+	err = nvgpu_vm_init_kind_info(&binfo, compr_kind, incompr_kind);
 	if (err)
 		goto clean_up;
 
-	bfr.size = dmabuf->size;
-	sgl = bfr.sgt->sgl;
-
 	aperture = gk20a_dmabuf_aperture(g, dmabuf);
 	if (aperture == APERTURE_INVALID) {
 		err = -EINVAL;

@@ -407,60 +286,59 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 	if (flags & NVGPU_AS_MAP_BUFFER_FLAGS_FIXED_OFFSET)
 		map_offset = offset_align;
 
-	bfr.align = nvgpu_get_buffer_alignment(g, sgl, aperture);
+	align = nvgpu_get_buffer_alignment(g, sgt->sgl, aperture);
 	if (g->mm.disable_bigpage)
-		bfr.pgsz_idx = gmmu_page_size_small;
+		binfo.pgsz_idx = gmmu_page_size_small;
 	else
-		bfr.pgsz_idx = __get_pte_size(vm, map_offset,
-					      min_t(u64, bfr.size, bfr.align));
-	mapping_size = mapping_size ? mapping_size : bfr.size;
+		binfo.pgsz_idx = __get_pte_size(vm, map_offset,
+						min_t(u64, binfo.size, align));
+	mapping_size = mapping_size ? mapping_size : binfo.size;
 	mapping_size = ALIGN(mapping_size, SZ_4K);
 
-	if ((mapping_size > bfr.size) ||
-	    (buffer_offset > (bfr.size - mapping_size))) {
+	if ((mapping_size > binfo.size) ||
+	    (buffer_offset > (binfo.size - mapping_size))) {
 		err = -EINVAL;
 		goto clean_up;
 	}
 
 	/* Check if we should use a fixed offset for mapping this buffer */
 	if (flags & NVGPU_AS_MAP_BUFFER_FLAGS_FIXED_OFFSET) {
-		err = nvgpu_vm_area_validate_buffer(vm, offset_align, mapping_size,
-						    bfr.pgsz_idx, &vm_area);
+		err = nvgpu_vm_area_validate_buffer(vm,
+						    offset_align,
+						    mapping_size,
+						    binfo.pgsz_idx,
+						    &vm_area);
 		if (err)
 			goto clean_up;
 
 		map_offset = offset_align;
 		va_allocated = false;
-	} else
+	} else {
 		va_allocated = true;
+	}
 
-	err = setup_buffer_kind_and_compression(vm, flags, &bfr, bfr.pgsz_idx);
-	if (unlikely(err)) {
+	err = nvgpu_vm_compute_kind_and_compression(vm, &binfo);
+	if (err) {
 		nvgpu_err(g, "failure setting up kind and compression");
 		goto clean_up;
 	}
 
 	/* bar1 and pmu vm don't need ctag */
 	if (!vm->enable_ctag)
-		bfr.ctag_lines = 0;
+		binfo.ctag_lines = 0;
 
 	gk20a_get_comptags(dev, dmabuf, &comptags);
 
-	/* ensure alignment to compression page size if compression enabled */
-	if (bfr.ctag_offset)
-		mapping_size = ALIGN(mapping_size,
-				     g->ops.fb.compression_page_size(g));
-
-	if (bfr.ctag_lines && !comptags.lines) {
+	if (binfo.ctag_lines && !comptags.lines) {
 		/* allocate compression resources if needed */
 		err = gk20a_alloc_comptags(g, dev, dmabuf,
-					   ctag_allocator,
-					   bfr.ctag_lines);
-		if (unlikely(err)) {
+					   &g->gr.comp_tags,
+					   binfo.ctag_lines);
+		if (err) {
 			/* TBD: we can partially alloc ctags as well... */
-			if (bfr.use_uc_kind_v) {
+			if (binfo.use_uc_kind_v) {
 				/* no comptags, but fallback kind available */
-				bfr.kind_v = bfr.uc_kind_v;
+				binfo.kind_v = binfo.uc_kind_v;
 			} else {
 				nvgpu_err(g, "comptag alloc failed and no fallback kind specified");
 				goto clean_up;

@@ -479,12 +357,6 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 		}
 	}
 
-	/* store the comptag info */
-	bfr.ctag_offset = comptags.offset;
-	bfr.ctag_lines = comptags.lines;
-	bfr.ctag_allocated_lines = comptags.allocated_lines;
-	bfr.ctag_user_mappable = comptags.user_mappable;
-
 	/*
 	 * Calculate comptag index for this mapping. Differs in
 	 * case of partial mapping.

@@ -494,7 +366,7 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 	ctag_offset += buffer_offset >>
 		       ilog2(g->ops.fb.compression_page_size(g));
 
-	nvgpu_sgt = nvgpu_linux_sgt_create(g, bfr.sgt);
+	nvgpu_sgt = nvgpu_linux_sgt_create(g, sgt);
 
 	/* update gmmu ptes */
 	map_offset = g->ops.mm.gmmu_map(vm,

@@ -502,8 +374,8 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 					nvgpu_sgt,
 					buffer_offset, /* sg offset */
 					mapping_size,
-					bfr.pgsz_idx,
-					bfr.kind_v,
+					binfo.pgsz_idx,
+					binfo.kind_v,
 					ctag_offset,
 					flags, rw_flag,
 					clear_ctags,

@@ -522,13 +394,13 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 		goto clean_up;
 	}
 	mapped_buffer->dmabuf = dmabuf;
-	mapped_buffer->sgt = bfr.sgt;
+	mapped_buffer->sgt = sgt;
 	mapped_buffer->addr = map_offset;
 	mapped_buffer->size = mapping_size;
-	mapped_buffer->pgsz_idx = bfr.pgsz_idx;
-	mapped_buffer->ctag_offset = bfr.ctag_offset;
-	mapped_buffer->ctag_lines = bfr.ctag_lines;
-	mapped_buffer->ctag_allocated_lines = bfr.ctag_allocated_lines;
+	mapped_buffer->pgsz_idx = binfo.pgsz_idx;
+	mapped_buffer->ctag_offset = ctag_offset;
+	mapped_buffer->ctag_lines = binfo.ctag_lines;
+	mapped_buffer->ctag_allocated_lines = comptags.allocated_lines;
 	mapped_buffer->vm = vm;
 	mapped_buffer->flags = flags;
 	mapped_buffer->kind = map_key_kind;

@@ -557,9 +429,9 @@ u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 clean_up:
 	nvgpu_kfree(g, mapped_buffer);
 	if (va_allocated)
-		__nvgpu_vm_free_va(vm, map_offset, bfr.pgsz_idx);
-	if (!IS_ERR(bfr.sgt))
-		gk20a_mm_unpin(dev, dmabuf, bfr.sgt);
+		__nvgpu_vm_free_va(vm, map_offset, binfo.pgsz_idx);
+	if (!IS_ERR(sgt))
+		gk20a_mm_unpin(dev, dmabuf, sgt);
 
 	nvgpu_mutex_release(&vm->update_gmmu_lock);
 	nvgpu_log_info(g, "err=%d", err);
@@ -35,6 +35,7 @@
 
 #include "gk20a/gk20a.h"
 #include "gk20a/mm_gk20a.h"
+#include "gk20a/kind_gk20a.h"
 
 static void __nvgpu_vm_unmap(struct nvgpu_mapped_buf *mapped_buffer,
 			     struct vm_gk20a_mapping_batch *batch);

@@ -827,3 +828,124 @@ done:
 	nvgpu_mutex_release(&vm->update_gmmu_lock);
 	return;
 }
+
+int nvgpu_vm_init_kind_info(struct nvgpu_ctag_buffer_info *binfo,
+			    s16 compr_kind, s16 incompr_kind)
+{
+	if (binfo->flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL) {
+		/* were we supplied with a kind in either parameter? */
+		if ((compr_kind < 0 || compr_kind >= NV_KIND_ATTR_SIZE) &&
+		    (incompr_kind < 0 || incompr_kind >= NV_KIND_ATTR_SIZE))
+			return -EINVAL;
+
+		if (compr_kind != NV_KIND_INVALID) {
+			binfo->use_kind_v = true;
+			binfo->kind_v = (u8)compr_kind;
+		}
+
+		if (incompr_kind != NV_KIND_INVALID) {
+			binfo->use_uc_kind_v = true;
+			binfo->uc_kind_v = (u8)incompr_kind;
+		}
+	} else {
+		if (compr_kind < 0 || compr_kind >= NV_KIND_ATTR_SIZE)
+			return -EINVAL;
+
+		binfo->use_kind_v = true;
+		binfo->kind_v = (u8)compr_kind;
+
+		/*
+		 * Note: nvgpu_vm_kind_and_compression() will figure out
+		 * uc_kind_v or return an error.
+		 */
+	}
+
+	return 0;
+}
+
+static int nvgpu_vm_setup_kind_legacy(struct vm_gk20a *vm,
+				      struct nvgpu_ctag_buffer_info *binfo,
+				      bool *pkind_compressible)
+{
+	struct gk20a *g = gk20a_from_vm(vm);
+	bool kind_compressible;
+
+	if (unlikely(binfo->kind_v == g->ops.mm.get_kind_invalid()))
+		binfo->kind_v = g->ops.mm.get_kind_pitch();
+
+	if (unlikely(!gk20a_kind_is_supported(binfo->kind_v))) {
+		nvgpu_err(g, "kind 0x%x not supported", binfo->kind_v);
+		return -EINVAL;
+	}
+
+	binfo->uc_kind_v = g->ops.mm.get_kind_invalid();
+
+	/*
+	 * Find a suitable incompressible kind if it becomes necessary later.
+	 */
+	kind_compressible = gk20a_kind_is_compressible(binfo->kind_v);
+	if (kind_compressible) {
+		binfo->uc_kind_v = gk20a_get_uncompressed_kind(binfo->kind_v);
+		if (binfo->uc_kind_v == g->ops.mm.get_kind_invalid()) {
+			/*
+			 * Shouldn't happen, but it is worth cross-checking.
+			 */
+			nvgpu_err(g, "comptag kind 0x%x can't be"
+				  " downgraded to uncompressed kind",
+				  binfo->kind_v);
+			return -EINVAL;
+		}
+	}
+
+	*pkind_compressible = kind_compressible;
+
+	return 0;
+}
+
+int nvgpu_vm_compute_kind_and_compression(struct vm_gk20a *vm,
+					  struct nvgpu_ctag_buffer_info *binfo)
+{
+	bool kind_compressible;
+	struct gk20a *g = gk20a_from_vm(vm);
+	int ctag_granularity = g->ops.fb.compression_page_size(g);
+
+	if (!binfo->use_kind_v)
+		binfo->kind_v = g->ops.mm.get_kind_invalid();
+	if (!binfo->use_uc_kind_v)
+		binfo->uc_kind_v = g->ops.mm.get_kind_invalid();
+
+	if (binfo->flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL) {
+		kind_compressible = (binfo->kind_v !=
+				     g->ops.mm.get_kind_invalid());
+		if (!kind_compressible)
+			binfo->kind_v = binfo->uc_kind_v;
+	} else {
+		int err = nvgpu_vm_setup_kind_legacy(vm, binfo,
+						     &kind_compressible);
+
+		if (err)
+			return err;
+	}
+
+	/* comptags only supported for suitable kinds, 128KB pagesize */
+	if (kind_compressible &&
+	    vm->gmmu_page_sizes[binfo->pgsz_idx] <
+	    g->ops.fb.compressible_page_size(g)) {
+		/* it is safe to fall back to uncompressed as
+		   functionality is not harmed */
+		binfo->kind_v = binfo->uc_kind_v;
+		kind_compressible = false;
+	}
+
+	if (kind_compressible)
+		binfo->ctag_lines = DIV_ROUND_UP_ULL(binfo->size,
						     ctag_granularity);
+	else
+		binfo->ctag_lines = 0;
+
+	binfo->use_kind_v = (binfo->kind_v != g->ops.mm.get_kind_invalid());
+	binfo->use_uc_kind_v = (binfo->uc_kind_v !=
+				g->ops.mm.get_kind_invalid());
+
+	return 0;
+}
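
A usage note on nvgpu_vm_init_kind_info(), added above: it keeps the two modes
of the old setup_bfr_kind_fields(). The snippet below is illustrative only;
the kind values 0x01 and 0x02 are hypothetical stand-ins for any value in the
valid [0, NV_KIND_ATTR_SIZE) range, and example_kind_modes() is not part of
this patch.

/* Illustrative only: 0x01/0x02 stand in for real HW kind values. */
static void example_kind_modes(void)
{
	struct nvgpu_ctag_buffer_info direct = { 0 };
	struct nvgpu_ctag_buffer_info legacy = { 0 };

	/*
	 * DIRECT_KIND_CTRL mode: userspace may pass a compressible kind,
	 * an incompressible kind, or both; every argument that is not
	 * NV_KIND_INVALID is copied into the struct as-is.
	 */
	direct.flags = NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL;
	if (nvgpu_vm_init_kind_info(&direct, 0x01, 0x02) == 0) {
		/* direct.kind_v == 0x01 and direct.uc_kind_v == 0x02 here. */
	}

	/*
	 * Legacy mode: only compr_kind is consumed; the uncompressed
	 * fallback kind is derived later (or the map fails) inside
	 * nvgpu_vm_compute_kind_and_compression().
	 */
	legacy.flags = 0;
	if (nvgpu_vm_init_kind_info(&legacy, 0x01, NV_KIND_INVALID) == 0) {
		/* legacy.kind_v == 0x01; uc_kind_v is resolved later. */
	}
}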
@@ -38,21 +38,6 @@ struct vm_gk20a;
 struct vm_gk20a_mapping_batch;
 struct nvgpu_vm_area;
 
-struct buffer_attrs {
-	struct sg_table *sgt;
-	u64 size;
-	u64 align;
-	u32 ctag_offset;
-	u32 ctag_lines;
-	u32 ctag_allocated_lines;
-	int pgsz_idx;
-	u8 kind_v;
-	bool use_kind_v;
-	u8 uc_kind_v;
-	bool use_uc_kind_v;
-	bool ctag_user_mappable;
-};
-
 u64 nvgpu_vm_map_linux(struct vm_gk20a *vm,
 		       struct dma_buf *dmabuf,
 		       u64 offset_align,

@@ -104,9 +89,5 @@ int nvgpu_vm_find_buf(struct vm_gk20a *vm, u64 gpu_va,
 
 enum nvgpu_aperture gk20a_dmabuf_aperture(struct gk20a *g,
 					  struct dma_buf *dmabuf);
-int validate_fixed_buffer(struct vm_gk20a *vm,
-			  struct buffer_attrs *bfr,
-			  u64 map_offset, u64 map_size,
-			  struct nvgpu_vm_area **pva_node);
 
 #endif
@@ -122,6 +122,19 @@ mapped_buffer_from_rbtree_node(struct nvgpu_rbtree_node *node)
 		((uintptr_t)node - offsetof(struct nvgpu_mapped_buf, node));
 }
 
+struct nvgpu_ctag_buffer_info {
+	u64 size;
+	enum gmmu_pgsz_gk20a pgsz_idx;
+	u32 flags;
+
+	u8 kind_v;
+	u8 uc_kind_v;
+	bool use_kind_v;
+	bool use_uc_kind_v;
+
+	u32 ctag_lines;
+};
+
 struct vm_gk20a {
 	struct mm_gk20a *mm;
 	struct gk20a_as_share *as_share; /* as_share this represents */

@@ -189,6 +202,11 @@ void nvgpu_vm_put(struct vm_gk20a *vm);
 int vm_aspace_id(struct vm_gk20a *vm);
 int nvgpu_big_pages_possible(struct vm_gk20a *vm, u64 base, u64 size);
 
+int nvgpu_vm_init_kind_info(struct nvgpu_ctag_buffer_info *binfo,
+			    s16 compr_kind, s16 incompr_kind);
+int nvgpu_vm_compute_kind_and_compression(struct vm_gk20a *vm,
+					  struct nvgpu_ctag_buffer_info *binfo);
+
 /* batching eliminates redundant cache flushes and invalidates */
 void nvgpu_vm_mapping_batch_start(struct vm_gk20a_mapping_batch *batch);
 void nvgpu_vm_mapping_batch_finish(
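
Finally, a worked example of how the new ctag_lines field gets its value:
nvgpu_vm_compute_kind_and_compression() divides the buffer size by the
compression page size. The numbers below are assumptions for illustration
only; the real granularity is chip-specific and is queried through
g->ops.fb.compression_page_size().

/* Hypothetical numbers, only to illustrate the ctag_lines arithmetic. */
static u32 example_ctag_lines(void)
{
	u64 buf_size = 1024 * 1024;		/* a 1 MB compressible buffer */
	u64 ctag_granularity = 128 * 1024;	/* assume a 128 KB compression page */

	/* DIV_ROUND_UP_ULL(1 MB, 128 KB) == 8 comptag lines. */
	return DIV_ROUND_UP_ULL(buf_size, ctag_granularity);
}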