gpu: nvgpu: restructure gmmu cache maintenance

Move the logic that manages TLB invalidation and L2 flushes into
separate helper functions to keep the complexity manageable and to
make the logic easier to reuse.
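
For illustration, a minimal caller-side sketch of the batched pattern the
new helpers serve (sketch only: the example_* wrapper is hypothetical, and
nvgpu_vm_mapping_batch_start()/finish() and nvgpu_vm_unmap() are assumed
from the existing mapping-batch API, not part of this change). With a
non-NULL batch the helpers only record flags, so the L2 flush and TLB
invalidate run once per batch instead of once per map/unmap:

  /* Sketch only; names outside this change are assumptions. */
  static void example_unmap_many(struct vm_gk20a *vm, u64 *gpu_vas,
  		u32 count)
  {
  	struct vm_gk20a_mapping_batch batch;
  	u32 i;

  	/* Fresh batch: no maintenance flags set yet. */
  	nvgpu_vm_mapping_batch_start(&batch);

  	for (i = 0U; i < count; i++) {
  		/* Each unmap only sets batch.need_tlb_invalidate and
  		 * flushes L2 at most once (batch.gpu_l2_flushed). */
  		nvgpu_vm_unmap(vm, gpu_vas[i], &batch);
  	}

  	/* The finish path does the single deferred TLB invalidate. */
  	nvgpu_vm_mapping_batch_finish(vm, &batch);
  }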

Bug 200778663

Change-Id: Ib9dd79c1ec92933a59dc2c8e4cd3fa8355433bbe
Signed-off-by: Konsta Hölttä <kholtta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2604939
Reviewed-by: Alex Waterman <alexw@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
GVS: Gerrit_Virtual_Submit
Author:    Konsta Hölttä
Date:      2021-10-04 16:25:07 +03:00
Committer: mobile promotions
Parent:    243e52a771
Commit:    5e7d459927

@@ -811,6 +811,47 @@ static int nvgpu_gmmu_do_update_page_table(struct vm_gk20a *vm,
 	return err;
 }
 
+static int nvgpu_gmmu_cache_maint_map(struct gk20a *g, struct vm_gk20a *vm,
+		struct vm_gk20a_mapping_batch *batch)
+{
+	int err = 0;
+
+	if (batch == NULL) {
+		err = g->ops.fb.tlb_invalidate(g, vm->pdb.mem);
+		if (err != 0) {
+			nvgpu_err(g, "fb.tlb_invalidate() failed err=%d", err);
+		}
+	} else {
+		batch->need_tlb_invalidate = true;
+	}
+
+	return err;
+}
+
+static void nvgpu_gmmu_cache_maint_unmap(struct gk20a *g, struct vm_gk20a *vm,
+		struct vm_gk20a_mapping_batch *batch)
+{
+	int err;
+
+	if (batch == NULL) {
+		if (g->ops.mm.cache.l2_flush(g, true) != 0) {
+			nvgpu_err(g, "gk20a_mm_l2_flush[1] failed");
+		}
+		err = g->ops.fb.tlb_invalidate(g, vm->pdb.mem);
+		if (err != 0) {
+			nvgpu_err(g, "fb.tlb_invalidate() failed err=%d", err);
+		}
+	} else {
+		if (!batch->gpu_l2_flushed) {
+			if (g->ops.mm.cache.l2_flush(g, true) != 0) {
+				nvgpu_err(g, "gk20a_mm_l2_flush[2] failed");
+			}
+			batch->gpu_l2_flushed = true;
+		}
+		batch->need_tlb_invalidate = true;
+	}
+}
+
 /*
  * This is the true top level GMMU mapping logic. This breaks down the incoming
  * scatter gather table and does actual programming of GPU virtual address to
@@ -1003,15 +1044,10 @@ u64 nvgpu_gmmu_map_locked(struct vm_gk20a *vm,
 		goto fail_validate;
 	}
 
-	if (batch == NULL) {
-		err = g->ops.fb.tlb_invalidate(g, vm->pdb.mem);
-		if (err != 0) {
-			nvgpu_err(g, "fb.tlb_invalidate() failed err=%d", err);
-			goto fail_validate;
-		}
-	} else {
-		batch->need_tlb_invalidate = true;
-	}
+	err = nvgpu_gmmu_cache_maint_map(g, vm, batch);
+	if (err != 0) {
+		goto fail_validate;
+	}
 
 	return vaddr;
 
@@ -1066,23 +1102,7 @@ void nvgpu_gmmu_unmap_locked(struct vm_gk20a *vm,
 		nvgpu_err(g, "failed to update gmmu ptes on unmap");
 	}
 
-	if (batch == NULL) {
-		if (g->ops.mm.cache.l2_flush(g, true) != 0) {
-			nvgpu_err(g, "gk20a_mm_l2_flush[1] failed");
-		}
-		err = g->ops.fb.tlb_invalidate(g, vm->pdb.mem);
-		if (err != 0) {
-			nvgpu_err(g, "fb.tlb_invalidate() failed err=%d", err);
-		}
-	} else {
-		if (!batch->gpu_l2_flushed) {
-			if (g->ops.mm.cache.l2_flush(g, true) != 0) {
-				nvgpu_err(g, "gk20a_mm_l2_flush[2] failed");
-			}
-			batch->gpu_l2_flushed = true;
-		}
-		batch->need_tlb_invalidate = true;
-	}
+	nvgpu_gmmu_cache_maint_unmap(g, vm, batch);
 }
 
 u32 nvgpu_pte_words(struct gk20a *g)
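
For completeness (not part of the diff above), a hedged sketch of where the
deferred flags are expected to be consumed once a batch is finished; the
function below is illustrative only and stands in for the pre-existing
mapping-batch finish logic:

  /* Illustrative stand-in for the existing batch-finish path. */
  static void example_batch_finish(struct vm_gk20a *vm,
  		struct vm_gk20a_mapping_batch *batch)
  {
  	struct gk20a *g = gk20a_from_vm(vm); /* assumed existing helper */

  	if (batch->need_tlb_invalidate) {
  		/* The single TLB invalidate deferred by the helpers above. */
  		if (g->ops.fb.tlb_invalidate(g, vm->pdb.mem) != 0) {
  			nvgpu_err(g, "fb.tlb_invalidate() failed");
  		}
  		batch->need_tlb_invalidate = false;
  	}
  }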