gpu: nvgpu: load context image from gr/ctx unit
We currently load and create a new graphics context image in
gr_gk20a_load_golden_ctx_image(). This API first loads the local golden
image into the new context image and then initializes the context
appropriately by calling the g->ops.gr.ctxsw_prog() HALs.

Move this sequence to the gr/ctx unit and rename the API to
nvgpu_gr_ctx_load_golden_ctx_image().

Note that the call to g->ops.gr.update_ctxsw_preemption_mode() is moved
out of this API and is now called directly from gk20a_alloc_obj_ctx().

Jira NVGPU-1527

Change-Id: Id5a5b2cd2c0704fbefe536d581a37a60ec185ea9
Signed-off-by: Deepak Nibade <dnibade@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1989157
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svc-mobile-misra <svc-mobile-misra@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
committed by mobile promotions

parent f048bb5a71
commit 58bc18b794
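In short, callers that previously used the gk20a-specific loader now call the renamed gr/ctx unit helper and issue the preemption-mode update themselves. A condensed sketch of the call-site change in gk20a_alloc_obj_ctx(), with only the lines touched by this change (error handling and surrounding setup elided; see the full diff below):

	/* before: the gk20a-specific helper resolved the golden image from
	 * g->gr and the CDE flag from the channel internally, and also
	 * updated the ctxsw preemption mode */
	gr_gk20a_load_golden_ctx_image(g, c, gr_ctx);

	/* after: the gr/ctx unit helper is passed the golden image and the
	 * CDE flag explicitly ... */
	nvgpu_gr_ctx_load_golden_ctx_image(g, gr_ctx,
		g->gr.local_golden_image, c->cde);

	/* ... and the preemption-mode update is issued by the caller */
	if (g->ops.gr.update_ctxsw_preemption_mode != NULL) {
		g->ops.gr.update_ctxsw_preemption_mode(g, gr_ctx,
			&c->ctx_header);
	}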
@@ -458,3 +458,73 @@ u64 nvgpu_gr_ctx_get_global_ctx_va(struct nvgpu_gr_ctx *gr_ctx,
 {
 	return gr_ctx->global_ctx_buffer_va[index];
 }
+
+/* load saved fresh copy of gloden image into channel gr_ctx */
+int nvgpu_gr_ctx_load_golden_ctx_image(struct gk20a *g,
+	struct nvgpu_gr_ctx *gr_ctx,
+	struct nvgpu_gr_global_ctx_local_golden_image *local_golden_image,
+	bool cde)
+{
+	u64 virt_addr = 0;
+	struct nvgpu_mem *mem;
+
+	nvgpu_log_fn(g, " ");
+
+	mem = &gr_ctx->mem;
+
+	nvgpu_gr_global_ctx_load_local_golden_image(g,
+		local_golden_image, mem);
+
+	if (g->ops.gr.ctxsw_prog.init_ctxsw_hdr_data != NULL) {
+		g->ops.gr.ctxsw_prog.init_ctxsw_hdr_data(g, mem);
+	}
+
+	if ((g->ops.gr.ctxsw_prog.set_cde_enabled != NULL) && cde) {
+		g->ops.gr.ctxsw_prog.set_cde_enabled(g, mem);
+	}
+
+	/* set priv access map */
+	g->ops.gr.ctxsw_prog.set_priv_access_map_config_mode(g, mem,
+		g->allow_all);
+	g->ops.gr.ctxsw_prog.set_priv_access_map_addr(g, mem,
+		nvgpu_gr_ctx_get_global_ctx_va(gr_ctx,
+			NVGPU_GR_CTX_PRIV_ACCESS_MAP_VA));
+
+	/* disable verif features */
+	g->ops.gr.ctxsw_prog.disable_verif_features(g, mem);
+
+	if (g->ops.gr.ctxsw_prog.set_pmu_options_boost_clock_frequencies !=
+			NULL) {
+		g->ops.gr.ctxsw_prog.set_pmu_options_boost_clock_frequencies(g,
+			mem, gr_ctx->boosted_ctx);
+	}
+
+	nvgpu_log(g, gpu_dbg_info, "write patch count = %d",
+		gr_ctx->patch_ctx.data_count);
+	g->ops.gr.ctxsw_prog.set_patch_count(g, mem,
+		gr_ctx->patch_ctx.data_count);
+	g->ops.gr.ctxsw_prog.set_patch_addr(g, mem,
+		gr_ctx->patch_ctx.mem.gpu_va);
+
+	/* Update main header region of the context buffer with the info needed
+	 * for PM context switching, including mode and possibly a pointer to
+	 * the PM backing store.
+	 */
+	if (gr_ctx->pm_ctx.pm_mode !=
+			g->ops.gr.ctxsw_prog.hw_get_pm_mode_no_ctxsw()) {
+		if (gr_ctx->pm_ctx.mem.gpu_va == 0ULL) {
+			nvgpu_err(g,
+				"context switched pm with no pm buffer!");
+			return -EFAULT;
+		}
+
+		virt_addr = gr_ctx->pm_ctx.mem.gpu_va;
+	} else {
+		virt_addr = 0;
+	}
+
+	g->ops.gr.ctxsw_prog.set_pm_mode(g, mem, gr_ctx->pm_ctx.pm_mode);
+	g->ops.gr.ctxsw_prog.set_pm_ptr(g, mem, virt_addr);
+
+	return 0;
+}
@@ -1668,80 +1668,6 @@ int gr_gk20a_update_hwpm_ctxsw_mode(struct gk20a *g,
 	return 0;
 }
 
-/* load saved fresh copy of gloden image into channel gr_ctx */
-int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
-	struct channel_gk20a *c,
-	struct nvgpu_gr_ctx *gr_ctx)
-{
-	struct gr_gk20a *gr = &g->gr;
-	u64 virt_addr = 0;
-	struct nvgpu_mem *mem;
-
-	nvgpu_log_fn(g, " ");
-
-	mem = &gr_ctx->mem;
-
-	nvgpu_gr_global_ctx_load_local_golden_image(g,
-		gr->local_golden_image, mem);
-
-	if (g->ops.gr.ctxsw_prog.init_ctxsw_hdr_data != NULL) {
-		g->ops.gr.ctxsw_prog.init_ctxsw_hdr_data(g, mem);
-	}
-
-	if ((g->ops.gr.ctxsw_prog.set_cde_enabled != NULL) && c->cde) {
-		g->ops.gr.ctxsw_prog.set_cde_enabled(g, mem);
-	}
-
-	/* set priv access map */
-	g->ops.gr.ctxsw_prog.set_priv_access_map_config_mode(g, mem,
-		g->allow_all);
-	g->ops.gr.ctxsw_prog.set_priv_access_map_addr(g, mem,
-		nvgpu_gr_ctx_get_global_ctx_va(gr_ctx,
-			NVGPU_GR_CTX_PRIV_ACCESS_MAP_VA));
-
-	/* disable verif features */
-	g->ops.gr.ctxsw_prog.disable_verif_features(g, mem);
-
-	if (g->ops.gr.update_ctxsw_preemption_mode != NULL) {
-		g->ops.gr.update_ctxsw_preemption_mode(g, gr_ctx, &c->ctx_header);
-	}
-
-	if (g->ops.gr.ctxsw_prog.set_pmu_options_boost_clock_frequencies !=
-			NULL) {
-		g->ops.gr.ctxsw_prog.set_pmu_options_boost_clock_frequencies(g,
-			mem, gr_ctx->boosted_ctx);
-	}
-
-	nvgpu_log(g, gpu_dbg_info, "write patch count = %d",
-		gr_ctx->patch_ctx.data_count);
-	g->ops.gr.ctxsw_prog.set_patch_count(g, mem,
-		gr_ctx->patch_ctx.data_count);
-	g->ops.gr.ctxsw_prog.set_patch_addr(g, mem,
-		gr_ctx->patch_ctx.mem.gpu_va);
-
-	/* Update main header region of the context buffer with the info needed
-	 * for PM context switching, including mode and possibly a pointer to
-	 * the PM backing store.
-	 */
-	if (gr_ctx->pm_ctx.pm_mode !=
-			g->ops.gr.ctxsw_prog.hw_get_pm_mode_no_ctxsw()) {
-		if (gr_ctx->pm_ctx.mem.gpu_va == 0ULL) {
-			nvgpu_err(g,
-				"context switched pm with no pm buffer!");
-			return -EFAULT;
-		}
-
-		virt_addr = gr_ctx->pm_ctx.mem.gpu_va;
-	} else {
-		virt_addr = 0;
-	}
-
-	g->ops.gr.ctxsw_prog.set_pm_mode(g, mem, gr_ctx->pm_ctx.pm_mode);
-	g->ops.gr.ctxsw_prog.set_pm_ptr(g, mem, virt_addr);
-
-	return 0;
-}
-
 static void gr_gk20a_start_falcon_ucode(struct gk20a *g)
 {
 	nvgpu_log_fn(g, " ");
@@ -2476,12 +2402,19 @@ int gk20a_alloc_obj_ctx(struct channel_gk20a *c, u32 class_num, u32 flags)
 		}
 
 		/* load golden image */
-		gr_gk20a_load_golden_ctx_image(g, c, gr_ctx);
+		nvgpu_gr_ctx_load_golden_ctx_image(g, gr_ctx,
+			g->gr.local_golden_image, c->cde);
 		if (err != 0) {
 			nvgpu_err(g,
 				"fail to load golden ctx image");
 			goto out;
 		}
 
+		if (g->ops.gr.update_ctxsw_preemption_mode != NULL) {
+			g->ops.gr.update_ctxsw_preemption_mode(g, gr_ctx,
+				&c->ctx_header);
+		}
+
 #ifdef CONFIG_GK20A_CTXSW_TRACE
 		if (g->ops.fecs_trace.bind_channel && !c->vpr) {
 			err = g->ops.fecs_trace.bind_channel(g, c, 0, gr_ctx);
@@ -457,9 +457,6 @@ struct gpu_ops;
 int gr_gk20a_init_golden_ctx_image(struct gk20a *g,
 	struct channel_gk20a *c,
 	struct nvgpu_gr_ctx *gr_ctx);
-int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
-	struct channel_gk20a *c,
-	struct nvgpu_gr_ctx *gr_ctx);
 void gk20a_init_gr(struct gk20a *g);
 int gk20a_init_gr_support(struct gk20a *g);
 int gk20a_enable_gr_hw(struct gk20a *g);
@@ -153,4 +153,9 @@ int nvgpu_gr_ctx_map_global_ctx_buffers(struct gk20a *g,
 u64 nvgpu_gr_ctx_get_global_ctx_va(struct nvgpu_gr_ctx *gr_ctx,
 	enum nvgpu_gr_ctx_global_ctx_va index);
 
+int nvgpu_gr_ctx_load_golden_ctx_image(struct gk20a *g,
+	struct nvgpu_gr_ctx *gr_ctx,
+	struct nvgpu_gr_global_ctx_local_golden_image *local_golden_image,
+	bool cde);
+
 #endif /* NVGPU_INCLUDE_GR_CTX_H */