From cc74fd93039d1ec007983a526cb11964e4fd6167 Mon Sep 17 00:00:00 2001
From: Seshendra Gadagottu <sgadagottu@nvidia.com>
Date: Fri, 1 Mar 2019 14:18:51 -0800
Subject: [PATCH] gpu: nvgpu: unify cbc_init in cbc and fb units

Pre-volta, cbc config is part of hw ltc and from volta onwards this is
moved to hw fb. Because of this, cbc_init functions are present in both
cbc unit and fb unit. Pre-volta uses cbc_init from cbc unit and from
volta onwards it uses cbc_init from fb unit.

With this patch, unified two cbc_init functions to cbc unit and created
new fb hal for cbc_configure. cbc unit uses fb hal for cbc_config and
fb unit is independent of cbc unit.

JIRA NVGPU-2897

Change-Id: Ib62f0b08547b031bcb5011c837e43c74931a22fe
Signed-off-by: Seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/2030906
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/Makefile                    |  1 +
 drivers/gpu/nvgpu/Makefile.sources            |  1 +
 drivers/gpu/nvgpu/common/fb/fb_gv11b.c        |  8 +---
 drivers/gpu/nvgpu/common/fb/fb_gv11b.h        |  4 +-
 drivers/gpu/nvgpu/common/fb/fb_tu104.c        |  4 +-
 drivers/gpu/nvgpu/common/fb/fb_tu104.h        |  2 +-
 .../nvgpu/common/vgpu/gv11b/vgpu_hal_gv11b.c  |  1 -
 drivers/gpu/nvgpu/gk20a/gr_gk20a.c            |  4 --
 drivers/gpu/nvgpu/gv11b/hal_gv11b.c           |  5 ++-
 drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.c         | 45 +++++++++++++++++++
 drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.h         | 30 +++++++++++++
 drivers/gpu/nvgpu/hal/cbc/cbc_tu104.c         | 12 ++++-
 drivers/gpu/nvgpu/hal/cbc/cbc_tu104.h         |  1 +
 drivers/gpu/nvgpu/include/nvgpu/gk20a.h       |  2 +-
 drivers/gpu/nvgpu/tu104/hal_tu104.c           |  6 +--
 15 files changed, 101 insertions(+), 25 deletions(-)
 create mode 100644 drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.c
 create mode 100644 drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.h

diff --git a/drivers/gpu/nvgpu/Makefile b/drivers/gpu/nvgpu/Makefile
index cc76de2a3..17ae2685b 100644
--- a/drivers/gpu/nvgpu/Makefile
+++ b/drivers/gpu/nvgpu/Makefile
@@ -180,6 +180,7 @@ nvgpu-y += \
 	hal/power_features/cg/tu104_gating_reglist.o \
 	hal/cbc/cbc_gm20b.o \
 	hal/cbc/cbc_gp10b.o \
+	hal/cbc/cbc_gv11b.o \
 	hal/cbc/cbc_tu104.o \
 	hal/fuse/fuse_gm20b.o \
 	hal/fuse/fuse_gp10b.o \
diff --git a/drivers/gpu/nvgpu/Makefile.sources b/drivers/gpu/nvgpu/Makefile.sources
index 393049b8b..24908e959 100644
--- a/drivers/gpu/nvgpu/Makefile.sources
+++ b/drivers/gpu/nvgpu/Makefile.sources
@@ -346,6 +346,7 @@ srcs += common/sim.c \
 	hal/power_features/cg/tu104_gating_reglist.c \
 	hal/cbc/cbc_gm20b.c \
 	hal/cbc/cbc_gp10b.c \
+	hal/cbc/cbc_gv11b.c \
 	hal/cbc/cbc_tu104.c \
 	hal/fuse/fuse_gm20b.c \
 	hal/fuse/fuse_gp10b.c \
diff --git a/drivers/gpu/nvgpu/common/fb/fb_gv11b.c b/drivers/gpu/nvgpu/common/fb/fb_gv11b.c
index 378b6005d..17e0a0a3f 100644
--- a/drivers/gpu/nvgpu/common/fb/fb_gv11b.c
+++ b/drivers/gpu/nvgpu/common/fb/fb_gv11b.c
@@ -121,11 +121,8 @@ void gv11b_fb_init_fs_state(struct gk20a *g)
 	}
 }
 
-void gv11b_fb_init_cbc(struct gk20a *g, struct gr_gk20a *gr)
+void gv11b_fb_cbc_configure(struct gk20a *g, struct gr_gk20a *gr)
 {
-	u32 max_size = gr->max_comptag_mem;
-	/* one tag line covers 64KB */
-	u32 max_comptag_lines = max_size << 4;
 	u32 compbit_base_post_divide;
 	u64 compbit_base_post_multiply64;
 	u64 compbit_store_iova;
@@ -172,9 +169,6 @@ void gv11b_fb_init_cbc(struct gk20a *g, struct gr_gk20a *gr)
 
 	gr->compbit_store.base_hw = compbit_base_post_divide;
 
-	g->ops.cbc.ctrl(g, gk20a_cbc_op_invalidate,
-			0, max_comptag_lines - 1U);
-
 }
 
 static const char * const invalid_str = "invalid";
diff --git a/drivers/gpu/nvgpu/common/fb/fb_gv11b.h b/drivers/gpu/nvgpu/common/fb/fb_gv11b.h
index 66bf8e2c7..1c68ff222 100644
--- a/drivers/gpu/nvgpu/common/fb/fb_gv11b.h
+++ b/drivers/gpu/nvgpu/common/fb/fb_gv11b.h
@@ -1,7 +1,7 @@
 /*
  * GV11B FB
  *
- * Copyright (c) 2016-2018, NVIDIA CORPORATION.  All rights reserved.
+ * Copyright (c) 2016-2019, NVIDIA CORPORATION.  All rights reserved.
  *
  * Permission is hereby granted, free of charge, to any person obtaining a
  * copy of this software and associated documentation files (the "Software"),
@@ -34,7 +34,7 @@ struct gr_gk20a;
 void gv11b_fb_init_hw(struct gk20a *g);
 
 void gv11b_fb_init_fs_state(struct gk20a *g);
-void gv11b_fb_init_cbc(struct gk20a *g, struct gr_gk20a *gr);
+void gv11b_fb_cbc_configure(struct gk20a *g, struct gr_gk20a *gr);
 void gv11b_fb_reset(struct gk20a *g);
 void gv11b_fb_hub_isr(struct gk20a *g);
 
diff --git a/drivers/gpu/nvgpu/common/fb/fb_tu104.c b/drivers/gpu/nvgpu/common/fb/fb_tu104.c
index d414ce708..d883262b8 100644
--- a/drivers/gpu/nvgpu/common/fb/fb_tu104.c
+++ b/drivers/gpu/nvgpu/common/fb/fb_tu104.c
@@ -424,7 +424,7 @@ int fb_tu104_mmu_invalidate_replay(struct gk20a *g,
 	return err;
 }
 
-void fb_tu104_init_cbc(struct gk20a *g, struct gr_gk20a *gr)
+void tu104_fb_cbc_configure(struct gk20a *g, struct gr_gk20a *gr)
 {
 	u64 base_divisor;
 	u64 compbit_store_base;
@@ -466,8 +466,6 @@ void fb_tu104_init_cbc(struct gk20a *g, struct gr_gk20a *gr)
 
 	gr->compbit_store.base_hw = compbit_store_base;
 
-	g->ops.cbc.ctrl(g, gk20a_cbc_op_invalidate,
-			0, gr->max_comptag_lines - 1U);
 }
 
 static int tu104_fb_wait_mmu_bind(struct gk20a *g)
diff --git a/drivers/gpu/nvgpu/common/fb/fb_tu104.h b/drivers/gpu/nvgpu/common/fb/fb_tu104.h
index a81a08ecf..68d4ad52b 100644
--- a/drivers/gpu/nvgpu/common/fb/fb_tu104.h
+++ b/drivers/gpu/nvgpu/common/fb/fb_tu104.h
@@ -55,7 +55,7 @@ int fb_tu104_tlb_invalidate(struct gk20a *g, struct nvgpu_mem *pdb);
 int fb_tu104_mmu_invalidate_replay(struct gk20a *g,
 	u32 invalidate_replay_val);
 
-void fb_tu104_init_cbc(struct gk20a *g, struct gr_gk20a *gr);
+void tu104_fb_cbc_configure(struct gk20a *g, struct gr_gk20a *gr);
 
 int tu104_fb_apply_pdb_cache_war(struct gk20a *g);
 size_t tu104_fb_get_vidmem_size(struct gk20a *g);
diff --git a/drivers/gpu/nvgpu/common/vgpu/gv11b/vgpu_hal_gv11b.c b/drivers/gpu/nvgpu/common/vgpu/gv11b/vgpu_hal_gv11b.c
index 17d5a4c72..bbad8ed64 100644
--- a/drivers/gpu/nvgpu/common/vgpu/gv11b/vgpu_hal_gv11b.c
+++ b/drivers/gpu/nvgpu/common/vgpu/gv11b/vgpu_hal_gv11b.c
@@ -365,7 +365,6 @@ static const struct gpu_ops vgpu_gv11b_ops = {
 	.fb = {
 		.init_hw = NULL,
 		.init_fs_state = NULL,
-		.init_cbc = NULL,
 		.set_mmu_page_size = NULL,
 		.set_use_full_comp_tag_line = NULL,
 		.compression_page_size = gp10b_fb_compression_page_size,
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index 49ac09014..108155222 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -2815,10 +2815,6 @@ static int gk20a_init_gr_setup_hw(struct gk20a *g)
 		g->ops.cbc.init(g, gr);
 	}
 
-	if (g->ops.fb.init_cbc != NULL) {
-		g->ops.fb.init_cbc(g, gr);
-	}
-
 	if (g->ops.gr.disable_rd_coalesce != NULL) {
 		g->ops.gr.disable_rd_coalesce(g);
 	}
diff --git a/drivers/gpu/nvgpu/gv11b/hal_gv11b.c b/drivers/gpu/nvgpu/gv11b/hal_gv11b.c
index 7e2d8e48c..25dd73172 100644
--- a/drivers/gpu/nvgpu/gv11b/hal_gv11b.c
+++ b/drivers/gpu/nvgpu/gv11b/hal_gv11b.c
@@ -33,6 +33,7 @@
 #include "hal/power_features/cg/gv11b_gating_reglist.h"
 #include "hal/cbc/cbc_gm20b.h"
 #include "hal/cbc/cbc_gp10b.h"
+#include "hal/cbc/cbc_gv11b.h"
 #include "hal/fuse/fuse_gm20b.h"
 #include "hal/fuse/fuse_gp10b.h"
 
@@ -290,7 +291,7 @@ static const struct gpu_ops gv11b_ops = {
 		.split_ltc_broadcast_addr = gm20b_ltc_split_ltc_broadcast_addr,
 	},
 	.cbc = {
-		.init = NULL,
+		.init = gv11b_cbc_init,
 		.alloc_comptags = gp10b_cbc_alloc_comptags,
 		.ctrl = gp10b_cbc_ctrl,
 	},
@@ -567,7 +568,7 @@ static const struct gpu_ops gv11b_ops = {
 	.fb = {
 		.init_hw = gv11b_fb_init_hw,
 		.init_fs_state = gv11b_fb_init_fs_state,
-		.init_cbc = gv11b_fb_init_cbc,
+		.cbc_configure = gv11b_fb_cbc_configure,
 		.set_mmu_page_size = NULL,
 		.set_use_full_comp_tag_line =
 			gm20b_fb_set_use_full_comp_tag_line,
diff --git a/drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.c b/drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.c
new file mode 100644
index 000000000..e895a3704
--- /dev/null
+++ b/drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.c
@@ -0,0 +1,45 @@
+/*
+ * GP10B CBC
+ *
+ * Copyright (c) 2019, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+
+
+#include <nvgpu/cbc.h>
+#include <nvgpu/log.h>
+#include <nvgpu/gk20a.h>
+
+#include "cbc_gv11b.h"
+
+void gv11b_cbc_init(struct gk20a *g, struct gr_gk20a *gr)
+{
+	u32 max_size = gr->max_comptag_mem;
+	/* one tag line covers 64KB */
+	u32 max_comptag_lines = max_size << 4;
+
+	nvgpu_log_fn(g, " ");
+
+	g->ops.fb.cbc_configure(g, gr);
+
+	g->ops.cbc.ctrl(g, gk20a_cbc_op_invalidate,
+			0, max_comptag_lines - 1U);
+
+}
diff --git a/drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.h b/drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.h
new file mode 100644
index 000000000..3bc33c528
--- /dev/null
+++ b/drivers/gpu/nvgpu/hal/cbc/cbc_gv11b.h
@@ -0,0 +1,30 @@
+/*
+ * Copyright (c) 2019, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+
+#ifndef CBC_GV11B_H
+#define CBC_GV11B_H
+struct gk20a;
+struct gpu_ops;
+
+void gv11b_cbc_init(struct gk20a *g, struct gr_gk20a *gr);
+
+#endif
diff --git a/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.c b/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.c
index 64470ff8c..8b144e8a0 100644
--- a/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.c
+++ b/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.c
@@ -30,11 +30,12 @@
 
 #include <trace/events/gk20a.h>
 
+#include <nvgpu/hw/tu104/hw_ltc_tu104.h>
+
 #include "cbc_tu104.h"
 
 #include "common/ltc/ltc_gv11b.h"
 
-#include <nvgpu/hw/tu104/hw_ltc_tu104.h>
 
 u64 tu104_cbc_get_base_divisor(struct gk20a *g)
 {
@@ -216,3 +217,12 @@ out:
 	nvgpu_mutex_release(&g->mm.l2_op_lock);
 	return err;
 }
+
+void tu104_cbc_init(struct gk20a *g, struct gr_gk20a *gr)
+{
+
+	g->ops.fb.cbc_configure(g, gr);
+
+	g->ops.cbc.ctrl(g, gk20a_cbc_op_invalidate,
+			0, gr->max_comptag_lines - 1U);
+}
diff --git a/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.h b/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.h
index 0c3a94f28..ea058b7fc 100644
--- a/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.h
+++ b/drivers/gpu/nvgpu/hal/cbc/cbc_tu104.h
@@ -33,5 +33,6 @@ u64 tu104_cbc_get_base_divisor(struct gk20a *g);
 int tu104_cbc_alloc_comptags(struct gk20a *g, struct gr_gk20a *gr);
 int tu104_cbc_ctrl(struct gk20a *g, enum gk20a_cbc_op op,
 		       u32 min, u32 max);
+void tu104_cbc_init(struct gk20a *g, struct gr_gk20a *gr);
 
 #endif
diff --git a/drivers/gpu/nvgpu/include/nvgpu/gk20a.h b/drivers/gpu/nvgpu/include/nvgpu/gk20a.h
index 84936f6e1..8cd6c7729 100644
--- a/drivers/gpu/nvgpu/include/nvgpu/gk20a.h
+++ b/drivers/gpu/nvgpu/include/nvgpu/gk20a.h
@@ -658,7 +658,7 @@ struct gpu_ops {
 	} gr;
 	struct {
 		void (*init_hw)(struct gk20a *g);
-		void (*init_cbc)(struct gk20a *g, struct gr_gk20a *gr);
+		void (*cbc_configure)(struct gk20a *g, struct gr_gk20a *gr);
 		void (*init_fs_state)(struct gk20a *g);
 		void (*init_uncompressed_kind_map)(struct gk20a *g);
 		void (*init_kind_attr)(struct gk20a *g);
diff --git a/drivers/gpu/nvgpu/tu104/hal_tu104.c b/drivers/gpu/nvgpu/tu104/hal_tu104.c
index 6b9a417de..bbbaa2479 100644
--- a/drivers/gpu/nvgpu/tu104/hal_tu104.c
+++ b/drivers/gpu/nvgpu/tu104/hal_tu104.c
@@ -356,7 +356,7 @@ static const struct gpu_ops tu104_ops = {
 		.split_ltc_broadcast_addr = gm20b_ltc_split_ltc_broadcast_addr,
 	},
 	.cbc = {
-		.init = NULL,
+		.init = tu104_cbc_init,
 		.get_base_divisor = tu104_cbc_get_base_divisor,
 		.alloc_comptags = tu104_cbc_alloc_comptags,
 		.ctrl = tu104_cbc_ctrl,
@@ -637,7 +637,7 @@ static const struct gpu_ops tu104_ops = {
 	.fb = {
 		.init_hw = gv11b_fb_init_hw,
 		.init_fs_state = gp106_fb_init_fs_state,
-		.init_cbc = fb_tu104_init_cbc,
+		.cbc_configure = tu104_fb_cbc_configure,
 		.set_mmu_page_size = NULL,
 		.set_use_full_comp_tag_line =
 			gm20b_fb_set_use_full_comp_tag_line,
@@ -1318,9 +1318,9 @@ int tu104_init_hal(struct gk20a *g)
 	/* dGpu VDK support */
 	if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)){
 		/* Disable compression */
+		gops->cbc.init = NULL;
 		gops->cbc.ctrl = NULL;
 		gops->cbc.alloc_comptags = NULL;
-		gops->fb.init_cbc = NULL;
 
 		gops->gr.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode;