From 00203b42f2ffccd7d947c1e631595e709f5401c4 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Konsta=20H=C3=B6ltt=C3=A4?=
Date: Fri, 3 Apr 2020 15:12:16 +0300
Subject: [PATCH] gpu: nvgpu: split add_sema_cmd to wait and incr
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The internal add_sema_cmd() used when making cmd buf entries has so
many branches it makes sense to split it at the bool acquire flag into
two functions. The wait part doesn't even need the wfi flag, and the
incr part doesn't need offset.

Jira NVGPU-4548

Change-Id: Iab26b9bc14564e2958935ab7ffda03aa873dd9b1
Signed-off-by: Konsta Hölttä
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2323320
(cherry picked from commit 9fe2830aa9ee2b0b165edc959defa74dfb49c6ba)
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2328410
Reviewed-by: automaticguardword
Reviewed-by: svc-mobile-coverity
Reviewed-by: Alex Waterman
Reviewed-by: mobile promotions
GVS: Gerrit_Virtual_Submit
Tested-by: mobile promotions
---
 .../common/sync/channel_sync_semaphore.c      | 68 +++++++++----------
 1 file changed, 34 insertions(+), 34 deletions(-)

diff --git a/drivers/gpu/nvgpu/common/sync/channel_sync_semaphore.c b/drivers/gpu/nvgpu/common/sync/channel_sync_semaphore.c
index 9fa79c2e6..02ea03230 100644
--- a/drivers/gpu/nvgpu/common/sync/channel_sync_semaphore.c
+++ b/drivers/gpu/nvgpu/common/sync/channel_sync_semaphore.c
@@ -56,44 +56,44 @@ nvgpu_channel_sync_semaphore_from_base(struct nvgpu_channel_sync *base)
 		offsetof(struct nvgpu_channel_sync_semaphore, base));
 }
 
-static void add_sema_cmd(struct gk20a *g, struct nvgpu_channel *c,
+static void add_sema_wait_cmd(struct gk20a *g, struct nvgpu_channel *c,
 	struct nvgpu_semaphore *s, struct priv_cmd_entry *cmd,
-	u32 offset, bool acquire, bool wfi)
+	u32 offset)
 {
 	int ch = c->chid;
 	u64 va;
 
-	/*
-	 * RO for acquire (since we just need to read the mem) and RW for
-	 * release since we will need to write back to the semaphore memory.
-	 */
-	va = acquire ? nvgpu_semaphore_gpu_ro_va(s) :
-		nvgpu_semaphore_gpu_rw_va(s);
+	/* acquire just needs to read the mem. */
+	va = nvgpu_semaphore_gpu_ro_va(s);
 
-	/*
-	 * If the op is not an acquire (so therefor a release) we should
-	 * incr the underlying sema next_value.
-	 */
-	if (!acquire) {
-		nvgpu_semaphore_prepare(s, c->hw_sema);
-	}
+	g->ops.sync.sema.add_wait_cmd(g, cmd, offset, s, va);
+	gpu_sema_verbose_dbg(g, "(A) c=%d ACQ_GE %-4u pool=%-3llu"
+			"va=0x%llx cmd_mem=0x%llx b=0x%llx off=%u",
+			ch, nvgpu_semaphore_get_value(s),
+			nvgpu_semaphore_get_hw_pool_page_idx(s),
+			va, cmd->gva, cmd->mem->gpu_va, offset);
+}
 
-	if (acquire) {
-		g->ops.sync.sema.add_wait_cmd(g, cmd, offset, s, va);
-		gpu_sema_verbose_dbg(g, "(A) c=%d ACQ_GE %-4u pool=%-3llu"
-			"va=0x%llx cmd_mem=0x%llx b=0x%llx off=%u",
-			ch, nvgpu_semaphore_get_value(s),
-			nvgpu_semaphore_get_hw_pool_page_idx(s),
-			va, cmd->gva, cmd->mem->gpu_va, offset);
-	} else {
-		g->ops.sync.sema.add_incr_cmd(g, cmd, s, va, wfi);
-		gpu_sema_verbose_dbg(g, "(R) c=%d INCR %u (%u) pool=%-3llu"
-			"va=0x%llx cmd_mem=0x%llx b=0x%llx off=%u",
-			ch, nvgpu_semaphore_get_value(s),
-			nvgpu_semaphore_read(s),
-			nvgpu_semaphore_get_hw_pool_page_idx(s),
-			va, cmd->gva, cmd->mem->gpu_va, offset);
-	}
+static void add_sema_incr_cmd(struct gk20a *g, struct nvgpu_channel *c,
+	struct nvgpu_semaphore *s, struct priv_cmd_entry *cmd,
+	bool wfi)
+{
+	int ch = c->chid;
+	u64 va;
+
+	/* release will need to write back to the semaphore memory. */
+	va = nvgpu_semaphore_gpu_rw_va(s);
+
+	/* incr the underlying sema next_value (like syncpt's max). */
+	nvgpu_semaphore_prepare(s, c->hw_sema);
+
+	g->ops.sync.sema.add_incr_cmd(g, cmd, s, va, wfi);
+	gpu_sema_verbose_dbg(g, "(R) c=%d INCR %u (%u) pool=%-3llu"
+			"va=0x%llx cmd_mem=0x%llx b=0x%llx",
+			ch, nvgpu_semaphore_get_value(s),
+			nvgpu_semaphore_read(s),
+			nvgpu_semaphore_get_hw_pool_page_idx(s),
+			va, cmd->gva, cmd->mem->gpu_va);
 }
 
 static void channel_sync_semaphore_gen_wait_cmd(struct nvgpu_channel *c,
@@ -110,8 +110,8 @@ static void channel_sync_semaphore_gen_wait_cmd(struct nvgpu_channel *c,
 	} else {
 		has_incremented = nvgpu_semaphore_can_wait(sema);
 		nvgpu_assert(has_incremented);
-		add_sema_cmd(c->g, c, sema, wait_cmd,
-				pos * wait_cmd_size, true, false);
+		add_sema_wait_cmd(c->g, c, sema, wait_cmd,
+				pos * wait_cmd_size);
 		nvgpu_semaphore_put(sema);
 	}
 }
@@ -201,7 +201,7 @@ static int channel_sync_semaphore_incr_common(
 	}
 
 	/* Release the completion semaphore. */
-	add_sema_cmd(c->g, c, semaphore, incr_cmd, 0, false, wfi_cmd);
+	add_sema_incr_cmd(c->g, c, semaphore, incr_cmd, wfi_cmd);
 
 	if (need_sync_fence) {
 		err = nvgpu_os_fence_sema_create(&os_fence, c,
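
Illustrative follow-up (not part of the patch above): a minimal, self-contained C sketch of the call shape this refactor produces. The types and helpers below are hypothetical stand-ins, not the real nvgpu structures; the point is only the design choice of splitting one flag-driven helper into a wait variant (needs only the offset) and an incr variant (needs only the wfi flag), so callers pick a function instead of passing bool acquire.

/*
 * Simplified stand-ins; none of this is nvgpu code.
 */
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

struct sema {
	uint32_t next_value;	/* stand-in for the semaphore payload target */
};

/* Wait (acquire) side: only needs a read-only view and a buffer offset. */
static void add_sema_wait_cmd(struct sema *s, uint32_t offset)
{
	printf("wait: value=%u off=%u (RO mapping)\n", s->next_value, offset);
}

/* Incr (release) side: bumps next_value and may request a wait-for-idle. */
static void add_sema_incr_cmd(struct sema *s, bool wfi)
{
	s->next_value++;	/* mirrors preparing the sema before the incr */
	printf("incr: value=%u wfi=%d (RW mapping)\n", s->next_value, wfi);
}

int main(void)
{
	struct sema s = { .next_value = 0 };

	add_sema_incr_cmd(&s, false);	/* release path: no offset needed */
	add_sema_wait_cmd(&s, 0);	/* wait path: no wfi flag needed */
	return 0;
}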