From 8880c82111a36c8a5db9997ff434f549fd6419ea Mon Sep 17 00:00:00 2001
From: Vinod G <vinodg@nvidia.com>
Date: Thu, 18 Apr 2019 11:55:05 -0700
Subject: [PATCH] gpu: nvgpu: move gk20a_gr_isr to hal

Move gk20a_gr_isr function to stall_isr hal in gr.intr unit.
Move all static functions accessed in gk20a_gr_isr function
to gr_intr file from gr_gk20a file.

Update mc hal functions to use g->ops.gr.intr.stall_isr

JIRA NVGPU-1891
JIRA NVGPU-3016

Change-Id: If379348eef863b8d794a726b98e190ebe8585cb2
Signed-off-by: Vinod G <vinodg@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/2100670
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svc-mobile-misra <svc-mobile-misra@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/common/gr/gr_intr.c        | 273 ++++++++++++++++++-
 drivers/gpu/nvgpu/gk20a/gr_gk20a.c           | 264 +-----------------
 drivers/gpu/nvgpu/gk20a/gr_gk20a.h           |   2 -
 drivers/gpu/nvgpu/hal/init/hal_gm20b.c       |   1 +
 drivers/gpu/nvgpu/hal/init/hal_gp10b.c       |   1 +
 drivers/gpu/nvgpu/hal/init/hal_gv100.c       |   1 +
 drivers/gpu/nvgpu/hal/init/hal_gv11b.c       |   1 +
 drivers/gpu/nvgpu/hal/init/hal_tu104.c       |   1 +
 drivers/gpu/nvgpu/hal/mc/mc_gm20b.c          |   3 +-
 drivers/gpu/nvgpu/hal/mc/mc_gp10b.c          |   3 +-
 drivers/gpu/nvgpu/include/nvgpu/gk20a.h      |   5 +-
 drivers/gpu/nvgpu/include/nvgpu/gr/gr_intr.h |   7 +-
 12 files changed, 284 insertions(+), 278 deletions(-)

diff --git a/drivers/gpu/nvgpu/common/gr/gr_intr.c b/drivers/gpu/nvgpu/common/gr/gr_intr.c
index ea9a5ebfc..2f5772eba 100644
--- a/drivers/gpu/nvgpu/common/gr/gr_intr.c
+++ b/drivers/gpu/nvgpu/common/gr/gr_intr.c
@@ -24,7 +24,8 @@
 #include <nvgpu/io.h>
 #include <nvgpu/channel.h>
 #include <nvgpu/regops.h>
-#include <nvgpu/nvgpu_err.h>
+#include <nvgpu/rc.h>
+#include <nvgpu/error_notifier.h>
 
 #include <nvgpu/gr/gr.h>
 #include <nvgpu/gr/gr_intr.h>
@@ -105,6 +106,52 @@ static int gr_intr_handle_tpc_exception(struct gk20a *g, u32 gpc, u32 tpc,
 	return ret;
 }
 
+static void gr_intr_post_bpt_events(struct gk20a *g, struct tsg_gk20a *tsg,
+				    u32 global_esr)
+{
+	if (g->ops.gr.esr_bpt_pending_events(global_esr,
+						NVGPU_EVENT_ID_BPT_INT)) {
+		g->ops.tsg.post_event_id(tsg, NVGPU_EVENT_ID_BPT_INT);
+	}
+
+	if (g->ops.gr.esr_bpt_pending_events(global_esr,
+						NVGPU_EVENT_ID_BPT_PAUSE)) {
+		g->ops.tsg.post_event_id(tsg, NVGPU_EVENT_ID_BPT_PAUSE);
+	}
+}
+
+static int gr_intr_handle_illegal_method(struct gk20a *g,
+					  struct nvgpu_gr_isr_data *isr_data)
+{
+	int ret = g->ops.gr.handle_sw_method(g, isr_data->addr,
+			isr_data->class_num, isr_data->offset,
+			isr_data->data_lo);
+	if (ret != 0) {
+		nvgpu_gr_intr_set_error_notifier(g, isr_data,
+			 NVGPU_ERR_NOTIFIER_GR_ILLEGAL_NOTIFY);
+		nvgpu_err(g, "invalid method class 0x%08x"
+			", offset 0x%08x address 0x%08x",
+			isr_data->class_num, isr_data->offset, isr_data->addr);
+	}
+	return ret;
+}
+
+static int gr_intr_handle_class_error(struct gk20a *g,
+				       struct nvgpu_gr_isr_data *isr_data)
+{
+	u32 chid = isr_data->ch != NULL ?
+		isr_data->ch->chid : FIFO_INVAL_CHANNEL_ID;
+
+	nvgpu_log_fn(g, " ");
+
+	g->ops.gr.intr.handle_class_error(g, chid, isr_data);
+
+	nvgpu_gr_intr_set_error_notifier(g, isr_data,
+			 NVGPU_ERR_NOTIFIER_GR_ERROR_SW_NOTIFY);
+
+	return -EINVAL;
+}
+
 /* Used by sw interrupt thread to translate current ctx to chid.
  * Also used by regops to translate current ctx to chid and tsgid.
  * For performance, we don't want to go through 128 channels every time.
@@ -227,6 +274,26 @@ void nvgpu_gr_intr_report_exception(struct gk20a *g, u32 inst,
 	}
 }
 
+void nvgpu_gr_intr_set_error_notifier(struct gk20a *g,
+		  struct nvgpu_gr_isr_data *isr_data, u32 error_notifier)
+{
+	struct channel_gk20a *ch;
+	struct tsg_gk20a *tsg;
+
+	ch = isr_data->ch;
+
+	if (ch == NULL) {
+		return;
+	}
+
+	tsg = tsg_gk20a_from_ch(ch);
+	if (tsg != NULL) {
+		nvgpu_tsg_set_error_notifier(g, tsg, error_notifier);
+	} else {
+		nvgpu_err(g, "chid: %d is not bound to tsg", ch->chid);
+	}
+}
+
 int nvgpu_gr_intr_handle_gpc_exception(struct gk20a *g, bool *post_event,
 	struct nvgpu_gr_config *gr_config, struct channel_gk20a *fault_ch,
 	u32 *hww_global_esr)
@@ -315,7 +382,7 @@ static inline bool is_valid_cyclestats_bar0_offset_gk20a(struct gk20a *g,
 }
 #endif
 
-int nvgpu_gr_intr_handle_notify_pending(struct gk20a *g,
+void nvgpu_gr_intr_handle_notify_pending(struct gk20a *g,
 					struct nvgpu_gr_isr_data *isr_data)
 {
 	struct channel_gk20a *ch = isr_data->ch;
@@ -327,14 +394,14 @@ int nvgpu_gr_intr_handle_notify_pending(struct gk20a *g,
 	bool exit;
 #endif
 	if (ch == NULL || tsg_gk20a_from_ch(ch) == NULL) {
-		return 0;
+		return;
 	}
 
 #if defined(CONFIG_GK20A_CYCLE_STATS)
 	/* GL will never use payload 0 for cycle state */
 	if ((ch->cyclestate.cyclestate_buffer == NULL) ||
 	    (isr_data->data_lo == 0)) {
-		return 0;
+		return;
 	}
 
 	nvgpu_mutex_acquire(&ch->cyclestate.cyclestate_buffer_mutex);
@@ -445,17 +512,16 @@ int nvgpu_gr_intr_handle_notify_pending(struct gk20a *g,
 #endif
 	nvgpu_log_fn(g, " ");
 	nvgpu_cond_broadcast_interruptible(&ch->notifier_wq);
-	return 0;
 }
 
-int nvgpu_gr_intr_handle_semaphore_pending(struct gk20a *g,
+void nvgpu_gr_intr_handle_semaphore_pending(struct gk20a *g,
 					   struct nvgpu_gr_isr_data *isr_data)
 {
 	struct channel_gk20a *ch = isr_data->ch;
 	struct tsg_gk20a *tsg;
 
 	if (ch == NULL) {
-		return 0;
+		return;
 	}
 
 	tsg = tsg_gk20a_from_ch(ch);
@@ -467,6 +533,199 @@ int nvgpu_gr_intr_handle_semaphore_pending(struct gk20a *g,
 	} else {
 		nvgpu_err(g, "chid: %d is not bound to tsg", ch->chid);
 	}
+}
+
+int nvgpu_gr_intr_stall_isr(struct gk20a *g)
+{
+	struct nvgpu_gr_isr_data isr_data;
+	struct nvgpu_gr_intr_info intr_info;
+	bool need_reset = false;
+	struct channel_gk20a *ch = NULL;
+	struct channel_gk20a *fault_ch = NULL;
+	u32 tsgid = NVGPU_INVALID_TSG_ID;
+	struct tsg_gk20a *tsg = NULL;
+	u32 global_esr = 0;
+	u32 chid;
+	struct nvgpu_gr_config *gr_config = g->gr->config;
+	u32 gr_intr = g->ops.gr.intr.read_pending_interrupts(g, &intr_info);
+	u32 clear_intr = gr_intr;
+
+	nvgpu_log_fn(g, " ");
+	nvgpu_log(g, gpu_dbg_intr, "pgraph intr 0x%08x", gr_intr);
+
+	if (gr_intr == 0U) {
+		return 0;
+	}
+
+	/* Disable fifo access */
+	g->ops.gr.init.fifo_access(g, false);
+
+	g->ops.gr.intr.trapped_method_info(g, &isr_data);
+
+	ch = nvgpu_gr_intr_get_channel_from_ctx(g, isr_data.curr_ctx, &tsgid);
+	isr_data.ch = ch;
+	chid = ch != NULL ? ch->chid : FIFO_INVAL_CHANNEL_ID;
+
+	if (ch == NULL) {
+		nvgpu_err(g, "pgraph intr: 0x%08x, chid: INVALID", gr_intr);
+	} else {
+		tsg = tsg_gk20a_from_ch(ch);
+		if (tsg == NULL) {
+			nvgpu_err(g, "pgraph intr: 0x%08x, chid: %d "
+				"not bound to tsg", gr_intr, chid);
+		}
+	}
+
+	nvgpu_log(g, gpu_dbg_intr | gpu_dbg_gpu_dbg,
+		"channel %d: addr 0x%08x, "
+		"data 0x%08x 0x%08x,"
+		"ctx 0x%08x, offset 0x%08x, "
+		"subchannel 0x%08x, class 0x%08x",
+		chid, isr_data.addr,
+		isr_data.data_hi, isr_data.data_lo,
+		isr_data.curr_ctx, isr_data.offset,
+		isr_data.sub_chan, isr_data.class_num);
+
+	if (intr_info.notify != 0U) {
+		g->ops.gr.intr.handle_notify_pending(g, &isr_data);
+		clear_intr &= ~intr_info.notify;
+	}
+
+	if (intr_info.semaphore != 0U) {
+		g->ops.gr.intr.handle_semaphore_pending(g, &isr_data);
+		clear_intr &= ~intr_info.semaphore;
+	}
+
+	if (intr_info.illegal_notify != 0U) {
+		nvgpu_err(g, "illegal notify pending");
+
+		nvgpu_gr_intr_set_error_notifier(g, &isr_data,
+				NVGPU_ERR_NOTIFIER_GR_ILLEGAL_NOTIFY);
+		need_reset = true;
+		clear_intr &= ~intr_info.illegal_notify;
+	}
+
+	if (intr_info.illegal_method != 0U) {
+		if (gr_intr_handle_illegal_method(g, &isr_data) != 0) {
+			need_reset = true;
+		}
+		clear_intr &= ~intr_info.illegal_method;
+	}
+
+	if (intr_info.illegal_class != 0U) {
+		nvgpu_err(g, "invalid class 0x%08x, offset 0x%08x",
+			  isr_data.class_num, isr_data.offset);
+
+		nvgpu_gr_intr_set_error_notifier(g, &isr_data,
+				NVGPU_ERR_NOTIFIER_GR_ERROR_SW_NOTIFY);
+		need_reset = true;
+		clear_intr &= ~intr_info.illegal_class;
+	}
+
+	if (intr_info.fecs_error != 0U) {
+		if (g->ops.gr.handle_fecs_error(g, ch, &isr_data) != 0) {
+			need_reset = true;
+		}
+		clear_intr &= ~intr_info.fecs_error;
+	}
+
+	if (intr_info.class_error != 0U) {
+		if (gr_intr_handle_class_error(g, &isr_data) != 0) {
+			need_reset = true;
+		}
+		clear_intr &= ~intr_info.class_error;
+	}
+
+	/* this one happens if someone tries to hit a non-whitelisted
+	 * register using set_falcon[4] */
+	if (intr_info.fw_method != 0U) {
+		u32 ch_id = isr_data.ch != NULL ?
+			isr_data.ch->chid : FIFO_INVAL_CHANNEL_ID;
+		nvgpu_err(g,
+		   "firmware method 0x%08x, offset 0x%08x for channel %u",
+		   isr_data.class_num, isr_data.offset,
+		   ch_id);
+
+		nvgpu_gr_intr_set_error_notifier(g, &isr_data,
+			 NVGPU_ERR_NOTIFIER_GR_ERROR_SW_NOTIFY);
+		need_reset = true;
+		clear_intr &= ~intr_info.fw_method;
+	}
+
+	if (intr_info.exception != 0U) {
+		bool is_gpc_exception = false;
+
+		need_reset = g->ops.gr.intr.handle_exceptions(g,
+							&is_gpc_exception);
+
+		/* check if a gpc exception has occurred */
+		if (is_gpc_exception &&	!need_reset) {
+			bool post_event = false;
+
+			nvgpu_log(g, gpu_dbg_intr | gpu_dbg_gpu_dbg,
+					 "GPC exception pending");
+
+			if (tsg != NULL) {
+				fault_ch = isr_data.ch;
+			}
+
+			/* fault_ch can be NULL */
+			/* check if any gpc has an exception */
+			if (nvgpu_gr_intr_handle_gpc_exception(g, &post_event,
+				gr_config, fault_ch, &global_esr) != 0) {
+				need_reset = true;
+			}
+
+#ifdef NVGPU_DEBUGGER
+			/* signal clients waiting on an event */
+			if (g->ops.gr.sm_debugger_attached(g) &&
+				post_event && (fault_ch != NULL)) {
+				g->ops.debugger.post_events(fault_ch);
+			}
+#endif
+		}
+		clear_intr &= ~intr_info.exception;
+
+		if (need_reset) {
+			nvgpu_err(g, "set gr exception notifier");
+			nvgpu_gr_intr_set_error_notifier(g, &isr_data,
+					 NVGPU_ERR_NOTIFIER_GR_EXCEPTION);
+		}
+	}
+
+	if (need_reset) {
+		nvgpu_rc_gr_fault(g, tsg, ch);
+	}
+
+	if (clear_intr != 0U) {
+		if (ch == NULL) {
+			/*
+			 * This is probably an interrupt during
+			 * gk20a_free_channel()
+			 */
+			nvgpu_err(g, "unhandled gr intr 0x%08x for "
+				"unreferenceable channel, clearing",
+				gr_intr);
+		} else {
+			nvgpu_err(g, "unhandled gr intr 0x%08x for chid: %d",
+				gr_intr, chid);
+		}
+	}
+
+	/* clear handled and unhandled interrupts */
+	g->ops.gr.intr.clear_pending_interrupts(g, gr_intr);
+
+	/* Enable fifo access */
+	g->ops.gr.init.fifo_access(g, true);
+
+	/* Posting of BPT events should be the last thing in this function */
+	if ((global_esr != 0U) && (tsg != NULL) && (need_reset == false)) {
+		gr_intr_post_bpt_events(g, tsg, global_esr);
+	}
+
+	if (ch != NULL) {
+		gk20a_channel_put(ch);
+	}
 
 	return 0;
 }
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index 1782d37af..3caf9e57f 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -41,7 +41,6 @@
 #include <nvgpu/io.h>
 #include <nvgpu/utils.h>
 #include <nvgpu/fifo.h>
-#include <nvgpu/rc.h>
 #include <nvgpu/gk20a.h>
 #include <nvgpu/channel.h>
 #include <nvgpu/string.h>
@@ -248,42 +247,6 @@ int gr_gk20a_update_hwpm_ctxsw_mode(struct gk20a *g,
 	return ret;
 }
 
-static void gk20a_gr_set_error_notifier(struct gk20a *g,
-		  struct nvgpu_gr_isr_data *isr_data, u32 error_notifier)
-{
-	struct channel_gk20a *ch;
-	struct tsg_gk20a *tsg;
-
-	ch = isr_data->ch;
-
-	if (ch == NULL) {
-		return;
-	}
-
-	tsg = tsg_gk20a_from_ch(ch);
-	if (tsg != NULL) {
-		nvgpu_tsg_set_error_notifier(g, tsg, error_notifier);
-	} else {
-		nvgpu_err(g, "chid: %d is not bound to tsg", ch->chid);
-	}
-}
-
-static int gk20a_gr_handle_illegal_method(struct gk20a *g,
-					  struct nvgpu_gr_isr_data *isr_data)
-{
-	int ret = g->ops.gr.handle_sw_method(g, isr_data->addr,
-			isr_data->class_num, isr_data->offset,
-			isr_data->data_lo);
-	if (ret != 0) {
-		gk20a_gr_set_error_notifier(g, isr_data,
-			 NVGPU_ERR_NOTIFIER_GR_ILLEGAL_NOTIFY);
-		nvgpu_err(g, "invalid method class 0x%08x"
-			", offset 0x%08x address 0x%08x",
-			isr_data->class_num, isr_data->offset, isr_data->addr);
-	}
-	return ret;
-}
-
 int gk20a_gr_handle_fecs_error(struct gk20a *g, struct channel_gk20a *ch,
 					  struct nvgpu_gr_isr_data *isr_data)
 {
@@ -303,7 +266,7 @@ int gk20a_gr_handle_fecs_error(struct gk20a *g, struct channel_gk20a *ch,
 	if (fecs_host_intr.unimp_fw_method_active) {
 		mailbox_value = g->ops.gr.falcon.read_fecs_ctxsw_mailbox(g,
 								mailbox_id);
-		gk20a_gr_set_error_notifier(g, isr_data,
+		nvgpu_gr_intr_set_error_notifier(g, isr_data,
 			 NVGPU_ERR_NOTIFIER_FECS_ERR_UNIMP_FIRMWARE_METHOD);
 		nvgpu_err(g,
 			  "firmware method error 0x%08x for offset 0x%04x",
@@ -371,22 +334,6 @@ int gk20a_gr_handle_fecs_error(struct gk20a *g, struct channel_gk20a *ch,
 	return ret;
 }
 
-static int gk20a_gr_handle_class_error(struct gk20a *g,
-				       struct nvgpu_gr_isr_data *isr_data)
-{
-	u32 chid = isr_data->ch != NULL ?
-		isr_data->ch->chid : FIFO_INVAL_CHANNEL_ID;
-
-	nvgpu_log_fn(g, " ");
-
-	g->ops.gr.intr.handle_class_error(g, chid, isr_data);
-
-	gk20a_gr_set_error_notifier(g, isr_data,
-			 NVGPU_ERR_NOTIFIER_GR_ERROR_SW_NOTIFY);
-
-	return -EINVAL;
-}
-
 int gk20a_gr_lock_down_sm(struct gk20a *g,
 			 u32 gpc, u32 tpc, u32 sm, u32 global_esr_mask,
 			 bool check_errors)
@@ -535,215 +482,6 @@ void gk20a_gr_get_esr_sm_sel(struct gk20a *g, u32 gpc, u32 tpc,
 	*esr_sm_sel = 1;
 }
 
-void gr_intr_post_bpt_events(struct gk20a *g, struct tsg_gk20a *tsg,
-				    u32 global_esr)
-{
-	if (g->ops.gr.esr_bpt_pending_events(global_esr,
-						NVGPU_EVENT_ID_BPT_INT)) {
-		g->ops.tsg.post_event_id(tsg, NVGPU_EVENT_ID_BPT_INT);
-	}
-
-	if (g->ops.gr.esr_bpt_pending_events(global_esr,
-						NVGPU_EVENT_ID_BPT_PAUSE)) {
-		g->ops.tsg.post_event_id(tsg, NVGPU_EVENT_ID_BPT_PAUSE);
-	}
-}
-
-int gk20a_gr_isr(struct gk20a *g)
-{
-	struct nvgpu_gr_isr_data isr_data;
-	struct nvgpu_gr_intr_info intr_info;
-	bool need_reset = false;
-	struct channel_gk20a *ch = NULL;
-	struct channel_gk20a *fault_ch = NULL;
-	u32 tsgid = NVGPU_INVALID_TSG_ID;
-	struct tsg_gk20a *tsg = NULL;
-	u32 global_esr = 0;
-	u32 chid;
-	struct nvgpu_gr_config *gr_config = g->gr->config;
-	u32 gr_intr = g->ops.gr.intr.read_pending_interrupts(g, &intr_info);
-	u32 clear_intr = gr_intr;
-
-	nvgpu_log_fn(g, " ");
-	nvgpu_log(g, gpu_dbg_intr, "pgraph intr 0x%08x", gr_intr);
-
-	if (gr_intr == 0U) {
-		return 0;
-	}
-
-	/* Disable fifo access */
-	g->ops.gr.init.fifo_access(g, false);
-
-	g->ops.gr.intr.trapped_method_info(g, &isr_data);
-
-	ch = nvgpu_gr_intr_get_channel_from_ctx(g, isr_data.curr_ctx, &tsgid);
-	isr_data.ch = ch;
-	chid = ch != NULL ? ch->chid : FIFO_INVAL_CHANNEL_ID;
-
-	if (ch == NULL) {
-		nvgpu_err(g, "pgraph intr: 0x%08x, chid: INVALID", gr_intr);
-	} else {
-		tsg = tsg_gk20a_from_ch(ch);
-		if (tsg == NULL) {
-			nvgpu_err(g, "pgraph intr: 0x%08x, chid: %d "
-				"not bound to tsg", gr_intr, chid);
-		}
-	}
-
-	nvgpu_log(g, gpu_dbg_intr | gpu_dbg_gpu_dbg,
-		"channel %d: addr 0x%08x, "
-		"data 0x%08x 0x%08x,"
-		"ctx 0x%08x, offset 0x%08x, "
-		"subchannel 0x%08x, class 0x%08x",
-		chid, isr_data.addr,
-		isr_data.data_hi, isr_data.data_lo,
-		isr_data.curr_ctx, isr_data.offset,
-		isr_data.sub_chan, isr_data.class_num);
-
-	if (intr_info.notify != 0U) {
-		g->ops.gr.intr.handle_notify_pending(g, &isr_data);
-		clear_intr &= ~intr_info.notify;
-	}
-
-	if (intr_info.semaphore != 0U) {
-		g->ops.gr.intr.handle_semaphore_pending(g, &isr_data);
-		clear_intr &= ~intr_info.semaphore;
-	}
-
-	if (intr_info.illegal_notify != 0U) {
-		nvgpu_err(g, "illegal notify pending");
-
-		gk20a_gr_set_error_notifier(g, &isr_data,
-				NVGPU_ERR_NOTIFIER_GR_ILLEGAL_NOTIFY);
-		need_reset = true;
-		clear_intr &= ~intr_info.illegal_notify;
-	}
-
-	if (intr_info.illegal_method != 0U) {
-		if (gk20a_gr_handle_illegal_method(g, &isr_data) != 0) {
-			need_reset = true;
-		}
-		clear_intr &= ~intr_info.illegal_method;
-	}
-
-	if (intr_info.illegal_class != 0U) {
-		nvgpu_err(g, "invalid class 0x%08x, offset 0x%08x",
-			  isr_data.class_num, isr_data.offset);
-
-		gk20a_gr_set_error_notifier(g, &isr_data,
-				NVGPU_ERR_NOTIFIER_GR_ERROR_SW_NOTIFY);
-		need_reset = true;
-		clear_intr &= ~intr_info.illegal_class;
-	}
-
-	if (intr_info.fecs_error != 0U) {
-		if (g->ops.gr.handle_fecs_error(g, ch, &isr_data) != 0) {
-			need_reset = true;
-		}
-		clear_intr &= ~intr_info.fecs_error;
-	}
-
-	if (intr_info.class_error != 0U) {
-		if (gk20a_gr_handle_class_error(g, &isr_data) != 0) {
-			need_reset = true;
-		}
-		clear_intr &= ~intr_info.class_error;
-	}
-
-	/* this one happens if someone tries to hit a non-whitelisted
-	 * register using set_falcon[4] */
-	if (intr_info.fw_method != 0U) {
-		u32 ch_id = isr_data.ch != NULL ?
-			isr_data.ch->chid : FIFO_INVAL_CHANNEL_ID;
-		nvgpu_err(g,
-		   "firmware method 0x%08x, offset 0x%08x for channel %u",
-		   isr_data.class_num, isr_data.offset,
-		   ch_id);
-
-		gk20a_gr_set_error_notifier(g, &isr_data,
-			 NVGPU_ERR_NOTIFIER_GR_ERROR_SW_NOTIFY);
-		need_reset = true;
-		clear_intr &= ~intr_info.fw_method;
-	}
-
-	if (intr_info.exception != 0U) {
-		bool is_gpc_exception = false;
-
-		need_reset = g->ops.gr.intr.handle_exceptions(g,
-							&is_gpc_exception);
-
-		/* check if a gpc exception has occurred */
-		if (is_gpc_exception &&	!need_reset) {
-			bool post_event = false;
-
-			nvgpu_log(g, gpu_dbg_intr | gpu_dbg_gpu_dbg,
-					 "GPC exception pending");
-
-			if (tsg != NULL) {
-				fault_ch = isr_data.ch;
-			}
-
-			/* fault_ch can be NULL */
-			/* check if any gpc has an exception */
-			if (nvgpu_gr_intr_handle_gpc_exception(g, &post_event,
-				gr_config, fault_ch, &global_esr) != 0) {
-				need_reset = true;
-			}
-
-#ifdef NVGPU_DEBUGGER
-			/* signal clients waiting on an event */
-			if (g->ops.gr.sm_debugger_attached(g) &&
-				post_event && (fault_ch != NULL)) {
-				g->ops.debugger.post_events(fault_ch);
-			}
-#endif
-		}
-		clear_intr &= ~intr_info.exception;
-
-		if (need_reset) {
-			nvgpu_err(g, "set gr exception notifier");
-			gk20a_gr_set_error_notifier(g, &isr_data,
-					 NVGPU_ERR_NOTIFIER_GR_EXCEPTION);
-		}
-	}
-
-	if (need_reset) {
-		nvgpu_rc_gr_fault(g, tsg, ch);
-	}
-
-	if (clear_intr != 0U) {
-		if (ch == NULL) {
-			/*
-			 * This is probably an interrupt during
-			 * gk20a_free_channel()
-			 */
-			nvgpu_err(g, "unhandled gr intr 0x%08x for "
-				"unreferenceable channel, clearing",
-				gr_intr);
-		} else {
-			nvgpu_err(g, "unhandled gr intr 0x%08x for chid: %d",
-				gr_intr, chid);
-		}
-	}
-
-	/* clear handled and unhandled interrupts */
-	g->ops.gr.intr.clear_pending_interrupts(g, gr_intr);
-
-	/* Enable fifo access */
-	g->ops.gr.init.fifo_access(g, true);
-
-	/* Posting of BPT events should be the last thing in this function */
-	if ((global_esr != 0U) && (tsg != NULL) && (need_reset == false)) {
-		gr_intr_post_bpt_events(g, tsg, global_esr);
-	}
-
-	if (ch != NULL) {
-		gk20a_channel_put(ch);
-	}
-
-	return 0;
-}
-
 static int gr_gk20a_find_priv_offset_in_buffer(struct gk20a *g,
 					       u32 addr,
 					       bool is_quad, u32 quad,
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
index 21e538693..e43f35d8f 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
@@ -147,8 +147,6 @@ struct nvgpu_warpstate {
 	u64 paused_warps[2];
 };
 
-int gk20a_gr_isr(struct gk20a *g);
-
 /* sm */
 bool gk20a_gr_sm_debugger_attached(struct gk20a *g);
 u32 gk20a_gr_get_sm_no_lock_down_hww_global_esr_mask(struct gk20a *g);
diff --git a/drivers/gpu/nvgpu/hal/init/hal_gm20b.c b/drivers/gpu/nvgpu/hal/init/hal_gm20b.c
index e311c8849..3ebd37cbe 100644
--- a/drivers/gpu/nvgpu/hal/init/hal_gm20b.c
+++ b/drivers/gpu/nvgpu/hal/init/hal_gm20b.c
@@ -498,6 +498,7 @@ static const struct gpu_ops gm20b_ops = {
 				gm20ab_gr_intr_tpc_exception_sm_enable,
 			.tpc_exception_sm_disable =
 				gm20ab_gr_intr_tpc_exception_sm_disable,
+			.stall_isr = nvgpu_gr_intr_stall_isr,
 		},
 		.falcon = {
 			.read_fecs_ctxsw_mailbox =
diff --git a/drivers/gpu/nvgpu/hal/init/hal_gp10b.c b/drivers/gpu/nvgpu/hal/init/hal_gp10b.c
index 5419beff1..99ac9db1d 100644
--- a/drivers/gpu/nvgpu/hal/init/hal_gp10b.c
+++ b/drivers/gpu/nvgpu/hal/init/hal_gp10b.c
@@ -590,6 +590,7 @@ static const struct gpu_ops gp10b_ops = {
 				gm20ab_gr_intr_tpc_exception_sm_enable,
 			.tpc_exception_sm_disable =
 				gm20ab_gr_intr_tpc_exception_sm_disable,
+			.stall_isr = nvgpu_gr_intr_stall_isr,
 		},
 		.falcon = {
 			.read_fecs_ctxsw_mailbox =
diff --git a/drivers/gpu/nvgpu/hal/init/hal_gv100.c b/drivers/gpu/nvgpu/hal/init/hal_gv100.c
index 5b7fbeb8f..46ac72876 100644
--- a/drivers/gpu/nvgpu/hal/init/hal_gv100.c
+++ b/drivers/gpu/nvgpu/hal/init/hal_gv100.c
@@ -731,6 +731,7 @@ static const struct gpu_ops gv100_ops = {
 				gm20ab_gr_intr_tpc_exception_sm_enable,
 			.tpc_exception_sm_disable =
 				gm20ab_gr_intr_tpc_exception_sm_disable,
+			.stall_isr = nvgpu_gr_intr_stall_isr,
 		},
 		.falcon = {
 			.read_fecs_ctxsw_mailbox =
diff --git a/drivers/gpu/nvgpu/hal/init/hal_gv11b.c b/drivers/gpu/nvgpu/hal/init/hal_gv11b.c
index 054e16b5d..e7aba11e8 100644
--- a/drivers/gpu/nvgpu/hal/init/hal_gv11b.c
+++ b/drivers/gpu/nvgpu/hal/init/hal_gv11b.c
@@ -708,6 +708,7 @@ static const struct gpu_ops gv11b_ops = {
 				gm20ab_gr_intr_tpc_exception_sm_enable,
 			.tpc_exception_sm_disable =
 				gm20ab_gr_intr_tpc_exception_sm_disable,
+			.stall_isr = nvgpu_gr_intr_stall_isr,
 		},
 		.falcon = {
 			.read_fecs_ctxsw_mailbox =
diff --git a/drivers/gpu/nvgpu/hal/init/hal_tu104.c b/drivers/gpu/nvgpu/hal/init/hal_tu104.c
index 093a2fd72..0fae7bf4e 100644
--- a/drivers/gpu/nvgpu/hal/init/hal_tu104.c
+++ b/drivers/gpu/nvgpu/hal/init/hal_tu104.c
@@ -761,6 +761,7 @@ static const struct gpu_ops tu104_ops = {
 				gm20ab_gr_intr_tpc_exception_sm_enable,
 			.tpc_exception_sm_disable =
 				gm20ab_gr_intr_tpc_exception_sm_disable,
+			.stall_isr = nvgpu_gr_intr_stall_isr,
 		},
 		.falcon = {
 			.read_fecs_ctxsw_mailbox =
diff --git a/drivers/gpu/nvgpu/hal/mc/mc_gm20b.c b/drivers/gpu/nvgpu/hal/mc/mc_gm20b.c
index c16a20a88..14d7fefd3 100644
--- a/drivers/gpu/nvgpu/hal/mc/mc_gm20b.c
+++ b/drivers/gpu/nvgpu/hal/mc/mc_gm20b.c
@@ -58,7 +58,8 @@ void gm20b_mc_isr_stall(struct gk20a *g)
 		engine_enum = g->fifo.engine_info[act_eng_id].engine_enum;
 		/* GR Engine */
 		if (engine_enum == NVGPU_ENGINE_GR_GK20A) {
-			nvgpu_pg_elpg_protected_call(g, gk20a_gr_isr(g));
+			nvgpu_pg_elpg_protected_call(g,
+						g->ops.gr.intr.stall_isr(g));
 		}
 
 		/* CE Engine */
diff --git a/drivers/gpu/nvgpu/hal/mc/mc_gp10b.c b/drivers/gpu/nvgpu/hal/mc/mc_gp10b.c
index 57905b0ae..854722901 100644
--- a/drivers/gpu/nvgpu/hal/mc/mc_gp10b.c
+++ b/drivers/gpu/nvgpu/hal/mc/mc_gp10b.c
@@ -111,7 +111,8 @@ void mc_gp10b_isr_stall(struct gk20a *g)
 		engine_enum = g->fifo.engine_info[act_eng_id].engine_enum;
 		/* GR Engine */
 		if (engine_enum == NVGPU_ENGINE_GR_GK20A) {
-			nvgpu_pg_elpg_protected_call(g, gk20a_gr_isr(g));
+			nvgpu_pg_elpg_protected_call(g,
+						g->ops.gr.intr.stall_isr(g));
 		}
 
 		/* CE Engine */
diff --git a/drivers/gpu/nvgpu/include/nvgpu/gk20a.h b/drivers/gpu/nvgpu/include/nvgpu/gk20a.h
index 58c53016f..f66b1b7aa 100644
--- a/drivers/gpu/nvgpu/include/nvgpu/gk20a.h
+++ b/drivers/gpu/nvgpu/include/nvgpu/gk20a.h
@@ -802,9 +802,9 @@ struct gpu_ops {
 			u32 (*read_exception1)(struct gk20a *g);
 			void (*trapped_method_info)(struct gk20a *g,
 				    struct nvgpu_gr_isr_data *isr_data);
-			int (*handle_semaphore_pending)(struct gk20a *g,
+			void (*handle_semaphore_pending)(struct gk20a *g,
 				struct nvgpu_gr_isr_data *isr_data);
-			int (*handle_notify_pending)(struct gk20a *g,
+			void (*handle_notify_pending)(struct gk20a *g,
 				struct nvgpu_gr_isr_data *isr_data);
 			void (*handle_gcc_exception)(struct gk20a *g, u32 gpc,
 				u32 tpc, u32 gpc_exception,
@@ -832,6 +832,7 @@ struct gpu_ops {
 			void (*tpc_exception_sm_disable)(struct gk20a *g,
 							       u32 offset);
 			void (*tpc_exception_sm_enable)(struct gk20a *g);
+			int (*stall_isr)(struct gk20a *g);
 		} intr;
 
 		u32 (*get_ctxsw_checksum_mismatch_mailbox_val)(void);
diff --git a/drivers/gpu/nvgpu/include/nvgpu/gr/gr_intr.h b/drivers/gpu/nvgpu/include/nvgpu/gr/gr_intr.h
index 775f56a99..ff90c47ae 100644
--- a/drivers/gpu/nvgpu/include/nvgpu/gr/gr_intr.h
+++ b/drivers/gpu/nvgpu/include/nvgpu/gr/gr_intr.h
@@ -59,12 +59,15 @@ struct nvgpu_gr_isr_data {
 int nvgpu_gr_intr_handle_gpc_exception(struct gk20a *g, bool *post_event,
 	struct nvgpu_gr_config *gr_config, struct channel_gk20a *fault_ch,
 	u32 *hww_global_esr);
-int nvgpu_gr_intr_handle_notify_pending(struct gk20a *g,
+void nvgpu_gr_intr_handle_notify_pending(struct gk20a *g,
 					struct nvgpu_gr_isr_data *isr_data);
-int nvgpu_gr_intr_handle_semaphore_pending(struct gk20a *g,
+void nvgpu_gr_intr_handle_semaphore_pending(struct gk20a *g,
 					   struct nvgpu_gr_isr_data *isr_data);
 void nvgpu_gr_intr_report_exception(struct gk20a *g, u32 inst,
 				u32 err_type, u32 status);
 struct channel_gk20a *nvgpu_gr_intr_get_channel_from_ctx(struct gk20a *g,
 				u32 curr_ctx, u32 *curr_tsgid);
+void nvgpu_gr_intr_set_error_notifier(struct gk20a *g,
+		  struct nvgpu_gr_isr_data *isr_data, u32 error_notifier);
+int nvgpu_gr_intr_stall_isr(struct gk20a *g);
 #endif /* NVGPU_GR_INTR_H */