Open source GPL/LGPL release

svcmobrel-release
2022-02-18 10:53:32 -08:00
commit f235e7c89d
2490 changed files with 683529 additions and 0 deletions

.gitignore vendored Normal file, 98 lines

@@ -0,0 +1,98 @@
#
# NOTE! Don't add files that are generated in specific
# subdirectories here. Add them in the ".gitignore" file
# in that subdirectory instead.
#
# NOTE! Please use 'git ls-files -i --exclude-standard'
# command after changing this file, to see if there are
# any tracked files which get ignored after the change.
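# (For example: if a generated file such as Module.symvers had been
# committed earlier, the command above would report it as a tracked file
# that the rules below now ignore.)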
#
# Normal rules
#
.*
*.o
*.o.*
*.a
*.s
*.ko
*.so
*.so.dbg
*.mod.c
*.i
*.lst
*.symtypes
*.order
*.elf
*.bin
*.gz
*.bz2
*.lzma
*.xz
*.lz4
*.lzo
*.patch
*.gcno
modules.builtin
Module.symvers
*.dwo
#
# Top-level generic files
#
/tags
/TAGS
/linux
/vmlinux
/vmlinuz
/System.map
/Module.markers
#
# Debian directory (make deb-pkg)
#
/debian/
#
# git files that we don't want to ignore even if they are dot-files
#
!.gitignore
!.mailmap
#
# Generated include files
#
include/config
include/generated
arch/*/include/generated
# stgit generated dirs
patches-*
# quilt's files
patches
series
# cscope files
cscope.*
ncscope.*
# gnu global files
GPATH
GRTAGS
GSYMS
GTAGS
*.orig
*~
\#*#
#
# Leavings from module signing
#
extra_certificates
signing_key.priv
signing_key.x509
x509.genkey
# Kconfig presets
all.config

Makefile.umbrella.tmk Normal file, 172 lines

@@ -0,0 +1,172 @@
################################### tell Emacs this is a -*- makefile-gmake -*-
#
# Copyright (c) 2018-2021, NVIDIA CORPORATION. All rights reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a
# copy of this software and associated documentation files (the "Software"),
# to deal in the Software without restriction, including without limitation
# the rights to use, copy, modify, merge, publish, distribute, sublicense,
# and/or sell copies of the Software, and to permit persons to whom the
# Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
# DEALINGS IN THE SOFTWARE.
#
# tmake for SW Mobile
#
# Repository umbrella makefile fragment for "nvgpu"
#
###############################################################################
#
# Components common to all builds
#
NV_REPOSITORY_COMPONENTS :=
ifneq ($(NV_BUILD_CONFIGURATION_OS_IS_INTEGRITY),1)
ifeq ($(NV_BUILD_CONFIGURATION_OS_IS_QNX),1)
ifeq ($(NV_BUILD_CONFIGURATION_IS_SAFETY),1)
# On QNX, the unit tests are built only for safety profile.
build_nvgpu_ut := 1
endif
else
# On L4T, the unit tests are built with safety profile forced.
build_nvgpu_ut := 1
endif
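# Summary of the checks above: build_nvgpu_ut stays unset on INTEGRITY,
# is set only for the safety profile on QNX, and is always set on L4T.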
ifeq ($(build_nvgpu_ut),1)
NV_REPOSITORY_COMPONENTS := libs/igpu
NV_REPOSITORY_COMPONENTS += libs/dgpu
NV_REPOSITORY_COMPONENTS += userspace
NV_REPOSITORY_COMPONENTS += userspace/units/posix/bitops
NV_REPOSITORY_COMPONENTS += userspace/units/posix/env
NV_REPOSITORY_COMPONENTS += userspace/units/posix/fault-injection
NV_REPOSITORY_COMPONENTS += userspace/units/posix/bug
NV_REPOSITORY_COMPONENTS += userspace/units/posix/os_sched
NV_REPOSITORY_COMPONENTS += userspace/units/posix/sizes
NV_REPOSITORY_COMPONENTS += userspace/units/init
NV_REPOSITORY_COMPONENTS += userspace/units/posix/log2
NV_REPOSITORY_COMPONENTS += userspace/units/posix/thread
NV_REPOSITORY_COMPONENTS += userspace/units/posix/cond
NV_REPOSITORY_COMPONENTS += userspace/units/posix/timers
NV_REPOSITORY_COMPONENTS += userspace/units/posix/kmem
NV_REPOSITORY_COMPONENTS += userspace/units/posix/rwsem
NV_REPOSITORY_COMPONENTS += userspace/units/posix/queue
NV_REPOSITORY_COMPONENTS += userspace/units/posix/utils
NV_REPOSITORY_COMPONENTS += userspace/units/posix/circ_buf
NV_REPOSITORY_COMPONENTS += userspace/units/interface/bit-utils
NV_REPOSITORY_COMPONENTS += userspace/units/interface/lock
NV_REPOSITORY_COMPONENTS += userspace/units/interface/nvgpu_gk20a
NV_REPOSITORY_COMPONENTS += userspace/units/interface/atomic
NV_REPOSITORY_COMPONENTS += userspace/units/interface/rbtree
NV_REPOSITORY_COMPONENTS += userspace/units/interface/static_analysis
NV_REPOSITORY_COMPONENTS += userspace/units/interface/string
NV_REPOSITORY_COMPONENTS += userspace/units/interface/worker
NV_REPOSITORY_COMPONENTS += userspace/units/interface/kref
NV_REPOSITORY_COMPONENTS += userspace/units/interface/list
NV_REPOSITORY_COMPONENTS += userspace/units/bus
NV_REPOSITORY_COMPONENTS += userspace/units/pramin
NV_REPOSITORY_COMPONENTS += userspace/units/priv_ring
NV_REPOSITORY_COMPONENTS += userspace/units/ptimer
NV_REPOSITORY_COMPONENTS += userspace/units/mc
NV_REPOSITORY_COMPONENTS += userspace/units/mm/nvgpu_sgt
NV_REPOSITORY_COMPONENTS += userspace/units/mm/nvgpu_mem
NV_REPOSITORY_COMPONENTS += userspace/units/mm/nvgpu_mem/dgpu
NV_REPOSITORY_COMPONENTS += userspace/units/mm/allocators/buddy_allocator
NV_REPOSITORY_COMPONENTS += userspace/units/mm/allocators/nvgpu_allocator
NV_REPOSITORY_COMPONENTS += userspace/units/mm/allocators/bitmap_allocator
NV_REPOSITORY_COMPONENTS += userspace/units/mm/allocators/page_allocator
NV_REPOSITORY_COMPONENTS += userspace/units/mm/as
NV_REPOSITORY_COMPONENTS += userspace/units/mm/dma
NV_REPOSITORY_COMPONENTS += userspace/units/mm/gmmu/pd_cache
NV_REPOSITORY_COMPONENTS += userspace/units/mm/gmmu/page_table
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/cache/flush_gk20a_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/cache/flush_gv11b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/gmmu/gmmu_gk20a_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/gmmu/gmmu_gm20b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/gmmu/gmmu_gp10b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/gmmu/gmmu_gv11b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/gp10b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/gv11b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/hal/mmu_fault/gv11b_fusa
NV_REPOSITORY_COMPONENTS += userspace/units/mm/mm
NV_REPOSITORY_COMPONENTS += userspace/units/mm/page_table_faults
NV_REPOSITORY_COMPONENTS += userspace/units/mm/vm
NV_REPOSITORY_COMPONENTS += userspace/units/netlist
NV_REPOSITORY_COMPONENTS += userspace/units/fb
NV_REPOSITORY_COMPONENTS += userspace/units/fbp
NV_REPOSITORY_COMPONENTS += userspace/units/fifo
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/channel
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/channel/gk20a
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/channel/gm20b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/channel/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/ctxsw_timeout/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/engine
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/engine/gm20b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/engine/gp10b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/engine/gv100
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/engine/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/fifo
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/fifo/gk20a
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/fifo/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/pbdma
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/pbdma/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/pbdma/gm20b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/pbdma/gp10b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/preempt
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/preempt/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/ramfc/gp10b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/ramfc/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/ramin/gk20a
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/ramin/gm20b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/ramin/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/runlist
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/runlist/gk20a
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/runlist/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/tsg
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/tsg/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/userd/gk20a
NV_REPOSITORY_COMPONENTS += userspace/units/fifo/usermode/gv11b
NV_REPOSITORY_COMPONENTS += userspace/units/fuse
NV_REPOSITORY_COMPONENTS += userspace/units/ltc
NV_REPOSITORY_COMPONENTS += userspace/units/enabled
NV_REPOSITORY_COMPONENTS += userspace/units/falcon
NV_REPOSITORY_COMPONENTS += userspace/units/falcon/falcon_tests
NV_REPOSITORY_COMPONENTS += userspace/units/pmu
NV_REPOSITORY_COMPONENTS += userspace/units/therm
NV_REPOSITORY_COMPONENTS += userspace/units/top
NV_REPOSITORY_COMPONENTS += userspace/units/class
NV_REPOSITORY_COMPONENTS += userspace/units/gr
NV_REPOSITORY_COMPONENTS += userspace/units/gr/falcon
NV_REPOSITORY_COMPONENTS += userspace/units/gr/config
NV_REPOSITORY_COMPONENTS += userspace/units/gr/init
NV_REPOSITORY_COMPONENTS += userspace/units/gr/setup
NV_REPOSITORY_COMPONENTS += userspace/units/gr/fs_state
NV_REPOSITORY_COMPONENTS += userspace/units/gr/global_ctx
NV_REPOSITORY_COMPONENTS += userspace/units/gr/ctx
NV_REPOSITORY_COMPONENTS += userspace/units/gr/obj_ctx
NV_REPOSITORY_COMPONENTS += userspace/units/gr/intr
NV_REPOSITORY_COMPONENTS += userspace/units/acr
NV_REPOSITORY_COMPONENTS += userspace/units/ce
NV_REPOSITORY_COMPONENTS += userspace/units/cg
NV_REPOSITORY_COMPONENTS += userspace/units/rc
NV_REPOSITORY_COMPONENTS += userspace/units/sync
NV_REPOSITORY_COMPONENTS += userspace/units/ecc
NV_REPOSITORY_COMPONENTS += userspace/units/io
endif
endif
# Local Variables:
# indent-tabs-mode: t
# tab-width: 8
# End:
# vi: set tabstop=8 noexpandtab:

NVIDIA-REVIEWERS Normal file, 65 lines

@@ -0,0 +1,65 @@
This is a reviewers file that can be parsed by get_nv_reviewers.py, which
internally uses scripts/get_maintainer.pl from the kernel.
See the MAINTAINERS file in the Linux kernel source tree for details of the
file format. The file format is defined by the upstream Linux kernel community,
so don't modify it without upstreaming any changes to get_maintainer.pl.
Descriptions of section entries (copied from MAINTAINERS):
P: Person (obsolete)
M: Mail patches to: FullName <address@domain>
L: Mailing list that is relevant to this area
B: NvBugs Module Name
W: Web-page with status/info
Q: Patchwork web based patch tracking system site
T: SCM tree type and location. Type is one of: git, hg, quilt, stgit, topgit.
S: Status, one of the following:
Supported: Someone is actually paid to look after this.
Maintained: Someone actually looks after it.
Odd Fixes: It has a maintainer but they don't have time to do
much other than throw the odd patch in. See below.
Orphan: No current maintainer [but maybe you could take the
role as you write your new code].
Obsolete: Old code. Something tagged obsolete generally means
it has been replaced by a better system and you
should be using that.
F: Files and directories with wildcard patterns.
A trailing slash includes all files and subdirectory files.
F: drivers/net/ all files in and below drivers/net
F: drivers/net/* all files in drivers/net, but not below
F: */net/* all files in "any top level directory"/net
One pattern per line. Multiple F: lines acceptable.
X: Files and directories that are NOT maintained, same rules as F:
File exclusions are tested before file matches.
Can be useful for excluding a specific subdirectory, for instance:
F: net/
X: net/ipv6/
matches all files in and below net excluding net/ipv6/
K: Keyword perl extended regex pattern to match content in a
patch or file. For instance:
K: of_get_profile
matches patches or files that contain "of_get_profile"
K: \b(printk|pr_(info|err))\b
matches patches or files that contain one or more of the words
printk, pr_info or pr_err
One regex pattern per line. Multiple K: lines acceptable.
Note: For the hard of thinking, this list is meant to remain in alphabetical
order. If you could add yourselves to it in alphabetical order that would be
so much easier [Ed]
Maintainers List (try to look for most precise areas first)
----------------------------------------------------------------------
GPU
M: Vijayakumar Subbu <vsubbu@nvidia.com>
M: Terje Bergstrom <tbergstrom@nvidia.com>
L: sw-mobile-nvgpu-core@exchange.nvidia.com
B: Mobile_Android_Kernel <keyword = nvgpu-tegra>
B: Mobile_Linux_Kernel <keyword = nvgpu-tegra>
B: Embedded Resource Manager - Linux <keyword = nvgpu-tegra>
S: Supported
F: drivers/gpu/nvgpu/*
F: include/*
F: ../../gpu-firmware-private/

arch/nvgpu-common.yaml Normal file, 1078 lines

File diff suppressed because it is too large.

arch/nvgpu-gpu_hw.yaml Normal file, 224 lines

@@ -0,0 +1,224 @@
# Copyright (c) 2019, NVIDIA CORPORATION. All Rights Reserved.
#
# Define meta elements and units for describing GPU HW interactions in
# nvgpu.
#
headers:
safe: yes
owner: Terje B
sources: [ include/nvgpu/hw/gk20a/hw_bus_gk20a.h,
include/nvgpu/hw/gk20a/hw_ccsr_gk20a.h,
include/nvgpu/hw/gk20a/hw_ce2_gk20a.h,
include/nvgpu/hw/gk20a/hw_ctxsw_prog_gk20a.h,
include/nvgpu/hw/gk20a/hw_falcon_gk20a.h,
include/nvgpu/hw/gk20a/hw_fb_gk20a.h,
include/nvgpu/hw/gk20a/hw_fifo_gk20a.h,
include/nvgpu/hw/gk20a/hw_flush_gk20a.h,
include/nvgpu/hw/gk20a/hw_gmmu_gk20a.h,
include/nvgpu/hw/gk20a/hw_gr_gk20a.h,
include/nvgpu/hw/gk20a/hw_ltc_gk20a.h,
include/nvgpu/hw/gk20a/hw_mc_gk20a.h,
include/nvgpu/hw/gk20a/hw_pbdma_gk20a.h,
include/nvgpu/hw/gk20a/hw_perf_gk20a.h,
include/nvgpu/hw/gk20a/hw_pram_gk20a.h,
include/nvgpu/hw/gk20a/hw_pri_ringmaster_gk20a.h,
include/nvgpu/hw/gk20a/hw_pri_ringstation_gpc_gk20a.h,
include/nvgpu/hw/gk20a/hw_pri_ringstation_sys_gk20a.h,
include/nvgpu/hw/gk20a/hw_proj_gk20a.h,
include/nvgpu/hw/gk20a/hw_pwr_gk20a.h,
include/nvgpu/hw/gk20a/hw_ram_gk20a.h,
include/nvgpu/hw/gk20a/hw_therm_gk20a.h,
include/nvgpu/hw/gk20a/hw_timer_gk20a.h,
include/nvgpu/hw/gk20a/hw_top_gk20a.h,
include/nvgpu/hw/gk20a/hw_trim_gk20a.h,
include/nvgpu/hw/gm20b/hw_bus_gm20b.h,
include/nvgpu/hw/gm20b/hw_ccsr_gm20b.h,
include/nvgpu/hw/gm20b/hw_ce2_gm20b.h,
include/nvgpu/hw/gm20b/hw_ctxsw_prog_gm20b.h,
include/nvgpu/hw/gm20b/hw_falcon_gm20b.h,
include/nvgpu/hw/gm20b/hw_fb_gm20b.h,
include/nvgpu/hw/gm20b/hw_fifo_gm20b.h,
include/nvgpu/hw/gm20b/hw_flush_gm20b.h,
include/nvgpu/hw/gm20b/hw_fuse_gm20b.h,
include/nvgpu/hw/gm20b/hw_gmmu_gm20b.h,
include/nvgpu/hw/gm20b/hw_gr_gm20b.h,
include/nvgpu/hw/gm20b/hw_ltc_gm20b.h,
include/nvgpu/hw/gm20b/hw_mc_gm20b.h,
include/nvgpu/hw/gm20b/hw_pbdma_gm20b.h,
include/nvgpu/hw/gm20b/hw_perf_gm20b.h,
include/nvgpu/hw/gm20b/hw_pram_gm20b.h,
include/nvgpu/hw/gm20b/hw_pri_ringmaster_gm20b.h,
include/nvgpu/hw/gm20b/hw_pri_ringstation_gpc_gm20b.h,
include/nvgpu/hw/gm20b/hw_pri_ringstation_sys_gm20b.h,
include/nvgpu/hw/gm20b/hw_proj_gm20b.h,
include/nvgpu/hw/gm20b/hw_pwr_gm20b.h,
include/nvgpu/hw/gm20b/hw_ram_gm20b.h,
include/nvgpu/hw/gm20b/hw_therm_gm20b.h,
include/nvgpu/hw/gm20b/hw_timer_gm20b.h,
include/nvgpu/hw/gm20b/hw_top_gm20b.h,
include/nvgpu/hw/gm20b/hw_trim_gm20b.h,
include/nvgpu/hw/gp106/hw_bus_gp106.h,
include/nvgpu/hw/gp106/hw_ccsr_gp106.h,
include/nvgpu/hw/gp106/hw_ce_gp106.h,
include/nvgpu/hw/gp106/hw_ctxsw_prog_gp106.h,
include/nvgpu/hw/gp106/hw_falcon_gp106.h,
include/nvgpu/hw/gp106/hw_fb_gp106.h,
include/nvgpu/hw/gp106/hw_fbpa_gp106.h,
include/nvgpu/hw/gp106/hw_fifo_gp106.h,
include/nvgpu/hw/gp106/hw_flush_gp106.h,
include/nvgpu/hw/gp106/hw_fuse_gp106.h,
include/nvgpu/hw/gp106/hw_gmmu_gp106.h,
include/nvgpu/hw/gp106/hw_gr_gp106.h,
include/nvgpu/hw/gp106/hw_ltc_gp106.h,
include/nvgpu/hw/gp106/hw_mc_gp106.h,
include/nvgpu/hw/gp106/hw_pbdma_gp106.h,
include/nvgpu/hw/gp106/hw_perf_gp106.h,
include/nvgpu/hw/gp106/hw_pnvdec_gp106.h,
include/nvgpu/hw/gp106/hw_pram_gp106.h,
include/nvgpu/hw/gp106/hw_pri_ringmaster_gp106.h,
include/nvgpu/hw/gp106/hw_pri_ringstation_gpc_gp106.h,
include/nvgpu/hw/gp106/hw_pri_ringstation_sys_gp106.h,
include/nvgpu/hw/gp106/hw_proj_gp106.h,
include/nvgpu/hw/gp106/hw_psec_gp106.h,
include/nvgpu/hw/gp106/hw_pwr_gp106.h,
include/nvgpu/hw/gp106/hw_ram_gp106.h,
include/nvgpu/hw/gp106/hw_therm_gp106.h,
include/nvgpu/hw/gp106/hw_timer_gp106.h,
include/nvgpu/hw/gp106/hw_top_gp106.h,
include/nvgpu/hw/gp106/hw_trim_gp106.h,
include/nvgpu/hw/gp106/hw_xp_gp106.h,
include/nvgpu/hw/gp106/hw_xve_gp106.h,
include/nvgpu/hw/gp10b/hw_bus_gp10b.h,
include/nvgpu/hw/gp10b/hw_ccsr_gp10b.h,
include/nvgpu/hw/gp10b/hw_ce_gp10b.h,
include/nvgpu/hw/gp10b/hw_ctxsw_prog_gp10b.h,
include/nvgpu/hw/gp10b/hw_falcon_gp10b.h,
include/nvgpu/hw/gp10b/hw_fb_gp10b.h,
include/nvgpu/hw/gp10b/hw_fifo_gp10b.h,
include/nvgpu/hw/gp10b/hw_flush_gp10b.h,
include/nvgpu/hw/gp10b/hw_fuse_gp10b.h,
include/nvgpu/hw/gp10b/hw_gmmu_gp10b.h,
include/nvgpu/hw/gp10b/hw_gr_gp10b.h,
include/nvgpu/hw/gp10b/hw_ltc_gp10b.h,
include/nvgpu/hw/gp10b/hw_mc_gp10b.h,
include/nvgpu/hw/gp10b/hw_pbdma_gp10b.h,
include/nvgpu/hw/gp10b/hw_perf_gp10b.h,
include/nvgpu/hw/gp10b/hw_pram_gp10b.h,
include/nvgpu/hw/gp10b/hw_pri_ringmaster_gp10b.h,
include/nvgpu/hw/gp10b/hw_pri_ringstation_gpc_gp10b.h,
include/nvgpu/hw/gp10b/hw_pri_ringstation_sys_gp10b.h,
include/nvgpu/hw/gp10b/hw_proj_gp10b.h,
include/nvgpu/hw/gp10b/hw_pwr_gp10b.h,
include/nvgpu/hw/gp10b/hw_ram_gp10b.h,
include/nvgpu/hw/gp10b/hw_therm_gp10b.h,
include/nvgpu/hw/gp10b/hw_timer_gp10b.h,
include/nvgpu/hw/gp10b/hw_top_gp10b.h,
include/nvgpu/hw/gv100/hw_bus_gv100.h,
include/nvgpu/hw/gv100/hw_ccsr_gv100.h,
include/nvgpu/hw/gv100/hw_ce_gv100.h,
include/nvgpu/hw/gv100/hw_ctxsw_prog_gv100.h,
include/nvgpu/hw/gv100/hw_falcon_gv100.h,
include/nvgpu/hw/gv100/hw_fb_gv100.h,
include/nvgpu/hw/gv100/hw_fifo_gv100.h,
include/nvgpu/hw/gv100/hw_flush_gv100.h,
include/nvgpu/hw/gv100/hw_fuse_gv100.h,
include/nvgpu/hw/gv100/hw_gmmu_gv100.h,
include/nvgpu/hw/gv100/hw_gr_gv100.h,
include/nvgpu/hw/gv100/hw_ioctrl_gv100.h,
include/nvgpu/hw/gv100/hw_ioctrlmif_gv100.h,
include/nvgpu/hw/gv100/hw_ltc_gv100.h,
include/nvgpu/hw/gv100/hw_mc_gv100.h,
include/nvgpu/hw/gv100/hw_minion_gv100.h,
include/nvgpu/hw/gv100/hw_nvl_gv100.h,
include/nvgpu/hw/gv100/hw_nvlinkip_discovery_gv100.h,
include/nvgpu/hw/gv100/hw_nvlipt_gv100.h,
include/nvgpu/hw/gv100/hw_nvtlc_gv100.h,
include/nvgpu/hw/gv100/hw_pbdma_gv100.h,
include/nvgpu/hw/gv100/hw_perf_gv100.h,
include/nvgpu/hw/gv100/hw_pgsp_gv100.h,
include/nvgpu/hw/gv100/hw_pram_gv100.h,
include/nvgpu/hw/gv100/hw_pri_ringmaster_gv100.h,
include/nvgpu/hw/gv100/hw_pri_ringstation_gpc_gv100.h,
include/nvgpu/hw/gv100/hw_pri_ringstation_sys_gv100.h,
include/nvgpu/hw/gv100/hw_proj_gv100.h,
include/nvgpu/hw/gv100/hw_pwr_gv100.h,
include/nvgpu/hw/gv100/hw_ram_gv100.h,
include/nvgpu/hw/gv100/hw_therm_gv100.h,
include/nvgpu/hw/gv100/hw_timer_gv100.h,
include/nvgpu/hw/gv100/hw_top_gv100.h,
include/nvgpu/hw/gv100/hw_trim_gv100.h,
include/nvgpu/hw/gv100/hw_usermode_gv100.h,
include/nvgpu/hw/gv100/hw_xp_gv100.h,
include/nvgpu/hw/gv100/hw_xve_gv100.h,
include/nvgpu/hw/gv11b/hw_bus_gv11b.h,
include/nvgpu/hw/gv11b/hw_ccsr_gv11b.h,
include/nvgpu/hw/gv11b/hw_ce_gv11b.h,
include/nvgpu/hw/gv11b/hw_ctxsw_prog_gv11b.h,
include/nvgpu/hw/gv11b/hw_falcon_gv11b.h,
include/nvgpu/hw/gv11b/hw_fb_gv11b.h,
include/nvgpu/hw/gv11b/hw_fifo_gv11b.h,
include/nvgpu/hw/gv11b/hw_flush_gv11b.h,
include/nvgpu/hw/gv11b/hw_fuse_gv11b.h,
include/nvgpu/hw/gv11b/hw_gmmu_gv11b.h,
include/nvgpu/hw/gv11b/hw_gr_gv11b.h,
include/nvgpu/hw/gv11b/hw_ltc_gv11b.h,
include/nvgpu/hw/gv11b/hw_mc_gv11b.h,
include/nvgpu/hw/gv11b/hw_pbdma_gv11b.h,
include/nvgpu/hw/gv11b/hw_perf_gv11b.h,
include/nvgpu/hw/gv11b/hw_pram_gv11b.h,
include/nvgpu/hw/gv11b/hw_pri_ringmaster_gv11b.h,
include/nvgpu/hw/gv11b/hw_pri_ringstation_gpc_gv11b.h,
include/nvgpu/hw/gv11b/hw_pri_ringstation_sys_gv11b.h,
include/nvgpu/hw/gv11b/hw_pri_ringstation_fbp_gv11b.h,
include/nvgpu/hw/gv11b/hw_proj_gv11b.h,
include/nvgpu/hw/gv11b/hw_pwr_gv11b.h,
include/nvgpu/hw/gv11b/hw_ram_gv11b.h,
include/nvgpu/hw/gv11b/hw_therm_gv11b.h,
include/nvgpu/hw/gv11b/hw_timer_gv11b.h,
include/nvgpu/hw/gv11b/hw_top_gv11b.h,
include/nvgpu/hw/gv11b/hw_usermode_gv11b.h,
include/nvgpu/hw/tu104/hw_bus_tu104.h,
include/nvgpu/hw/tu104/hw_ccsr_tu104.h,
include/nvgpu/hw/tu104/hw_ce_tu104.h,
include/nvgpu/hw/tu104/hw_ctrl_tu104.h,
include/nvgpu/hw/tu104/hw_ctxsw_prog_tu104.h,
include/nvgpu/hw/tu104/hw_falcon_tu104.h,
include/nvgpu/hw/tu104/hw_fb_tu104.h,
include/nvgpu/hw/tu104/hw_fbpa_tu104.h,
include/nvgpu/hw/tu104/hw_fifo_tu104.h,
include/nvgpu/hw/tu104/hw_flush_tu104.h,
include/nvgpu/hw/tu104/hw_func_tu104.h,
include/nvgpu/hw/tu104/hw_fuse_tu104.h,
include/nvgpu/hw/tu104/hw_gc6_tu104.h,
include/nvgpu/hw/tu104/hw_gmmu_tu104.h,
include/nvgpu/hw/tu104/hw_gr_tu104.h,
include/nvgpu/hw/tu104/hw_ioctrl_tu104.h,
include/nvgpu/hw/tu104/hw_ioctrlmif_tu104.h,
include/nvgpu/hw/tu104/hw_ltc_tu104.h,
include/nvgpu/hw/tu104/hw_mc_tu104.h,
include/nvgpu/hw/tu104/hw_minion_tu104.h,
include/nvgpu/hw/tu104/hw_nvl_tu104.h,
include/nvgpu/hw/tu104/hw_nvlinkip_discovery_tu104.h,
include/nvgpu/hw/tu104/hw_nvlipt_tu104.h,
include/nvgpu/hw/tu104/hw_nvtlc_tu104.h,
include/nvgpu/hw/tu104/hw_pbdma_tu104.h,
include/nvgpu/hw/tu104/hw_perf_tu104.h,
include/nvgpu/hw/tu104/hw_pgsp_tu104.h,
include/nvgpu/hw/tu104/hw_pnvdec_tu104.h,
include/nvgpu/hw/tu104/hw_pram_tu104.h,
include/nvgpu/hw/tu104/hw_pri_ringmaster_tu104.h,
include/nvgpu/hw/tu104/hw_pri_ringstation_gpc_tu104.h,
include/nvgpu/hw/tu104/hw_pri_ringstation_sys_tu104.h,
include/nvgpu/hw/tu104/hw_pri_ringstation_fbp_tu104.h,
include/nvgpu/hw/tu104/hw_proj_tu104.h,
include/nvgpu/hw/tu104/hw_psec_tu104.h,
include/nvgpu/hw/tu104/hw_pwr_tu104.h,
include/nvgpu/hw/tu104/hw_ram_tu104.h,
include/nvgpu/hw/tu104/hw_therm_tu104.h,
include/nvgpu/hw/tu104/hw_timer_tu104.h,
include/nvgpu/hw/tu104/hw_top_tu104.h,
include/nvgpu/hw/tu104/hw_trim_tu104.h,
include/nvgpu/hw/tu104/hw_usermode_tu104.h,
include/nvgpu/hw/tu104/hw_xp_tu104.h,
include/nvgpu/hw/tu104/hw_xve_tu104.h ]

arch/nvgpu-hal-new.yaml Normal file, 836 lines

@@ -0,0 +1,836 @@
# Copyright (c) 2019-2021, NVIDIA CORPORATION. All Rights Reserved.
#
# HAL units. These are the units that have access to HW.
#
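# Each unit below uses the same small set of keys: a "safe" flag, an
# "owner", an optional "gpu" tag (igpu, dgpu or both) and a "sources"
# list; larger areas such as ltc, fifo, mm and gr nest their sub-units
# under "children".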
bus_fusa:
safe: yes
owner: Terje B
sources: [ include/nvgpu/gops/bus.h,
hal/bus/bus_gk20a_fusa.c,
hal/bus/bus_gk20a.h,
hal/bus/bus_gm20b_fusa.c, hal/bus/bus_gm20b.h,
hal/bus/bus_gp10b_fusa.c, hal/bus/bus_gp10b.h,
hal/bus/bus_gv11b_fusa.c, hal/bus/bus_gv11b.h ]
bus:
safe: no
owner: Terje B
sources: [ hal/bus/bus_gk20a.c,
hal/bus/bus_gv100.c, hal/bus/bus_gv100.h,
hal/bus/bus_tu104.c, hal/bus/bus_tu104.h ]
ltc:
owner: Seshendra G
children:
ltc_fusa:
safe: yes
sources: [ hal/ltc/ltc_gm20b_fusa.c,
hal/ltc/ltc_gm20b.h,
hal/ltc/ltc_gp10b_fusa.c,
hal/ltc/ltc_gp10b.h,
hal/ltc/ltc_gv11b_fusa.c,
hal/ltc/ltc_gv11b.h ]
ltc:
safe: no
sources: [ hal/ltc/ltc_gm20b.c,
hal/ltc/ltc_gm20b_dbg.c,
hal/ltc/ltc_gp10b.c,
hal/ltc/ltc_tu104.c,
hal/ltc/ltc_tu104.h ]
intr_fusa:
safe: yes
sources: [ hal/ltc/intr/ltc_intr_gp10b_fusa.c,
hal/ltc/intr/ltc_intr_gp10b.h,
hal/ltc/intr/ltc_intr_gv11b_fusa.c,
hal/ltc/intr/ltc_intr_gv11b.h ]
intr:
safe: no
sources: [ hal/ltc/intr/ltc_intr_gm20b.c,
hal/ltc/intr/ltc_intr_gm20b.h,
hal/ltc/intr/ltc_intr_gp10b.c ]
init_fusa:
safe: yes
owner: Philip E
sources: [ hal/init/hal_gv11b.c,
hal/init/hal_gv11b.h,
hal/init/hal_init.c,
hal/init/hal_gv11b_litter.c,
hal/init/hal_gv11b_litter.h ]
init:
safe: no
owner: Philip E
sources: [ hal/init/hal_gm20b.c,
hal/init/hal_gm20b.h,
hal/init/hal_gp10b.c,
hal/init/hal_gp10b.h,
hal/init/hal_tu104.c,
hal/init/hal_tu104.h,
hal/init/hal_gm20b_litter.c,
hal/init/hal_gm20b_litter.h,
hal/init/hal_gp10b_litter.c,
hal/init/hal_gp10b_litter.h,
hal/init/hal_tu104_litter.c,
hal/init/hal_tu104_litter.h ]
priv_ring_fusa:
safe: yes
owner: Seema K
sources: [ include/nvgpu/gops/priv_ring.h,
hal/priv_ring/priv_ring_gm20b_fusa.c,
hal/priv_ring/priv_ring_gm20b.h,
hal/priv_ring/priv_ring_gp10b_fusa.c,
hal/priv_ring/priv_ring_gp10b.h ]
priv_ring:
safe: no
owner: Seema K
sources: [ hal/priv_ring/priv_ring_gm20b.c,
hal/priv_ring/priv_ring_gv11b.c,
hal/priv_ring/priv_ring_gv11b.h ]
ptimer_fusa:
safe: yes
owner: Terje B
sources: [ hal/ptimer/ptimer_gk20a_fusa.c,
hal/ptimer/ptimer_gk20a.h ]
ptimer:
safe: no
owner: Deepak N
sources: [ hal/ptimer/ptimer_gp10b.c,
hal/ptimer/ptimer_gp10b.h,
hal/ptimer/ptimer_gv11b.c,
hal/ptimer/ptimer_gv11b.h ]
cg_fusa:
safe: yes
owner: Seema K
sources: [ hal/power_features/cg/gating_reglist.h,
hal/power_features/cg/gv11b_gating_reglist.c,
hal/power_features/cg/gv11b_gating_reglist.h ]
cg:
safe: no
owner: Seema K
sources: [ hal/power_features/cg/gm20b_gating_reglist.c,
hal/power_features/cg/gm20b_gating_reglist.h,
hal/power_features/cg/gp10b_gating_reglist.c,
hal/power_features/cg/gp10b_gating_reglist.h,
hal/power_features/cg/tu104_gating_reglist.c,
hal/power_features/cg/tu104_gating_reglist.h ]
rc:
safe: no
owner: Seema K
sources: [ hal/rc/rc_gk20a.c,
hal/rc/rc_gk20a.h,
hal/rc/rc_gv11b.c,
hal/rc/rc_gv11b.h ]
fbpa:
safe: yes
owner: Seshendra G
gpu: dgpu
sources: [ hal/fbpa/fbpa_tu104.c, hal/fbpa/fbpa_tu104.h ]
clk:
safe: yes
owner: Ramesh M
gpu: dgpu
sources: [ hal/clk/clk_tu104.c,
hal/clk/clk_tu104.h ]
clk_mon:
safe: yes
owner: Ramesh M
gpu: dgpu
sources: [ hal/clk/clk_mon_tu104.c,
hal/clk/clk_mon_tu104.h,
include/nvgpu/clk_mon.h]
clk_igpu:
safe: no
owner: Ramesh M
gpu: igpu
sources: [ hal/clk/clk_gk20a.h,
hal/clk/clk_gm20b.c,
hal/clk/clk_gm20b.h ]
fifo:
safe: yes
owner: Seema K
children:
userd:
safe: no
sources: [ hal/fifo/userd_gk20a.c,
hal/fifo/userd_gk20a.h,
hal/fifo/userd_gv11b.c,
hal/fifo/userd_gv11b.h ]
ramfc_fusa:
safe: yes
sources: [ hal/fifo/ramin_gk20a_fusa.c,
hal/fifo/ramfc_gp10b_fusa.c,
hal/fifo/ramfc_gp10b.h,
hal/fifo/ramfc_gv11b_fusa.c,
hal/fifo/ramfc_gv11b.h ]
ramfc:
safe: no
sources: [ hal/fifo/ramfc_gk20a.c,
hal/fifo/ramfc_gk20a.h,
hal/fifo/ramfc_gp10b.c,
hal/fifo/ramfc_tu104.c,
hal/fifo/ramfc_tu104.h ]
ramin_fusa:
safe: yes
sources: [ hal/fifo/ramin_gv11b.h,
hal/fifo/ramin_gm20b.h,
hal/fifo/ramin_gv11b_fusa.c,
hal/fifo/ramin_gm20b_fusa.c ]
ramin:
safe: no
sources: [ hal/fifo/ramin_gk20a.h,
hal/fifo/ramin_gp10b.h,
hal/fifo/ramin_gk20a.c,
hal/fifo/ramin_gp10b.c,
hal/fifo/ramin_tu104.c,
hal/fifo/ramin_tu104.h ]
runlist_fusa:
safe: yes
sources: [ hal/fifo/runlist_fifo_gk20a.c,
hal/fifo/runlist_fifo_gk20a_fusa.c,
hal/fifo/runlist_fifo_gk20a.h,
hal/fifo/runlist_fifo_gv11b.c,
hal/fifo/runlist_fifo_gv11b_fusa.c,
hal/fifo/runlist_fifo_gv11b.h,
hal/fifo/runlist_ram_gv11b_fusa.c,
hal/fifo/runlist_ram_gv11b.h ]
runlist:
safe: no
sources: [ hal/fifo/runlist_fifo_gv100.c,
hal/fifo/runlist_fifo_gv100.h,
hal/fifo/runlist_fifo_tu104.c,
hal/fifo/runlist_fifo_tu104.h,
hal/fifo/runlist_ram_gk20a.c,
hal/fifo/runlist_ram_gk20a.h,
hal/fifo/runlist_ram_tu104.c,
hal/fifo/runlist_ram_tu104.h ]
channel_fusa:
safe: yes
sources: [ hal/fifo/channel_gk20a_fusa.c,
hal/fifo/channel_gk20a.h,
hal/fifo/channel_gm20b_fusa.c,
hal/fifo/channel_gm20b.h,
hal/fifo/channel_gv11b_fusa.c,
hal/fifo/channel_gv11b.h ]
channel:
safe: no
sources: [ hal/fifo/channel_gk20a.c,
hal/fifo/channel_gm20b.c,
hal/fifo/channel_gv100.c,
hal/fifo/channel_gv100.h ]
tsg_fusa:
safe: yes
sources: [ hal/fifo/tsg_gk20a.h,
hal/fifo/tsg_gk20a_fusa.c,
hal/fifo/tsg_gv11b.h,
hal/fifo/tsg_gv11b_fusa.c ]
tsg:
safe: no
sources: [ hal/fifo/tsg_gk20a.c ]
fifo_fusa:
safe: yes
sources: [ hal/fifo/fifo_intr_gk20a_fusa.c,
hal/fifo/fifo_intr_gk20a.h,
hal/fifo/fifo_intr_gv11b_fusa.c,
hal/fifo/fifo_intr_gv11b.h,
hal/fifo/ctxsw_timeout_gv11b_fusa.c,
hal/fifo/ctxsw_timeout_gv11b.h,
hal/fifo/fifo_gk20a_fusa.c,
hal/fifo/fifo_gk20a.h,
hal/fifo/fifo_gv11b_fusa.c,
hal/fifo/fifo_gv11b.h ]
fifo:
safe: no
sources: [ hal/fifo/fifo_intr_gk20a.c,
hal/fifo/fifo_intr_gv100.c,
hal/fifo/fifo_intr_gv100.h,
hal/fifo/ctxsw_timeout_gk20a.c,
hal/fifo/ctxsw_timeout_gk20a.h,
hal/fifo/mmu_fault_gk20a.c,
hal/fifo/mmu_fault_gk20a.h,
hal/fifo/mmu_fault_gm20b.c,
hal/fifo/mmu_fault_gm20b.h,
hal/fifo/mmu_fault_gp10b.c,
hal/fifo/mmu_fault_gp10b.h,
hal/fifo/fifo_gk20a.c,
hal/fifo/fifo_tu104.c,
hal/fifo/fifo_tu104.h ]
engine_status_fusa:
safe: yes
sources: [ hal/fifo/engine_status_gm20b_fusa.c,
hal/fifo/engine_status_gm20b.h,
hal/fifo/engine_status_gv100_fusa.c,
hal/fifo/engine_status_gv100.h ]
engine_status:
safe: no
sources: [ hal/fifo/engine_status_gm20b.c ]
engines_fusa:
safe: yes
sources: [ hal/fifo/engines_gp10b_fusa.c,
hal/fifo/engines_gp10b.h,
hal/fifo/engines_gv11b_fusa.c,
hal/fifo/engines_gv11b.h ]
engines:
safe: no
sources: [ hal/fifo/engines_gm20b.c,
hal/fifo/engines_gm20b.h ]
pbdma_status:
safe: yes
sources: [ hal/fifo/pbdma_status_gm20b_fusa.c,
hal/fifo/pbdma_status_gm20b.h ]
pbdma_fusa:
safe: yes
sources: [ hal/fifo/pbdma_gm20b_fusa.c,
hal/fifo/pbdma_gm20b.h,
hal/fifo/pbdma_gp10b_fusa.c,
hal/fifo/pbdma_gp10b.h,
hal/fifo/pbdma_gv11b_fusa.c,
hal/fifo/pbdma_gv11b.h ]
pbdma:
safe: no
sources: [ hal/fifo/pbdma_gm20b.c,
hal/fifo/pbdma_gp10b.c,
hal/fifo/pbdma_tu104.c,
hal/fifo/pbdma_tu104.h ]
preempt_fusa:
safe: yes
sources: [ hal/fifo/preempt_gv11b_fusa.c,
hal/fifo/preempt_gv11b.h ]
preempt:
safe: no
sources: [ hal/fifo/preempt_gk20a.c,
hal/fifo/preempt_gk20a.h ]
usermode_fusa:
safe: yes
sources: [ hal/fifo/usermode_gv11b_fusa.c,
hal/fifo/usermode_gv11b.h ]
usermode:
safe: no
sources: [ hal/fifo/usermode_tu104.c,
hal/fifo/usermode_tu104.h ]
fuse_fusa:
safe: yes
owner: Seema K
sources: [ hal/fuse/fuse_gm20b_fusa.c,
hal/fuse/fuse_gm20b.h,
hal/fuse/fuse_gp10b_fusa.c,
hal/fuse/fuse_gp10b.h ]
fuse:
safe: no
owner: Seema K
sources: [ hal/fuse/fuse_gm20b.c,
hal/fuse/fuse_gp106.c,
hal/fuse/fuse_gp106.h,
hal/fuse/fuse_tu104.c,
hal/fuse/fuse_tu104.h ]
gsp:
safe: no
sources: [ hal/gsp/gsp_tu104.c,
hal/gsp/gsp_tu104.h ]
mm:
safe: yes
owner: Alex W
children:
gmmu_fusa:
safe: yes
sources: [ hal/mm/gmmu/gmmu_gk20a_fusa.c,
hal/mm/gmmu/gmmu_gk20a.h,
hal/mm/gmmu/gmmu_gm20b_fusa.c,
hal/mm/gmmu/gmmu_gm20b.h,
hal/mm/gmmu/gmmu_gp10b_fusa.c,
hal/mm/gmmu/gmmu_gp10b.h,
hal/mm/gmmu/gmmu_gv11b_fusa.c,
hal/mm/gmmu/gmmu_gv11b.h ]
gmmu:
safe: no
sources: [ hal/mm/gmmu/gmmu_gk20a.c,
hal/mm/gmmu/gmmu_gm20b.c]
cache_fusa:
safe: yes
sources: [ hal/mm/cache/flush_gk20a_fusa.c,
hal/mm/cache/flush_gk20a.h,
hal/mm/cache/flush_gv11b_fusa.c,
hal/mm/cache/flush_gv11b.h ]
cache:
safe: no
sources: [ hal/mm/cache/flush_gk20a.c ]
mmu_fault:
safe: yes
sources: [ hal/mm/mmu_fault/mmu_fault_gv11b_fusa.c,
hal/mm/mmu_fault/mmu_fault_gv11b.h ]
mm_fusa:
safe: yes
sources: [ hal/mm/mm_gp10b_fusa.c,
hal/mm/mm_gp10b.h,
hal/mm/mm_gv11b_fusa.c,
hal/mm/mm_gv11b.h]
mm:
safe: no
sources: [ hal/mm/mm_gk20a.c,
hal/mm/mm_gk20a.h,
hal/mm/mm_gm20b.c,
hal/mm/mm_gm20b.h,
hal/mm/mm_gv100.c,
hal/mm/mm_gv100.h,
hal/mm/mm_tu104.c,
hal/mm/mm_tu104.h]
sync:
safe: yes
owner: Thomas F
children:
sema:
safe: no
sources: [ hal/sync/sema_cmdbuf_gk20a.c,
hal/sync/sema_cmdbuf_gk20a.h,
hal/sync/sema_cmdbuf_gv11b.c,
hal/sync/sema_cmdbuf_gv11b.h ]
syncpt:
safe: no
sources: [ hal/sync/syncpt_cmdbuf_gk20a.c,
hal/sync/syncpt_cmdbuf_gk20a.h,
hal/sync/syncpt_cmdbuf_gv11b.c]
syncpt_fusa:
safe: yes
sources: [ hal/sync/syncpt_cmdbuf_gv11b_fusa.c,
hal/sync/syncpt_cmdbuf_gv11b.h ]
therm_fusa:
safe: yes
owner: Seshendra G
sources: [ hal/therm/therm_gv11b_fusa.c,
hal/therm/therm_gv11b.h ]
therm:
safe: no
owner: Seshendra G
sources: [ hal/therm/therm_gm20b.c,
hal/therm/therm_gm20b.h,
hal/therm/therm_tu104.c,
hal/therm/therm_tu104.h,
hal/therm/therm_gp10b.c,
hal/therm/therm_gp10b.h ]
cbc:
safe: no
owner: Seshendra G
sources: [ hal/cbc/cbc_gm20b.c,
hal/cbc/cbc_gm20b.h,
hal/cbc/cbc_gp10b.c,
hal/cbc/cbc_gp10b.h,
hal/cbc/cbc_gv11b.c,
hal/cbc/cbc_gv11b.h,
hal/cbc/cbc_tu104.c,
hal/cbc/cbc_tu104.h ]
ce_fusa:
safe: yes
owner: Thomas F
sources: [ hal/ce/ce_gp10b_fusa.c,
hal/ce/ce_gp10b.h,
hal/ce/ce_gv11b_fusa.c,
hal/ce/ce_gv11b.h ]
ce:
safe: no
owner: Thomas F
sources: [ hal/ce/ce2_gk20a.c,
hal/ce/ce2_gk20a.h,
hal/ce/ce_tu104.c,
hal/ce/ce_tu104.h ]
gr:
safe: yes
owner: Deepak N
children:
ecc_fusa:
safe: yes
sources: [hal/gr/ecc/ecc_gv11b_fusa.c,
hal/gr/ecc/ecc_gv11b.h ]
ecc:
safe: no
sources: [hal/gr/ecc/ecc_gv11b.c,
hal/gr/ecc/ecc_gp10b.c,
hal/gr/ecc/ecc_gp10b.h ]
ctxsw_prog_fusa:
safe: yes
sources: [ hal/gr/ctxsw_prog/ctxsw_prog_gm20b_fusa.c,
hal/gr/ctxsw_prog/ctxsw_prog_gm20b.h,
hal/gr/ctxsw_prog/ctxsw_prog_gp10b_fusa.c,
hal/gr/ctxsw_prog/ctxsw_prog_gp10b.h,
hal/gr/ctxsw_prog/ctxsw_prog_gv11b_fusa.c,
hal/gr/ctxsw_prog/ctxsw_prog_gv11b.h ]
ctxsw_prog:
safe: no
sources: [ hal/gr/ctxsw_prog/ctxsw_prog_gm20b.c,
hal/gr/ctxsw_prog/ctxsw_prog_gm20b_dbg.c,
hal/gr/ctxsw_prog/ctxsw_prog_gp10b.c,
hal/gr/ctxsw_prog/ctxsw_prog_gv11b.c]
config_fusa:
safe: yes
sources: [ hal/gr/config/gr_config_gm20b_fusa.c,
hal/gr/config/gr_config_gm20b.h,
hal/gr/config/gr_config_gv100_fusa.c,
hal/gr/config/gr_config_gv100.h ]
config:
safe: no
sources: [ hal/gr/config/gr_config_gm20b.c ]
init_fusa:
safe: yes
sources: [ hal/gr/init/gr_init_gm20b_fusa.c,
hal/gr/init/gr_init_gm20b.h,
hal/gr/init/gr_init_gp10b_fusa.c,
hal/gr/init/gr_init_gp10b.h,
hal/gr/init/gr_init_gv11b_fusa.c,
hal/gr/init/gr_init_gv11b.h ]
init:
safe: no
sources: [ hal/gr/init/gr_init_gm20b.c,
hal/gr/init/gr_init_gp10b.c,
hal/gr/init/gr_init_gv100.c,
hal/gr/init/gr_init_gv100.h,
hal/gr/init/gr_init_gv11b.c,
hal/gr/init/gr_init_tu104.c,
hal/gr/init/gr_init_tu104.h ]
intr_fusa:
safe: yes
sources: [ hal/gr/intr/gr_intr_gm20b_fusa.c,
hal/gr/intr/gr_intr_gm20b.h,
hal/gr/intr/gr_intr_gp10b_fusa.c,
hal/gr/intr/gr_intr_gp10b.h,
hal/gr/intr/gr_intr_gv11b_fusa.c,
hal/gr/intr/gr_intr_gv11b.h ]
intr:
safe: no
sources: [ hal/gr/intr/gr_intr_gm20b.c,
hal/gr/intr/gr_intr_gp10b.c,
hal/gr/intr/gr_intr_tu104.c,
hal/gr/intr/gr_intr_tu104.h ]
falcon_fusa:
safe: yes
sources: [ hal/gr/falcon/gr_falcon_gm20b_fusa.c,
hal/gr/falcon/gr_falcon_gm20b.h,
hal/gr/falcon/gr_falcon_gp10b_fusa.c,
hal/gr/falcon/gr_falcon_gp10b.h,
hal/gr/falcon/gr_falcon_gv11b_fusa.c,
hal/gr/falcon/gr_falcon_gv11b.h ]
falcon:
safe: no
sources: [ hal/gr/falcon/gr_falcon_gm20b.c,
hal/gr/falcon/gr_falcon_tu104.c,
hal/gr/falcon/gr_falcon_tu104.h ]
fecs_trace:
safe: no
sources: [ hal/gr/fecs_trace/fecs_trace_gm20b.c,
hal/gr/fecs_trace/fecs_trace_gm20b.h,
hal/gr/fecs_trace/fecs_trace_gv11b.c,
hal/gr/fecs_trace/fecs_trace_gv11b.h ]
hwpm_map:
safe: no
sources: [ hal/gr/hwpm_map/hwpm_map_gv100.c,
hal/gr/hwpm_map/hwpm_map_gv100.h ]
zbc:
safe: no
sources: [ hal/gr/zbc/zbc_gm20b.c,
hal/gr/zbc/zbc_gm20b.h,
hal/gr/zbc/zbc_gp10b.c,
hal/gr/zbc/zbc_gp10b.h,
hal/gr/zbc/zbc_gv11b.c,
hal/gr/zbc/zbc_gv11b.h ]
zcull:
safe: no
sources: [ hal/gr/zcull/zcull_gm20b.c,
hal/gr/zcull/zcull_gm20b.h,
hal/gr/zcull/zcull_gv11b.c,
hal/gr/zcull/zcull_gv11b.h ]
gr:
safe: no
sources: [ hal/gr/gr/gr_gk20a.c, hal/gr/gr/gr_gk20a.h,
hal/gr/gr/gr_gm20b.c, hal/gr/gr/gr_gm20b.h,
hal/gr/gr/gr_gp10b.c, hal/gr/gr/gr_gp10b.h,
hal/gr/gr/gr_gv100.c, hal/gr/gr/gr_gv100.h,
hal/gr/gr/gr_gv11b.c, hal/gr/gr/gr_gv11b.h,
hal/gr/gr/gr_tu104.c, hal/gr/gr/gr_tu104.h,
include/nvgpu/gr/warpstate.h,
hal/gr/gr/gr_pri_gk20a.h,
hal/gr/gr/gr_pri_gv11b.h ]
regops:
safe: no
owner: Deepak N
sources: [ hal/regops/regops_gm20b.c,
hal/regops/regops_gm20b.h,
hal/regops/regops_gp10b.c,
hal/regops/regops_gp10b.h,
hal/regops/regops_gv11b.c,
hal/regops/regops_gv11b.h,
hal/regops/regops_tu104.c,
hal/regops/regops_tu104.h,
hal/regops/allowlist_gv11b.c,
hal/regops/allowlist_gv11b.h,
hal/regops/allowlist_tu104.c,
hal/regops/allowlist_tu104.h ]
falcon_fusa:
safe: yes
owner: Sagar K
sources: [ hal/falcon/falcon_gk20a_fusa.c,
hal/falcon/falcon_gk20a.h ]
falcon:
safe: no
owner: Sagar K
sources: [ hal/falcon/falcon_gk20a.c ]
mc_fusa:
safe: yes
owner: Seema K
sources: [ hal/mc/mc_gm20b_fusa.c,
hal/mc/mc_gm20b.h,
hal/mc/mc_gp10b_fusa.c,
hal/mc/mc_gp10b.h,
hal/mc/mc_gv11b_fusa.c,
hal/mc/mc_gv11b.h ]
mc:
safe: no
owner: Seema K
sources: [ hal/mc/mc_gm20b.c,
hal/mc/mc_gv100.c,
hal/mc/mc_gv100.h,
hal/mc/mc_tu104.c,
hal/mc/mc_tu104.h ]
fb_fusa:
safe: yes
owner: Seshendra G
sources: [ include/nvgpu/gops/fb.h,
hal/fb/fb_gm20b_fusa.c,
hal/fb/fb_gm20b.h,
hal/fb/fb_gv11b_fusa.c,
hal/fb/fb_gv11b.h,
hal/fb/ecc/fb_ecc_gv11b.h, hal/fb/ecc/fb_ecc_gv11b_fusa.c,
hal/fb/intr/fb_intr_gv11b.h, hal/fb/intr/fb_intr_gv11b_fusa.c,
hal/fb/fb_mmu_fault_gv11b.h, hal/fb/fb_mmu_fault_gv11b_fusa.c,
hal/fb/intr/fb_intr_ecc_gv11b.h, hal/fb/intr/fb_intr_ecc_gv11b_fusa.c ]
fb:
safe: no
owner: Seshendra G
sources: [ hal/fb/fb_gm20b.c,
hal/fb/fb_gp106.c, hal/fb/fb_gp106.h,
hal/fb/fb_gp10b.c, hal/fb/fb_gp10b.h,
hal/fb/fb_gv100.c, hal/fb/fb_gv100.h,
hal/fb/fb_gv11b.c,
hal/fb/fb_tu104.c, hal/fb/fb_tu104.h,
hal/fb/intr/fb_intr_gv100.h, hal/fb/intr/fb_intr_gv100.c,
hal/fb/fb_mmu_fault_tu104.h, hal/fb/fb_mmu_fault_tu104.c,
hal/fb/intr/fb_intr_tu104.c, hal/fb/intr/fb_intr_tu104.h,
hal/fb/intr/fb_intr_ecc_gv11b.c ]
pmu_fusa:
safe: yes
owner: Mahantesh K
sources: [ hal/pmu/pmu_gk20a_fusa.c,
hal/pmu/pmu_gk20a.h,
hal/pmu/pmu_gv11b_fusa.c,
hal/pmu/pmu_gv11b.h ]
pmu:
safe: no
owner: Mahantesh K
sources: [ hal/pmu/pmu_gk20a.c,
hal/pmu/pmu_gm20b.c,
hal/pmu/pmu_gm20b.h,
hal/pmu/pmu_gp10b.c,
hal/pmu/pmu_gp10b.h,
hal/pmu/pmu_gv11b.c,
hal/pmu/pmu_tu104.c,
hal/pmu/pmu_tu104.h ]
nvlink:
safe: yes
gpu: dgpu
sources: [ hal/nvlink/link_mode_transitions_gv100.c,
hal/nvlink/link_mode_transitions_gv100.h,
hal/nvlink/link_mode_transitions_tu104.c,
hal/nvlink/link_mode_transitions_tu104.h,
hal/nvlink/intr_and_err_handling_tu104.c,
hal/nvlink/intr_and_err_handling_tu104.h,
hal/nvlink/nvlink_gv100.c,
hal/nvlink/nvlink_gv100.h,
hal/nvlink/nvlink_tu104.c,
hal/nvlink/nvlink_tu104.h,
hal/nvlink/minion_gv100.c,
hal/nvlink/minion_gv100.h,
hal/nvlink/minion_tu104.c,
hal/nvlink/minion_tu104.h ]
sec2:
safe: yes
owner: Sagar K
gpu: dgpu
sources: [ hal/sec2/sec2_tu104.c,
hal/sec2/sec2_tu104.h ]
netlist_fusa:
safe: yes
owner: Seshendra G
gpu: both
sources: [ include/nvgpu/gops/netlist.h,
hal/netlist/netlist_gv11b_fusa.c,
hal/netlist/netlist_gv11b.h ]
netlist:
safe: no
owner: Seshendra G
gpu: both
sources: [ hal/netlist/netlist_gm20b.c,
hal/netlist/netlist_gm20b.h,
hal/netlist/netlist_gp10b.c,
hal/netlist/netlist_gp10b.h,
hal/netlist/netlist_gv100.c,
hal/netlist/netlist_gv100.h,
hal/netlist/netlist_tu104.c,
hal/netlist/netlist_tu104.h ]
nvdec:
safe: no
sources: [ hal/nvdec/nvdec_gp106.c,
hal/nvdec/nvdec_gp106.h,
hal/nvdec/nvdec_tu104.c,
hal/nvdec/nvdec_tu104.h ]
perf:
safe: no
owner: Deepak N
sources: [ hal/perf/perf_gm20b.c,
hal/perf/perf_gm20b.h,
hal/perf/perf_gv11b.c,
hal/perf/perf_gv11b.h,
hal/perf/perf_tu104.c,
hal/perf/perf_tu104.h ]
pramin:
safe: yes
gpu: dgpu
sources: [ hal/pramin/pramin_gp10b.c,
hal/pramin/pramin_gp10b.h,
hal/pramin/pramin_gv100.c,
hal/pramin/pramin_gv100.h,
hal/pramin/pramin_init.c,
hal/pramin/pramin_init.h,
hal/pramin/pramin_tu104.c,
hal/pramin/pramin_tu104.h ]
class_fusa:
safe: yes
owner: Seshendra G
sources: [ hal/class/class_gm20b.h,
hal/class/class_gp10b.h,
hal/class/class_gv11b_fusa.c,
hal/class/class_gv11b.h ]
class:
safe: no
owner: Seshendra G
sources: [ hal/class/class_gm20b.c,
hal/class/class_gp10b.c,
hal/class/class_tu104.c,
hal/class/class_tu104.h ]
func:
safe: yes
owner: Terje B
gpu: dgpu
sources: [ hal/func/func_tu104.c,
hal/func/func_tu104.h ]
top_fusa:
safe: yes
owner: Tejal K
sources: [ include/nvgpu/gops/top.h,
hal/top/top_gm20b_fusa.c,
hal/top/top_gm20b.h,
hal/top/top_gp10b.h,
hal/top/top_gv11b_fusa.c,
hal/top/top_gv11b.h ]
top:
safe: no
owner: Tejal K
sources: [ hal/top/top_gm20b.c,
hal/top/top_gp106.c,
hal/top/top_gp106.h,
hal/top/top_gp10b.c,
hal/top/top_gv100.c,
hal/top/top_gv100.h ]
bios:
safe: yes
owner: Tejal
gpu: dgpu
sources: [ hal/bios/bios_tu104.c,
hal/bios/bios_tu104.h ]
xve:
safe: yes
owner: Alex W
gpu: dgpu
sources: [ include/nvgpu/xve.h,
hal/xve/xve_gp106.c,
hal/xve/xve_gp106.h,
hal/xve/xve_tu104.c,
hal/xve/xve_tu104.h ]
tpc:
safe: no
owner: Divya S
sources: [ hal/tpc/tpc_gv11b.c,
hal/tpc/tpc_gv11b.h ]
cic:
safe: yes
owner: Tejal K
sources: [ hal/cic/cic_gv11b_fusa.c,
hal/cic/cic_lut_gv11b_fusa.c,
hal/cic/cic_gv11b.h ]

arch/nvgpu-hal-vgpu.yaml Normal file, 29 lines

@@ -0,0 +1,29 @@
# Copyright (c) 2019-2021, NVIDIA CORPORATION. All Rights Reserved.
#
# VGPU HAL units.
#
init:
safe: no
owner: Aparna D
sources: [ hal/vgpu/init/init_hal_vgpu.c,
hal/vgpu/init/init_hal_vgpu.h,
hal/vgpu/init/vgpu_hal_gv11b.c,
hal/vgpu/init/vgpu_hal_gv11b.h ]
fifo:
safe: no
owner: Aparna D
children:
fifo:
safe: no
sources: [ hal/vgpu/fifo/fifo_gv11b_vgpu.c,
hal/vgpu/fifo/fifo_gv11b_vgpu.h ]
sync:
safe: no
owner: Aparna D
children:
syncpt:
sources: [ hal/vgpu/sync/syncpt_cmdbuf_gv11b_vgpu.c,
hal/vgpu/sync/syncpt_cmdbuf_gv11b_vgpu.h ]

arch/nvgpu-hal.yaml Normal file, 10 lines

@@ -0,0 +1,10 @@
# Copyright (c) 2019-2020, NVIDIA CORPORATION. All Rights Reserved.
#
# HAL units. These are the units that have access to HW.
#
init:
safe: yes
owner: Terje B
sources: [ include/nvgpu/hal_init.h ]

arch/nvgpu-interface.yaml Normal file, 132 lines

@@ -0,0 +1,132 @@
# Copyright (c) 2019, NVIDIA CORPORATION. All Rights Reserved.
#
# OS interface units and utilities. Often represented simply by a header file.
#
atomic:
safe: yes
sources: [ include/nvgpu/atomic.h ]
barrier:
safe: yes
sources: [ include/nvgpu/barrier.h ]
bitops:
safe: yes
sources: [ include/nvgpu/bitops.h ]
bsearch:
safe: yes
sources: [ include/nvgpu/bsearch.h ]
bug:
safe: yes
sources: [ include/nvgpu/bug.h ]
circ_buf:
safe: yes
sources: [ include/nvgpu/circ_buf.h ]
cond:
safe: yes
sources: [ include/nvgpu/cond.h ]
dma:
safe: yes
sources: [ include/nvgpu/dma.h ]
# This one is likely not structured correctly.
dt:
safe: yes
sources: [ include/nvgpu/dt.h ]
# Also a problem.
errno:
safe: yes
sources: [ include/nvgpu/errno.h ]
firmware:
safe: yes
sources: [ include/nvgpu/firmware.h ]
fuse:
safe: yes
sources: [ include/nvgpu/fuse.h ]
io:
safe: yes
sources: [ include/nvgpu/io.h, include/nvgpu/io_usermode.h ]
kmem:
safe: yes
sources: [ include/nvgpu/kmem.h ]
kref:
safe: yes
sources: [ include/nvgpu/kref.h ]
list:
safe: yes
sources: [ include/nvgpu/list.h ]
tags: unit-testable
lock:
safe: yes
sources: [ include/nvgpu/lock.h ]
log:
safe: yes
sources: [ include/nvgpu/log.h, include/nvgpu/log_common.h ]
log2:
safe: yes
sources: [ include/nvgpu/log2.h ]
rwsem:
safe: yes
sources: [ include/nvgpu/rwsem.h ]
sizes:
safe: yes
sources: [ include/nvgpu/sizes.h ]
soc:
safe: yes
sources: [ include/nvgpu/soc.h ]
sort:
safe: yes
sources: [ include/nvgpu/sort.h ]
string:
safe: yes
sources: [ include/nvgpu/string.h ]
tags: unit-testable
thread:
safe: yes
sources: [ include/nvgpu/thread.h ]
timers:
safe: yes
sources: [ include/nvgpu/timers.h ]
types:
safe: yes
sources: [ include/nvgpu/types.h ]
nvgpu_sgt:
safe: yes
sources: [ include/nvgpu/nvgpu_sgt_os.h ]
os_sched:
safe: yes
sources: [ include/nvgpu/os_sched.h ]
nvhost:
safe: yes
sources: [ include/nvgpu/nvhost.h ]
vpr:
safe: no
sources: [ include/nvgpu/vpr.h ]

arch/nvgpu-linux.yaml Normal file, 256 lines

@@ -0,0 +1,256 @@
#
# Copyright (c) 2019-2021, NVIDIA CORPORATION. All Rights Reserved.
#
# Linux elements and units in nvgpu.
#
# The safe: tag is omitted throughout since all Linux units are by definition
# not safe.
#
# I also have not put a huge amount of thought into this since none of this
# code is "safe" code. Nor are we planning on spending a lot of effort to
# clean this up. At least not yet.
bsearch:
sources: [ os/linux/bsearch.c ]
channel:
sources: [ os/linux/linux-channel.c, os/linux/channel.h ]
vpr:
sources: [ os/linux/vpr.c ]
clk:
sources: [ os/linux/clk.c, os/linux/clk.h ]
cde:
sources: [ os/linux/cde.c, os/linux/cde.h,
os/linux/cde_gm20b.c, os/linux/cde_gm20b.h,
os/linux/cde_gp10b.c, os/linux/cde_gp10b.h ]
comptags:
sources: [ os/linux/comptags.c ]
cond:
sources: [ os/linux/cond.c ]
dma:
sources: [ os/linux/linux-dma.c ]
dmabuf:
sources: [ os/linux/dmabuf_vidmem.c, os/linux/dmabuf_vidmem.h,
os/linux/dmabuf_priv.c, os/linux/dmabuf_priv.h ]
driver_common:
sources: [ os/linux/driver_common.c, os/linux/driver_common.h ]
dt:
sources: [ os/linux/dt.c ]
debug:
sources: [ os/linux/debug.c,
os/linux/debug_allocator.c,
os/linux/debug_allocator.h,
os/linux/debug_bios.c,
os/linux/debug_bios.h,
os/linux/debug_cde.c,
os/linux/debug_cde.h,
os/linux/debug_ce.c,
os/linux/debug_ce.h,
os/linux/debug_clk_gm20b.c,
os/linux/debug_clk_gm20b.h,
os/linux/debug_clk_tu104.c,
os/linux/debug_clk_tu104.h,
os/linux/debug_fecs_trace.c,
os/linux/debug_fecs_trace.h,
os/linux/debug_fifo.c,
os/linux/debug_fifo.h,
os/linux/debug_gr.c,
os/linux/debug_gr.h,
os/linux/debug_hal.c,
os/linux/debug_hal.h,
os/linux/debug_kmem.c,
os/linux/debug_kmem.h,
os/linux/debug_ltc.c,
os/linux/debug_ltc.h,
os/linux/debug_pmgr.c,
os/linux/debug_pmgr.h,
os/linux/debug_pmu.c,
os/linux/debug_pmu.h,
os/linux/debug_sched.c,
os/linux/debug_sched.h,
os/linux/debug_therm_tu104.c,
os/linux/debug_therm_tu104.h,
os/linux/debug_xve.c,
os/linux/debug_xve.h,
os/linux/debug_s_param.c,
os/linux/debug_s_param.h,
os/linux/debug_volt.c,
os/linux/debug_volt.h,
os/linux/swprofile_debugfs.c,
os/linux/swprofile_debugfs.h,
os/linux/fecs_trace_linux.c,
os/linux/fecs_trace_linux.h,
os/linux/nvlink_probe.c ]
firmware:
sources: [ os/linux/firmware.c ]
fuse:
sources: [ os/linux/fuse.c ]
intr:
sources: [ os/linux/intr.c ]
io:
sources: [ os/linux/io_usermode.c,
os/linux/linux-io.c ]
ioctl:
sources: [ os/linux/ioctl.c,
os/linux/ioctl.h,
os/linux/ioctl_as.c,
os/linux/ioctl_as.h,
os/linux/ioctl_channel.c,
os/linux/ioctl_channel.h,
os/linux/ioctl_clk_arb.c,
os/linux/ioctl_ctrl.c,
os/linux/ioctl_ctrl.h,
os/linux/ioctl_dbg.c,
os/linux/ioctl_dbg.h,
os/linux/ioctl_prof.c,
os/linux/ioctl_prof.h,
os/linux/ioctl_tsg.c,
os/linux/ioctl_tsg.h,
os/linux/power_ops.c,
os/linux/power_ops.h ]
kmem:
sources: [ os/linux/kmem.c, os/linux/kmem_priv.h ]
log:
sources: [ os/linux/log.c ]
module:
sources: [ os/linux/module.c, os/linux/module.h,
os/linux/module_usermode.c, os/linux/module_usermode.h ]
nvgpu_mem:
sources: [ os/linux/nvgpu_mem.c ]
nvhost:
sources: [ os/linux/nvhost.c,
os/linux/nvhost_common.c,
os/linux/nvhost_host1x.c,
os/linux/nvhost_priv.h ]
nvlink:
sources: [ os/linux/nvlink.c,
os/linux/nvlink.h ]
fence:
sources: [ os/linux/os_fence_android.c,
os/linux/os_fence_android_sema.c,
os/linux/os_fence_dma.c,
os/linux/os_fence_dma_sema.c,
os/linux/os_fence_syncpt.c,
os/linux/os_fence_priv.h,
os/linux/sync_sema_android.c,
os/linux/sync_sema_android.h,
os/linux/sync_sema_dma.c,
os/linux/sync_sema_dma.h,
include/nvgpu/os_fence.h,
include/nvgpu/os_fence_semas.h,
include/nvgpu/os_fence_syncpts.h ]
ops:
sources: [ os/linux/os_ops.c, os/linux/os_ops.h,
os/linux/os_ops_gm20b.c, os/linux/os_ops_gm20b.h,
os/linux/os_ops_gp10b.c, os/linux/os_ops_gp10b.h,
os/linux/os_ops_gv100.c, os/linux/os_ops_gv100.h,
os/linux/os_ops_gv11b.c, os/linux/os_ops_gv11b.h,
os/linux/os_ops_tu104.c, os/linux/os_ops_tu104.h ]
pci:
sources: [ os/linux/pci.c,
os/linux/pci.h,
os/linux/pci_power.c,
os/linux/pci_power.h,
include/nvgpu/pci.h ]
platform:
sources: [ os/linux/platform_gk20a.h,
os/linux/platform_gk20a_tegra.c,
os/linux/platform_gk20a_tegra.h,
os/linux/platform_gp10b.h,
os/linux/platform_gp10b_tegra.c,
os/linux/platform_gv11b_tegra.c ]
rwsem:
sources: [ os/linux/rwsem.c ]
scale:
sources: [os/linux/scale.c, os/linux/scale.h ]
sched:
sources: [ os/linux/os_sched.c,
os/linux/sched.c,
os/linux/sched.h ]
sim:
sources: [ os/linux/sim.c, os/linux/sim_pci.c ]
soc:
sources: [ os/linux/soc.c ]
sysfs:
sources: [ os/linux/sysfs.c, os/linux/sysfs.h,
os/linux/ecc_sysfs.c ]
thread:
sources: [ os/linux/thread.c ]
timers:
sources: [ os/linux/timers.c ]
vgpu:
sources: [ os/linux/vgpu/fecs_trace_vgpu_linux.c,
os/linux/vgpu/gv11b/platform_gv11b_vgpu_tegra.c,
os/linux/vgpu/gv11b/platform_gv11b_vgpu_tegra.h,
os/linux/vgpu/platform_vgpu_tegra.c,
os/linux/vgpu/platform_vgpu_tegra.h,
os/linux/vgpu/sysfs_vgpu.c,
os/linux/vgpu/vgpu_ivc.c,
os/linux/vgpu/vgpu_ivm.c,
os/linux/vgpu/vgpu_linux.c,
os/linux/vgpu/vgpu_linux.h ]
vm:
sources: [ os/linux/vm.c ]
cic:
sources: [ os/linux/cic/cic_stub.c ]
# Group all the Linux headers for now.
headers:
sources: [ include/nvgpu/linux/atomic.h,
include/nvgpu/linux/barrier.h,
include/nvgpu/linux/cond.h,
include/nvgpu/linux/dma.h,
include/nvgpu/linux/kmem.h,
include/nvgpu/linux/lock.h,
include/nvgpu/linux/bitops.h,
include/nvgpu/linux/nvgpu_mem.h,
include/nvgpu/linux/os_fence_android.h,
include/nvgpu/linux/os_fence_dma.h,
include/nvgpu/linux/rwsem.h,
include/nvgpu/linux/sim.h,
include/nvgpu/linux/sim_pci.h,
include/nvgpu/linux/soc_fuse.h,
include/nvgpu/linux/thread.h,
include/nvgpu/linux/log.h,
include/nvgpu/linux/utils.h,
include/nvgpu/linux/vm.h ]
# An extra unit to lump all the unclassified Linux files.
extra:
sources: [ os/linux/os_linux.h ]

arch/nvgpu-posix.yaml Normal file, 171 lines

@@ -0,0 +1,171 @@
# Copyright (c) 2019-2021, NVIDIA CORPORATION. All Rights Reserved.
#
# POSIX elements and units in nvgpu.
#
# TODO: break this up into individual units. Will be critical for re-use in
# QNX.
all:
safe: no
owner: Alex W
sources: [ os/posix/error_notifier.c,
os/posix/firmware.c,
os/posix/fuse.c,
os/posix/gk20a.c,
os/posix/log.c,
os/posix/nvgpu.c,
os/posix/os_posix.h,
os/posix/posix-channel.c,
os/posix/posix-comptags.c,
os/posix/posix-dma.c,
os/posix/posix-fault-injection.c,
os/posix/posix-nvgpu_mem.c,
os/posix/posix-tsg.c,
os/posix/posix-vm.c,
os/posix/soc.c,
os/posix/bsearch.c,
os/posix/posix-clk_arb.c,
os/posix/posix-dt.c,
os/posix/posix-io.c,
os/posix/posix-nvhost.c,
os/posix/posix-nvlink.c,
os/posix/posix-vgpu.c,
os/posix/posix-vidmem.c,
os/posix/fecs_trace_posix.c,
os/posix/stubs.c,
os/posix/posix-vpr.c,
os/posix/mock-registers.c ]
headers:
safe: no
owner: Alex W
sources: [ include/nvgpu/posix/barrier.h,
include/nvgpu/posix/dma.h,
include/nvgpu/posix/io.h,
include/nvgpu/posix/mock-regs.h,
include/nvgpu/posix/log.h,
include/nvgpu/posix/nvgpu_mem.h,
include/nvgpu/posix/pci.h,
include/nvgpu/posix/posix-fault-injection.h,
include/nvgpu/posix/posix-channel.h,
include/nvgpu/posix/probe.h,
include/nvgpu/posix/soc_fuse.h,
include/nvgpu/posix/vm.h,
include/nvgpu/posix/posix_vidmem.h,
include/nvgpu/posix/posix-nvhost.h,
include/nvgpu/posix/trace_gk20a.h ]
queue:
safe: yes
owner: Rajesh D
sources: [ os/posix/queue.c,
include/nvgpu/posix/queue.h ]
sort:
safe: no
owner: Ajesh K
sources: [ include/nvgpu/posix/sort.h ]
deps:
bug:
safe: yes
owner: Ajesh K
sources: [ os/posix/bug.c,
include/nvgpu/posix/bug.h ]
deps:
lock:
safe: yes
owner: Ajesh K
sources: [ os/posix/lock.c,
include/nvgpu/posix/lock.h ]
rwsem:
safe: yes
owner: Ajesh K
sources: [ os/posix/rwsem.c,
include/nvgpu/posix/rwsem.h ]
deps:
size:
safe: yes
owner: Ajesh K
sources: [ include/nvgpu/posix/sizes.h ]
deps:
cond:
safe: yes
owner: Ajesh K
sources: [ os/posix/cond.c,
include/nvgpu/posix/cond.h ]
deps:
threads:
safe: yes
owner: Ajesh K
sources: [ os/posix/thread.c,
include/nvgpu/posix/thread.h ]
deps:
timers:
safe: yes
owner: Ajesh K
sources: [ os/posix/timers.c,
include/nvgpu/posix/timers.h ]
deps:
atomic:
safe: yes
owner: Ajesh K
sources: [ include/nvgpu/posix/atomic.h ]
deps:
os_sched:
safe: yes
owner: Ajesh K
sources: [ os/posix/os_sched.c ]
kmem:
safe: yes
owner: Ajesh K
sources: [ os/posix/kmem.c,
include/nvgpu/posix/kmem.h ]
deps:
types:
safe: yes
owner: Ajesh K
sources: [ include/nvgpu/posix/types.h ]
deps:
utils:
safe: yes
owner: Ajesh K
sources: [ include/nvgpu/posix/utils.h ]
deps:
bitops:
safe: yes
owner: Ajesh K
sources: [ os/posix/bitmap.c,
include/nvgpu/posix/bitops.h ]
deps:
file_ops:
safe: yes
owner: Prateek S
sources: [ os/posix/file_ops.c,
include/nvgpu/posix/file_ops.h ]
deps:
log2:
safe: yes
owner: Ajesh K
sources: [ include/nvgpu/posix/log2.h ]
deps:
circ_buf:
safe: yes
owner: Ajesh K
sources: [ include/nvgpu/posix/circ_buf.h ]
deps:

arch/nvgpu-vgpu.yaml Normal file, 78 lines

@@ -0,0 +1,78 @@
# Copyright (c) 2019-2021, NVIDIA CORPORATION. All Rights Reserved.
#
# vGPU architecture: currently there hasn't been much work done on
# decomposing the vGPU architecture so all of the vGPU files are simply
# grouped into one super unit.
#
# TODO: Fix this !?!? Seems rather important given that this is the
# target for safety!
#
all:
safe: no
owner: Aparna D
sources: [ common/vgpu/cbc/cbc_vgpu.c,
common/vgpu/cbc/cbc_vgpu.h,
common/vgpu/ce_vgpu.c,
common/vgpu/clk_vgpu.c,
common/vgpu/clk_vgpu.h,
common/vgpu/debugger_vgpu.c,
common/vgpu/debugger_vgpu.h,
common/vgpu/pm_reservation_vgpu.c,
common/vgpu/pm_reservation_vgpu.h,
common/vgpu/ecc_vgpu.c,
common/vgpu/ecc_vgpu.h,
common/vgpu/top/top_vgpu.c,
common/vgpu/top/top_vgpu.h,
common/vgpu/fifo/fifo_vgpu.c,
common/vgpu/fifo/fifo_vgpu.h,
common/vgpu/fifo/channel_vgpu.c,
common/vgpu/fifo/channel_vgpu.h,
common/vgpu/fifo/tsg_vgpu.c,
common/vgpu/fifo/tsg_vgpu.h,
common/vgpu/fifo/preempt_vgpu.c,
common/vgpu/fifo/preempt_vgpu.h,
common/vgpu/fifo/ramfc_vgpu.c,
common/vgpu/fifo/ramfc_vgpu.h,
common/vgpu/fifo/runlist_vgpu.c,
common/vgpu/fifo/runlist_vgpu.h,
common/vgpu/fifo/userd_vgpu.c,
common/vgpu/fifo/userd_vgpu.h,
common/vgpu/gr/ctx_vgpu.c,
common/vgpu/gr/ctx_vgpu.h,
common/vgpu/gr/fecs_trace_vgpu.c,
common/vgpu/gr/fecs_trace_vgpu.h,
common/vgpu/gr/gr_vgpu.c,
common/vgpu/gr/gr_vgpu.h,
common/vgpu/gr/subctx_vgpu.c,
common/vgpu/gr/subctx_vgpu.h,
common/vgpu/ltc/ltc_vgpu.c,
common/vgpu/ltc/ltc_vgpu.h,
common/vgpu/mm/mm_vgpu.c,
common/vgpu/mm/mm_vgpu.h,
common/vgpu/mm/vm_vgpu.c,
common/vgpu/perf/cyclestats_snapshot_vgpu.c,
common/vgpu/perf/cyclestats_snapshot_vgpu.h,
common/vgpu/perf/perf_vgpu.c,
common/vgpu/perf/perf_vgpu.h,
common/vgpu/fbp/fbp_vgpu.c,
common/vgpu/fbp/fbp_vgpu.h,
common/vgpu/fb/fb_vgpu.c,
common/vgpu/fb/fb_vgpu.h,
common/vgpu/intr/intr_vgpu.c,
common/vgpu/intr/intr_vgpu.h,
common/vgpu/ivc/comm_vgpu.c,
common/vgpu/ivc/comm_vgpu.h,
common/vgpu/ptimer/ptimer_vgpu.c,
common/vgpu/ptimer/ptimer_vgpu.h,
common/vgpu/init/init_vgpu.c,
common/vgpu/init/init_vgpu.h,
common/vgpu/profiler/profiler_vgpu.c,
common/vgpu/profiler/profiler_vgpu.h,
include/nvgpu/vgpu/tegra_vgpu.h,
include/nvgpu/vgpu/vgpu.h,
include/nvgpu/vgpu/vgpu_ivc.h,
include/nvgpu/vgpu/vgpu_ivm.h,
include/nvgpu/vgpu/ce_vgpu.h,
include/nvgpu/vgpu/vm_vgpu.h,
include/nvgpu/vgpu/os_init_hal_vgpu.h ]

arch/nvgpu.yaml Normal file, 69 lines

@@ -0,0 +1,69 @@
# Copyright (c) 2019-2020, NVIDIA CORPORATION. All Rights Reserved.
#
# Top level NVGPU architecture description in YAML.
#
# The format of this document is structured by element and unit, though only
# units may have source files associated with them. All units must exist in an
# element.
#
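# A minimal sketch of that element/unit shape (the names here are
# hypothetical, not real units):
#
#   some_element:
#     safe: no
#     children:
#       some_unit:
#         safe: yes
#         owner: Jane D
#         sources: [ common/some_unit/some_unit.c ]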
nvgpu:
safe: no
children:
# The common code element. This has gr, mm, etc.
common:
safe: no
children:
!include nvgpu-common.yaml nvgpu-next-common.yaml
# HAL units - Hardware Abstraction Layer.
hal:
safe: no
children:
!include nvgpu-hal-new.yaml nvgpu-next-hal.yaml
# The QNX OS layer implementation units.
qnx:
safe: yes
children:
!include nvgpu-qnx.yaml
# And the Linux version of the OS implementation units.
linux:
safe: no
children:
!include nvgpu-linux.yaml nvgpu-next-linux.yaml
# POSIX units for implementing the OS layer for unit testing.
posix:
children:
!include nvgpu-posix.yaml
# Interface units - these provide interfaces for NVGPU to the underlying
# OS or CPU.
interface:
safe: yes
owner: Alex W
children:
!include nvgpu-interface.yaml
# Virtualization code.
vgpu:
safe: yes
children:
!include nvgpu-vgpu.yaml
# Virtualization HAL code.
hal-vgpu:
safe: yes
children:
!include nvgpu-hal-vgpu.yaml nvgpu-next-hal-vgpu.yaml
# A meta-element for the GPU HW. A good example of this is the HW headers.
# This is not code we write in nvgpu, but we import it from the GPU HW
# tree (with a little transformation - the gen reg script).
gpu_hw:
safe: no
children:
!include nvgpu-gpu_hw.yaml nvgpu-next-gpu_hw.yaml

drivers/gpu/Makefile Normal file, 2 lines

@@ -0,0 +1,2 @@
# Choose this option if you have an SoC with integrated Nvidia GPU IP.
obj-m += nvgpu/


@@ -0,0 +1,112 @@
config GK20A
tristate "Nvidia GK20A GPU support"
default y
help
Choose this option if you have an SoC with integrated
Nvidia GPU IP.
config GK20A_DEFAULT_TIMEOUT
depends on GK20A
int "Default timeout for submits"
default 3000
help
Default timeout for jobs in milliseconds. Set to zero for no timeout.
config GK20A_PMU
bool "Support GK20A PMU"
depends on GK20A
default n
help
Say Y here to enable GK20A PMU features.
choice
depends on GK20A
prompt "Enable GK20A frequency scaling"
default GK20A_PERFMON
optional
help
Select this entry to enable gk20a scaling
config GK20A_PERFMON
bool "Use Perfmon"
help
Select this to enable built-in perfmon scaling.
The built-in scaling option uses a simplistic
scaling mechanism (increase frequency if busy,
decrease frequency if idle).
config GK20A_DEVFREQ
depends on TEGRA_CLK_FRAMEWORK || COMMON_CLK
bool "Use Devfreq"
help
Select this to use devfreq based scaling.
Devfreq is a common framework that allows using
a variety of different governors and changing
between governors on the fly. By default, no
governor is selected.
endchoice
config GK20A_CYCLE_STATS
bool "Support GK20A GPU CYCLE STATS"
depends on GK20A
default y
help
Say Y here to enable the cycle stats debugging features.
config GK20A_CTXSW_TRACE
bool "Support GK20A Context Switch tracing"
depends on GK20A
default n
help
Enable support for the GK20A Context Switch Tracing. In this mode,
FECS collects timestamps for contexts loaded on GR engine. This
allows tracking context switches on GR engine, as well as
identifying processes that submitted work.
config TEGRA_GK20A
bool "Enable the GK20A GPU on Tegra"
depends on TEGRA_GRHOST || TEGRA_HOST1X
depends on GK20A
default y
help
Enable support for the GK20A graphics engine on Tegra
by adding a Tegra platform interface to the GK20A driver.
The Tegra platform interface requires TEGRA_GRHOST (host1x).
config TEGRA_ACR
bool "Enable HS bin support on GM20B GPU on Tegra"
depends on GK20A_PMU
default n
help
Enable support for loading the High Secure binary, using
Write Protected Regions (WPR) for storing ucodes, and bootstrapping
PMU, FECS and GPCCS in Low Secure mode.
config TEGRA_USE_NA_GPCPLL
bool "Enable noise aware mode of GM20B GPCPLL on Tegra"
depends on TEGRA_CLK_FRAMEWORK
default n
help
Enable noise aware (NA) mode of GM20b GPCPLL. In this mode PLL output
frequency is automatically adjusted when GM20b voltage is fluctuating
because of transient PMIC or power distribution tree noise.
config GK20A_PCI
bool "Support PCIe NVIDIA GPUs on nvgpu"
depends on PCI && GK20A
default y if ARM64
default n
help
Enable support for GPUs on PCIe bus.
config GK20A_VIDMEM
bool "Support separate video memory on nvgpu"
depends on GK20A
default n
help
Enable support for using and allocating buffers in a distinct video
memory aperture (in contrast to general system memory), available on
GPUs that have their own banks. PCIe GPUs have this, for example.
trysource "../nvgpu-t19x/drivers/gpu/nvgpu/Kconfig"

788
drivers/gpu/nvgpu/Makefile Normal file
View File

@@ -0,0 +1,788 @@
GCOV_PROFILE := y
# When building NVGPU as an external module, srctree.nvgpu is not
# defined. Given that NVGPU knows where its header files are located
# relative to this Makefile, we can use its path information to
# set srctree.nvgpu if it is not already defined. Please note that
# 'lastword $(MAKEFILE_LIST)' refers to this Makefile.
srctree.nvgpu ?= $(abspath $(shell dirname $(lastword $(MAKEFILE_LIST)))/../../..)
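# For illustration only (the repository path below is an assumption): if this
# Makefile lives at /src/nvgpu/drivers/gpu/nvgpu/Makefile, then
#   $(lastword $(MAKEFILE_LIST))  ->  /src/nvgpu/drivers/gpu/nvgpu/Makefile
#   $(shell dirname ...)          ->  /src/nvgpu/drivers/gpu/nvgpu
#   $(abspath .../../../..)       ->  /src/nvgpu
# so srctree.nvgpu ends up pointing at the top of the nvgpu source tree.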
ccflags-y += -I$(srctree.nvgpu)/drivers/gpu/nvgpu/include
ccflags-y += -I$(srctree.nvgpu)/drivers/gpu/nvgpu
ccflags-y += -I$(srctree.nvgpu)/include
ccflags-y += -I$(srctree.nvgpu)/include/uapi
ccflags-y += -I$(srctree)/drivers/devfreq
ccflags-y += -Wframe-larger-than=2048
ccflags-y += -Wno-multichar
ccflags-y += -Werror
ccflags-y += -Wno-error=cpp
ifeq ($(VERSION),4)
ccflags-y += -Wextra -Wno-unused-parameter -Wno-missing-field-initializers
endif
# Turn off when this is fixed upstream, if ever.
ccflags-y += -D__NVGPU_PREVENT_UNTRUSTED_SPECULATION
ifneq ($(srctree.nvgpu),)
include $(srctree.nvgpu)/drivers/gpu/nvgpu/Makefile.linux.configs
else
include Makefile.linux.configs
endif
# When using the upstream host1x driver, the Makefile must define the
# srctree.host1x path in order to find the necessary header files for
# the upstream host1x driver.
ifeq ($(CONFIG_TEGRA_GK20A_NVHOST_HOST1X),y)
ccflags-y += -I$(srctree.host1x)/include
endif
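# Illustration only (the path and invocation are assumptions): srctree.host1x
# is not set anywhere in this Makefile, so one way to provide it is on the
# make command line, e.g.
#   make ... CONFIG_TEGRA_GK20A_NVHOST_HOST1X=y srctree.host1x=/path/to/host1x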
ifeq ($(CONFIG_NVGPU_DEBUGGER),y)
ccflags-y += -DCONFIG_NVGPU_DEBUGGER
ccflags-y += -DCONFIG_NVGPU_ENGINE_RESET
endif
ccflags-y += -DCONFIG_NVGPU_DETERMINISTIC_CHANNELS
ccflags-y += -DCONFIG_NVGPU_TPC_POWERGATE
ccflags-y += -DCONFIG_NVGPU_ACR_LEGACY
ccflags-y += -DCONFIG_NVGPU_ENGINE_QUEUE
ccflags-y += -DCONFIG_NVGPU_FIFO_ENGINE_ACTIVITY
ccflags-y += -DCONFIG_NVGPU_USERD
ccflags-y += -DCONFIG_NVGPU_CHANNEL_WDT
ccflags-y += -DCONFIG_NVGPU_LS_PMU
ccflags-y += -DCONFIG_NVGPU_CILP
ccflags-y += -DCONFIG_NVGPU_GFXP
ccflags-y += -DCONFIG_NVGPU_GRAPHICS
ccflags-y += -DCONFIG_NVGPU_REPLAYABLE_FAULT
ccflags-y += -DCONFIG_NVGPU_CHANNEL_TSG_SCHEDULING
ccflags-y += -DCONFIG_NVGPU_CHANNEL_TSG_CONTROL
ccflags-y += -DCONFIG_NVGPU_POWER_PG
ccflags-y += -DCONFIG_NVGPU_KERNEL_MODE_SUBMIT
ccflags-y += -DCONFIG_NVGPU_SIM
ccflags-y += -DCONFIG_NVGPU_TRACE
ccflags-y += -DCONFIG_NVGPU_SYSFS
ccflags-y += -DCONFIG_NVGPU_CLK_ARB
ccflags-y += -DCONFIG_NVGPU_FALCON_DEBUG
ccflags-y += -DCONFIG_NVGPU_FALCON_NON_FUSA
ccflags-y += -DCONFIG_NVGPU_IOCTL_NON_FUSA
ccflags-y += -DCONFIG_NVGPU_NON_FUSA
ccflags-y += -DCONFIG_NVGPU_INJECT_HWERR
ccflags-y += -DCONFIG_NVGPU_GR_FALCON_NON_SECURE_BOOT
ccflags-y += -DCONFIG_NVGPU_SET_FALCON_ACCESS_MAP
ccflags-y += -DCONFIG_NVGPU_SW_SEMAPHORE
ccflags-y += -DCONFIG_NVGPU_FENCE
ccflags-y += -DCONFIG_NVGPU_PROFILER
ifeq ($(CONFIG_NVGPU_LOGGING),y)
ccflags-y += -DCONFIG_NVGPU_LOGGING=1
endif
ifeq ($(CONFIG_NVGPU_HAL_NON_FUSA),y)
ccflags-y += -DCONFIG_NVGPU_HAL_NON_FUSA
endif
ifeq ($(CONFIG_NVGPU_RECOVERY),y)
ccflags-y += -DCONFIG_NVGPU_RECOVERY
ccflags-y += -DCONFIG_NVGPU_ENGINE_RESET
nvgpu-y += \
hal/rc/rc_gk20a.o \
hal/rc/rc_gv11b.o
endif
obj-$(CONFIG_GK20A) := nvgpu.o
# OS independent parts of nvgpu. The work to collect files here
# is in progress.
ifeq ($(CONFIG_NVGPU_DGPU),y)
nvgpu-$(CONFIG_NVGPU_DGPU) += \
os/linux/pci.o \
os/linux/pci_power.o \
os/linux/dmabuf_vidmem.o \
os/linux/os_ops_gv100.o \
os/linux/os_ops_tu104.o \
common/sec2/sec2.o \
common/sec2/sec2_allocator.o \
common/sec2/sec2_lsfm.o \
common/sec2/ipc/sec2_cmd.o \
common/sec2/ipc/sec2_msg.o \
common/sec2/ipc/sec2_queue.o \
common/sec2/ipc/sec2_seq.o \
common/vbios/bios_sw_gv100.o \
common/vbios/bios_sw_tu104.o \
common/falcon/falcon_sw_tu104.o \
common/acr/acr_sw_tu104.o \
common/mm/allocators/page_allocator.o \
common/mm/vidmem.o \
common/pramin.o \
common/ce/ce_app.o \
common/clk_arb/clk_arb_gv100.o \
common/engine_queues/engine_emem_queue.o \
hal/mm/mm_gv100.o \
hal/mm/mm_tu104.o \
hal/mc/mc_gv100.o \
hal/mc/mc_tu104.o \
hal/bus/bus_gv100.o \
hal/bus/bus_tu104.o \
hal/class/class_tu104.o \
hal/clk/clk_tu104.o \
hal/clk/clk_mon_tu104.o \
hal/gr/init/gr_init_gv100.o \
hal/gr/init/gr_init_tu104.o \
hal/gr/intr/gr_intr_tu104.o \
hal/gr/falcon/gr_falcon_tu104.o \
hal/fbpa/fbpa_tu104.o \
hal/init/hal_tu104.o \
hal/init/hal_tu104_litter.o \
hal/power_features/cg/tu104_gating_reglist.o \
hal/ltc/ltc_tu104.o \
hal/fb/fb_gv100.o \
hal/fb/fb_tu104.o \
hal/fb/fb_mmu_fault_tu104.o \
hal/fb/intr/fb_intr_gv100.o \
hal/fb/intr/fb_intr_tu104.o \
hal/func/func_tu104.o \
hal/fifo/fifo_tu104.o \
hal/fifo/usermode_tu104.o \
hal/fifo/pbdma_tu104.o \
hal/fifo/ramfc_tu104.o \
hal/fifo/ramin_tu104.o \
hal/fifo/channel_gv100.o \
hal/fifo/runlist_ram_tu104.o \
hal/fifo/runlist_fifo_gv100.o \
hal/fifo/runlist_fifo_tu104.o \
hal/fifo/fifo_intr_gv100.o \
hal/fuse/fuse_gp106.o \
hal/fuse/fuse_tu104.o \
hal/netlist/netlist_gv100.o \
hal/netlist/netlist_tu104.o \
hal/nvdec/nvdec_gp106.o \
hal/nvdec/nvdec_tu104.o \
hal/gsp/gsp_tu104.o \
hal/sec2/sec2_tu104.o \
hal/pramin/pramin_gp10b.o \
hal/pramin/pramin_gv100.o \
hal/pramin/pramin_init.o \
hal/pramin/pramin_tu104.o \
hal/bios/bios_tu104.o \
hal/top/top_gv100.o \
hal/xve/xve_gp106.o \
hal/xve/xve_tu104.o
nvgpu-$(CONFIG_DEBUG_FS) += \
os/linux/debug_therm_tu104.o \
os/linux/debug_bios.o \
os/linux/debug_xve.o \
os/linux/debug_clk_tu104.o
endif
# nvlink sources are not conditionally compiled. nvlink probe and
# public functions return -ENODEV when not supported.
nvgpu-y += \
common/vbios/nvlink_bios.o \
common/nvlink/probe.o \
common/nvlink/init/device_reginit.o \
common/nvlink/init/device_reginit_gv100.o \
common/nvlink/minion.o \
common/nvlink/link_mode_transitions.o \
common/nvlink/nvlink.o \
os/linux/nvlink_probe.o \
os/linux/nvlink.o \
hal/nvlink/minion_gv100.o \
hal/nvlink/minion_tu104.o \
hal/nvlink/nvlink_gv100.o \
hal/nvlink/nvlink_tu104.o \
hal/nvlink/intr_and_err_handling_tu104.o \
hal/nvlink/link_mode_transitions_gv100.o \
hal/nvlink/link_mode_transitions_tu104.o
nvgpu-y += \
common/device.o \
common/utils/enabled.o \
common/utils/errata.o \
common/utils/rbtree.o \
common/utils/string.o \
common/utils/worker.o \
common/swdebug/profile.o \
common/ptimer/ptimer.o \
common/perf/perfbuf.o \
common/therm/therm.o \
common/mc/mc.o \
common/sync/channel_sync.o \
common/sync/channel_sync_semaphore.o \
common/semaphore/semaphore_sea.o \
common/semaphore/semaphore_pool.o \
common/semaphore/semaphore_hw.o \
common/semaphore/semaphore.o \
common/regops/regops.o \
common/ltc/ltc.o \
common/fb/fb.o \
common/fbp/fbp.o \
common/gr/gr_utils.o \
common/gr/gr.o \
common/gr/gr_intr.o \
common/gr/global_ctx.o \
common/gr/ctx.o \
common/gr/gr_falcon.o \
common/gr/subctx.o \
common/gr/zcull.o \
common/gr/gr_config.o \
common/gr/zbc.o \
common/gr/gr_setup.o \
common/gr/hwpm_map.o \
common/gr/obj_ctx.o \
common/gr/fs_state.o \
common/gr/gr_ecc.o \
common/netlist/netlist.o \
common/init/nvgpu_init.o \
common/pmu/pmu.o \
common/pmu/allocator.o \
common/pmu/pmu_mutex.o \
common/pmu/fw/fw.o \
common/pmu/fw/fw_ver_ops.o \
common/pmu/fw/fw_ns_bootstrap.o \
common/pmu/pg/pmu_pg.o \
common/pmu/pg/pmu_aelpg.o \
common/pmu/perfmon/pmu_perfmon.o \
common/pmu/perfmon/pmu_perfmon_sw_gm20b.o \
common/pmu/perfmon/pmu_perfmon_sw_gv11b.o \
common/pmu/pmu_debug.o \
common/pmu/pg/pg_sw_gm20b.o \
common/pmu/pg/pg_sw_gp10b.o \
common/pmu/pg/pg_sw_gp106.o \
common/pmu/pg/pg_sw_gv11b.o \
common/pmu/ipc/pmu_cmd.o \
common/pmu/ipc/pmu_msg.o \
common/pmu/ipc/pmu_queue.o \
common/pmu/ipc/pmu_seq.o \
common/acr/acr.o \
common/acr/acr_wpr.o \
common/acr/acr_blob_alloc.o \
common/acr/acr_blob_construct_v0.o \
common/acr/acr_blob_construct.o \
common/acr/acr_bootstrap.o \
common/acr/acr_sw_gm20b.o \
common/acr/acr_sw_gp10b.o \
common/acr/acr_sw_gv11b.o \
common/sbr/sbr.o \
common/pmu/super_surface/super_surface.o \
common/pmu/lsfm/lsfm.o \
common/pmu/lsfm/lsfm_sw_gm20b.o \
common/pmu/lsfm/lsfm_sw_gp10b.o \
common/pmu/lsfm/lsfm_sw_gv100.o \
common/pmu/lsfm/lsfm_sw_tu104.o \
common/pmu/perf/vfe_var.o \
common/pmu/perf/vfe_equ.o \
common/pmu/perf/perf.o \
common/pmu/perf/change_seq.o \
common/pmu/perf/pstate.o \
common/pmu/pmgr/pwrdev.o \
common/pmu/pmgr/pmgr.o \
common/pmu/pmgr/pmgrpmu.o \
common/pmu/pmgr/pwrmonitor.o \
common/pmu/pmgr/pwrpolicy.o \
common/pmu/volt/volt.o \
common/pmu/volt/volt_rail.o \
common/pmu/volt/volt_dev.o \
common/pmu/volt/volt_policy.o \
common/pmu/therm/thrm.o \
common/pmu/therm/therm_dev.o \
common/pmu/therm/therm_channel.o \
common/pmu/lpwr/rppg.o \
common/pmu/pmu_pstate.o \
common/pmu/pmu_rtos_init.o \
common/pmu/clk/clk_vin.o \
common/pmu/clk/clk_fll.o \
common/pmu/clk/clk_domain.o \
common/pmu/clk/clk_prog.o \
common/pmu/clk/clk_vf_point.o \
common/pmu/clk/clk.o \
common/pmu/boardobj/boardobj.o \
common/pmu/boardobj/boardobjgrp.o \
common/pmu/boardobj/boardobjgrpmask.o \
common/pmu/boardobj/boardobjgrp_e255.o \
common/pmu/boardobj/boardobjgrp_e32.o \
common/clk_arb/clk_arb.o \
common/clk_arb/clk_arb_gp10b.o \
common/rc/rc.o \
common/grmgr/grmgr.o \
common/cic/cic.o \
common/cic/cic_intr.o \
common/cic/ce_cic.o \
common/cic/ctxsw_cic.o \
common/cic/ecc_cic.o \
common/cic/host_cic.o \
common/cic/gr_cic.o \
common/cic/pri_cic.o \
common/cic/pmu_cic.o \
common/cic/mmu_cic.o \
common/cic/msg_cic.o \
hal/bus/bus_gk20a.o \
hal/class/class_gm20b.o \
hal/class/class_gp10b.o \
hal/clk/clk_gm20b.o \
hal/gr/ecc/ecc_gp10b.o \
hal/gr/ecc/ecc_gv11b.o \
hal/gr/zcull/zcull_gm20b.o \
hal/gr/zcull/zcull_gv11b.o \
hal/gr/ctxsw_prog/ctxsw_prog_gp10b.o \
hal/gr/ctxsw_prog/ctxsw_prog_gv11b.o \
hal/gr/init/gr_init_gm20b.o \
hal/gr/init/gr_init_gp10b.o \
hal/gr/init/gr_init_gv11b.o \
hal/gr/intr/gr_intr_gm20b.o \
hal/gr/intr/gr_intr_gp10b.o \
hal/gr/hwpm_map/hwpm_map_gv100.o \
hal/gr/zbc/zbc_gm20b.o \
hal/gr/zbc/zbc_gp10b.o \
hal/gr/zbc/zbc_gv11b.o \
hal/gr/gr/gr_gk20a.o \
hal/gr/gr/gr_gm20b.o \
hal/gr/gr/gr_gp10b.o \
hal/gr/gr/gr_gv100.o \
hal/gr/gr/gr_gv11b.o \
hal/gr/gr/gr_tu104.o \
hal/init/hal_gv11b.o \
hal/init/hal_gv11b_litter.o \
hal/init/hal_init.o \
hal/perf/perf_gv11b.o \
hal/perf/perf_tu104.o \
hal/power_features/cg/gp10b_gating_reglist.o \
hal/power_features/cg/gv11b_gating_reglist.o \
hal/regops/regops_gv11b.o \
hal/regops/allowlist_gv11b.o \
hal/ce/ce2_gk20a.o \
hal/therm/therm_gp10b.o \
hal/therm/therm_tu104.o \
hal/gr/falcon/gr_falcon_gm20b.o \
hal/ltc/ltc_gp10b.o \
hal/ltc/intr/ltc_intr_gm20b.o \
hal/ltc/intr/ltc_intr_gp10b.o \
hal/fb/fb_gm20b.o \
hal/fb/fb_gp10b.o \
hal/fb/fb_gp106.o \
hal/fb/fb_gv11b.o \
hal/fb/intr/fb_intr_ecc_gv11b.o \
hal/fuse/fuse_gm20b.o \
hal/fifo/fifo_gk20a.o \
hal/fifo/preempt_gk20a.o \
hal/fifo/ramfc_gk20a.o \
hal/fifo/ramfc_gp10b.o \
hal/fifo/ramin_gk20a.o \
hal/fifo/ramin_gp10b.o \
hal/fifo/runlist_fifo_gv11b.o \
hal/fifo/channel_gk20a.o \
hal/fifo/channel_gm20b.o \
hal/fifo/tsg_gk20a.o \
hal/fifo/userd_gk20a.o \
hal/fifo/userd_gv11b.o \
hal/fifo/fifo_intr_gk20a.o \
hal/fifo/ctxsw_timeout_gk20a.o \
hal/netlist/netlist_gp10b.o \
hal/sync/sema_cmdbuf_gk20a.o \
hal/sync/sema_cmdbuf_gv11b.o \
hal/pmu/pmu_gk20a.o \
hal/pmu/pmu_gm20b.o \
hal/pmu/pmu_gp10b.o \
hal/pmu/pmu_gv11b.o \
hal/pmu/pmu_tu104.o \
hal/top/top_gp106.o \
hal/top/top_gp10b.o \
hal/tpc/tpc_gv11b.o \
hal/priv_ring/priv_ring_gv11b.o \
hal/cic/cic_gv11b_fusa.o \
hal/cic/cic_lut_gv11b_fusa.o
# Linux specific parts of nvgpu.
nvgpu-y += \
os/linux/os_ops.o \
os/linux/os_ops_gm20b.o \
os/linux/os_ops_gp10b.o \
os/linux/os_ops_gv11b.o \
os/linux/kmem.o \
os/linux/timers.o \
os/linux/ioctl.o \
os/linux/ioctl_ctrl.o \
os/linux/ioctl_as.o \
os/linux/ioctl_channel.o \
os/linux/ioctl_tsg.o \
os/linux/ioctl_dbg.o \
os/linux/ioctl_prof.o \
os/linux/ioctl_clk_arb.o \
os/linux/cond.o \
os/linux/nvgpu_mem.o \
os/linux/linux-dma.o \
os/linux/driver_common.o \
os/linux/firmware.o \
os/linux/thread.o \
os/linux/vm.o \
os/linux/intr.o \
os/linux/sysfs.o \
os/linux/linux-io.o \
os/linux/io_usermode.o \
os/linux/rwsem.o \
os/linux/sched.o \
os/linux/linux-channel.o \
os/linux/sim.o \
os/linux/sim_pci.o \
os/linux/os_sched.o \
os/linux/dt.o \
os/linux/ecc_sysfs.o \
os/linux/bsearch.o \
os/linux/cic/cic_stub.o \
os/linux/dmabuf_priv.o \
os/linux/power_ops.o
nvgpu-$(CONFIG_NVGPU_VPR) += os/linux/vpr.o
nvgpu-$(CONFIG_DEBUG_FS) += \
os/linux/debug.o \
os/linux/debug_gr.o \
os/linux/debug_fifo.o \
os/linux/debug_ce.o \
os/linux/debug_pmu.o \
os/linux/debug_pmgr.o \
os/linux/debug_sched.o \
os/linux/debug_allocator.o \
os/linux/debug_hal.o \
os/linux/debug_clk_gm20b.o \
os/linux/debug_ltc.o \
os/linux/debug_volt.o \
os/linux/debug_s_param.o \
os/linux/swprofile_debugfs.o
nvgpu-$(CONFIG_NVGPU_LOGGING) += os/linux/log.o
ifeq ($(CONFIG_NVGPU_TRACK_MEM_USAGE),y)
nvgpu-$(CONFIG_DEBUG_FS) += \
os/linux/debug_kmem.o
endif
nvgpu-$(CONFIG_NVGPU_FECS_TRACE) += \
common/gr/fecs_trace.o \
hal/gr/fecs_trace/fecs_trace_gm20b.o \
hal/gr/fecs_trace/fecs_trace_gv11b.o \
os/linux/fecs_trace_linux.o
ifeq ($(CONFIG_NVGPU_FECS_TRACE),y)
nvgpu-$(CONFIG_DEBUG_FS) += \
os/linux/debug_fecs_trace.o
endif
nvgpu-$(CONFIG_TEGRA_GK20A) += \
os/linux/fuse.o \
os/linux/module.o \
os/linux/module_usermode.o \
os/linux/platform_gk20a_tegra.o \
os/linux/platform_gp10b_tegra.o \
os/linux/platform_gv11b_tegra.o
ifeq ($(CONFIG_TEGRA_GK20A),y)
nvgpu-$(CONFIG_NVGPU_TEGRA_FUSE) += os/linux/soc.o
endif
nvgpu-$(CONFIG_NVGPU_SYNCFD_ANDROID) += \
os/linux/sync_sema_android.o \
os/linux/os_fence_android.o \
os/linux/os_fence_android_sema.o
nvgpu-$(CONFIG_NVGPU_SYNCFD_STABLE) += \
os/linux/sync_sema_dma.o \
os/linux/os_fence_dma.o \
os/linux/os_fence_dma_sema.o
nvgpu-$(CONFIG_TEGRA_GK20A_NVHOST) += \
common/sync/channel_sync_syncpt.o \
common/fence/fence_syncpt.o
ifneq ($(CONFIG_NVGPU_SYNCFD_NONE),y)
nvgpu-$(CONFIG_TEGRA_GK20A_NVHOST) += \
os/linux/os_fence_syncpt.o
endif
ifeq ($(CONFIG_TEGRA_GK20A_NVHOST_HOST1X),y)
nvgpu-$(CONFIG_TEGRA_GK20A_NVHOST) += \
os/linux/nvhost_host1x.o
else
nvgpu-$(CONFIG_TEGRA_GK20A_NVHOST) += \
os/linux/nvhost.o
endif
nvgpu-$(CONFIG_TEGRA_GK20A_NVHOST) += \
os/linux/nvhost_common.o \
hal/sync/syncpt_cmdbuf_gk20a.o \
hal/sync/syncpt_cmdbuf_gv11b.o \
hal/sync/syncpt_cmdbuf_gv11b_fusa.o \
common/sync/channel_user_syncpt.o
nvgpu-$(CONFIG_NVGPU_GR_VIRTUALIZATION) += \
os/linux/vgpu/platform_vgpu_tegra.o \
os/linux/vgpu/sysfs_vgpu.o \
os/linux/vgpu/vgpu_ivc.o \
os/linux/vgpu/vgpu_ivm.o \
os/linux/vgpu/vgpu_linux.o \
os/linux/vgpu/gv11b/platform_gv11b_vgpu_tegra.o
ifeq ($(CONFIG_NVGPU_FECS_TRACE),y)
nvgpu-$(CONFIG_NVGPU_GR_VIRTUALIZATION) += \
os/linux/vgpu/fecs_trace_vgpu_linux.o
endif
nvgpu-$(CONFIG_COMMON_CLK) += \
os/linux/clk.o
nvgpu-$(CONFIG_GK20A_DEVFREQ) += \
os/linux/scale.o
nvgpu-$(CONFIG_NVGPU_SUPPORT_CDE) += \
os/linux/cde.o \
os/linux/cde_gm20b.o \
os/linux/cde_gp10b.o
ifeq ($(CONFIG_DEBUG_FS),y)
nvgpu-$(CONFIG_NVGPU_SUPPORT_CDE) += \
os/linux/debug_cde.o
endif
nvgpu-y += \
common/mm/allocators/nvgpu_allocator.o \
common/mm/allocators/bitmap_allocator.o \
common/mm/allocators/buddy_allocator.o \
common/mm/gmmu/page_table.o \
common/mm/gmmu/pd_cache.o \
common/mm/gmmu/pte.o \
common/mm/as.o \
common/mm/vm.o \
common/mm/vm_area.o \
common/mm/nvgpu_mem.o \
common/mm/nvgpu_sgt.o \
common/mm/mm.o \
common/mm/dma.o \
common/vbios/bios.o \
common/falcon/falcon.o \
common/falcon/falcon_sw_gk20a.o \
common/engine_queues/engine_mem_queue.o \
common/engine_queues/engine_dmem_queue.o \
common/engine_queues/engine_fb_queue.o \
common/io/io.o \
common/power_features/power_features.o \
common/power_features/cg/cg.o \
common/power_features/pg/pg.o \
common/sim/sim.o \
common/sim/sim_pci.o \
common/sim/sim_netlist.o \
common/fifo/fifo.o \
common/fifo/preempt.o \
common/fifo/channel.o \
common/fifo/channel_wdt.o \
common/fifo/channel_worker.o \
common/fifo/pbdma.o \
common/fifo/submit.o \
common/fifo/job.o \
common/fifo/priv_cmdbuf.o \
common/fifo/tsg.o \
common/fifo/runlist.o \
common/fifo/engine_status.o \
common/fifo/engines.o \
common/fifo/pbdma_status.o \
common/fifo/userd.o \
common/fifo/watchdog.o \
common/fence/fence.o \
common/fence/fence_sema.o \
common/ecc.o \
common/log_common.o \
common/ce/ce.o \
common/debugger.o \
common/profiler/profiler.o \
common/profiler/pm_reservation.o
nvgpu-$(CONFIG_NVGPU_GR_VIRTUALIZATION) += \
common/vgpu/ltc/ltc_vgpu.o \
common/vgpu/fbp/fbp_vgpu.o \
common/vgpu/fb/fb_vgpu.o \
common/vgpu/gr/gr_vgpu.o \
common/vgpu/gr/ctx_vgpu.o \
common/vgpu/gr/subctx_vgpu.o \
common/vgpu/top/top_vgpu.o \
common/vgpu/fifo/fifo_vgpu.o \
common/vgpu/fifo/channel_vgpu.o \
common/vgpu/fifo/tsg_vgpu.o \
common/vgpu/fifo/preempt_vgpu.o \
common/vgpu/fifo/runlist_vgpu.o \
common/vgpu/fifo/ramfc_vgpu.o \
common/vgpu/fifo/userd_vgpu.o \
common/vgpu/ce_vgpu.o \
common/vgpu/mm/mm_vgpu.o \
common/vgpu/mm/vm_vgpu.o \
common/vgpu/init/init_vgpu.o \
common/vgpu/ivc/comm_vgpu.o \
common/vgpu/intr/intr_vgpu.o \
common/vgpu/ptimer/ptimer_vgpu.o \
common/vgpu/debugger_vgpu.o \
common/vgpu/pm_reservation_vgpu.o \
common/vgpu/perf/perf_vgpu.o \
common/vgpu/profiler/profiler_vgpu.o \
common/vgpu/ecc_vgpu.o \
common/vgpu/clk_vgpu.o \
common/vgpu/gr/fecs_trace_vgpu.o \
hal/vgpu/init/init_hal_vgpu.o \
hal/vgpu/fifo/fifo_gv11b_vgpu.o \
hal/vgpu/sync/syncpt_cmdbuf_gv11b_vgpu.o
nvgpu-$(CONFIG_NVGPU_CYCLESTATS) += \
common/perf/cyclestats_snapshot.o \
common/cyclestats/cyclestats.o
ifeq ($(CONFIG_NVGPU_GR_VIRTUALIZATION),y)
nvgpu-$(CONFIG_NVGPU_CYCLESTATS) += \
common/vgpu/perf/cyclestats_snapshot_vgpu.o
nvgpu-$(CONFIG_NVGPU_COMPRESSION) += \
common/vgpu/cbc/cbc_vgpu.o
endif
nvgpu-$(CONFIG_NVGPU_COMPRESSION) += \
os/linux/comptags.o \
common/mm/comptags.o \
common/cbc/cbc.o \
hal/cbc/cbc_gm20b.o \
hal/cbc/cbc_gp10b.o \
hal/cbc/cbc_gv11b.o \
hal/cbc/cbc_tu104.o \
# FUSA (Functionally Safe) HAL source files
nvgpu-y += \
hal/mm/mm_gv11b_fusa.o \
hal/mm/mm_gp10b_fusa.o \
hal/mm/gmmu/gmmu_gv11b_fusa.o \
hal/mm/gmmu/gmmu_gp10b_fusa.o \
hal/mm/gmmu/gmmu_gk20a_fusa.o \
hal/mm/gmmu/gmmu_gm20b_fusa.o \
hal/mm/cache/flush_gk20a_fusa.o \
hal/mm/cache/flush_gv11b_fusa.o \
hal/mm/mmu_fault/mmu_fault_gv11b_fusa.o \
hal/ltc/intr/ltc_intr_gp10b_fusa.o \
hal/ltc/intr/ltc_intr_gv11b_fusa.o \
hal/bus/bus_gk20a_fusa.o \
hal/bus/bus_gm20b_fusa.o \
hal/bus/bus_gp10b_fusa.o \
hal/bus/bus_gv11b_fusa.o \
hal/ce/ce_gp10b_fusa.o \
hal/ce/ce_gv11b_fusa.o \
hal/class/class_gv11b_fusa.o \
hal/falcon/falcon_gk20a_fusa.o \
hal/fb/fb_gm20b_fusa.o \
hal/fb/fb_gv11b_fusa.o \
hal/fb/fb_mmu_fault_gv11b_fusa.o \
hal/fb/ecc/fb_ecc_gv11b_fusa.o \
hal/fb/intr/fb_intr_ecc_gv11b_fusa.o \
hal/fb/intr/fb_intr_gv11b_fusa.o \
hal/fifo/channel_gk20a_fusa.o \
hal/fifo/channel_gm20b_fusa.o \
hal/fifo/channel_gv11b_fusa.o \
hal/fifo/ctxsw_timeout_gv11b_fusa.o \
hal/fifo/engine_status_gm20b_fusa.o \
hal/fifo/engine_status_gv100_fusa.o \
hal/fifo/engines_gp10b_fusa.o \
hal/fifo/engines_gv11b_fusa.o \
hal/fifo/fifo_gk20a_fusa.o \
hal/fifo/fifo_gv11b_fusa.o \
hal/fifo/fifo_intr_gk20a_fusa.o \
hal/fifo/fifo_intr_gv11b_fusa.o \
hal/fifo/pbdma_gm20b_fusa.o \
hal/fifo/pbdma_gp10b_fusa.o \
hal/fifo/pbdma_gv11b_fusa.o \
hal/fifo/pbdma_status_gm20b_fusa.o \
hal/fifo/preempt_gv11b_fusa.o \
hal/fifo/ramfc_gp10b_fusa.o \
hal/fifo/ramfc_gv11b_fusa.o \
hal/fifo/ramin_gk20a_fusa.o \
hal/fifo/ramin_gm20b_fusa.o \
hal/fifo/ramin_gv11b_fusa.o \
hal/fifo/runlist_fifo_gk20a_fusa.o \
hal/fifo/runlist_fifo_gv11b_fusa.o \
hal/fifo/runlist_ram_gv11b_fusa.o \
hal/fifo/tsg_gk20a_fusa.o \
hal/fifo/tsg_gv11b_fusa.o \
hal/fifo/usermode_gv11b_fusa.o \
hal/fuse/fuse_gm20b_fusa.o \
hal/fuse/fuse_gp10b_fusa.o \
hal/gr/config/gr_config_gm20b_fusa.o \
hal/gr/config/gr_config_gv100_fusa.o \
hal/gr/ctxsw_prog/ctxsw_prog_gm20b_fusa.o \
hal/gr/ctxsw_prog/ctxsw_prog_gp10b_fusa.o \
hal/gr/ctxsw_prog/ctxsw_prog_gv11b_fusa.o \
hal/gr/ecc/ecc_gv11b_fusa.o \
hal/gr/falcon/gr_falcon_gm20b_fusa.o \
hal/gr/falcon/gr_falcon_gp10b_fusa.o \
hal/gr/falcon/gr_falcon_gv11b_fusa.o \
hal/gr/init/gr_init_gm20b_fusa.o \
hal/gr/init/gr_init_gp10b_fusa.o \
hal/gr/init/gr_init_gv11b_fusa.o \
hal/gr/intr/gr_intr_gm20b_fusa.o \
hal/gr/intr/gr_intr_gp10b_fusa.o \
hal/gr/intr/gr_intr_gv11b_fusa.o \
hal/ltc/ltc_gm20b_fusa.o \
hal/ltc/ltc_gp10b_fusa.o \
hal/ltc/ltc_gv11b_fusa.o \
hal/mc/mc_gm20b_fusa.o \
hal/mc/mc_gp10b_fusa.o \
hal/mc/mc_gv11b_fusa.o \
hal/netlist/netlist_gv11b_fusa.o \
hal/pmu/pmu_gk20a_fusa.o \
hal/pmu/pmu_gv11b_fusa.o \
hal/priv_ring/priv_ring_gm20b_fusa.o \
hal/priv_ring/priv_ring_gp10b_fusa.o \
hal/ptimer/ptimer_gk20a_fusa.o \
hal/ptimer/ptimer_gp10b.o \
hal/ptimer/ptimer_gv11b.o \
hal/therm/therm_gv11b_fusa.o \
hal/top/top_gm20b_fusa.o \
hal/top/top_gv11b_fusa.o
nvgpu-$(CONFIG_NVGPU_HAL_NON_FUSA) += \
hal/ce/ce_tu104.o \
hal/clk/clk_gm20b.o \
hal/init/hal_gp10b.o \
hal/init/hal_gp10b_litter.o \
hal/init/hal_gm20b.o \
hal/init/hal_gm20b_litter.o \
hal/fifo/engine_status_gm20b.o \
hal/fifo/engines_gm20b.o \
hal/fifo/pbdma_gm20b.o \
hal/fifo/pbdma_gp10b.o \
hal/fifo/mmu_fault_gk20a.o \
hal/fifo/mmu_fault_gm20b.o \
hal/fifo/mmu_fault_gp10b.o \
hal/fifo/runlist_fifo_gk20a.o \
hal/fifo/runlist_ram_gk20a.o \
hal/gr/config/gr_config_gm20b.o \
hal/gr/ctxsw_prog/ctxsw_prog_gm20b.o \
hal/gr/ctxsw_prog/ctxsw_prog_gm20b_dbg.o \
hal/gr/gr/gr_gk20a.o \
hal/gr/gr/gr_gm20b.o \
hal/gr/gr/gr_gp10b.o \
hal/ltc/ltc_gm20b.o \
hal/ltc/ltc_gm20b_dbg.o \
hal/mc/mc_gm20b.o \
hal/mm/cache/flush_gk20a.o \
hal/mm/mm_gm20b.o \
hal/mm/mm_gk20a.o \
hal/mm/gmmu/gmmu_gk20a.o \
hal/mm/gmmu/gmmu_gm20b.o \
hal/falcon/falcon_gk20a.o \
hal/netlist/netlist_gm20b.o \
hal/perf/perf_gm20b.o \
hal/power_features/cg/gm20b_gating_reglist.o \
hal/priv_ring/priv_ring_gm20b.o \
hal/regops/regops_gm20b.o \
hal/regops/regops_gp10b.o \
hal/regops/regops_tu104.o \
hal/regops/allowlist_tu104.o \
hal/therm/therm_gm20b.o \
hal/top/top_gm20b.o
ifeq ($(CONFIG_NVGPU_GR_VIRTUALIZATION),y)
nvgpu-$(CONFIG_NVGPU_HAL_NON_FUSA) += \
hal/vgpu/init/vgpu_hal_gv11b.o
endif

View File

@@ -0,0 +1,53 @@
##################### tell Emacs this is a -*- makefile-gmake -*-
#
# Copyright (c) 2019-2020 NVIDIA CORPORATION. All Rights Reserved.
#
# NVIDIA CORPORATION and its licensors retain all intellectual property
# and proprietary rights in and to this software, related documentation
# and any modifications thereto. Any use, reproduction, disclosure or
# distribution of this software and related documentation without an express
# license agreement from NVIDIA CORPORATION is strictly prohibited.
#
# Build the doxygen output.
#
# Some assumptions: this is a local build only. You need installed:
#
# doxygen
# python2
#
# You must also have $TOP and $TEGRA_TOP set; for L4T:
#
# $ export TOP=$TEGRA_TOP
#
# Should work.
#
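# A typical invocation, assuming the checkout layout described above, is:
#
#   $ export TOP=$TEGRA_TOP
#   $ make          # regenerates doxygen/sources, then runs doxygen
#   $ make clean    # removes the generated sources list and the html output
#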
PYTHON2 = python2.7
ARCH = $(TEGRA_TOP)/core-private/tools/arch/arch.py
NVGPU_ARCH = $(TOP)/kernel/nvgpu/arch
ARCH_YAML = $(NVGPU_ARCH)/*.yaml
# Build the doxygen output. But make sure the sources file is generated
# first.
all: doxygen/sources
doxygen doxygen/Doxyfile.safety
# Generate the sources file. This has a list of files that we shall include
# in the doxygen output.
doxygen/sources: $(ARCH) $(ARCH_YAML)
$(ARCH) --arch-file $(NVGPU_ARCH)/nvgpu.yaml files \
--safe --gpu igpu --gpu both \
--prefix 'INPUT += ' > doxygen/Doxyfile.sources.safety
@if [ ! -z "$(EXTRA_PATH)" ] ; then \
$(ARCH) --arch-file $(NVGPU_ARCH)/nvgpu.yaml \
--include-path $(EXTRA_PATH) files \
--safe --gpu igpu --gpu both \
--prefix 'INPUT += $(EXTRA_PATH)/' \
>> doxygen/Doxyfile.sources.safety ; \
cat $(EXTRA_PATH)/unit-tests/SWUTS.sources \
>> doxygen/Doxyfile.sources.safety ; \
fi
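# For reference, doxygen/Doxyfile.sources.safety ends up as a sequence of
# "INPUT += <path>" lines, one per selected source file, for example
# (hypothetical path):
#   INPUT += common/mm/vm.c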
clean:
rm -rf doxygen/Doxyfile.sources.safety
rm -rf html

View File

@@ -0,0 +1,225 @@
# Turn off all other configs, if CONFIG_GK20A is not set
CONFIG_GK20A := m
# Enable GK20A PMU features.
CONFIG_GK20A_PMU := y
# Enable support for the GK20A graphics engine on Tegra
# by adding a Tegra platform interface to the GK20A driver.
CONFIG_TEGRA_GK20A := y
# Enable support for loading the High Secure binary, using
# Write Protected Regions (WPR) for storing ucodes, and bootstrapping
# PMU, FECS and GPCCS in Low Secure mode.
CONFIG_TEGRA_ACR := y
# Support for debugger APIs
CONFIG_NVGPU_DEBUGGER := y
# Support for iGPU LS PMU enable/disable
CONFIG_NVGPU_LS_PMU := y
# Enable/Disable NVGPU logging
CONFIG_NVGPU_LOGGING := y
# Enable/Disable support for HALs from chips that do not have functional
# safety certification
CONFIG_NVGPU_HAL_NON_FUSA := y
# Support recovery on failure (which may involve engine reset)
CONFIG_NVGPU_RECOVERY := y
# Support for compression
CONFIG_NVGPU_COMPRESSION := y
# Enable support for extraction of comptags for CDE.
ifeq ($(CONFIG_NVGPU_COMPRESSION),y)
CONFIG_NVGPU_SUPPORT_CDE := y
endif
ifeq ($(CONFIG_COMMON_CLK),y)
ifeq ($(CONFIG_PM_DEVFREQ),y)
# Select this entry to enable gk20a scaling
CONFIG_GK20A_DEVFREQ := y
# Disable support to pass PM_QOS constraints to devfreq based scaling.
CONFIG_GK20A_PM_QOS := n
endif
endif
# Say Y here to allow nvgpu to track and keep statistics on
# the system memory used by the driver. This recreates some of the
# kmem_leak tracking, but is also applicable to other OSes which do
# not have Linux's kmem_leak.
#CONFIG_NVGPU_TRACK_MEM_USAGE := n
# Enable the cycle stats debugging features.
CONFIG_NVGPU_CYCLESTATS := y
# Enable support for the NVGPU Context Switch Tracing. In this mode,
# FECS collects timestamps for contexts loaded on GR engine. This
# allows tracking context switches on GR engine, as well as
# identifying processes that submitted work.
CONFIG_NVGPU_FECS_TRACE := y
# Enable support in GK20A for the nvhost (host1x) dma engine hardware
# that includes things like hardware syncpts. This requires
# TEGRA_GRHOST
ifdef CONFIG_TEGRA_GRHOST
CONFIG_TEGRA_GK20A_NVHOST := y
endif
ifdef CONFIG_TEGRA_HOST1X_NEXT
CONFIG_TEGRA_GK20A_NVHOST := y
CONFIG_TEGRA_GK20A_NVHOST_HOST1X := y
endif
# Enable support for GPUs on PCIe bus.
ifeq ($(CONFIG_PCI),y)
# Support for NVGPU DGPU
CONFIG_NVGPU_DGPU := y
endif
# Enable nvgpu debug facility to redirect debug spew to ftrace. This
# affects kernel memory use, so should not be enabled by default.
ifeq ($(CONFIG_TRACING),y)
#CONFIG_GK20A_TRACE_PRINTK := y
endif
# Use tegra_alloc_fd() for allocating dma_buf fds. This allocates
# fds above 1024, which exempts them from counting against the
# process fd limit.
ifeq ($(CONFIG_NV_TEGRA_MC),y)
CONFIG_NVGPU_USE_TEGRA_ALLOC_FD := y
endif
# Support Nvlink
ifeq ($(CONFIG_TEGRA_NVLINK),y)
CONFIG_NVGPU_NVLINK := y
endif
# Support NVGPU Virtualization
ifeq ($(CONFIG_TEGRA_GR_VIRTUALIZATION),y)
CONFIG_NVGPU_GR_VIRTUALIZATION := y
endif
# Support for NVGPU VPR
ifeq ($(CONFIG_TEGRA_VPR),y)
CONFIG_NVGPU_VPR := y
endif
# Support Tegra fuse
ifeq ($(CONFIG_TEGRA_KFUSE),y)
CONFIG_NVGPU_TEGRA_FUSE := y
endif
# GPU job synchronization (fences before and after submits) can use raw
# syncpoints if available and sync fds if chosen. Without syncpoints,
# nvgpu also provides semaphore-backed sync fds to userspace.
#
# Select which kernel-provided API is used for sync fds. Matching
# support is required for the userspace drivers too.
ifeq ($(CONFIG_SYNC),y)
CONFIG_NVGPU_SYNCFD_ANDROID := y
else ifeq ($(CONFIG_SYNC_FILE), y)
CONFIG_NVGPU_SYNCFD_STABLE := y
else
CONFIG_NVGPU_SYNCFD_NONE := y
endif
# The check below indicates that the build is invoked from Nvidia's
# internal build system.
ifneq ($(NV_BUILD_KERNEL_OPTIONS),)
# Disable the below configs for kstable
ifneq ($(findstring stable,$(NV_BUILD_KERNEL_OPTIONS)),)
CONFIG_GK20A_DEVFREQ := n
CONFIG_GK20A_PM_QOS := n
else ifneq ($(filter 4.9 4.14,$(patsubst -,$(space),$(NV_BUILD_KERNEL_OPTIONS))),)
# Enable support to pass PM_QOS constraints to devfreq based scaling.
CONFIG_GK20A_PM_QOS := y
endif
endif
ifeq ($(CONFIG_GK20A_PMU),y)
ccflags-y += -DCONFIG_GK20A_PMU
endif
ifeq ($(CONFIG_TEGRA_GK20A),y)
ccflags-y += -DCONFIG_TEGRA_GK20A
endif
ifeq ($(CONFIG_TEGRA_ACR),y)
ccflags-y += -DCONFIG_TEGRA_ACR
endif
ifeq ($(CONFIG_NVGPU_DEBUGGER),y)
ccflags-y += -DCONFIG_NVGPU_DEBUGGER
endif
ifeq ($(CONFIG_NVGPU_LS_PMU),y)
ccflags-y += -DCONFIG_NVGPU_LS_PMU
endif
ifeq ($(CONFIG_NVGPU_LOGGING),y)
ccflags-y += -DCONFIG_NVGPU_LOGGING
endif
ifeq ($(CONFIG_NVGPU_HAL_NON_FUSA),y)
ccflags-y += -DCONFIG_NVGPU_HAL_NON_FUSA
endif
ifeq ($(CONFIG_NVGPU_RECOVERY),y)
ccflags-y += -DCONFIG_NVGPU_RECOVERY
endif
ifeq ($(CONFIG_NVGPU_COMPRESSION),y)
ccflags-y += -DCONFIG_NVGPU_COMPRESSION
endif
ifeq ($(CONFIG_NVGPU_SUPPORT_CDE),y)
ccflags-y += -DCONFIG_NVGPU_SUPPORT_CDE
endif
ifeq ($(CONFIG_GK20A_DEVFREQ),y)
ccflags-y += -DCONFIG_GK20A_DEVFREQ
endif
ifeq ($(CONFIG_GK20A_PM_QOS),y)
ccflags-y += -DCONFIG_GK20A_PM_QOS
endif
ifeq ($(CONFIG_NVGPU_TRACK_MEM_USAGE),y)
ccflags-y += -DCONFIG_NVGPU_TRACK_MEM_USAGE
endif
ifeq ($(CONFIG_NVGPU_CYCLESTATS),y)
ccflags-y += -DCONFIG_NVGPU_CYCLESTATS
endif
ifeq ($(CONFIG_NVGPU_FECS_TRACE),y)
ccflags-y += -DCONFIG_NVGPU_FECS_TRACE
endif
ifeq ($(CONFIG_TEGRA_GK20A_NVHOST),y)
ccflags-y += -DCONFIG_TEGRA_GK20A_NVHOST
endif
ifeq ($(CONFIG_TEGRA_GK20A_NVHOST_HOST1X),y)
ccflags-y += -DCONFIG_TEGRA_GK20A_NVHOST_HOST1X
endif
ifeq ($(CONFIG_NVGPU_DGPU),y)
ccflags-y += -DCONFIG_NVGPU_DGPU
endif
ifeq ($(CONFIG_GK20A_TRACE_PRINTK),y)
ccflags-y += -DCONFIG_GK20A_TRACE_PRINTK
endif
ifeq ($(CONFIG_NVGPU_USE_TEGRA_ALLOC_FD),y)
ccflags-y += -DCONFIG_NVGPU_USE_TEGRA_ALLOC_FD
endif
ifeq ($(CONFIG_NVGPU_NVLINK),y)
ccflags-y += -DCONFIG_NVGPU_NVLINK
endif
ifeq ($(CONFIG_NVGPU_GR_VIRTUALIZATION),y)
ccflags-y += -DCONFIG_NVGPU_GR_VIRTUALIZATION
endif
ifeq ($(CONFIG_NVGPU_VPR),y)
ccflags-y += -DCONFIG_NVGPU_VPR
endif
ifeq ($(CONFIG_NVGPU_TEGRA_FUSE),y)
ccflags-y += -DCONFIG_NVGPU_TEGRA_FUSE
endif
ifeq ($(CONFIG_NVGPU_SYNCFD_ANDROID),y)
ccflags-y += -DCONFIG_NVGPU_SYNCFD_ANDROID
endif
ifeq ($(CONFIG_NVGPU_SYNCFD_STABLE),y)
ccflags-y += -DCONFIG_NVGPU_SYNCFD_STABLE
endif
ifeq ($(CONFIG_NVGPU_SYNCFD_NONE),y)
ccflags-y += -DCONFIG_NVGPU_SYNCFD_NONE
endif

View File

@@ -0,0 +1,137 @@
GCOV_PROFILE := y
ccflags-y += -Idrivers/gpu/nvgpu
ccflags-y += -Idrivers/video/tegra/host
ccflags-y += -Idrivers/devfreq
ccflags-y += -I../nvgpu/include
ccflags-y += -I../nvgpu/include/uapi
ccflags-y += -Wno-multichar
ccflags-y += -Werror
ccflags-y += -Wno-error=cpp
ccflags-y += -Wno-duplicate-decl-specifier
ifeq ($(CONFIG_ARCH_TEGRA_18x_SOC),y)
ccflags-y += -I$(srctree)/../nvgpu-t18x/drivers/gpu/nvgpu
ccflags-y += -I$(srctree)/../nvgpu-t18x/include
ccflags-y += -I$(srctree)/../nvgpu-t18x/include/uapi
endif
ifeq ($(CONFIG_TEGRA_19x_GPU),y)
ccflags-y += -I$(srctree)/../nvgpu-t19x/drivers/gpu/nvgpu
ccflags-y += -I$(srctree)/../nvgpu-t19x/include
ccflags-y += -I$(srctree)/../nvgpu-t19x/include/uapi
endif
obj-$(CONFIG_GK20A) := nvgpu.o
nvgpu-y := \
gk20a/gk20a.o \
gk20a/sched_gk20a.o \
gk20a/as_gk20a.o \
gk20a/ctrl_gk20a.o \
gk20a/ce2_gk20a.o \
gk20a/fifo_gk20a.o \
gk20a/channel_gk20a.o \
gk20a/channel_sync_gk20a.o \
gk20a/debug_gk20a.o \
gk20a/dbg_gpu_gk20a.o \
gk20a/regops_gk20a.o \
gk20a/gr_gk20a.o \
gk20a/kind_gk20a.o \
gk20a/mm_gk20a.o \
gk20a/pmu_gk20a.o \
gk20a/priv_ring_gk20a.o \
gk20a/semaphore_gk20a.o \
gk20a/fence_gk20a.o \
gk20a/therm_gk20a.o \
gk20a/gr_ctx_gk20a_sim.o \
gk20a/gr_ctx_gk20a.o \
gk20a/gk20a_gating_reglist.o \
gk20a/gk20a_sysfs.o \
gk20a/ltc_gk20a.o \
gk20a/fb_gk20a.o \
gk20a/hal.o \
gk20a/hal_gk20a.o \
gk20a/gk20a_allocator.o \
gk20a/gk20a_allocator_bitmap.o \
gk20a/gk20a_allocator_buddy.o \
gk20a/cde_gk20a.o \
gk20a/platform_gk20a_generic.o \
gk20a/tsg_gk20a.o \
gk20a/ctxsw_trace_gk20a.o \
gk20a/fecs_trace_gk20a.o \
gk20a/mc_gk20a.o \
gm20b/hal_gm20b.o \
gm20b/ltc_gm20b.o \
gm20b/ce2_gm20b.o \
gm20b/gr_gm20b.o \
gm20b/fb_gm20b.o \
gm20b/fifo_gm20b.o \
gm20b/gr_ctx_gm20b.o \
gm20b/gm20b_gating_reglist.o \
gm20b/acr_gm20b.o \
gm20b/pmu_gm20b.o \
gm20b/mm_gm20b.o \
gm20b/regops_gm20b.o \
gm20b/mc_gm20b.o \
gm20b/debug_gm20b.o \
gm20b/cde_gm20b.o \
gm20b/therm_gm20b.o \
gm206/bios_gm206.o \
gm206/fifo_gm206.o \
gm206/hal_gm206.o \
gm206/gr_gm206.o \
gm206/acr_gm206.o \
gm206/mm_gm206.o \
gm206/pmu_gm206.o \
gm206/ce_gm206.o
nvgpu-$(CONFIG_TEGRA_GK20A) += gk20a/platform_gk20a_tegra.o
nvgpu-$(CONFIG_SYNC) += gk20a/sync_gk20a.o
nvgpu-$(CONFIG_GK20A_PCI) += pci.o
nvgpu-$(CONFIG_TEGRA_GR_VIRTUALIZATION) += \
gk20a/platform_vgpu_tegra.o \
vgpu/ltc_vgpu.o \
vgpu/gr_vgpu.o \
vgpu/fifo_vgpu.o \
vgpu/ce2_vgpu.o \
vgpu/mm_vgpu.o \
vgpu/debug_vgpu.o \
vgpu/vgpu.o \
vgpu/dbg_vgpu.o \
vgpu/fecs_trace_vgpu.o \
vgpu/tsg_vgpu.o \
vgpu/gk20a/vgpu_hal_gk20a.o \
vgpu/gk20a/vgpu_gr_gk20a.o \
vgpu/gm20b/vgpu_hal_gm20b.o \
vgpu/gm20b/vgpu_gr_gm20b.o
nvgpu-$(CONFIG_TEGRA_CLK_FRAMEWORK) += \
gm20b/clk_gm20b.o \
gk20a/clk_gk20a.o
nvgpu-$(CONFIG_GK20A_DEVFREQ) += \
gk20a/gk20a_scale.o
nvgpu-$(CONFIG_GK20A_CYCLE_STATS) += \
gk20a/css_gr_gk20a.o
ifeq ($(CONFIG_ARCH_TEGRA_18x_SOC),y)
ifneq ($(wildcard $(srctree)/../nvgpu-t18x/drivers/gpu/nvgpu/Makefile),)
include $(srctree)/../nvgpu-t18x/drivers/gpu/nvgpu/Makefile
endif
ifneq ($(wildcard $(srctree)/../nvgpu-t18x/drivers/gpu/nvgpu/Makefile.nvgpu-t18x),)
include $(srctree)/../nvgpu-t18x/drivers/gpu/nvgpu/Makefile.nvgpu-t18x
endif
endif
ifeq ($(CONFIG_ARCH_TEGRA_19x_SOC),y)
ifneq ($(wildcard $(srctree)/../nvgpu-t19x/drivers/gpu/nvgpu/Makefile),)
include $(srctree)/../nvgpu-t19x/drivers/gpu/nvgpu/Makefile
endif
ifneq ($(wildcard $(srctree)/../nvgpu-t19x/drivers/gpu/nvgpu/Makefile.nvgpu-t19x),)
include $(srctree)/../nvgpu-t19x/drivers/gpu/nvgpu/Makefile.nvgpu-t19x
endif
endif

View File

@@ -0,0 +1,319 @@
#
# Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a
# copy of this software and associated documentation files (the "Software"),
# to deal in the Software without restriction, including without limitation
# the rights to use, copy, modify, merge, publish, distribute, sublicense,
# and/or sell copies of the Software, and to permit persons to whom the
# Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
# DEALINGS IN THE SOFTWARE.
#
# This file defines the make variables and cflags applicable to nvgpu common
# code shared by the QNX, nvgpu userspace, and test builds. Note that cflags
# are added to the NVGPU_COMMON_CFLAGS variable, which the parent Makefile
# must use to update its own cflags variable.
# Default is the regular profile. That can be overridden, if necessary, by
# setting NVGPU_FORCE_SAFETY_PROFILE. This is a useful hack while we
# wait for the userspace tmake build to make its way into a proper safety
# profile build.
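# Illustration only (the include path and the flag variable in the parent
# build are assumptions): a parent Makefile would typically pull this
# fragment in and then fold the result into its own flags, e.g.
#   include <path-to-this-configs-file>
#   CFLAGS += $(NVGPU_COMMON_CFLAGS)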
profile := default
# Decide whether to use the safety release, safety debug or the regular profile.
ifeq ($(NV_BUILD_CONFIGURATION_IS_SAFETY),1)
profile := safety_release
ifeq ($(NV_BUILD_CONFIGURATION_IS_DEBUG),1)
profile := safety_debug
endif
endif
ifeq ($(NVGPU_FORCE_SAFETY_PROFILE),1)
profile := safety_release
ifeq ($(NVGPU_FORCE_DEBUG_PROFILE),1)
profile := safety_debug
endif
endif
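# Summary of the profile selection above (derived from the checks; later
# assignments win):
#   NV_BUILD_CONFIGURATION_IS_SAFETY=1                 -> safety_release
#   NV_BUILD_CONFIGURATION_IS_SAFETY=1 and IS_DEBUG=1  -> safety_debug
#   NVGPU_FORCE_SAFETY_PROFILE=1                       -> safety_release
#   NVGPU_FORCE_SAFETY_PROFILE=1 and FORCE_DEBUG=1     -> safety_debug
#   otherwise                                          -> default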
NVGPU_COMMON_CFLAGS :=
#
# Flags always enabled regardless of build profile.
#
NVGPU_COMMON_CFLAGS += \
-DCONFIG_TEGRA_GK20A_PMU=1 \
-DCONFIG_TEGRA_ACR=1 \
-DCONFIG_NVGPU_GR_VIRTUALIZATION \
-DCONFIG_PCI_MSI
CONFIG_NVGPU_LOGGING := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_LOGGING
# Syncpoint support provided by nvhost is expected to exist.
CONFIG_TEGRA_GK20A_NVHOST := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_TEGRA_GK20A_NVHOST
# Syncfds are a Linux feature.
CONFIG_NVGPU_SYNCFD_NONE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SYNCFD_NONE
CONFIG_NVGPU_GRAPHICS := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_GRAPHICS
ifeq ($(profile),$(filter $(profile),safety_debug safety_release))
# Enable golden context verification only for safety debug/release build
NVGPU_COMMON_CFLAGS += \
-DCONFIG_NVGPU_GR_GOLDEN_CTX_VERIFICATION \
-DCONFIG_NVGPU_BUILD_CONFIGURATION_IS_SAFETY
## For manual testing of CTXSW FW error codes, enable the configs below in the safety build.
## Enable only one config at a time, because only one error can be tested at a time.
# NVGPU_COMMON_CFLAGS += \
# -DCONFIG_NVGPU_CTXSW_FW_ERROR_WDT_TESTING
#
# NVGPU_COMMON_CFLAGS += \
# -DCONFIG_NVGPU_CTXSW_FW_ERROR_CODE_TESTING
#
# NVGPU_COMMON_CFLAGS += \
# -DCONFIG_NVGPU_CTXSW_FW_ERROR_HEADER_TESTING
ifeq ($(CONFIG_NVGPU_DGPU),1)
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_DGPU
CONFIG_NVGPU_NVLINK := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_NVLINK
# used by sec2 code
CONFIG_NVGPU_ENGINE_QUEUE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_ENGINE_QUEUE
# used in ce_app
CONFIG_NVGPU_FENCE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FENCE
# ce_app uses syncpt (nvgpu_nvhost_syncpt_wait_timeout_ext)
CONFIG_NVGPU_KERNEL_MODE_SUBMIT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_KERNEL_MODE_SUBMIT
CONFIG_NVGPU_FALCON_NON_FUSA := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FALCON_NON_FUSA
CONFIG_NVGPU_GR_FALCON_NON_SECURE_BOOT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_GR_FALCON_NON_SECURE_BOOT
CONFIG_NVGPU_SM_DIVERSITY := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SM_DIVERSITY
CONFIG_NVGPU_USE_3LSS_ERR_INJECTION := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_USE_3LSS_ERR_INJECTION
CONFIG_NVGPU_LS_PMU := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_LS_PMU
CONFIG_NVGPU_CLK_ARB := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CLK_ARB
endif
endif
CONFIG_NVGPU_TEGRA_FUSE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_TEGRA_FUSE
#
# Flags enabled only for safety debug and regular build profile.
#
ifneq ($(profile),safety_release)
CONFIG_NVGPU_TRACE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_TRACE
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FALCON_DEBUG
#
# Flags enabled only for regular build profile.
#
ifneq ($(profile),safety_debug)
CONFIG_NVGPU_SYSFS := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SYSFS
# ACR feature to enable old tegra ACR profile support
CONFIG_NVGPU_ACR_LEGACY := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_ACR_LEGACY
CONFIG_NVGPU_ENGINE_QUEUE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_ENGINE_QUEUE
CONFIG_NVGPU_DEBUGGER := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_DEBUGGER
CONFIG_NVGPU_PROFILER := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_PROFILER
CONFIG_NVGPU_RECOVERY := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_RECOVERY
CONFIG_NVGPU_CILP := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CILP
CONFIG_NVGPU_GFXP := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_GFXP
CONFIG_NVGPU_CYCLESTATS := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CYCLESTATS
CONFIG_NVGPU_FECS_TRACE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FECS_TRACE
ifneq ($(CONFIG_NVGPU_DGPU),1)
CONFIG_NVGPU_IGPU_VIRT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_IGPU_VIRT
endif
# Enable the usage of 3LSS error injection features.
CONFIG_NVGPU_USE_3LSS_ERR_INJECTION := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_USE_3LSS_ERR_INJECTION
# Enable nvlink support for normal build.
CONFIG_NVGPU_NVLINK := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_NVLINK
# Enable tpc_powergate support for normal build.
CONFIG_NVGPU_TPC_POWERGATE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_TPC_POWERGATE
# Enable mssnvlink0 reset control for normal build
CONFIG_MSSNVLINK0_RST_CONTROL := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_MSSNVLINK0_RST_CONTROL
# Enable dgpu support for normal build.
CONFIG_NVGPU_DGPU := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_DGPU
# Enable nvgpu_next for normal build
ifneq ($(NV_BUILD_CONFIGURATION_IS_EXTERNAL), 1)
CONFIG_NVGPU_NEXT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_NEXT
endif
CONFIG_NVGPU_VPR := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_VPR
CONFIG_NVGPU_REPLAYABLE_FAULT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_REPLAYABLE_FAULT
# Enable LS PMU support for normal build
CONFIG_NVGPU_LS_PMU := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_LS_PMU
# Enable elpg support for normal build
CONFIG_NVGPU_POWER_PG := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_POWER_PG
# Enable sim support for normal build
CONFIG_NVGPU_SIM := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SIM
CONFIG_NVGPU_COMPRESSION := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_COMPRESSION
# Enable non FUSA HALs for normal build
CONFIG_NVGPU_HAL_NON_FUSA := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_HAL_NON_FUSA
# Enable non FUSA common code for normal build
CONFIG_NVGPU_NON_FUSA := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_NON_FUSA
CONFIG_NVGPU_CLK_ARB := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CLK_ARB
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FALCON_NON_FUSA
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_IOCTL_NON_FUSA
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_DETERMINISTIC_CHANNELS
CONFIG_NVGPU_GR_FALCON_NON_SECURE_BOOT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_GR_FALCON_NON_SECURE_BOOT
CONFIG_NVGPU_SET_FALCON_ACCESS_MAP := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SET_FALCON_ACCESS_MAP
# Enable SW Semaphore for normal build
CONFIG_NVGPU_SW_SEMAPHORE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SW_SEMAPHORE
# Enable Channel WDT for safety build until we switch to user mode submits only
CONFIG_NVGPU_CHANNEL_WDT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CHANNEL_WDT
# Enable Kernel Mode submit for safety build until we switch to user mode
# submits only
CONFIG_NVGPU_KERNEL_MODE_SUBMIT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_KERNEL_MODE_SUBMIT
# Enable fences for safety build until we switch to user mode submits only
CONFIG_NVGPU_FENCE := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FENCE
# Enable powergate lib for normal build
CONFIG_NVGPU_USE_POWERGATE_LIB := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_USE_POWERGATE_LIB
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_FIFO_ENGINE_ACTIVITY
# Enable dynamic busy/idle support
CONFIG_NVGPU_DYNAMIC_BUSY_IDLE_SUPPORT := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_DYNAMIC_BUSY_IDLE_SUPPORT
# Enable HW based error injection support
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_INJECT_HWERR
# Enable Channel/TSG Scheduling
CONFIG_NVGPU_CHANNEL_TSG_SCHEDULING := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CHANNEL_TSG_SCHEDULING
# Enable Channel/TSG Control
CONFIG_NVGPU_CHANNEL_TSG_CONTROL := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_CHANNEL_TSG_CONTROL
# Enable Virtualization server for normal build
NVGPU_COMMON_CFLAGS += -DCONFIG_TEGRA_GR_VIRTUALIZATION_SERVER
# Enable SM diversity support for normal build
CONFIG_NVGPU_SM_DIVERSITY := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_SM_DIVERSITY
# Enable Multi Instance GPU support for normal build
CONFIG_NVGPU_MIG := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_MIG
endif
endif
# Enable USERD only if kernel mode submit is supported
ifeq ($(CONFIG_NVGPU_KERNEL_MODE_SUBMIT),1)
CONFIG_NVGPU_USERD := 1
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_USERD
endif
ifeq ($(CONFIG_NVGPU_DEBUGGER),1)
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_ENGINE_RESET
endif
ifeq ($(CONFIG_NVGPU_RECOVERY),1)
NVGPU_COMMON_CFLAGS += -DCONFIG_NVGPU_ENGINE_RESET
endif

View File

@@ -0,0 +1,711 @@
# -*- mode: makefile -*-
#
# Copyright (c) 2018-2021, NVIDIA CORPORATION. All rights reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a
# copy of this software and associated documentation files (the "Software"),
# to deal in the Software without restriction, including without limitation
# the rights to use, copy, modify, merge, publish, distribute, sublicense,
# and/or sell copies of the Software, and to permit persons to whom the
# Software is furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
# DEALINGS IN THE SOFTWARE.
srcs :=
ifdef NVGPU_POSIX
srcs += os/posix/nvgpu.c \
os/posix/posix-io.c \
os/posix/mock-registers.c \
os/posix/posix-nvgpu_mem.c \
os/posix/posix-dma.c \
os/posix/posix-vm.c \
os/posix/firmware.c \
os/posix/soc.c \
os/posix/error_notifier.c \
os/posix/posix-channel.c \
os/posix/posix-tsg.c \
os/posix/stubs.c \
os/posix/posix-nvhost.c \
os/posix/posix-vgpu.c \
os/posix/posix-dt.c \
os/posix/fuse.c
ifdef CONFIG_NVGPU_VPR
srcs += os/posix/posix-vpr.c
endif
ifdef CONFIG_NVGPU_FECS_TRACE
srcs += os/posix/fecs_trace_posix.c
endif
ifeq ($(CONFIG_NVGPU_CLK_ARB),1)
srcs += os/posix/posix-clk_arb.c
endif
ifdef CONFIG_NVGPU_NVLINK
srcs += os/posix/posix-nvlink.c
endif
ifeq ($(CONFIG_NVGPU_COMPRESSION),1)
srcs += os/posix/posix-comptags.c
endif
ifeq ($(CONFIG_NVGPU_LOGGING),1)
srcs += os/posix/log.c
endif
ifeq ($(CONFIG_NVGPU_DGPU),1)
srcs += os/posix/posix-vidmem.c
endif
endif
# POSIX sources shared between the POSIX and QNX builds.
srcs += os/posix/bug.c \
os/posix/rwsem.c \
os/posix/timers.c \
os/posix/cond.c \
os/posix/lock.c \
os/posix/thread.c \
os/posix/os_sched.c \
os/posix/bitmap.c \
os/posix/kmem.c \
os/posix/file_ops.c \
os/posix/queue.c
ifeq ($(NV_BUILD_CONFIGURATION_IS_SAFETY),0)
srcs += os/posix/bsearch.c
endif
srcs += common/device.c \
common/utils/enabled.c \
common/utils/errata.c \
common/utils/rbtree.c \
common/utils/string.c \
common/utils/worker.c \
common/swdebug/profile.c \
common/init/nvgpu_init.c \
common/mm/allocators/nvgpu_allocator.c \
common/mm/allocators/bitmap_allocator.c \
common/mm/allocators/buddy_allocator.c \
common/mm/gmmu/page_table.c \
common/mm/gmmu/pd_cache.c \
common/mm/gmmu/pte.c \
common/mm/as.c \
common/mm/vm.c \
common/mm/vm_area.c \
common/mm/nvgpu_mem.c \
common/mm/nvgpu_sgt.c \
common/mm/mm.c \
common/mm/dma.c \
common/therm/therm.c \
common/ltc/ltc.c \
common/fb/fb.c \
common/fbp/fbp.c \
common/io/io.c \
common/ecc.c \
common/falcon/falcon.c \
common/falcon/falcon_sw_gk20a.c \
common/gr/gr.c \
common/gr/gr_utils.c \
common/gr/gr_intr.c \
common/gr/global_ctx.c \
common/gr/subctx.c \
common/gr/ctx.c \
common/gr/gr_falcon.c \
common/gr/gr_config.c \
common/gr/gr_setup.c \
common/gr/obj_ctx.c \
common/gr/fs_state.c \
common/gr/gr_ecc.c \
common/netlist/netlist.c \
common/pmu/pmu.c \
common/acr/acr.c \
common/acr/acr_wpr.c \
common/acr/acr_blob_alloc.c \
common/acr/acr_blob_construct.c \
common/acr/acr_bootstrap.c \
common/acr/acr_sw_gv11b.c \
common/ptimer/ptimer.c \
common/power_features/cg/cg.c \
common/sync/channel_user_syncpt.c \
common/fifo/preempt.c \
common/fifo/channel.c \
common/fifo/fifo.c \
common/fifo/pbdma.c \
common/fifo/tsg.c \
common/fifo/runlist.c \
common/fifo/engine_status.c \
common/fifo/engines.c \
common/fifo/pbdma_status.c \
common/mc/mc.c \
common/rc/rc.c \
common/ce/ce.c \
common/grmgr/grmgr.c \
common/cic/cic.c \
common/cic/cic_intr.c \
common/cic/ce_cic.c \
common/cic/ctxsw_cic.c \
common/cic/ecc_cic.c \
common/cic/host_cic.c \
common/cic/gr_cic.c \
common/cic/pri_cic.c \
common/cic/pmu_cic.c \
common/cic/mmu_cic.c \
common/cic/msg_cic.c \
hal/init/hal_gv11b.c \
hal/init/hal_gv11b_litter.c \
hal/init/hal_init.c \
hal/power_features/cg/gv11b_gating_reglist.c \
hal/fifo/runlist_fifo_gv11b.c \
hal/fifo/userd_gk20a.c \
hal/sync/syncpt_cmdbuf_gv11b.c
# Source files below are functionally safe (FuSa) and must always be included.
srcs += hal/mm/mm_gv11b_fusa.c \
hal/mm/mm_gp10b_fusa.c \
hal/mm/gmmu/gmmu_gv11b_fusa.c \
hal/mm/gmmu/gmmu_gp10b_fusa.c \
hal/mm/gmmu/gmmu_gk20a_fusa.c \
hal/mm/gmmu/gmmu_gm20b_fusa.c \
hal/mm/cache/flush_gk20a_fusa.c \
hal/mm/cache/flush_gv11b_fusa.c \
hal/mm/mmu_fault/mmu_fault_gv11b_fusa.c \
hal/ltc/intr/ltc_intr_gp10b_fusa.c \
hal/ltc/intr/ltc_intr_gv11b_fusa.c \
hal/bus/bus_gk20a_fusa.c \
hal/bus/bus_gm20b_fusa.c \
hal/bus/bus_gp10b_fusa.c \
hal/bus/bus_gv11b_fusa.c \
hal/ce/ce_gp10b_fusa.c \
hal/ce/ce_gv11b_fusa.c \
hal/class/class_gv11b_fusa.c \
hal/falcon/falcon_gk20a_fusa.c \
hal/fb/fb_gm20b_fusa.c \
hal/fb/fb_gv11b_fusa.c \
hal/fb/fb_mmu_fault_gv11b_fusa.c \
hal/fb/ecc/fb_ecc_gv11b_fusa.c \
hal/fb/intr/fb_intr_ecc_gv11b_fusa.c \
hal/fb/intr/fb_intr_gv11b_fusa.c \
hal/fifo/channel_gk20a_fusa.c \
hal/fifo/channel_gm20b_fusa.c \
hal/fifo/channel_gv11b_fusa.c \
hal/fifo/ctxsw_timeout_gv11b_fusa.c \
hal/fifo/engine_status_gm20b_fusa.c \
hal/fifo/engine_status_gv100_fusa.c \
hal/fifo/engines_gp10b_fusa.c \
hal/fifo/engines_gv11b_fusa.c \
hal/fifo/fifo_gk20a_fusa.c \
hal/fifo/fifo_gv11b_fusa.c \
hal/fifo/fifo_intr_gk20a_fusa.c \
hal/fifo/fifo_intr_gv11b_fusa.c \
hal/fifo/pbdma_gm20b_fusa.c \
hal/fifo/pbdma_gp10b_fusa.c \
hal/fifo/pbdma_gv11b_fusa.c \
hal/fifo/pbdma_status_gm20b_fusa.c \
hal/fifo/preempt_gv11b_fusa.c \
hal/fifo/ramfc_gp10b_fusa.c \
hal/fifo/ramfc_gv11b_fusa.c \
hal/fifo/ramin_gk20a_fusa.c \
hal/fifo/ramin_gm20b_fusa.c \
hal/fifo/ramin_gv11b_fusa.c \
hal/fifo/runlist_fifo_gk20a_fusa.c \
hal/fifo/runlist_fifo_gv11b_fusa.c \
hal/fifo/runlist_ram_gv11b_fusa.c \
hal/fifo/tsg_gk20a_fusa.c \
hal/fifo/tsg_gv11b_fusa.c \
hal/fifo/usermode_gv11b_fusa.c \
hal/fuse/fuse_gm20b_fusa.c \
hal/fuse/fuse_gp10b_fusa.c \
hal/gr/config/gr_config_gm20b_fusa.c \
hal/gr/config/gr_config_gv100_fusa.c \
hal/gr/ctxsw_prog/ctxsw_prog_gm20b_fusa.c \
hal/gr/ctxsw_prog/ctxsw_prog_gp10b_fusa.c \
hal/gr/ctxsw_prog/ctxsw_prog_gv11b_fusa.c \
hal/gr/ecc/ecc_gv11b_fusa.c \
hal/gr/falcon/gr_falcon_gm20b_fusa.c \
hal/gr/falcon/gr_falcon_gp10b_fusa.c \
hal/gr/falcon/gr_falcon_gv11b_fusa.c \
hal/gr/init/gr_init_gm20b_fusa.c \
hal/gr/init/gr_init_gp10b_fusa.c \
hal/gr/init/gr_init_gv11b_fusa.c \
hal/gr/intr/gr_intr_gm20b_fusa.c \
hal/gr/intr/gr_intr_gp10b_fusa.c \
hal/gr/intr/gr_intr_gv11b_fusa.c \
hal/ltc/ltc_gm20b_fusa.c \
hal/ltc/ltc_gp10b_fusa.c \
hal/ltc/ltc_gv11b_fusa.c \
hal/mc/mc_gm20b_fusa.c \
hal/mc/mc_gp10b_fusa.c \
hal/mc/mc_gv11b_fusa.c \
hal/netlist/netlist_gv11b_fusa.c \
hal/pmu/pmu_gk20a_fusa.c \
hal/pmu/pmu_gv11b_fusa.c \
hal/priv_ring/priv_ring_gm20b_fusa.c \
hal/priv_ring/priv_ring_gp10b_fusa.c \
hal/ptimer/ptimer_gk20a_fusa.c \
hal/sync/syncpt_cmdbuf_gv11b_fusa.c \
hal/therm/therm_gv11b_fusa.c \
hal/top/top_gm20b_fusa.c \
hal/top/top_gv11b_fusa.c \
hal/cic/cic_gv11b_fusa.c \
hal/cic/cic_lut_gv11b_fusa.c
# Source files below are not guaranteed to be functionally safe (FuSa) and are
# only included in the normal build.
ifeq ($(CONFIG_NVGPU_HAL_NON_FUSA),1)
srcs += hal/init/hal_gp10b.c \
hal/init/hal_gp10b_litter.c \
hal/init/hal_gm20b.c \
hal/init/hal_gm20b_litter.c \
hal/mm/cache/flush_gk20a.c \
hal/mm/mm_gm20b.c \
hal/mm/mm_gk20a.c \
hal/mm/gmmu/gmmu_gk20a.c \
hal/mm/gmmu/gmmu_gm20b.c \
hal/mc/mc_gm20b.c \
hal/bus/bus_gk20a.c \
hal/class/class_gm20b.c \
hal/class/class_gp10b.c \
hal/clk/clk_gm20b.c \
hal/falcon/falcon_gk20a.c \
hal/gr/config/gr_config_gm20b.c \
hal/gr/ecc/ecc_gp10b.c \
hal/gr/ecc/ecc_gv11b.c \
hal/gr/init/gr_init_gm20b.c \
hal/gr/init/gr_init_gp10b.c \
hal/gr/init/gr_init_gv11b.c \
hal/gr/intr/gr_intr_gm20b.c \
hal/gr/intr/gr_intr_gp10b.c \
hal/gr/falcon/gr_falcon_gm20b.c \
hal/priv_ring/priv_ring_gm20b.c \
hal/power_features/cg/gm20b_gating_reglist.c \
hal/power_features/cg/gp10b_gating_reglist.c \
hal/ce/ce2_gk20a.c \
hal/therm/therm_gm20b.c \
hal/therm/therm_gp10b.c \
hal/ltc/ltc_gm20b.c \
hal/ltc/ltc_gp10b.c \
hal/ltc/intr/ltc_intr_gm20b.c \
hal/ltc/intr/ltc_intr_gp10b.c \
hal/fb/fb_gp10b.c \
hal/fb/fb_gp106.c \
hal/fb/fb_gm20b.c \
hal/fb/fb_gv11b.c \
hal/fb/intr/fb_intr_ecc_gv11b.c \
hal/fuse/fuse_gm20b.c \
hal/fifo/fifo_gk20a.c \
hal/fifo/preempt_gk20a.c \
hal/fifo/engines_gm20b.c \
hal/fifo/pbdma_gm20b.c \
hal/fifo/pbdma_gp10b.c \
hal/fifo/engine_status_gm20b.c \
hal/fifo/ramfc_gk20a.c \
hal/fifo/ramfc_gp10b.c \
hal/fifo/ramin_gk20a.c \
hal/fifo/ramin_gp10b.c \
hal/fifo/channel_gk20a.c \
hal/fifo/channel_gm20b.c \
hal/fifo/tsg_gk20a.c \
hal/fifo/fifo_intr_gk20a.c \
hal/fifo/mmu_fault_gk20a.c \
hal/fifo/mmu_fault_gm20b.c \
hal/fifo/mmu_fault_gp10b.c \
hal/fifo/ctxsw_timeout_gk20a.c \
hal/fifo/runlist_fifo_gk20a.c \
hal/fifo/runlist_ram_gk20a.c \
hal/netlist/netlist_gm20b.c \
hal/netlist/netlist_gp10b.c \
hal/sync/syncpt_cmdbuf_gk20a.c \
hal/pmu/pmu_gv11b.c \
hal/top/top_gm20b.c \
hal/top/top_gp106.c \
hal/top/top_gp10b.c \
hal/gr/ctxsw_prog/ctxsw_prog_gm20b.c \
hal/gr/ctxsw_prog/ctxsw_prog_gp10b.c \
hal/gr/ctxsw_prog/ctxsw_prog_gv11b.c
else
ifeq ($(CONFIG_NVGPU_DGPU),1)
# non-FUSA files needed to build dGPU in safety
srcs += hal/gr/falcon/gr_falcon_gm20b.c \
hal/fuse/fuse_gm20b.c \
hal/fb/fb_gp106.c \
hal/falcon/falcon_gk20a.c \
hal/bus/bus_gk20a.c \
hal/pmu/pmu_gv11b.c
endif
endif
ifeq ($(CONFIG_NVGPU_CLK_ARB),1)
srcs += \
common/clk_arb/clk_arb.c \
common/clk_arb/clk_arb_gp10b.c
endif
ifeq ($(CONFIG_NVGPU_ACR_LEGACY),1)
srcs += \
common/acr/acr_blob_construct_v0.c \
common/acr/acr_sw_gm20b.c \
common/acr/acr_sw_gp10b.c
endif
ifeq ($(CONFIG_NVGPU_ENGINE_QUEUE),1)
srcs += common/engine_queues/engine_mem_queue.c \
common/engine_queues/engine_dmem_queue.c \
common/engine_queues/engine_emem_queue.c \
common/engine_queues/engine_fb_queue.c
endif
ifeq ($(CONFIG_NVGPU_GRAPHICS),1)
srcs += common/gr/zbc.c \
common/gr/zcull.c \
hal/gr/zbc/zbc_gm20b.c \
hal/gr/zbc/zbc_gp10b.c \
hal/gr/zbc/zbc_gv11b.c \
hal/gr/zcull/zcull_gm20b.c \
hal/gr/zcull/zcull_gv11b.c
endif
ifeq ($(CONFIG_NVGPU_DEBUGGER),1)
srcs += common/debugger.c \
common/regops/regops.c \
common/gr/hwpm_map.c \
common/perf/perfbuf.c \
hal/regops/regops_gv11b.c \
hal/regops/allowlist_gv11b.c \
hal/gr/ctxsw_prog/ctxsw_prog_gm20b_dbg.c \
hal/gr/hwpm_map/hwpm_map_gv100.c \
hal/ltc/ltc_gm20b_dbg.c \
hal/ptimer/ptimer_gp10b.c \
hal/perf/perf_gv11b.c \
hal/perf/perf_tu104.c \
hal/gr/gr/gr_gk20a.c \
hal/gr/gr/gr_gm20b.c \
hal/gr/gr/gr_gp10b.c \
hal/gr/gr/gr_gv11b.c \
hal/gr/gr/gr_gv100.c \
hal/gr/gr/gr_tu104.c
ifeq ($(CONFIG_NVGPU_HAL_NON_FUSA),1)
srcs += hal/regops/regops_gm20b.c \
hal/regops/regops_gp10b.c \
hal/regops/regops_tu104.c \
hal/regops/allowlist_tu104.c \
hal/perf/perf_gm20b.c
endif
endif
ifeq ($(CONFIG_NVGPU_PROFILER),1)
srcs += common/profiler/profiler.c \
common/profiler/pm_reservation.c \
hal/priv_ring/priv_ring_gv11b.c \
hal/ptimer/ptimer_gv11b.c
endif
ifeq ($(CONFIG_NVGPU_KERNEL_MODE_SUBMIT),1)
srcs += common/fifo/submit.c \
common/fifo/priv_cmdbuf.c \
common/fifo/job.c \
common/fifo/channel_worker.c \
common/sync/channel_sync.c \
common/sync/channel_sync_syncpt.c
endif
ifeq ($(CONFIG_NVGPU_CHANNEL_WDT),1)
srcs += common/fifo/watchdog.c \
common/fifo/channel_wdt.c
endif
ifeq ($(CONFIG_NVGPU_SW_SEMAPHORE),1)
srcs += common/semaphore/semaphore_sea.c \
common/semaphore/semaphore_pool.c \
common/semaphore/semaphore_hw.c \
common/semaphore/semaphore.c \
common/sync/channel_sync_semaphore.c \
hal/sync/sema_cmdbuf_gk20a.c \
hal/sync/sema_cmdbuf_gv11b.c
endif
ifeq ($(CONFIG_NVGPU_USERD),1)
srcs += common/fifo/userd.c \
hal/fifo/userd_gv11b.c
endif
ifeq ($(CONFIG_NVGPU_RECOVERY),1)
srcs += hal/rc/rc_gv11b.c
ifeq ($(CONFIG_NVGPU_HAL_NON_FUSA),1)
srcs += hal/rc/rc_gk20a.c
endif
endif
ifeq ($(CONFIG_NVGPU_FENCE),1)
srcs += common/fence/fence.c
ifeq ($(CONFIG_TEGRA_GK20A_NVHOST),1)
srcs += common/fence/fence_syncpt.c
endif
ifeq ($(CONFIG_NVGPU_SW_SEMAPHORE),1)
srcs += common/fence/fence_sema.c
endif
endif
ifeq ($(CONFIG_NVGPU_FECS_TRACE),1)
srcs += common/gr/fecs_trace.c \
hal/gr/fecs_trace/fecs_trace_gm20b.c \
hal/gr/fecs_trace/fecs_trace_gv11b.c
ifeq ($(CONFIG_NVGPU_IGPU_VIRT),1)
srcs += common/vgpu/gr/fecs_trace_vgpu.c
endif
endif
ifeq ($(CONFIG_NVGPU_CYCLESTATS),1)
srcs += common/perf/cyclestats_snapshot.c \
common/cyclestats/cyclestats.c
ifeq ($(CONFIG_NVGPU_IGPU_VIRT),1)
srcs += common/vgpu/perf/cyclestats_snapshot_vgpu.c
endif
endif
# POSIX file used for unit testing on both QNX and Linux
ifdef NVGPU_FAULT_INJECTION_ENABLEMENT
srcs += os/posix/posix-fault-injection.c
endif
ifeq ($(CONFIG_NVGPU_LS_PMU),1)
# Add LS PMU files which are required for normal build
srcs += \
common/pmu/boardobj/boardobj.c \
common/pmu/boardobj/boardobjgrp.c \
common/pmu/boardobj/boardobjgrpmask.c \
common/pmu/boardobj/boardobjgrp_e255.c \
common/pmu/boardobj/boardobjgrp_e32.c \
common/pmu/clk/clk.c \
common/pmu/volt/volt.c \
common/pmu/clk/clk_domain.c \
common/pmu/clk/clk_fll.c \
common/pmu/clk/clk_prog.c \
common/pmu/clk/clk_vf_point.c \
common/pmu/clk/clk_vin.c \
common/pmu/fw/fw.c \
common/pmu/fw/fw_ver_ops.c \
common/pmu/fw/fw_ns_bootstrap.c \
common/pmu/ipc/pmu_cmd.c \
common/pmu/ipc/pmu_msg.c \
common/pmu/ipc/pmu_queue.c \
common/pmu/ipc/pmu_seq.c \
common/pmu/lpwr/rppg.c \
common/pmu/lsfm/lsfm.c \
common/pmu/lsfm/lsfm_sw_gm20b.c \
common/pmu/lsfm/lsfm_sw_gp10b.c \
common/pmu/lsfm/lsfm_sw_gv100.c \
common/pmu/lsfm/lsfm_sw_tu104.c \
common/pmu/perf/vfe_equ.c \
common/pmu/perf/vfe_var.c \
common/pmu/perf/perf.c \
common/pmu/perf/pstate.c \
common/pmu/perf/change_seq.c \
common/pmu/perfmon/pmu_perfmon.c \
common/pmu/perfmon/pmu_perfmon_sw_gm20b.c \
common/pmu/perfmon/pmu_perfmon_sw_gv11b.c \
common/pmu/pmgr/pmgr.c \
common/pmu/pmgr/pmgrpmu.c \
common/pmu/pmgr/pwrdev.c \
common/pmu/pmgr/pwrmonitor.c \
common/pmu/pmgr/pwrpolicy.c \
common/pmu/super_surface/super_surface.c \
common/pmu/therm/thrm.c \
common/pmu/therm/therm_channel.c \
common/pmu/therm/therm_dev.c \
common/pmu/volt/volt_dev.c \
common/pmu/volt/volt_policy.c \
common/pmu/volt/volt_rail.c \
common/pmu/allocator.c \
common/pmu/pmu_debug.c \
common/pmu/pmu_mutex.c \
common/pmu/pmu_pstate.c \
common/pmu/pmu_rtos_init.c \
hal/therm/therm_tu104.c \
hal/pmu/pmu_gk20a.c \
hal/pmu/pmu_gm20b.c \
hal/pmu/pmu_gp10b.c \
hal/pmu/pmu_tu104.c
ifeq ($(CONFIG_NVGPU_POWER_PG),1)
srcs += common/pmu/pg/pg_sw_gm20b.c \
common/pmu/pg/pg_sw_gp10b.c \
common/pmu/pg/pg_sw_gp106.c \
common/pmu/pg/pg_sw_gv11b.c \
common/pmu/pg/pmu_pg.c \
common/pmu/pg/pmu_aelpg.c
endif
ifeq ($(CONFIG_NVGPU_CLK_ARB),1)
srcs += common/clk_arb/clk_arb_gv100.c
endif
endif
ifeq ($(CONFIG_NVGPU_POWER_PG),1)
srcs += common/power_features/pg/pg.c
endif
ifeq ($(CONFIG_NVGPU_IGPU_VIRT),1)
srcs += common/vgpu/init/init_vgpu.c \
common/vgpu/ivc/comm_vgpu.c \
common/vgpu/intr/intr_vgpu.c \
common/vgpu/ptimer/ptimer_vgpu.c \
common/vgpu/top/top_vgpu.c \
common/vgpu/fifo/fifo_vgpu.c \
common/vgpu/fifo/channel_vgpu.c \
common/vgpu/fifo/tsg_vgpu.c \
common/vgpu/fifo/preempt_vgpu.c \
common/vgpu/fifo/runlist_vgpu.c \
common/vgpu/fifo/ramfc_vgpu.c \
common/vgpu/perf/perf_vgpu.c \
common/vgpu/profiler/profiler_vgpu.c \
common/vgpu/mm/mm_vgpu.c \
common/vgpu/mm/vm_vgpu.c \
common/vgpu/gr/gr_vgpu.c \
common/vgpu/fb/fb_vgpu.c \
common/vgpu/gr/ctx_vgpu.c \
common/vgpu/gr/subctx_vgpu.c \
common/vgpu/clk_vgpu.c \
common/vgpu/debugger_vgpu.c \
common/vgpu/pm_reservation_vgpu.c \
common/vgpu/ltc/ltc_vgpu.c \
common/vgpu/fbp/fbp_vgpu.c \
common/vgpu/ce_vgpu.c \
hal/vgpu/init/init_hal_vgpu.c \
hal/vgpu/init/vgpu_hal_gv11b.c \
hal/vgpu/fifo/fifo_gv11b_vgpu.c \
hal/vgpu/sync/syncpt_cmdbuf_gv11b_vgpu.c
ifeq ($(CONFIG_NVGPU_USERD),1)
srcs += common/vgpu/fifo/userd_vgpu.c
endif
ifeq ($(CONFIG_NVGPU_COMPRESSION),1)
srcs += common/vgpu/cbc/cbc_vgpu.c
endif
endif
ifeq ($(CONFIG_NVGPU_COMPRESSION),1)
srcs += common/mm/comptags.c \
common/cbc/cbc.c \
hal/cbc/cbc_gm20b.c \
hal/cbc/cbc_gp10b.c \
hal/cbc/cbc_gv11b.c
endif
ifeq ($(CONFIG_NVGPU_NVLINK),1)
srcs += common/vbios/nvlink_bios.c \
common/nvlink/probe.c \
common/nvlink/init/device_reginit.c \
common/nvlink/init/device_reginit_gv100.c \
common/nvlink/minion.c \
common/nvlink/link_mode_transitions.c \
common/nvlink/nvlink.c \
hal/nvlink/minion_gv100.c \
hal/nvlink/minion_tu104.c \
hal/nvlink/nvlink_gv100.c \
hal/nvlink/nvlink_tu104.c \
hal/nvlink/intr_and_err_handling_tu104.c \
hal/nvlink/link_mode_transitions_gv100.c \
hal/nvlink/link_mode_transitions_tu104.c
endif
ifeq ($(CONFIG_NVGPU_DGPU),1)
srcs += common/sec2/sec2.c \
common/sec2/sec2_allocator.c \
common/sec2/sec2_lsfm.c \
common/sec2/ipc/sec2_cmd.c \
common/sec2/ipc/sec2_msg.c \
common/sec2/ipc/sec2_queue.c \
common/sec2/ipc/sec2_seq.c \
common/vbios/bios.c \
common/vbios/bios_sw_gv100.c \
common/vbios/bios_sw_tu104.c \
common/falcon/falcon_sw_tu104.c \
common/acr/acr_sw_tu104.c \
common/mm/allocators/page_allocator.c \
common/mm/vidmem.c \
common/pramin.c \
common/ce/ce_app.c \
common/sbr/sbr.c \
hal/mm/mm_gv100.c \
hal/mm/mm_tu104.c \
hal/mc/mc_gv100.c \
hal/mc/mc_tu104.c \
hal/bus/bus_gv100.c \
hal/bus/bus_tu104.c \
hal/ce/ce_tu104.c \
hal/class/class_tu104.c \
hal/clk/clk_tu104.c \
hal/clk/clk_mon_tu104.c \
hal/gr/init/gr_init_gv100.c \
hal/gr/init/gr_init_tu104.c \
hal/gr/intr/gr_intr_tu104.c \
hal/gr/falcon/gr_falcon_tu104.c \
hal/fbpa/fbpa_tu104.c \
hal/init/hal_tu104.c \
hal/init/hal_tu104_litter.c \
hal/power_features/cg/tu104_gating_reglist.c \
hal/ltc/ltc_tu104.c \
hal/fb/fb_gv100.c \
hal/fb/fb_tu104.c \
hal/fb/fb_mmu_fault_tu104.c \
hal/fb/intr/fb_intr_gv100.c \
hal/fb/intr/fb_intr_tu104.c \
hal/func/func_tu104.c \
hal/fifo/fifo_tu104.c \
hal/fifo/usermode_tu104.c \
hal/fifo/pbdma_tu104.c \
hal/fifo/ramfc_tu104.c \
hal/fifo/ramin_tu104.c \
hal/fifo/channel_gv100.c \
hal/fifo/runlist_ram_tu104.c \
hal/fifo/runlist_fifo_gv100.c \
hal/fifo/runlist_fifo_tu104.c \
hal/fifo/fifo_intr_gv100.c \
hal/fuse/fuse_gp106.c \
hal/fuse/fuse_tu104.c \
hal/netlist/netlist_gv100.c \
hal/netlist/netlist_tu104.c \
hal/nvdec/nvdec_gp106.c \
hal/nvdec/nvdec_tu104.c \
hal/gsp/gsp_tu104.c \
hal/sec2/sec2_tu104.c \
hal/pramin/pramin_gp10b.c \
hal/pramin/pramin_gv100.c \
hal/pramin/pramin_init.c \
hal/pramin/pramin_tu104.c \
hal/bios/bios_tu104.c \
hal/top/top_gv100.c \
hal/xve/xve_gp106.c \
hal/xve/xve_tu104.c
ifeq ($(CONFIG_NVGPU_COMPRESSION),1)
srcs += hal/cbc/cbc_tu104.c
endif
endif
ifeq ($(CONFIG_NVGPU_SIM),1)
srcs += common/sim/sim.c \
common/sim/sim_pci.c \
common/sim/sim_netlist.c
endif
ifeq ($(CONFIG_NVGPU_NON_FUSA),1)
srcs += common/power_features/power_features.c
endif
ifeq ($(CONFIG_NVGPU_TPC_POWERGATE),1)
srcs += hal/tpc/tpc_gv11b.c
endif

51
drivers/gpu/nvgpu/acr.h Normal file
View File

@@ -0,0 +1,51 @@
/*
* Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved.
*
* This program is free software; you can redistribute it and/or modify it
* under the terms and conditions of the GNU General Public License,
* version 2, as published by the Free Software Foundation.
*
* This program is distributed in the hope it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
* more details.
*/
#ifndef __ACR_H_
#define __ACR_H_
#include "gm20b/mm_gm20b.h"
#include "gm20b/acr_gm20b.h"
#include "gm206/acr_gm206.h"
#ifdef CONFIG_ARCH_TEGRA_18x_SOC
#include "acr_t18x.h"
#endif
struct acr_desc {
struct mem_desc ucode_blob;
struct mem_desc wpr_dummy;
struct bin_hdr *bl_bin_hdr;
struct hsflcn_bl_desc *pmu_hsbl_desc;
struct bin_hdr *hsbin_hdr;
struct acr_fw_header *fw_hdr;
u32 pmu_args;
const struct firmware *acr_fw;
union{
struct flcn_acr_desc *acr_dmem_desc;
#ifdef CONFIG_ARCH_TEGRA_18x_SOC
struct flcn_acr_desc_v1 *acr_dmem_desc_v1;
#endif
};
struct mem_desc acr_ucode;
const struct firmware *hsbl_fw;
struct mem_desc hsbl_ucode;
union {
struct flcn_bl_dmem_desc bl_dmem_desc;
struct flcn_bl_dmem_desc_v1 bl_dmem_desc_v1;
};
const struct firmware *pmu_fw;
const struct firmware *pmu_desc;
u32 capabilities;
};
#endif /*__ACR_H_*/

View File

@@ -0,0 +1,172 @@
/*
* Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/types.h>
#include <nvgpu/dma.h>
#include <nvgpu/firmware.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/acr.h>
#include "acr_priv.h"
#ifdef CONFIG_NVGPU_ACR_LEGACY
#include "acr_sw_gm20b.h"
#include "acr_sw_gp10b.h"
#endif
#include "acr_sw_gv11b.h"
#ifdef CONFIG_NVGPU_DGPU
#include "acr_sw_tu104.h"
#endif
#if defined(CONFIG_NVGPU_NEXT) && defined(CONFIG_NVGPU_NON_FUSA)
#include "nvgpu_next_gpuid.h"
#endif
/* ACR public API's */
bool nvgpu_acr_is_lsf_lazy_bootstrap(struct gk20a *g, struct nvgpu_acr *acr,
u32 falcon_id)
{
if (acr == NULL) {
return false;
}
if ((falcon_id == FALCON_ID_FECS) || (falcon_id == FALCON_ID_PMU) ||
(falcon_id == FALCON_ID_GPCCS)) {
return acr->lsf[falcon_id].is_lazy_bootstrap;
} else {
nvgpu_err(g, "Invalid falcon id\n");
return false;
}
}
#ifdef CONFIG_NVGPU_DGPU
int nvgpu_acr_alloc_blob_prerequisite(struct gk20a *g, struct nvgpu_acr *acr,
size_t size)
{
if (acr == NULL) {
return -EINVAL;
}
return acr->alloc_blob_space(g, size, &acr->ucode_blob);
}
#endif
/* ACR blob construct & bootstrap */
int nvgpu_acr_bootstrap_hs_acr(struct gk20a *g, struct nvgpu_acr *acr)
{
int err = 0;
if (acr == NULL) {
return -EINVAL;
}
err = acr->bootstrap_hs_acr(g, acr);
if (err != 0) {
nvgpu_err(g, "ACR bootstrap failed");
}
nvgpu_log(g, gpu_dbg_gr, "ACR bootstrap Done");
return err;
}
int nvgpu_acr_construct_execute(struct gk20a *g)
{
int err = 0;
if (g->acr == NULL) {
return -EINVAL;
}
err = g->acr->prepare_ucode_blob(g);
if (err != 0) {
nvgpu_err(g, "ACR ucode blob prepare failed");
goto done;
}
err = nvgpu_acr_bootstrap_hs_acr(g, g->acr);
if (err != 0) {
nvgpu_err(g, "Bootstrap HS ACR failed");
}
done:
return err;
}
/* ACR init */
int nvgpu_acr_init(struct gk20a *g)
{
u32 ver = nvgpu_safe_add_u32(g->params.gpu_arch,
g->params.gpu_impl);
int err = 0;
if (g->acr != NULL) {
/*
* Recovery/unrailgate case: ACR init is not needed, as ACR was set up
* during cold boot and ACR clean-up is not executed as part of that
* sequence, so the existing state is reused for a faster boot.
*/
return err;
}
g->acr = (struct nvgpu_acr *)nvgpu_kzalloc(g, sizeof(struct nvgpu_acr));
if (g->acr == NULL) {
err = -ENOMEM;
goto done;
}
switch (ver) {
#ifdef CONFIG_NVGPU_ACR_LEGACY
case GK20A_GPUID_GM20B:
case GK20A_GPUID_GM20B_B:
nvgpu_gm20b_acr_sw_init(g, g->acr);
break;
case NVGPU_GPUID_GP10B:
nvgpu_gp10b_acr_sw_init(g, g->acr);
break;
#endif
case NVGPU_GPUID_GV11B:
nvgpu_gv11b_acr_sw_init(g, g->acr);
break;
#if defined(CONFIG_NVGPU_NEXT)
case NVGPU_NEXT_GPUID:
nvgpu_next_acr_sw_init(g, g->acr);
break;
#endif
#ifdef CONFIG_NVGPU_DGPU
case NVGPU_GPUID_TU104:
nvgpu_tu104_acr_sw_init(g, g->acr);
break;
#if defined(CONFIG_NVGPU_NEXT)
case NVGPU_NEXT_DGPU_GPUID:
nvgpu_next_dgpu_acr_sw_init(g, g->acr);
break;
#endif
#endif
default:
nvgpu_kfree(g, g->acr);
err = -EINVAL;
nvgpu_err(g, "no support for GPUID %x", ver);
break;
}
done:
return err;
}

View File

@@ -0,0 +1,63 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/types.h>
#include <nvgpu/dma.h>
#include <nvgpu/gk20a.h>
#include "acr_wpr.h"
#include "acr_priv.h"
#include "acr_blob_alloc.h"
int nvgpu_acr_alloc_blob_space_sys(struct gk20a *g, size_t size,
struct nvgpu_mem *mem)
{
return nvgpu_dma_alloc_flags_sys(g, NVGPU_DMA_PHYSICALLY_ADDRESSED,
size, mem);
}
#ifdef CONFIG_NVGPU_DGPU
int nvgpu_acr_alloc_blob_space_vid(struct gk20a *g, size_t size,
struct nvgpu_mem *mem)
{
struct wpr_carveout_info wpr_inf;
int err;
if (mem->size != 0ULL) {
return 0;
}
g->acr->get_wpr_info(g, &wpr_inf);
/*
* Even though this mem_desc wouldn't be used, the wpr region needs to
* be reserved in the allocator.
*/
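/*
* In other words: the first allocation below pins the WPR carveout
* itself (wpr_dummy at wpr_inf.wpr_base) so the vidmem allocator will
* not hand that range out again, and the second allocation places the
* actual ucode blob at wpr_inf.nonwpr_base.
*/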
err = nvgpu_dma_alloc_vid_at(g, wpr_inf.size,
&g->acr->wpr_dummy, wpr_inf.wpr_base);
if (err != 0) {
return err;
}
return nvgpu_dma_alloc_vid_at(g, wpr_inf.size, mem,
wpr_inf.nonwpr_base);
}
#endif

View File

@@ -0,0 +1,36 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_BLOB_ALLOC_H
#define ACR_BLOB_ALLOC_H
struct gk20a;
struct nvgpu_mem;
int nvgpu_acr_alloc_blob_space_sys(struct gk20a *g, size_t size,
struct nvgpu_mem *mem);
#ifdef CONFIG_NVGPU_DGPU
int nvgpu_acr_alloc_blob_space_vid(struct gk20a *g, size_t size,
struct nvgpu_mem *mem);
#endif
#endif /* ACR_BLOB_ALLOC_H */

View File

File diff suppressed because it is too large

View File

@@ -0,0 +1,153 @@
/*
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_BLOB_CONSTRUCT_H
#define ACR_BLOB_CONSTRUCT_H
#include <nvgpu/falcon.h>
#include <nvgpu/flcnif_cmn.h>
#include <nvgpu/pmu.h>
#include "nvgpu_acr_interface.h"
#define UCODE_NB_MAX_DATE_LENGTH 64U
struct ls_falcon_ucode_desc {
u32 descriptor_size;
u32 image_size;
u32 tools_version;
u32 app_version;
char date[UCODE_NB_MAX_DATE_LENGTH];
u32 bootloader_start_offset;
u32 bootloader_size;
u32 bootloader_imem_offset;
u32 bootloader_entry_point;
u32 app_start_offset;
u32 app_size;
u32 app_imem_offset;
u32 app_imem_entry;
u32 app_dmem_offset;
u32 app_resident_code_offset;
u32 app_resident_code_size;
u32 app_resident_data_offset;
u32 app_resident_data_size;
u32 nb_imem_overlays;
u32 nb_dmem_overlays;
struct {u32 start; u32 size; } load_ovl[UCODE_NB_MAX_DATE_LENGTH];
u32 compressed;
};
struct ls_falcon_ucode_desc_v1 {
u32 descriptor_size;
u32 image_size;
u32 tools_version;
u32 app_version;
char date[UCODE_NB_MAX_DATE_LENGTH];
u32 secure_bootloader;
u32 bootloader_start_offset;
u32 bootloader_size;
u32 bootloader_imem_offset;
u32 bootloader_entry_point;
u32 app_start_offset;
u32 app_size;
u32 app_imem_offset;
u32 app_imem_entry;
u32 app_dmem_offset;
u32 app_resident_code_offset;
u32 app_resident_code_size;
u32 app_resident_data_offset;
u32 app_resident_data_size;
u32 nb_imem_overlays;
u32 nb_dmem_overlays;
struct {u32 start; u32 size; } load_ovl[64];
u32 compressed;
};
struct flcn_ucode_img {
u32 *data;
struct ls_falcon_ucode_desc *desc;
u32 data_size;
struct lsf_ucode_desc *lsf_desc;
bool is_next_core_img;
#if defined(CONFIG_NVGPU_NEXT)
struct falcon_next_core_ucode_desc *ndesc;
#endif
};
struct lsfm_managed_ucode_img {
struct lsfm_managed_ucode_img *next;
struct lsf_wpr_header wpr_header;
struct lsf_lsb_header lsb_header;
struct flcn_bl_dmem_desc bl_gen_desc;
u32 bl_gen_desc_size;
u32 full_ucode_size;
struct flcn_ucode_img ucode_img;
};
#ifdef CONFIG_NVGPU_DGPU
/*
* LSF shared SubWpr Header
*
* use_case_id - Shared SubWpr use case ID (updated by nvgpu)
* start_addr - start address of subWpr (updated by nvgpu)
* size_4K - size of subWpr in 4K (updated by nvgpu)
*/
struct lsf_shared_sub_wpr_header {
u32 use_case_id;
u32 start_addr;
u32 size_4K;
};
/*
* LSFM SUB WPRs struct
* pnext : Next entry in the list, NULL if last
* sub_wpr_header : SubWpr Header struct
*/
struct lsfm_sub_wpr {
struct lsfm_sub_wpr *pnext;
struct lsf_shared_sub_wpr_header sub_wpr_header;
};
#endif
struct ls_flcn_mgr {
u16 managed_flcn_cnt;
u32 wpr_size;
struct lsfm_managed_ucode_img *ucode_img_list;
#ifdef CONFIG_NVGPU_DGPU
u16 managed_sub_wpr_count;
struct lsfm_sub_wpr *psub_wpr_list;
#endif
};
int nvgpu_acr_prepare_ucode_blob(struct gk20a *g);
#ifdef CONFIG_NVGPU_LS_PMU
int nvgpu_acr_lsf_pmu_ucode_details(struct gk20a *g, void *lsf_ucode_img);
#if defined(CONFIG_NVGPU_NEXT)
s32 nvgpu_acr_lsf_pmu_ncore_ucode_details(struct gk20a *g, void *lsf_ucode_img);
#endif
#endif
int nvgpu_acr_lsf_fecs_ucode_details(struct gk20a *g, void *lsf_ucode_img);
int nvgpu_acr_lsf_gpccs_ucode_details(struct gk20a *g, void *lsf_ucode_img);
#ifdef CONFIG_NVGPU_DGPU
int nvgpu_acr_lsf_sec2_ucode_details(struct gk20a *g, void *lsf_ucode_img);
#endif
#endif /* ACR_BLOB_CONSTRUCT_H */

View File

@@ -0,0 +1,801 @@
/*
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/firmware.h>
#include <nvgpu/pmu.h>
#include <nvgpu/falcon.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/string.h>
#include <nvgpu/bug.h>
#include <nvgpu/gr/gr_falcon.h>
#include <nvgpu/pmu/fw.h>
#include <nvgpu/gr/gr_utils.h>
#include "acr_blob_construct_v0.h"
#include "acr_wpr.h"
#include "acr_priv.h"
#ifdef CONFIG_NVGPU_LS_PMU
int nvgpu_acr_lsf_pmu_ucode_details_v0(struct gk20a *g, void *lsf_ucode_img)
{
struct lsf_ucode_desc_v0 *lsf_desc;
struct nvgpu_firmware *fw_sig;
struct nvgpu_firmware *fw_desc;
struct nvgpu_firmware *fw_image;
struct flcn_ucode_img_v0 *p_img = (struct flcn_ucode_img_v0 *)lsf_ucode_img;
int err = 0;
lsf_desc = nvgpu_kzalloc(g, sizeof(struct lsf_ucode_desc_v0));
if (lsf_desc == NULL) {
err = -ENOMEM;
goto exit;
}
fw_sig = nvgpu_pmu_fw_sig_desc(g, g->pmu);
fw_desc = nvgpu_pmu_fw_desc_desc(g, g->pmu);
fw_image = nvgpu_pmu_fw_image_desc(g, g->pmu);
nvgpu_memcpy((u8 *)lsf_desc, (u8 *)fw_sig->data,
min_t(size_t, sizeof(*lsf_desc), fw_sig->size));
lsf_desc->falcon_id = FALCON_ID_PMU;
p_img->desc = (struct pmu_ucode_desc *)(void *)fw_desc->data;
p_img->data = (u32 *)(void *)fw_image->data;
p_img->data_size = p_img->desc->image_size;
p_img->lsf_desc = (struct lsf_ucode_desc_v0 *)lsf_desc;
exit:
return err;
}
#endif
int nvgpu_acr_lsf_fecs_ucode_details_v0(struct gk20a *g, void *lsf_ucode_img)
{
struct lsf_ucode_desc_v0 *lsf_desc;
struct nvgpu_firmware *fecs_sig;
struct flcn_ucode_img_v0 *p_img = (struct flcn_ucode_img_v0 *)lsf_ucode_img;
struct nvgpu_gr_falcon *gr_falcon = nvgpu_gr_get_falcon_ptr(g);
struct nvgpu_ctxsw_ucode_segments *fecs =
nvgpu_gr_falcon_get_fecs_ucode_segments(gr_falcon);
int err;
fecs_sig = nvgpu_request_firmware(g, GM20B_FECS_UCODE_SIG, 0);
if (fecs_sig == NULL) {
nvgpu_err(g, "failed to load fecs sig");
return -ENOENT;
}
lsf_desc = nvgpu_kzalloc(g, sizeof(struct lsf_ucode_desc_v0));
if (lsf_desc == NULL) {
err = -ENOMEM;
goto rel_sig;
}
nvgpu_memcpy((u8 *)lsf_desc, (u8 *)fecs_sig->data,
min_t(size_t, sizeof(*lsf_desc), fecs_sig->size));
lsf_desc->falcon_id = FALCON_ID_FECS;
p_img->desc = nvgpu_kzalloc(g, sizeof(struct pmu_ucode_desc));
if (p_img->desc == NULL) {
err = -ENOMEM;
goto free_lsf_desc;
}
p_img->desc->bootloader_start_offset = fecs->boot.offset;
p_img->desc->bootloader_size = NVGPU_ALIGN(fecs->boot.size, 256U);
p_img->desc->bootloader_imem_offset = fecs->boot_imem_offset;
p_img->desc->bootloader_entry_point = fecs->boot_entry;
p_img->desc->image_size = NVGPU_ALIGN(fecs->boot.size, 256U) +
NVGPU_ALIGN(fecs->code.size, 256U) + NVGPU_ALIGN(fecs->data.size, 256U);
p_img->desc->app_size = NVGPU_ALIGN(fecs->code.size, 256U) +
NVGPU_ALIGN(fecs->data.size, 256U);
p_img->desc->app_start_offset = fecs->code.offset;
p_img->desc->app_imem_offset = 0;
p_img->desc->app_imem_entry = 0;
p_img->desc->app_dmem_offset = 0;
p_img->desc->app_resident_code_offset = 0;
p_img->desc->app_resident_code_size = fecs->code.size;
p_img->desc->app_resident_data_offset =
fecs->data.offset - fecs->code.offset;
p_img->desc->app_resident_data_size = fecs->data.size;
p_img->data = nvgpu_gr_falcon_get_surface_desc_cpu_va(gr_falcon);
p_img->data_size = p_img->desc->image_size;
p_img->lsf_desc = (struct lsf_ucode_desc_v0 *)lsf_desc;
nvgpu_acr_dbg(g, "fecs fw loaded\n");
nvgpu_release_firmware(g, fecs_sig);
return 0;
free_lsf_desc:
nvgpu_kfree(g, lsf_desc);
rel_sig:
nvgpu_release_firmware(g, fecs_sig);
return err;
}
int nvgpu_acr_lsf_gpccs_ucode_details_v0(struct gk20a *g, void *lsf_ucode_img)
{
struct lsf_ucode_desc_v0 *lsf_desc;
struct nvgpu_firmware *gpccs_sig;
struct flcn_ucode_img_v0 *p_img = (struct flcn_ucode_img_v0 *)lsf_ucode_img;
struct nvgpu_gr_falcon *gr_falcon = nvgpu_gr_get_falcon_ptr(g);
struct nvgpu_ctxsw_ucode_segments *gpccs =
nvgpu_gr_falcon_get_gpccs_ucode_segments(gr_falcon);
int err;
if (!nvgpu_is_enabled(g, NVGPU_SEC_SECUREGPCCS)) {
return -ENOENT;
}
gpccs_sig = nvgpu_request_firmware(g, T18x_GPCCS_UCODE_SIG, 0);
if (gpccs_sig == NULL) {
nvgpu_err(g, "failed to load gpccs sig");
return -ENOENT;
}
lsf_desc = nvgpu_kzalloc(g, sizeof(struct lsf_ucode_desc_v0));
if (lsf_desc == NULL) {
err = -ENOMEM;
goto rel_sig;
}
nvgpu_memcpy((u8 *)lsf_desc, (u8 *)gpccs_sig->data,
min_t(size_t, sizeof(*lsf_desc), gpccs_sig->size));
lsf_desc->falcon_id = FALCON_ID_GPCCS;
p_img->desc = nvgpu_kzalloc(g, sizeof(struct pmu_ucode_desc));
if (p_img->desc == NULL) {
err = -ENOMEM;
goto free_lsf_desc;
}
p_img->desc->bootloader_start_offset =
0;
p_img->desc->bootloader_size = NVGPU_ALIGN(gpccs->boot.size, 256U);
p_img->desc->bootloader_imem_offset = gpccs->boot_imem_offset;
p_img->desc->bootloader_entry_point = gpccs->boot_entry;
p_img->desc->image_size = NVGPU_ALIGN(gpccs->boot.size, 256U) +
NVGPU_ALIGN(gpccs->code.size, 256U) +
NVGPU_ALIGN(gpccs->data.size, 256U);
p_img->desc->app_size = NVGPU_ALIGN(gpccs->code.size, 256U) +
NVGPU_ALIGN(gpccs->data.size, 256U);
p_img->desc->app_start_offset = p_img->desc->bootloader_size;
p_img->desc->app_imem_offset = 0;
p_img->desc->app_imem_entry = 0;
p_img->desc->app_dmem_offset = 0;
p_img->desc->app_resident_code_offset = 0;
p_img->desc->app_resident_code_size = NVGPU_ALIGN(gpccs->code.size, 256U);
p_img->desc->app_resident_data_offset =
NVGPU_ALIGN(gpccs->data.offset, 256U) -
NVGPU_ALIGN(gpccs->code.offset, 256U);
p_img->desc->app_resident_data_size = NVGPU_ALIGN(gpccs->data.size, 256U);
p_img->data = (u32 *)
((u8 *)nvgpu_gr_falcon_get_surface_desc_cpu_va(gr_falcon) +
gpccs->boot.offset);
p_img->data_size = NVGPU_ALIGN(p_img->desc->image_size, 256U);
p_img->lsf_desc = (struct lsf_ucode_desc_v0 *)lsf_desc;
nvgpu_acr_dbg(g, "gpccs fw loaded\n");
nvgpu_release_firmware(g, gpccs_sig);
return 0;
free_lsf_desc:
nvgpu_kfree(g, lsf_desc);
rel_sig:
nvgpu_release_firmware(g, gpccs_sig);
return err;
}
/*
* @brief lsfm_fill_static_lsb_hdr_info
* Populate static LSB header information using the provided ucode image
*/
static void lsfm_fill_static_lsb_hdr_info(struct gk20a *g,
u32 falcon_id, struct lsfm_managed_ucode_img_v0 *pnode)
{
u32 full_app_size = 0;
u32 data = 0;
if (pnode->ucode_img.lsf_desc != NULL) {
nvgpu_memcpy((u8 *)&pnode->lsb_header.signature,
(u8 *)pnode->ucode_img.lsf_desc,
sizeof(struct lsf_ucode_desc_v0));
}
pnode->lsb_header.ucode_size = pnode->ucode_img.data_size;
/* Uses a loader, i.e. has a descriptor. */
pnode->lsb_header.data_size = 0;
/*
* The loader code size is already aligned (padded) such that
* the code following it is aligned, but the size in the image
* desc is not; bloat it up to a 256-byte alignment.
*/
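/*
* Hypothetical example of the size bloat computed below: with
* bootloader_size = 0x180, app_size = 0x14A0 and
* app_resident_data_offset = 0xE00,
*   bl_code_size  = ALIGN(0x180, 256)          = 0x200
*   full_app_size = ALIGN(0x14A0, 256) + 0x200 = 0x1700
*   ucode_size    = ALIGN(0xE00, 256) + 0x200  = 0x1000
*   data_size     = 0x1700 - 0x1000            = 0x700
*/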
pnode->lsb_header.bl_code_size = NVGPU_ALIGN(
pnode->ucode_img.desc->bootloader_size,
LSF_BL_CODE_SIZE_ALIGNMENT);
full_app_size = NVGPU_ALIGN(pnode->ucode_img.desc->app_size,
LSF_BL_CODE_SIZE_ALIGNMENT) +
pnode->lsb_header.bl_code_size;
pnode->lsb_header.ucode_size = NVGPU_ALIGN(
pnode->ucode_img.desc->app_resident_data_offset,
LSF_BL_CODE_SIZE_ALIGNMENT) +
pnode->lsb_header.bl_code_size;
pnode->lsb_header.data_size = full_app_size -
pnode->lsb_header.ucode_size;
/*
* Though the BL is located at 0th offset of the image, the VA
* is different to make sure that it doesn't collide with the actual
* OS VA range.
*/
pnode->lsb_header.bl_imem_off =
pnode->ucode_img.desc->bootloader_imem_offset;
pnode->lsb_header.flags = 0;
if (falcon_id == FALCON_ID_PMU) {
data = NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_TRUE;
pnode->lsb_header.flags = data;
}
if (g->acr->lsf[falcon_id].is_priv_load) {
pnode->lsb_header.flags |=
NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD_TRUE;
}
}
/* Add a ucode image to the list of managed ucode images. */
static int lsfm_add_ucode_img(struct gk20a *g, struct ls_flcn_mgr_v0 *plsfm,
struct flcn_ucode_img_v0 *ucode_image, u32 falcon_id)
{
struct lsfm_managed_ucode_img_v0 *pnode;
pnode = nvgpu_kzalloc(g, sizeof(struct lsfm_managed_ucode_img_v0));
if (pnode == NULL) {
return -ENOMEM;
}
/* Keep a copy of the ucode image info locally */
nvgpu_memcpy((u8 *)&pnode->ucode_img, (u8 *)ucode_image,
sizeof(struct flcn_ucode_img_v0));
/* Fill in static WPR header info*/
pnode->wpr_header.falcon_id = falcon_id;
pnode->wpr_header.bootstrap_owner = g->acr->bootstrap_owner;
pnode->wpr_header.status = LSF_IMAGE_STATUS_COPY;
pnode->wpr_header.lazy_bootstrap =
(u32)g->acr->lsf[falcon_id].is_lazy_bootstrap;
/* Fill in static LSB header info elsewhere */
lsfm_fill_static_lsb_hdr_info(g, falcon_id, pnode);
pnode->next = plsfm->ucode_img_list;
plsfm->ucode_img_list = pnode;
return 0;
}
/* Discover all managed falcon ucode images */
static int lsfm_discover_ucode_images(struct gk20a *g,
struct ls_flcn_mgr_v0 *plsfm)
{
struct flcn_ucode_img_v0 ucode_img;
struct nvgpu_acr *acr = g->acr;
u32 falcon_id;
u32 i;
int err = 0;
/*
* Enumerate all constructed falcon objects, as we need the ucode
* image info and total falcon count
*/
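/*
* lsf_enable_mask is indexed by FALCON_ID_*; for each enabled falcon
* the registered get_lsf_ucode_details hook (e.g.
* nvgpu_acr_lsf_fecs_ucode_details_v0 above) fills the temporary
* flcn_ucode_img_v0, which is then copied into the LSFM list.
*/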
for (i = 0U; i < FALCON_ID_END; i++) {
if (nvgpu_test_bit(i, (void *)&acr->lsf_enable_mask) &&
acr->lsf[i].get_lsf_ucode_details != NULL) {
(void) memset(&ucode_img, 0, sizeof(ucode_img));
if (acr->lsf[i].get_lsf_ucode_details(g,
(void *)&ucode_img) != 0) {
nvgpu_err(g, "LS falcon-%d ucode get failed", i);
goto exit;
}
if (ucode_img.lsf_desc != NULL) {
/*
* falcon_id is formed by grabbing the static
* base falcon_id from the image and adding the
* engine-designated falcon instance.
*/
falcon_id = ucode_img.lsf_desc->falcon_id;
err = lsfm_add_ucode_img(g, plsfm, &ucode_img,
falcon_id);
if (err != 0) {
nvgpu_err(g, " Failed to add falcon-%d to LSFM ",
falcon_id);
goto exit;
}
plsfm->managed_flcn_cnt++;
}
}
}
exit:
return err;
}
/* Generate WPR requirements for ACR allocation request */
static int lsf_gen_wpr_requirements(struct gk20a *g, struct ls_flcn_mgr_v0 *plsfm)
{
struct lsfm_managed_ucode_img_v0 *pnode = plsfm->ucode_img_list;
u32 wpr_offset;
/*
* Start with an array of WPR headers at the base of the WPR.
* The expectation here is that the secure falcon will do a single DMA
* read of this array and cache it internally so it's OK to pack these.
* Also, we add 1 to the falcon count to indicate the end of the array.
*/
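/*
* Rough sketch of the WPR layout this routine computes (offsets are
* relative to the WPR base; alignment values come from the defines in
* acr_blob_construct_v0.h):
*   +0   lsf_wpr_header_v0[managed_flcn_cnt + 1]  (terminator last)
*   then, per managed falcon:
*     256-aligned   lsf_lsb_header_v0
*     4K-aligned    ucode image (data_size bytes)
*     256-aligned   bl_gen_desc (boot loader DMEM args)
*/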
wpr_offset = U32(sizeof(struct lsf_wpr_header_v0)) *
(U32(plsfm->managed_flcn_cnt) + U32(1));
/*
* Walk the managed falcons, accounting for the LSB structs
* as well as the ucode images.
*/
while (pnode != NULL) {
/* Align, save off, and include an LSB header size */
wpr_offset = NVGPU_ALIGN(wpr_offset, LSF_LSB_HEADER_ALIGNMENT);
pnode->wpr_header.lsb_offset = wpr_offset;
wpr_offset += (u32)sizeof(struct lsf_lsb_header_v0);
/*
* Align, save off, and include the original (static)
* ucode image size
*/
wpr_offset = NVGPU_ALIGN(wpr_offset,
LSF_UCODE_DATA_ALIGNMENT);
pnode->lsb_header.ucode_off = wpr_offset;
wpr_offset += pnode->ucode_img.data_size;
/*
* For falcons that use a boot loader (BL), we append a loader
* desc structure on the end of the ucode image and consider this
* the boot loader data. The host will then copy the loader desc
* args to this space within the WPR region (before locking down)
* and the HS bin will then copy them to DMEM 0 for the loader.
*/
/*
* Track the size for LSB details filled in later.
* Note that at this point we don't know what kind of
* boot loader desc it is, so we just take the size of the
* generic one, which is the largest it will ever be.
*/
/* Align (size bloat) and save off generic descriptor size */
pnode->lsb_header.bl_data_size = NVGPU_ALIGN(
(u32)sizeof(pnode->bl_gen_desc),
LSF_BL_DATA_SIZE_ALIGNMENT);
/* Align, save off, and include the additional BL data */
wpr_offset = NVGPU_ALIGN(wpr_offset,
LSF_BL_DATA_ALIGNMENT);
pnode->lsb_header.bl_data_off = wpr_offset;
wpr_offset += pnode->lsb_header.bl_data_size;
/* Finally, update ucode surface size to include updates */
pnode->full_ucode_size = wpr_offset -
pnode->lsb_header.ucode_off;
if (pnode->wpr_header.falcon_id != FALCON_ID_PMU) {
pnode->lsb_header.app_code_off =
pnode->lsb_header.bl_code_size;
pnode->lsb_header.app_code_size =
pnode->lsb_header.ucode_size -
pnode->lsb_header.bl_code_size;
pnode->lsb_header.app_data_off =
pnode->lsb_header.ucode_size;
pnode->lsb_header.app_data_size =
pnode->lsb_header.data_size;
}
pnode = pnode->next;
}
plsfm->wpr_size = wpr_offset;
return 0;
}
/* Initialize WPR contents */
static int gm20b_pmu_populate_loader_cfg(struct gk20a *g,
void *lsfm, u32 *p_bl_gen_desc_size)
{
struct wpr_carveout_info wpr_inf;
struct lsfm_managed_ucode_img_v0 *p_lsfm =
(struct lsfm_managed_ucode_img_v0 *)lsfm;
struct flcn_ucode_img_v0 *p_img = &(p_lsfm->ucode_img);
struct loader_config *ldr_cfg = &(p_lsfm->bl_gen_desc.loader_cfg);
u64 addr_base;
struct pmu_ucode_desc *desc;
u64 tmp;
u32 addr_code, addr_data;
if (p_img->desc == NULL) {
/*
* This means it's a header-based ucode,
* so we do not fill the BL gen desc structure.
*/
return -EINVAL;
}
desc = p_img->desc;
/*
* Calculate physical and virtual addresses for various portions of
* the PMU ucode image
* Calculate the 32-bit addresses for the application code, application
* data, and bootloader code. These values are all based on IM_BASE.
* The 32-bit addresses will be the upper 32-bits of the virtual or
* physical addresses of each respective segment.
*/
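/*
* Hypothetical example of the math below, assuming wpr_base =
* 0xC0000000, ucode_off = 0x2000, app_start_offset = 0x200 and
* app_resident_code_offset = 0:
*   addr_base = 0xC0000000 + 0x2000              = 0xC0002000
*   addr_code = (0xC0002000 + 0x200 + 0x0) >> 8  = 0xC00022
* i.e. the value programmed into code_dma_base holds bits [39:8] of
* the 40-bit DMA address, matching the loader_config field comments.
*/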
addr_base = p_lsfm->lsb_header.ucode_off;
g->acr->get_wpr_info(g, &wpr_inf);
addr_base += wpr_inf.wpr_base;
nvgpu_acr_dbg(g, "pmu loader cfg u32 addrbase %x\n", (u32)addr_base);
/*From linux*/
tmp = (addr_base +
desc->app_start_offset +
desc->app_resident_code_offset) >> 8;
nvgpu_assert(tmp <= U32_MAX);
addr_code = u64_lo32(tmp);
nvgpu_acr_dbg(g, "app start %d app res code off %d\n",
desc->app_start_offset, desc->app_resident_code_offset);
tmp = (addr_base +
desc->app_start_offset +
desc->app_resident_data_offset) >> 8;
nvgpu_assert(tmp <= U32_MAX);
addr_data = u64_lo32(tmp);
nvgpu_acr_dbg(g, "app res data offset%d\n",
desc->app_resident_data_offset);
nvgpu_acr_dbg(g, "bl start off %d\n", desc->bootloader_start_offset);
/* Populate the loader_config state*/
ldr_cfg->dma_idx = g->acr->lsf[FALCON_ID_PMU].falcon_dma_idx;
ldr_cfg->code_dma_base = addr_code;
ldr_cfg->code_dma_base1 = 0x0;
ldr_cfg->code_size_total = desc->app_size;
ldr_cfg->code_size_to_load = desc->app_resident_code_size;
ldr_cfg->code_entry_point = desc->app_imem_entry;
ldr_cfg->data_dma_base = addr_data;
ldr_cfg->data_dma_base1 = 0;
ldr_cfg->data_size = desc->app_resident_data_size;
ldr_cfg->overlay_dma_base = addr_code;
ldr_cfg->overlay_dma_base1 = 0x0;
/* Update the argc/argv members*/
ldr_cfg->argc = 1;
#ifdef CONFIG_NVGPU_LS_PMU
nvgpu_pmu_fw_get_cmd_line_args_offset(g, &ldr_cfg->argv);
#endif
*p_bl_gen_desc_size = (u32)sizeof(struct loader_config);
return 0;
}
static int gm20b_flcn_populate_bl_dmem_desc(struct gk20a *g,
void *lsfm, u32 *p_bl_gen_desc_size, u32 falconid)
{
struct wpr_carveout_info wpr_inf;
struct lsfm_managed_ucode_img_v0 *p_lsfm =
(struct lsfm_managed_ucode_img_v0 *)lsfm;
struct flcn_ucode_img_v0 *p_img = &(p_lsfm->ucode_img);
struct flcn_bl_dmem_desc_v0 *ldr_cfg =
&(p_lsfm->bl_gen_desc.bl_dmem_desc);
u64 addr_base;
struct pmu_ucode_desc *desc;
u32 addr_code, addr_data;
u64 tmp;
if (p_img->desc == NULL) {
/*
* This means it's a header-based ucode,
* so we do not fill the BL gen desc structure.
*/
return -EINVAL;
}
desc = p_img->desc;
/*
* Calculate physical and virtual addresses for various portions of
* the PMU ucode image
* Calculate the 32-bit addresses for the application code, application
* data, and bootloader code. These values are all based on IM_BASE.
* The 32-bit addresses will be the upper 32-bits of the virtual or
* physical addresses of each respective segment.
*/
addr_base = p_lsfm->lsb_header.ucode_off;
g->acr->get_wpr_info(g, &wpr_inf);
addr_base += wpr_inf.wpr_base;
nvgpu_acr_dbg(g, "gen loader cfg %x u32 addrbase %x ID\n", (u32)addr_base,
p_lsfm->wpr_header.falcon_id);
tmp = (addr_base +
desc->app_start_offset +
desc->app_resident_code_offset) >> 8;
nvgpu_assert(tmp <= U32_MAX);
addr_code = u64_lo32(tmp);
tmp = (addr_base +
desc->app_start_offset +
desc->app_resident_data_offset) >> 8;
nvgpu_assert(tmp <= U32_MAX);
addr_data = u64_lo32(tmp);
nvgpu_acr_dbg(g, "gen cfg %x u32 addrcode %x & data %x load offset %xID\n",
(u32)addr_code, (u32)addr_data, desc->bootloader_start_offset,
p_lsfm->wpr_header.falcon_id);
/* Populate the LOADER_CONFIG state */
(void) memset((void *) ldr_cfg, 0, sizeof(struct flcn_bl_dmem_desc_v0));
ldr_cfg->ctx_dma = g->acr->lsf[falconid].falcon_dma_idx;
ldr_cfg->code_dma_base = addr_code;
ldr_cfg->non_sec_code_size = desc->app_resident_code_size;
ldr_cfg->data_dma_base = addr_data;
ldr_cfg->data_size = desc->app_resident_data_size;
ldr_cfg->code_entry_point = desc->app_imem_entry;
*p_bl_gen_desc_size = (u32)sizeof(struct flcn_bl_dmem_desc_v0);
return 0;
}
/* Populate falcon boot loader generic desc.*/
static int lsfm_fill_flcn_bl_gen_desc(struct gk20a *g,
struct lsfm_managed_ucode_img_v0 *pnode)
{
int err = -ENOENT;
if (pnode->wpr_header.falcon_id != FALCON_ID_PMU) {
nvgpu_acr_dbg(g, "non pmu. write flcn bl gen desc\n");
err = gm20b_flcn_populate_bl_dmem_desc(g,
pnode, &pnode->bl_gen_desc_size,
pnode->wpr_header.falcon_id);
if (err != 0) {
nvgpu_err(g, "flcn_populate_bl_dmem_desc failed=%d",
err);
}
return err;
}
if (pnode->wpr_header.falcon_id == FALCON_ID_PMU) {
nvgpu_acr_dbg(g, "pmu write flcn bl gen desc\n");
err = gm20b_pmu_populate_loader_cfg(g, pnode,
&pnode->bl_gen_desc_size);
if (err != 0) {
nvgpu_err(g, "pmu_populate_loader_cfg failed=%d",
err);
}
return err;
}
/* Failed to find the falcon requested. */
return err;
}
static int lsfm_init_wpr_contents(struct gk20a *g, struct ls_flcn_mgr_v0 *plsfm,
struct nvgpu_mem *ucode)
{
struct lsfm_managed_ucode_img_v0 *pnode = plsfm->ucode_img_list;
struct lsf_wpr_header_v0 last_wpr_hdr;
u32 i;
int err = 0;
/* The WPR array is at the base of the WPR */
pnode = plsfm->ucode_img_list;
(void) memset(&last_wpr_hdr, 0, sizeof(struct lsf_wpr_header_v0));
i = 0;
/*
* Walk the managed falcons, flush WPR and LSB headers to FB.
* flush any bl args to the storage area relative to the
* ucode image (appended on the end as a DMEM area).
*/
while (pnode != NULL) {
/* Flush WPR header to memory*/
nvgpu_mem_wr_n(g, ucode, i * (u32)sizeof(pnode->wpr_header),
&pnode->wpr_header,
(u32)sizeof(pnode->wpr_header));
nvgpu_acr_dbg(g, "wpr header");
nvgpu_acr_dbg(g, "falconid :%d",
pnode->wpr_header.falcon_id);
nvgpu_acr_dbg(g, "lsb_offset :%x",
pnode->wpr_header.lsb_offset);
nvgpu_acr_dbg(g, "bootstrap_owner :%d",
pnode->wpr_header.bootstrap_owner);
nvgpu_acr_dbg(g, "lazy_bootstrap :%d",
pnode->wpr_header.lazy_bootstrap);
nvgpu_acr_dbg(g, "status :%d",
pnode->wpr_header.status);
/*Flush LSB header to memory*/
nvgpu_mem_wr_n(g, ucode, pnode->wpr_header.lsb_offset,
&pnode->lsb_header,
(u32)sizeof(pnode->lsb_header));
nvgpu_acr_dbg(g, "lsb header");
nvgpu_acr_dbg(g, "ucode_off :%x",
pnode->lsb_header.ucode_off);
nvgpu_acr_dbg(g, "ucode_size :%x",
pnode->lsb_header.ucode_size);
nvgpu_acr_dbg(g, "data_size :%x",
pnode->lsb_header.data_size);
nvgpu_acr_dbg(g, "bl_code_size :%x",
pnode->lsb_header.bl_code_size);
nvgpu_acr_dbg(g, "bl_imem_off :%x",
pnode->lsb_header.bl_imem_off);
nvgpu_acr_dbg(g, "bl_data_off :%x",
pnode->lsb_header.bl_data_off);
nvgpu_acr_dbg(g, "bl_data_size :%x",
pnode->lsb_header.bl_data_size);
nvgpu_acr_dbg(g, "app_code_off :%x",
pnode->lsb_header.app_code_off);
nvgpu_acr_dbg(g, "app_code_size :%x",
pnode->lsb_header.app_code_size);
nvgpu_acr_dbg(g, "app_data_off :%x",
pnode->lsb_header.app_data_off);
nvgpu_acr_dbg(g, "app_data_size :%x",
pnode->lsb_header.app_data_size);
nvgpu_acr_dbg(g, "flags :%x",
pnode->lsb_header.flags);
/* this falcon has a boot loader and related args, flush them */
/* Populate gen bl and flush to memory */
err = lsfm_fill_flcn_bl_gen_desc(g, pnode);
if (err != 0) {
nvgpu_err(g, "bl_gen_desc failed err=%d", err);
return err;
}
nvgpu_mem_wr_n(g, ucode,
pnode->lsb_header.bl_data_off,
&pnode->bl_gen_desc,
pnode->bl_gen_desc_size);
/* Copying of ucode */
nvgpu_mem_wr_n(g, ucode, pnode->lsb_header.ucode_off,
pnode->ucode_img.data,
pnode->ucode_img.data_size);
pnode = pnode->next;
i++;
}
/* Tag the terminator WPR header with an invalid falcon ID. */
last_wpr_hdr.falcon_id = FALCON_ID_INVALID;
nvgpu_mem_wr_n(g, ucode,
(u32)plsfm->managed_flcn_cnt *
(u32)sizeof(struct lsf_wpr_header_v0),
&last_wpr_hdr,
(u32)sizeof(struct lsf_wpr_header_v0));
return err;
}
/* Free any ucode image structure resources. */
static void lsfm_free_ucode_img_res(struct gk20a *g,
struct flcn_ucode_img_v0 *p_img)
{
if (p_img->lsf_desc != NULL) {
nvgpu_kfree(g, p_img->lsf_desc);
p_img->lsf_desc = NULL;
}
}
/* Free any ucode image structure resources. */
static void lsfm_free_nonpmu_ucode_img_res(struct gk20a *g,
struct flcn_ucode_img_v0 *p_img)
{
if (p_img->lsf_desc != NULL) {
nvgpu_kfree(g, p_img->lsf_desc);
p_img->lsf_desc = NULL;
}
if (p_img->desc != NULL) {
nvgpu_kfree(g, p_img->desc);
p_img->desc = NULL;
}
}
static void free_acr_resources(struct gk20a *g, struct ls_flcn_mgr_v0 *plsfm)
{
u32 cnt = plsfm->managed_flcn_cnt;
struct lsfm_managed_ucode_img_v0 *mg_ucode_img;
while (cnt != 0U) {
mg_ucode_img = plsfm->ucode_img_list;
if (mg_ucode_img->ucode_img.lsf_desc->falcon_id ==
FALCON_ID_PMU) {
lsfm_free_ucode_img_res(g, &mg_ucode_img->ucode_img);
} else {
lsfm_free_nonpmu_ucode_img_res(g,
&mg_ucode_img->ucode_img);
}
plsfm->ucode_img_list = mg_ucode_img->next;
nvgpu_kfree(g, mg_ucode_img);
cnt--;
}
}
int nvgpu_acr_prepare_ucode_blob_v0(struct gk20a *g)
{
int err = 0;
struct ls_flcn_mgr_v0 lsfm_l, *plsfm;
struct wpr_carveout_info wpr_inf;
struct nvgpu_gr_falcon *gr_falcon = nvgpu_gr_get_falcon_ptr(g);
if (g->acr->ucode_blob.cpu_va != NULL) {
/* Recovery case, we do not need to form non WPR blob */
return err;
}
plsfm = &lsfm_l;
(void) memset((void *)plsfm, 0, sizeof(struct ls_flcn_mgr_v0));
nvgpu_acr_dbg(g, "fetching GMMU regs\n");
err = g->ops.fb.vpr_info_fetch(g);
if (err != 0) {
nvgpu_err(g, "fb.vpr_info_fetch failed err=%d", err);
return err;
}
err = nvgpu_gr_falcon_init_ctxsw_ucode(g, gr_falcon);
if (err != 0) {
nvgpu_err(g, "gr_falcon_init_ctxsw_ucode failed err=%d", err);
return err;
}
g->acr->get_wpr_info(g, &wpr_inf);
nvgpu_acr_dbg(g, "wpr carveout base:%llx\n", wpr_inf.wpr_base);
nvgpu_acr_dbg(g, "wpr carveout size :%llx\n", wpr_inf.size);
/* Discover all managed falcons*/
err = lsfm_discover_ucode_images(g, plsfm);
nvgpu_acr_dbg(g, " Managed Falcon cnt %d\n", plsfm->managed_flcn_cnt);
if (err != 0) {
goto exit_err;
}
if ((plsfm->managed_flcn_cnt != 0U) &&
(g->acr->ucode_blob.cpu_va == NULL)) {
/* Generate WPR requirements */
err = lsf_gen_wpr_requirements(g, plsfm);
if (err != 0) {
goto exit_err;
}
/* Alloc memory to hold ucode blob contents */
err = g->acr->alloc_blob_space(g, plsfm->wpr_size
, &g->acr->ucode_blob);
if (err != 0) {
goto exit_err;
}
nvgpu_acr_dbg(g, "managed LS falcon %d, WPR size %d bytes.\n",
plsfm->managed_flcn_cnt, plsfm->wpr_size);
err = lsfm_init_wpr_contents(g, plsfm, &g->acr->ucode_blob);
if (err != 0) {
nvgpu_kfree(g, &g->acr->ucode_blob);
goto free_acr;
}
} else {
nvgpu_acr_dbg(g, "LSFM is managing no falcons.\n");
}
nvgpu_acr_dbg(g, "prepare ucode blob return 0\n");
free_acr:
free_acr_resources(g, plsfm);
exit_err:
return err;
}

View File

@@ -0,0 +1,207 @@
/*
* Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_BLOB_CONSTRUCT_V0_H
#define ACR_BLOB_CONSTRUCT_V0_H
#include <nvgpu/falcon.h>
#include <nvgpu/flcnif_cmn.h>
/*
* Light Secure WPR Content Alignments
*/
#define LSF_WPR_HEADER_ALIGNMENT (256U)
#define LSF_SUB_WPR_HEADER_ALIGNMENT (256U)
#define LSF_LSB_HEADER_ALIGNMENT (256U)
#define LSF_BL_DATA_ALIGNMENT (256U)
#define LSF_BL_DATA_SIZE_ALIGNMENT (256U)
#define LSF_BL_CODE_SIZE_ALIGNMENT (256U)
#define LSF_DATA_SIZE_ALIGNMENT (256U)
#define LSF_CODE_SIZE_ALIGNMENT (256U)
#define LSF_UCODE_DATA_ALIGNMENT 4096U
/* Defined for 1MB alignment */
#define SHIFT_1MB (20U)
#define SHIFT_4KB (12U)
/*Light Secure Bootstrap header related defines*/
#define NV_FLCN_ACR_LSF_FLAG_LOAD_CODE_AT_0_FALSE 0U
#define NV_FLCN_ACR_LSF_FLAG_LOAD_CODE_AT_0_TRUE BIT32(0)
#define NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_FALSE 0U
#define NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_TRUE BIT32(2)
#define NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD_TRUE BIT32(3)
#define NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD_FALSE (0U)
/*
* Image Status Defines
*/
#define LSF_IMAGE_STATUS_NONE (0U)
#define LSF_IMAGE_STATUS_COPY (1U)
#define LSF_IMAGE_STATUS_VALIDATION_CODE_FAILED (2U)
#define LSF_IMAGE_STATUS_VALIDATION_DATA_FAILED (3U)
#define LSF_IMAGE_STATUS_VALIDATION_DONE (4U)
#define LSF_IMAGE_STATUS_VALIDATION_SKIPPED (5U)
#define LSF_IMAGE_STATUS_BOOTSTRAP_READY (6U)
/*
* Light Secure WPR Header
* Defines state allowing Light Secure Falcon bootstrapping.
*/
struct lsf_wpr_header_v0 {
u32 falcon_id;
u32 lsb_offset;
u32 bootstrap_owner;
u32 lazy_bootstrap;
u32 status;
};
/*
* Light Secure Falcon Ucode Description Defines
* This structure is prelim and may change as the ucode signing flow evolves.
*/
struct lsf_ucode_desc_v0 {
u8 prd_keys[2][16];
u8 dbg_keys[2][16];
u32 b_prd_present;
u32 b_dbg_present;
u32 falcon_id;
};
/*
* Light Secure Bootstrap Header
* Defines state allowing Light Secure Falcon bootstrapping.
*/
struct lsf_lsb_header_v0 {
struct lsf_ucode_desc_v0 signature;
u32 ucode_off;
u32 ucode_size;
u32 data_size;
u32 bl_code_size;
u32 bl_imem_off;
u32 bl_data_off;
u32 bl_data_size;
u32 app_code_off;
u32 app_code_size;
u32 app_data_off;
u32 app_data_size;
u32 flags;
};
/*
* Union of all supported structures used by bootloaders.
*/
/* Falcon BL interfaces */
/*
* Structure used by the boot-loader to load the rest of the code. This has
* to be filled by NVGPU and copied into DMEM at offset provided in the
* hsflcn_bl_desc.bl_desc_dmem_load_off.
*/
struct flcn_bl_dmem_desc_v0 {
u32 reserved[4]; /*Should be the first element..*/
u32 signature[4]; /*Should be the first element..*/
u32 ctx_dma;
u32 code_dma_base;
u32 non_sec_code_off;
u32 non_sec_code_size;
u32 sec_code_off;
u32 sec_code_size;
u32 code_entry_point;
u32 data_dma_base;
u32 data_size;
u32 code_dma_base1;
u32 data_dma_base1;
};
/*
* Legacy structure used by the current PMU bootloader.
*/
struct loader_config {
u32 dma_idx;
u32 code_dma_base; /* upper 32-bits of 40-bit dma address */
u32 code_size_total;
u32 code_size_to_load;
u32 code_entry_point;
u32 data_dma_base; /* upper 32-bits of 40-bit dma address */
u32 data_size; /* initialized data of the application */
u32 overlay_dma_base; /* upper 32-bits of the 40-bit dma address */
u32 argc;
u32 argv;
u16 code_dma_base1; /* upper 7 bits of 47-bit dma address */
u16 data_dma_base1; /* upper 7 bits of 47-bit dma address */
u16 overlay_dma_base1; /* upper 7 bits of the 47-bit dma address */
};
union flcn_bl_generic_desc {
struct flcn_bl_dmem_desc_v0 bl_dmem_desc;
struct loader_config loader_cfg;
};
struct flcn_ucode_img_v0 {
u32 *data;
struct pmu_ucode_desc *desc; /* only some falcons have descriptor */
u32 data_size;
/* NULL if not a light secure falcon. */
struct lsf_ucode_desc_v0 *lsf_desc;
/* True if there are resources to be freed by the client. */
};
/*
* LSFM Managed Ucode Image
* next : Next image in the list, NULL if last.
* wpr_header : WPR header for this ucode image
* lsb_header : LSB header for this ucode image
* bl_gen_desc : Bootloader generic desc structure for this ucode image
* bl_gen_desc_size : Size of the bootloader desc structure for this ucode image
* full_ucode_size : Surface size required for final ucode image
* ucode_img : Ucode image info
*/
struct lsfm_managed_ucode_img_v0 {
struct lsfm_managed_ucode_img_v0 *next;
struct lsf_wpr_header_v0 wpr_header;
struct lsf_lsb_header_v0 lsb_header;
union flcn_bl_generic_desc bl_gen_desc;
u32 bl_gen_desc_size;
u32 full_ucode_size;
struct flcn_ucode_img_v0 ucode_img;
};
/*
* Defines the structure used to contain all generic information related to
* the LSFM.
*
* Contains the Light Secure Falcon Manager (LSFM) feature related data.
*/
struct ls_flcn_mgr_v0 {
u16 managed_flcn_cnt;
u32 wpr_size;
struct lsfm_managed_ucode_img_v0 *ucode_img_list;
};
int nvgpu_acr_lsf_pmu_ucode_details_v0(struct gk20a *g, void *lsf_ucode_img);
int nvgpu_acr_lsf_fecs_ucode_details_v0(struct gk20a *g, void *lsf_ucode_img);
int nvgpu_acr_lsf_gpccs_ucode_details_v0(struct gk20a *g, void *lsf_ucode_img);
int nvgpu_acr_prepare_ucode_blob_v0(struct gk20a *g);
#endif /* ACR_BLOB_CONSTRUCT_V0_H */

View File

@@ -0,0 +1,254 @@
/*
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/types.h>
#include <nvgpu/dma.h>
#include <nvgpu/timers.h>
#include <nvgpu/nvgpu_mem.h>
#include <nvgpu/firmware.h>
#include <nvgpu/pmu.h>
#include <nvgpu/falcon.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/acr.h>
#include <nvgpu/bug.h>
#include <nvgpu/soc.h>
#include "acr_bootstrap.h"
#include "acr_priv.h"
int nvgpu_acr_wait_for_completion(struct gk20a *g, struct hs_acr *acr_desc,
u32 timeout)
{
u32 flcn_id;
#ifdef CONFIG_NVGPU_FALCON_NON_FUSA
u32 sctl, cpuctl;
#endif
int completion = 0;
u32 data = 0;
u32 bar0_status = 0;
u32 error_type;
nvgpu_log_fn(g, " ");
flcn_id = nvgpu_falcon_get_id(acr_desc->acr_flcn);
completion = nvgpu_falcon_wait_for_halt(acr_desc->acr_flcn, timeout);
if (completion != 0) {
nvgpu_err(g, "flcn-%d: HS ucode boot timed out, limit: %d ms",
flcn_id, timeout);
error_type = ACR_BOOT_TIMEDOUT;
goto exit;
}
if (acr_desc->acr_engine_bus_err_status != NULL) {
completion = acr_desc->acr_engine_bus_err_status(g,
&bar0_status, &error_type);
if (completion != 0) {
nvgpu_err(g, "flcn-%d: ACR engine bus error", flcn_id);
goto exit;
}
}
data = nvgpu_falcon_mailbox_read(acr_desc->acr_flcn, FALCON_MAILBOX_0);
if (data != 0U) {
nvgpu_err(g, "flcn-%d: HS ucode boot failed, err %x", flcn_id,
data);
nvgpu_err(g, "flcn-%d: Mailbox-1 : 0x%x", flcn_id,
nvgpu_falcon_mailbox_read(acr_desc->acr_flcn,
FALCON_MAILBOX_1));
completion = -EAGAIN;
error_type = ACR_BOOT_FAILED;
goto exit;
}
/*
* When engine-falcon is used for ACR bootstrap, validate the integrity
* of falcon IMEM and DMEM.
*/
if (acr_desc->acr_validate_mem_integrity != NULL) {
if (!acr_desc->acr_validate_mem_integrity(g)) {
nvgpu_err(g, "flcn-%d: memcheck failed", flcn_id);
completion = -EAGAIN;
error_type = ACR_BOOT_FAILED;
}
}
exit:
#ifdef CONFIG_NVGPU_FALCON_NON_FUSA
nvgpu_falcon_get_ctls(acr_desc->acr_flcn, &sctl, &cpuctl);
nvgpu_acr_dbg(g, "flcn-%d: sctl reg %x cpuctl reg %x",
flcn_id, sctl, cpuctl);
#endif
if (completion != 0) {
#ifdef CONFIG_NVGPU_FALCON_DEBUG
nvgpu_falcon_dump_stats(acr_desc->acr_flcn);
#endif
if (acr_desc->report_acr_engine_bus_err_status != NULL) {
acr_desc->report_acr_engine_bus_err_status(g,
bar0_status, error_type);
}
}
return completion;
}
/*
* Patch signatures into ucode image
*/
static void acr_ucode_patch_sig(struct gk20a *g,
unsigned int *p_img, unsigned int *p_prod_sig,
unsigned int *p_dbg_sig, unsigned int *p_patch_loc,
unsigned int *p_patch_ind, u32 sig_size)
{
#if defined(CONFIG_NVGPU_NEXT)
struct nvgpu_acr *acr = g->acr;
#endif
unsigned int i, j, *p_sig;
const u32 dmem_word_size = 4U;
nvgpu_acr_dbg(g, " ");
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
p_sig = p_prod_sig;
nvgpu_acr_dbg(g, "PRODUCTION MODE\n");
} else {
p_sig = p_dbg_sig;
nvgpu_info(g, "DEBUG MODE\n");
}
#if defined(CONFIG_NVGPU_NEXT)
if (acr->get_versioned_sig != NULL) {
p_sig = acr->get_versioned_sig(g, acr, p_sig, &sig_size);
}
#endif
/* Patching logic:*/
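/*
* Sketch of the copy below, as written: for each patch location in
* p_patch_loc (a byte offset into the ucode image), the selected
* signature is copied in one 32-bit DMEM word at a time (sig_size is
* first converted from bytes to words), with p_patch_ind[i] picking a
* four-word slot within the signature data. Note that the outer loop
* bound, sizeof(*p_patch_loc) / dmem_word_size, evaluates to 1 when
* unsigned int is 4 bytes wide, so a single patch location is
* processed per call.
*/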
sig_size = sig_size / dmem_word_size;
for (i = 0U; i < (sizeof(*p_patch_loc) / dmem_word_size); i++) {
for (j = 0U; j < sig_size; j++) {
p_img[nvgpu_safe_add_u32(
(p_patch_loc[i] / dmem_word_size), j)] =
p_sig[nvgpu_safe_add_u32(
(p_patch_ind[i] * dmem_word_size), j)];
}
}
}
/*
* Loads ACR bin to SYSMEM/FB and bootstraps ACR with bootloader code
* start and end are addresses of ucode blob in non-WPR region
*/
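/*
* Overall flow of this function, as implemented below: patch the WPR
* info into the HS ucode (loading the ACR firmware first if it is not
* already held), patch the production or debug signatures into the
* image, hand the ucode to the falcon via
* nvgpu_falcon_hs_ucode_load_bootstrap(), and finally wait for the
* falcon to halt using a silicon/non-silicon dependent timeout.
*/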
int nvgpu_acr_bootstrap_hs_ucode(struct gk20a *g, struct nvgpu_acr *acr,
struct hs_acr *acr_desc)
{
struct nvgpu_firmware *acr_fw = acr_desc->acr_fw;
struct bin_hdr *hs_bin_hdr = NULL;
struct acr_fw_header *fw_hdr = NULL;
u32 *ucode_header = NULL;
u32 *ucode = NULL;
u32 timeout = 0;
int err = 0;
nvgpu_acr_dbg(g, "ACR TYPE %x ", acr_desc->acr_type);
if (acr_fw != NULL) {
err = acr->patch_wpr_info_to_ucode(g, acr, acr_desc, true);
if (err != 0) {
nvgpu_err(g, "Falcon ucode patch wpr info failed");
return err;
}
} else {
/* Firmware is stored in an SoC-specific path in FMODEL;
* hence NVGPU_REQUEST_FIRMWARE_NO_WARN is used instead
* of NVGPU_REQUEST_FIRMWARE_NO_SOC
*/
#ifdef CONFIG_NVGPU_SIM
if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) {
acr_fw = nvgpu_request_firmware(g,
acr_desc->acr_fw_name,
NVGPU_REQUEST_FIRMWARE_NO_WARN);
} else
#endif
{
acr_fw = nvgpu_request_firmware(g,
acr_desc->acr_fw_name,
NVGPU_REQUEST_FIRMWARE_NO_SOC);
}
if (acr_fw == NULL) {
nvgpu_err(g, "%s ucode get fail for %s",
acr_desc->acr_fw_name, g->name);
return -ENOENT;
}
acr_desc->acr_fw = acr_fw;
err = acr->patch_wpr_info_to_ucode(g, acr, acr_desc, false);
if (err != 0) {
nvgpu_err(g, "Falcon ucode patch wpr info failed");
goto err_free_ucode;
}
}
hs_bin_hdr = (struct bin_hdr *)(void *)acr_fw->data;
fw_hdr = (struct acr_fw_header *)(void *)(acr_fw->data +
hs_bin_hdr->header_offset);
ucode_header = (u32 *)(void *)(acr_fw->data + fw_hdr->hdr_offset);
ucode = (u32 *)(void *)(acr_fw->data + hs_bin_hdr->data_offset);
/* Patch Ucode signatures */
acr_ucode_patch_sig(g, ucode,
(u32 *)(void *)(acr_fw->data + fw_hdr->sig_prod_offset),
(u32 *)(void *)(acr_fw->data + fw_hdr->sig_dbg_offset),
(u32 *)(void *)(acr_fw->data + fw_hdr->patch_loc),
(u32 *)(void *)(acr_fw->data + fw_hdr->patch_sig),
fw_hdr->sig_dbg_size);
err = nvgpu_falcon_hs_ucode_load_bootstrap(acr_desc->acr_flcn,
ucode, ucode_header);
if (err != 0) {
nvgpu_err(g, "HS ucode load & bootstrap failed");
goto err_free_ucode;
}
/* wait for complete & halt */
if (nvgpu_platform_is_silicon(g)) {
timeout = ACR_COMPLETION_TIMEOUT_SILICON_MS;
} else {
timeout = ACR_COMPLETION_TIMEOUT_NON_SILICON_MS;
}
err = nvgpu_acr_wait_for_completion(g, acr_desc, timeout);
if (err != 0) {
nvgpu_err(g, "HS ucode completion err %d", err);
goto err_free_ucode;
}
return 0;
err_free_ucode:
nvgpu_release_firmware(g, acr_fw);
acr_desc->acr_fw = NULL;
return err;
}

View File

@@ -0,0 +1,139 @@
/*
* Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_BOOTSTRAP_H
#define ACR_BOOTSTRAP_H
#include "nvgpu_acr_interface.h"
#ifdef CONFIG_NVGPU_NEXT
#include "common/acr/nvgpu_next_acr_bootstrap.h"
#endif
struct gk20a;
struct nvgpu_acr;
struct flcn_acr_region_prop_v0 {
u32 start_addr;
u32 end_addr;
u32 region_id;
u32 read_mask;
u32 write_mask;
u32 client_mask;
};
struct flcn_acr_regions_v0 {
u32 no_regions;
struct flcn_acr_region_prop_v0 region_props[NVGPU_FLCN_ACR_MAX_REGIONS];
};
struct flcn_acr_desc_v0 {
union {
u32 reserved_dmem[(LSF_BOOTSTRAP_OWNER_RESERVED_DMEM_SIZE/4)];
u32 signatures[4];
} ucode_reserved_space;
/*Always 1st*/
u32 wpr_region_id;
u32 wpr_offset;
u32 mmu_mem_range;
struct flcn_acr_regions_v0 regions;
u32 nonwpr_ucode_blob_size;
u64 nonwpr_ucode_blob_start;
};
struct bin_hdr {
/* 0x10de */
u32 bin_magic;
/* versioning of bin format */
u32 bin_ver;
/* Entire image size including this header */
u32 bin_size;
/*
	 * Header offset of executable binary metadata,
	 * starting at offset 0x100
*/
u32 header_offset;
/*
	 * Start of executable binary data,
	 * starting at offset 0x200
*/
u32 data_offset;
/* Size of executable binary */
u32 data_size;
};
struct acr_fw_header {
u32 sig_dbg_offset;
u32 sig_dbg_size;
u32 sig_prod_offset;
u32 sig_prod_size;
	/* offset of the signature patch-location table in the image */
	u32 patch_loc;
	/* offset of the signature patch-index table in the image */
	u32 patch_sig;
u32 hdr_offset; /* This header points to acr_ucode_header_t210_load */
u32 hdr_size; /* Size of above header */
};
/* ACR Falcon descriptors */
struct hs_acr {
#define ACR_DEFAULT 0U
#define ACR_AHESASC_NON_FUSA 1U
#define ACR_ASB_NON_FUSA 2U
#define ACR_AHESASC_FUSA 3U
#define ACR_ASB_FUSA 4U
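	/*
	 * AHESASC: ACR hub encryption setter and signature checker;
	 * ASB: ACR SEC2 booter. The *_FUSA types select the fusa-signed
	 * ucode binaries (see the tu104 ucode-select helpers).
	 */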
u32 acr_type;
/* ACR ucode */
const char *acr_fw_name;
const char *acr_code_name;
const char *acr_data_name;
const char *acr_manifest_name;
struct nvgpu_firmware *code_fw;
struct nvgpu_firmware *data_fw;
struct nvgpu_firmware *manifest_fw;
struct nvgpu_firmware *acr_fw;
union{
struct flcn_acr_desc_v0 *acr_dmem_desc_v0;
struct flcn_acr_desc *acr_dmem_desc;
};
#if defined(CONFIG_NVGPU_NEXT)
struct nvgpu_mem acr_falcon2_sysmem_desc;
struct flcn2_acr_desc acr_sysmem_desc;
struct nvgpu_mem ls_pmu_desc;
#endif
/* Falcon used to execute ACR ucode */
struct nvgpu_falcon *acr_flcn;
void (*report_acr_engine_bus_err_status)(struct gk20a *g,
u32 bar0_status, u32 error_type);
int (*acr_engine_bus_err_status)(struct gk20a *g, u32 *bar0_status,
u32 *error_type);
bool (*acr_validate_mem_integrity)(struct gk20a *g);
};
int nvgpu_acr_wait_for_completion(struct gk20a *g, struct hs_acr *acr_desc,
u32 timeout);
int nvgpu_acr_bootstrap_hs_ucode(struct gk20a *g, struct nvgpu_acr *acr,
struct hs_acr *acr_desc);
#endif /* ACR_BOOTSTRAP_H */

View File

@@ -0,0 +1,161 @@
/*
* Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_H
#define ACR_H
#include "acr_bootstrap.h"
#ifdef CONFIG_NVGPU_ACR_LEGACY
#include "acr_blob_construct_v0.h"
#endif
#include "acr_blob_construct.h"
struct gk20a;
struct nvgpu_acr;
struct wpr_carveout_info;
#define nvgpu_acr_dbg(g, fmt, args...) \
nvgpu_log(g, gpu_dbg_pmu, fmt, ##args)
/*
* Falcon UCODE header index.
*/
#define FLCN_NL_UCODE_HDR_OS_CODE_OFF_IND (0U)
#define FLCN_NL_UCODE_HDR_OS_CODE_SIZE_IND (1U)
#define FLCN_NL_UCODE_HDR_OS_DATA_OFF_IND (2U)
#define FLCN_NL_UCODE_HDR_OS_DATA_SIZE_IND (3U)
#define FLCN_NL_UCODE_HDR_NUM_APPS_IND (4U)
/*
 * There are a total of N apps whose code and data offsets are defined in the
 * UCODE header. These macros provide the CODE and DATA offset and size of the
 * A-th application.
*/
#define FLCN_NL_UCODE_HDR_APP_CODE_START_IND (5U)
#define FLCN_NL_UCODE_HDR_APP_CODE_OFF_IND(N, A) \
(FLCN_NL_UCODE_HDR_APP_CODE_START_IND + ((A)*2U))
#define FLCN_NL_UCODE_HDR_APP_CODE_SIZE_IND(N, A) \
(FLCN_NL_UCODE_HDR_APP_CODE_START_IND + ((A)*2U) + 1U)
#define FLCN_NL_UCODE_HDR_APP_CODE_END_IND(N) \
(FLCN_NL_UCODE_HDR_APP_CODE_START_IND + ((N)*2U) - 1U)
#define FLCN_NL_UCODE_HDR_APP_DATA_START_IND(N) \
(FLCN_NL_UCODE_HDR_APP_CODE_END_IND(N) + 1U)
#define FLCN_NL_UCODE_HDR_APP_DATA_OFF_IND(N, A) \
(FLCN_NL_UCODE_HDR_APP_DATA_START_IND(N) + ((A)*2U))
#define FLCN_NL_UCODE_HDR_APP_DATA_SIZE_IND(N, A) \
(FLCN_NL_UCODE_HDR_APP_DATA_START_IND(N) + ((A)*2U) + 1U)
#define FLCN_NL_UCODE_HDR_APP_DATA_END_IND(N) \
(FLCN_NL_UCODE_HDR_APP_DATA_START_IND(N) + ((N)*2U) - 1U)
#define FLCN_NL_UCODE_HDR_OS_OVL_OFF_IND(N) \
(FLCN_NL_UCODE_HDR_APP_DATA_END_IND(N) + 1U)
#define FLCN_NL_UCODE_HDR_OS_OVL_SIZE_IND(N) \
(FLCN_NL_UCODE_HDR_APP_DATA_END_IND(N) + 2U)
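/*
 * Worked example for a header describing a single app (N = 1, A = 0):
 * words 0..3 hold the OS code/data offsets and sizes, word 4 the app
 * count, words 5/6 the app code offset/size, words 7/8 the app data
 * offset/size, and words 9/10 the OS overlay offset/size.
 */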
#define GM20B_HSBIN_ACR_PROD_UCODE "nv_acr_ucode_prod.bin"
#define GM20B_HSBIN_ACR_DBG_UCODE "nv_acr_ucode_dbg.bin"
#define HSBIN_ACR_BL_UCODE_IMAGE "pmu_bl.bin"
#define HSBIN_ACR_PROD_UCODE "acr_ucode_prod.bin"
#define HSBIN_ACR_DBG_UCODE "acr_ucode_dbg.bin"
#define HSBIN_ACR_AHESASC_NON_FUSA_PROD_UCODE "acr_ahesasc_prod_ucode.bin"
#define HSBIN_ACR_ASB_NON_FUSA_PROD_UCODE "acr_asb_prod_ucode.bin"
#define HSBIN_ACR_AHESASC_NON_FUSA_DBG_UCODE "acr_ahesasc_dbg_ucode.bin"
#define HSBIN_ACR_ASB_NON_FUSA_DBG_UCODE "acr_asb_dbg_ucode.bin"
#define HSBIN_ACR_AHESASC_FUSA_PROD_UCODE "acr_ahesasc_fusa_prod_ucode.bin"
#define HSBIN_ACR_ASB_FUSA_PROD_UCODE "acr_asb_fusa_prod_ucode.bin"
#define HSBIN_ACR_AHESASC_FUSA_DBG_UCODE "acr_ahesasc_fusa_dbg_ucode.bin"
#define HSBIN_ACR_ASB_FUSA_DBG_UCODE "acr_asb_fusa_dbg_ucode.bin"
#define GM20B_FECS_UCODE_SIG "fecs_sig.bin"
#define T18x_GPCCS_UCODE_SIG "gpccs_sig.bin"
#define TU104_FECS_UCODE_SIG "tu104/fecs_sig.bin"
#define TU104_GPCCS_UCODE_SIG "tu104/gpccs_sig.bin"
#define LSF_SEC2_UCODE_IMAGE_BIN "sec2_ucode_image.bin"
#define LSF_SEC2_UCODE_DESC_BIN "sec2_ucode_desc.bin"
#define LSF_SEC2_UCODE_SIG_BIN "sec2_sig.bin"
#define LSF_SEC2_UCODE_IMAGE_FUSA_BIN "sec2_ucode_fusa_image.bin"
#define LSF_SEC2_UCODE_DESC_FUSA_BIN "sec2_ucode_fusa_desc.bin"
#define LSF_SEC2_UCODE_SIG_FUSA_BIN "sec2_fusa_sig.bin"
#define ACR_COMPLETION_TIMEOUT_NON_SILICON_MS 10000U /* in msec */
#define ACR_COMPLETION_TIMEOUT_SILICON_MS 100U /* in msec */
struct acr_lsf_config {
u32 falcon_id;
u32 falcon_dma_idx;
bool is_lazy_bootstrap;
bool is_priv_load;
int (*get_lsf_ucode_details)(struct gk20a *g, void *lsf_ucode_img);
void (*get_cmd_line_args_offset)(struct gk20a *g, u32 *args_offset);
};
struct nvgpu_acr {
struct gk20a *g;
u32 bootstrap_owner;
u32 num_of_sig;
/* LSF properties */
u64 lsf_enable_mask;
struct acr_lsf_config lsf[FALCON_ID_END];
/*
	 * Non-WPR space holding the LSF ucodes;
	 * the ACR HS ucode copies them from non-WPR to WPR.
*/
struct nvgpu_mem ucode_blob;
/*
	 * Even though this mem_desc isn't used directly,
	 * the WPR region needs to be reserved in the
	 * allocator in the dGPU case.
*/
struct nvgpu_mem wpr_dummy;
/* ACR member for different types of ucode */
	/* For older dGPU/Tegra ACR ucode */
struct hs_acr acr;
/* ACR load split feature support */
struct hs_acr acr_ahesasc;
struct hs_acr acr_asb;
/* ACR load split feature support for iGPU*/
struct hs_acr acr_alsb;
struct hs_acr acr_asc;
int (*prepare_ucode_blob)(struct gk20a *g);
int (*alloc_blob_space)(struct gk20a *g, size_t size,
struct nvgpu_mem *mem);
int (*patch_wpr_info_to_ucode)(struct gk20a *g, struct nvgpu_acr *acr,
struct hs_acr *acr_desc, bool is_recovery);
int (*bootstrap_hs_acr)(struct gk20a *g, struct nvgpu_acr *acr);
void (*get_wpr_info)(struct gk20a *g, struct wpr_carveout_info *inf);
u32* (*get_versioned_sig)(struct gk20a *g, struct nvgpu_acr *acr,
u32 *sig, u32 *sig_size);
};
#endif /* ACR_H */

View File

@@ -0,0 +1,172 @@
/*
* Copyright (c) 2015-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/types.h>
#include <nvgpu/firmware.h>
#include <nvgpu/falcon.h>
#include <nvgpu/bug.h>
#include <nvgpu/pmu/fw.h>
#include "acr_wpr.h"
#include "acr_priv.h"
#include "acr_sw_gm20b.h"
#include "acr_blob_alloc.h"
#include "acr_bootstrap.h"
#include "acr_blob_construct_v0.h"
static int gm20b_bootstrap_hs_acr(struct gk20a *g, struct nvgpu_acr *acr)
{
int err = 0;
nvgpu_log_fn(g, " ");
err = nvgpu_acr_bootstrap_hs_ucode(g, g->acr, &g->acr->acr);
if (err != 0) {
nvgpu_err(g, "ACR bootstrap failed");
}
return err;
}
static int gm20b_acr_patch_wpr_info_to_ucode(struct gk20a *g,
struct nvgpu_acr *acr, struct hs_acr *acr_desc, bool is_recovery)
{
struct nvgpu_firmware *acr_fw = acr_desc->acr_fw;
struct acr_fw_header *acr_fw_hdr = NULL;
struct bin_hdr *acr_fw_bin_hdr = NULL;
struct flcn_acr_desc_v0 *acr_dmem_desc;
u32 *acr_ucode_header = NULL;
u32 *acr_ucode_data = NULL;
nvgpu_log_fn(g, " ");
if (is_recovery) {
acr_desc->acr_dmem_desc_v0->nonwpr_ucode_blob_size = 0U;
} else {
acr_fw_bin_hdr = (struct bin_hdr *)acr_fw->data;
acr_fw_hdr = (struct acr_fw_header *)
(acr_fw->data + acr_fw_bin_hdr->header_offset);
acr_ucode_data = (u32 *)(acr_fw->data +
acr_fw_bin_hdr->data_offset);
acr_ucode_header = (u32 *)(acr_fw->data +
acr_fw_hdr->hdr_offset);
/* Patch WPR info to ucode */
acr_dmem_desc = (struct flcn_acr_desc_v0 *)
&(((u8 *)acr_ucode_data)[acr_ucode_header[2U]]);
acr_desc->acr_dmem_desc_v0 = acr_dmem_desc;
acr_dmem_desc->nonwpr_ucode_blob_start =
nvgpu_mem_get_addr(g, &g->acr->ucode_blob);
nvgpu_assert(g->acr->ucode_blob.size <= U32_MAX);
acr_dmem_desc->nonwpr_ucode_blob_size =
(u32)g->acr->ucode_blob.size;
acr_dmem_desc->regions.no_regions = 1U;
acr_dmem_desc->wpr_offset = 0U;
}
return 0;
}
/* LSF static config functions */
static u32 gm20b_acr_lsf_pmu(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* PMU LS falcon info */
lsf->falcon_id = FALCON_ID_PMU;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = false;
lsf->is_priv_load = false;
#ifdef CONFIG_NVGPU_LS_PMU
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_pmu_ucode_details_v0;
lsf->get_cmd_line_args_offset = nvgpu_pmu_fw_get_cmd_line_args_offset;
#endif
return BIT32(lsf->falcon_id);
}
static u32 gm20b_acr_lsf_fecs(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* FECS LS falcon info */
lsf->falcon_id = FALCON_ID_FECS;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = false;
lsf->is_priv_load = false;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_fecs_ucode_details_v0;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
static u32 gm20b_acr_lsf_config(struct gk20a *g,
struct nvgpu_acr *acr)
{
u32 lsf_enable_mask = 0;
lsf_enable_mask |= gm20b_acr_lsf_pmu(g, &acr->lsf[FALCON_ID_PMU]);
lsf_enable_mask |= gm20b_acr_lsf_fecs(g, &acr->lsf[FALCON_ID_FECS]);
return lsf_enable_mask;
}
static void gm20b_acr_default_sw_init(struct gk20a *g, struct hs_acr *hs_acr)
{
nvgpu_log_fn(g, " ");
/* ACR HS ucode type & f/w name*/
hs_acr->acr_type = ACR_DEFAULT;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
hs_acr->acr_fw_name = GM20B_HSBIN_ACR_PROD_UCODE;
} else {
hs_acr->acr_fw_name = GM20B_HSBIN_ACR_DBG_UCODE;
}
	/* set on which falcon ACR needs to execute */
hs_acr->acr_flcn = g->pmu->flcn;
hs_acr->acr_engine_bus_err_status =
g->ops.pmu.bar0_error_status;
}
void nvgpu_gm20b_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr)
{
nvgpu_log_fn(g, " ");
acr->g = g;
acr->bootstrap_owner = FALCON_ID_PMU;
acr->lsf_enable_mask = gm20b_acr_lsf_conifg(g, acr);
gm20b_acr_default_sw_init(g, &acr->acr);
acr->prepare_ucode_blob = nvgpu_acr_prepare_ucode_blob_v0;
acr->get_wpr_info = nvgpu_acr_wpr_info_sys;
acr->alloc_blob_space = nvgpu_acr_alloc_blob_space_sys;
acr->bootstrap_hs_acr = gm20b_bootstrap_hs_acr;
acr->patch_wpr_info_to_ucode =
gm20b_acr_patch_wpr_info_to_ucode;
}

View File

@@ -0,0 +1,33 @@
/*
* GM20B ACR
*
* Copyright (c) 2015-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_SW_GM20B_H
#define ACR_SW_GM20B_H
struct gk20a;
struct nvgpu_acr;
void nvgpu_gm20b_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr);
#endif /*ACR_SW_GM20B_H*/

View File

@@ -0,0 +1,80 @@
/*
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include "acr_sw_gp10b.h"
#include <nvgpu/types.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/pmu.h>
#include "acr_blob_construct_v0.h"
#include "acr_priv.h"
#include "acr_sw_gm20b.h"
#include "acr_sw_gp10b.h"
/* LSF static config functions */
static u32 gp10b_acr_lsf_gpccs(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* GPCCS LS falcon info */
lsf->falcon_id = FALCON_ID_GPCCS;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = true;
lsf->is_priv_load = true;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_gpccs_ucode_details_v0;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
static void gp10b_acr_default_sw_init(struct gk20a *g, struct hs_acr *hs_acr)
{
nvgpu_log_fn(g, " ");
/* ACR HS ucode type & f/w name*/
hs_acr->acr_type = ACR_DEFAULT;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
hs_acr->acr_fw_name = HSBIN_ACR_PROD_UCODE;
} else {
hs_acr->acr_fw_name = HSBIN_ACR_DBG_UCODE;
}
	/* set on which falcon ACR needs to execute */
hs_acr->acr_flcn = g->pmu->flcn;
hs_acr->acr_engine_bus_err_status =
g->ops.pmu.bar0_error_status;
}
void nvgpu_gp10b_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr)
{
nvgpu_log_fn(g, " ");
/* inherit the gm20b config data */
nvgpu_gm20b_acr_sw_init(g, acr);
gp10b_acr_default_sw_init(g, &acr->acr);
/* gp10b supports LSF gpccs bootstrap */
acr->lsf_enable_mask |= gp10b_acr_lsf_gpccs(g,
&acr->lsf[FALCON_ID_GPCCS]);
}

View File

@@ -0,0 +1,31 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_SW_GP10B_H
#define ACR_SW_GP10B_H
struct gk20a;
struct nvgpu_acr;
void nvgpu_gp10b_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr);
#endif /* ACR_SW_GP10B_H */

View File

@@ -0,0 +1,211 @@
/*
* Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/types.h>
#include <nvgpu/firmware.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/bug.h>
#ifdef CONFIG_NVGPU_LS_PMU
#include <nvgpu/pmu/fw.h>
#endif
#include "acr_wpr.h"
#include "acr_priv.h"
#include "acr_blob_alloc.h"
#include "acr_blob_construct.h"
#include "acr_bootstrap.h"
#include "acr_sw_gv11b.h"
#define RECOVERY_UCODE_BLOB_SIZE (0U)
#define WPR_OFFSET (0U)
#define ACR_REGIONS (1U)
static int gv11b_bootstrap_hs_acr(struct gk20a *g, struct nvgpu_acr *acr)
{
int err = 0;
nvgpu_log_fn(g, " ");
err = nvgpu_acr_bootstrap_hs_ucode(g, g->acr, &g->acr->acr);
if (err != 0) {
nvgpu_err(g, "ACR bootstrap failed");
}
return err;
}
static int gv11b_acr_patch_wpr_info_to_ucode(struct gk20a *g,
struct nvgpu_acr *acr, struct hs_acr *acr_desc, bool is_recovery)
{
struct nvgpu_firmware *acr_fw = acr_desc->acr_fw;
struct acr_fw_header *acr_fw_hdr = NULL;
struct bin_hdr *acr_fw_bin_hdr = NULL;
struct flcn_acr_desc *acr_dmem_desc;
u32 *acr_ucode_header = NULL;
u32 *acr_ucode_data = NULL;
const u32 acr_desc_offset = 2U;
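	/*
	 * Header word 2 is the OS data offset
	 * (FLCN_NL_UCODE_HDR_OS_DATA_OFF_IND); the flcn_acr_desc to be
	 * patched with WPR info sits at that offset within the ucode data.
	 */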
nvgpu_log_fn(g, " ");
#ifdef CONFIG_NVGPU_NON_FUSA
if (is_recovery) {
acr_desc->acr_dmem_desc->nonwpr_ucode_blob_size =
RECOVERY_UCODE_BLOB_SIZE;
} else
#endif
{
acr_fw_bin_hdr = (struct bin_hdr *)(void *)acr_fw->data;
acr_fw_hdr = (struct acr_fw_header *)(void *)
(acr_fw->data + acr_fw_bin_hdr->header_offset);
acr_ucode_data = (u32 *)(void *)(acr_fw->data +
acr_fw_bin_hdr->data_offset);
acr_ucode_header = (u32 *)(void *)(acr_fw->data +
acr_fw_hdr->hdr_offset);
/* Patch WPR info to ucode */
acr_dmem_desc = (struct flcn_acr_desc *)(void *)
&(((u8 *)acr_ucode_data)[acr_ucode_header[acr_desc_offset]]);
acr_desc->acr_dmem_desc = acr_dmem_desc;
acr_dmem_desc->nonwpr_ucode_blob_start =
nvgpu_mem_get_addr(g, &g->acr->ucode_blob);
nvgpu_assert(g->acr->ucode_blob.size <= U32_MAX);
acr_dmem_desc->nonwpr_ucode_blob_size =
(u32)g->acr->ucode_blob.size;
acr_dmem_desc->regions.no_regions = ACR_REGIONS;
acr_dmem_desc->wpr_offset = WPR_OFFSET;
}
return 0;
}
/* LSF static config functions */
#ifdef CONFIG_NVGPU_LS_PMU
static u32 gv11b_acr_lsf_pmu(struct gk20a *g,
struct acr_lsf_config *lsf)
{
if (!g->support_ls_pmu) {
/* skip adding LS PMU ucode to ACR blob */
return 0;
}
/* PMU LS falcon info */
lsf->falcon_id = FALCON_ID_PMU;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = false;
lsf->is_priv_load = false;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_pmu_ucode_details;
lsf->get_cmd_line_args_offset = nvgpu_pmu_fw_get_cmd_line_args_offset;
return BIT32(lsf->falcon_id);
}
#endif
/* LSF init */
static u32 gv11b_acr_lsf_fecs(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* FECS LS falcon info */
lsf->falcon_id = FALCON_ID_FECS;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
/*
* FECS LSF cold/recovery bootstrap is handled by ACR when LS PMU
	 * is not present.
*/
lsf->is_lazy_bootstrap = g->support_ls_pmu ? true : false;
lsf->is_priv_load = false;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_fecs_ucode_details;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
static u32 gv11b_acr_lsf_gpccs(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* GPCCS LS falcon info */
lsf->falcon_id = FALCON_ID_GPCCS;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
/*
* GPCCS LSF cold/recovery bootstrap is handled by ACR when LS PMU
	 * is not present.
*/
lsf->is_lazy_bootstrap = g->support_ls_pmu ? true : false;
lsf->is_priv_load = true;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_gpccs_ucode_details;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
u32 gv11b_acr_lsf_config(struct gk20a *g,
struct nvgpu_acr *acr)
{
u32 lsf_enable_mask = 0;
#ifdef CONFIG_NVGPU_LS_PMU
lsf_enable_mask |= gv11b_acr_lsf_pmu(g, &acr->lsf[FALCON_ID_PMU]);
#endif
lsf_enable_mask |= gv11b_acr_lsf_fecs(g, &acr->lsf[FALCON_ID_FECS]);
lsf_enable_mask |= gv11b_acr_lsf_gpccs(g, &acr->lsf[FALCON_ID_GPCCS]);
return lsf_enable_mask;
}
static void gv11b_acr_default_sw_init(struct gk20a *g, struct hs_acr *acr_desc)
{
nvgpu_log_fn(g, " ");
acr_desc->acr_type = ACR_DEFAULT;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
acr_desc->acr_fw_name = HSBIN_ACR_PROD_UCODE;
} else {
acr_desc->acr_fw_name = HSBIN_ACR_DBG_UCODE;
}
acr_desc->acr_flcn = g->pmu->flcn;
acr_desc->report_acr_engine_bus_err_status =
nvgpu_pmu_report_bar0_pri_err_status;
acr_desc->acr_engine_bus_err_status =
g->ops.pmu.bar0_error_status;
acr_desc->acr_validate_mem_integrity = g->ops.pmu.validate_mem_integrity;
}
void nvgpu_gv11b_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr)
{
nvgpu_log_fn(g, " ");
acr->g = g;
acr->bootstrap_owner = FALCON_ID_PMU;
acr->lsf_enable_mask = gv11b_acr_lsf_config(g, acr);
gv11b_acr_default_sw_init(g, &acr->acr);
acr->prepare_ucode_blob = nvgpu_acr_prepare_ucode_blob;
acr->get_wpr_info = nvgpu_acr_wpr_info_sys;
acr->alloc_blob_space = nvgpu_acr_alloc_blob_space_sys;
acr->bootstrap_hs_acr = gv11b_bootstrap_hs_acr;
acr->patch_wpr_info_to_ucode = gv11b_acr_patch_wpr_info_to_ucode;
}

View File

@@ -0,0 +1,34 @@
/*
* Copyright (c) 2017-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_SW_GV11B_H
#define ACR_SW_GV11B_H
struct gk20a;
struct nvgpu_acr;
struct hs_acr;
void nvgpu_gv11b_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr);
u32 gv11b_acr_lsf_config(struct gk20a *g, struct nvgpu_acr *acr);
#endif /* ACR_SW_GV11B_H */

View File

@@ -0,0 +1,285 @@
/*
* Copyright (c) 2016-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include "acr_sw_tu104.h"
#include <nvgpu/gk20a.h>
#include <nvgpu/firmware.h>
#include "acr_wpr.h"
#include "acr_priv.h"
#include "acr_blob_alloc.h"
#include "acr_bootstrap.h"
#include "acr_blob_construct.h"
#include "acr_sw_gv11b.h"
#include "acr_sw_tu104.h"
static int tu104_bootstrap_hs_acr(struct gk20a *g, struct nvgpu_acr *acr)
{
int err = 0;
nvgpu_log_fn(g, " ");
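	/*
	 * Split-ACR boot: the AHESASC stage runs on the SEC2 falcon and the
	 * ASB stage on the GSP falcon (see tu104_acr_ahesasc_sw_init() and
	 * tu104_acr_asb_sw_init() below).
	 */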
err = nvgpu_acr_bootstrap_hs_ucode(g, g->acr, &g->acr->acr_ahesasc);
if (err != 0) {
nvgpu_err(g, "ACR AHESASC bootstrap failed");
goto exit;
}
err = nvgpu_acr_bootstrap_hs_ucode(g, g->acr, &g->acr->acr_asb);
if (err != 0) {
nvgpu_err(g, "ACR ASB bootstrap failed");
goto exit;
}
exit:
return err;
}
/* WPR info update */
static int tu104_acr_patch_wpr_info_to_ucode(struct gk20a *g,
struct nvgpu_acr *acr, struct hs_acr *acr_desc,
bool is_recovery)
{
struct nvgpu_firmware *acr_fw = acr_desc->acr_fw;
struct acr_fw_header *acr_fw_hdr = NULL;
struct bin_hdr *acr_fw_bin_hdr = NULL;
struct flcn_acr_desc *acr_dmem_desc;
struct wpr_carveout_info wpr_inf;
u32 *acr_ucode_header = NULL;
u32 *acr_ucode_data = NULL;
u64 tmp_addr;
nvgpu_log_fn(g, " ");
acr_fw_bin_hdr = (struct bin_hdr *)acr_fw->data;
acr_fw_hdr = (struct acr_fw_header *)
(acr_fw->data + acr_fw_bin_hdr->header_offset);
acr_ucode_data = (u32 *)(acr_fw->data + acr_fw_bin_hdr->data_offset);
acr_ucode_header = (u32 *)(acr_fw->data + acr_fw_hdr->hdr_offset);
acr->get_wpr_info(g, &wpr_inf);
acr_dmem_desc = (struct flcn_acr_desc *)
&(((u8 *)acr_ucode_data)[acr_ucode_header[2U]]);
acr_dmem_desc->nonwpr_ucode_blob_start = wpr_inf.nonwpr_base;
nvgpu_assert(wpr_inf.size <= U32_MAX);
acr_dmem_desc->nonwpr_ucode_blob_size = (u32)wpr_inf.size;
acr_dmem_desc->regions.no_regions = 1U;
acr_dmem_desc->wpr_offset = 0U;
acr_dmem_desc->wpr_region_id = 1U;
acr_dmem_desc->regions.region_props[0U].region_id = 1U;
tmp_addr = (wpr_inf.wpr_base) >> 8U;
nvgpu_assert(u64_hi32(tmp_addr) == 0U);
acr_dmem_desc->regions.region_props[0U].start_addr = U32(tmp_addr);
tmp_addr = ((wpr_inf.wpr_base) + wpr_inf.size) >> 8U;
nvgpu_assert(u64_hi32(tmp_addr) == 0U);
acr_dmem_desc->regions.region_props[0U].end_addr = U32(tmp_addr);
tmp_addr = wpr_inf.nonwpr_base >> 8U;
nvgpu_assert(u64_hi32(tmp_addr) == 0U);
acr_dmem_desc->regions.region_props[0U].shadowmMem_startaddress =
U32(tmp_addr);
return 0;
}
/* LSF init */
static u32 tu104_acr_lsf_sec2(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* SEC2 LS falcon info */
lsf->falcon_id = FALCON_ID_SEC2;
lsf->falcon_dma_idx = NV_SEC2_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = false;
lsf->is_priv_load = false;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_sec2_ucode_details;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
static u32 tu104_acr_lsf_pmu(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* PMU support not required until PSTATE support is enabled */
if (!g->support_ls_pmu) {
/* skip adding LS PMU ucode to ACR blob */
return 0;
}
/* PMU LS falcon info */
lsf->falcon_id = FALCON_ID_PMU;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = false;
lsf->is_priv_load = false;
#ifdef CONFIG_NVGPU_LS_PMU
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_pmu_ucode_details;
lsf->get_cmd_line_args_offset = nvgpu_pmu_fw_get_cmd_line_args_offset;
#endif
return BIT32(lsf->falcon_id);
}
static u32 tu104_acr_lsf_fecs(struct gk20a *g,
struct acr_lsf_config *lsf)
{
/* FECS LS falcon info */
lsf->falcon_id = FALCON_ID_FECS;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = true;
lsf->is_priv_load = true;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_fecs_ucode_details;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
static u32 tu104_acr_lsf_gpccs(struct gk20a *g,
struct acr_lsf_config *lsf)
{
	/* GPCCS LS falcon info */
lsf->falcon_id = FALCON_ID_GPCCS;
lsf->falcon_dma_idx = GK20A_PMU_DMAIDX_UCODE;
lsf->is_lazy_bootstrap = true;
lsf->is_priv_load = true;
lsf->get_lsf_ucode_details = nvgpu_acr_lsf_gpccs_ucode_details;
lsf->get_cmd_line_args_offset = NULL;
return BIT32(lsf->falcon_id);
}
static u32 tu104_acr_lsf_config(struct gk20a *g,
struct nvgpu_acr *acr)
{
u32 lsf_enable_mask = 0;
lsf_enable_mask |= tu104_acr_lsf_pmu(g, &acr->lsf[FALCON_ID_PMU]);
lsf_enable_mask |= tu104_acr_lsf_fecs(g, &acr->lsf[FALCON_ID_FECS]);
lsf_enable_mask |= tu104_acr_lsf_gpccs(g, &acr->lsf[FALCON_ID_GPCCS]);
lsf_enable_mask |= tu104_acr_lsf_sec2(g, &acr->lsf[FALCON_ID_SEC2]);
return lsf_enable_mask;
}
/* fusa signing enable check */
static bool tu104_acr_is_fusa_enabled(struct gk20a *g)
{
return g->is_fusa_sku;
}
/* ACR-AHESASC(ACR hub encryption setter and signature checker) init*/
static void tu104_acr_ahesasc_v0_ucode_select(struct gk20a *g,
struct hs_acr *acr_ahesasc)
{
acr_ahesasc->acr_type = ACR_AHESASC_NON_FUSA;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
acr_ahesasc->acr_fw_name = HSBIN_ACR_AHESASC_NON_FUSA_PROD_UCODE;
} else {
acr_ahesasc->acr_fw_name = HSBIN_ACR_AHESASC_NON_FUSA_DBG_UCODE;
}
}
static void tu104_acr_ahesasc_fusa_ucode_select(struct gk20a *g,
struct hs_acr *acr_ahesasc)
{
acr_ahesasc->acr_type = ACR_AHESASC_FUSA;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
acr_ahesasc->acr_fw_name = HSBIN_ACR_AHESASC_FUSA_PROD_UCODE;
} else {
acr_ahesasc->acr_fw_name = HSBIN_ACR_AHESASC_FUSA_DBG_UCODE;
}
}
static void tu104_acr_ahesasc_sw_init(struct gk20a *g,
struct hs_acr *acr_ahesasc)
{
if (tu104_acr_is_fusa_enabled(g)) {
tu104_acr_ahesasc_fusa_ucode_select(g, acr_ahesasc);
} else {
tu104_acr_ahesasc_v0_ucode_select(g, acr_ahesasc);
}
acr_ahesasc->acr_flcn = &g->sec2.flcn;
}
/* ACR-ASB(ACR SEC2 booter) init*/
static void tu104_acr_asb_v0_ucode_select(struct gk20a *g,
struct hs_acr *acr_asb)
{
acr_asb->acr_type = ACR_ASB_NON_FUSA;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
acr_asb->acr_fw_name = HSBIN_ACR_ASB_NON_FUSA_PROD_UCODE;
} else {
acr_asb->acr_fw_name = HSBIN_ACR_ASB_NON_FUSA_DBG_UCODE;
}
}
static void tu104_acr_asb_fusa_ucode_select(struct gk20a *g,
struct hs_acr *acr_asb)
{
acr_asb->acr_type = ACR_ASB_FUSA;
if (!g->ops.pmu.is_debug_mode_enabled(g)) {
acr_asb->acr_fw_name = HSBIN_ACR_ASB_FUSA_PROD_UCODE;
} else {
acr_asb->acr_fw_name = HSBIN_ACR_ASB_FUSA_DBG_UCODE;
}
}
static void tu104_acr_asb_sw_init(struct gk20a *g,
struct hs_acr *acr_asb)
{
if (tu104_acr_is_fusa_enabled(g)) {
tu104_acr_asb_fusa_ucode_select(g, acr_asb);
} else {
tu104_acr_asb_v0_ucode_select(g, acr_asb);
}
acr_asb->acr_flcn = &g->gsp_flcn;
}
void nvgpu_tu104_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr)
{
nvgpu_log_fn(g, " ");
acr->lsf_enable_mask = tu104_acr_lsf_conifg(g, acr);
acr->prepare_ucode_blob = nvgpu_acr_prepare_ucode_blob;
acr->get_wpr_info = nvgpu_acr_wpr_info_vid;
acr->alloc_blob_space = nvgpu_acr_alloc_blob_space_vid;
acr->bootstrap_owner = FALCON_ID_GSPLITE;
acr->bootstrap_hs_acr = tu104_bootstrap_hs_acr;
acr->patch_wpr_info_to_ucode = tu104_acr_patch_wpr_info_to_ucode;
/* Init ACR-AHESASC */
tu104_acr_ahesasc_sw_init(g, &acr->acr_ahesasc);
/* Init ACR-ASB*/
tu104_acr_asb_sw_init(g, &acr->acr_asb);
}

View File

@@ -0,0 +1,31 @@
/*
* Copyright (c) 2018-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_SW_TU104_H
#define ACR_SW_TU104_H
struct gk20a;
struct nvgpu_acr;
void nvgpu_tu104_acr_sw_init(struct gk20a *g, struct nvgpu_acr *acr);
#endif /*ACR_SW_TU104_H*/

View File

@@ -0,0 +1,43 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/types.h>
#include <nvgpu/dma.h>
#include "acr_wpr.h"
/* Both size and address of WPR need to be 128K-aligned */
#define DGPU_WPR_SIZE 0x200000U
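/*
 * On dGPU the WPR carveout sits at the vidmem bootstrap base and the non-WPR
 * blob region follows immediately after it (see nvgpu_acr_wpr_info_vid()
 * below); on iGPU the WPR range is read back from the FB unit instead.
 */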
void nvgpu_acr_wpr_info_sys(struct gk20a *g, struct wpr_carveout_info *inf)
{
g->ops.fb.read_wpr_info(g, &inf->wpr_base, &inf->size);
}
#ifdef CONFIG_NVGPU_DGPU
void nvgpu_acr_wpr_info_vid(struct gk20a *g, struct wpr_carveout_info *inf)
{
inf->wpr_base = g->mm.vidmem.bootstrap_base;
inf->nonwpr_base = inf->wpr_base + DGPU_WPR_SIZE;
inf->size = DGPU_WPR_SIZE;
}
#endif

View File

@@ -0,0 +1,40 @@
/*
* Copyright (c) 2018-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef ACR_WPR_H
#define ACR_WPR_H
struct gk20a;
struct wpr_carveout_info;
struct wpr_carveout_info {
u64 wpr_base;
u64 nonwpr_base;
u64 size;
};
void nvgpu_acr_wpr_info_sys(struct gk20a *g, struct wpr_carveout_info *inf);
#ifdef CONFIG_NVGPU_DGPU
void nvgpu_acr_wpr_info_vid(struct gk20a *g, struct wpr_carveout_info *inf);
#endif
#endif /* ACR_WPR_H */

View File

@@ -0,0 +1,609 @@
/*
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_ACR_INTERFACE_H
#define NVGPU_ACR_INTERFACE_H
/**
* @defgroup NVGPURM_BLOB_CONSTRUCT blob construct
*
* Blob construct interfaces:
 * NVGPU creates the LS ucode blob in system/FB non-WPR memory. LS ucodes
 * are read from the filesystem and added to the blob for the detected chip.
 * Below are the structs that need to be filled in by NVGPU for each LS Falcon
 * ucode supported on the detected chip. After filling the structures, NVGPU
 * copies them, along with the ucode, into the non-WPR blob in the pattern
 * shown below. The LS ucode blob is required by the ACR HS ucode to
 * authenticate & load each LS ucode onto the respective engine's LS Falcon.
*
* + WPR header struct #lsf_wpr_header.
* + LSB header struct #lsf_lsb_header.
* + Boot loader struct #flcn_bl_dmem_desc.
* + ucode image.
*
* + BLOB Pattern:
* ---------------------------------------------
* | LSF WPR HDR | LSF LSB HDR | BL desc | ucode |
* ---------------------------------------------
*/
/**
* @ingroup NVGPURM_BLOB_CONSTRUCT
*/
/** @{*/
/**
* Light Secure WPR Content Alignments
*/
/** WPR header should be aligned to 256 bytes */
#define LSF_WPR_HEADER_ALIGNMENT (256U)
/** SUB WPR header should be aligned to 256 bytes */
#define LSF_SUB_WPR_HEADER_ALIGNMENT (256U)
/** LSB header should be aligned to 256 bytes */
#define LSF_LSB_HEADER_ALIGNMENT (256U)
/** BL DATA should be aligned to 256 bytes */
#define LSF_BL_DATA_ALIGNMENT (256U)
/** BL DATA size should be aligned to 256 bytes */
#define LSF_BL_DATA_SIZE_ALIGNMENT (256U)
/** BL CODE size should be aligned to 256 bytes */
#define LSF_BL_CODE_SIZE_ALIGNMENT (256U)
/** LSF DATA size should be aligned to 256 bytes */
#define LSF_DATA_SIZE_ALIGNMENT (256U)
/** LSF CODE size should be aligned to 256 bytes */
#define LSF_CODE_SIZE_ALIGNMENT (256U)
/** UCODE surface should be aligned to 4k PAGE_SIZE */
#define LSF_UCODE_DATA_ALIGNMENT 4096U
/**
* Maximum WPR Header size
*/
#define LSF_WPR_HEADERS_TOTAL_SIZE_MAX \
(ALIGN_UP(((u32)sizeof(struct lsf_wpr_header) * FALCON_ID_END), \
LSF_WPR_HEADER_ALIGNMENT))
#define LSF_LSB_HEADER_TOTAL_SIZE_MAX (\
ALIGN_UP(sizeof(struct lsf_lsb_header), LSF_LSB_HEADER_ALIGNMENT))
/** @} */
#ifdef CONFIG_NVGPU_DGPU
/* Maximum SUB WPR header size */
#define LSF_SUB_WPR_HEADERS_TOTAL_SIZE_MAX (ALIGN_UP( \
(sizeof(struct lsf_shared_sub_wpr_header) * \
LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_MAX), \
LSF_SUB_WPR_HEADER_ALIGNMENT))
/* MMU expects sub_wpr sizes in units of 4K */
#define SUB_WPR_SIZE_ALIGNMENT (4096U)
/* Shift for 4K units */
#define SHIFT_4KB (12U)
/* shared sub_wpr use case IDs */
enum {
LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_FRTS_VBIOS_TABLES = 1,
LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_PLAYREADY_SHARED_DATA = 2
};
#define LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_MAX \
LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_PLAYREADY_SHARED_DATA
#define LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_INVALID (0xFFFFFFFFU)
#define MAX_SUPPORTED_SHARED_SUB_WPR_USE_CASES \
LSF_SHARED_DATA_SUB_WPR_USE_CASE_ID_MAX
/* Static sizes of shared subWPRs */
/* Minimum granularity supported is 4K */
/* 1MB in 4K */
#define LSF_SHARED_DATA_SUB_WPR_FRTS_VBIOS_TABLES_SIZE_IN_4K (0x100U)
/* 4K */
#define LSF_SHARED_DATA_SUB_WPR_PLAYREADY_SHARED_DATA_SIZE_IN_4K (0x1U)
#endif
/**
* @ingroup NVGPURM_BLOB_CONSTRUCT
*/
/** @{*/
/**
* Image status updated by ACR HS ucode to know the LS
* Falcon ucode status.
*/
/** IMAGE copied from NON-WPR to WPR BLOB*/
#define LSF_IMAGE_STATUS_COPY (1U)
/** LS Falcon ucode verification failed*/
#define LSF_IMAGE_STATUS_VALIDATION_CODE_FAILED (2U)
/** LS Falcon data verification failed*/
#define LSF_IMAGE_STATUS_VALIDATION_DATA_FAILED (3U)
/** Both ucode and data validation passed */
#define LSF_IMAGE_STATUS_VALIDATION_DONE (4U)
/**
 * LS Falcons such as FECS and GPCCS do not have signatures for binaries in
 * a debug environment (fmodel).
*/
#define LSF_IMAGE_STATUS_VALIDATION_SKIPPED (5U)
/** LS Falcon validation passed & ready for bootstrap */
#define LSF_IMAGE_STATUS_BOOTSTRAP_READY (6U)
/**
* Light Secure WPR Header
* Defines state allowing Light Secure Falcon bootstrapping.
*/
struct lsf_wpr_header {
/**
* LS Falcon ID
* FALCON_ID_FECS - 2
* FALCON_ID_GPCCS - 3
*/
u32 falcon_id;
/**
* LS Falcon LSB header offset from non-WPR base, below equation used
* to get LSB header offset for each managed LS falcon.
* Offset = Non-WPR base + #LSF_LSB_HEADER_ALIGNMENT +
* ((#LSF_UCODE_DATA_ALIGNMENT + #LSF_BL_DATA_ALIGNMENT) *
* LS Falcon index)
*
*/
u32 lsb_offset;
/**
* LS Falcon bootstrap owner, which performs bootstrapping of
* supported LS Falcon from ACR HS ucode. Below are the bootstrapping
* supporting Falcon owners.
* + Falcon #FALCON_ID_PMU
*
* On GV11B, bootstrap_owner set to #FALCON_ID_PMU as ACR HS ucode
* runs on PMU Engine Falcon.
*
*/
u32 bootstrap_owner;
/**
* Skip bootstrapping by ACR HS ucode,
* 1 - skip LS Falcon bootstrapping by ACR HS ucode.
* 0 - LS Falcon bootstrapping is done by ACR HS ucode.
*
* On GV11B, always set 0.
*/
u32 lazy_bootstrap;
/** LS ucode bin version*/
u32 bin_version;
/**
* Bootstrapping status updated by ACR HS ucode to know the LS
* Falcon ucode status.
*/
u32 status;
};
/** @} */
/**
* @ingroup NVGPURM_BLOB_CONSTRUCT
*/
/** @{*/
/**
* Size in entries of the ucode descriptor's dependency map.
*/
#define LSF_FALCON_DEPMAP_SIZE (11U)
/**
* Code/data signature details of LS falcon
*/
struct lsf_ucode_desc {
/** ucode's production signature */
u8 prd_keys[2][16];
/** ucode's debug signature */
u8 dbg_keys[2][16];
/**
* production signature present status,
* 1 - production signature present
* 0 - production signature not present
*/
u32 b_prd_present;
/**
* debug signature present
* 1 - debug signature present
* 0 - debug signature not present
*/
u32 b_dbg_present;
/**
* LS Falcon ID
* FALCON_ID_FECS - 2
* FALCON_ID_GPCCS - 3
*/
u32 falcon_id;
/**
* include version in signature calculation if supported
* 1 - supported
* 0 - not supported
*/
u32 bsupports_versioning;
/** version to include it in signature calculation if supported */
u32 version;
/** valid dependency map data to consider from dep_map array member */
u32 dep_map_count;
/**
* packed dependency map used to compute the DM hashes on the code and
* data.
*/
u8 dep_map[LSF_FALCON_DEPMAP_SIZE * 2 * 4];
/** Message used to derive key */
u8 kdf[16];
};
/** @} */
/**
* @ingroup NVGPURM_BLOB_CONSTRUCT
*/
/** @{*/
/**
* Light Secure Bootstrap Header
* Defines state allowing Light Secure Falcon bootstrapping.
*/
/** Load BL at 0th IMEM offset */
#define NV_FLCN_ACR_LSF_FLAG_LOAD_CODE_AT_0_FALSE 0U
#define NV_FLCN_ACR_LSF_FLAG_LOAD_CODE_AT_0_TRUE BIT32(0)
/** This falcon requires a ctx before issuing DMAs. */
#define NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_FALSE 0U
#define NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX_TRUE BIT32(2)
/** Use priv loading method instead of bootloader/DMAs */
#define NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD_TRUE BIT32(3)
#define NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD_FALSE (0U)
struct lsf_lsb_header {
/** Code/data signature details of each LS falcon */
struct lsf_ucode_desc signature;
/**
* Offset from non-WPR base where UCODE is located,
* Offset = Non-WPR base + #LSF_LSB_HEADER_ALIGNMENT +
* #LSF_UCODE_DATA_ALIGNMENT + ( #LSF_BL_DATA_ALIGNMENT *
* LS Falcon index)
*/
u32 ucode_off;
/**
* Size of LS Falcon ucode, required to perform signature verification
* of LS Falcon ucode by ACR HS.
*/
u32 ucode_size;
/**
* Size of LS Falcon ucode data, required to perform signature
* verification of LS Falcon ucode data by ACR HS.
*/
u32 data_size;
/**
* Size of bootloader that needs to be loaded by bootstrap owner.
*
* On GV11B, respective LS Falcon BL code size should not exceed
* below mentioned size.
* FALCON_ID_FECS IMEM size - 32k
* FALCON_ID_GPCCS IMEM size - 16k
*/
u32 bl_code_size;
	/** BL starting virtual address. Needed for tagging. */
u32 bl_imem_off;
/**
* Offset from non-WPR base holding the BL data
* Offset = (Non-WPR base + #LSF_LSB_HEADER_ALIGNMENT +
* #LSF_UCODE_DATA_ALIGNMENT + #LSF_BL_DATA_ALIGNMENT) *
* #LS Falcon index
*/
u32 bl_data_off;
/**
* Size of BL data, BL data will be copied to LS Falcon DMEM of
* bl data size
*
* On GV11B, respective LS Falcon BL data size should not exceed
* below mentioned size.
* FALCON_ID_FECS DMEM size - 8k
* FALCON_ID_GPCCS DMEM size - 5k
*/
u32 bl_data_size;
/**
* Offset from non-WPR base address where UCODE Application code is
* located.
*/
u32 app_code_off;
/**
* Size of UCODE Application code.
*
* On GV11B, FECS/GPCCS LS Falcon app code size should not exceed
* below mentioned size.
* FALCON_ID_FECS IMEM size - 32k
* FALCON_ID_GPCCS IMEM size - 16k
*/
u32 app_code_size;
/**
* Offset from non-WPR base address where UCODE Application data
* is located
*/
u32 app_data_off;
/**
* Size of UCODE Application data.
*
* On GV11B, respective LS Falcon app data size should not exceed
* below mentioned size.
* FALCON_ID_FECS DMEM size - 8k
* FALCON_ID_GPCCS DMEM size - 5k
*/
u32 app_data_size;
/**
* NV_FLCN_ACR_LSF_FLAG_LOAD_CODE_AT_0 - Load BL at 0th IMEM offset
* NV_FLCN_ACR_LSF_FLAG_DMACTL_REQ_CTX - This falcon requires a ctx
* before issuing DMAs.
* NV_FLCN_ACR_LSF_FLAG_FORCE_PRIV_LOAD - Use priv loading method
* instead of bootloader/DMAs
*/
u32 flags;
};
#define FLCN_SIG_SIZE (4U)
/** @} */
/**
* @ingroup NVGPURM_BLOB_CONSTRUCT
*/
/** @{*/
/**
* Structure used by the boot-loader to load the rest of the LS Falcon code.
*
* This has to be filled by the GPU driver and copied into WPR region offset
* holding the BL data.
*/
struct flcn_bl_dmem_desc {
/** Should be always first element */
u32 reserved[FLCN_SIG_SIZE];
/**
* Signature should follow reserved 16B signature for secure code.
* 0s if no secure code
*/
u32 signature[FLCN_SIG_SIZE];
/**
* Type of memory-aperture DMA index used by the bootloader
* while loading code/data.
*/
u32 ctx_dma;
/**
* 256B aligned physical sysmem(iGPU)/FB(dGPU) address where code
* is located.
*/
struct falc_u64 code_dma_base;
/**
* Offset from code_dma_base where the nonSecure code is located.
* The offset must be multiple of 256 to help performance.
*/
u32 non_sec_code_off;
/**
* The size of the non-secure code part.
*
* On GV11B, FECS/GPCCS LS Falcon non-secure + secure code size
* should not exceed below mentioned size.
* FALCON_ID_FECS IMEM size - 32k
* FALCON_ID_GPCCS IMEM size - 16k
*/
u32 non_sec_code_size;
/**
* Offset from code_dma_base where the secure code is located.
* The offset must be multiple of 256 to help performance.
*/
u32 sec_code_off;
/**
* The size of the secure code part.
*
* On GV11B, FECS/GPCCS LS Falcon non-secure + secure code size
* should not exceed below mentioned size.
* FALCON_ID_FECS IMEM size - 32k
* FALCON_ID_GPCCS IMEM size - 16k
*/
u32 sec_code_size;
/**
* Code entry point which will be invoked by BL after code is
* loaded.
*/
u32 code_entry_point;
/**
* 256B aligned Physical sysmem(iGPU)/FB(dGPU) Address where data
* is located.
*/
struct falc_u64 data_dma_base;
/**
* Size of data block. Should be multiple of 256B.
*
* On GV11B, respective LS Falcon data size should not exceed
* below mentioned size.
* FALCON_ID_FECS DMEM size - 8k
* FALCON_ID_GPCCS DMEM size - 5k
*/
u32 data_size;
	/**
	 * Number of arguments to be passed to the target firmware
	 * being loaded.
	 */
	u32 argc;
	/** Arguments to be passed to the target firmware being loaded. */
	u32 argv;
};
/** @} */
/**
* @defgroup NVGPURM_ACR_HS_LOAD_BOOTSTRAP ACR HS ucode load & bootstrap
*
* ACR HS ucode load & bootstrap interfaces:
 * The ACR HS ucode is read from the filesystem by the ACR unit based on the
 * chip-id. The ucode is then updated with the structs below by patching at
 * the offset given by the hdr_offset member of struct #acr_fw_header. The
 * patched ACR HS ucode is loaded onto the PMU/SEC2/GSP engine's Falcon to be
 * bootstrapped. The ACR HS ucode self-authenticates using the H/W based
 * HS authentication methodology and, once authenticated, starts executing
 * on the Falcon.
*/
/**
* @ingroup NVGPURM_ACR_HS_LOAD_BOOTSTRAP
*/
/** @{*/
/**
* Supporting maximum of 2 regions.
* This is needed to pre-allocate space in DMEM
*/
#define NVGPU_FLCN_ACR_MAX_REGIONS (2U)
/** Reserve 512 bytes for bootstrap owner LS ucode data */
#define LSF_BOOTSTRAP_OWNER_RESERVED_DMEM_SIZE (0x200U)
/**
* The descriptor used by ACR HS ucode to figure out properties of individual
* WPR regions.
*
* On GV11B, this struct members are set to 0x0 by default, reason
* to fetch WPR1 details from H/W.
*/
struct flcn_acr_region_prop {
/** Starting address of WPR region */
u32 start_addr;
/** Ending address of WPR region */
u32 end_addr;
/** The ID of the WPR region. 0 for WPR1 and 1 for WPR2 */
u32 region_id;
/** Read mask associated with this region */
u32 read_mask;
/** Write mask associated with this region */
u32 write_mask;
/** Bit map of all clients currently using this region */
u32 client_mask;
/**
* sysmem(iGPU)/FB(dGPU) location from where contents need to
* be copied to startAddress
*/
u32 shadowmMem_startaddress;
};
/**
* The descriptor used by ACR HS ucode to figure out supporting regions &
* its properties.
*/
struct flcn_acr_regions {
/**
* Number of regions used by NVGPU from the total number of ACR
* regions supported in chip.
*
* On GV11B, 1 ACR region supported and should always be greater
* than 0.
*/
u32 no_regions;
/** Region properties */
struct flcn_acr_region_prop region_props[NVGPU_FLCN_ACR_MAX_REGIONS];
};
#define DMEM_WORD_SIZE 4U
#define DUMMY_SPACE_SIZE 4U
/**
* The descriptor used by ACR HS ucode to figure out the
* WPR & non-WPR blob details.
*/
struct flcn_acr_desc {
/*
* The bootstrap owner needs to switch into LS mode when bootstrapping
* other LS Falcons is completed. It needs to have its own actual
* DMEM image copied into DMEM as part of LS setup. If ACR desc is
* at location 0, it will definitely get overwritten causing data
* corruption. Hence need to reserve 0x200 bytes to give room for
* any loading data.
* NOTE: This has to be the first member always.
*/
union {
u32 reserved_dmem[(LSF_BOOTSTRAP_OWNER_RESERVED_DMEM_SIZE/DMEM_WORD_SIZE)];
} ucode_reserved_space;
/** Signature of ACR ucode. */
u32 signatures[FLCN_SIG_SIZE];
/**
* WPR Region ID holding the WPR header and its details
*
* on GV11B, wpr_region_id set to 0x0 by default to indicate
* to ACR HS ucode to fetch WPR region details from H/W &
* updating WPR start_addr, end_addr, read_mask & write_mask
* of struct #flcn_acr_region_prop.
*/
u32 wpr_region_id;
/** Offset from the non-WPR base holding the wpr header */
u32 wpr_offset;
/** usable memory ranges, on GV11B it is not set */
u32 mmu_mem_range;
/**
* WPR Region descriptors to provide info about WPR.
* on GV11B, no_regions set to 1 & region properties value to 0x0
* to indicate to ACR HS ucode to fetch WPR region details from H/W.
*/
struct flcn_acr_regions regions;
/**
* stores the size of the ucode blob.
*
* On GV11B, size is calculated at runtime & aligned to 256 bytes.
* Size varies based on number of LS falcon supports.
*/
u32 nonwpr_ucode_blob_size;
/**
	 * Stores the sysmem (iGPU)/FB (dGPU) non-WPR start address where
	 * the kernel stores the ucode blob.
*/
u64 nonwpr_ucode_blob_start;
/** dummy space, not used by iGPU */
u32 dummy[DUMMY_SPACE_SIZE];
};
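/*
 * Illustrative sketch (hypothetical helper, not part of the interface):
 * populating the descriptor with the GV11B defaults documented above.
 * The blob start address and 256-byte-aligned size are assumed to come
 * from the kernel's non-WPR ucode blob allocation.
 *
 *   static void fill_acr_desc_gv11b(struct flcn_acr_desc *desc,
 *                                   u64 blob_start, u32 blob_size_aligned)
 *   {
 *           (void) memset(desc, 0, sizeof(*desc));
 *           // 0 tells the ACR HS ucode to fetch WPR details from H/W.
 *           desc->wpr_region_id = 0U;
 *           desc->regions.no_regions = 1U;
 *           desc->nonwpr_ucode_blob_size = blob_size_aligned;
 *           desc->nonwpr_ucode_blob_start = blob_start;
 *   }
 */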
struct flcn2_acr_desc {
/**
* WPR Region ID holding the WPR header and its details
*
	 * On GPUID_NEXT, wpr_region_id is set to 0x0 by default to indicate
	 * to the ACR HS ucode that it should fetch the WPR region details
	 * from H/W and update the start_addr, end_addr, read_mask & write_mask
	 * members of struct #flcn_acr_region_prop.
*/
u32 wpr_region_id;
/** Offset from the non-WPR base holding the wpr header */
u32 wpr_offset;
/**
* WPR Region descriptors to provide info about WPR.
	 * On GPUID_NEXT, no_regions is set to 1 and the region property
	 * values to 0x0 to indicate to the ACR HS ucode that it should fetch
	 * the WPR region details from H/W.
*/
struct flcn_acr_regions regions;
/**
	 * Stores the size of the ucode blob.
	 *
	 * On GPUID_NEXT, the size is calculated at runtime and aligned to 256
	 * bytes. The size varies based on the number of LS falcons supported.
*/
u32 nonwpr_ucode_blob_size;
/**
	 * Stores the sysmem (iGPU)/FB (dGPU) non-WPR start address where
	 * the kernel stores the ucode blob.
*/
u64 nonwpr_ucode_blob_start;
u64 ls_pmu_desc;
};
/** @} */
#endif /* NVGPU_ACR_INTERFACE_H */

View File

@@ -0,0 +1,122 @@
/*
* CBC
*
* Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/cbc.h>
#include <nvgpu/dma.h>
#include <nvgpu/log.h>
#include <nvgpu/nvgpu_mem.h>
#include <nvgpu/comptags.h>
void nvgpu_cbc_remove_support(struct gk20a *g)
{
struct nvgpu_cbc *cbc = g->cbc;
nvgpu_log_fn(g, " ");
if (cbc == NULL) {
return;
}
if (nvgpu_mem_is_valid(&cbc->compbit_store.mem)) {
nvgpu_dma_free(g, &cbc->compbit_store.mem);
(void) memset(&cbc->compbit_store, 0,
sizeof(struct compbit_store_desc));
}
gk20a_comptag_allocator_destroy(g, &cbc->comp_tags);
nvgpu_kfree(g, cbc);
g->cbc = NULL;
}
/*
 * This function is triggered multiple times during finalize_poweron.
 * It must not return early when cbc is already non-NULL:
 * cbc.init(), which re-writes HW registers that are reset during suspend,
 * must be allowed to execute each time.
*/
int nvgpu_cbc_init_support(struct gk20a *g)
{
int err = 0;
struct nvgpu_cbc *cbc = g->cbc;
nvgpu_log_fn(g, " ");
if (cbc == NULL) {
cbc = nvgpu_kzalloc(g, sizeof(*cbc));
if (cbc == NULL) {
return -ENOMEM;
}
g->cbc = cbc;
if (g->ops.cbc.alloc_comptags != NULL) {
err = g->ops.cbc.alloc_comptags(g, g->cbc);
if (err != 0) {
nvgpu_err(g, "Failed to allocate comptags");
nvgpu_kfree(g, cbc);
g->cbc = NULL;
return err;
}
}
}
if (g->ops.cbc.init != NULL) {
g->ops.cbc.init(g, g->cbc);
}
return err;
}
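/*
 * Illustrative usage sketch (the caller below is assumed and not part of
 * this file): the common poweron path can call nvgpu_cbc_init_support()
 * on every poweron.
 *
 *   static int example_finalize_poweron_cbc(struct gk20a *g)
 *   {
 *           // Safe to call repeatedly; re-runs cbc.init() even when the
 *           // cbc struct already exists from a previous poweron.
 *           return nvgpu_cbc_init_support(g);
 *   }
 */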
int nvgpu_cbc_alloc(struct gk20a *g, size_t compbit_backing_size,
bool vidmem_alloc)
{
struct nvgpu_cbc *cbc = g->cbc;
if (nvgpu_mem_is_valid(&cbc->compbit_store.mem) != 0) {
return 0;
}
#ifdef CONFIG_NVGPU_DGPU
if (vidmem_alloc == true) {
/*
		 * The backing store MUST be physically contiguous and allocated
		 * in one chunk. The vidmem allocation API does not support a
		 * FORCE_CONTIGUOUS-like flag to request contiguous memory, but
		 * this allocation is served by the vidmem bootstrap allocator,
		 * which always allocates contiguous memory.
*/
return nvgpu_dma_alloc_vid(g,
compbit_backing_size,
&cbc->compbit_store.mem);
} else
#endif
{
return nvgpu_dma_alloc_flags_sys(g,
NVGPU_DMA_PHYSICALLY_ADDRESSED,
compbit_backing_size,
&cbc->compbit_store.mem);
}
}

View File

@@ -0,0 +1,71 @@
/*
* Copyright (c) 2018-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/types.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/engines.h>
#include <nvgpu/device.h>
#include <nvgpu/ce.h>
#include <nvgpu/power_features/cg.h>
#include <nvgpu/cic.h>
#include <nvgpu/mc.h>
int nvgpu_ce_init_support(struct gk20a *g)
{
int err = 0;
if (g->ops.ce.set_pce2lce_mapping != NULL) {
g->ops.ce.set_pce2lce_mapping(g);
}
err = nvgpu_mc_reset_devtype(g, NVGPU_DEVTYPE_LCE);
if (err != 0) {
nvgpu_err(g, "NVGPU_DEVTYPE_LCE reset failed");
return err;
}
nvgpu_cg_slcg_ce2_load_enable(g);
nvgpu_cg_blcg_ce_load_enable(g);
#if defined(CONFIG_NVGPU_HAL_NON_FUSA) && defined(CONFIG_NVGPU_NEXT)
nvgpu_cg_elcg_ce_load_enable(g);
#endif
if (g->ops.ce.init_prod_values != NULL) {
g->ops.ce.init_prod_values(g);
}
if (g->ops.ce.init_hw != NULL) {
g->ops.ce.init_hw(g);
}
if (g->ops.ce.intr_enable != NULL) {
g->ops.ce.intr_enable(g, true);
}
	/* Enable interrupts at MC level */
nvgpu_cic_intr_stall_unit_config(g, NVGPU_CIC_INTR_UNIT_CE, NVGPU_CIC_INTR_ENABLE);
nvgpu_cic_intr_nonstall_unit_config(g, NVGPU_CIC_INTR_UNIT_CE, NVGPU_CIC_INTR_ENABLE);
return 0;
}

View File

@@ -0,0 +1,621 @@
/*
* Copyright (c) 2018-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/types.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/engines.h>
#include <nvgpu/os_sched.h>
#include <nvgpu/channel.h>
#include <nvgpu/watchdog.h>
#include <nvgpu/dma.h>
#include <nvgpu/utils.h>
#include <nvgpu/fence.h>
#include <nvgpu/ce_app.h>
#include <nvgpu/power_features/cg.h>
#include "common/ce/ce_priv.h"
static inline u32 nvgpu_ce_get_valid_launch_flags(struct gk20a *g,
u32 launch_flags)
{
#ifdef CONFIG_NVGPU_DGPU
/*
	 * If there is no local memory available,
	 * don't allow local-memory-related CE flags.
*/
if (g->mm.vidmem.size == 0ULL) {
launch_flags &= ~(NVGPU_CE_SRC_LOCATION_LOCAL_FB |
NVGPU_CE_DST_LOCATION_LOCAL_FB);
}
#endif
return launch_flags;
}
int nvgpu_ce_execute_ops(struct gk20a *g,
u32 ce_ctx_id,
u64 src_paddr,
u64 dst_paddr,
u64 size,
u32 payload,
u32 launch_flags,
u32 request_operation,
u32 submit_flags,
struct nvgpu_fence_type **fence_out)
{
int ret = -EPERM;
struct nvgpu_ce_app *ce_app = g->ce_app;
struct nvgpu_ce_gpu_ctx *ce_ctx, *ce_ctx_save;
bool found = false;
u32 *cmd_buf_cpu_va;
u64 cmd_buf_gpu_va = 0UL;
u32 method_size;
u32 cmd_buf_read_offset;
u32 dma_copy_class;
struct nvgpu_gpfifo_entry gpfifo;
struct nvgpu_channel_fence fence = {0U, 0U};
struct nvgpu_fence_type *ce_cmd_buf_fence_out = NULL;
if (!ce_app->initialised || ce_app->app_state != NVGPU_CE_ACTIVE) {
goto end;
}
/* This shouldn't happen */
if (size == 0ULL) {
ret = -EINVAL;
goto end;
}
if (request_operation != NVGPU_CE_PHYS_MODE_TRANSFER &&
request_operation != NVGPU_CE_MEMSET) {
ret = -EINVAL;
goto end;
}
if (src_paddr > NVGPU_CE_MAX_ADDRESS) {
ret = -EINVAL;
goto end;
}
if (dst_paddr > NVGPU_CE_MAX_ADDRESS) {
ret = -EINVAL;
goto end;
}
nvgpu_mutex_acquire(&ce_app->app_mutex);
nvgpu_list_for_each_entry_safe(ce_ctx, ce_ctx_save,
&ce_app->allocated_contexts, nvgpu_ce_gpu_ctx, list) {
if (ce_ctx->ctx_id == ce_ctx_id) {
found = true;
break;
}
}
nvgpu_mutex_release(&ce_app->app_mutex);
if (!found) {
ret = -EINVAL;
goto end;
}
if (ce_ctx->gpu_ctx_state != NVGPU_CE_GPU_CTX_ALLOCATED) {
ret = -ENODEV;
goto end;
}
nvgpu_mutex_acquire(&ce_ctx->gpu_ctx_mutex);
ce_ctx->cmd_buf_read_queue_offset %= NVGPU_CE_MAX_INFLIGHT_JOBS;
cmd_buf_read_offset = (ce_ctx->cmd_buf_read_queue_offset *
(NVGPU_CE_MAX_COMMAND_BUFF_BYTES_PER_SUBMIT /
U32(sizeof(u32))));
cmd_buf_cpu_va = (u32 *)ce_ctx->cmd_buf_mem.cpu_va;
if (ce_ctx->postfences[ce_ctx->cmd_buf_read_queue_offset] != NULL) {
struct nvgpu_fence_type **prev_post_fence =
&ce_ctx->postfences[ce_ctx->cmd_buf_read_queue_offset];
ret = nvgpu_fence_wait(g, *prev_post_fence,
nvgpu_get_poll_timeout(g));
nvgpu_fence_put(*prev_post_fence);
*prev_post_fence = NULL;
if (ret != 0) {
goto noop;
}
}
cmd_buf_gpu_va = (ce_ctx->cmd_buf_mem.gpu_va +
(u64)(cmd_buf_read_offset * sizeof(u32)));
dma_copy_class = g->ops.get_litter_value(g, GPU_LIT_DMA_COPY_CLASS);
method_size = nvgpu_ce_prepare_submit(src_paddr,
dst_paddr,
size,
&cmd_buf_cpu_va[cmd_buf_read_offset],
payload,
nvgpu_ce_get_valid_launch_flags(g, launch_flags),
request_operation,
dma_copy_class);
nvgpu_assert(method_size <= NVGPU_CE_MAX_COMMAND_BUFF_BYTES_PER_SUBMIT);
if (method_size != 0U) {
/* store the element into gpfifo */
g->ops.pbdma.format_gpfifo_entry(g, &gpfifo,
cmd_buf_gpu_va, method_size);
/*
		 * Always take the postfence, as it is needed to protect the
		 * CE context.
*/
submit_flags |= NVGPU_SUBMIT_FLAGS_FENCE_GET;
nvgpu_smp_wmb();
ret = nvgpu_submit_channel_gpfifo_kernel(ce_ctx->ch, &gpfifo,
1, submit_flags, &fence, &ce_cmd_buf_fence_out);
if (ret == 0) {
ce_ctx->postfences[ce_ctx->cmd_buf_read_queue_offset] =
ce_cmd_buf_fence_out;
if (fence_out != NULL) {
nvgpu_fence_get(ce_cmd_buf_fence_out);
*fence_out = ce_cmd_buf_fence_out;
}
/* Next available command buffer queue Index */
++ce_ctx->cmd_buf_read_queue_offset;
}
} else {
ret = -ENOMEM;
}
noop:
nvgpu_mutex_release(&ce_ctx->gpu_ctx_mutex);
end:
return ret;
}
/* static CE app api */
static void nvgpu_ce_put_fences(struct nvgpu_ce_gpu_ctx *ce_ctx)
{
u32 i;
for (i = 0U; i < NVGPU_CE_MAX_INFLIGHT_JOBS; i++) {
struct nvgpu_fence_type **fence = &ce_ctx->postfences[i];
if (*fence != NULL) {
nvgpu_fence_put(*fence);
}
*fence = NULL;
}
}
/* caller must hold ce_app->app_mutex */
static void nvgpu_ce_delete_gpu_context_locked(struct nvgpu_ce_gpu_ctx *ce_ctx)
{
struct nvgpu_list_node *list = &ce_ctx->list;
ce_ctx->gpu_ctx_state = NVGPU_CE_GPU_CTX_DELETED;
ce_ctx->tsg->abortable = true;
nvgpu_mutex_acquire(&ce_ctx->gpu_ctx_mutex);
if (nvgpu_mem_is_valid(&ce_ctx->cmd_buf_mem)) {
nvgpu_ce_put_fences(ce_ctx);
nvgpu_dma_unmap_free(ce_ctx->vm, &ce_ctx->cmd_buf_mem);
}
/*
* free the channel
* nvgpu_channel_close() will also unbind the channel from TSG
*/
nvgpu_channel_close(ce_ctx->ch);
nvgpu_ref_put(&ce_ctx->tsg->refcount, nvgpu_tsg_release);
/* housekeeping on app */
if ((list->prev != NULL) && (list->next != NULL)) {
nvgpu_list_del(list);
}
nvgpu_mutex_release(&ce_ctx->gpu_ctx_mutex);
nvgpu_mutex_destroy(&ce_ctx->gpu_ctx_mutex);
nvgpu_kfree(ce_ctx->g, ce_ctx);
}
static u32 nvgpu_prepare_ce_op(u32 *cmd_buf_cpu_va,
u64 src_paddr, u64 dst_paddr,
u32 width, u32 height, u32 payload,
bool mode_transfer, u32 launch_flags)
{
u32 launch = 0U;
u32 methodSize = 0U;
if (mode_transfer) {
/* setup the source */
cmd_buf_cpu_va[methodSize++] = 0x20028100;
cmd_buf_cpu_va[methodSize++] = (u64_hi32(src_paddr) &
NVGPU_CE_UPPER_ADDRESS_OFFSET_MASK);
cmd_buf_cpu_va[methodSize++] = (u64_lo32(src_paddr) &
NVGPU_CE_LOWER_ADDRESS_OFFSET_MASK);
cmd_buf_cpu_va[methodSize++] = 0x20018098;
if ((launch_flags &
NVGPU_CE_SRC_LOCATION_LOCAL_FB) != 0U) {
cmd_buf_cpu_va[methodSize++] = 0x00000000;
} else if ((launch_flags &
NVGPU_CE_SRC_LOCATION_NONCOHERENT_SYSMEM) != 0U) {
cmd_buf_cpu_va[methodSize++] = 0x00000002;
} else {
cmd_buf_cpu_va[methodSize++] = 0x00000001;
}
launch |= 0x00001000U;
} else { /* memset */
/* Remap from component A on 1 byte wide pixels */
cmd_buf_cpu_va[methodSize++] = 0x200181c2;
cmd_buf_cpu_va[methodSize++] = 0x00000004;
cmd_buf_cpu_va[methodSize++] = 0x200181c0;
cmd_buf_cpu_va[methodSize++] = payload;
launch |= 0x00000400U;
}
/* setup the destination/output */
cmd_buf_cpu_va[methodSize++] = 0x20068102;
cmd_buf_cpu_va[methodSize++] = (u64_hi32(dst_paddr) &
NVGPU_CE_UPPER_ADDRESS_OFFSET_MASK);
cmd_buf_cpu_va[methodSize++] = (u64_lo32(dst_paddr) &
NVGPU_CE_LOWER_ADDRESS_OFFSET_MASK);
/* Pitch in/out */
cmd_buf_cpu_va[methodSize++] = width;
cmd_buf_cpu_va[methodSize++] = width;
/* width and line count */
cmd_buf_cpu_va[methodSize++] = width;
cmd_buf_cpu_va[methodSize++] = height;
cmd_buf_cpu_va[methodSize++] = 0x20018099;
if ((launch_flags & NVGPU_CE_DST_LOCATION_LOCAL_FB) != 0U) {
cmd_buf_cpu_va[methodSize++] = 0x00000000;
} else if ((launch_flags &
NVGPU_CE_DST_LOCATION_NONCOHERENT_SYSMEM) != 0U) {
cmd_buf_cpu_va[methodSize++] = 0x00000002;
} else {
cmd_buf_cpu_va[methodSize++] = 0x00000001;
}
launch |= 0x00002005U;
if ((launch_flags &
NVGPU_CE_SRC_MEMORY_LAYOUT_BLOCKLINEAR) != 0U) {
launch |= 0x00000000U;
} else {
launch |= 0x00000080U;
}
if ((launch_flags &
NVGPU_CE_DST_MEMORY_LAYOUT_BLOCKLINEAR) != 0U) {
launch |= 0x00000000U;
} else {
launch |= 0x00000100U;
}
cmd_buf_cpu_va[methodSize++] = 0x200180c0;
cmd_buf_cpu_va[methodSize++] = launch;
return methodSize;
}
u32 nvgpu_ce_prepare_submit(u64 src_paddr,
u64 dst_paddr,
u64 size,
u32 *cmd_buf_cpu_va,
u32 payload,
u32 launch_flags,
u32 request_operation,
u32 dma_copy_class)
{
u32 methodSize = 0;
u64 low, hi;
bool mode_transfer = (request_operation == NVGPU_CE_PHYS_MODE_TRANSFER);
/* set the channel object */
cmd_buf_cpu_va[methodSize++] = 0x20018000;
cmd_buf_cpu_va[methodSize++] = dma_copy_class;
/*
* The CE can work with 2D rectangles of at most 0xffffffff or 4G-1
* pixels per line. Exactly 2G is a more round number, so we'll use
* that as the base unit to clear large amounts of memory. If the
* requested size is not a multiple of 2G, we'll do one clear first to
* deal with the low bits, followed by another in units of 2G.
*
	 * We'll use 1 byte per pixel to do byte-aligned sets/copies. The
	 * maximum number of lines is also 4G-1, so (4G-1) * 2 GB is enough
	 * for the whole vidmem.
*/
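	/*
	 * Illustrative worked example (values are hypothetical): for a
	 * requested size of 5 GiB + 100 bytes (0x140000064ULL),
	 * low = 0x40000064 and hi = 2, so one 0x40000064-byte line is
	 * submitted first, followed by two 0x80000000-byte lines.
	 */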
/* Lower 2GB */
low = size & 0x7fffffffULL;
/* Over 2GB */
hi = size >> 31U;
/*
* Unable to fit this in one submit, but no device should have this
* much memory anyway.
*/
if (hi > 0xffffffffULL) {
/* zero size means error */
return 0;
}
if (low != 0U) {
/* do the low bytes in one long line */
methodSize += nvgpu_prepare_ce_op(&cmd_buf_cpu_va[methodSize],
src_paddr, dst_paddr,
nvgpu_safe_cast_u64_to_u32(low), 1,
payload, mode_transfer, launch_flags);
}
if (hi != 0U) {
/* do the high bytes in many 2G lines */
methodSize += nvgpu_prepare_ce_op(&cmd_buf_cpu_va[methodSize],
src_paddr + low, dst_paddr + low,
0x80000000ULL, nvgpu_safe_cast_u64_to_u32(hi),
payload, mode_transfer, launch_flags);
}
return methodSize;
}
/* global CE app related apis */
int nvgpu_ce_app_init_support(struct gk20a *g)
{
struct nvgpu_ce_app *ce_app = g->ce_app;
if (unlikely(ce_app == NULL)) {
ce_app = nvgpu_kzalloc(g, sizeof(*ce_app));
if (ce_app == NULL) {
return -ENOMEM;
}
g->ce_app = ce_app;
}
if (ce_app->initialised) {
		/* assume this happens during the GPU poweron/poweroff sequence */
ce_app->app_state = NVGPU_CE_ACTIVE;
return 0;
}
nvgpu_log(g, gpu_dbg_fn, "ce: init");
nvgpu_mutex_init(&ce_app->app_mutex);
nvgpu_mutex_acquire(&ce_app->app_mutex);
nvgpu_init_list_node(&ce_app->allocated_contexts);
ce_app->ctx_count = 0;
ce_app->next_ctx_id = 0;
ce_app->initialised = true;
ce_app->app_state = NVGPU_CE_ACTIVE;
nvgpu_mutex_release(&ce_app->app_mutex);
nvgpu_log(g, gpu_dbg_cde_ctx, "ce: init finished");
return 0;
}
void nvgpu_ce_app_destroy(struct gk20a *g)
{
struct nvgpu_ce_app *ce_app = g->ce_app;
struct nvgpu_ce_gpu_ctx *ce_ctx, *ce_ctx_save;
if (ce_app == NULL) {
return;
}
if (ce_app->initialised == false) {
goto free;
}
ce_app->app_state = NVGPU_CE_SUSPEND;
ce_app->initialised = false;
nvgpu_mutex_acquire(&ce_app->app_mutex);
nvgpu_list_for_each_entry_safe(ce_ctx, ce_ctx_save,
&ce_app->allocated_contexts, nvgpu_ce_gpu_ctx, list) {
nvgpu_ce_delete_gpu_context_locked(ce_ctx);
}
nvgpu_init_list_node(&ce_app->allocated_contexts);
ce_app->ctx_count = 0;
ce_app->next_ctx_id = 0;
nvgpu_mutex_release(&ce_app->app_mutex);
nvgpu_mutex_destroy(&ce_app->app_mutex);
free:
nvgpu_kfree(g, ce_app);
g->ce_app = NULL;
}
void nvgpu_ce_app_suspend(struct gk20a *g)
{
struct nvgpu_ce_app *ce_app = g->ce_app;
if (ce_app == NULL || !ce_app->initialised) {
return;
}
ce_app->app_state = NVGPU_CE_SUSPEND;
}
/* CE app utility functions */
u32 nvgpu_ce_app_create_context(struct gk20a *g,
u32 runlist_id,
int timeslice,
int runlist_level)
{
struct nvgpu_ce_gpu_ctx *ce_ctx;
struct nvgpu_ce_app *ce_app = g->ce_app;
struct nvgpu_setup_bind_args setup_bind_args;
u32 ctx_id = NVGPU_CE_INVAL_CTX_ID;
int err = 0;
if (!ce_app->initialised || ce_app->app_state != NVGPU_CE_ACTIVE) {
return ctx_id;
}
ce_ctx = nvgpu_kzalloc(g, sizeof(*ce_ctx));
if (ce_ctx == NULL) {
return ctx_id;
}
nvgpu_mutex_init(&ce_ctx->gpu_ctx_mutex);
ce_ctx->g = g;
ce_ctx->cmd_buf_read_queue_offset = 0;
ce_ctx->vm = g->mm.ce.vm;
/* allocate a tsg if needed */
ce_ctx->tsg = nvgpu_tsg_open(g, nvgpu_current_pid(g));
if (ce_ctx->tsg == NULL) {
nvgpu_err(g, "ce: gk20a tsg not available");
goto end;
}
/* this TSG should never be aborted */
ce_ctx->tsg->abortable = false;
	/* kernel clients always need a privileged channel */
ce_ctx->ch = nvgpu_channel_open_new(g, runlist_id, true,
nvgpu_current_pid(g), nvgpu_current_tid(g));
if (ce_ctx->ch == NULL) {
nvgpu_err(g, "ce: gk20a channel not available");
goto end;
}
nvgpu_channel_wdt_disable(ce_ctx->ch->wdt);
/* bind the channel to the vm */
err = g->ops.mm.vm_bind_channel(g->mm.ce.vm, ce_ctx->ch);
if (err != 0) {
nvgpu_err(g, "ce: could not bind vm");
goto end;
}
err = nvgpu_tsg_bind_channel(ce_ctx->tsg, ce_ctx->ch);
if (err != 0) {
nvgpu_err(g, "ce: unable to bind to tsg");
goto end;
}
setup_bind_args.num_gpfifo_entries = 1024;
setup_bind_args.num_inflight_jobs = 0;
setup_bind_args.flags = 0;
err = nvgpu_channel_setup_bind(ce_ctx->ch, &setup_bind_args);
if (err != 0) {
nvgpu_err(g, "ce: unable to setup and bind channel");
goto end;
}
/* allocate command buffer from sysmem */
err = nvgpu_dma_alloc_map_sys(ce_ctx->vm,
NVGPU_CE_MAX_INFLIGHT_JOBS *
NVGPU_CE_MAX_COMMAND_BUFF_BYTES_PER_SUBMIT,
&ce_ctx->cmd_buf_mem);
if (err != 0) {
nvgpu_err(g,
"ce: alloc command buffer failed");
goto end;
}
(void) memset(ce_ctx->cmd_buf_mem.cpu_va, 0x00,
ce_ctx->cmd_buf_mem.size);
#ifdef CONFIG_NVGPU_CHANNEL_TSG_SCHEDULING
/* -1 means default channel timeslice value */
if (timeslice != -1) {
err = g->ops.tsg.set_timeslice(ce_ctx->tsg, timeslice);
if (err != 0) {
nvgpu_err(g, "ce: set timesliced failed for CE context");
goto end;
}
}
/* -1 means default channel runlist level */
if (runlist_level != -1) {
err = nvgpu_tsg_set_interleave(ce_ctx->tsg, runlist_level);
if (err != 0) {
nvgpu_err(g, "ce: set runlist interleave failed");
goto end;
}
}
#endif
nvgpu_mutex_acquire(&ce_app->app_mutex);
ctx_id = ce_ctx->ctx_id = ce_app->next_ctx_id;
nvgpu_list_add(&ce_ctx->list, &ce_app->allocated_contexts);
++ce_app->next_ctx_id;
++ce_app->ctx_count;
nvgpu_mutex_release(&ce_app->app_mutex);
ce_ctx->gpu_ctx_state = NVGPU_CE_GPU_CTX_ALLOCATED;
end:
if (ctx_id == NVGPU_CE_INVAL_CTX_ID) {
nvgpu_mutex_acquire(&ce_app->app_mutex);
nvgpu_ce_delete_gpu_context_locked(ce_ctx);
nvgpu_mutex_release(&ce_app->app_mutex);
}
return ctx_id;
}
void nvgpu_ce_app_delete_context(struct gk20a *g,
u32 ce_ctx_id)
{
struct nvgpu_ce_app *ce_app = g->ce_app;
struct nvgpu_ce_gpu_ctx *ce_ctx, *ce_ctx_save;
if (ce_app == NULL || !ce_app->initialised ||
ce_app->app_state != NVGPU_CE_ACTIVE) {
return;
}
nvgpu_mutex_acquire(&ce_app->app_mutex);
nvgpu_list_for_each_entry_safe(ce_ctx, ce_ctx_save,
&ce_app->allocated_contexts, nvgpu_ce_gpu_ctx, list) {
if (ce_ctx->ctx_id == ce_ctx_id) {
nvgpu_ce_delete_gpu_context_locked(ce_ctx);
--ce_app->ctx_count;
break;
}
}
nvgpu_mutex_release(&ce_app->app_mutex);
}

View File

@@ -0,0 +1,82 @@
/*
* Copyright (c) 2011-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_CE_PRIV_H
#define NVGPU_CE_PRIV_H
#include <nvgpu/types.h>
#include <nvgpu/nvgpu_mem.h>
#include <nvgpu/list.h>
#include <nvgpu/lock.h>
struct gk20a;
/* ce context db */
struct nvgpu_ce_gpu_ctx {
struct gk20a *g;
u32 ctx_id;
struct nvgpu_mutex gpu_ctx_mutex;
int gpu_ctx_state;
/* tsg related data */
struct nvgpu_tsg *tsg;
/* channel related data */
struct nvgpu_channel *ch;
struct vm_gk20a *vm;
/* cmd buf mem_desc */
struct nvgpu_mem cmd_buf_mem;
struct nvgpu_fence_type *postfences[NVGPU_CE_MAX_INFLIGHT_JOBS];
struct nvgpu_list_node list;
u32 cmd_buf_read_queue_offset;
};
/* global ce app db */
struct nvgpu_ce_app {
bool initialised;
struct nvgpu_mutex app_mutex;
int app_state;
struct nvgpu_list_node allocated_contexts;
u32 ctx_count;
u32 next_ctx_id;
};
static inline struct nvgpu_ce_gpu_ctx *
nvgpu_ce_gpu_ctx_from_list(struct nvgpu_list_node *node)
{
return (struct nvgpu_ce_gpu_ctx *)
((uintptr_t)node - offsetof(struct nvgpu_ce_gpu_ctx, list));
};
u32 nvgpu_ce_prepare_submit(u64 src_paddr,
u64 dst_paddr,
u64 size,
u32 *cmd_buf_cpu_va,
u32 payload,
u32 launch_flags,
u32 request_operation,
u32 dma_copy_class);
#endif /*NVGPU_CE_PRIV_H*/

View File

@@ -0,0 +1,91 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_ce_err(struct gk20a *g, u32 hw_unit,
u32 inst, u32 err_id, u32 intr_info)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if (hw_unit != NVGPU_ERR_MODULE_CE) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_ce_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.ce_info.header.sub_unit_id = inst;
err_pkt.err_desc = err_desc;
/* sub_err_type can be decoded using intr_info by referring
* to the interrupt status register definition corresponding
* to the error that is being reported.
*/
err_pkt.err_info.ce_info.header.sub_err_type = intr_info;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.ce_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report CE error: "
"inst=%u err_id=%u intr_info=%u",
inst, err_id, intr_info);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_ce_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type)
{
nvgpu_report_ce_err(g, hw_unit, 0U, err_index, sub_err_type);
}

View File

@@ -0,0 +1,161 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/kmem.h>
#include <nvgpu/log.h>
#include <nvgpu/cic.h>
#include <nvgpu/nvgpu_err_info.h>
#include "cic_priv.h"
int nvgpu_cic_init_common(struct gk20a *g)
{
struct nvgpu_cic *cic;
int err = 0;
if (g->cic != NULL) {
cic_dbg(g, "CIC unit already initialized");
return 0;
}
cic = nvgpu_kzalloc(g, sizeof(*cic));
if (cic == NULL) {
nvgpu_err(g, "Failed to allocate memory "
"for struct nvgpu_cic");
return -ENOMEM;
}
if (g->ops.cic.init != NULL) {
err = g->ops.cic.init(g, cic);
if (err != 0) {
nvgpu_err(g, "CIC chip specific "
"initialization failed.");
goto cleanup;
}
} else {
cic->err_lut = NULL;
cic->num_hw_modules = 0;
}
g->cic = cic;
cic_dbg(g, "CIC unit initialization done.");
return 0;
cleanup:
if (cic != NULL) {
nvgpu_kfree(g, cic);
}
return err;
}
int nvgpu_cic_deinit_common(struct gk20a *g)
{
struct nvgpu_cic *cic;
cic = g->cic;
if (cic == NULL) {
cic_dbg(g, "CIC unit already deinitialized");
return 0;
}
cic->err_lut = NULL;
cic->num_hw_modules = 0;
nvgpu_kfree(g, cic);
g->cic = NULL;
return 0;
}
int nvgpu_cic_check_hw_unit_id(struct gk20a *g, u32 hw_unit_id)
{
if (g->cic == NULL) {
nvgpu_err(g, "CIC is not initialized");
return -EINVAL;
}
if (g->cic->num_hw_modules == 0U) {
cic_dbg(g, "LUT not initialized.");
return -EINVAL;
}
if (hw_unit_id >= g->cic->num_hw_modules) {
cic_dbg(g, "Invalid input HW unit ID.");
return -EINVAL;
}
return 0;
}
int nvgpu_cic_check_err_id(struct gk20a *g, u32 hw_unit_id,
u32 err_id)
{
int err = 0;
if ((g->cic == NULL) || (g->cic->err_lut == NULL)) {
cic_dbg(g, "CIC/LUT not initialized.");
return -EINVAL;
}
err = nvgpu_cic_check_hw_unit_id(g, hw_unit_id);
if (err != 0) {
return err;
}
if (err_id >= g->cic->err_lut[hw_unit_id].num_errs) {
err = -EINVAL;
}
return err;
}
int nvgpu_cic_get_err_desc(struct gk20a *g, u32 hw_unit_id,
u32 err_id, struct nvgpu_err_desc **err_desc)
{
int err = 0;
	/* The (g->cic != NULL) and (g->cic->err_lut != NULL) checks
	 * can be skipped here as they are done as part of
	 * nvgpu_cic_check_err_id() called below.
*/
err = nvgpu_cic_check_err_id(g, hw_unit_id, err_id);
if (err != 0) {
return err;
}
*err_desc = &(g->cic->err_lut[hw_unit_id].errs[err_id]);
return err;
}
int nvgpu_cic_get_num_hw_modules(struct gk20a *g)
{
if (g->cic == NULL) {
nvgpu_err(g, "CIC is not initialized");
return -EINVAL;
}
return g->cic->num_hw_modules;
}

View File

@@ -0,0 +1,251 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/cic.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/bug.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/trace.h>
int nvgpu_cic_wait_for_stall_interrupts(struct gk20a *g, u32 timeout)
{
/* wait until all stalling irqs are handled */
return NVGPU_COND_WAIT(&g->mc.sw_irq_stall_last_handled_cond,
nvgpu_atomic_read(&g->mc.sw_irq_stall_pending) == 0,
timeout);
}
int nvgpu_cic_wait_for_nonstall_interrupts(struct gk20a *g, u32 timeout)
{
/* wait until all non-stalling irqs are handled */
return NVGPU_COND_WAIT(&g->mc.sw_irq_nonstall_last_handled_cond,
nvgpu_atomic_read(&g->mc.sw_irq_nonstall_pending) == 0,
timeout);
}
void nvgpu_cic_wait_for_deferred_interrupts(struct gk20a *g)
{
int ret;
ret = nvgpu_cic_wait_for_stall_interrupts(g, 0U);
if (ret != 0) {
nvgpu_err(g, "wait for stall interrupts failed %d", ret);
}
ret = nvgpu_cic_wait_for_nonstall_interrupts(g, 0U);
if (ret != 0) {
nvgpu_err(g, "wait for nonstall interrupts failed %d", ret);
}
}
void nvgpu_cic_intr_mask(struct gk20a *g)
{
unsigned long flags = 0;
if (g->ops.mc.intr_mask != NULL) {
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_mask(g);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
}
#ifdef CONFIG_NVGPU_NON_FUSA
void nvgpu_cic_log_pending_intrs(struct gk20a *g)
{
if (g->ops.mc.log_pending_intrs != NULL) {
g->ops.mc.log_pending_intrs(g);
}
}
void nvgpu_cic_intr_enable(struct gk20a *g)
{
unsigned long flags = 0;
if (g->ops.mc.intr_enable != NULL) {
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_enable(g);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
}
#endif
void nvgpu_cic_intr_stall_unit_config(struct gk20a *g, u32 unit, bool enable)
{
unsigned long flags = 0;
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_stall_unit_config(g, unit, enable);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
void nvgpu_cic_intr_nonstall_unit_config(struct gk20a *g, u32 unit, bool enable)
{
unsigned long flags = 0;
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_nonstall_unit_config(g, unit, enable);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
void nvgpu_cic_intr_stall_pause(struct gk20a *g)
{
unsigned long flags = 0;
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_stall_pause(g);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
void nvgpu_cic_intr_stall_resume(struct gk20a *g)
{
unsigned long flags = 0;
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_stall_resume(g);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
void nvgpu_cic_intr_nonstall_pause(struct gk20a *g)
{
unsigned long flags = 0;
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_nonstall_pause(g);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
void nvgpu_cic_intr_nonstall_resume(struct gk20a *g)
{
unsigned long flags = 0;
nvgpu_spinlock_irqsave(&g->mc.intr_lock, flags);
g->ops.mc.intr_nonstall_resume(g);
nvgpu_spinunlock_irqrestore(&g->mc.intr_lock, flags);
}
static void nvgpu_cic_intr_nonstall_work(struct gk20a *g, u32 work_ops)
{
bool semaphore_wakeup, post_events;
semaphore_wakeup =
(((work_ops & NVGPU_CIC_NONSTALL_OPS_WAKEUP_SEMAPHORE) != 0U) ?
true : false);
post_events = (((work_ops & NVGPU_CIC_NONSTALL_OPS_POST_EVENTS) != 0U) ?
true : false);
if (semaphore_wakeup) {
g->ops.semaphore_wakeup(g, post_events);
}
}
u32 nvgpu_cic_intr_nonstall_isr(struct gk20a *g)
{
u32 non_stall_intr_val = 0U;
if (nvgpu_is_powered_off(g)) {
return NVGPU_CIC_INTR_UNMASK;
}
	/* the interrupt is not from the gpu when sharing the irq with others */
non_stall_intr_val = g->ops.mc.intr_nonstall(g);
if (non_stall_intr_val == 0U) {
return NVGPU_CIC_INTR_NONE;
}
nvgpu_cic_intr_nonstall_pause(g);
if (g->sw_quiesce_pending) {
return NVGPU_CIC_INTR_QUIESCE_PENDING;
}
nvgpu_atomic_set(&g->mc.sw_irq_nonstall_pending, 1);
return NVGPU_CIC_INTR_HANDLE;
}
void nvgpu_cic_intr_nonstall_handle(struct gk20a *g)
{
int err;
u32 nonstall_ops = 0;
nonstall_ops = g->ops.mc.isr_nonstall(g);
if (nonstall_ops != 0U) {
nvgpu_cic_intr_nonstall_work(g, nonstall_ops);
}
/* sync handled irq counter before re-enabling interrupts */
nvgpu_atomic_set(&g->mc.sw_irq_nonstall_pending, 0);
nvgpu_cic_intr_nonstall_resume(g);
err = nvgpu_cond_broadcast(&g->mc.sw_irq_nonstall_last_handled_cond);
if (err != 0) {
nvgpu_err(g, "nvgpu_cond_broadcast failed err=%d", err);
}
}
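/*
 * Illustrative sketch (the OS-layer glue is assumed; only the CIC calls
 * are from this file): a typical nonstall interrupt flow pairs the
 * top-half ISR with the deferred handler.
 *
 *   // hard IRQ context
 *   if (nvgpu_cic_intr_nonstall_isr(g) == NVGPU_CIC_INTR_HANDLE) {
 *           // deferred (threaded/bottom-half) context
 *           nvgpu_cic_intr_nonstall_handle(g);
 *   }
 */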
u32 nvgpu_cic_intr_stall_isr(struct gk20a *g)
{
u32 mc_intr_0 = 0U;
nvgpu_trace_intr_stall_start(g);
if (nvgpu_is_powered_off(g)) {
return NVGPU_CIC_INTR_UNMASK;
}
	/* the interrupt is not from the gpu when sharing the irq with others */
mc_intr_0 = g->ops.mc.intr_stall(g);
if (mc_intr_0 == 0U) {
return NVGPU_CIC_INTR_NONE;
}
nvgpu_cic_intr_stall_pause(g);
if (g->sw_quiesce_pending) {
return NVGPU_CIC_INTR_QUIESCE_PENDING;
}
nvgpu_atomic_set(&g->mc.sw_irq_stall_pending, 1);
nvgpu_trace_intr_stall_done(g);
return NVGPU_CIC_INTR_HANDLE;
}
void nvgpu_cic_intr_stall_handle(struct gk20a *g)
{
int err;
nvgpu_trace_intr_thread_stall_start(g);
g->ops.mc.isr_stall(g);
nvgpu_trace_intr_thread_stall_done(g);
/* sync handled irq counter before re-enabling interrupts */
nvgpu_atomic_set(&g->mc.sw_irq_stall_pending, 0);
nvgpu_cic_intr_stall_resume(g);
err = nvgpu_cond_broadcast(&g->mc.sw_irq_stall_last_handled_cond);
if (err != 0) {
nvgpu_err(g, "nvgpu_cond_broadcast failed err=%d", err);
}
}

View File

@@ -0,0 +1,291 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef CIC_PRIV_H
#define CIC_PRIV_H
#include <nvgpu/types.h>
struct gk20a;
struct nvgpu_err_hw_module;
struct nvgpu_err_msg;
struct gpu_err_header;
/**
* @file
*
* Declare CIC's private structure to store error-policy LUT and
* other data and ops needed during error reporting.
*/
#define ERR_INJECT_TEST_PATTERN 0xA5
/*
 * This struct contains members related to the error-policy look-up table
 * and the number of units reporting errors.
*/
struct nvgpu_cic {
/** Pointer for error look-up table. */
struct nvgpu_err_hw_module *err_lut;
/** Total number of GPU HW modules considered in CIC. */
u32 num_hw_modules;
};
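/*
 * Illustrative note (indexing scheme as used by the CIC common code):
 * entries are looked up per HW unit and then per error, e.g.
 *
 *   struct nvgpu_err_desc *desc =
 *           &g->cic->err_lut[hw_unit_id].errs[err_id];
 *
 * after the indices have been validated with nvgpu_cic_check_err_id().
 */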
/**
* @brief Inject ECC error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param inst [in] - Instance ID.
*
* - Sets values for error address and error count.
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_ecc_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 inst);
/**
* @brief Inject HOST error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param sub_err_type [in] - Sub error type.
*
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_host_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type);
/**
* @brief Inject GR error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param sub_err_type [in] - Sub error type.
*
* - Sets values for GR exception and SM machine check error information.
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_gr_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type);
/**
* @brief Inject CE error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param sub_err_type [in] - Sub error type.
*
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_ce_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type);
/**
 * @brief Inject PRI error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param err_code [in] - Error code.
*
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_pri_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 err_code);
/**
* @brief Inject PMU error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param sub_err_type [in] - Sub error type.
*
* - Sets values for error info.
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_pmu_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type);
/**
* @brief Inject CTXSW error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param inst [in] - Instance ID.
*
* - Sets values for error info.
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_ctxsw_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 inst);
/**
* @brief Inject MMU error.
*
* @param g [in] - The GPU driver struct.
* @param hw_unit [in] - Index of HW unit.
* @param err_index [in] - Error index.
* @param sub_err_type [in] - Sub error type.
*
* - Sets values for mmu page fault info.
* - Invokes error reporting API with the required set of inputs.
*
* @return None
*/
void nvgpu_inject_mmu_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type);
/**
* @brief Initialize error message header.
*
* @param header [in] - Error message header.
*
* This is used to initialize error message header.
*
* @return None
*/
void nvgpu_init_err_msg_header(struct gpu_err_header *header);
/**
* @brief Initialize error message.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is common
* for all HW units.
*
* @return None
*/
void nvgpu_init_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for HOST unit.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to HOST unit.
*
* @return None
*/
void nvgpu_init_host_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize ECC error message.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to ECC errors.
*
* @return None
*/
void nvgpu_init_ecc_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for PRI unit.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to PRI unit.
*
* @return None
*/
void nvgpu_init_pri_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for CE unit.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to CE unit.
*
* @return None
*/
void nvgpu_init_ce_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for PMU unit.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to PMU unit.
*
* @return None
*/
void nvgpu_init_pmu_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for GR unit.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to GR unit.
*
* @return None
*/
void nvgpu_init_gr_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for CTXSW.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to CTXSW.
*
* @return None
*/
void nvgpu_init_ctxsw_err_msg(struct nvgpu_err_msg *msg);
/**
* @brief Initialize error message for MMU unit.
*
* @param msg [in] - Error message.
*
* This is used to initialize error message that is specific to MMU unit.
*
* @return None
*/
void nvgpu_init_mmu_err_msg(struct nvgpu_err_msg *msg);
#endif /* CIC_PRIV_H */

View File

@@ -0,0 +1,97 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_ctxsw_err(struct gk20a *g, u32 hw_unit, u32 err_id,
void *data)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
u32 inst = 0;
struct ctxsw_err_info *err_info = (struct ctxsw_err_info *)data;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if (hw_unit != NVGPU_ERR_MODULE_FECS) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for"
" err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_ctxsw_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.ctxsw_info.header.sub_unit_id = inst;
err_pkt.err_info.ctxsw_info.curr_ctx = err_info->curr_ctx;
err_pkt.err_info.ctxsw_info.chid = err_info->chid;
err_pkt.err_info.ctxsw_info.ctxsw_status0 = err_info->ctxsw_status0;
err_pkt.err_info.ctxsw_info.ctxsw_status1 = err_info->ctxsw_status1;
err_pkt.err_info.ctxsw_info.mailbox_value = err_info->mailbox_value;
err_pkt.err_desc = err_desc;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.ctxsw_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report CTXSW error: "
"err_id=%u, mailbox_val=%u",
err_id, err_info->mailbox_value);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_ctxsw_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 inst)
{
struct ctxsw_err_info err_info;
(void)memset(&err_info, ERR_INJECT_TEST_PATTERN, sizeof(err_info));
nvgpu_report_ctxsw_err(g, hw_unit, err_index, (void *)&err_info);
}

View File

@@ -0,0 +1,87 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_ecc_err(struct gk20a *g, u32 hw_unit, u32 inst,
u32 err_id, u64 err_addr, u64 err_count)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_ecc_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.ecc_info.header.sub_unit_id = inst;
err_pkt.err_info.ecc_info.header.address = err_addr;
err_pkt.err_info.ecc_info.err_cnt = err_count;
err_pkt.err_desc = err_desc;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.ecc_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report ECC error: hw_unit=%u, inst=%u, "
"err_id=%u, err_addr=%llu, err_count=%llu",
hw_unit, inst, err_id, err_addr, err_count);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_ecc_swerror(struct gk20a *g, u32 hw_unit, u32 err_index,
u32 inst)
{
u64 err_addr, err_count;
err_addr = (u64)ERR_INJECT_TEST_PATTERN;
err_count = (u64)ERR_INJECT_TEST_PATTERN;
nvgpu_report_ecc_err(g, hw_unit, inst, err_index, err_addr, err_count);
}

View File

@@ -0,0 +1,169 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
static void nvpgu_report_fill_err_info(u32 hw_unit,
struct nvgpu_err_msg *err_pkt, struct gr_err_info *err_info)
{
if (hw_unit == NVGPU_ERR_MODULE_SM) {
struct gr_sm_mcerr_info *info = err_info->sm_mcerr_info;
err_pkt->err_info.sm_info.warp_esr_pc =
info->hww_warp_esr_pc;
err_pkt->err_info.sm_info.warp_esr_status =
info->hww_warp_esr_status;
err_pkt->err_info.sm_info.curr_ctx =
info->curr_ctx;
err_pkt->err_info.sm_info.chid =
info->chid;
err_pkt->err_info.sm_info.tsgid =
info->tsgid;
err_pkt->err_info.sm_info.gpc =
info->gpc;
err_pkt->err_info.sm_info.tpc =
info->tpc;
err_pkt->err_info.sm_info.sm =
info->sm;
} else {
struct gr_exception_info *info = err_info->exception_info;
err_pkt->err_info.gr_info.curr_ctx = info->curr_ctx;
err_pkt->err_info.gr_info.chid = info->chid;
err_pkt->err_info.gr_info.tsgid = info->tsgid;
err_pkt->err_info.gr_info.status = info->status;
}
}
void nvgpu_report_gr_err(struct gk20a *g, u32 hw_unit, u32 inst,
u32 err_id, struct gr_err_info *err_info, u32 sub_err_type)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if ((hw_unit != NVGPU_ERR_MODULE_SM) &&
(hw_unit != NVGPU_ERR_MODULE_PGRAPH)) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_gr_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_desc = err_desc;
err_pkt.err_info.gr_info.header.sub_err_type = sub_err_type;
err_pkt.err_info.gr_info.header.sub_unit_id = inst;
nvpgu_report_fill_err_info(hw_unit, &err_pkt, err_info);
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(sizeof(err_pkt.err_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
if (hw_unit == NVGPU_ERR_MODULE_SM) {
nvgpu_err(g, "Failed to report SM exception"
"gpc=%u, tpc=%u, sm=%u, esr_status=%x",
err_pkt.err_info.sm_info.gpc,
err_pkt.err_info.sm_info.tpc,
err_pkt.err_info.sm_info.sm,
err_pkt.err_info.sm_info.warp_esr_status);
}
if (hw_unit == NVGPU_ERR_MODULE_PGRAPH) {
nvgpu_err(g, "Failed to report PGRAPH"
"exception: inst=%u, err_id=%u, "
"status=%u", inst, err_id,
err_pkt.err_info.gr_info.status);
}
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_gr_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type)
{
struct gr_err_info err_info;
struct gr_exception_info gr_error_info;
struct gr_sm_mcerr_info sm_error_info;
int err = 0;
u32 inst = 0U;
/*
* Fill fixed test pattern data for the error message
* payload.
*/
(void)memset(&gr_error_info, ERR_INJECT_TEST_PATTERN, sizeof(gr_error_info));
(void)memset(&sm_error_info, ERR_INJECT_TEST_PATTERN, sizeof(sm_error_info));
switch (hw_unit) {
case NVGPU_ERR_MODULE_PGRAPH:
{
err_info.exception_info = &gr_error_info;
}
break;
case NVGPU_ERR_MODULE_SM:
{
err_info.sm_mcerr_info = &sm_error_info;
}
break;
default:
{
nvgpu_err(g, "unsupported hw_unit(%u)", hw_unit);
err = -EINVAL;
}
break;
}
if (err != 0) {
return;
}
nvgpu_report_gr_err(g, hw_unit, inst, err_index,
&err_info, sub_err_type);
}

View File

@@ -0,0 +1,91 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_host_err(struct gk20a *g, u32 hw_unit,
u32 inst, u32 err_id, u32 intr_info)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if (hw_unit != NVGPU_ERR_MODULE_HOST) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_host_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.host_info.header.sub_unit_id = inst;
err_pkt.err_desc = err_desc;
/* sub_err_type can be decoded using intr_info by referring
* to the interrupt status register definition corresponding
* to the error that is being reported.
*/
err_pkt.err_info.host_info.header.sub_err_type = intr_info;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.host_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report HOST error: "
"inst=%u, err_id=%u, intr_info=%u",
inst, err_id, intr_info);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_host_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type)
{
nvgpu_report_host_err(g, hw_unit, 0U, err_index, sub_err_type);
}

View File

@@ -0,0 +1,131 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_mmu_err(struct gk20a *g, u32 hw_unit, u32 err_id,
struct mmu_fault_info *fault_info, u32 status, u32 sub_err_type)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if (hw_unit != NVGPU_ERR_MODULE_HUBMMU) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_mmu_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.mmu_info.header.sub_err_type = sub_err_type;
err_pkt.err_info.mmu_info.status = status;
/* Copy contents of mmu_fault_info */
if (fault_info != NULL) {
err_pkt.err_info.mmu_info.info.inst_ptr = fault_info->inst_ptr;
err_pkt.err_info.mmu_info.info.inst_aperture
= fault_info->inst_aperture;
err_pkt.err_info.mmu_info.info.fault_addr
= fault_info->fault_addr;
err_pkt.err_info.mmu_info.info.fault_addr_aperture
= fault_info->fault_addr_aperture;
err_pkt.err_info.mmu_info.info.timestamp_lo
= fault_info->timestamp_lo;
err_pkt.err_info.mmu_info.info.timestamp_hi
= fault_info->timestamp_hi;
err_pkt.err_info.mmu_info.info.mmu_engine_id
= fault_info->mmu_engine_id;
err_pkt.err_info.mmu_info.info.gpc_id = fault_info->gpc_id;
err_pkt.err_info.mmu_info.info.client_type
= fault_info->client_type;
err_pkt.err_info.mmu_info.info.client_id
= fault_info->client_id;
err_pkt.err_info.mmu_info.info.fault_type
= fault_info->fault_type;
err_pkt.err_info.mmu_info.info.access_type
= fault_info->access_type;
err_pkt.err_info.mmu_info.info.protected_mode
= fault_info->protected_mode;
err_pkt.err_info.mmu_info.info.replayable_fault
= fault_info->replayable_fault;
err_pkt.err_info.mmu_info.info.replay_fault_en
= fault_info->replay_fault_en;
err_pkt.err_info.mmu_info.info.valid = fault_info->valid;
err_pkt.err_info.mmu_info.info.faulted_pbdma =
fault_info->faulted_pbdma;
err_pkt.err_info.mmu_info.info.faulted_engine =
fault_info->faulted_engine;
err_pkt.err_info.mmu_info.info.faulted_subid =
fault_info->faulted_subid;
err_pkt.err_info.mmu_info.info.chid = fault_info->chid;
}
err_pkt.err_desc = err_desc;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.mmu_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report MMU fault: hw_unit=%u, "
"err_id=%u, sub_err_type=%u, status=%u",
hw_unit, err_id, sub_err_type, status);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_mmu_swerror(struct gk20a *g, u32 hw_unit, u32 err_index,
u32 sub_err_type)
{
u32 status = 0U;
struct mmu_fault_info fault_info;
(void) memset(&fault_info, ERR_INJECT_TEST_PATTERN, sizeof(fault_info));
nvgpu_report_mmu_err(g, hw_unit, err_index,
&fault_info, status, sub_err_type);
}

View File

@@ -0,0 +1,126 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/string.h>
#include "cic_priv.h"
void nvgpu_init_err_msg_header(struct gpu_err_header *header)
{
header->version.major = (u16)1U;
header->version.minor = (u16)0U;
header->sub_err_type = 0U;
header->sub_unit_id = 0UL;
header->address = 0UL;
header->timestamp_ns = 0UL;
}
void nvgpu_init_err_msg(struct nvgpu_err_msg *msg)
{
(void) memset(msg, 0, sizeof(struct nvgpu_err_msg));
msg->hw_unit_id = 0U;
msg->is_critical = false;
msg->err_id = (u8)0U;
msg->err_size = (u8)0U;
}
void nvgpu_init_host_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.host_info.header);
}
void nvgpu_init_ecc_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.ecc_info.header);
msg->err_info.ecc_info.err_cnt = 0UL;
}
void nvgpu_init_pri_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.pri_info.header);
}
void nvgpu_init_ce_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.ce_info.header);
}
void nvgpu_init_pmu_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.pmu_err_info.header);
msg->err_info.pmu_err_info.status = 0U;
}
void nvgpu_init_gr_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.gr_info.header);
msg->err_info.gr_info.curr_ctx = 0U;
msg->err_info.gr_info.chid = 0U;
msg->err_info.gr_info.tsgid = 0U;
msg->err_info.gr_info.status = 0U;
}
void nvgpu_init_ctxsw_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.ctxsw_info.header);
msg->err_info.ctxsw_info.curr_ctx = 0U;
msg->err_info.ctxsw_info.tsgid = 0U;
msg->err_info.ctxsw_info.chid = 0U;
msg->err_info.ctxsw_info.ctxsw_status0 = 0U;
msg->err_info.ctxsw_info.ctxsw_status1 = 0U;
msg->err_info.ctxsw_info.mailbox_value = 0U;
}
void nvgpu_init_mmu_err_msg(struct nvgpu_err_msg *msg)
{
nvgpu_init_err_msg(msg);
nvgpu_init_err_msg_header(&msg->err_info.mmu_info.header);
msg->err_info.mmu_info.info.inst_ptr = 0UL;
msg->err_info.mmu_info.info.inst_aperture = 0U;
msg->err_info.mmu_info.info.fault_addr = 0UL;
msg->err_info.mmu_info.info.fault_addr_aperture = 0U;
msg->err_info.mmu_info.info.timestamp_lo = 0U;
msg->err_info.mmu_info.info.timestamp_hi = 0U;
msg->err_info.mmu_info.info.mmu_engine_id = 0U;
msg->err_info.mmu_info.info.gpc_id = 0U;
msg->err_info.mmu_info.info.client_type = 0U;
msg->err_info.mmu_info.info.client_id = 0U;
msg->err_info.mmu_info.info.fault_type = 0U;
msg->err_info.mmu_info.info.access_type = 0U;
msg->err_info.mmu_info.info.protected_mode = 0U;
msg->err_info.mmu_info.info.replayable_fault = false;
msg->err_info.mmu_info.info.replay_fault_en = 0U;
msg->err_info.mmu_info.info.valid = false;
msg->err_info.mmu_info.info.faulted_pbdma = 0U;
msg->err_info.mmu_info.info.faulted_engine = 0U;
msg->err_info.mmu_info.info.faulted_subid = 0U;
msg->err_info.mmu_info.info.chid = 0U;
msg->err_info.mmu_info.status = 0U;
}

View File

@@ -0,0 +1,91 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_pmu_err(struct gk20a *g, u32 hw_unit, u32 err_id,
u32 sub_err_type, u32 status)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if (hw_unit != NVGPU_ERR_MODULE_PMU) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_pmu_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.pmu_err_info.status = status;
err_pkt.err_info.pmu_err_info.header.sub_err_type = sub_err_type;
err_pkt.err_desc = err_desc;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.pmu_err_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report PMU error: "
"err_id=%u, sub_err_type=%u, status=%u",
err_id, sub_err_type, status);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_pmu_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 sub_err_type)
{
u32 err_info;
err_info = (u32)ERR_INJECT_TEST_PATTERN;
nvgpu_report_pmu_err(g, hw_unit, err_index, sub_err_type, err_info);
}

View File

@@ -0,0 +1,91 @@
/*
* Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/nvgpu_err_info.h>
#include <nvgpu/cic.h>
#include "cic_priv.h"
void nvgpu_report_pri_err(struct gk20a *g, u32 hw_unit, u32 inst,
u32 err_id, u32 err_addr, u32 err_code)
{
int err = 0;
struct nvgpu_err_desc *err_desc = NULL;
struct nvgpu_err_msg err_pkt;
if (g->ops.cic.report_err == NULL) {
cic_dbg(g, "CIC does not support reporting error "
"to safety services");
return;
}
if (hw_unit != NVGPU_ERR_MODULE_PRI) {
nvgpu_err(g, "invalid hw module (%u)", hw_unit);
err = -EINVAL;
goto handle_report_failure;
}
err = nvgpu_cic_get_err_desc(g, hw_unit, err_id, &err_desc);
if (err != 0) {
nvgpu_err(g, "Failed to get err_desc for "
"err_id (%u) for hw module (%u)",
err_id, hw_unit);
goto handle_report_failure;
}
nvgpu_init_pri_err_msg(&err_pkt);
err_pkt.hw_unit_id = hw_unit;
err_pkt.err_id = err_desc->error_id;
err_pkt.is_critical = err_desc->is_critical;
err_pkt.err_info.pri_info.header.sub_unit_id = inst;
err_pkt.err_info.pri_info.header.address = (u64) err_addr;
err_pkt.err_desc = err_desc;
/* sub_err_type can be decoded using err_code by referring
* to the FECS pri error codes.
*/
err_pkt.err_info.pri_info.header.sub_err_type = err_code;
err_pkt.err_size = nvgpu_safe_cast_u64_to_u8(
sizeof(err_pkt.err_info.pri_info));
if (g->ops.cic.report_err != NULL) {
err = g->ops.cic.report_err(g, (void *)&err_pkt,
sizeof(err_pkt), err_desc->is_critical);
if (err != 0) {
nvgpu_err(g, "Failed to report PRI error: "
"inst=%u, err_id=%u, err_code=%u",
inst, err_id, err_code);
}
}
handle_report_failure:
if (err != 0) {
nvgpu_sw_quiesce(g);
}
}
void nvgpu_inject_pri_swerror(struct gk20a *g, u32 hw_unit,
u32 err_index, u32 err_code)
{
nvgpu_report_pri_err(g, hw_unit, 0U, err_index, 0U, err_code);
}

View File

@@ -0,0 +1,826 @@
/*
* Copyright (c) 2016-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/bitops.h>
#include <nvgpu/lock.h>
#include <nvgpu/kmem.h>
#include <nvgpu/atomic.h>
#include <nvgpu/bug.h>
#include <nvgpu/kref.h>
#include <nvgpu/log.h>
#include <nvgpu/barrier.h>
#include <nvgpu/cond.h>
#include <nvgpu/list.h>
#include <nvgpu/clk_arb.h>
#include <nvgpu/timers.h>
#include <nvgpu/worker.h>
#include <nvgpu/gk20a.h>
#ifdef CONFIG_NVGPU_LS_PMU
#include <nvgpu/pmu/clk/clk.h>
#include <nvgpu/pmu/perf.h>
#include <nvgpu/pmu/volt.h>
#endif
#include <nvgpu/boardobjgrp_e255.h>
int nvgpu_clk_notification_queue_alloc(struct gk20a *g,
struct nvgpu_clk_notification_queue *queue,
u32 events_number) {
queue->clk_q_notifications = nvgpu_kcalloc(g, events_number,
sizeof(struct nvgpu_clk_notification));
if (queue->clk_q_notifications == NULL) {
return -ENOMEM;
}
queue->size = events_number;
nvgpu_atomic_set(&queue->head, 0);
nvgpu_atomic_set(&queue->tail, 0);
return 0;
}
void nvgpu_clk_notification_queue_free(struct gk20a *g,
struct nvgpu_clk_notification_queue *queue) {
if (queue->size > 0U) {
nvgpu_kfree(g, queue->clk_q_notifications);
queue->size = 0;
nvgpu_atomic_set(&queue->head, 0);
nvgpu_atomic_set(&queue->tail, 0);
}
}
static void nvgpu_clk_arb_queue_notification(struct gk20a *g,
struct nvgpu_clk_notification_queue *queue,
u32 alarm_mask) {
u32 queue_index;
u64 timestamp = 0U;
queue_index = U32(nvgpu_atomic_inc_return(&queue->tail)) % queue->size;
#ifdef CONFIG_NVGPU_NON_FUSA
/* get current timestamp */
timestamp = (u64) nvgpu_hr_timestamp();
#endif
queue->clk_q_notifications[queue_index].timestamp = timestamp;
queue->clk_q_notifications[queue_index].clk_notification = alarm_mask;
}
void nvgpu_clk_arb_set_global_alarm(struct gk20a *g, u32 alarm)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
u64 current_mask;
u32 refcnt;
u32 alarm_mask;
u64 new_mask;
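/*
* The 64-bit alarm_mask packs an update counter (refcnt) in the upper
* 32 bits and the accumulated alarm bits in the lower 32 bits. The
* cmpxchg loop retries until the combined word is stored without
* dropping bits set by a concurrent writer.
*/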
do {
current_mask = (u64)nvgpu_atomic64_read(&arb->alarm_mask);
/* atomic operations are strong so they do not need masks */
refcnt = ((u32) (current_mask >> 32)) + 1U;
alarm_mask = (u32) (current_mask & ~U32(0)) | alarm;
new_mask = ((u64) refcnt << 32) | alarm_mask;
} while (unlikely(current_mask !=
(u64)nvgpu_atomic64_cmpxchg(&arb->alarm_mask,
(long int)current_mask, (long int)new_mask)));
nvgpu_clk_arb_queue_notification(g, &arb->notification_queue, alarm);
}
#ifdef CONFIG_NVGPU_LS_PMU
int nvgpu_clk_arb_update_vf_table(struct nvgpu_clk_arb *arb)
{
struct gk20a *g = arb->g;
struct nvgpu_clk_vf_table *table;
u32 i, j;
int status = -EINVAL;
u16 clk_cur;
u32 num_points;
struct nvgpu_pmu_perf_pstate_clk_info *p0_info;
table = NV_READ_ONCE(arb->current_vf_table);
/* make flag visible when all data has resolved in the tables */
nvgpu_smp_rmb();
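/*
* Build the new table in the pool entry that is not currently
* published; it becomes visible only when arb->current_vf_table is
* switched at the end of this function.
*/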
table = (table == &arb->vf_table_pool[0]) ? &arb->vf_table_pool[1] :
&arb->vf_table_pool[0];
/* Get allowed memory ranges */
if (g->ops.clk_arb.get_arbiter_clk_range(g, CTRL_CLK_DOMAIN_GPCCLK,
&arb->gpc2clk_min,
&arb->gpc2clk_max) < 0) {
nvgpu_err(g, "failed to fetch GPC2CLK range");
goto exit_vf_table;
}
if (g->ops.clk_arb.get_arbiter_clk_range(g, CTRL_CLK_DOMAIN_MCLK,
&arb->mclk_min,
&arb->mclk_max) < 0) {
nvgpu_err(g, "failed to fetch MCLK range");
goto exit_vf_table;
}
table->gpc2clk_num_points = MAX_F_POINTS;
table->mclk_num_points = MAX_F_POINTS;
if (g->ops.clk.clk_domain_get_f_points(arb->g, CTRL_CLK_DOMAIN_GPCCLK,
&table->gpc2clk_num_points, arb->gpc2clk_f_points)) {
nvgpu_err(g, "failed to fetch GPC2CLK frequency points");
goto exit_vf_table;
}
if (!table->gpc2clk_num_points) {
nvgpu_err(g, "empty queries to f points gpc2clk %d", table->gpc2clk_num_points);
status = -EINVAL;
goto exit_vf_table;
}
(void) memset(table->gpc2clk_points, 0,
table->gpc2clk_num_points*sizeof(struct nvgpu_clk_vf_point));
p0_info = nvgpu_pmu_perf_pstate_get_clk_set_info(g,
CTRL_PERF_PSTATE_P0, CLKWHICH_GPCCLK);
if (!p0_info) {
status = -EINVAL;
nvgpu_err(g, "failed to get GPC2CLK P0 info");
goto exit_vf_table;
}
/* GPC2CLK needs to be checked in two passes. The first determines the
* relationships between GPC2CLK, SYS2CLK and XBAR2CLK, while the
* second verifies that the clock minimums are satisfied and sets
* the voltages; the latter part is done in nvgpu_pmu_perf_changeseq_set_clks.
*/
j = 0; num_points = 0; clk_cur = 0;
for (i = 0; i < table->gpc2clk_num_points; i++) {
struct nvgpu_clk_slave_freq setfllclk;
if ((arb->gpc2clk_f_points[i] >= arb->gpc2clk_min) &&
(arb->gpc2clk_f_points[i] <= arb->gpc2clk_max) &&
(arb->gpc2clk_f_points[i] != clk_cur)) {
table->gpc2clk_points[j].gpc_mhz =
arb->gpc2clk_f_points[i];
setfllclk.gpc_mhz = arb->gpc2clk_f_points[i];
status = clk_get_fll_clks_per_clk_domain(g, &setfllclk);
if (status < 0) {
nvgpu_err(g,
"failed to get GPC2CLK slave clocks");
goto exit_vf_table;
}
table->gpc2clk_points[j].sys_mhz =
setfllclk.sys_mhz;
table->gpc2clk_points[j].xbar_mhz =
setfllclk.xbar_mhz;
table->gpc2clk_points[j].nvd_mhz =
setfllclk.nvd_mhz;
table->gpc2clk_points[j].host_mhz =
setfllclk.host_mhz;
clk_cur = table->gpc2clk_points[j].gpc_mhz;
if ((clk_cur >= p0_info->min_mhz) &&
(clk_cur <= p0_info->max_mhz)) {
VF_POINT_SET_PSTATE_SUPPORTED(
&table->gpc2clk_points[j],
CTRL_PERF_PSTATE_P0);
}
j++;
num_points++;
}
}
table->gpc2clk_num_points = num_points;
/* make table visible when all data has resolved in the tables */
nvgpu_smp_wmb();
arb->current_vf_table = table;
exit_vf_table:
if (status < 0) {
nvgpu_clk_arb_set_global_alarm(g,
EVENT(ALARM_VF_TABLE_UPDATE_FAILED));
}
nvgpu_clk_arb_worker_enqueue(g, &arb->update_arb_work_item);
return status;
}
static void nvgpu_clk_arb_run_vf_table_cb(struct nvgpu_clk_arb *arb)
{
struct gk20a *g = arb->g;
int err;
/* get latest vf curve from pmu */
err = nvgpu_clk_vf_point_cache(g);
if (err != 0) {
nvgpu_err(g, "failed to cache VF table");
nvgpu_clk_arb_set_global_alarm(g,
EVENT(ALARM_VF_TABLE_UPDATE_FAILED));
nvgpu_clk_arb_worker_enqueue(g, &arb->update_arb_work_item);
return;
}
nvgpu_clk_arb_update_vf_table(arb);
}
#endif
u32 nvgpu_clk_arb_notify(struct nvgpu_clk_dev *dev,
struct nvgpu_clk_arb_target *target,
u32 alarm) {
struct nvgpu_clk_session *session = dev->session;
struct nvgpu_clk_arb *arb = session->g->clk_arb;
struct nvgpu_clk_notification *l_notification;
u32 queue_alarm_mask = 0;
u32 enabled_mask = 0;
u32 new_alarms_reported = 0;
u32 poll_mask = 0;
u32 tail, head, index;
u32 queue_index;
size_t size;
enabled_mask = (u32)nvgpu_atomic_read(&dev->enabled_mask);
size = arb->notification_queue.size;
/* queue global arbiter notifications in buffer */
do {
tail = (u32)nvgpu_atomic_read(&arb->notification_queue.tail);
/* copy items to the queue */
queue_index = (u32)nvgpu_atomic_read(&dev->queue.tail);
head = dev->arb_queue_head;
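/*
* If this device has fallen behind by more than the queue size,
* skip ahead so only entries still present in the ring are copied.
*/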
head = (tail - head) < arb->notification_queue.size ?
head : tail - arb->notification_queue.size;
for (index = head; WRAPGTEQ(tail, index); index++) {
u32 alarm_detected;
l_notification = &arb->notification_queue.
clk_q_notifications[((u64)index + 1ULL) % size];
alarm_detected = NV_READ_ONCE(
l_notification->clk_notification);
if ((enabled_mask & alarm_detected) == 0U) {
continue;
}
queue_index++;
dev->queue.clk_q_notifications[
queue_index % dev->queue.size].timestamp =
NV_READ_ONCE(l_notification->timestamp);
dev->queue.clk_q_notifications[queue_index %
dev->queue.size].clk_notification =
alarm_detected;
queue_alarm_mask |= alarm_detected;
}
} while (unlikely(nvgpu_atomic_read(&arb->notification_queue.tail) !=
(int)tail));
nvgpu_atomic_set(&dev->queue.tail, (int)queue_index);
/* update the last notification we processed from global queue */
dev->arb_queue_head = tail;
/* Check if current session targets are met */
if ((enabled_mask & EVENT(ALARM_LOCAL_TARGET_VF_NOT_POSSIBLE)) != 0U) {
if ((target->gpc2clk < session->target->gpc2clk)
|| (target->mclk < session->target->mclk)) {
poll_mask |= (NVGPU_POLLIN | NVGPU_POLLPRI);
nvgpu_clk_arb_queue_notification(arb->g, &dev->queue,
EVENT(ALARM_LOCAL_TARGET_VF_NOT_POSSIBLE));
}
}
/* Check if there is a new VF update */
if ((queue_alarm_mask & EVENT(VF_UPDATE)) != 0U) {
poll_mask |= (NVGPU_POLLIN | NVGPU_POLLRDNORM);
}
/* Notify sticky alarms that were not reported on previous run*/
new_alarms_reported = (queue_alarm_mask |
(alarm & ~dev->alarms_reported & queue_alarm_mask));
if ((new_alarms_reported & ~LOCAL_ALARM_MASK) != 0U) {
/* check that we are not re-reporting */
if ((new_alarms_reported & EVENT(ALARM_GPU_LOST)) != 0U) {
poll_mask |= NVGPU_POLLHUP;
}
poll_mask |= (NVGPU_POLLIN | NVGPU_POLLPRI);
/* On next run do not report global alarms that were already
* reported, but report SHUTDOWN always
*/
dev->alarms_reported = new_alarms_reported & ~LOCAL_ALARM_MASK &
~EVENT(ALARM_GPU_LOST);
}
if (poll_mask != 0U) {
nvgpu_atomic_set(&dev->poll_mask, (int)poll_mask);
nvgpu_clk_arb_event_post_event(dev);
}
return new_alarms_reported;
}
void nvgpu_clk_arb_clear_global_alarm(struct gk20a *g, u32 alarm)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
u64 current_mask;
u32 refcnt;
u32 alarm_mask;
u64 new_mask;
do {
current_mask = (u64)nvgpu_atomic64_read(&arb->alarm_mask);
/* atomic operations are strong so they do not need masks */
refcnt = ((u32) (current_mask >> 32)) + 1U;
alarm_mask = (u32) ((u32)current_mask & ~alarm);
new_mask = ((u64) refcnt << 32) | alarm_mask;
} while (unlikely(current_mask !=
(u64)nvgpu_atomic64_cmpxchg(&arb->alarm_mask,
(long int)current_mask, (long int)new_mask)));
}
/*
* Process one scheduled work item.
*/
static void nvgpu_clk_arb_worker_poll_wakeup_process_item(
struct nvgpu_list_node *work_item)
{
struct nvgpu_clk_arb_work_item *clk_arb_work_item =
nvgpu_clk_arb_work_item_from_worker_item(work_item);
struct gk20a *g = clk_arb_work_item->arb->g;
clk_arb_dbg(g, " ");
if (clk_arb_work_item->item_type == CLK_ARB_WORK_UPDATE_VF_TABLE) {
#ifdef CONFIG_NVGPU_LS_PMU
nvgpu_clk_arb_run_vf_table_cb(clk_arb_work_item->arb);
#endif
} else {
if (clk_arb_work_item->item_type == CLK_ARB_WORK_UPDATE_ARB) {
g->ops.clk_arb.clk_arb_run_arbiter_cb(
clk_arb_work_item->arb);
}
}
}
static void nvgpu_clk_arb_worker_poll_init(struct nvgpu_worker *worker)
{
clk_arb_dbg(worker->g, " ");
}
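/*
* Worker callbacks for the clk arbiter background thread: queued work
* items either refresh the VF table or run the arbitration callback.
*/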
const struct nvgpu_worker_ops clk_arb_worker_ops = {
.pre_process = nvgpu_clk_arb_worker_poll_init,
.wakeup_early_exit = nvgpu_worker_should_stop,
.wakeup_post_process = NULL,
.wakeup_process_item =
nvgpu_clk_arb_worker_poll_wakeup_process_item,
.wakeup_condition =
nvgpu_worker_should_stop,
.wakeup_timeout = NULL,
};
/**
* Append a work item to the worker's list.
*
 * This adds the work item to the end of the list and wakes the worker
 * up immediately. If the work item already exists in the list, it is not added,
* because in that case it has been scheduled already but has not yet been
* processed.
*/
void nvgpu_clk_arb_worker_enqueue(struct gk20a *g,
struct nvgpu_clk_arb_work_item *work_item)
{
clk_arb_dbg(g, " ");
(void)nvgpu_worker_enqueue(&g->clk_arb_worker.worker,
&work_item->worker_item);
}
/**
* Initialize the clk arb worker's metadata and start the background thread.
*/
int nvgpu_clk_arb_worker_init(struct gk20a *g)
{
struct nvgpu_worker *worker = &g->clk_arb_worker.worker;
nvgpu_worker_init_name(worker, "nvgpu_clk_arb_poll", g->name);
return nvgpu_worker_init(g, worker, &clk_arb_worker_ops);
}
int nvgpu_clk_arb_init_arbiter(struct gk20a *g)
{
int err = 0;
if (g->ops.clk_arb.check_clk_arb_support != NULL) {
if (!g->ops.clk_arb.check_clk_arb_support(g)) {
return 0;
}
} else {
return 0;
}
nvgpu_mutex_acquire(&g->clk_arb_enable_lock);
err = g->ops.clk_arb.arbiter_clk_init(g);
nvgpu_mutex_release(&g->clk_arb_enable_lock);
return err;
}
bool nvgpu_clk_arb_has_active_req(struct gk20a *g)
{
return (nvgpu_atomic_read(&g->clk_arb_global_nr) > 0);
}
static void nvgpu_clk_arb_schedule_alarm(struct gk20a *g, u32 alarm)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
nvgpu_clk_arb_set_global_alarm(g, alarm);
nvgpu_clk_arb_worker_enqueue(g, &arb->update_arb_work_item);
}
void nvgpu_clk_arb_send_thermal_alarm(struct gk20a *g)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
if (arb != NULL) {
nvgpu_clk_arb_schedule_alarm(g,
BIT32(NVGPU_EVENT_ALARM_THERMAL_ABOVE_THRESHOLD));
}
}
void nvgpu_clk_arb_worker_deinit(struct gk20a *g)
{
struct nvgpu_worker *worker = &g->clk_arb_worker.worker;
nvgpu_worker_deinit(worker);
}
void nvgpu_clk_arb_cleanup_arbiter(struct gk20a *g)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
nvgpu_mutex_acquire(&g->clk_arb_enable_lock);
if (arb != NULL) {
g->ops.clk_arb.clk_arb_cleanup(g->clk_arb);
}
nvgpu_mutex_release(&g->clk_arb_enable_lock);
}
int nvgpu_clk_arb_init_session(struct gk20a *g,
struct nvgpu_clk_session **l_session)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
struct nvgpu_clk_session *session = *(l_session);
clk_arb_dbg(g, " ");
if (g->ops.clk_arb.check_clk_arb_support != NULL) {
if (!g->ops.clk_arb.check_clk_arb_support(g)) {
return 0;
}
} else {
return 0;
}
session = nvgpu_kzalloc(g, sizeof(struct nvgpu_clk_session));
if (session == NULL) {
return -ENOMEM;
}
session->g = g;
nvgpu_ref_init(&session->refcount);
session->zombie = false;
session->target_pool[0].pstate = CTRL_PERF_PSTATE_P8;
/* make sure that the initialization of the pool is visible
* before the update
*/
nvgpu_smp_wmb();
session->target = &session->target_pool[0];
nvgpu_init_list_node(&session->targets);
nvgpu_spinlock_init(&session->session_lock);
nvgpu_spinlock_acquire(&arb->sessions_lock);
nvgpu_list_add_tail(&session->link, &arb->sessions);
nvgpu_spinlock_release(&arb->sessions_lock);
*l_session = session;
return 0;
}
static struct nvgpu_clk_dev *
nvgpu_clk_dev_from_refcount(struct nvgpu_ref *refcount)
{
return (struct nvgpu_clk_dev *)
((uintptr_t)refcount - offsetof(struct nvgpu_clk_dev, refcount));
};
void nvgpu_clk_arb_free_fd(struct nvgpu_ref *refcount)
{
struct nvgpu_clk_dev *dev = nvgpu_clk_dev_from_refcount(refcount);
struct nvgpu_clk_session *session = dev->session;
struct gk20a *g = session->g;
nvgpu_clk_notification_queue_free(g, &dev->queue);
nvgpu_atomic_dec(&g->clk_arb_global_nr);
nvgpu_kfree(g, dev);
}
static struct nvgpu_clk_session *
nvgpu_clk_session_from_refcount(struct nvgpu_ref *refcount)
{
return (struct nvgpu_clk_session *)
((uintptr_t)refcount - offsetof(struct nvgpu_clk_session, refcount));
};
void nvgpu_clk_arb_free_session(struct nvgpu_ref *refcount)
{
struct nvgpu_clk_session *session =
nvgpu_clk_session_from_refcount(refcount);
struct nvgpu_clk_arb *arb = session->g->clk_arb;
struct gk20a *g = session->g;
struct nvgpu_clk_dev *dev, *tmp;
clk_arb_dbg(g, " ");
if (arb != NULL) {
nvgpu_spinlock_acquire(&arb->sessions_lock);
nvgpu_list_del(&session->link);
nvgpu_spinlock_release(&arb->sessions_lock);
}
nvgpu_spinlock_acquire(&session->session_lock);
nvgpu_list_for_each_entry_safe(dev, tmp, &session->targets,
nvgpu_clk_dev, node) {
nvgpu_ref_put(&dev->refcount, nvgpu_clk_arb_free_fd);
nvgpu_list_del(&dev->node);
}
nvgpu_spinlock_release(&session->session_lock);
nvgpu_kfree(g, session);
}
void nvgpu_clk_arb_release_session(struct gk20a *g,
struct nvgpu_clk_session *session)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
clk_arb_dbg(g, " ");
session->zombie = true;
nvgpu_ref_put(&session->refcount, nvgpu_clk_arb_free_session);
if (arb != NULL) {
nvgpu_clk_arb_worker_enqueue(g, &arb->update_arb_work_item);
}
}
#ifdef CONFIG_NVGPU_LS_PMU
void nvgpu_clk_arb_schedule_vf_table_update(struct gk20a *g)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
nvgpu_clk_arb_worker_enqueue(g, &arb->update_vf_table_work_item);
}
/* This function is inherently unsafe to call while the arbiter is running;
 * the arbiter must be blocked before calling this function.
*/
u32 nvgpu_clk_arb_get_current_pstate(struct gk20a *g)
{
return NV_READ_ONCE(g->clk_arb->actual->pstate);
}
void nvgpu_clk_arb_pstate_change_lock(struct gk20a *g, bool lock)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
if (lock) {
nvgpu_mutex_acquire(&arb->pstate_lock);
} else {
nvgpu_mutex_release(&arb->pstate_lock);
}
}
#endif
bool nvgpu_clk_arb_is_valid_domain(struct gk20a *g, u32 api_domain)
{
u32 clk_domains = g->ops.clk_arb.get_arbiter_clk_domains(g);
bool ret_result = false;
switch (api_domain) {
case NVGPU_CLK_DOMAIN_MCLK:
ret_result = ((clk_domains & CTRL_CLK_DOMAIN_MCLK) != 0U) ?
true : false;
break;
case NVGPU_CLK_DOMAIN_GPCCLK:
ret_result = ((clk_domains & CTRL_CLK_DOMAIN_GPCCLK) != 0U) ?
true : false;
break;
default:
ret_result = false;
break;
}
return ret_result;
}
int nvgpu_clk_arb_get_arbiter_clk_range(struct gk20a *g, u32 api_domain,
u16 *min_mhz, u16 *max_mhz)
{
int ret = -EINVAL;
switch (api_domain) {
case NVGPU_CLK_DOMAIN_MCLK:
ret = g->ops.clk_arb.get_arbiter_clk_range(g,
CTRL_CLK_DOMAIN_MCLK, min_mhz, max_mhz);
break;
case NVGPU_CLK_DOMAIN_GPCCLK:
ret = g->ops.clk_arb.get_arbiter_clk_range(g,
CTRL_CLK_DOMAIN_GPCCLK, min_mhz, max_mhz);
break;
default:
ret = -EINVAL;
break;
}
return ret;
}
int nvgpu_clk_arb_get_arbiter_clk_f_points(struct gk20a *g,
u32 api_domain, u32 *max_points, u16 *fpoints)
{
int err = -EINVAL;
switch (api_domain) {
case NVGPU_CLK_DOMAIN_GPCCLK:
err = g->ops.clk_arb.get_arbiter_f_points(g,
CTRL_CLK_DOMAIN_GPCCLK, max_points, fpoints);
if ((err != 0) || (fpoints == NULL)) {
break;
}
err = 0;
break;
case NVGPU_CLK_DOMAIN_MCLK:
err = g->ops.clk_arb.get_arbiter_f_points(g,
CTRL_CLK_DOMAIN_MCLK, max_points, fpoints);
break;
default:
err = -EINVAL;
break;
}
return err;
}
int nvgpu_clk_arb_get_session_target_mhz(struct nvgpu_clk_session *session,
u32 api_domain, u16 *target_mhz)
{
int err = 0;
struct nvgpu_clk_arb_target *target = session->target;
if (!nvgpu_clk_arb_is_valid_domain(session->g, api_domain)) {
return -EINVAL;
}
switch (api_domain) {
case NVGPU_CLK_DOMAIN_MCLK:
*target_mhz = target->mclk;
break;
case NVGPU_CLK_DOMAIN_GPCCLK:
*target_mhz = target->gpc2clk;
break;
default:
*target_mhz = 0;
err = -EINVAL;
break;
}
return err;
}
int nvgpu_clk_arb_get_arbiter_actual_mhz(struct gk20a *g,
u32 api_domain, u16 *actual_mhz)
{
struct nvgpu_clk_arb *arb = g->clk_arb;
int err = 0;
struct nvgpu_clk_arb_target *actual = arb->actual;
if (!nvgpu_clk_arb_is_valid_domain(g, api_domain)) {
return -EINVAL;
}
switch (api_domain) {
case NVGPU_CLK_DOMAIN_MCLK:
*actual_mhz = actual->mclk;
break;
case NVGPU_CLK_DOMAIN_GPCCLK:
*actual_mhz = actual->gpc2clk;
break;
default:
*actual_mhz = 0;
err = -EINVAL;
break;
}
return err;
}
unsigned long nvgpu_clk_measure_freq(struct gk20a *g, u32 api_domain)
{
unsigned long freq = 0UL;
switch (api_domain) {
/*
* In case of iGPU, clocks to each partition (GPC, SYS, LTC, XBAR) are
* generated using 1X GPCCLK and hence should be the same.
*/
case CTRL_CLK_DOMAIN_GPCCLK:
case CTRL_CLK_DOMAIN_SYSCLK:
case CTRL_CLK_DOMAIN_XBARCLK:
freq = g->ops.clk.get_rate(g, CTRL_CLK_DOMAIN_GPCCLK);
break;
default:
freq = 0UL;
break;
}
return freq;
}
int nvgpu_clk_arb_get_arbiter_effective_mhz(struct gk20a *g,
u32 api_domain, u16 *effective_mhz)
{
u64 freq_mhz_u64;
int err = -EINVAL;
if (!nvgpu_clk_arb_is_valid_domain(g, api_domain)) {
return -EINVAL;
}
switch (api_domain) {
case NVGPU_CLK_DOMAIN_MCLK:
freq_mhz_u64 = g->ops.clk.measure_freq(g,
CTRL_CLK_DOMAIN_MCLK) / 1000000ULL;
err = 0;
break;
case NVGPU_CLK_DOMAIN_GPCCLK:
freq_mhz_u64 = g->ops.clk.measure_freq(g,
CTRL_CLK_DOMAIN_GPCCLK) / 1000000ULL;
err = 0;
break;
default:
err = -EINVAL;
break;
}
if (err == 0) {
nvgpu_assert(freq_mhz_u64 <= (u64)U16_MAX);
*effective_mhz = (u16)freq_mhz_u64;
}
return err;
}

View File

@@ -0,0 +1,406 @@
/*
* Copyright (c) 2018-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/clk_arb.h>
#include <nvgpu/pmu/clk/clk.h>
#include "clk_arb_gp10b.h"
bool gp10b_check_clk_arb_support(struct gk20a *g)
{
if (g->ops.clk_arb.get_arbiter_clk_domains != NULL) {
return true;
} else {
return false;
}
}
u32 gp10b_get_arbiter_clk_domains(struct gk20a *g)
{
(void)g;
clk_arb_dbg(g, " ");
return CTRL_CLK_DOMAIN_GPCCLK;
}
int gp10b_get_arbiter_f_points(struct gk20a *g, u32 api_domain,
u32 *num_points, u16 *freqs_in_mhz)
{
int ret = 0;
clk_arb_dbg(g, " ");
switch (api_domain) {
case CTRL_CLK_DOMAIN_GPCCLK:
ret = g->ops.clk.clk_domain_get_f_points(g, CTRL_CLK_DOMAIN_GPCCLK,
num_points, freqs_in_mhz);
break;
default:
ret = -EINVAL;
break;
}
return ret;
}
int gp10b_get_arbiter_clk_range(struct gk20a *g, u32 api_domain,
u16 *min_mhz, u16 *max_mhz)
{
int ret = 0;
clk_arb_dbg(g, " ");
switch (api_domain) {
case CTRL_CLK_DOMAIN_GPCCLK:
ret = g->ops.clk.get_clk_range(g, CTRL_CLK_DOMAIN_GPCCLK,
min_mhz, max_mhz);
break;
default:
ret = -EINVAL;
break;
}
return ret;
}
int gp10b_get_arbiter_clk_default(struct gk20a *g, u32 api_domain,
u16 *default_mhz)
{
int ret = 0;
u16 min_mhz, max_mhz;
clk_arb_dbg(g, " ");
switch (api_domain) {
case CTRL_CLK_DOMAIN_GPCCLK:
ret = gp10b_get_arbiter_clk_range(g, api_domain,
&min_mhz, &max_mhz);
if (ret == 0) {
*default_mhz = max_mhz;
}
break;
default:
ret = -EINVAL;
break;
}
return ret;
}
int gp10b_init_clk_arbiter(struct gk20a *g)
{
struct nvgpu_clk_arb *arb = NULL;
u16 default_mhz;
int err;
int index;
struct nvgpu_clk_vf_table *table;
clk_arb_dbg(g, " ");
if (g->clk_arb != NULL) {
return 0;
}
arb = nvgpu_kzalloc(g, sizeof(struct nvgpu_clk_arb));
if (arb == NULL) {
return -ENOMEM;
}
nvgpu_mutex_init(&arb->pstate_lock);
nvgpu_spinlock_init(&arb->sessions_lock);
nvgpu_spinlock_init(&arb->users_lock);
nvgpu_spinlock_init(&arb->requests_lock);
arb->gpc2clk_f_points = nvgpu_kcalloc(g, MAX_F_POINTS, sizeof(u16));
if (arb->gpc2clk_f_points == NULL) {
err = -ENOMEM;
goto init_fail;
}
for (index = 0; index < 2; index++) {
table = &arb->vf_table_pool[index];
table->gpc2clk_num_points = MAX_F_POINTS;
table->gpc2clk_points = (struct nvgpu_clk_vf_point *)
nvgpu_kcalloc(g, MAX_F_POINTS,
sizeof(struct nvgpu_clk_vf_point));
if (table->gpc2clk_points == NULL) {
err = -ENOMEM;
goto init_fail;
}
}
g->clk_arb = arb;
arb->g = g;
err = g->ops.clk_arb.get_arbiter_clk_default(g,
CTRL_CLK_DOMAIN_GPCCLK, &default_mhz);
if (err < 0) {
err = -EINVAL;
goto init_fail;
}
arb->gpc2clk_default_mhz = default_mhz;
err = g->ops.clk_arb.get_arbiter_clk_range(g, CTRL_CLK_DOMAIN_GPCCLK,
&arb->gpc2clk_min, &arb->gpc2clk_max);
if (err < 0) {
err = -EINVAL;
goto init_fail;
}
arb->actual = &arb->actual_pool[0];
nvgpu_atomic_set(&arb->req_nr, 0);
nvgpu_atomic64_set(&arb->alarm_mask, 0);
err = nvgpu_clk_notification_queue_alloc(g, &arb->notification_queue,
DEFAULT_EVENT_NUMBER);
if (err < 0) {
goto init_fail;
}
nvgpu_init_list_node(&arb->users);
nvgpu_init_list_node(&arb->sessions);
nvgpu_init_list_node(&arb->requests);
err = nvgpu_cond_init(&arb->request_wq);
if (err < 0) {
goto init_fail;
}
nvgpu_init_list_node(&arb->update_arb_work_item.worker_item);
arb->update_arb_work_item.arb = arb;
arb->update_arb_work_item.item_type = CLK_ARB_WORK_UPDATE_ARB;
err = nvgpu_clk_arb_worker_init(g);
if (err < 0) {
goto init_fail;
}
/* This is set for the duration of the default req */
nvgpu_atomic_inc(&g->clk_arb_global_nr);
nvgpu_clk_arb_worker_enqueue(g, &arb->update_arb_work_item);
do {
/* Check that first run is completed */
nvgpu_smp_mb();
NVGPU_COND_WAIT_INTERRUPTIBLE(&arb->request_wq,
nvgpu_atomic_read(&arb->req_nr) != 0, 0U);
} while (nvgpu_atomic_read(&arb->req_nr) == 0);
/* Once the default request is completed, reduce the usage count */
nvgpu_atomic_dec(&g->clk_arb_global_nr);
return arb->status;
init_fail:
nvgpu_kfree(g, arb->gpc2clk_f_points);
for (index = 0; index < 2; index++) {
nvgpu_kfree(g, arb->vf_table_pool[index].gpc2clk_points);
}
nvgpu_mutex_destroy(&arb->pstate_lock);
nvgpu_kfree(g, arb);
return err;
}
void gp10b_clk_arb_run_arbiter_cb(struct nvgpu_clk_arb *arb)
{
struct nvgpu_clk_session *session;
struct nvgpu_clk_dev *dev;
struct nvgpu_clk_dev *tmp;
struct nvgpu_clk_arb_target *target, *actual;
struct gk20a *g = arb->g;
bool gpc2clk_set;
int status = 0;
unsigned long rounded_rate = 0;
u16 gpc2clk_target, gpc2clk_session_target;
clk_arb_dbg(g, " ");
/* Only one arbiter should be running */
gpc2clk_target = 0;
nvgpu_spinlock_acquire(&arb->sessions_lock);
nvgpu_list_for_each_entry(session, &arb->sessions,
nvgpu_clk_session, link) {
if (session->zombie) {
continue;
}
gpc2clk_set = false;
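/*
* Stage the session's new request in the target_pool entry that is
* not currently published as session->target, so readers always see
* a consistent target while the new one is being built.
*/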
target = (session->target == &session->target_pool[0] ?
&session->target_pool[1] :
&session->target_pool[0]);
nvgpu_spinlock_acquire(&session->session_lock);
if (!nvgpu_list_empty(&session->targets)) {
/* Copy over state */
target->gpc2clk = session->target->gpc2clk;
/* Query the latest committed request */
nvgpu_list_for_each_entry_safe(dev, tmp, &session->targets,
nvgpu_clk_dev, node) {
if (!gpc2clk_set &&
dev->gpc2clk_target_mhz != (u16)0) {
target->gpc2clk =
dev->gpc2clk_target_mhz;
gpc2clk_set = true;
}
nvgpu_ref_get(&dev->refcount);
nvgpu_list_del(&dev->node);
nvgpu_spinlock_acquire(&arb->requests_lock);
nvgpu_list_add(&dev->node, &arb->requests);
nvgpu_spinlock_release(&arb->requests_lock);
}
session->target = target;
}
nvgpu_spinlock_release(&session->session_lock);
gpc2clk_target =
gpc2clk_target > session->target->gpc2clk ?
gpc2clk_target : session->target->gpc2clk;
}
nvgpu_spinlock_release(&arb->sessions_lock);
gpc2clk_target = (gpc2clk_target > (u16)0) ? gpc2clk_target :
arb->gpc2clk_default_mhz;
if (gpc2clk_target < arb->gpc2clk_min) {
gpc2clk_target = arb->gpc2clk_min;
}
if (gpc2clk_target > arb->gpc2clk_max) {
gpc2clk_target = arb->gpc2clk_max;
}
gpc2clk_session_target = gpc2clk_target;
if (arb->actual->gpc2clk == gpc2clk_target) {
nvgpu_atomic_inc(&arb->req_nr);
nvgpu_cond_signal_interruptible(&arb->request_wq);
goto exit_arb;
}
nvgpu_mutex_acquire(&arb->pstate_lock);
status = g->ops.clk.clk_get_round_rate(g,
CTRL_CLK_DOMAIN_GPCCLK, gpc2clk_session_target * 1000000UL, &rounded_rate);
clk_arb_dbg(g, "rounded_rate: %lu\n",
rounded_rate);
if (status < 0) {
arb->status = status;
nvgpu_mutex_release(&arb->pstate_lock);
/* make status visible */
nvgpu_smp_mb();
nvgpu_atomic_inc(&arb->req_nr);
nvgpu_cond_signal_interruptible(&arb->request_wq);
goto exit_arb;
}
/* the igpu set_rate accepts freq in Hz */
status = g->ops.clk.set_rate(g, CTRL_CLK_DOMAIN_GPCCLK, rounded_rate);
if (status < 0) {
arb->status = status;
nvgpu_mutex_release(&arb->pstate_lock);
/* make status visible */
nvgpu_smp_mb();
nvgpu_atomic_inc(&arb->req_nr);
nvgpu_cond_signal_interruptible(&arb->request_wq);
goto exit_arb;
}
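/*
* Publish the new effective frequency through the double-buffered
* actual pool: fill the entry readers are not using, then switch
* arb->actual after the write barrier below.
*/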
actual = ((NV_READ_ONCE(arb->actual)) == &arb->actual_pool[0] ?
&arb->actual_pool[1] : &arb->actual_pool[0]);
/* do not reorder this pointer */
nvgpu_smp_rmb();
actual->gpc2clk = gpc2clk_target;
arb->status = 0;
/* Make changes visible to other threads */
nvgpu_smp_wmb();
arb->actual = actual;
/* status must be visible before atomic inc */
nvgpu_smp_wmb();
nvgpu_atomic_inc(&arb->req_nr);
/* Unlock pstate change for PG */
nvgpu_mutex_release(&arb->pstate_lock);
nvgpu_cond_signal_interruptible(&arb->request_wq);
exit_arb:
if (status < 0) {
nvgpu_err(g, "Error in arbiter update");
}
/* notify completion for all requests */
nvgpu_spinlock_acquire(&arb->requests_lock);
nvgpu_list_for_each_entry_safe(dev, tmp, &arb->requests,
nvgpu_clk_dev, node) {
u32 tmp_poll_mask = NVGPU_POLLIN | NVGPU_POLLRDNORM;
nvgpu_atomic_set(&dev->poll_mask,
(int)tmp_poll_mask);
nvgpu_clk_arb_event_post_event(dev);
nvgpu_ref_put(&dev->refcount, nvgpu_clk_arb_free_fd);
nvgpu_list_del(&dev->node);
}
nvgpu_spinlock_release(&arb->requests_lock);
clk_arb_dbg(g, "done");
}
void gp10b_clk_arb_cleanup(struct nvgpu_clk_arb *arb)
{
struct gk20a *g = arb->g;
int index;
nvgpu_clk_arb_worker_deinit(g);
nvgpu_kfree(g, arb->gpc2clk_f_points);
for (index = 0; index < 2; index++) {
nvgpu_kfree(g,
arb->vf_table_pool[index].gpc2clk_points);
}
nvgpu_mutex_destroy(&g->clk_arb->pstate_lock);
nvgpu_kfree(g, g->clk_arb);
g->clk_arb = NULL;
}

View File

@@ -0,0 +1,40 @@
/*
* Copyright (c) 2018-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef CLK_ARB_GP10B_H
#define CLK_ARB_GP10B_H
struct nvgpu_clk_session;
struct nvgpu_clk_arb;
bool gp10b_check_clk_arb_support(struct gk20a *g);
u32 gp10b_get_arbiter_clk_domains(struct gk20a *g);
int gp10b_get_arbiter_f_points(struct gk20a *g, u32 api_domain,
u32 *num_points, u16 *freqs_in_mhz);
int gp10b_get_arbiter_clk_range(struct gk20a *g, u32 api_domain,
u16 *min_mhz, u16 *max_mhz);
int gp10b_get_arbiter_clk_default(struct gk20a *g, u32 api_domain,
u16 *default_mhz);
int gp10b_init_clk_arbiter(struct gk20a *g);
void gp10b_clk_arb_run_arbiter_cb(struct nvgpu_clk_arb *arb);
void gp10b_clk_arb_cleanup(struct nvgpu_clk_arb *arb);
#endif /* CLK_ARB_GP10B_H */

View File

@@ -0,0 +1,560 @@
/*
* Copyright (c) 2016-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/clk_arb.h>
#include <nvgpu/pmu/clk/clk.h>
#include <nvgpu/timers.h>
#include <nvgpu/boardobjgrp_e255.h>
#include <nvgpu/pmu/perf.h>
#include "clk_arb_gv100.h"
bool gv100_check_clk_arb_support(struct gk20a *g)
{
if ((g->ops.clk_arb.get_arbiter_clk_domains != NULL) &&
nvgpu_is_enabled(g, NVGPU_PMU_PSTATE)) {
return true;
} else {
return false;
}
}
u32 gv100_get_arbiter_clk_domains(struct gk20a *g)
{
(void)g;
return (CTRL_CLK_DOMAIN_GPCCLK);
}
int gv100_get_arbiter_f_points(struct gk20a *g, u32 api_domain,
u32 *num_points, u16 *freqs_in_mhz)
{
return g->ops.clk.clk_domain_get_f_points(g,
api_domain, num_points, freqs_in_mhz);
}
int gv100_get_arbiter_clk_range(struct gk20a *g, u32 api_domain,
u16 *min_mhz, u16 *max_mhz)
{
u32 clkwhich;
struct nvgpu_pmu_perf_pstate_clk_info *p0_info;
u16 max_min_freq_mhz;
u16 limit_min_mhz;
u16 gpcclk_cap_mhz;
bool error_status = false;
switch (api_domain) {
case CTRL_CLK_DOMAIN_MCLK:
clkwhich = CLKWHICH_MCLK;
break;
case CTRL_CLK_DOMAIN_GPCCLK:
clkwhich = CLKWHICH_GPCCLK;
break;
default:
error_status = true;
break;
}
if (error_status == true) {
return -EINVAL;
}
p0_info = nvgpu_pmu_perf_pstate_get_clk_set_info(g,
CTRL_PERF_PSTATE_P0, clkwhich);
if (p0_info == NULL) {
return -EINVAL;
}
limit_min_mhz = p0_info->min_mhz;
gpcclk_cap_mhz = p0_info->max_mhz;
max_min_freq_mhz = nvgpu_pmu_clk_fll_get_min_max_freq(g);
/*
* When the DVCO min from the VBIOS is 0, fall back to DVCO_MIN_DEFAULT_MHZ.
*/
if (max_min_freq_mhz == 0U) {
max_min_freq_mhz = DVCO_MIN_DEFAULT_MHZ;
}
/*
* Keep the reported GPCCLK minimum above the DVCO min frequency.
*/
if (api_domain == CTRL_CLK_DOMAIN_GPCCLK) {
if ((max_min_freq_mhz != 0U) &&
(max_min_freq_mhz >= limit_min_mhz)) {
limit_min_mhz = nvgpu_safe_cast_u32_to_u16(
nvgpu_safe_add_u32(max_min_freq_mhz, 1U));
}
if ((g->clk_arb->gpc_cap_clkmhz != 0U) &&
(p0_info->max_mhz > g->clk_arb->gpc_cap_clkmhz )) {
gpcclk_cap_mhz = g->clk_arb->gpc_cap_clkmhz;
}
}
*min_mhz = limit_min_mhz;
*max_mhz = gpcclk_cap_mhz;
return 0;
}
int gv100_get_arbiter_clk_default(struct gk20a *g, u32 api_domain,
u16 *default_mhz)
{
u32 clkwhich;
struct nvgpu_pmu_perf_pstate_clk_info *p0_info;
bool error_status = false;
u16 gpcclk_cap_mhz;
switch (api_domain) {
case CTRL_CLK_DOMAIN_MCLK:
clkwhich = CLKWHICH_MCLK;
break;
case CTRL_CLK_DOMAIN_GPCCLK:
clkwhich = CLKWHICH_GPCCLK;
break;
default:
error_status = true;
break;
}
if (error_status == true) {
return -EINVAL;
}
p0_info = nvgpu_pmu_perf_pstate_get_clk_set_info(g,
CTRL_PERF_PSTATE_P0, clkwhich);
if (p0_info == NULL) {
return -EINVAL;
}
gpcclk_cap_mhz = p0_info->max_mhz;
if (api_domain == CTRL_CLK_DOMAIN_GPCCLK) {
if ((g->clk_arb->gpc_cap_clkmhz != 0U) &&
(p0_info->max_mhz > g->clk_arb->gpc_cap_clkmhz )) {
gpcclk_cap_mhz = g->clk_arb->gpc_cap_clkmhz;
}
}
*default_mhz = gpcclk_cap_mhz;
return 0;
}
int gv100_init_clk_arbiter(struct gk20a *g)
{
struct nvgpu_clk_arb *arb;
u16 default_mhz;
int err;
int index;
struct nvgpu_clk_vf_table *table;
clk_arb_dbg(g, " ");
if (g->clk_arb != NULL) {
return 0;
}
arb = nvgpu_kzalloc(g, sizeof(struct nvgpu_clk_arb));
if (arb == NULL) {
return -ENOMEM;
}
nvgpu_mutex_init(&arb->pstate_lock);
nvgpu_spinlock_init(&arb->sessions_lock);
nvgpu_spinlock_init(&arb->users_lock);
nvgpu_spinlock_init(&arb->requests_lock);
arb->mclk_f_points = nvgpu_kcalloc(g, MAX_F_POINTS, sizeof(u16));
if (arb->mclk_f_points == NULL) {
err = -ENOMEM;
goto init_fail;
}
arb->gpc2clk_f_points = nvgpu_kcalloc(g, MAX_F_POINTS, sizeof(u16));
if (arb->gpc2clk_f_points == NULL) {
err = -ENOMEM;
goto init_fail;
}
for (index = 0; index < 2; index++) {
table = &arb->vf_table_pool[index];
table->gpc2clk_num_points = MAX_F_POINTS;
table->mclk_num_points = MAX_F_POINTS;
table->gpc2clk_points = nvgpu_kcalloc(g, MAX_F_POINTS,
sizeof(struct nvgpu_clk_vf_point));
if (table->gpc2clk_points == NULL) {
err = -ENOMEM;
goto init_fail;
}
table->mclk_points = nvgpu_kcalloc(g, MAX_F_POINTS,
sizeof(struct nvgpu_clk_vf_point));
if (table->mclk_points == NULL) {
err = -ENOMEM;
goto init_fail;
}
}
g->clk_arb = arb;
arb->g = g;
err = g->ops.clk_arb.get_arbiter_clk_default(g,
CTRL_CLK_DOMAIN_MCLK, &default_mhz);
if (err < 0) {
err = -EINVAL;
goto init_fail;
}
arb->mclk_default_mhz = default_mhz;
err = g->ops.clk_arb.get_arbiter_clk_default(g,
CTRL_CLK_DOMAIN_GPCCLK, &default_mhz);
if (err < 0) {
err = -EINVAL;
goto init_fail;
}
arb->gpc2clk_default_mhz = default_mhz;
arb->actual = &arb->actual_pool[0];
nvgpu_atomic_set(&arb->req_nr, 0);
nvgpu_atomic64_set(&arb->alarm_mask, 0);
err = nvgpu_clk_notification_queue_alloc(g, &arb->notification_queue,
DEFAULT_EVENT_NUMBER);
if (err < 0) {
goto init_fail;
}
nvgpu_init_list_node(&arb->users);
nvgpu_init_list_node(&arb->sessions);
nvgpu_init_list_node(&arb->requests);
(void)nvgpu_cond_init(&arb->request_wq);
nvgpu_init_list_node(&arb->update_vf_table_work_item.worker_item);
nvgpu_init_list_node(&arb->update_arb_work_item.worker_item);
arb->update_vf_table_work_item.arb = arb;
arb->update_arb_work_item.arb = arb;
arb->update_vf_table_work_item.item_type = CLK_ARB_WORK_UPDATE_VF_TABLE;
arb->update_arb_work_item.item_type = CLK_ARB_WORK_UPDATE_ARB;
err = nvgpu_clk_arb_worker_init(g);
if (err < 0) {
goto init_fail;
}
if (g->dgpu_max_clk != 0U) {
g->dgpu_max_clk = (g->dgpu_max_clk /
FREQ_STEP_SIZE_MHZ) * FREQ_STEP_SIZE_MHZ;
arb->gpc_cap_clkmhz = g->dgpu_max_clk;
}
#ifdef CONFIG_DEBUG_FS
arb->debug = &arb->debug_pool[0];
if (!arb->debugfs_set) {
if (nvgpu_clk_arb_debugfs_init(g))
arb->debugfs_set = true;
}
#endif
err = nvgpu_clk_vf_point_cache(g);
if (err < 0) {
goto init_fail;
}
err = nvgpu_clk_arb_update_vf_table(arb);
if (err < 0) {
goto init_fail;
}
do {
/* Check that first run is completed */
nvgpu_smp_mb();
NVGPU_COND_WAIT_INTERRUPTIBLE(&arb->request_wq,
nvgpu_atomic_read(&arb->req_nr), 0U);
} while (nvgpu_atomic_read(&arb->req_nr) == 0);
return arb->status;
init_fail:
nvgpu_kfree(g, arb->gpc2clk_f_points);
nvgpu_kfree(g, arb->mclk_f_points);
for (index = 0; index < 2; index++) {
nvgpu_kfree(g, arb->vf_table_pool[index].gpc2clk_points);
nvgpu_kfree(g, arb->vf_table_pool[index].mclk_points);
}
nvgpu_mutex_destroy(&arb->pstate_lock);
nvgpu_kfree(g, arb);
return err;
}
void gv100_clk_arb_run_arbiter_cb(struct nvgpu_clk_arb *arb)
{
struct nvgpu_clk_session *session;
struct nvgpu_clk_dev *dev;
struct nvgpu_clk_dev *tmp;
struct nvgpu_clk_arb_target *target, *actual;
struct gk20a *g = arb->g;
u32 current_pstate = VF_POINT_INVALID_PSTATE;
u32 voltuv = 0;
bool mclk_set, gpc2clk_set;
u32 alarms_notified = 0;
u32 current_alarm;
int status = 0;
/* Temporary variables for checking target frequency */
u16 gpc2clk_target, mclk_target;
struct nvgpu_clk_slave_freq vf_point;
#ifdef CONFIG_DEBUG_FS
s64 t0, t1;
struct nvgpu_clk_arb_debug *debug;
#endif
clk_arb_dbg(g, " ");
/* bail out if gpu is down */
if (nvgpu_atomic64_read(&arb->alarm_mask) & EVENT(ALARM_GPU_LOST)) {
goto exit_arb;
}
#ifdef CONFIG_DEBUG_FS
t0 = nvgpu_current_time_ns();
#endif
/* Only one arbiter should be running */
gpc2clk_target = 0;
mclk_target = 0;
nvgpu_spinlock_acquire(&arb->sessions_lock);
nvgpu_list_for_each_entry(session, &arb->sessions,
nvgpu_clk_session, link) {
if (!session->zombie) {
mclk_set = false;
gpc2clk_set = false;
target = (session->target == &session->target_pool[0] ?
&session->target_pool[1] :
&session->target_pool[0]);
nvgpu_spinlock_acquire(&session->session_lock);
if (!nvgpu_list_empty(&session->targets)) {
/* Copy over state */
target->mclk = session->target->mclk;
target->gpc2clk = session->target->gpc2clk;
/* Query the latest committed request */
nvgpu_list_for_each_entry_safe(dev, tmp,
&session->targets, nvgpu_clk_dev, node) {
if ((mclk_set == false) && (dev->mclk_target_mhz != 0U)) {
target->mclk =
dev->mclk_target_mhz;
mclk_set = true;
}
if ((gpc2clk_set == false) &&
(dev->gpc2clk_target_mhz != 0U)) {
target->gpc2clk =
dev->gpc2clk_target_mhz;
gpc2clk_set = true;
}
nvgpu_ref_get(&dev->refcount);
nvgpu_list_del(&dev->node);
nvgpu_spinlock_acquire(
&arb->requests_lock);
nvgpu_list_add(
&dev->node, &arb->requests);
nvgpu_spinlock_release(&arb->requests_lock);
}
session->target = target;
}
nvgpu_spinlock_release(
&session->session_lock);
mclk_target = mclk_target > session->target->mclk ?
mclk_target : session->target->mclk;
gpc2clk_target =
gpc2clk_target > session->target->gpc2clk ?
gpc2clk_target : session->target->gpc2clk;
}
}
nvgpu_spinlock_release(&arb->sessions_lock);
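/*
 * Fall back to the default frequencies when no session requested a
 * target, clamp both clocks to their [min, max] ranges, and apply the
 * optional GPC cap configured at init time.
 */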
gpc2clk_target = (gpc2clk_target > 0U) ? gpc2clk_target :
arb->gpc2clk_default_mhz;
if (gpc2clk_target < arb->gpc2clk_min) {
gpc2clk_target = arb->gpc2clk_min;
}
if (gpc2clk_target > arb->gpc2clk_max) {
gpc2clk_target = arb->gpc2clk_max;
}
mclk_target = (mclk_target > 0U) ? mclk_target :
arb->mclk_default_mhz;
if (mclk_target < arb->mclk_min) {
mclk_target = arb->mclk_min;
}
if (mclk_target > arb->mclk_max) {
mclk_target = arb->mclk_max;
}
if ((arb->gpc_cap_clkmhz != 0U) &&
(gpc2clk_target > arb->gpc_cap_clkmhz)) {
gpc2clk_target = arb->gpc_cap_clkmhz;
}
vf_point.gpc_mhz = gpc2clk_target;
status = nvgpu_clk_arb_find_slave_points(arb, &vf_point);
if (status != 0) {
nvgpu_err(g, "Unable to get slave frequency");
goto exit_arb;
}
status = nvgpu_pmu_perf_changeseq_set_clks(g, &vf_point);
if (status != 0) {
nvgpu_err(g, "Unable to program frequency");
goto exit_arb;
}
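/*
 * The committed ("actual") state is double-buffered as well: fill the
 * spare pool entry and publish it with a single pointer update after
 * the write barrier below.
 */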
actual = NV_READ_ONCE(arb->actual) == &arb->actual_pool[0] ?
&arb->actual_pool[1] : &arb->actual_pool[0];
/* do not reorder this pointer */
nvgpu_smp_rmb();
actual->gpc2clk = gpc2clk_target;
actual->mclk = mclk_target;
arb->voltuv_actual = voltuv;
actual->pstate = current_pstate;
arb->status = status;
/* Make changes visible to other threads */
nvgpu_smp_wmb();
arb->actual = actual;
/* status must be visible before atomic inc */
nvgpu_smp_wmb();
nvgpu_atomic_inc(&arb->req_nr);
/* VF Update complete */
nvgpu_clk_arb_set_global_alarm(g, EVENT(VF_UPDATE));
nvgpu_cond_signal_interruptible(&arb->request_wq);
#ifdef CONFIG_DEBUG_FS
t1 = nvgpu_current_time_ns();
debug = arb->debug == &arb->debug_pool[0] ?
&arb->debug_pool[1] : &arb->debug_pool[0];
memcpy(debug, arb->debug, sizeof(arb->debug_pool[0]));
debug->switch_num++;
if (debug->switch_num == 1) {
debug->switch_max = debug->switch_min =
debug->switch_avg = (t1-t0)/1000;
debug->switch_std = 0;
} else {
s64 prev_avg;
s64 curr = (t1-t0)/1000;
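/*
 * Welford-style running statistics: switch_avg is the running mean
 * and switch_std accumulates the sum of squared deviations, so the
 * sample variance is switch_std / (switch_num - 1).
 */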
debug->switch_max = curr > debug->switch_max ?
curr : debug->switch_max;
debug->switch_min = debug->switch_min ?
(curr < debug->switch_min ?
curr : debug->switch_min) : curr;
prev_avg = debug->switch_avg;
debug->switch_avg = (curr +
(debug->switch_avg * (debug->switch_num-1))) /
debug->switch_num;
debug->switch_std +=
(curr - debug->switch_avg) * (curr - prev_avg);
}
/* commit changes before exchanging debug pointer */
nvgpu_smp_wmb();
arb->debug = debug;
#endif
exit_arb:
if (status < 0) {
nvgpu_err(g, "Error in arbiter update");
nvgpu_clk_arb_set_global_alarm(g,
EVENT(ALARM_CLOCK_ARBITER_FAILED));
}
current_alarm = (u32) nvgpu_atomic64_read(&arb->alarm_mask);
/* notify completion for all requests */
nvgpu_spinlock_acquire(&arb->requests_lock);
nvgpu_list_for_each_entry_safe(dev, tmp, &arb->requests,
nvgpu_clk_dev, node) {
/* avoid casting composite expression below */
u32 tmp_mask = NVGPU_POLLIN | NVGPU_POLLRDNORM;
nvgpu_atomic_set(&dev->poll_mask, (int)tmp_mask);
nvgpu_clk_arb_event_post_event(dev);
nvgpu_ref_put(&dev->refcount, nvgpu_clk_arb_free_fd);
nvgpu_list_del(&dev->node);
}
nvgpu_spinlock_release(&arb->requests_lock);
nvgpu_atomic_set(&arb->notification_queue.head,
nvgpu_atomic_read(&arb->notification_queue.tail));
/* notify event for all users */
nvgpu_spinlock_acquire(&arb->users_lock);
nvgpu_list_for_each_entry(dev, &arb->users, nvgpu_clk_dev, link) {
alarms_notified |=
nvgpu_clk_arb_notify(dev, arb->actual, current_alarm);
}
nvgpu_spinlock_release(&arb->users_lock);
/* clear alarms */
nvgpu_clk_arb_clear_global_alarm(g, alarms_notified &
~EVENT(ALARM_GPU_LOST));
}
void gv100_clk_arb_cleanup(struct nvgpu_clk_arb *arb)
{
struct gk20a *g = arb->g;
int index;
nvgpu_kfree(g, arb->gpc2clk_f_points);
nvgpu_kfree(g, arb->mclk_f_points);
for (index = 0; index < 2; index++) {
nvgpu_kfree(g,
arb->vf_table_pool[index].gpc2clk_points);
nvgpu_kfree(g, arb->vf_table_pool[index].mclk_points);
}
nvgpu_mutex_destroy(&g->clk_arb->pstate_lock);
nvgpu_kfree(g, g->clk_arb);
g->clk_arb = NULL;
}
void gv100_stop_clk_arb_threads(struct gk20a *g)
{
nvgpu_clk_arb_worker_deinit(g);
}


@@ -0,0 +1,42 @@
/*
* Copyright (c) 2016-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef CLK_ARB_GV100_H
#define CLK_ARB_GV100_H
struct nvgpu_clk_session;
struct nvgpu_clk_arb;
#define DVCO_MIN_DEFAULT_MHZ 405
bool gv100_check_clk_arb_support(struct gk20a *g);
u32 gv100_get_arbiter_clk_domains(struct gk20a *g);
int gv100_get_arbiter_f_points(struct gk20a *g, u32 api_domain,
u32 *num_points, u16 *freqs_in_mhz);
int gv100_get_arbiter_clk_range(struct gk20a *g, u32 api_domain,
u16 *min_mhz, u16 *max_mhz);
int gv100_get_arbiter_clk_default(struct gk20a *g, u32 api_domain,
u16 *default_mhz);
int gv100_init_clk_arbiter(struct gk20a *g);
void gv100_clk_arb_run_arbiter_cb(struct nvgpu_clk_arb *arb);
void gv100_clk_arb_cleanup(struct nvgpu_clk_arb *arb);
void gv100_stop_clk_arb_threads(struct gk20a *g);
#endif /* CLK_ARB_GV100_H */


@@ -0,0 +1,169 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/regops.h>
#include <nvgpu/log.h>
#include <nvgpu/io.h>
#include <nvgpu/lock.h>
#include <nvgpu/channel.h>
#include <nvgpu/cyclestats.h>
#include "cyclestats_priv.h"
static inline bool is_valid_cyclestats_bar0_offset_gk20a(struct gk20a *g,
u32 offset)
{
/* support only 24-bit 4-byte aligned offsets */
bool valid = !(offset & 0xFF000003U);
if (g->allow_all) {
return true;
}
/* whitelist check */
valid = valid &&
is_bar0_global_offset_whitelisted_gk20a(g, offset);
/* resource size check in case there was a problem
* with allocating the assumed size of bar0 */
valid = valid && nvgpu_io_valid_reg(g, offset);
return valid;
}
void nvgpu_cyclestats_exec(struct gk20a *g,
struct nvgpu_channel *ch, u32 offset)
{
void *virtual_address;
u32 buffer_size;
bool exit;
/* GL will never use payload 0 for cycle state */
if ((ch->cyclestate.cyclestate_buffer == NULL) || (offset == 0U)) {
return;
}
nvgpu_mutex_acquire(&ch->cyclestate.cyclestate_buffer_mutex);
virtual_address = ch->cyclestate.cyclestate_buffer;
buffer_size = ch->cyclestate.cyclestate_buffer_size;
exit = false;
while (!exit) {
struct share_buffer_head *sh_hdr;
u32 min_element_size;
/* validate offset */
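/* the second comparison catches unsigned wrap-around of the offset */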
if (offset + sizeof(struct share_buffer_head) > buffer_size ||
offset + sizeof(struct share_buffer_head) < offset) {
nvgpu_err(g,
"cyclestats buffer overrun at offset 0x%x",
offset);
break;
}
sh_hdr = (struct share_buffer_head *)
((char *)virtual_address + offset);
min_element_size =
U32(sh_hdr->operation == OP_END ?
sizeof(struct share_buffer_head) :
sizeof(struct nvgpu_cyclestate_buffer_elem));
/* validate sh_hdr->size */
if (sh_hdr->size < min_element_size ||
offset + sh_hdr->size > buffer_size ||
offset + sh_hdr->size < offset) {
nvgpu_err(g,
"bad cyclestate buffer header size at offset 0x%x",
offset);
sh_hdr->failed = U32(true);
break;
}
switch (sh_hdr->operation) {
case OP_END:
exit = true;
break;
case BAR0_READ32:
case BAR0_WRITE32:
{
struct nvgpu_cyclestate_buffer_elem *op_elem =
(struct nvgpu_cyclestate_buffer_elem *)sh_hdr;
bool valid = is_valid_cyclestats_bar0_offset_gk20a(
g, op_elem->offset_bar0);
u32 raw_reg;
u64 mask_orig;
u64 v;
if (!valid) {
nvgpu_err(g,
"invalid cycletstats op offset: 0x%x",
op_elem->offset_bar0);
exit = true;
sh_hdr->failed = U32(exit);
break;
}
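/* build a mask covering register bits [first_bit, last_bit], inclusive */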
mask_orig =
((1ULL << (op_elem->last_bit + 1)) - 1) &
~((1ULL << op_elem->first_bit) - 1);
raw_reg = nvgpu_readl(g, op_elem->offset_bar0);
switch (sh_hdr->operation) {
case BAR0_READ32:
op_elem->data = ((raw_reg & mask_orig)
>> op_elem->first_bit);
break;
case BAR0_WRITE32:
v = 0;
if ((unsigned int)mask_orig !=
~((unsigned int)0)) {
v = (unsigned int)
(raw_reg & ~mask_orig);
}
v |= ((op_elem->data << op_elem->first_bit)
& mask_orig);
nvgpu_writel(g, op_elem->offset_bar0,
(unsigned int)v);
break;
default:
/* nop ok?*/
break;
}
}
break;
default:
/* no operation content case */
exit = true;
break;
}
sh_hdr->completed = U32(true);
offset += sh_hdr->size;
}
nvgpu_mutex_release(&ch->cyclestate.cyclestate_buffer_mutex);
}


@@ -0,0 +1,60 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_CYCLESTATS_PRIV_H
#define NVGPU_CYCLESTATS_PRIV_H
#include <nvgpu/types.h>
#define MULTICHAR_TAG(a, b, c, d) (((a) << 24) | ((b) << 16) | ((c) << 8) | (d))
enum BAR0_DEBUG_OPERATION {
BARO_ZERO_NOP = 0,
OP_END = MULTICHAR_TAG('D', 'O', 'N', 'E'),
BAR0_READ32 = MULTICHAR_TAG('0', 'R', '3', '2'),
BAR0_WRITE32 = MULTICHAR_TAG('0', 'W', '3', '2'),
};
struct share_buffer_head {
enum BAR0_DEBUG_OPERATION operation;
/* size of the operation item */
u32 size;
u32 completed;
u32 failed;
u64 context;
u64 completion_callback;
};
struct nvgpu_cyclestate_buffer_elem {
struct share_buffer_head head;
/* in */
u64 p_data;
u64 p_done;
u32 offset_bar0;
u16 first_bit;
u16 last_bit;
/* out */
/* keep 64 bits to be consistent */
u64 data;
};
#endif /* NVGPU_CYCLESTATS_PRIV_H */


@@ -0,0 +1,241 @@
/*
* Tegra GK20A GPU Debugger/Profiler Driver
*
* Copyright (c) 2013-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/kmem.h>
#include <nvgpu/log.h>
#include <nvgpu/vm.h>
#include <nvgpu/atomic.h>
#include <nvgpu/mm.h>
#include <nvgpu/bug.h>
#include <nvgpu/io.h>
#include <nvgpu/utils.h>
#include <nvgpu/channel.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
#include <nvgpu/debugger.h>
#include <nvgpu/profiler.h>
#include <nvgpu/power_features/power_features.h>
/*
* API to get first channel from the list of all channels
* bound to the debug session
*/
struct nvgpu_channel *
nvgpu_dbg_gpu_get_session_channel(struct dbg_session_gk20a *dbg_s)
{
struct dbg_session_channel_data *ch_data;
struct nvgpu_channel *ch;
struct gk20a *g = dbg_s->g;
nvgpu_mutex_acquire(&dbg_s->ch_list_lock);
if (nvgpu_list_empty(&dbg_s->ch_list)) {
nvgpu_mutex_release(&dbg_s->ch_list_lock);
return NULL;
}
ch_data = nvgpu_list_first_entry(&dbg_s->ch_list,
dbg_session_channel_data,
ch_entry);
ch = g->fifo.channel + ch_data->chid;
nvgpu_mutex_release(&dbg_s->ch_list_lock);
return ch;
}
void nvgpu_dbg_gpu_post_events(struct nvgpu_channel *ch)
{
struct dbg_session_data *session_data;
struct dbg_session_gk20a *dbg_s;
struct gk20a *g = ch->g;
nvgpu_log(g, gpu_dbg_fn | gpu_dbg_gpu_dbg, " ");
/* guard against the session list being modified */
nvgpu_mutex_acquire(&ch->dbg_s_lock);
nvgpu_list_for_each_entry(session_data, &ch->dbg_s_list,
dbg_session_data, dbg_s_entry) {
dbg_s = session_data->dbg_s;
if (dbg_s->dbg_events.events_enabled) {
nvgpu_log(g, gpu_dbg_gpu_dbg, "posting event on session id %d",
dbg_s->id);
nvgpu_log(g, gpu_dbg_gpu_dbg, "%d events pending",
dbg_s->dbg_events.num_pending_events);
dbg_s->dbg_events.num_pending_events++;
nvgpu_dbg_session_post_event(dbg_s);
}
}
nvgpu_mutex_release(&ch->dbg_s_lock);
}
bool nvgpu_dbg_gpu_broadcast_stop_trigger(struct nvgpu_channel *ch)
{
struct dbg_session_data *session_data;
struct dbg_session_gk20a *dbg_s;
bool broadcast = false;
struct gk20a *g = ch->g;
nvgpu_log(g, gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, " ");
/* guard against the session list being modified */
nvgpu_mutex_acquire(&ch->dbg_s_lock);
nvgpu_list_for_each_entry(session_data, &ch->dbg_s_list,
dbg_session_data, dbg_s_entry) {
dbg_s = session_data->dbg_s;
if (dbg_s->broadcast_stop_trigger) {
nvgpu_log(g, gpu_dbg_gpu_dbg | gpu_dbg_fn | gpu_dbg_intr,
"stop trigger broadcast enabled");
broadcast = true;
break;
}
}
nvgpu_mutex_release(&ch->dbg_s_lock);
return broadcast;
}
void nvgpu_dbg_gpu_clear_broadcast_stop_trigger(struct nvgpu_channel *ch)
{
struct dbg_session_data *session_data;
struct dbg_session_gk20a *dbg_s;
struct gk20a *g = ch->g;
nvgpu_log(g, gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, " ");
/* guard against the session list being modified */
nvgpu_mutex_acquire(&ch->dbg_s_lock);
nvgpu_list_for_each_entry(session_data, &ch->dbg_s_list,
dbg_session_data, dbg_s_entry) {
dbg_s = session_data->dbg_s;
if (dbg_s->broadcast_stop_trigger) {
nvgpu_log(g, gpu_dbg_gpu_dbg | gpu_dbg_fn | gpu_dbg_intr,
"stop trigger broadcast disabled");
dbg_s->broadcast_stop_trigger = false;
}
}
nvgpu_mutex_release(&ch->dbg_s_lock);
}
u32 nvgpu_set_powergate_locked(struct dbg_session_gk20a *dbg_s,
bool mode)
{
u32 err = 0U;
struct gk20a *g = dbg_s->g;
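/*
 * dbg_powergating_disabled_refcount counts the debug sessions that
 * currently have powergating disabled. The hardware powergate state
 * is only touched on the 0 <-> 1 transitions: decrement first when
 * re-enabling, change HW while the count is zero, increment last
 * when disabling.
 */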
if (dbg_s->is_pg_disabled != mode) {
if (mode == false) {
g->dbg_powergating_disabled_refcount--;
}
/*
* Allow powergate disable or enable only if
* the global pg disabled refcount is zero
*/
if (g->dbg_powergating_disabled_refcount == 0) {
err = g->ops.debugger.dbg_set_powergate(dbg_s,
mode);
}
if (mode) {
g->dbg_powergating_disabled_refcount++;
}
dbg_s->is_pg_disabled = mode;
}
return err;
}
int nvgpu_dbg_set_powergate(struct dbg_session_gk20a *dbg_s, bool disable_powergate)
{
int err = 0;
struct gk20a *g = dbg_s->g;
/* This function must be called with g->dbg_sessions_lock held */
nvgpu_log(g, gpu_dbg_fn|gpu_dbg_gpu_dbg, "%s powergate mode = %s",
g->name, disable_powergate ? "disable" : "enable");
/*
* Powergate mode here refers to railgate+powergate+clockgate
* so in case slcg/blcg/elcg are disabled and railgating is enabled,
* disable railgating and then set is_pg_disabled = true
* Similarly, when powermode=MODE_ENABLE, re-enable railgating but leave
* the other features alone if they were not enabled to begin with.
*/
if (disable_powergate) {
/* save off current powergate, clk state.
* set gpu module's can_powergate = 0.
* set gpu module's clk to max.
* while *a* debug session is active there will be no power or
* clocking state changes allowed from mainline code (but they
* should be saved).
*/
nvgpu_log(g, gpu_dbg_gpu_dbg | gpu_dbg_fn,
"module busy");
err = gk20a_busy(g);
if (err != 0) {
return err;
}
#ifdef CONFIG_NVGPU_NON_FUSA
err = nvgpu_cg_pg_disable(g);
#endif
if (err == 0) {
dbg_s->is_pg_disabled = true;
nvgpu_log(g, gpu_dbg_gpu_dbg | gpu_dbg_fn,
"pg disabled");
}
} else {
/* restore (can) powergate, clk state */
/* release pending exceptions to fault/be handled as usual */
/*TBD: ordering of these? */
#ifdef CONFIG_NVGPU_NON_FUSA
err = nvgpu_cg_pg_enable(g);
#endif
if (err == 0) {
dbg_s->is_pg_disabled = false;
nvgpu_log(g, gpu_dbg_gpu_dbg | gpu_dbg_fn,
"pg enabled");
}
nvgpu_log(g, gpu_dbg_gpu_dbg | gpu_dbg_fn, "module idle");
gk20a_idle(g);
}
nvgpu_log(g, gpu_dbg_fn|gpu_dbg_gpu_dbg, "%s powergate mode = %s done",
g->name, disable_powergate ? "disable" : "enable");
return err;
}


@@ -0,0 +1,338 @@
/*
* Copyright (c) 2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/device.h>
#include <nvgpu/list.h>
#include <nvgpu/kmem.h>
#include <nvgpu/string.h>
#include <nvgpu/log.h>
#define device_dbg(g, fmt, args...) \
do { \
nvgpu_log(g, gpu_dbg_device, fmt, ##args); \
} while (0)
static inline const char *nvgpu_device_type_to_str(const struct nvgpu_device *dev)
{
const char *str = "Unknown";
switch (dev->type) {
case NVGPU_DEVTYPE_GRAPHICS:
str = "GFX";
break;
case NVGPU_DEVTYPE_COPY0:
str = "CE0";
break;
case NVGPU_DEVTYPE_COPY1:
str = "CE1";
break;
case NVGPU_DEVTYPE_COPY2:
str = "CE2";
break;
case NVGPU_DEVTYPE_IOCTRL:
str = "IOCTRL";
break;
case NVGPU_DEVTYPE_LCE:
str = "LCE";
break;
default:
break;
}
return str;
}
void nvgpu_device_dump_dev(struct gk20a *g, const struct nvgpu_device *dev)
{
device_dbg(g, "Device %s:%d",
nvgpu_device_type_to_str(dev), dev->inst_id);
device_dbg(g, " EngineID: %2u FaultID: %2u",
dev->engine_id, dev->fault_id);
device_dbg(g, " RunlistID: %2u IntrID: %2u ResetID: %u",
dev->runlist_id, dev->intr_id, dev->reset_id);
device_dbg(g, " PRI Base: 0x%x", dev->pri_base);
}
/*
* Facilitate the parsing of the TOP array describing the devices present in the
* GPU.
*/
static int nvgpu_device_parse_hw_table(struct gk20a *g)
{
int ret = 0;
u32 token = NVGPU_DEVICE_TOKEN_INIT;
struct nvgpu_device *dev;
struct nvgpu_list_node *devlist;
while (true) {
dev = g->ops.top.parse_next_device(g, &token);
if (dev == NULL) {
break;
}
nvgpu_device_dump_dev(g, dev);
/*
* Otherwise we have a device - let's add it to the right device
* list.
*/
devlist = &g->devs->devlist_heads[dev->type];
nvgpu_list_add_tail(&dev->dev_list_node, devlist);
g->devs->dev_counts[dev->type] += 1;
}
return ret;
}
/*
* Facilitate reading the HW register table into a software abstraction. This is
* done only on the first boot as the table will never change dynamically.
*/
int nvgpu_device_init(struct gk20a *g)
{
u32 i;
device_dbg(g, "Initializating GPU device list");
/*
* Ground work - make sure we aren't doing this again and that we have
* all the necessary data structures.
*/
if (g->devs != NULL) {
device_dbg(g, " GPU device list already present. Done.");
return 0;
}
g->devs = nvgpu_kzalloc(g, sizeof(*g->devs));
if (g->devs == NULL) {
return -ENOMEM;
}
for (i = 0; i < NVGPU_MAX_DEVTYPE; i++) {
nvgpu_init_list_node(&g->devs->devlist_heads[i]);
}
return nvgpu_device_parse_hw_table(g);
}
static void nvgpu_device_cleanup_devtype(struct gk20a *g,
struct nvgpu_list_node *list)
{
struct nvgpu_device *dev;
while (!nvgpu_list_empty(list)) {
dev = nvgpu_list_first_entry(list,
nvgpu_device,
dev_list_node);
nvgpu_list_del(&dev->dev_list_node);
nvgpu_kfree(g, dev);
}
}
void nvgpu_device_cleanup(struct gk20a *g)
{
u32 i;
struct nvgpu_list_node *devlist;
device_dbg(g, "Releasing GPU device list");
/*
* Make unit testing a bit easier.
*/
if (g->devs == NULL) {
device_dbg(g, " Already done.");
return;
}
for (i = 0; i < NVGPU_MAX_DEVTYPE; i++) {
devlist = &g->devs->devlist_heads[i];
if (devlist == NULL) {
continue;
}
nvgpu_device_cleanup_devtype(g, devlist);
}
nvgpu_kfree(g, g->devs);
g->devs = NULL;
}
/*
* Find the instance passed. Do this by simply traversing the linked list; it's
* not particularly efficient, but we aren't expecting there to ever be _that_
* many devices.
*
* Return a pointer to the device or NULL if the inst ID is out of range.
*/
static const struct nvgpu_device *dev_instance_from_devlist(
struct nvgpu_list_node *devlist, u32 inst_id)
{
struct nvgpu_device *dev;
nvgpu_list_for_each_entry(dev, devlist, nvgpu_device, dev_list_node) {
if (dev->inst_id == inst_id) {
return dev;
}
}
return NULL;
}
const struct nvgpu_device *nvgpu_device_get(struct gk20a *g,
u32 type, u32 inst_id)
{
const struct nvgpu_device *dev;
struct nvgpu_list_node *device_list;
if (type >= NVGPU_MAX_DEVTYPE) {
return NULL;
}
device_list = &g->devs->devlist_heads[type];
dev = dev_instance_from_devlist(device_list, inst_id);
if (dev == NULL) {
return NULL;
}
return dev;
}
u32 nvgpu_device_count(struct gk20a *g, u32 type)
{
if (type >= NVGPU_MAX_DEVTYPE) {
return 0U;
}
return g->devs->dev_counts[type];
}
/*
* Internal function to query copy engines; async_only specifies whether
* this function should or should not include the GR copy engines (CEs that
* share a runlist with the GR engine(s)).
*
* This function basically iterates over two distinct copy engine lists:
* first the COPY0-2 (the old way of describing copy engines) and the LCE
* list (the new in Pascal way of describing copy engines).
*/
static u32 nvgpu_device_do_get_copies(struct gk20a *g,
bool async_only,
const struct nvgpu_device **ces,
u32 max)
{
u32 i;
u32 copies = 0U;
const struct nvgpu_device *dev;
const struct nvgpu_device *gr_dev;
if (max == 0U) {
return 0U;
}
gr_dev = nvgpu_device_get(g, NVGPU_DEVTYPE_GRAPHICS, 0U);
nvgpu_assert(gr_dev != NULL);
/*
* Start with the COPY0-2 engines. Note the awkward instance ID.
*/
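/*
 * COPY<n> engines are looked up with instance id n, hence the
 * i - NVGPU_DEVTYPE_COPY0 below.
 */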
for (i = NVGPU_DEVTYPE_COPY0; i <= NVGPU_DEVTYPE_COPY2; i++) {
dev = nvgpu_device_get(g, i, i - NVGPU_DEVTYPE_COPY0);
if (dev == NULL) {
continue;
}
if (async_only &&
dev->runlist_id == gr_dev->runlist_id) {
/* It's a GRCE, skip it per async_only. */
continue;
}
ces[copies] = dev;
copies = nvgpu_safe_add_u32(copies, 1U);
if (copies == max) {
return copies;
}
}
for (i = 0; i < nvgpu_device_count(g, NVGPU_DEVTYPE_LCE); i++) {
dev = nvgpu_device_get(g, NVGPU_DEVTYPE_LCE, i);
nvgpu_assert(dev != NULL);
if (async_only &&
dev->runlist_id == gr_dev->runlist_id) {
/* It's a GRCE, skip it per async_only. */
continue;
}
ces[copies] = dev;
copies = nvgpu_safe_add_u32(copies, 1U);
if (copies == max) {
return copies;
}
}
return copies;
}
u32 nvgpu_device_get_async_copies(struct gk20a *g,
const struct nvgpu_device **ces,
u32 max)
{
return nvgpu_device_do_get_copies(g, true, ces, max);
}
u32 nvgpu_device_get_copies(struct gk20a *g,
const struct nvgpu_device **ces,
u32 max)
{
return nvgpu_device_do_get_copies(g, false, ces, max);
}
/*
* Note: this kind of bleeds HW details into the core code. Eventually this
* should be handled by a translation table. However, for now, HW has kept the
* device type values consistent across chips and nvgpu already has this present
* in core code.
*
* Once a per-chip translation table exists we can translate and then do a
* comparison.
*/
bool nvgpu_device_is_ce(struct gk20a *g, const struct nvgpu_device *dev)
{
if (dev->type == NVGPU_DEVTYPE_COPY0 ||
dev->type == NVGPU_DEVTYPE_COPY1 ||
dev->type == NVGPU_DEVTYPE_COPY2 ||
dev->type == NVGPU_DEVTYPE_LCE) {
return true;
}
return false;
}
bool nvgpu_device_is_graphics(struct gk20a *g, const struct nvgpu_device *dev)
{
return dev->type == NVGPU_DEVTYPE_GRAPHICS;
}


@@ -0,0 +1,167 @@
/*
* Copyright (c) 2018-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/gr/gr_ecc.h>
#include <nvgpu/ltc.h>
void nvgpu_ecc_stat_add(struct gk20a *g, struct nvgpu_ecc_stat *stat)
{
struct nvgpu_ecc *ecc = &g->ecc;
nvgpu_init_list_node(&stat->node);
nvgpu_mutex_acquire(&ecc->stats_lock);
nvgpu_list_add_tail(&stat->node, &ecc->stats_list);
ecc->stats_count = nvgpu_safe_add_s32(ecc->stats_count, 1);
nvgpu_mutex_release(&ecc->stats_lock);
}
void nvgpu_ecc_stat_del(struct gk20a *g, struct nvgpu_ecc_stat *stat)
{
struct nvgpu_ecc *ecc = &g->ecc;
nvgpu_mutex_acquire(&ecc->stats_lock);
nvgpu_list_del(&stat->node);
ecc->stats_count = nvgpu_safe_sub_s32(ecc->stats_count, 1);
nvgpu_mutex_release(&ecc->stats_lock);
}
int nvgpu_ecc_counter_init(struct gk20a *g,
struct nvgpu_ecc_stat **statp, const char *name)
{
struct nvgpu_ecc_stat *stat;
stat = nvgpu_kzalloc(g, sizeof(*stat));
if (stat == NULL) {
nvgpu_err(g, "ecc counter alloc failed");
return -ENOMEM;
}
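/*
 * stat comes from nvgpu_kzalloc(), so copying at most
 * NVGPU_ECC_STAT_NAME_MAX_SIZE - 1 bytes keeps the name NUL-terminated.
 */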
(void)strncpy(stat->name, name, NVGPU_ECC_STAT_NAME_MAX_SIZE - 1U);
nvgpu_ecc_stat_add(g, stat);
*statp = stat;
return 0;
}
void nvgpu_ecc_counter_deinit(struct gk20a *g, struct nvgpu_ecc_stat **statp)
{
struct nvgpu_ecc_stat *stat;
if (*statp == NULL) {
return;
}
stat = *statp;
nvgpu_ecc_stat_del(g, stat);
nvgpu_kfree(g, stat);
*statp = NULL;
}
/* release all ecc_stat */
void nvgpu_ecc_free(struct gk20a *g)
{
struct nvgpu_ecc *ecc = &g->ecc;
nvgpu_gr_ecc_free(g);
nvgpu_ltc_ecc_free(g);
if (g->ops.fb.ecc.free != NULL) {
g->ops.fb.ecc.free(g);
}
#ifdef CONFIG_NVGPU_DGPU
if (g->ops.fb.fbpa_ecc_free != NULL) {
g->ops.fb.fbpa_ecc_free(g);
}
#endif
if (g->ops.pmu.ecc_free != NULL) {
g->ops.pmu.ecc_free(g);
}
nvgpu_mutex_acquire(&ecc->stats_lock);
WARN_ON(!nvgpu_list_empty(&ecc->stats_list));
nvgpu_mutex_release(&ecc->stats_lock);
(void)memset(ecc, 0, sizeof(*ecc));
}
int nvgpu_ecc_init_support(struct gk20a *g)
{
struct nvgpu_ecc *ecc = &g->ecc;
if (ecc->initialized) {
return 0;
}
nvgpu_mutex_init(&ecc->stats_lock);
nvgpu_init_list_node(&ecc->stats_list);
return 0;
}
/**
* Note that this function is to be called after all units requiring ecc stats
* have added entries to ecc->stats_list.
*/
int nvgpu_ecc_finalize_support(struct gk20a *g)
{
#ifdef CONFIG_NVGPU_SYSFS
int err;
#endif
if (g->ecc.initialized) {
return 0;
}
#ifdef CONFIG_NVGPU_SYSFS
err = nvgpu_ecc_sysfs_init(g);
if (err != 0) {
nvgpu_ecc_free(g);
return err;
}
#endif
g->ecc.initialized = true;
return 0;
}
void nvgpu_ecc_remove_support(struct gk20a *g)
{
if (!g->ecc.initialized) {
return;
}
#ifdef CONFIG_NVGPU_SYSFS
nvgpu_ecc_sysfs_remove(g);
#endif
nvgpu_ecc_free(g);
nvgpu_mutex_destroy(&g->ecc.stats_lock);
}


@@ -0,0 +1,69 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/falcon.h>
#include <nvgpu/log.h>
#include "engine_mem_queue_priv.h"
#include "engine_dmem_queue.h"
/* DMEM-Q specific ops */
static int engine_dmem_queue_push(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, u32 dst, void *data, u32 size)
{
struct gk20a *g = queue->g;
int err = 0;
err = nvgpu_falcon_copy_to_dmem(flcn, dst, data, size, 0);
if (err != 0) {
nvgpu_err(g, "flcn-%d, queue-%d", queue->flcn_id, queue->id);
nvgpu_err(g, "dmem queue write failed");
goto exit;
}
exit:
return err;
}
static int engine_dmem_queue_pop(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, u32 src, void *data, u32 size)
{
struct gk20a *g = queue->g;
int err = 0;
err = nvgpu_falcon_copy_from_dmem(flcn, src, data, size, 0);
if (err != 0) {
nvgpu_err(g, "flcn-%d, queue-%d", queue->flcn_id, queue->id);
nvgpu_err(g, "dmem queue read failed");
goto exit;
}
exit:
return err;
}
/* assign DMEM queue type specific ops */
void engine_dmem_queue_init(struct nvgpu_engine_mem_queue *queue)
{
queue->push = engine_dmem_queue_push;
queue->pop = engine_dmem_queue_pop;
}


@@ -0,0 +1,28 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_ENGINE_DMEM_QUEUE_H
#define NVGPU_ENGINE_DMEM_QUEUE_H
void engine_dmem_queue_init(struct nvgpu_engine_mem_queue *queue);
#endif /* NVGPU_ENGINE_DMEM_QUEUE_H */


@@ -0,0 +1,69 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/falcon.h>
#include <nvgpu/log.h>
#include "engine_mem_queue_priv.h"
#include "engine_emem_queue.h"
/* EMEM-Q specific ops */
static int engine_emem_queue_push(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, u32 dst, void *data, u32 size)
{
struct gk20a *g = queue->g;
int err = 0;
err = nvgpu_falcon_copy_to_emem(flcn, dst, data, size, 0);
if (err != 0) {
nvgpu_err(g, "flcn-%d, queue-%d", queue->flcn_id, queue->id);
nvgpu_err(g, "emem queue write failed");
goto exit;
}
exit:
return err;
}
static int engine_emem_queue_pop(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, u32 src, void *data, u32 size)
{
struct gk20a *g = queue->g;
int err = 0;
err = nvgpu_falcon_copy_from_emem(flcn, src, data, size, 0);
if (err != 0) {
nvgpu_err(g, "flcn-%d, queue-%d", queue->flcn_id, queue->id);
nvgpu_err(g, "emem queue read failed");
goto exit;
}
exit:
return err;
}
/* assign EMEM queue type specific ops */
void engine_emem_queue_init(struct nvgpu_engine_mem_queue *queue)
{
queue->push = engine_emem_queue_push;
queue->pop = engine_emem_queue_pop;
}

View File

@@ -0,0 +1,28 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_ENGINE_EMEM_QUEUE_H
#define NVGPU_ENGINE_EMEM_QUEUE_H
void engine_emem_queue_init(struct nvgpu_engine_mem_queue *queue);
#endif /* NVGPU_ENGINE_EMEM_QUEUE_H */


@@ -0,0 +1,603 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/log.h>
#include <nvgpu/errno.h>
#include <nvgpu/types.h>
#include <nvgpu/flcnif_cmn.h>
#include <nvgpu/nvgpu_mem.h>
#include <nvgpu/string.h>
#include <nvgpu/kmem.h>
#include <nvgpu/engine_queue.h>
#include <nvgpu/engine_fb_queue.h>
#include <nvgpu/pmu/pmuif/cmn.h>
#include "engine_fb_queue_priv.h"
/* FB-Q ops */
static int engine_fb_queue_head(struct nvgpu_engine_fb_queue *queue,
u32 *head, bool set)
{
return queue->queue_head(queue->g, queue->id, queue->index, head, set);
}
static int engine_fb_queue_tail(struct nvgpu_engine_fb_queue *queue,
u32 *tail, bool set)
{
struct gk20a *g = queue->g;
int err;
if (set == false && PMU_IS_COMMAND_QUEUE(queue->id)) {
*tail = queue->fbq.tail;
err = 0;
} else {
err = queue->queue_tail(g, queue->id, queue->index, tail, set);
}
return err;
}
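/* FB queue positions index whole queue elements and wrap modulo the
 * number of elements in the queue. */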
static inline u32 engine_fb_queue_get_next(struct nvgpu_engine_fb_queue *queue,
u32 head)
{
return (head + 1U) % queue->size;
}
static bool engine_fb_queue_has_room(struct nvgpu_engine_fb_queue *queue,
u32 size)
{
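/*
 * FB queues are element-based, so room for one more element is all
 * that is needed regardless of the requested size; the caller bounds
 * checks size against the element size.
 */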
u32 head = 0;
u32 tail = 0;
u32 next_head = 0;
int err = 0;
err = queue->head(queue, &head, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "queue head GET failed");
goto exit;
}
err = queue->tail(queue, &tail, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "queue tail GET failed");
goto exit;
}
next_head = engine_fb_queue_get_next(queue, head);
exit:
return next_head != tail;
}
static int engine_fb_queue_write(struct nvgpu_engine_fb_queue *queue,
u32 offset, u8 *src, u32 size)
{
struct gk20a *g = queue->g;
struct nv_falcon_fbq_hdr *fb_q_hdr = (struct nv_falcon_fbq_hdr *)
(void *)queue->fbq.work_buffer;
u32 entry_offset = 0U;
int err = 0;
if (queue->fbq.work_buffer == NULL) {
nvgpu_err(g, "Invalid/Unallocated work buffer");
err = -EINVAL;
goto exit;
}
/* Fill out FBQ hdr, that is in the work buffer */
fb_q_hdr->element_index = (u8)offset;
/* check queue entry size */
if (fb_q_hdr->heap_size >= (u16)queue->fbq.element_size) {
err = -EINVAL;
goto exit;
}
/* get offset to this element entry */
entry_offset = offset * queue->fbq.element_size;
/* copy cmd to super-surface */
nvgpu_mem_wr_n(g, queue->fbq.super_surface_mem,
queue->fbq.fb_offset + entry_offset,
queue->fbq.work_buffer, queue->fbq.element_size);
exit:
return err;
}
static int engine_fb_queue_set_element_use_state(
struct nvgpu_engine_fb_queue *queue, u32 queue_pos, bool set)
{
int err = 0;
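/*
 * Note: fbq.element_in_use is a 64-bit bitmap, so this tracking
 * assumes an FB queue holds at most 64 elements.
 */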
if (queue_pos >= queue->size) {
err = -EINVAL;
goto exit;
}
if (nvgpu_test_bit(queue_pos,
(void *)&queue->fbq.element_in_use) && set) {
nvgpu_err(queue->g,
"FBQ last received queue element not processed yet"
" queue_pos %d", queue_pos);
err = -EINVAL;
goto exit;
}
if (set) {
nvgpu_set_bit(queue_pos, (void *)&queue->fbq.element_in_use);
} else {
nvgpu_clear_bit(queue_pos, (void *)&queue->fbq.element_in_use);
}
exit:
return err;
}
static int engine_fb_queue_is_element_in_use(
struct nvgpu_engine_fb_queue *queue,
u32 queue_pos, bool *in_use)
{
int err = 0;
if (queue_pos >= queue->size) {
err = -EINVAL;
goto exit;
}
*in_use = nvgpu_test_bit(queue_pos, (void *)&queue->fbq.element_in_use);
exit:
return err;
}
static int engine_fb_queue_sweep(struct nvgpu_engine_fb_queue *queue)
{
u32 head;
u32 tail;
bool in_use = false;
int err = 0;
tail = queue->fbq.tail;
err = queue->head(queue, &head, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d queue-%d, position GET failed",
queue->flcn_id, queue->id);
goto exit;
}
/*
* Step from tail forward in the queue,
* to see how many consecutive entries
* can be made available.
*/
while (tail != head) {
if (engine_fb_queue_is_element_in_use(queue,
tail, &in_use) != 0) {
break;
}
if (in_use) {
break;
}
tail = engine_fb_queue_get_next(queue, tail);
}
/* Update tail */
queue->fbq.tail = tail;
exit:
return err;
}
u32 nvgpu_engine_fb_queue_get_position(struct nvgpu_engine_fb_queue *queue)
{
return queue->position;
}
/* return the queue element size */
u32 nvgpu_engine_fb_queue_get_element_size(struct nvgpu_engine_fb_queue *queue)
{
return queue->fbq.element_size;
}
/* return the queue offset from super surface FBQ's */
u32 nvgpu_engine_fb_queue_get_offset(struct nvgpu_engine_fb_queue *queue)
{
return queue->fbq.fb_offset;
}
/* lock work buffer of queue */
void nvgpu_engine_fb_queue_lock_work_buffer(struct nvgpu_engine_fb_queue *queue)
{
/* acquire work buffer mutex */
nvgpu_mutex_acquire(&queue->fbq.work_buffer_mutex);
}
/* unlock work buffer of queue */
void nvgpu_engine_fb_queue_unlock_work_buffer(
struct nvgpu_engine_fb_queue *queue)
{
/* release work buffer mutex */
nvgpu_mutex_release(&queue->fbq.work_buffer_mutex);
}
/* return a pointer of queue work buffer */
u8 *nvgpu_engine_fb_queue_get_work_buffer(struct nvgpu_engine_fb_queue *queue)
{
return queue->fbq.work_buffer;
}
int nvgpu_engine_fb_queue_free_element(struct nvgpu_engine_fb_queue *queue,
u32 queue_pos)
{
int err = 0;
err = engine_fb_queue_set_element_use_state(queue,
queue_pos, false);
if (err != 0) {
nvgpu_err(queue->g, "fb queue elelment %d free failed",
queue_pos);
goto exit;
}
err = engine_fb_queue_sweep(queue);
exit:
return err;
}
/* queue is_empty check with lock */
bool nvgpu_engine_fb_queue_is_empty(struct nvgpu_engine_fb_queue *queue)
{
u32 q_head = 0;
u32 q_tail = 0;
int err = 0;
if (queue == NULL) {
return true;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = queue->head(queue, &q_head, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d queue-%d, head GET failed",
queue->flcn_id, queue->id);
goto exit;
}
err = queue->tail(queue, &q_tail, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d queue-%d, tail GET failed",
queue->flcn_id, queue->id);
goto exit;
}
exit:
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
return q_head == q_tail;
}
static int engine_fb_queue_prepare_write(struct nvgpu_engine_fb_queue *queue,
u32 size)
{
int err = 0;
/* make sure there's enough free space for the write */
if (!engine_fb_queue_has_room(queue, size)) {
nvgpu_log_info(queue->g, "queue full: queue-id %d: index %d",
queue->id, queue->index);
err = -EAGAIN;
goto exit;
}
err = queue->head(queue, &queue->position, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d queue-%d, position GET failed",
queue->flcn_id, queue->id);
goto exit;
}
exit:
return err;
}
/* queue push operation with lock */
int nvgpu_engine_fb_queue_push(struct nvgpu_engine_fb_queue *queue,
void *data, u32 size)
{
struct gk20a *g;
int err = 0;
if (queue == NULL) {
return -EINVAL;
}
g = queue->g;
nvgpu_log_fn(g, " ");
if (queue->oflag != OFLAG_WRITE) {
nvgpu_err(queue->g, "flcn-%d, queue-%d not opened for write",
queue->flcn_id, queue->id);
err = -EINVAL;
goto exit;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = engine_fb_queue_prepare_write(queue, size);
if (err != 0) {
goto unlock_mutex;
}
/* Bounds check size */
if (size > queue->fbq.element_size) {
nvgpu_err(g, "size too large size=0x%x", size);
goto unlock_mutex;
}
/* Set queue element in use */
if (engine_fb_queue_set_element_use_state(queue,
queue->position, true) != 0) {
nvgpu_err(g,
"fb-queue element in use map is in invalid state");
err = -EINVAL;
goto unlock_mutex;
}
/* write data to FB */
err = engine_fb_queue_write(queue, queue->position, data, size);
if (err != 0) {
nvgpu_err(g, "write to fb-queue failed");
goto unlock_mutex;
}
queue->position = engine_fb_queue_get_next(queue,
queue->position);
err = queue->head(queue, &queue->position, QUEUE_SET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d queue-%d, position SET failed",
queue->flcn_id, queue->id);
goto unlock_mutex;
}
unlock_mutex:
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
exit:
if (err != 0) {
nvgpu_err(queue->g, "falcon id-%d, queue id-%d, failed",
queue->flcn_id, queue->id);
}
return err;
}
/* queue pop operation with lock */
int nvgpu_engine_fb_queue_pop(struct nvgpu_engine_fb_queue *queue,
void *data, u32 size, u32 *bytes_read)
{
struct gk20a *g;
struct pmu_hdr *hdr;
u32 entry_offset = 0U;
int err = 0;
if (queue == NULL) {
return -EINVAL;
}
g = queue->g;
hdr = (struct pmu_hdr *) (void *) (queue->fbq.work_buffer +
sizeof(struct nv_falcon_fbq_msgq_hdr));
nvgpu_log_fn(g, " ");
if (queue->oflag != OFLAG_READ) {
nvgpu_err(g, "flcn-%d, queue-%d, not opened for read",
queue->flcn_id, queue->id);
err = -EINVAL;
goto exit;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = queue->tail(queue, &queue->position, QUEUE_GET);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, position GET failed",
queue->flcn_id, queue->id);
goto unlock_mutex;
}
*bytes_read = 0U;
/* Check size */
if ((size + queue->fbq.read_position) >= queue->fbq.element_size) {
nvgpu_err(g,
"Attempt to read > than queue element size "
"for queue id-%d", queue->id);
err = -EINVAL;
goto unlock_mutex;
}
entry_offset = queue->position * queue->fbq.element_size;
/*
* If first read for this queue element then read whole queue
* element into work buffer.
*/
if (queue->fbq.read_position == 0U) {
nvgpu_mem_rd_n(g, queue->fbq.super_surface_mem,
/* source (FBQ data) offset*/
queue->fbq.fb_offset + entry_offset,
/* destination buffer */
(void *)queue->fbq.work_buffer,
/* copy size */
queue->fbq.element_size);
/* Check size in hdr of MSG just read */
if (hdr->size >= queue->fbq.element_size) {
nvgpu_err(g, "Super Surface read failed");
err = -ERANGE;
goto unlock_mutex;
}
}
nvgpu_memcpy((u8 *)data, (u8 *)queue->fbq.work_buffer +
queue->fbq.read_position +
sizeof(struct nv_falcon_fbq_msgq_hdr),
size);
/* update current position */
queue->fbq.read_position += size;
/* If reached end of this queue element, move on to next. */
if (queue->fbq.read_position >= hdr->size) {
queue->fbq.read_position = 0U;
/* Increment queue index. */
queue->position = engine_fb_queue_get_next(queue,
queue->position);
}
*bytes_read = size;
err = queue->tail(queue, &queue->position, QUEUE_SET);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, position SET failed",
queue->flcn_id, queue->id);
goto unlock_mutex;
}
unlock_mutex:
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
exit:
if (err != 0) {
nvgpu_err(g, "falcon id-%d, queue id-%d, failed",
queue->flcn_id, queue->id);
}
return err;
}
void nvgpu_engine_fb_queue_free(struct nvgpu_engine_fb_queue **queue_p)
{
struct nvgpu_engine_fb_queue *queue = NULL;
struct gk20a *g;
if ((queue_p == NULL) || (*queue_p == NULL)) {
return;
}
queue = *queue_p;
g = queue->g;
nvgpu_log_info(g, "flcn id-%d q-id %d: index %d ",
queue->flcn_id, queue->id, queue->index);
nvgpu_kfree(g, queue->fbq.work_buffer);
nvgpu_mutex_destroy(&queue->fbq.work_buffer_mutex);
/* destroy mutex */
nvgpu_mutex_destroy(&queue->mutex);
nvgpu_kfree(g, queue);
*queue_p = NULL;
}
int nvgpu_engine_fb_queue_init(struct nvgpu_engine_fb_queue **queue_p,
struct nvgpu_engine_fb_queue_params params)
{
struct nvgpu_engine_fb_queue *queue = NULL;
struct gk20a *g = params.g;
int err = 0;
if (queue_p == NULL) {
return -EINVAL;
}
queue = (struct nvgpu_engine_fb_queue *)
nvgpu_kmalloc(g, sizeof(struct nvgpu_engine_fb_queue));
if (queue == NULL) {
return -ENOMEM;
}
queue->g = params.g;
queue->flcn_id = params.flcn_id;
queue->id = params.id;
queue->index = params.index;
queue->size = params.size;
queue->oflag = params.oflag;
queue->fbq.tail = 0U;
queue->fbq.element_in_use = 0U;
queue->fbq.read_position = 0U;
queue->fbq.super_surface_mem = params.super_surface_mem;
queue->fbq.element_size = params.fbq_element_size;
queue->fbq.fb_offset = params.fbq_offset;
queue->position = 0U;
queue->queue_head = params.queue_head;
queue->queue_tail = params.queue_tail;
queue->head = engine_fb_queue_head;
queue->tail = engine_fb_queue_tail;
/* init mutex */
nvgpu_mutex_init(&queue->mutex);
/* init mutex */
nvgpu_mutex_init(&queue->fbq.work_buffer_mutex);
queue->fbq.work_buffer = nvgpu_kzalloc(g, queue->fbq.element_size);
if (queue->fbq.work_buffer == NULL) {
err = -ENOMEM;
goto free_work_mutex;
}
nvgpu_log_info(g,
"flcn id-%d q-id %d: index %d, size 0x%08x",
queue->flcn_id, queue->id, queue->index,
queue->size);
*queue_p = queue;
return 0;
free_work_mutex:
nvgpu_mutex_destroy(&queue->fbq.work_buffer_mutex);
nvgpu_mutex_destroy(&queue->mutex);
nvgpu_kfree(g, queue);
return err;
}


@@ -0,0 +1,108 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_ENGINE_FB_QUEUE_PRIV_H
#define NVGPU_ENGINE_FB_QUEUE_PRIV_H
#include <nvgpu/lock.h>
struct nvgpu_engine_fb_queue {
struct gk20a *g;
u32 flcn_id;
/* used by nvgpu, for command LPQ/HPQ */
struct nvgpu_mutex mutex;
/* current write position */
u32 position;
/* logical queue identifier */
u32 id;
/* physical queue index */
u32 index;
/* in bytes */
u32 size;
/* open-flag */
u32 oflag;
/* members unique to the FB version of the falcon queues */
struct {
/* Holds super surface base address */
struct nvgpu_mem *super_surface_mem;
/*
* Holds the offset of queue data (0th element).
* This is used for FB Queues to hold an offset into the
* Super Surface for this queue.
*/
u32 fb_offset;
/*
* Define the size of a single queue element.
* The size member above gives the number of
* queue elements.
*/
u32 element_size;
/* To keep track of elements in use */
u64 element_in_use;
/*
* Define a pointer to a local (SYSMEM) allocated
* buffer that holds a single queue element while
* it is being assembled.
*/
u8 *work_buffer;
struct nvgpu_mutex work_buffer_mutex;
/*
* Tracks how much of the current FB Queue MSG queue
* entry has been read. This is needed as functions read
* the MSG queue as a byte stream, rather
* than reading a whole MSG at a time.
*/
u32 read_position;
/*
* Tail as tracked on the nvgpu "side". Because a queue
* element and its associated payload (which is also moved
* PMU->nvgpu through the FB CMD Queue) can't be freed until
* the command is complete, the response is received and any "out"
* payload is delivered to the client, nvgpu has to track
* its own version of "tail". This one is advanced as completed
* entries are found following the current tail.
*/
u32 tail;
} fbq;
/* engine and queue specific ops */
int (*tail)(struct nvgpu_engine_fb_queue *queue, u32 *tail, bool set);
int (*head)(struct nvgpu_engine_fb_queue *queue, u32 *head, bool set);
/* engine specific ops */
int (*queue_head)(struct gk20a *g, u32 queue_id, u32 queue_index,
u32 *head, bool set);
int (*queue_tail)(struct gk20a *g, u32 queue_id, u32 queue_index,
u32 *tail, bool set);
};
#endif /* NVGPU_ENGINE_FB_QUEUE_PRIV_H */


@@ -0,0 +1,438 @@
/*
* Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/errno.h>
#include <nvgpu/kmem.h>
#include <nvgpu/lock.h>
#include <nvgpu/log.h>
#include <nvgpu/flcnif_cmn.h>
#include <nvgpu/pmu/pmuif/nvgpu_cmdif.h>
#include <nvgpu/engine_queue.h>
#include <nvgpu/engine_mem_queue.h>
#include <nvgpu/pmu/cmd.h>
#include "engine_mem_queue_priv.h"
#include "engine_dmem_queue.h"
#include "engine_emem_queue.h"
static int mem_queue_get_head_tail(struct nvgpu_engine_mem_queue *queue,
u32 *q_head, u32 *q_tail)
{
int err = 0;
err = queue->head(queue->g, queue->id, queue->index,
q_head, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d, queue-%d, head GET failed",
queue->flcn_id, queue->id);
goto exit;
}
err = queue->tail(queue->g, queue->id, queue->index,
q_tail, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d, queue-%d, tail GET failed",
queue->flcn_id, queue->id);
goto exit;
}
return 0;
exit:
return err;
}
/* common falcon queue ops */
static bool engine_mem_queue_has_room(struct nvgpu_engine_mem_queue *queue,
u32 size, bool *need_rewind)
{
u32 q_head = 0;
u32 q_tail = 0;
u32 q_free = 0;
bool q_rewind = false;
int err = 0;
size = NVGPU_ALIGN(size, QUEUE_ALIGNMENT);
err = mem_queue_get_head_tail(queue, &q_head, &q_tail);
if (err != 0) {
goto exit;
}
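/*
 * With head at or ahead of tail, the free space runs from head to the
 * end of the queue, minus one command header reserved for a possible
 * REWIND command; if the write does not fit there, request a rewind
 * so that it restarts at the queue offset.
 */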
if (q_head >= q_tail) {
q_free = queue->offset + queue->size - q_head;
q_free -= (u32)PMU_CMD_HDR_SIZE;
if (size > q_free) {
q_rewind = true;
q_head = queue->offset;
}
}
if (q_head < q_tail) {
q_free = q_tail - q_head - 1U;
}
if (need_rewind != NULL) {
*need_rewind = q_rewind;
}
exit:
return size <= q_free;
}
static int engine_mem_queue_rewind(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue)
{
struct gk20a *g = queue->g;
struct pmu_cmd cmd;
int err = 0;
if (queue->oflag == OFLAG_WRITE) {
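/*
 * For a command (write) queue, tell the falcon that the queue wraps
 * here by pushing a REWIND command at the current head position.
 */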
cmd.hdr.unit_id = PMU_UNIT_REWIND;
cmd.hdr.size = (u8)PMU_CMD_HDR_SIZE;
err = queue->push(flcn, queue, queue->position,
&cmd, cmd.hdr.size);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, rewind request failed",
queue->flcn_id, queue->id);
goto exit;
} else {
queue->position += nvgpu_safe_cast_u32_to_u8(
NVGPU_ALIGN(U32(cmd.hdr.size), QUEUE_ALIGNMENT));
nvgpu_log_info(g, "flcn-%d queue-%d, rewinded",
queue->flcn_id, queue->id);
}
}
/* update queue position */
queue->position = queue->offset;
if (queue->oflag == OFLAG_READ) {
err = queue->tail(g, queue->id, queue->index, &queue->position,
QUEUE_SET);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, position SET failed",
queue->flcn_id, queue->id);
goto exit;
}
}
exit:
return err;
}
static int engine_mem_queue_prepare_write(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, u32 size)
{
bool q_rewind = false;
int err = 0;
/* make sure there's enough free space for the write */
if (!engine_mem_queue_has_room(queue, size, &q_rewind)) {
nvgpu_log_info(queue->g, "queue full: queue-id %d: index %d",
queue->id, queue->index);
err = -EAGAIN;
goto exit;
}
err = queue->head(queue->g, queue->id, queue->index,
&queue->position, QUEUE_GET);
if (err != 0) {
nvgpu_err(queue->g, "flcn-%d queue-%d, position GET failed",
queue->flcn_id, queue->id);
goto exit;
}
if (q_rewind) {
err = engine_mem_queue_rewind(flcn, queue);
}
exit:
return err;
}
/* queue public functions */
/* queue push operation with lock */
int nvgpu_engine_mem_queue_push(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, void *data, u32 size)
{
struct gk20a *g;
int err = 0;
if ((flcn == NULL) || (queue == NULL)) {
return -EINVAL;
}
g = queue->g;
if (queue->oflag != OFLAG_WRITE) {
nvgpu_err(g, "flcn-%d, queue-%d not opened for write",
queue->flcn_id, queue->id);
err = -EINVAL;
goto exit;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = engine_mem_queue_prepare_write(flcn, queue, size);
if (err != 0) {
goto unlock_mutex;
}
err = queue->push(flcn, queue, queue->position, data, size);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, fail to write",
queue->flcn_id, queue->id);
goto unlock_mutex;
}
queue->position += NVGPU_ALIGN(size, QUEUE_ALIGNMENT);
err = queue->head(g, queue->id, queue->index,
&queue->position, QUEUE_SET);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, position SET failed",
queue->flcn_id, queue->id);
}
unlock_mutex:
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
exit:
return err;
}
/* queue pop operation with lock */
int nvgpu_engine_mem_queue_pop(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue, void *data, u32 size,
u32 *bytes_read)
{
struct gk20a *g;
u32 q_tail = 0;
u32 q_head = 0;
u32 used = 0;
int err = 0;
*bytes_read = 0;
if ((flcn == NULL) || (queue == NULL)) {
return -EINVAL;
}
g = queue->g;
if (queue->oflag != OFLAG_READ) {
nvgpu_err(g, "flcn-%d, queue-%d, not opened for read",
queue->flcn_id, queue->id);
err = -EINVAL;
goto exit;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = mem_queue_get_head_tail(queue, &q_head, &queue->position);
if (err != 0) {
goto unlock_mutex;
}
q_tail = queue->position;
if (q_head == q_tail) {
goto unlock_mutex;
} else if (q_head > q_tail) {
used = q_head - q_tail;
} else {
used = queue->offset + queue->size - q_tail;
}
if (size > used) {
nvgpu_warn(g, "requested read larger than data available in queue");
size = used;
}
err = queue->pop(flcn, queue, q_tail, data, size);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, fail to read",
queue->flcn_id, queue->id);
goto unlock_mutex;
}
queue->position += NVGPU_ALIGN(size, QUEUE_ALIGNMENT);
err = queue->tail(g, queue->id, queue->index,
&queue->position, QUEUE_SET);
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, position SET failed",
queue->flcn_id, queue->id);
goto unlock_mutex;
}
*bytes_read = size;
unlock_mutex:
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
exit:
return err;
}
int nvgpu_engine_mem_queue_rewind(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue)
{
int err = 0;
if ((flcn == NULL) || (queue == NULL)) {
return -EINVAL;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = engine_mem_queue_rewind(flcn, queue);
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
return err;
}
/* queue is_empty check with lock */
bool nvgpu_engine_mem_queue_is_empty(struct nvgpu_engine_mem_queue *queue)
{
u32 q_head = 0;
u32 q_tail = 0;
int err = 0;
if (queue == NULL) {
return true;
}
/* acquire mutex */
nvgpu_mutex_acquire(&queue->mutex);
err = mem_queue_get_head_tail(queue, &q_head, &q_tail);
if (err != 0) {
goto exit;
}
exit:
/* release mutex */
nvgpu_mutex_release(&queue->mutex);
return q_head == q_tail;
}
void nvgpu_engine_mem_queue_free(struct nvgpu_engine_mem_queue **queue_p)
{
struct nvgpu_engine_mem_queue *queue = NULL;
struct gk20a *g;
if ((queue_p == NULL) || (*queue_p == NULL)) {
return;
}
queue = *queue_p;
g = queue->g;
nvgpu_log_info(g, "flcn id-%d q-id %d: index %d ",
queue->flcn_id, queue->id, queue->index);
/* destroy mutex */
nvgpu_mutex_destroy(&queue->mutex);
nvgpu_kfree(g, queue);
*queue_p = NULL;
}
u32 nvgpu_engine_mem_queue_get_size(struct nvgpu_engine_mem_queue *queue)
{
return queue->size;
}
int nvgpu_engine_mem_queue_init(struct nvgpu_engine_mem_queue **queue_p,
struct nvgpu_engine_mem_queue_params params)
{
struct nvgpu_engine_mem_queue *queue = NULL;
struct gk20a *g = params.g;
int err = 0;
if (queue_p == NULL) {
return -EINVAL;
}
queue = (struct nvgpu_engine_mem_queue *)
nvgpu_kmalloc(g, sizeof(struct nvgpu_engine_mem_queue));
if (queue == NULL) {
return -ENOMEM;
}
queue->g = params.g;
queue->flcn_id = params.flcn_id;
queue->id = params.id;
queue->index = params.index;
queue->offset = params.offset;
queue->position = params.position;
queue->size = params.size;
queue->oflag = params.oflag;
queue->queue_type = params.queue_type;
queue->head = params.queue_head;
queue->tail = params.queue_tail;
nvgpu_log_info(g,
"flcn id-%d q-id %d: index %d, offset 0x%08x, size 0x%08x",
queue->flcn_id, queue->id, queue->index,
queue->offset, queue->size);
switch (queue->queue_type) {
case QUEUE_TYPE_DMEM:
engine_dmem_queue_init(queue);
break;
#ifdef CONFIG_NVGPU_DGPU
case QUEUE_TYPE_EMEM:
engine_emem_queue_init(queue);
break;
#endif
default:
err = -EINVAL;
break;
}
if (err != 0) {
nvgpu_err(g, "flcn-%d queue-%d, init failed",
queue->flcn_id, queue->id);
nvgpu_kfree(g, queue);
goto exit;
}
/* init mutex */
nvgpu_mutex_init(&queue->mutex);
*queue_p = queue;
exit:
return err;
}
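
As a usage sketch (not taken from this change): the fragment below shows how a caller could wire up a small DMEM command queue and push one command through the API above. All numeric values are hypothetical, and the head/tail accessors are passed in as parameters because the real ones are engine-specific HALs filled in by the PMU/SEC2 setup paths.

static int example_setup_and_push(struct gk20a *g, struct nvgpu_falcon *flcn,
    struct pmu_cmd *cmd,
    int (*head_op)(struct gk20a *g, u32 queue_id, u32 queue_index,
        u32 *head, bool set),
    int (*tail_op)(struct gk20a *g, u32 queue_id, u32 queue_index,
        u32 *tail, bool set))
{
    struct nvgpu_engine_mem_queue *queue = NULL;
    struct nvgpu_engine_mem_queue_params params = {
        .g = g,
        .flcn_id = FALCON_ID_PMU,
        .id = 0U,            /* logical queue id */
        .index = 0U,         /* physical queue index */
        .offset = 0x800U,    /* hypothetical DMEM offset */
        .position = 0x800U,
        .size = 0x100U,      /* hypothetical size in bytes */
        .oflag = OFLAG_WRITE,
        .queue_type = QUEUE_TYPE_DMEM,
        .queue_head = head_op,   /* engine HALs in real callers */
        .queue_tail = tail_op,
    };
    int err;

    err = nvgpu_engine_mem_queue_init(&queue, params);
    if (err != 0) {
        return err;
    }

    /* The queue handles head/tail updates and rewinds internally. */
    err = nvgpu_engine_mem_queue_push(flcn, queue, cmd, U32(cmd->hdr.size));

    nvgpu_engine_mem_queue_free(&queue);
    return err;
}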

View File

@@ -0,0 +1,70 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_ENGINE_MEM_QUEUE_PRIV_H
#define NVGPU_ENGINE_MEM_QUEUE_PRIV_H
#include <nvgpu/lock.h>
#include <nvgpu/types.h>
struct gk20a;
struct nvgpu_falcon;
struct nvgpu_engine_mem_queue {
struct gk20a *g;
u32 flcn_id;
/* Queue Type (queue_type) */
u8 queue_type;
/* used by nvgpu, for command LPQ/HPQ */
struct nvgpu_mutex mutex;
/* current write position */
u32 position;
/* physical dmem offset where this queue begins */
u32 offset;
/* logical queue identifier */
u32 id;
/* physical queue index */
u32 index;
/* in bytes */
u32 size;
/* open-flag */
u32 oflag;
/* queue type(DMEM-Q/EMEM-Q) specific ops */
int (*push)(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue,
u32 dst, void *data, u32 size);
int (*pop)(struct nvgpu_falcon *flcn,
struct nvgpu_engine_mem_queue *queue,
u32 src, void *data, u32 size);
/* engine specific ops */
int (*head)(struct gk20a *g, u32 queue_id, u32 queue_index,
u32 *head, bool set);
int (*tail)(struct gk20a *g, u32 queue_id, u32 queue_index,
u32 *tail, bool set);
};
#endif /* NVGPU_ENGINE_MEM_QUEUE_PRIV_H */

View File

@@ -0,0 +1,825 @@
/*
* Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/timers.h>
#include <nvgpu/falcon.h>
#include <nvgpu/io.h>
#include <nvgpu/static_analysis.h>
#include "falcon_sw_gk20a.h"
#ifdef CONFIG_NVGPU_DGPU
#include "falcon_sw_tu104.h"
#endif
#if defined(CONFIG_NVGPU_NEXT) && defined(CONFIG_NVGPU_NON_FUSA)
#include "nvgpu_next_gpuid.h"
#endif
static bool is_falcon_valid(struct nvgpu_falcon *flcn)
{
if (flcn == NULL) {
return false;
}
if (!flcn->is_falcon_supported) {
nvgpu_err(flcn->g, "Falcon %d not supported", flcn->flcn_id);
return false;
}
return true;
}
u32 nvgpu_falcon_readl(struct nvgpu_falcon *flcn, u32 offset)
{
return nvgpu_readl(flcn->g,
nvgpu_safe_add_u32(flcn->flcn_base, offset));
}
void nvgpu_falcon_writel(struct nvgpu_falcon *flcn,
u32 offset, u32 val)
{
nvgpu_writel(flcn->g, nvgpu_safe_add_u32(flcn->flcn_base, offset), val);
}
int nvgpu_falcon_reset(struct nvgpu_falcon *flcn)
{
struct gk20a *g;
int status = 0;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
if (flcn->flcn_engine_dep_ops.reset_eng != NULL) {
/* falcon & engine reset */
status = flcn->flcn_engine_dep_ops.reset_eng(g);
} else {
g->ops.falcon.reset(flcn);
}
if (status == 0) {
status = nvgpu_falcon_mem_scrub_wait(flcn);
}
return status;
}
int nvgpu_falcon_wait_for_halt(struct nvgpu_falcon *flcn, unsigned int timeout)
{
struct nvgpu_timeout to;
struct gk20a *g;
int status;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
status = nvgpu_timeout_init(g, &to, timeout, NVGPU_TIMER_CPU_TIMER);
if (status != 0) {
return status;
}
do {
if (g->ops.falcon.is_falcon_cpu_halted(flcn)) {
break;
}
nvgpu_udelay(10);
} while (nvgpu_timeout_expired(&to) == 0);
if (nvgpu_timeout_peek_expired(&to)) {
status = -ETIMEDOUT;
}
return status;
}
int nvgpu_falcon_wait_idle(struct nvgpu_falcon *flcn)
{
struct nvgpu_timeout timeout;
struct gk20a *g;
int status;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
status = nvgpu_timeout_init(g, &timeout, 2000, NVGPU_TIMER_RETRY_TIMER);
if (status != 0) {
return status;
}
/* wait for falcon idle */
do {
if (g->ops.falcon.is_falcon_idle(flcn)) {
break;
}
if (nvgpu_timeout_expired_msg(&timeout,
"waiting for falcon idle") != 0) {
return -ETIMEDOUT;
}
nvgpu_usleep_range(100, 200);
} while (true);
return 0;
}
int nvgpu_falcon_mem_scrub_wait(struct nvgpu_falcon *flcn)
{
struct nvgpu_timeout timeout;
/**
* Delay depends on memory size and pwr_clk
* delay = (MAX {IMEM_SIZE, DMEM_SIZE} * 64 + 1) / pwr_clk
* The timeout is set to 1 ms and the status is checked at 10 us intervals.
*/
const u32 mem_scrubbing_max_timeout = 1000U;
const u32 mem_scrubbing_default_timeout = 10U;
struct gk20a *g;
int status;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
/* check IMEM/DMEM scrubbing complete status */
status = nvgpu_timeout_init(g, &timeout,
mem_scrubbing_max_timeout /
mem_scrubbing_default_timeout,
NVGPU_TIMER_RETRY_TIMER);
if (status != 0) {
return status;
}
do {
if (g->ops.falcon.is_falcon_scrubbing_done(flcn)) {
break;
}
nvgpu_udelay(mem_scrubbing_default_timeout);
} while (nvgpu_timeout_expired(&timeout) == 0);
if (nvgpu_timeout_peek_expired(&timeout)) {
status = -ETIMEDOUT;
}
return status;
}
static int falcon_memcpy_params_check(struct nvgpu_falcon *flcn,
u32 offset, u32 size, enum falcon_mem_type mem_type, u8 port)
{
struct gk20a *g = flcn->g;
u32 mem_size = 0;
int ret = -EINVAL;
if (size == 0U) {
nvgpu_err(g, "size is zero");
goto exit;
}
if ((offset & 0x3U) != 0U) {
nvgpu_err(g, "offset (0x%08x) not 4-byte aligned", offset);
goto exit;
}
if (port >= g->ops.falcon.get_ports_count(flcn, mem_type)) {
nvgpu_err(g, "invalid port %u", (u32) port);
goto exit;
}
mem_size = g->ops.falcon.get_mem_size(flcn, mem_type);
if (!((offset < mem_size) && ((offset + size) <= mem_size))) {
nvgpu_err(g, "flcn-id 0x%x, copy overflow ",
flcn->flcn_id);
nvgpu_err(g, "total size 0x%x, offset 0x%x, copy size 0x%x",
mem_size, offset, size);
ret = -EINVAL;
goto exit;
}
ret = 0;
exit:
return ret;
}
int nvgpu_falcon_copy_to_dmem(struct nvgpu_falcon *flcn,
u32 dst, u8 *src, u32 size, u8 port)
{
int status = -EINVAL;
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
if (falcon_memcpy_params_check(flcn, dst, size, MEM_DMEM, port) != 0) {
nvgpu_err(g, "incorrect parameters");
goto exit;
}
nvgpu_mutex_acquire(&flcn->dmem_lock);
status = g->ops.falcon.copy_to_dmem(flcn, dst, src, size, port);
nvgpu_mutex_release(&flcn->dmem_lock);
exit:
return status;
}
int nvgpu_falcon_copy_to_imem(struct nvgpu_falcon *flcn,
u32 dst, u8 *src, u32 size, u8 port, bool sec, u32 tag)
{
int status = -EINVAL;
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
if (falcon_memcpy_params_check(flcn, dst, size, MEM_IMEM, port) != 0) {
nvgpu_err(g, "incorrect parameters");
goto exit;
}
nvgpu_mutex_acquire(&flcn->imem_lock);
status = g->ops.falcon.copy_to_imem(flcn, dst, src,
size, port, sec, tag);
nvgpu_mutex_release(&flcn->imem_lock);
exit:
return status;
}
u32 nvgpu_falcon_mailbox_read(struct nvgpu_falcon *flcn, u32 mailbox_index)
{
struct gk20a *g;
u32 data = 0;
if (!is_falcon_valid(flcn)) {
return 0;
}
g = flcn->g;
if (mailbox_index >= FALCON_MAILBOX_COUNT) {
nvgpu_err(g, "incorrect mailbox id %d", mailbox_index);
goto exit;
}
data = g->ops.falcon.mailbox_read(flcn, mailbox_index);
exit:
return data;
}
void nvgpu_falcon_mailbox_write(struct nvgpu_falcon *flcn, u32 mailbox_index,
u32 data)
{
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return;
}
g = flcn->g;
if (mailbox_index >= FALCON_MAILBOX_COUNT) {
nvgpu_err(g, "incorrect mailbox id %d", mailbox_index);
goto exit;
}
g->ops.falcon.mailbox_write(flcn, mailbox_index, data);
exit:
return;
}
int nvgpu_falcon_hs_ucode_load_bootstrap(struct nvgpu_falcon *flcn, u32 *ucode,
u32 *ucode_header)
{
struct gk20a *g;
u32 sec_imem_dest = 0U;
int err = 0;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
/* falcon reset */
err = nvgpu_falcon_reset(flcn);
if (err != 0) {
nvgpu_err(g, "nvgpu_falcon_reset() failed err=%d", err);
return err;
}
/* setup falcon apertures, boot-config */
if (flcn->flcn_engine_dep_ops.setup_bootstrap_config != NULL) {
flcn->flcn_engine_dep_ops.setup_bootstrap_config(flcn->g);
}
/* Copy Non Secure IMEM code */
err = nvgpu_falcon_copy_to_imem(flcn, 0U,
(u8 *)&ucode[ucode_header[OS_CODE_OFFSET] >> 2U],
ucode_header[OS_CODE_SIZE], 0U, false,
GET_IMEM_TAG(ucode_header[OS_CODE_OFFSET]));
if (err != 0) {
nvgpu_err(g, "HS ucode non-secure code to IMEM failed");
goto exit;
}
/* Put secure code after non-secure block */
sec_imem_dest = GET_NEXT_BLOCK(ucode_header[OS_CODE_SIZE]);
err = nvgpu_falcon_copy_to_imem(flcn, sec_imem_dest,
(u8 *)&ucode[ucode_header[APP_0_CODE_OFFSET] >> 2U],
ucode_header[APP_0_CODE_SIZE], 0U, true,
GET_IMEM_TAG(ucode_header[APP_0_CODE_OFFSET]));
if (err != 0) {
nvgpu_err(g, "HS ucode secure code to IMEM failed");
goto exit;
}
/* load DMEM: ensure that signatures are patched */
err = nvgpu_falcon_copy_to_dmem(flcn, 0U, (u8 *)&ucode[
ucode_header[OS_DATA_OFFSET] >> 2U],
ucode_header[OS_DATA_SIZE], 0U);
if (err != 0) {
nvgpu_err(g, "HS ucode data copy to DMEM failed");
goto exit;
}
/*
* Write non-zero value to mailbox register which is updated by
* HS bin to denote its return status.
*/
nvgpu_falcon_mailbox_write(flcn, FALCON_MAILBOX_0, 0xdeadbeefU);
/* set BOOTVEC to start of non-secure code */
g->ops.falcon.bootstrap(flcn, 0U);
exit:
return err;
}
u32 nvgpu_falcon_get_id(struct nvgpu_falcon *flcn)
{
return flcn->flcn_id;
}
#if defined(CONFIG_NVGPU_NEXT)
bool nvgpu_falcon_is_falcon2_enabled(struct nvgpu_falcon *flcn)
{
return flcn->is_falcon2_enabled ? true : false;
}
bool nvgpu_falcon_is_feature_supported(struct nvgpu_falcon *flcn,
u32 feature)
{
return nvgpu_test_bit(feature, (void *)&flcn->fuse_settings);
}
#endif
struct nvgpu_falcon *nvgpu_falcon_get_instance(struct gk20a *g, u32 flcn_id)
{
struct nvgpu_falcon *flcn = NULL;
switch (flcn_id) {
case FALCON_ID_PMU:
flcn = &g->pmu_flcn;
break;
case FALCON_ID_FECS:
flcn = &g->fecs_flcn;
break;
case FALCON_ID_GPCCS:
flcn = &g->gpccs_flcn;
break;
case FALCON_ID_GSPLITE:
flcn = &g->gsp_flcn;
break;
case FALCON_ID_NVDEC:
flcn = &g->nvdec_flcn;
break;
case FALCON_ID_SEC2:
flcn = &g->sec2.flcn;
break;
case FALCON_ID_MINION:
flcn = &g->minion_flcn;
break;
default:
nvgpu_err(g, "Invalid/Unsupported falcon ID %x", flcn_id);
break;
};
return flcn;
}
static int falcon_sw_chip_init(struct gk20a *g, struct nvgpu_falcon *flcn)
{
u32 ver = nvgpu_safe_add_u32(g->params.gpu_arch, g->params.gpu_impl);
int err = 0;
switch (ver) {
#ifdef CONFIG_NVGPU_NON_FUSA
case GK20A_GPUID_GM20B:
case GK20A_GPUID_GM20B_B:
gk20a_falcon_sw_init(flcn);
break;
case NVGPU_GPUID_GP10B:
gk20a_falcon_sw_init(flcn);
break;
#if defined(CONFIG_NVGPU_NEXT)
case NVGPU_NEXT_GPUID:
nvgpu_next_falcon_sw_init(flcn);
break;
#endif
#endif
case NVGPU_GPUID_GV11B:
gk20a_falcon_sw_init(flcn);
break;
#ifdef CONFIG_NVGPU_DGPU
case NVGPU_GPUID_TU104:
#if defined(CONFIG_NVGPU_NEXT)
case NVGPU_NEXT_DGPU_GPUID:
#endif
tu104_falcon_sw_init(flcn);
break;
#endif
default:
err = -EINVAL;
nvgpu_err(g, "no support for GPUID %x", ver);
break;
}
return err;
}
int nvgpu_falcon_sw_init(struct gk20a *g, u32 flcn_id)
{
struct nvgpu_falcon *flcn = NULL;
int err = 0;
flcn = nvgpu_falcon_get_instance(g, flcn_id);
if (flcn == NULL) {
return -ENODEV;
}
flcn->flcn_id = flcn_id;
flcn->g = g;
/* call SW init methods to assign flcn base & support of a falcon */
err = falcon_sw_chip_init(g, flcn);
if (err != 0) {
nvgpu_err(g, "Chip specific falcon sw init failed %d", err);
return err;
}
nvgpu_mutex_init(&flcn->imem_lock);
nvgpu_mutex_init(&flcn->dmem_lock);
#ifdef CONFIG_NVGPU_DGPU
if (flcn->emem_supported) {
nvgpu_mutex_init(&flcn->emem_lock);
}
#endif
return 0;
}
void nvgpu_falcon_sw_free(struct gk20a *g, u32 flcn_id)
{
struct nvgpu_falcon *flcn = NULL;
flcn = nvgpu_falcon_get_instance(g, flcn_id);
if (flcn == NULL) {
return;
}
if (flcn->is_falcon_supported) {
flcn->is_falcon_supported = false;
} else {
nvgpu_log_info(g, "falcon 0x%x not supported on %s",
flcn->flcn_id, g->name);
return;
}
#ifdef CONFIG_NVGPU_DGPU
if (flcn->emem_supported) {
nvgpu_mutex_destroy(&flcn->emem_lock);
}
#endif
nvgpu_mutex_destroy(&flcn->dmem_lock);
nvgpu_mutex_destroy(&flcn->imem_lock);
}
void nvgpu_falcon_set_irq(struct nvgpu_falcon *flcn, bool enable,
u32 intr_mask, u32 intr_dest)
{
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return;
}
g = flcn->g;
if (!flcn->is_interrupt_enabled) {
nvgpu_warn(g, "Interrupt not supported on flcn 0x%x ",
flcn->flcn_id);
return;
}
g->ops.falcon.set_irq(flcn, enable, intr_mask, intr_dest);
}
#ifdef CONFIG_NVGPU_DGPU
int nvgpu_falcon_copy_from_emem(struct nvgpu_falcon *flcn,
u32 src, u8 *dst, u32 size, u8 port)
{
struct nvgpu_falcon_engine_dependency_ops *flcn_dops;
int status = -EINVAL;
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
flcn_dops = &flcn->flcn_engine_dep_ops;
if (flcn_dops->copy_from_emem != NULL) {
nvgpu_mutex_acquire(&flcn->emem_lock);
status = flcn_dops->copy_from_emem(g, src, dst, size, port);
nvgpu_mutex_release(&flcn->emem_lock);
} else {
nvgpu_warn(g, "Invalid op on falcon 0x%x ",
flcn->flcn_id);
goto exit;
}
exit:
return status;
}
int nvgpu_falcon_copy_to_emem(struct nvgpu_falcon *flcn,
u32 dst, u8 *src, u32 size, u8 port)
{
struct nvgpu_falcon_engine_dependency_ops *flcn_dops;
int status = -EINVAL;
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
flcn_dops = &flcn->flcn_engine_dep_ops;
if (flcn_dops->copy_to_emem != NULL) {
nvgpu_mutex_acquire(&flcn->emem_lock);
status = flcn_dops->copy_to_emem(g, dst, src, size, port);
nvgpu_mutex_release(&flcn->emem_lock);
} else {
nvgpu_warn(g, "Invalid op on falcon 0x%x ",
flcn->flcn_id);
goto exit;
}
exit:
return status;
}
#endif
#ifdef CONFIG_NVGPU_FALCON_DEBUG
void nvgpu_falcon_dump_stats(struct nvgpu_falcon *flcn)
{
if (!is_falcon_valid(flcn)) {
return;
}
flcn->g->ops.falcon.dump_falcon_stats(flcn);
}
#endif
#ifdef CONFIG_NVGPU_FALCON_NON_FUSA
int nvgpu_falcon_bootstrap(struct nvgpu_falcon *flcn, u32 boot_vector)
{
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
flcn->g->ops.falcon.bootstrap(flcn, boot_vector);
return 0;
}
int nvgpu_falcon_get_mem_size(struct nvgpu_falcon *flcn,
enum falcon_mem_type type, u32 *size)
{
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
*size = flcn->g->ops.falcon.get_mem_size(flcn, type);
return 0;
}
int nvgpu_falcon_clear_halt_intr_status(struct nvgpu_falcon *flcn,
unsigned int timeout)
{
struct nvgpu_timeout to;
struct gk20a *g;
int status;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
status = nvgpu_timeout_init(g, &to, timeout, NVGPU_TIMER_CPU_TIMER);
if (status != 0) {
return status;
}
do {
if (g->ops.falcon.clear_halt_interrupt_status(flcn)) {
break;
}
nvgpu_udelay(1);
} while (nvgpu_timeout_expired(&to) == 0);
if (nvgpu_timeout_peek_expired(&to)) {
status = -ETIMEDOUT;
}
return status;
}
int nvgpu_falcon_copy_from_dmem(struct nvgpu_falcon *flcn,
u32 src, u8 *dst, u32 size, u8 port)
{
int status = -EINVAL;
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
if (falcon_memcpy_params_check(flcn, src, size, MEM_DMEM, port) != 0) {
nvgpu_err(g, "incorrect parameters");
goto exit;
}
nvgpu_mutex_acquire(&flcn->dmem_lock);
status = g->ops.falcon.copy_from_dmem(flcn, src, dst, size, port);
nvgpu_mutex_release(&flcn->dmem_lock);
exit:
return status;
}
int nvgpu_falcon_copy_from_imem(struct nvgpu_falcon *flcn,
u32 src, u8 *dst, u32 size, u8 port)
{
int status = -EINVAL;
struct gk20a *g;
if (!is_falcon_valid(flcn)) {
return -EINVAL;
}
g = flcn->g;
if (falcon_memcpy_params_check(flcn, src, size, MEM_IMEM, port) != 0) {
nvgpu_err(g, "incorrect parameters");
goto exit;
}
nvgpu_mutex_acquire(&flcn->imem_lock);
status = g->ops.falcon.copy_from_imem(flcn, src, dst, size, port);
nvgpu_mutex_release(&flcn->imem_lock);
exit:
return status;
}
static void falcon_print_mem(struct nvgpu_falcon *flcn, u32 src,
u32 size, enum falcon_mem_type mem_type)
{
u32 buff[64] = {0};
u32 total_block_read = 0;
u32 byte_read_count = 0;
struct gk20a *g;
u32 i = 0;
int status = 0;
g = flcn->g;
if (falcon_memcpy_params_check(flcn, src, size, mem_type, 0) != 0) {
nvgpu_err(g, "incorrect parameters");
return;
}
nvgpu_info(g, " offset 0x%x size %d bytes", src, size);
total_block_read = size >> 8;
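/*
 * Read in 256-byte chunks (sizeof(buff)); any final partial chunk is
 * picked up when total_block_read reaches zero below.
 */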
do {
byte_read_count =
(total_block_read != 0U) ? (u32)sizeof(buff) : size;
if (byte_read_count == 0U) {
break;
}
if (mem_type == MEM_DMEM) {
status = nvgpu_falcon_copy_from_dmem(flcn, src,
(u8 *)buff, byte_read_count, 0);
} else {
status = nvgpu_falcon_copy_from_imem(flcn, src,
(u8 *)buff, byte_read_count, 0);
}
if (status != 0) {
nvgpu_err(g, "MEM print failed");
break;
}
for (i = 0U; i < (byte_read_count >> 2U); i += 4U) {
nvgpu_info(g, "0x%04x: 0x%08x 0x%08x 0x%08x 0x%08x",
src + (i << 2U), buff[i], buff[i+1U],
buff[i+2U], buff[i+3U]);
}
src += byte_read_count;
size -= byte_read_count;
} while (total_block_read-- != 0U);
}
void nvgpu_falcon_print_dmem(struct nvgpu_falcon *flcn, u32 src, u32 size)
{
if (!is_falcon_valid(flcn)) {
return;
}
nvgpu_info(flcn->g, " PRINT DMEM ");
falcon_print_mem(flcn, src, size, MEM_DMEM);
}
void nvgpu_falcon_print_imem(struct nvgpu_falcon *flcn, u32 src, u32 size)
{
if (!is_falcon_valid(flcn)) {
return;
}
nvgpu_info(flcn->g, " PRINT IMEM ");
falcon_print_mem(flcn, src, size, MEM_IMEM);
}
void nvgpu_falcon_get_ctls(struct nvgpu_falcon *flcn, u32 *sctl, u32 *cpuctl)
{
if (!is_falcon_valid(flcn)) {
return;
}
flcn->g->ops.falcon.get_falcon_ctls(flcn, sctl, cpuctl);
}
#endif
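
For orientation only, a hedged sketch of how the HS-ucode path above is typically driven once the ucode image and header have been prepared elsewhere; the timeout value is arbitrary, and the 0xdeadbeef comparison simply mirrors the sentinel written by nvgpu_falcon_hs_ucode_load_bootstrap() before the HS binary overwrites it with its return status.

static int example_run_hs_ucode(struct nvgpu_falcon *flcn,
    u32 *ucode, u32 *ucode_header)
{
    int err;

    err = nvgpu_falcon_hs_ucode_load_bootstrap(flcn, ucode, ucode_header);
    if (err != 0) {
        return err;
    }

    /* Wait for the HS binary to halt (timeout value is illustrative). */
    err = nvgpu_falcon_wait_for_halt(flcn, 100U);
    if (err != 0) {
        return err;
    }

    /* MAILBOX_0 still holding the sentinel means no status was reported. */
    if (nvgpu_falcon_mailbox_read(flcn, FALCON_MAILBOX_0) == 0xdeadbeefU) {
        return -EIO;
    }

    return 0;
}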

View File

@@ -0,0 +1,80 @@
/*
* Copyright (c) 2017-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/falcon.h>
#include "falcon_sw_gk20a.h"
void gk20a_falcon_engine_dependency_ops(struct nvgpu_falcon *flcn)
{
struct gk20a *g = flcn->g;
struct nvgpu_falcon_engine_dependency_ops *flcn_eng_dep_ops =
&flcn->flcn_engine_dep_ops;
switch (flcn->flcn_id) {
case FALCON_ID_PMU:
flcn_eng_dep_ops->reset_eng = g->ops.pmu.pmu_reset;
flcn_eng_dep_ops->setup_bootstrap_config =
g->ops.pmu.flcn_setup_boot_config;
break;
default:
/* A NULL assignment makes sure the CPU hard reset in
 * gk20a_falcon_reset() gets executed if the falcon doesn't need a
 * specific reset implementation.
 */
flcn_eng_dep_ops->reset_eng = NULL;
break;
}
}
void gk20a_falcon_sw_init(struct nvgpu_falcon *flcn)
{
struct gk20a *g = flcn->g;
switch (flcn->flcn_id) {
case FALCON_ID_PMU:
flcn->flcn_base = g->ops.pmu.falcon_base_addr();
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = true;
break;
case FALCON_ID_FECS:
flcn->flcn_base = g->ops.gr.falcon.fecs_base_addr();
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = false;
break;
case FALCON_ID_GPCCS:
flcn->flcn_base = g->ops.gr.falcon.gpccs_base_addr();
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = false;
break;
default:
flcn->is_falcon_supported = false;
break;
}
if (flcn->is_falcon_supported) {
gk20a_falcon_engine_dependency_ops(flcn);
} else {
nvgpu_log_info(g, "falcon 0x%x not supported on %s",
flcn->flcn_id, g->name);
}
}

View File

@@ -0,0 +1,28 @@
/*
* Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_FALCON_SW_GK20A_H
#define NVGPU_FALCON_SW_GK20A_H
void gk20a_falcon_engine_dependency_ops(struct nvgpu_falcon *flcn);
void gk20a_falcon_sw_init(struct nvgpu_falcon *flcn);
#endif /* NVGPU_FALCON_SW_GK20A_H */

View File

@@ -0,0 +1,102 @@
/*
* Copyright (c) 2018-2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/falcon.h>
#include "falcon_sw_gk20a.h"
#include "falcon_sw_tu104.h"
void tu104_falcon_engine_dependency_ops(struct nvgpu_falcon *flcn)
{
struct nvgpu_falcon_engine_dependency_ops *flcn_eng_dep_ops =
&flcn->flcn_engine_dep_ops;
struct gk20a *g = flcn->g;
gk20a_falcon_engine_dependency_ops(flcn);
switch (flcn->flcn_id) {
case FALCON_ID_GSPLITE:
flcn_eng_dep_ops->reset_eng = g->ops.gsp.gsp_reset;
flcn_eng_dep_ops->setup_bootstrap_config =
g->ops.gsp.falcon_setup_boot_config;
break;
case FALCON_ID_SEC2:
flcn_eng_dep_ops->reset_eng = g->ops.sec2.sec2_reset;
flcn_eng_dep_ops->setup_bootstrap_config =
g->ops.sec2.flcn_setup_boot_config;
flcn_eng_dep_ops->copy_to_emem = g->ops.sec2.sec2_copy_to_emem;
flcn_eng_dep_ops->copy_from_emem =
g->ops.sec2.sec2_copy_from_emem;
break;
default:
flcn_eng_dep_ops->reset_eng = NULL;
break;
}
}
void tu104_falcon_sw_init(struct nvgpu_falcon *flcn)
{
struct gk20a *g = flcn->g;
switch (flcn->flcn_id) {
case FALCON_ID_GSPLITE:
flcn->flcn_base = g->ops.gsp.falcon_base_addr();
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = false;
break;
case FALCON_ID_SEC2:
flcn->flcn_base = g->ops.sec2.falcon_base_addr();
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = true;
flcn->emem_supported = true;
break;
case FALCON_ID_MINION:
flcn->flcn_base = g->ops.nvlink.minion.base_addr(g);
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = true;
break;
case FALCON_ID_NVDEC:
flcn->flcn_base = g->ops.nvdec.falcon_base_addr();
flcn->is_falcon_supported = true;
flcn->is_interrupt_enabled = true;
break;
default:
/*
* Set false so that falcon support is inherited
* from the previous chip's HAL.
*/
flcn->is_falcon_supported = false;
break;
}
if (flcn->is_falcon_supported) {
tu104_falcon_engine_dependency_ops(flcn);
} else {
/*
 * Forward the call to the previous chip's SW init to fetch info
 * for the requested falcon, as there are no changes between the
 * current and previous chips.
 */
gk20a_falcon_sw_init(flcn);
}
}

View File

@@ -0,0 +1,29 @@
/*
* Copyright (c) 2018, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_FALCON_SW_TU104_H
#define NVGPU_FALCON_SW_TU104_H
void tu104_falcon_engine_dependency_ops(struct nvgpu_falcon *flcn);
void tu104_falcon_sw_init(struct nvgpu_falcon *flcn);
#endif /* NVGPU_FALCON_SW_TU104_H */

View File

@@ -0,0 +1,41 @@
/*
* Copyright (c) 2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/power_features/cg.h>
#include <nvgpu/fb.h>
int nvgpu_init_fb_support(struct gk20a *g)
{
if (g->ops.mc.fb_reset != NULL) {
g->ops.mc.fb_reset(g);
}
nvgpu_cg_slcg_fb_ltc_load_enable(g);
nvgpu_cg_blcg_fb_ltc_load_enable(g);
if (g->ops.fb.init_fs_state != NULL) {
g->ops.fb.init_fs_state(g);
}
return 0;
}

View File

@@ -0,0 +1,130 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/kmem.h>
#include <nvgpu/log.h>
#include <nvgpu/fbp.h>
#include <nvgpu/static_analysis.h>
#include "fbp_priv.h"
int nvgpu_fbp_init_support(struct gk20a *g)
{
struct nvgpu_fbp *fbp;
u32 fbp_en_mask;
#ifdef CONFIG_NVGPU_NON_FUSA
u32 max_ltc_per_fbp;
u32 rop_l2_all_en;
unsigned long i;
unsigned long fbp_en_mask_tmp;
u32 tmp;
#endif
if (g->fbp != NULL) {
return 0;
}
fbp = nvgpu_kzalloc(g, sizeof(*fbp));
if (fbp == NULL) {
return -ENOMEM;
}
#ifdef CONFIG_NVGPU_NON_FUSA
fbp->num_fbps = g->ops.priv_ring.get_fbp_count(g);
nvgpu_log_info(g, "fbps: %d", fbp->num_fbps);
#endif
fbp->max_fbps_count = g->ops.top.get_max_fbps_count(g);
nvgpu_log_info(g, "max_fbps_count: %d", fbp->max_fbps_count);
/*
* Read active fbp mask from fuse
* Note that 0 means enable and 1 means disable in the value read from fuse, so we have to
* flip the bits.
* Also set unused bits to zero
*/
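/*
 * Worked example with hypothetical values: max_fbps_count = 4 and a fuse
 * reading of 0b0010 (FBP1 disabled) give
 * fbp_en_mask = ~0b0010 & (BIT32(4) - 1U) = 0b1101, i.e. FBP0, FBP2 and
 * FBP3 active.
 */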
fbp_en_mask = g->ops.fuse.fuse_status_opt_fbp(g);
fbp_en_mask = ~fbp_en_mask;
fbp_en_mask = fbp_en_mask &
nvgpu_safe_sub_u32(BIT32(fbp->max_fbps_count), 1U);
fbp->fbp_en_mask = fbp_en_mask;
#ifdef CONFIG_NVGPU_NON_FUSA
fbp->fbp_rop_l2_en_mask =
nvgpu_kzalloc(g,
nvgpu_safe_mult_u64(fbp->max_fbps_count, sizeof(u32)));
if (fbp->fbp_rop_l2_en_mask == NULL) {
nvgpu_kfree(g, fbp);
return -ENOMEM;
}
fbp_en_mask_tmp = fbp_en_mask;
max_ltc_per_fbp = g->ops.top.get_max_ltc_per_fbp(g);
rop_l2_all_en = nvgpu_safe_sub_u32(BIT32(max_ltc_per_fbp), 1U);
/* mask of Rop_L2 for each FBP */
for_each_set_bit(i, &fbp_en_mask_tmp, fbp->max_fbps_count) {
tmp = g->ops.fuse.fuse_status_opt_rop_l2_fbp(g, i);
fbp->fbp_rop_l2_en_mask[i] = rop_l2_all_en ^ tmp;
}
#endif
g->fbp = fbp;
return 0;
}
void nvgpu_fbp_remove_support(struct gk20a *g)
{
struct nvgpu_fbp *fbp = g->fbp;
if (fbp != NULL) {
nvgpu_kfree(g, fbp->fbp_rop_l2_en_mask);
nvgpu_kfree(g, fbp);
}
g->fbp = NULL;
}
u32 nvgpu_fbp_get_max_fbps_count(struct nvgpu_fbp *fbp)
{
return fbp->max_fbps_count;
}
u32 nvgpu_fbp_get_fbp_en_mask(struct nvgpu_fbp *fbp)
{
return fbp->fbp_en_mask;
}
#ifdef CONFIG_NVGPU_NON_FUSA
u32 nvgpu_fbp_get_num_fbps(struct nvgpu_fbp *fbp)
{
return fbp->num_fbps;
}
u32 *nvgpu_fbp_get_rop_l2_en_mask(struct nvgpu_fbp *fbp)
{
return fbp->fbp_rop_l2_en_mask;
}
#endif

View File

@@ -0,0 +1,33 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_FBP_PRIV_H
#define NVGPU_FBP_PRIV_H
struct nvgpu_fbp {
u32 num_fbps;
u32 max_fbps_count;
u32 fbp_en_mask;
u32 *fbp_rop_l2_en_mask;
};
#endif /* NVGPU_FBP_PRIV_H */

View File

@@ -0,0 +1,120 @@
/*
* Copyright (c) 2014-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/soc.h>
#include <nvgpu/os_fence.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/fence.h>
#include <nvgpu/user_fence.h>
#include "fence_priv.h"
static struct nvgpu_fence_type *nvgpu_fence_from_ref(struct nvgpu_ref *ref)
{
return (struct nvgpu_fence_type *)((uintptr_t)ref -
offsetof(struct nvgpu_fence_type, priv.ref));
}
static void nvgpu_fence_release(struct nvgpu_ref *ref)
{
struct nvgpu_fence_type *f = nvgpu_fence_from_ref(ref);
struct nvgpu_fence_type_priv *pf = &f->priv;
if (nvgpu_os_fence_is_initialized(&pf->os_fence)) {
pf->os_fence.ops->drop_ref(&pf->os_fence);
}
pf->ops->release(f);
}
void nvgpu_fence_put(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
nvgpu_ref_put(&pf->ref, nvgpu_fence_release);
}
struct nvgpu_fence_type *nvgpu_fence_get(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
nvgpu_ref_get(&pf->ref);
return f;
}
/*
* Extract an object to be passed to the userspace as a result of a submitted
* job. This must be balanced with a call to nvgpu_user_fence_release().
*/
struct nvgpu_user_fence nvgpu_fence_extract_user(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
struct nvgpu_user_fence uf = (struct nvgpu_user_fence) {
#ifdef CONFIG_TEGRA_GK20A_NVHOST
.syncpt_id = pf->syncpt_id,
.syncpt_value = pf->syncpt_value,
#endif
.os_fence = pf->os_fence,
};
/*
* The os fence member has to live so it can be signaled when the job
* completes. The returned user fence may live longer than that before
* being safely attached to an fd if the job completes before a
* submission ioctl finishes, or if it's stored for cde job state
* tracking.
*/
if (nvgpu_os_fence_is_initialized(&pf->os_fence)) {
pf->os_fence.ops->dup(&pf->os_fence);
}
return uf;
}
int nvgpu_fence_wait(struct gk20a *g, struct nvgpu_fence_type *f,
u32 timeout)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
if (!nvgpu_platform_is_silicon(g)) {
timeout = U32_MAX;
}
return pf->ops->wait(f, timeout);
}
bool nvgpu_fence_is_expired(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
return pf->ops->is_expired(f);
}
void nvgpu_fence_init(struct nvgpu_fence_type *f,
const struct nvgpu_fence_ops *ops,
struct nvgpu_os_fence os_fence)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
nvgpu_ref_init(&pf->ref);
pf->ops = ops;
pf->os_fence = os_fence;
}
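
A minimal usage sketch, assuming the caller already holds a reference to a job's post fence obtained elsewhere; the timeout value is purely illustrative.

static int example_wait_and_release(struct gk20a *g, struct nvgpu_fence_type *f)
{
    int err;

    err = nvgpu_fence_wait(g, f, 3000U /* illustrative timeout */);

    /* Drop our reference regardless of the wait outcome. */
    nvgpu_fence_put(f);
    return err;
}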

View File

@@ -0,0 +1,39 @@
/*
* Copyright (c) 2014-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_FENCE_PRIV_H
#define NVGPU_FENCE_PRIV_H
#include <nvgpu/os_fence.h>
struct nvgpu_fence_type;
struct nvgpu_fence_ops {
int (*wait)(struct nvgpu_fence_type *f, u32 timeout);
bool (*is_expired)(struct nvgpu_fence_type *f);
void (*release)(struct nvgpu_fence_type *f);
};
void nvgpu_fence_init(struct nvgpu_fence_type *f,
const struct nvgpu_fence_ops *ops,
struct nvgpu_os_fence os_fence);
#endif

View File

@@ -0,0 +1,78 @@
/*
* Copyright (c) 2014-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/semaphore.h>
#include <nvgpu/cond.h>
#include <nvgpu/fence.h>
#include <nvgpu/fence_sema.h>
#include "fence_priv.h"
static int nvgpu_fence_semaphore_wait(struct nvgpu_fence_type *f, u32 timeout)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
if (!nvgpu_semaphore_is_acquired(pf->semaphore)) {
return 0;
}
return NVGPU_COND_WAIT_INTERRUPTIBLE(
pf->semaphore_wq,
!nvgpu_semaphore_is_acquired(pf->semaphore),
timeout);
}
static bool nvgpu_fence_semaphore_is_expired(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
return !nvgpu_semaphore_is_acquired(pf->semaphore);
}
static void nvgpu_fence_semaphore_release(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
if (pf->semaphore != NULL) {
nvgpu_semaphore_put(pf->semaphore);
}
}
static const struct nvgpu_fence_ops nvgpu_fence_semaphore_ops = {
.wait = nvgpu_fence_semaphore_wait,
.is_expired = nvgpu_fence_semaphore_is_expired,
.release = nvgpu_fence_semaphore_release,
};
/* This function takes ownership of the semaphore as well as the os_fence */
void nvgpu_fence_from_semaphore(
struct nvgpu_fence_type *f,
struct nvgpu_semaphore *semaphore,
struct nvgpu_cond *semaphore_wq,
struct nvgpu_os_fence os_fence)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
nvgpu_fence_init(f, &nvgpu_fence_semaphore_ops, os_fence);
pf->semaphore = semaphore;
pf->semaphore_wq = semaphore_wq;
}

View File

@@ -0,0 +1,89 @@
/*
* Copyright (c) 2014-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/nvhost.h>
#include <nvgpu/fence.h>
#include <nvgpu/fence_syncpt.h>
#include "fence_priv.h"
static int nvgpu_fence_syncpt_wait(struct nvgpu_fence_type *f, u32 timeout)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
return nvgpu_nvhost_syncpt_wait_timeout_ext(
pf->nvhost_device, pf->syncpt_id, pf->syncpt_value,
timeout, NVGPU_NVHOST_DEFAULT_WAITER);
}
static bool nvgpu_fence_syncpt_is_expired(struct nvgpu_fence_type *f)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
/*
* In cases we don't register a notifier, we can't expect the
* syncpt value to be updated. For this case, we force a read
* of the value from HW, and then check for expiration.
*/
if (!nvgpu_nvhost_syncpt_is_expired_ext(pf->nvhost_device,
pf->syncpt_id, pf->syncpt_value)) {
int err;
u32 val;
err = nvgpu_nvhost_syncpt_read_ext_check(pf->nvhost_device,
pf->syncpt_id, &val);
WARN(err != 0, "syncpt read failed??");
if (err == 0) {
return nvgpu_nvhost_syncpt_is_expired_ext(
pf->nvhost_device,
pf->syncpt_id, pf->syncpt_value);
} else {
return false;
}
}
return true;
}
static void nvgpu_fence_syncpt_release(struct nvgpu_fence_type *f)
{
}
static const struct nvgpu_fence_ops nvgpu_fence_syncpt_ops = {
.wait = nvgpu_fence_syncpt_wait,
.is_expired = nvgpu_fence_syncpt_is_expired,
.release = nvgpu_fence_syncpt_release,
};
/* This function takes the ownership of the os_fence */
void nvgpu_fence_from_syncpt(
struct nvgpu_fence_type *f,
struct nvgpu_nvhost_dev *nvhost_device,
u32 id, u32 value, struct nvgpu_os_fence os_fence)
{
struct nvgpu_fence_type_priv *pf = &f->priv;
nvgpu_fence_init(f, &nvgpu_fence_syncpt_ops, os_fence);
pf->nvhost_device = nvhost_device;
pf->syncpt_id = id;
pf->syncpt_value = value;
}

View File

File diff suppressed because it is too large

View File

@@ -0,0 +1,199 @@
/*
* Copyright (c) 2015-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include "channel_wdt.h"
#include "channel_worker.h"
#include <nvgpu/watchdog.h>
#include <nvgpu/channel.h>
#include <nvgpu/error_notifier.h>
#include <nvgpu/gk20a.h>
void nvgpu_channel_set_wdt_debug_dump(struct nvgpu_channel *ch, bool dump)
{
ch->wdt_debug_dump = dump;
}
static struct nvgpu_channel_wdt_state nvgpu_channel_collect_wdt_state(
struct nvgpu_channel *ch)
{
struct gk20a *g = ch->g;
struct nvgpu_channel_wdt_state state = { 0, 0 };
/*
* Note: just checking for nvgpu_channel_wdt_enabled() is not enough at
* the moment because system suspend puts g->regs away but doesn't stop
* the worker thread that runs the watchdog. This might need to be
* cleared up in the future.
*/
if (nvgpu_channel_wdt_running(ch->wdt)) {
/*
* Read the state only if the wdt is on to avoid unnecessary
* accesses. The kernel mem for userd may not even exist; this
* channel could be in usermode submit mode.
*/
state.gp_get = g->ops.userd.gp_get(g, ch);
state.pb_get = g->ops.userd.pb_get(g, ch);
}
return state;
}
void nvgpu_channel_launch_wdt(struct nvgpu_channel *ch)
{
struct nvgpu_channel_wdt_state state = nvgpu_channel_collect_wdt_state(ch);
/*
* FIXME: channel recovery can race the submit path and can start even
* after this, but this check is the best we can do for now.
*/
if (!nvgpu_channel_check_unserviceable(ch)) {
nvgpu_channel_wdt_start(ch->wdt, &state);
}
}
void nvgpu_channel_restart_all_wdts(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
u32 chid;
for (chid = 0; chid < f->num_channels; chid++) {
struct nvgpu_channel *ch = nvgpu_channel_from_id(g, chid);
if (ch != NULL) {
if ((ch->wdt != NULL) &&
!nvgpu_channel_check_unserviceable(ch)) {
struct nvgpu_channel_wdt_state state =
nvgpu_channel_collect_wdt_state(ch);
nvgpu_channel_wdt_rewind(ch->wdt, &state);
}
nvgpu_channel_put(ch);
}
}
}
static void nvgpu_channel_recover_from_wdt(struct nvgpu_channel *ch)
{
struct gk20a *g = ch->g;
nvgpu_log_fn(g, " ");
if (nvgpu_channel_check_unserviceable(ch)) {
/* channel is already recovered */
nvgpu_info(g, "chid: %d unserviceable but wdt was ON", ch->chid);
return;
}
nvgpu_err(g, "Job on channel %d timed out", ch->chid);
/* force reset calls gk20a_debug_dump but not this */
if (ch->wdt_debug_dump) {
gk20a_gr_debug_dump(g);
}
#ifdef CONFIG_NVGPU_CHANNEL_TSG_CONTROL
if (g->ops.tsg.force_reset(ch,
NVGPU_ERR_NOTIFIER_FIFO_ERROR_IDLE_TIMEOUT,
ch->wdt_debug_dump) != 0) {
nvgpu_err(g, "failed tsg force reset for chid: %d", ch->chid);
}
#endif
}
/*
* Test the watchdog progress. If the channel is stuck, reset it.
*
* The gpu is implicitly on at this point because the watchdog can only run on
* channels that have submitted jobs pending for cleanup.
*/
static void nvgpu_channel_check_wdt(struct nvgpu_channel *ch)
{
struct nvgpu_channel_wdt_state state = nvgpu_channel_collect_wdt_state(ch);
if (nvgpu_channel_wdt_check(ch->wdt, &state)) {
nvgpu_channel_recover_from_wdt(ch);
}
}
void nvgpu_channel_worker_poll_init(struct nvgpu_worker *worker)
{
struct nvgpu_channel_worker *ch_worker =
nvgpu_channel_worker_from_worker(worker);
int ret;
ch_worker->watchdog_interval = 100U;
ret = nvgpu_timeout_init(worker->g, &ch_worker->timeout,
ch_worker->watchdog_interval, NVGPU_TIMER_CPU_TIMER);
if (ret != 0) {
nvgpu_err(worker->g, "timeout_init failed: %d", ret);
}
}
/**
* Loop over every living channel, check timeouts and handle stuck channels.
*/
static void nvgpu_channel_poll_wdt(struct gk20a *g)
{
unsigned int chid;
for (chid = 0; chid < g->fifo.num_channels; chid++) {
struct nvgpu_channel *ch = nvgpu_channel_from_id(g, chid);
if (ch != NULL) {
if (!nvgpu_channel_check_unserviceable(ch)) {
nvgpu_channel_check_wdt(ch);
}
nvgpu_channel_put(ch);
}
}
}
void nvgpu_channel_worker_poll_wakeup_post_process_item(
struct nvgpu_worker *worker)
{
struct gk20a *g = worker->g;
struct nvgpu_channel_worker *ch_worker =
nvgpu_channel_worker_from_worker(worker);
int ret;
if (nvgpu_timeout_peek_expired(&ch_worker->timeout)) {
nvgpu_channel_poll_wdt(g);
ret = nvgpu_timeout_init(g, &ch_worker->timeout,
ch_worker->watchdog_interval,
NVGPU_TIMER_CPU_TIMER);
if (ret != 0) {
nvgpu_err(g, "timeout_init failed: %d", ret);
}
}
}
u32 nvgpu_channel_worker_poll_wakeup_condition_get_timeout(
struct nvgpu_worker *worker)
{
struct nvgpu_channel_worker *ch_worker =
nvgpu_channel_worker_from_worker(worker);
return ch_worker->watchdog_interval;
}
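
The progress comparison itself lives behind nvgpu_channel_wdt_check() and is not part of this file; the fragment below is only a sketch of the condition it evaluates on the state snapshots collected above, under the assumption that a hung channel advances neither GP_GET nor PB_GET between snapshots.

static bool example_wdt_stalled(const struct nvgpu_channel_wdt_state *saved,
    const struct nvgpu_channel_wdt_state *now)
{
    /* No progress on either pointer since the watchdog was (re)started. */
    return (saved->gp_get == now->gp_get) &&
        (saved->pb_get == now->pb_get);
}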

View File

@@ -0,0 +1,42 @@
/*
* Copyright (c) 2015-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_COMMON_FIFO_CHANNEL_WDT_H
#define NVGPU_COMMON_FIFO_CHANNEL_WDT_H
#include <nvgpu/types.h>
struct nvgpu_channel;
#ifdef CONFIG_NVGPU_CHANNEL_WDT
struct nvgpu_worker;
void nvgpu_channel_launch_wdt(struct nvgpu_channel *ch);
void nvgpu_channel_worker_poll_init(struct nvgpu_worker *worker);
void nvgpu_channel_worker_poll_wakeup_post_process_item(
struct nvgpu_worker *worker);
u32 nvgpu_channel_worker_poll_wakeup_condition_get_timeout(
struct nvgpu_worker *worker);
#else
static inline void nvgpu_channel_launch_wdt(struct nvgpu_channel *ch) {}
#endif /* CONFIG_NVGPU_CHANNEL_WDT */
#endif /* NVGPU_COMMON_FIFO_CHANNEL_WDT_H */

View File

@@ -0,0 +1,118 @@
/*
* Copyright (c) 2017-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include "channel_worker.h"
#include "channel_wdt.h"
#include <nvgpu/worker.h>
#include <nvgpu/channel.h>
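/* Recover the channel from its embedded worker_item node (open-coded container_of). */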
static inline struct nvgpu_channel *
nvgpu_channel_from_worker_item(struct nvgpu_list_node *node)
{
return (struct nvgpu_channel *)
((uintptr_t)node - offsetof(struct nvgpu_channel, worker_item));
};
static void nvgpu_channel_worker_poll_wakeup_process_item(
struct nvgpu_list_node *work_item)
{
struct nvgpu_channel *ch = nvgpu_channel_from_worker_item(work_item);
nvgpu_assert(ch != NULL);
nvgpu_log_fn(ch->g, " ");
nvgpu_channel_clean_up_jobs(ch);
/* ref taken when enqueued */
nvgpu_channel_put(ch);
}
static const struct nvgpu_worker_ops channel_worker_ops = {
#ifdef CONFIG_NVGPU_CHANNEL_WDT
.pre_process = nvgpu_channel_worker_poll_init,
.wakeup_post_process =
nvgpu_channel_worker_poll_wakeup_post_process_item,
.wakeup_timeout =
nvgpu_channel_worker_poll_wakeup_condition_get_timeout,
#endif
.wakeup_early_exit = NULL,
.wakeup_process_item =
nvgpu_channel_worker_poll_wakeup_process_item,
.wakeup_condition = NULL,
};
/**
* Initialize the channel worker's metadata and start the background thread.
*/
int nvgpu_channel_worker_init(struct gk20a *g)
{
struct nvgpu_worker *worker = &g->channel_worker.worker;
nvgpu_worker_init_name(worker, "nvgpu_channel_poll", g->name);
return nvgpu_worker_init(g, worker, &channel_worker_ops);
}
void nvgpu_channel_worker_deinit(struct gk20a *g)
{
struct nvgpu_worker *worker = &g->channel_worker.worker;
nvgpu_worker_deinit(worker);
}
/**
* Append a channel to the worker's list, if not there already.
*
* The worker thread processes work items (channels in its work list) and polls
* for other things. This adds @ch to the end of the list and wakes the worker
* up immediately. If the channel already existed in the list, it's not added,
* because in that case it has been scheduled already but has not yet been
* processed.
*/
void nvgpu_channel_worker_enqueue(struct nvgpu_channel *ch)
{
struct gk20a *g = ch->g;
int ret;
nvgpu_log_fn(g, " ");
/*
* Ref released when this item gets processed. The caller should hold
 * one ref already, so this normally shouldn't fail, but the channel could
* end up being freed between the time the caller got its reference and
* the time we end up here (e.g., if the client got killed); if so, just
* return.
*/
if (nvgpu_channel_get(ch) == NULL) {
nvgpu_info(g, "cannot get ch ref for worker!");
return;
}
ret = nvgpu_worker_enqueue(&g->channel_worker.worker,
&ch->worker_item);
if (ret != 0) {
nvgpu_channel_put(ch);
return;
}
}

View File

@@ -0,0 +1,37 @@
/*
* Copyright (c) 2017-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef NVGPU_COMMON_FIFO_CHANNEL_WORKER_H
#define NVGPU_COMMON_FIFO_CHANNEL_WORKER_H
#include <nvgpu/gk20a.h>
void nvgpu_channel_worker_enqueue(struct nvgpu_channel *ch);
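/* Recover the channel worker from its embedded generic worker (open-coded container_of). */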
static inline struct nvgpu_channel_worker *
nvgpu_channel_worker_from_worker(struct nvgpu_worker *worker)
{
return (struct nvgpu_channel_worker *)
((uintptr_t)worker - offsetof(struct nvgpu_channel_worker, worker));
};
#endif /* NVGPU_COMMON_FIFO_CHANNEL_WORKER_H */

View File

@@ -0,0 +1,88 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/io.h>
#include <nvgpu/engine_status.h>
bool nvgpu_engine_status_is_ctxsw_switch(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctxsw_status == NVGPU_CTX_STATUS_CTXSW_SWITCH;
}
bool nvgpu_engine_status_is_ctxsw_load(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctxsw_status == NVGPU_CTX_STATUS_CTXSW_LOAD;
}
bool nvgpu_engine_status_is_ctxsw_save(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctxsw_status == NVGPU_CTX_STATUS_CTXSW_SAVE;
}
bool nvgpu_engine_status_is_ctxsw(struct nvgpu_engine_status_info
*engine_status)
{
return (nvgpu_engine_status_is_ctxsw_switch(engine_status) ||
nvgpu_engine_status_is_ctxsw_load(engine_status) ||
nvgpu_engine_status_is_ctxsw_save(engine_status));
}
bool nvgpu_engine_status_is_ctxsw_invalid(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctxsw_status == NVGPU_CTX_STATUS_INVALID;
}
bool nvgpu_engine_status_is_ctxsw_valid(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctxsw_status == NVGPU_CTX_STATUS_VALID;
}
bool nvgpu_engine_status_is_ctx_type_tsg(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctx_id_type == ENGINE_STATUS_CTX_ID_TYPE_TSGID;
}
bool nvgpu_engine_status_is_next_ctx_type_tsg(struct nvgpu_engine_status_info
*engine_status)
{
return engine_status->ctx_next_id_type ==
ENGINE_STATUS_CTX_NEXT_ID_TYPE_TSGID;
}
void nvgpu_engine_status_get_ctx_id_type(struct nvgpu_engine_status_info
*engine_status, u32 *ctx_id, u32 *ctx_type)
{
*ctx_id = engine_status->ctx_id;
*ctx_type = engine_status->ctx_id_type;
}
void nvgpu_engine_status_get_next_ctx_id_type(struct nvgpu_engine_status_info
*engine_status, u32 *ctx_next_id,
u32 *ctx_next_type)
{
*ctx_next_id = engine_status->ctx_next_id;
*ctx_next_type = engine_status->ctx_next_id_type;
}

View File

@@ -0,0 +1,960 @@
/*
* Copyright (c) 2019-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/log.h>
#include <nvgpu/errno.h>
#include <nvgpu/timers.h>
#include <nvgpu/bitops.h>
#ifdef CONFIG_NVGPU_LS_PMU
#include <nvgpu/pmu.h>
#include <nvgpu/pmu/mutex.h>
#endif
#include <nvgpu/runlist.h>
#include <nvgpu/engines.h>
#include <nvgpu/engine_status.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/pbdma_status.h>
#include <nvgpu/power_features/pg.h>
#include <nvgpu/channel.h>
#include <nvgpu/soc.h>
#include <nvgpu/device.h>
#include <nvgpu/gr/gr_falcon.h>
#include <nvgpu/gr/gr.h>
#include <nvgpu/gr/gr_instances.h>
#include <nvgpu/fifo.h>
#include <nvgpu/static_analysis.h>
#include <nvgpu/swprofile.h>
#include <nvgpu/fifo/swprofile.h>
#define FECS_METHOD_WFI_RESTORE 0x80000U
enum nvgpu_fifo_engine nvgpu_engine_enum_from_dev(struct gk20a *g,
const struct nvgpu_device *dev)
{
enum nvgpu_fifo_engine ret = NVGPU_ENGINE_INVAL;
if (nvgpu_device_is_graphics(g, dev)) {
ret = NVGPU_ENGINE_GR;
} else if (nvgpu_device_is_ce(g, dev)) {
/* For now, all CE engines have separate runlists. We can
* identify the NVGPU_ENGINE_GRCE type CE using runlist_id
 * comparison logic with GR runlist_id in init_info()
*/
ret = NVGPU_ENGINE_ASYNC_CE;
} else {
ret = NVGPU_ENGINE_INVAL;
}
return ret;
}
const struct nvgpu_device *nvgpu_engine_get_active_eng_info(
struct gk20a *g, u32 engine_id)
{
struct nvgpu_fifo *f = &g->fifo;
if (engine_id >= f->max_engines) {
return NULL;
}
return f->host_engines[engine_id];
}
bool nvgpu_engine_check_valid_id(struct gk20a *g, u32 engine_id)
{
struct nvgpu_fifo *f = &g->fifo;
if (engine_id >= f->max_engines) {
return false;
}
return f->host_engines[engine_id] != NULL;
}
u32 nvgpu_engine_get_gr_id_for_inst(struct gk20a *g, u32 inst_id)
{
const struct nvgpu_device *dev;
dev = nvgpu_device_get(g, NVGPU_DEVTYPE_GRAPHICS, inst_id);
if (dev == NULL) {
nvgpu_warn(g, "No GR devices on this GPU for inst[%u]?!",
inst_id);
return NVGPU_INVALID_ENG_ID;
}
return dev->engine_id;
}
u32 nvgpu_engine_get_gr_id(struct gk20a *g)
{
/* Consider 1st available GR engine */
return nvgpu_engine_get_gr_id_for_inst(g, 0U);
}
u32 nvgpu_engine_act_interrupt_mask(struct gk20a *g, u32 engine_id)
{
const struct nvgpu_device *dev = NULL;
dev = nvgpu_engine_get_active_eng_info(g, engine_id);
if (dev == NULL) {
return 0;
}
return BIT32(dev->intr_id);
}
u32 nvgpu_gr_engine_interrupt_mask(struct gk20a *g)
{
const struct nvgpu_device *dev;
u32 intr_mask = 0U;
u32 i;
for (i = 0U; i < g->num_gr_instances; i++) {
dev = nvgpu_device_get(g, NVGPU_DEVTYPE_GRAPHICS,
nvgpu_gr_get_syspipe_id(g, i));
if (dev == NULL) {
continue;
}
intr_mask |= BIT32(dev->intr_id);
}
return intr_mask;
}
u32 nvgpu_ce_engine_interrupt_mask(struct gk20a *g)
{
const struct nvgpu_device *dev;
u32 i;
u32 mask = 0U;
/*
* For old chips - pre-Pascal - we have COPY[0-2], for new chips we
* have some number of LCE instances. For the purpose of this code we
* imagine a system that could have both; in reality that'll never be
* the case.
*
* This can be cleaned up in the future by defining a SW type for CE and
* hiding this ugliness in the device management code.
*/
for (i = NVGPU_DEVTYPE_COPY0; i <= NVGPU_DEVTYPE_COPY2; i++) {
dev = nvgpu_device_get(g, i, i - NVGPU_DEVTYPE_COPY0);
if (dev == NULL) {
continue;
}
mask |= BIT32(dev->intr_id);
}
/*
* Now take care of LCEs.
*/
for (i = 0U; i < nvgpu_device_count(g, NVGPU_DEVTYPE_LCE); i++) {
dev = nvgpu_device_get(g, NVGPU_DEVTYPE_LCE, i);
nvgpu_assert(dev != NULL);
mask |= BIT32(dev->intr_id);
}
return mask;
}
#ifdef CONFIG_NVGPU_FIFO_ENGINE_ACTIVITY
static void nvgpu_engine_enable_activity(struct gk20a *g,
const struct nvgpu_device *dev)
{
nvgpu_runlist_set_state(g, BIT32(dev->runlist_id), RUNLIST_ENABLED);
}
void nvgpu_engine_enable_activity_all(struct gk20a *g)
{
u32 i;
for (i = 0; i < g->fifo.num_engines; i++) {
nvgpu_engine_enable_activity(g, g->fifo.active_engines[i]);
}
}
int nvgpu_engine_disable_activity(struct gk20a *g,
const struct nvgpu_device *dev,
bool wait_for_idle)
{
u32 pbdma_chid = NVGPU_INVALID_CHANNEL_ID;
u32 engine_chid = NVGPU_INVALID_CHANNEL_ID;
#ifdef CONFIG_NVGPU_LS_PMU
u32 token = PMU_INVALID_MUTEX_OWNER_ID;
int mutex_ret = -EINVAL;
#endif
int err = 0;
struct nvgpu_channel *ch = NULL;
struct nvgpu_engine_status_info engine_status;
struct nvgpu_pbdma_status_info pbdma_status;
unsigned long runlist_served_pbdmas;
unsigned long bit;
u32 pbdma_id;
struct nvgpu_fifo *f = &g->fifo;
nvgpu_log_fn(g, " ");
g->ops.engine_status.read_engine_status_info(g, dev->engine_id,
&engine_status);
if (engine_status.is_busy && !wait_for_idle) {
return -EBUSY;
}
#ifdef CONFIG_NVGPU_LS_PMU
if (g->ops.pmu.is_pmu_supported(g)) {
mutex_ret = nvgpu_pmu_lock_acquire(g, g->pmu,
PMU_MUTEX_ID_FIFO, &token);
}
#endif
nvgpu_runlist_set_state(g, BIT32(dev->runlist_id),
RUNLIST_DISABLED);
runlist_served_pbdmas = f->runlists[dev->runlist_id]->pbdma_bitmask;
for_each_set_bit(bit, &runlist_served_pbdmas,
nvgpu_get_litter_value(g, GPU_LIT_HOST_NUM_PBDMA)) {
pbdma_id = U32(bit);
/* chid from pbdma status */
g->ops.pbdma_status.read_pbdma_status_info(g,
pbdma_id,
&pbdma_status);
if (nvgpu_pbdma_status_is_chsw_valid(&pbdma_status) ||
nvgpu_pbdma_status_is_chsw_save(&pbdma_status)) {
pbdma_chid = pbdma_status.id;
} else if (nvgpu_pbdma_status_is_chsw_load(&pbdma_status) ||
nvgpu_pbdma_status_is_chsw_switch(&pbdma_status)) {
pbdma_chid = pbdma_status.next_id;
} else {
/* Nothing to do here */
}
if (pbdma_chid != NVGPU_INVALID_CHANNEL_ID) {
ch = nvgpu_channel_from_id(g, pbdma_chid);
if (ch != NULL) {
err = g->ops.fifo.preempt_channel(g, ch);
nvgpu_channel_put(ch);
}
if (err != 0) {
goto clean_up;
}
}
}
/* chid from engine status */
g->ops.engine_status.read_engine_status_info(g, dev->engine_id,
&engine_status);
if (nvgpu_engine_status_is_ctxsw_valid(&engine_status) ||
nvgpu_engine_status_is_ctxsw_save(&engine_status)) {
engine_chid = engine_status.ctx_id;
} else if (nvgpu_engine_status_is_ctxsw_switch(&engine_status) ||
nvgpu_engine_status_is_ctxsw_load(&engine_status)) {
engine_chid = engine_status.ctx_next_id;
} else {
/* Nothing to do here */
}
if (engine_chid != NVGPU_INVALID_CHANNEL_ID && engine_chid != pbdma_chid) {
ch = nvgpu_channel_from_id(g, engine_chid);
if (ch != NULL) {
err = g->ops.fifo.preempt_channel(g, ch);
nvgpu_channel_put(ch);
}
if (err != 0) {
goto clean_up;
}
}
clean_up:
#ifdef CONFIG_NVGPU_LS_PMU
if (mutex_ret == 0) {
if (nvgpu_pmu_lock_release(g, g->pmu,
PMU_MUTEX_ID_FIFO, &token) != 0){
nvgpu_err(g, "failed to release PMU lock");
}
}
#endif
if (err != 0) {
nvgpu_log_fn(g, "failed");
nvgpu_engine_enable_activity(g, dev);
} else {
nvgpu_log_fn(g, "done");
}
return err;
}
int nvgpu_engine_disable_activity_all(struct gk20a *g,
bool wait_for_idle)
{
unsigned int i;
int err = 0, ret = 0;
for (i = 0; i < g->fifo.num_engines; i++) {
err = nvgpu_engine_disable_activity(g,
g->fifo.active_engines[i],
wait_for_idle);
if (err != 0) {
nvgpu_err(g, "failed to disable engine %d activity",
g->fifo.active_engines[i]->engine_id);
ret = err;
break;
}
}
if (err != 0) {
while (i-- != 0U) {
nvgpu_engine_enable_activity(g,
g->fifo.active_engines[i]);
}
}
return ret;
}
int nvgpu_engine_wait_for_idle(struct gk20a *g)
{
struct nvgpu_timeout timeout;
u32 delay = POLL_DELAY_MIN_US;
int ret = 0, err = 0;
u32 i, host_num_engines;
struct nvgpu_engine_status_info engine_status;
nvgpu_log_fn(g, " ");
host_num_engines =
nvgpu_get_litter_value(g, GPU_LIT_HOST_NUM_ENGINES);
err = nvgpu_timeout_init(g, &timeout, nvgpu_get_poll_timeout(g),
NVGPU_TIMER_CPU_TIMER);
if (err != 0) {
return -EINVAL;
}
for (i = 0; i < host_num_engines; i++) {
if (!nvgpu_engine_check_valid_id(g, i)) {
continue;
}
ret = -ETIMEDOUT;
do {
g->ops.engine_status.read_engine_status_info(g, i,
&engine_status);
if (!engine_status.is_busy) {
ret = 0;
break;
}
nvgpu_usleep_range(delay, delay * 2U);
delay = min_t(u32,
delay << 1U, POLL_DELAY_MAX_US);
} while (nvgpu_timeout_expired(&timeout) == 0);
if (ret != 0) {
/* possible causes:
 * check the register settings programmed by the HAL in
 * elcg_init_idle_filters and init_therm_setup_hw
 */
nvgpu_err(g, "cannot idle engine: %u "
"engine_status: 0x%08x", i,
engine_status.reg_data);
break;
}
}
nvgpu_log_fn(g, "done");
return ret;
}
#endif /* CONFIG_NVGPU_FIFO_ENGINE_ACTIVITY */
int nvgpu_engine_setup_sw(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
int err = 0;
size_t size;
f->max_engines = nvgpu_get_litter_value(g, GPU_LIT_HOST_NUM_ENGINES);
size = nvgpu_safe_mult_u64(f->max_engines,
sizeof(struct nvgpu_device *));
/*
* Allocate the two device lists for host devices.
*/
f->host_engines = nvgpu_kzalloc(g, size);
if (f->host_engines == NULL) {
nvgpu_err(g, "OOM allocating host engine list");
return -ENOMEM;
}
f->active_engines = nvgpu_kzalloc(g, size);
if (f->active_engines == NULL) {
nvgpu_err(g, "no mem for active engine list");
err = -ENOMEM;
goto clean_up_engine_info;
}
err = nvgpu_engine_init_info(f);
if (err != 0) {
nvgpu_err(g, "init engine info failed");
goto clean_up;
}
return 0;
clean_up:
nvgpu_kfree(g, f->active_engines);
f->active_engines = NULL;
clean_up_engine_info:
nvgpu_kfree(g, f->host_engines);
f->host_engines = NULL;
return err;
}
void nvgpu_engine_cleanup_sw(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
f->num_engines = 0;
nvgpu_kfree(g, f->host_engines);
f->host_engines = NULL;
nvgpu_kfree(g, f->active_engines);
f->active_engines = NULL;
}
#ifdef CONFIG_NVGPU_ENGINE_RESET
static void nvgpu_engine_gr_reset(struct gk20a *g)
{
struct nvgpu_swprofiler *prof = &g->fifo.eng_reset_profiler;
int err = 0;
nvgpu_swprofile_snapshot(prof, PROF_ENG_RESET_PREAMBLE);
#ifdef CONFIG_NVGPU_POWER_PG
if (nvgpu_pg_elpg_disable(g) != 0) {
nvgpu_err(g, "failed to disable elpg");
}
#endif
nvgpu_swprofile_snapshot(prof, PROF_ENG_RESET_ELPG_DISABLE);
#ifdef CONFIG_NVGPU_FECS_TRACE
/*
* Resetting engine will alter read/write index. Need to flush
* circular buffer before re-enabling FECS.
*/
if (g->ops.gr.fecs_trace.reset != NULL) {
if (g->ops.gr.fecs_trace.reset(g) != 0) {
nvgpu_warn(g, "failed to reset fecs traces");
}
}
#endif
nvgpu_swprofile_snapshot(prof, PROF_ENG_RESET_FECS_TRACE_RESET);
/*
 * The HALT_PIPELINE method and GR reset during recovery are supported
 * starting with nvgpu-next simulation.
*/
err = g->ops.gr.falcon.ctrl_ctxsw(g,
NVGPU_GR_FALCON_METHOD_HALT_PIPELINE, 0U, NULL);
if (err != 0) {
nvgpu_err(g, "failed to halt gr pipe");
}
nvgpu_swprofile_snapshot(prof, PROF_ENG_RESET_HALT_PIPELINE);
/*
 * resetting only the engine is not
 * enough; run the full init sequence
*/
nvgpu_log(g, gpu_dbg_rec, "resetting gr engine");
err = nvgpu_gr_reset(g);
if (err != 0) {
nvgpu_err(g, "failed to reset gr engine");
}
#ifdef CONFIG_NVGPU_POWER_PG
if (nvgpu_pg_elpg_enable(g) != 0) {
nvgpu_err(g, "failed to set enable elpg");
}
nvgpu_swprofile_snapshot(prof, PROF_ENG_RESET_ELPG_REENABLE);
#endif
}
void nvgpu_engine_reset(struct gk20a *g, u32 engine_id)
{
struct nvgpu_swprofiler *prof = &g->fifo.eng_reset_profiler;
const struct nvgpu_device *dev;
int err = 0;
u32 gr_instance_id;
nvgpu_log_fn(g, " ");
if (g == NULL) {
return;
}
nvgpu_swprofile_begin_sample(prof);
dev = nvgpu_engine_get_active_eng_info(g, engine_id);
if (dev == NULL) {
nvgpu_err(g, "unsupported engine_id %d", engine_id);
return;
}
if (!nvgpu_device_is_ce(g, dev) &&
!nvgpu_device_is_graphics(g, dev)) {
nvgpu_warn(g, "Ignoring reset for non-host engine.");
return;
}
/*
* Simple case first: reset a copy engine.
*/
if (nvgpu_device_is_ce(g, dev)) {
err = nvgpu_mc_reset_dev(g, dev);
if (err != 0) {
nvgpu_log_info(g, "CE engine [id:%u] reset failed",
dev->engine_id);
}
return;
}
/*
* Now reset a GR engine.
*/
gr_instance_id =
nvgpu_grmgr_get_gr_instance_id_for_syspipe(
g, dev->inst_id);
nvgpu_gr_exec_for_instance(g,
gr_instance_id, nvgpu_engine_gr_reset(g));
}
#endif
u32 nvgpu_engine_get_fast_ce_runlist_id(struct gk20a *g)
{
const struct nvgpu_device *dev;
u32 nr_lces;
u32 i;
/*
* Obtain a runlist ID for the fastest available CE. The priority order
* is:
*
* 1. Last available LCE
* 2. Last available COPY[0-2]
* 3. GRAPHICS runlist as a last resort.
*/
nr_lces = nvgpu_device_count(g, NVGPU_DEVTYPE_LCE);
if (nr_lces > 0U) {
dev = nvgpu_device_get(g,
NVGPU_DEVTYPE_LCE,
nr_lces - 1U);
nvgpu_assert(dev != NULL);
return dev->runlist_id;
}
/*
* Note: this only works since NVGPU_DEVTYPE_GRAPHICS is 0 and the COPYx
* are all > 0.
*/
for (i = NVGPU_DEVTYPE_COPY2; i >= NVGPU_DEVTYPE_COPY0; i--) {
dev = nvgpu_device_get(g, i, i - NVGPU_DEVTYPE_COPY0);
if (dev != NULL) {
return dev->runlist_id;
}
}
/*
* Fall back to GR.
*/
dev = nvgpu_device_get(g, NVGPU_DEVTYPE_GRAPHICS, 0);
nvgpu_assert(dev != NULL);
return dev->runlist_id;
}
u32 nvgpu_engine_get_gr_runlist_id(struct gk20a *g)
{
const struct nvgpu_device *dev;
dev = nvgpu_device_get(g, NVGPU_DEVTYPE_GRAPHICS, 0);
if (dev == NULL) {
nvgpu_warn(g, "No GR device on this GPU?!");
return NVGPU_INVALID_RUNLIST_ID;
}
return dev->runlist_id;
}
bool nvgpu_engine_is_valid_runlist_id(struct gk20a *g, u32 runlist_id)
{
u32 i;
struct nvgpu_fifo *f = &g->fifo;
for (i = 0U; i < f->num_engines; i++) {
const struct nvgpu_device *dev = f->active_engines[i];
if (dev->runlist_id == runlist_id) {
return true;
}
}
return false;
}
/*
* Link engine IDs to MMU IDs and vice versa.
*/
u32 nvgpu_engine_id_to_mmu_fault_id(struct gk20a *g, u32 engine_id)
{
const struct nvgpu_device *dev;
dev = nvgpu_engine_get_active_eng_info(g, engine_id);
if (dev == NULL) {
nvgpu_err(g,
"engine_id: %u is not in active list",
engine_id);
return NVGPU_INVALID_ENG_ID;
}
return dev->fault_id;
}
u32 nvgpu_engine_mmu_fault_id_to_engine_id(struct gk20a *g, u32 fault_id)
{
u32 i;
const struct nvgpu_device *dev;
struct nvgpu_fifo *f = &g->fifo;
for (i = 0U; i < f->num_engines; i++) {
dev = f->active_engines[i];
if (dev->fault_id == fault_id) {
return dev->engine_id;
}
}
return NVGPU_INVALID_ENG_ID;
}
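/*
 * Build a bitmask of active engines that are currently busy running the given
 * channel or TSG id, based on each engine's context status.
 */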
u32 nvgpu_engine_get_mask_on_id(struct gk20a *g, u32 id, bool is_tsg)
{
unsigned int i;
u32 engines = 0;
struct nvgpu_engine_status_info engine_status;
u32 ctx_id;
u32 type;
bool busy;
for (i = 0; i < g->fifo.num_engines; i++) {
const struct nvgpu_device *dev = g->fifo.active_engines[i];
g->ops.engine_status.read_engine_status_info(g,
dev->engine_id, &engine_status);
if (nvgpu_engine_status_is_ctxsw_load(
&engine_status)) {
nvgpu_engine_status_get_next_ctx_id_type(
&engine_status, &ctx_id, &type);
} else {
nvgpu_engine_status_get_ctx_id_type(
&engine_status, &ctx_id, &type);
}
busy = engine_status.is_busy;
if (!busy || (ctx_id != id)) {
continue;
}
if ((is_tsg && (type == ENGINE_STATUS_CTX_ID_TYPE_TSGID)) ||
(!is_tsg && (type == ENGINE_STATUS_CTX_ID_TYPE_CHID))) {
engines |= BIT32(dev->engine_id);
}
}
return engines;
}
static int nvgpu_engine_init_one_dev(struct nvgpu_fifo *f,
const struct nvgpu_device *dev)
{
bool found;
struct nvgpu_device *dev_rw;
struct gk20a *g = f->g;
dev_rw = (struct nvgpu_device *)dev;
/*
* Populate the PBDMA info for this device; ideally it'd be done
* during device init, but the FIFO unit is not out of reset that
* early in the nvgpu_finalize_poweron() sequence.
*
* We only need to do this for native; vGPU already has pbdma_id
* populated during device initialization.
*/
if (g->ops.fifo.find_pbdma_for_runlist != NULL) {
found = g->ops.fifo.find_pbdma_for_runlist(g,
dev->runlist_id,
&dev_rw->pbdma_id);
if (!found) {
nvgpu_err(g, "busted pbdma map");
return -EINVAL;
}
}
#if defined(CONFIG_NVGPU_NEXT)
{
int err = nvgpu_next_engine_init_one_dev(g, dev);
if (err != 0) {
return err;
}
}
#endif
f->host_engines[dev->engine_id] = dev;
f->active_engines[f->num_engines] = dev;
++f->num_engines;
return 0;
}
int nvgpu_engine_init_info(struct nvgpu_fifo *f)
{
int err;
struct gk20a *g = f->g;
const struct nvgpu_device *dev;
f->num_engines = 0;
nvgpu_log(g, gpu_dbg_device, "Loading host engines from device list");
nvgpu_log(g, gpu_dbg_device, " GFX devices: %u",
nvgpu_device_count(g, NVGPU_DEVTYPE_GRAPHICS));
nvgpu_device_for_each(g, dev, NVGPU_DEVTYPE_GRAPHICS) {
err = nvgpu_engine_init_one_dev(f, dev);
if (err != 0) {
return err;
}
}
return g->ops.engine.init_ce_info(f);
}
void nvgpu_engine_get_id_and_type(struct gk20a *g, u32 engine_id,
u32 *id, u32 *type)
{
struct nvgpu_engine_status_info engine_status;
g->ops.engine_status.read_engine_status_info(g, engine_id,
&engine_status);
/* use next_id if context load is failing */
if (nvgpu_engine_status_is_ctxsw_load(
&engine_status)) {
nvgpu_engine_status_get_next_ctx_id_type(
&engine_status, id, type);
} else {
nvgpu_engine_status_get_ctx_id_type(
&engine_status, id, type);
}
}
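/*
 * Scan the active engines for one that is busy doing a context switch and
 * report the context id (channel or TSG) involved via the out parameters.
 * Note that *id_ptr stays U32_MAX when no engine matched, and the return
 * value is the engine_id of the last engine examined.
 */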
u32 nvgpu_engine_find_busy_doing_ctxsw(struct gk20a *g,
u32 *id_ptr, bool *is_tsg_ptr)
{
u32 i;
u32 id = U32_MAX;
bool is_tsg = false;
u32 mailbox2;
struct nvgpu_engine_status_info engine_status;
const struct nvgpu_device *dev = NULL;
for (i = 0U; i < g->fifo.num_engines; i++) {
dev = g->fifo.active_engines[i];
g->ops.engine_status.read_engine_status_info(g, dev->engine_id,
&engine_status);
/*
* we are interested in busy engines that
* are doing context switch
*/
if (!engine_status.is_busy ||
!nvgpu_engine_status_is_ctxsw(&engine_status)) {
continue;
}
if (nvgpu_engine_status_is_ctxsw_load(&engine_status)) {
id = engine_status.ctx_next_id;
is_tsg = nvgpu_engine_status_is_next_ctx_type_tsg(
&engine_status);
} else if (nvgpu_engine_status_is_ctxsw_switch(&engine_status)) {
mailbox2 = g->ops.gr.falcon.read_fecs_ctxsw_mailbox(g,
NVGPU_GR_FALCON_FECS_CTXSW_MAILBOX2);
if ((mailbox2 & FECS_METHOD_WFI_RESTORE) != 0U) {
id = engine_status.ctx_next_id;
is_tsg = nvgpu_engine_status_is_next_ctx_type_tsg(
&engine_status);
} else {
id = engine_status.ctx_id;
is_tsg = nvgpu_engine_status_is_ctx_type_tsg(
&engine_status);
}
} else {
id = engine_status.ctx_id;
is_tsg = nvgpu_engine_status_is_ctx_type_tsg(
&engine_status);
}
break;
}
*id_ptr = id;
*is_tsg_ptr = is_tsg;
return dev->engine_id;
}
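/*
 * Return a bitmask of engines on the given runlist that the HW currently
 * reports as busy.
 */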
u32 nvgpu_engine_get_runlist_busy_engines(struct gk20a *g, u32 runlist_id)
{
struct nvgpu_fifo *f = &g->fifo;
u32 i, eng_bitmask = 0U;
struct nvgpu_engine_status_info engine_status;
for (i = 0U; i < f->num_engines; i++) {
const struct nvgpu_device *dev = f->active_engines[i];
g->ops.engine_status.read_engine_status_info(g, dev->engine_id,
&engine_status);
if (engine_status.is_busy && (dev->runlist_id == runlist_id)) {
eng_bitmask |= BIT32(dev->engine_id);
}
}
return eng_bitmask;
}
#ifdef CONFIG_NVGPU_DEBUGGER
bool nvgpu_engine_should_defer_reset(struct gk20a *g, u32 engine_id,
u32 engine_subid, bool fake_fault)
{
const struct nvgpu_device *dev;
dev = nvgpu_engine_get_active_eng_info(g, engine_id);
if (dev == NULL) {
return false;
}
/*
 * channel recovery is only deferred if an SM debugger
 * is attached and MMU debug mode is enabled
*/
if (!g->ops.gr.sm_debugger_attached(g) ||
!g->ops.fb.is_debug_mode_enabled(g)) {
return false;
}
/* if this fault is fake (due to RC recovery), don't defer recovery */
if (fake_fault) {
return false;
}
if (dev->type != NVGPU_DEVTYPE_GRAPHICS) {
return false;
}
return g->ops.engine.is_fault_engine_subid_gpc(g, engine_subid);
}
#endif
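/*
 * Translate an MMU fault id into a VEID (subcontext index) relative to the
 * GR engine's base fault id; returns INVAL_ID when the fault id is outside
 * the GR engine's subcontext range.
 */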
u32 nvgpu_engine_mmu_fault_id_to_veid(struct gk20a *g, u32 mmu_fault_id,
u32 gr_eng_fault_id)
{
struct nvgpu_fifo *f = &g->fifo;
u32 num_subctx;
u32 veid = INVAL_ID;
num_subctx = f->max_subctx_count;
if ((mmu_fault_id >= gr_eng_fault_id) &&
(mmu_fault_id < nvgpu_safe_add_u32(gr_eng_fault_id,
num_subctx))) {
veid = mmu_fault_id - gr_eng_fault_id;
}
return veid;
}
static u32 nvgpu_engine_mmu_fault_id_to_eng_id_and_veid(struct gk20a *g,
u32 mmu_fault_id, u32 *veid)
{
u32 i;
u32 engine_id = INVAL_ID;
const struct nvgpu_device *dev;
struct nvgpu_fifo *f = &g->fifo;
for (i = 0U; i < f->num_engines; i++) {
dev = f->active_engines[i];
if (dev->type == NVGPU_DEVTYPE_GRAPHICS) {
*veid = nvgpu_engine_mmu_fault_id_to_veid(g,
mmu_fault_id, dev->fault_id);
if (*veid != INVAL_ID) {
engine_id = dev->engine_id;
break;
}
} else {
if (dev->fault_id == mmu_fault_id) {
engine_id = dev->engine_id;
*veid = INVAL_ID;
break;
}
}
}
return engine_id;
}
void nvgpu_engine_mmu_fault_id_to_eng_ve_pbdma_id(struct gk20a *g,
u32 mmu_fault_id, u32 *engine_id, u32 *veid, u32 *pbdma_id)
{
*engine_id = nvgpu_engine_mmu_fault_id_to_eng_id_and_veid(g,
mmu_fault_id, veid);
if (*engine_id == INVAL_ID) {
*pbdma_id = g->ops.fifo.mmu_fault_id_to_pbdma_id(g,
mmu_fault_id);
} else {
*pbdma_id = INVAL_ID;
}
}

View File

@@ -0,0 +1,315 @@
/*
* FIFO
*
* Copyright (c) 2011-2021, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/trace.h>
#include <nvgpu/dma.h>
#include <nvgpu/fifo.h>
#include <nvgpu/engines.h>
#include <nvgpu/runlist.h>
#include <nvgpu/preempt.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/channel.h>
#include <nvgpu/pbdma.h>
#include <nvgpu/tsg.h>
#include <nvgpu/vm_area.h>
#include <nvgpu/nvgpu_err.h>
#include <nvgpu/cic.h>
#include <nvgpu/mc.h>
#include <nvgpu/swprofile.h>
#include <nvgpu/fifo/swprofile.h>
static const char *nvgpu_fifo_kickoff_profile_events[] = {
NVGPU_FIFO_KICKOFF_PROFILE_EVENTS,
};
static const char *nvgpu_fifo_recovery_profile_events[] = {
NVGPU_FIFO_RECOVERY_PROFILE_EVENTS,
};
static const char *nvgpu_fifo_engine_reset_events[] = {
NVGPU_FIFO_ENGINE_RESET_EVENTS,
};
void nvgpu_fifo_cleanup_sw_common(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
nvgpu_log_fn(g, " ");
#ifdef CONFIG_NVGPU_USERD
g->ops.userd.cleanup_sw(g);
#endif
nvgpu_channel_cleanup_sw(g);
nvgpu_tsg_cleanup_sw(g);
nvgpu_runlist_cleanup_sw(g);
nvgpu_engine_cleanup_sw(g);
if (g->ops.pbdma.cleanup_sw != NULL) {
g->ops.pbdma.cleanup_sw(g);
}
#ifdef CONFIG_NVGPU_DEBUGGER
f->deferred_reset_pending = false;
nvgpu_mutex_destroy(&f->deferred_reset_mutex);
#endif
nvgpu_mutex_destroy(&f->engines_reset_mutex);
nvgpu_mutex_destroy(&f->intr.isr.mutex);
f->sw_ready = false;
}
void nvgpu_fifo_cleanup_sw(struct gk20a *g)
{
#ifdef CONFIG_NVGPU_KERNEL_MODE_SUBMIT
nvgpu_channel_worker_deinit(g);
#endif
nvgpu_fifo_cleanup_sw_common(g);
}
static void nvgpu_fifo_remove_support(struct nvgpu_fifo *f)
{
struct gk20a *g = f->g;
g->ops.fifo.cleanup_sw(g);
}
int nvgpu_fifo_setup_sw_common(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
int err = 0;
nvgpu_log_fn(g, " ");
f->g = g;
nvgpu_mutex_init(&f->intr.isr.mutex);
nvgpu_mutex_init(&f->engines_reset_mutex);
#ifdef CONFIG_NVGPU_DEBUGGER
nvgpu_mutex_init(&f->deferred_reset_mutex);
#endif
nvgpu_swprofile_initialize(g, &f->kickoff_profiler,
nvgpu_fifo_kickoff_profile_events);
nvgpu_swprofile_initialize(g, &f->recovery_profiler,
nvgpu_fifo_recovery_profile_events);
nvgpu_swprofile_initialize(g, &f->eng_reset_profiler,
nvgpu_fifo_engine_reset_events);
err = nvgpu_channel_setup_sw(g);
if (err != 0) {
nvgpu_err(g, "failed to init channel support");
goto clean_up;
}
err = nvgpu_tsg_setup_sw(g);
if (err != 0) {
nvgpu_err(g, "failed to init tsg support");
goto clean_up_channel;
}
if (g->ops.pbdma.setup_sw != NULL) {
err = g->ops.pbdma.setup_sw(g);
if (err != 0) {
nvgpu_err(g, "failed to init pbdma support");
goto clean_up_tsg;
}
}
err = nvgpu_engine_setup_sw(g);
if (err != 0) {
nvgpu_err(g, "failed to init engine support");
goto clean_up_pbdma;
}
err = nvgpu_runlist_setup_sw(g);
if (err != 0) {
nvgpu_err(g, "failed to init runlist support");
goto clean_up_engine;
}
#ifdef CONFIG_NVGPU_USERD
err = g->ops.userd.setup_sw(g);
if (err != 0) {
nvgpu_err(g, "failed to init userd support");
goto clean_up_runlist;
}
#endif
f->remove_support = nvgpu_fifo_remove_support;
nvgpu_log_fn(g, "done");
return 0;
#ifdef CONFIG_NVGPU_USERD
clean_up_runlist:
nvgpu_runlist_cleanup_sw(g);
#endif
clean_up_engine:
nvgpu_engine_cleanup_sw(g);
clean_up_pbdma:
if (g->ops.pbdma.cleanup_sw != NULL) {
g->ops.pbdma.cleanup_sw(g);
}
clean_up_tsg:
nvgpu_tsg_cleanup_sw(g);
clean_up_channel:
nvgpu_channel_cleanup_sw(g);
clean_up:
nvgpu_err(g, "init fifo support failed");
return err;
}
int nvgpu_fifo_setup_sw(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
int err = 0;
nvgpu_log_fn(g, " ");
if (f->sw_ready) {
nvgpu_log_fn(g, "skip init");
return 0;
}
err = nvgpu_fifo_setup_sw_common(g);
if (err != 0) {
nvgpu_err(g, "fifo common sw setup failed, err=%d", err);
return err;
}
#ifdef CONFIG_NVGPU_KERNEL_MODE_SUBMIT
err = nvgpu_channel_worker_init(g);
if (err != 0) {
nvgpu_err(g, "worker init fail, err=%d", err);
goto clean_up;
}
#endif
f->sw_ready = true;
nvgpu_log_fn(g, "done");
return 0;
#ifdef CONFIG_NVGPU_KERNEL_MODE_SUBMIT
clean_up:
nvgpu_fifo_cleanup_sw_common(g);
return err;
#endif
}
int nvgpu_fifo_init_support(struct gk20a *g)
{
int err;
err = g->ops.fifo.setup_sw(g);
if (err != 0) {
nvgpu_err(g, "fifo sw setup failed, err=%d", err);
return err;
}
if (g->ops.fifo.init_fifo_setup_hw != NULL) {
err = g->ops.fifo.init_fifo_setup_hw(g);
if (err != 0) {
nvgpu_err(g, "fifo hw setup failed, err=%d", err);
goto clean_up;
}
}
return 0;
clean_up:
nvgpu_fifo_cleanup_sw_common(g);
return err;
}
static const char * const pbdma_ch_eng_status_str[] = {
"invalid",
"valid",
"NA",
"NA",
"NA",
"load",
"save",
"switch",
};
static const char * const not_found_str[] = {
"NOT FOUND"
};
const char *nvgpu_fifo_decode_pbdma_ch_eng_status(u32 index)
{
if (index >= ARRAY_SIZE(pbdma_ch_eng_status_str)) {
return not_found_str[0];
} else {
return pbdma_ch_eng_status_str[index];
}
}
static void disable_fifo_interrupts(struct gk20a *g)
{
/** Disable fifo intr */
g->ops.fifo.intr_0_enable(g, false);
g->ops.fifo.intr_1_enable(g, false);
if (g->ops.fifo.intr_top_enable == NULL) {
nvgpu_cic_intr_stall_unit_config(g, NVGPU_CIC_INTR_UNIT_FIFO,
NVGPU_CIC_INTR_DISABLE);
nvgpu_cic_intr_nonstall_unit_config(g, NVGPU_CIC_INTR_UNIT_FIFO,
NVGPU_CIC_INTR_DISABLE);
} else {
g->ops.fifo.intr_top_enable(g, NVGPU_CIC_INTR_DISABLE);
}
}
int nvgpu_fifo_suspend(struct gk20a *g)
{
nvgpu_log_fn(g, " ");
if (g->ops.mm.is_bar1_supported(g)) {
g->ops.fifo.bar1_snooping_disable(g);
}
disable_fifo_interrupts(g);
nvgpu_log_fn(g, "done");
return 0;
}
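/*
 * SW quiesce: disable scheduling on all runlists and preempt them as part of
 * bringing the FIFO into a safe state.
 */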
void nvgpu_fifo_sw_quiesce(struct gk20a *g)
{
u32 runlist_mask = U32_MAX;
g->ops.runlist.write_state(g, runlist_mask, RUNLIST_DISABLED);
/* Preempt all runlists */
nvgpu_fifo_preempt_runlists_for_rc(g, runlist_mask);
}

View File

@@ -0,0 +1,149 @@
/*
* Copyright (c) 2011-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/log.h>
#include <nvgpu/lock.h>
#include <nvgpu/kmem.h>
#include <nvgpu/barrier.h>
#include <nvgpu/circ_buf.h>
#include <nvgpu/channel.h>
#include <nvgpu/job.h>
#include <nvgpu/priv_cmdbuf.h>
#include <nvgpu/fence.h>
static inline struct nvgpu_channel_job *
channel_gk20a_job_from_list(struct nvgpu_list_node *node)
{
return (struct nvgpu_channel_job *)
((uintptr_t)node - offsetof(struct nvgpu_channel_job, list));
};
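/*
 * Reserve the next free slot in the channel's preallocated job ring buffer.
 * One slot is always left empty so that put == get unambiguously means empty
 * and (put + 1) % length == get means full.
 */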
int nvgpu_channel_alloc_job(struct nvgpu_channel *c,
struct nvgpu_channel_job **job_out)
{
unsigned int put = c->joblist.pre_alloc.put;
unsigned int get = c->joblist.pre_alloc.get;
unsigned int next = (put + 1) % c->joblist.pre_alloc.length;
bool full = next == get;
if (full) {
return -EAGAIN;
}
*job_out = &c->joblist.pre_alloc.jobs[put];
(void) memset(*job_out, 0, sizeof(**job_out));
return 0;
}
void nvgpu_channel_free_job(struct nvgpu_channel *c,
struct nvgpu_channel_job *job)
{
/*
* Nothing needed for now. The job contents are preallocated. The
* completion fence may briefly outlive the job, but the job memory is
 * reclaimed only when a new submit comes in and the ringbuffer has run
* out of space.
*/
}
void nvgpu_channel_joblist_lock(struct nvgpu_channel *c)
{
nvgpu_mutex_acquire(&c->joblist.pre_alloc.read_lock);
}
void nvgpu_channel_joblist_unlock(struct nvgpu_channel *c)
{
nvgpu_mutex_release(&c->joblist.pre_alloc.read_lock);
}
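/* Return the oldest queued job without consuming it, or NULL if the ring is empty. */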
struct nvgpu_channel_job *nvgpu_channel_joblist_peek(struct nvgpu_channel *c)
{
unsigned int get = c->joblist.pre_alloc.get;
unsigned int put = c->joblist.pre_alloc.put;
bool empty = get == put;
return empty ? NULL : &c->joblist.pre_alloc.jobs[get];
}
void nvgpu_channel_joblist_add(struct nvgpu_channel *c,
struct nvgpu_channel_job *job)
{
c->joblist.pre_alloc.put = (c->joblist.pre_alloc.put + 1U) %
(c->joblist.pre_alloc.length);
}
void nvgpu_channel_joblist_delete(struct nvgpu_channel *c,
struct nvgpu_channel_job *job)
{
c->joblist.pre_alloc.get = (c->joblist.pre_alloc.get + 1U) %
(c->joblist.pre_alloc.length);
}
int nvgpu_channel_joblist_init(struct nvgpu_channel *c, u32 num_jobs)
{
int err;
u32 size;
size = (u32)sizeof(struct nvgpu_channel_job);
if (num_jobs > nvgpu_safe_sub_u32(U32_MAX / size, 1U)) {
err = -ERANGE;
goto clean_up;
}
/*
* The max capacity of this ring buffer is the alloc size minus one (in
* units of item slot), so allocate a size of (num_jobs + 1) * size
* bytes.
*/
c->joblist.pre_alloc.jobs = nvgpu_vzalloc(c->g,
nvgpu_safe_mult_u32(
nvgpu_safe_add_u32(num_jobs, 1U),
size));
if (c->joblist.pre_alloc.jobs == NULL) {
err = -ENOMEM;
goto clean_up;
}
/*
* length is the allocation size of the ringbuffer; the number of jobs
* that fit is one less.
*/
c->joblist.pre_alloc.length = nvgpu_safe_add_u32(num_jobs, 1U);
c->joblist.pre_alloc.put = 0;
c->joblist.pre_alloc.get = 0;
return 0;
clean_up:
nvgpu_vfree(c->g, c->joblist.pre_alloc.jobs);
(void) memset(&c->joblist.pre_alloc, 0, sizeof(c->joblist.pre_alloc));
return err;
}
void nvgpu_channel_joblist_deinit(struct nvgpu_channel *c)
{
if (c->joblist.pre_alloc.jobs != NULL) {
nvgpu_vfree(c->g, c->joblist.pre_alloc.jobs);
c->joblist.pre_alloc.jobs = NULL;
}
}

View File

@@ -0,0 +1,55 @@
/*
* Copyright (c) 2011-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/pbdma.h>
static void nvgpu_pbdma_init_intr_descs(struct gk20a *g)
{
struct nvgpu_fifo *f = &g->fifo;
if (g->ops.pbdma.device_fatal_0_intr_descs != NULL) {
f->intr.pbdma.device_fatal_0 =
g->ops.pbdma.device_fatal_0_intr_descs();
}
if (g->ops.pbdma.channel_fatal_0_intr_descs != NULL) {
f->intr.pbdma.channel_fatal_0 =
g->ops.pbdma.channel_fatal_0_intr_descs();
}
if (g->ops.pbdma.restartable_0_intr_descs != NULL) {
f->intr.pbdma.restartable_0 =
g->ops.pbdma.restartable_0_intr_descs();
}
}
int nvgpu_pbdma_setup_sw(struct gk20a *g)
{
nvgpu_pbdma_init_intr_descs(g);
return 0;
}
void nvgpu_pbdma_cleanup_sw(struct gk20a *g)
{
return;
}

View File

@@ -0,0 +1,54 @@
/*
* Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/pbdma_status.h>
bool nvgpu_pbdma_status_is_chsw_switch(struct nvgpu_pbdma_status_info
*pbdma_status)
{
return pbdma_status->chsw_status == NVGPU_PBDMA_CHSW_STATUS_SWITCH;
}
bool nvgpu_pbdma_status_is_chsw_load(struct nvgpu_pbdma_status_info
*pbdma_status)
{
return pbdma_status->chsw_status == NVGPU_PBDMA_CHSW_STATUS_LOAD;
}
bool nvgpu_pbdma_status_is_chsw_save(struct nvgpu_pbdma_status_info
*pbdma_status)
{
return pbdma_status->chsw_status == NVGPU_PBDMA_CHSW_STATUS_SAVE;
}
bool nvgpu_pbdma_status_is_chsw_valid(struct nvgpu_pbdma_status_info
*pbdma_status)
{
return pbdma_status->chsw_status == NVGPU_PBDMA_CHSW_STATUS_VALID;
}
bool nvgpu_pbdma_status_is_id_type_tsg(struct nvgpu_pbdma_status_info
*pbdma_status)
{
return pbdma_status->id_type == PBDMA_STATUS_ID_TYPE_TSGID;
}
bool nvgpu_pbdma_status_is_next_id_type_tsg(struct nvgpu_pbdma_status_info
*pbdma_status)
{
return pbdma_status->next_id_type == PBDMA_STATUS_NEXT_ID_TYPE_TSGID;
}

Some files were not shown because too many files have changed in this diff