mirror of
git://nv-tegra.nvidia.com/linux-nvgpu.git
synced 2025-12-22 17:36:20 +03:00
Added logic to skip the following graphics CB allocation, map and programming sequence when MIG is enabled. Global CB: 1) NVGPU_GR_GLOBAL_CTX_CIRCULAR 2) NVGPU_GR_GLOBAL_CTX_PAGEPOOL 3) NVGPU_GR_GLOBAL_CTX_ATTRIBUTE 4) NVGPU_GR_GLOBAL_CTX_CIRCULAR_VPR 5) NVGPU_GR_GLOBAL_CTX_PAGEPOOL_VPR 6) NVGPU_GR_GLOBAL_CTX_ATTRIBUTE_VPR 7) NVGPU_GR_GLOBAL_CTX_RTV_CIRCULAR_BUFFER CTX CB: 1) NVGPU_GR_CTX_CIRCULAR_VA 2) NVGPU_GR_CTX_PAGEPOOL_VA 3) NVGPU_GR_CTX_ATTRIBUTE_VA 4) NVGPU_GR_CTX_RTV_CIRCULAR_BUFFER_VA JIRA NVGPU-5650 Change-Id: I38c2859ce57ad76c58a772fdf9f589f2106149af Signed-off-by: Lakshmanan M <lm@nvidia.com> Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2423450 Tested-by: mobile promotions <svcmobile_promotions@nvidia.com> Reviewed-by: automaticguardword <automaticguardword@nvidia.com> Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com> Reviewed-by: svc-mobile-cert <svc-mobile-cert@nvidia.com> Reviewed-by: Rajesh Devaraj <rdevaraj@nvidia.com> Reviewed-by: Dinesh T <dt@nvidia.com> Reviewed-by: Deepak Nibade <dnibade@nvidia.com> Reviewed-by: Vaibhav Kachore <vkachore@nvidia.com> Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> GVS: Gerrit_Virtual_Submit
373 lines
9.0 KiB
C
373 lines
9.0 KiB
C
/*
|
|
* Copyright (c) 2019-2020, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
* DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
#include <nvgpu/log.h>
|
|
#include <nvgpu/gk20a.h>
|
|
#include <nvgpu/gr/ctx.h>
|
|
#include <nvgpu/gr/subctx.h>
|
|
#include <nvgpu/gr/obj_ctx.h>
|
|
#ifdef CONFIG_NVGPU_GRAPHICS
|
|
#include <nvgpu/gr/zcull.h>
|
|
#endif
|
|
#include <nvgpu/gr/setup.h>
|
|
#include <nvgpu/gr/gr_instances.h>
|
|
#include <nvgpu/channel.h>
|
|
#include <nvgpu/preempt.h>
|
|
|
|
#include "gr_priv.h"
|
|
|
|
#ifdef CONFIG_NVGPU_GRAPHICS
|
|
static int nvgpu_gr_setup_zcull(struct gk20a *g, struct nvgpu_channel *c,
|
|
struct nvgpu_gr_ctx *gr_ctx)
|
|
{
|
|
int ret = 0;
|
|
|
|
nvgpu_log_fn(g, " ");
|
|
|
|
ret = nvgpu_channel_disable_tsg(g, c);
|
|
if (ret != 0) {
|
|
nvgpu_err(g, "failed to disable channel/TSG");
|
|
return ret;
|
|
}
|
|
|
|
ret = nvgpu_preempt_channel(g, c);
|
|
if (ret != 0) {
|
|
nvgpu_err(g, "failed to preempt channel/TSG");
|
|
goto out;
|
|
}
|
|
|
|
ret = nvgpu_gr_zcull_ctx_setup(g, c->subctx, gr_ctx);
|
|
if (ret != 0) {
|
|
nvgpu_err(g, "failed to setup zcull");
|
|
goto out;
|
|
}
|
|
/* no error at this point */
|
|
ret = nvgpu_channel_enable_tsg(g, c);
|
|
if (ret != 0) {
|
|
nvgpu_err(g, "failed to re-enable channel/TSG");
|
|
}
|
|
|
|
return ret;
|
|
|
|
out:
|
|
/*
|
|
* control reaches here if preempt failed or nvgpu_gr_zcull_ctx_setup
|
|
* failed. Propagate preempt failure err or err for
|
|
* nvgpu_gr_zcull_ctx_setup
|
|
*/
|
|
if (nvgpu_channel_enable_tsg(g, c) != 0) {
|
|
/* ch might not be bound to tsg */
|
|
nvgpu_err(g, "failed to enable channel/TSG");
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
int nvgpu_gr_setup_bind_ctxsw_zcull(struct gk20a *g, struct nvgpu_channel *c,
|
|
u64 zcull_va, u32 mode)
|
|
{
|
|
struct nvgpu_tsg *tsg;
|
|
struct nvgpu_gr_ctx *gr_ctx;
|
|
|
|
tsg = nvgpu_tsg_from_ch(c);
|
|
if (tsg == NULL) {
|
|
return -EINVAL;
|
|
}
|
|
|
|
gr_ctx = tsg->gr_ctx;
|
|
nvgpu_gr_ctx_set_zcull_ctx(g, gr_ctx, mode, zcull_va);
|
|
|
|
return nvgpu_gr_setup_zcull(g, c, gr_ctx);
|
|
}
|
|
#endif
|
|
|
|
static int nvgpu_gr_setup_validate_channel_and_class(struct gk20a *g,
|
|
struct nvgpu_channel *c, u32 class_num)
|
|
{
|
|
int err = 0;
|
|
|
|
/* an address space needs to have been bound at this point.*/
|
|
if (!nvgpu_channel_as_bound(c)) {
|
|
nvgpu_err(g,
|
|
"not bound to address space at time"
|
|
" of grctx allocation");
|
|
return -EINVAL;
|
|
}
|
|
|
|
if (!g->ops.gpu_class.is_valid(class_num)) {
|
|
nvgpu_err(g,
|
|
"invalid obj class 0x%x", class_num);
|
|
err = -EINVAL;
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
static int nvgpu_gr_setup_alloc_subctx(struct gk20a *g, struct nvgpu_channel *c)
|
|
{
|
|
int err = 0;
|
|
|
|
if (nvgpu_is_enabled(g, NVGPU_SUPPORT_TSG_SUBCONTEXTS)) {
|
|
if (c->subctx == NULL) {
|
|
c->subctx = nvgpu_gr_subctx_alloc(g, c->vm);
|
|
if (c->subctx == NULL) {
|
|
err = -ENOMEM;
|
|
}
|
|
}
|
|
}
|
|
|
|
return err;
|
|
}
|
|
|
|
int nvgpu_gr_setup_alloc_obj_ctx(struct nvgpu_channel *c, u32 class_num,
|
|
u32 flags)
|
|
{
|
|
struct gk20a *g = c->g;
|
|
struct nvgpu_gr_ctx *gr_ctx;
|
|
struct nvgpu_tsg *tsg = NULL;
|
|
int err = 0;
|
|
struct nvgpu_gr *gr = nvgpu_gr_get_cur_instance_ptr(g);
|
|
|
|
nvgpu_log(g, gpu_dbg_fn | gpu_dbg_gr,
|
|
"GR%u: allocate object context for channel %u",
|
|
gr->instance_id, c->chid);
|
|
|
|
err = nvgpu_gr_setup_validate_channel_and_class(g, c, class_num);
|
|
if (err != 0) {
|
|
goto out;
|
|
}
|
|
|
|
c->obj_class = class_num;
|
|
|
|
#ifndef CONFIG_NVGPU_HAL_NON_FUSA
|
|
/*
|
|
* Only compute class is valid in safety build, Return success for valid
|
|
* non compute classees. Invalid classes are indentified by above check
|
|
* with nvgpu_gr_setup_validate_channel_and_class() function.
|
|
*/
|
|
if (!g->ops.gpu_class.is_valid_compute(class_num)) {
|
|
return 0;
|
|
}
|
|
#endif
|
|
|
|
tsg = nvgpu_tsg_from_ch(c);
|
|
if (tsg == NULL) {
|
|
return -EINVAL;
|
|
}
|
|
|
|
gr_ctx = tsg->gr_ctx;
|
|
|
|
err = nvgpu_gr_setup_alloc_subctx(g, c);
|
|
if (err != 0) {
|
|
nvgpu_err(g, "failed to allocate gr subctx buffer");
|
|
goto out;
|
|
}
|
|
|
|
if (!nvgpu_mem_is_valid(nvgpu_gr_ctx_get_ctx_mem(gr_ctx))) {
|
|
tsg->vm = c->vm;
|
|
nvgpu_vm_get(tsg->vm);
|
|
|
|
err = nvgpu_gr_obj_ctx_alloc(g, gr->golden_image,
|
|
gr->global_ctx_buffer, gr->gr_ctx_desc,
|
|
gr->config, gr_ctx, c->subctx,
|
|
tsg->vm, &c->inst_block, class_num, flags,
|
|
c->cde, c->vpr);
|
|
if (err != 0) {
|
|
nvgpu_err(g,
|
|
"failed to allocate gr ctx buffer");
|
|
nvgpu_vm_put(tsg->vm);
|
|
tsg->vm = NULL;
|
|
goto out;
|
|
}
|
|
|
|
nvgpu_gr_ctx_set_tsgid(gr_ctx, tsg->tsgid);
|
|
} else {
|
|
/* commit gr ctx buffer */
|
|
nvgpu_gr_obj_ctx_commit_inst(g, &c->inst_block, gr_ctx,
|
|
c->subctx, nvgpu_gr_ctx_get_ctx_mem(gr_ctx)->gpu_va);
|
|
}
|
|
|
|
#ifdef CONFIG_NVGPU_FECS_TRACE
|
|
if (g->ops.gr.fecs_trace.bind_channel && !c->vpr) {
|
|
err = g->ops.gr.fecs_trace.bind_channel(g, &c->inst_block,
|
|
c->subctx, gr_ctx, tsg->tgid, 0);
|
|
if (err != 0) {
|
|
nvgpu_warn(g,
|
|
"fail to bind channel for ctxsw trace");
|
|
}
|
|
}
|
|
#endif
|
|
|
|
nvgpu_log(g, gpu_dbg_fn | gpu_dbg_gr, "done");
|
|
return 0;
|
|
out:
|
|
if (c->subctx != NULL) {
|
|
nvgpu_gr_subctx_free(g, c->subctx, c->vm);
|
|
c->subctx = NULL;
|
|
}
|
|
|
|
/* 1. gr_ctx, patch_ctx and global ctx buffer mapping
|
|
can be reused so no need to release them.
|
|
2. golden image init and load is a one time thing so if
|
|
they pass, no need to undo. */
|
|
nvgpu_err(g, "fail");
|
|
return err;
|
|
}
|
|
|
|
void nvgpu_gr_setup_free_gr_ctx(struct gk20a *g,
|
|
struct vm_gk20a *vm, struct nvgpu_gr_ctx *gr_ctx)
|
|
{
|
|
nvgpu_log_fn(g, " ");
|
|
|
|
if (gr_ctx != NULL) {
|
|
#ifdef CONFIG_DEBUG_FS
|
|
if ((g->ops.gr.ctxsw_prog.dump_ctxsw_stats != NULL) &&
|
|
nvgpu_gr_ctx_desc_dump_ctxsw_stats_on_channel_close(
|
|
g->gr->gr_ctx_desc)) {
|
|
g->ops.gr.ctxsw_prog.dump_ctxsw_stats(g,
|
|
nvgpu_gr_ctx_get_ctx_mem(gr_ctx));
|
|
}
|
|
#endif
|
|
|
|
nvgpu_gr_ctx_free(g, gr_ctx, g->gr->global_ctx_buffer, vm);
|
|
}
|
|
}
|
|
|
|
void nvgpu_gr_setup_free_subctx(struct nvgpu_channel *c)
|
|
{
|
|
nvgpu_log_fn(c->g, " ");
|
|
|
|
if (!nvgpu_is_enabled(c->g, NVGPU_SUPPORT_TSG_SUBCONTEXTS)) {
|
|
return;
|
|
}
|
|
|
|
if (c->subctx != NULL) {
|
|
nvgpu_gr_subctx_free(c->g, c->subctx, c->vm);
|
|
c->subctx = NULL;
|
|
}
|
|
}
|
|
|
|
static bool nvgpu_gr_setup_validate_preemption_mode(u32 *graphics_preempt_mode,
|
|
u32 *compute_preempt_mode,
|
|
struct nvgpu_gr_ctx *gr_ctx)
|
|
{
|
|
#ifdef CONFIG_NVGPU_GRAPHICS
|
|
/* skip setting anything if both modes are already set */
|
|
if ((*graphics_preempt_mode != 0U) &&
|
|
(*graphics_preempt_mode ==
|
|
nvgpu_gr_ctx_get_graphics_preemption_mode(gr_ctx))) {
|
|
*graphics_preempt_mode = 0;
|
|
}
|
|
#endif /* CONFIG_NVGPU_GRAPHICS */
|
|
|
|
if ((*compute_preempt_mode != 0U) &&
|
|
(*compute_preempt_mode ==
|
|
nvgpu_gr_ctx_get_compute_preemption_mode(gr_ctx))) {
|
|
*compute_preempt_mode = 0;
|
|
}
|
|
|
|
if ((*graphics_preempt_mode == 0U) && (*compute_preempt_mode == 0U)) {
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
|
|
int nvgpu_gr_setup_set_preemption_mode(struct nvgpu_channel *ch,
|
|
u32 graphics_preempt_mode,
|
|
u32 compute_preempt_mode)
|
|
{
|
|
struct nvgpu_gr_ctx *gr_ctx;
|
|
struct gk20a *g = ch->g;
|
|
struct nvgpu_tsg *tsg;
|
|
struct vm_gk20a *vm;
|
|
struct nvgpu_gr *gr;
|
|
u32 class_num;
|
|
int err = 0;
|
|
|
|
gr = nvgpu_gr_get_cur_instance_ptr(g);
|
|
|
|
class_num = ch->obj_class;
|
|
if (class_num == 0U) {
|
|
return -EINVAL;
|
|
}
|
|
|
|
if (!g->ops.gpu_class.is_valid(class_num)) {
|
|
nvgpu_err(g, "invalid obj class 0x%x", class_num);
|
|
return -EINVAL;
|
|
}
|
|
|
|
tsg = nvgpu_tsg_from_ch(ch);
|
|
if (tsg == NULL) {
|
|
return -EINVAL;
|
|
}
|
|
|
|
vm = tsg->vm;
|
|
gr_ctx = tsg->gr_ctx;
|
|
|
|
if (nvgpu_gr_setup_validate_preemption_mode(&graphics_preempt_mode,
|
|
&compute_preempt_mode, gr_ctx) == false) {
|
|
return 0;
|
|
}
|
|
|
|
nvgpu_log(g, gpu_dbg_gr | gpu_dbg_sched, "chid=%d tsgid=%d pid=%d "
|
|
"graphics_preempt_mode=%u compute_preempt_mode=%u",
|
|
ch->chid, ch->tsgid, ch->tgid,
|
|
graphics_preempt_mode, compute_preempt_mode);
|
|
|
|
err = nvgpu_gr_obj_ctx_set_ctxsw_preemption_mode(g, gr->config,
|
|
gr->gr_ctx_desc, gr_ctx, vm, class_num,
|
|
graphics_preempt_mode, compute_preempt_mode);
|
|
if (err != 0) {
|
|
nvgpu_err(g, "set_ctxsw_preemption_mode failed");
|
|
return err;
|
|
}
|
|
|
|
g->ops.tsg.disable(tsg);
|
|
|
|
err = nvgpu_preempt_channel(g, ch);
|
|
if (err != 0) {
|
|
nvgpu_err(g, "failed to preempt channel/TSG");
|
|
goto enable_ch;
|
|
}
|
|
|
|
nvgpu_gr_obj_ctx_update_ctxsw_preemption_mode(g, gr->config, gr_ctx,
|
|
ch->subctx);
|
|
|
|
if (!nvgpu_is_enabled(g, NVGPU_SUPPORT_MIG)) {
|
|
nvgpu_gr_ctx_patch_write_begin(g, gr_ctx, true);
|
|
g->ops.gr.init.commit_global_cb_manager(g, gr->config, gr_ctx,
|
|
true);
|
|
nvgpu_gr_ctx_patch_write_end(g, gr_ctx, true);
|
|
}
|
|
|
|
g->ops.tsg.enable(tsg);
|
|
|
|
return err;
|
|
|
|
enable_ch:
|
|
g->ops.tsg.enable(tsg);
|
|
return err;
|
|
}
|