Mirror of git://nv-tegra.nvidia.com/linux-nvgpu.git (synced 2025-12-24 10:34:43 +03:00)
gpu: nvgpu: vgpu: move common files out of linux folder
Most of the files have been moved out of the linux folder. More code can become common as HAL-ification goes on.

Jira EVLR-2364
Change-Id: Ia9dbdbc82f45ceefe5c788eac7517000cd455d5e
Signed-off-by: Richard Zhao <rizhao@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1649947
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Committed by: mobile promotions
Parent: 7932568b7f
Commit: 6393eddfa9
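Background for reading the diff below: nvgpu routes chip- and platform-specific behavior through a HAL table (struct gpu_ops), and the vgpu code installs or disables entries in that table; that is what lets these files leave the linux folder and become common. The standalone sketch below models that dispatch pattern; struct gpu_ops and the fields init_fifo_setup_hw/resetup_ramfc appear in this commit, while every other name is invented for illustration.

/*
 * Standalone model (not nvgpu source) of the HAL-override pattern this
 * commit relies on. Only struct gpu_ops, init_fifo_setup_hw and
 * resetup_ramfc are taken from the diff; the rest is simplified.
 */
#include <stdio.h>

struct gk20a;

struct gpu_ops {
	struct {
		int (*init_fifo_setup_hw)(struct gk20a *g);
		int (*resetup_ramfc)(struct gk20a *g);
	} fifo;
};

struct gk20a {
	struct gpu_ops ops;
};

static int vgpu_fifo_setup_hw_model(struct gk20a *g)
{
	(void)g;
	printf("vgpu fifo hw setup\n");
	return 0;
}

int main(void)
{
	struct gk20a g = {0};

	/* vgpu overrides: install its own hook and NULL out what the
	 * virtual GPU cannot support, much as vgpu_gp10b_init_fifo_ops()
	 * in this diff NULLs resetup_ramfc */
	g.ops.fifo.init_fifo_setup_hw = vgpu_fifo_setup_hw_model;
	g.ops.fifo.resetup_ramfc = NULL;

	/* common code guards optional hooks before calling, as
	 * vgpu_init_fifo_support() in this diff does */
	if (g.ops.fifo.init_fifo_setup_hw)
		return g.ops.fifo.init_fifo_setup_hw(&g);
	return 0;
}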
@@ -1,46 +0,0 @@
/*
 * Virtualized GPU CE2
 *
 * Copyright (c) 2015-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "vgpu.h"
#include "gk20a/channel_gk20a.h"

#include <nvgpu/bug.h>

int vgpu_ce2_nonstall_isr(struct gk20a *g,
			struct tegra_vgpu_ce2_nonstall_intr_info *info)
{
	gk20a_dbg_fn("");

	switch (info->type) {
	case TEGRA_VGPU_CE2_NONSTALL_INTR_NONBLOCKPIPE:
		gk20a_channel_semaphore_wakeup(g, true);
		break;
	default:
		WARN_ON(1);
		break;
	}

	return 0;
}

u32 vgpu_ce_get_num_pce(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	return priv->constants.num_pce;
}
@@ -16,8 +16,9 @@
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <nvgpu/vgpu/vgpu.h>

#include "gk20a/gk20a.h"
#include "vgpu.h"
#include "clk_vgpu.h"
#include "ctrl/ctrlclk.h"
#include "common/linux/platform_gk20a.h"

@@ -18,14 +18,14 @@
#include <nvgpu/vgpu/vgpu_ivm.h>
#include <nvgpu/vgpu/tegra_vgpu.h>
#include <uapi/linux/nvgpu.h>
#include <nvgpu/vgpu/vgpu.h>

#include "gk20a/gk20a.h"
#include "gk20a/channel_gk20a.h"
#include "gk20a/css_gr_gk20a.h"
#include "common/linux/platform_gk20a.h"
#include "common/linux/vgpu/vgpu.h"
#include "common/linux/vgpu/css_vgpu.h"
#include "common/linux/os_linux.h"
#include "vgpu/css_vgpu.h"

static struct tegra_hv_ivm_cookie *css_cookie;

@@ -1,34 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _CSS_VGPU_H_
#define _CSS_VGPU_H_

#include <nvgpu/types.h>

struct gr_gk20a;
struct channel_gk20a;
struct gk20a_cs_snapshot_client;

void vgpu_css_release_snapshot_buffer(struct gr_gk20a *gr);
int vgpu_css_flush_snapshots(struct channel_gk20a *ch,
		u32 *pending, bool *hw_overflow);
int vgpu_css_detach(struct channel_gk20a *ch,
		struct gk20a_cs_snapshot_client *cs_client);
int vgpu_css_enable_snapshot_buffer(struct channel_gk20a *ch,
		struct gk20a_cs_snapshot_client *cs_client);
u32 vgpu_css_get_buffer_size(struct gk20a *g);
#endif
@@ -1,209 +0,0 @@
/*
 * Copyright (c) 2015-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <nvgpu/vgpu/vgpu_ivc.h>
#include <nvgpu/vgpu/tegra_vgpu.h>

#include "gk20a/gk20a.h"
#include "gk20a/channel_gk20a.h"
#include "gk20a/dbg_gpu_gk20a.h"
#include "gk20a/regops_gk20a.h"
#include "vgpu.h"
#include "dbg_vgpu.h"

#include <nvgpu/bug.h>

int vgpu_exec_regops(struct dbg_session_gk20a *dbg_s,
		struct nvgpu_dbg_reg_op *ops,
		u64 num_ops)
{
	struct channel_gk20a *ch;
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_reg_ops_params *p = &msg.params.reg_ops;
	void *oob;
	size_t oob_size, ops_size;
	void *handle = NULL;
	int err = 0;

	gk20a_dbg_fn("");
	BUG_ON(sizeof(*ops) != sizeof(struct tegra_vgpu_reg_op));

	handle = vgpu_ivc_oob_get_ptr(vgpu_ivc_get_server_vmid(),
					TEGRA_VGPU_QUEUE_CMD,
					&oob, &oob_size);
	if (!handle)
		return -EINVAL;

	ops_size = sizeof(*ops) * num_ops;
	if (oob_size < ops_size) {
		err = -ENOMEM;
		goto fail;
	}

	memcpy(oob, ops, ops_size);

	msg.cmd = TEGRA_VGPU_CMD_REG_OPS;
	msg.handle = vgpu_get_handle(dbg_s->g);
	ch = nvgpu_dbg_gpu_get_session_channel(dbg_s);
	p->handle = ch ? ch->virt_ctx : 0;
	p->num_ops = num_ops;
	p->is_profiler = dbg_s->is_profiler;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (!err)
		memcpy(ops, oob, ops_size);

fail:
	vgpu_ivc_oob_put_ptr(handle);
	return err;
}

int vgpu_dbg_set_powergate(struct dbg_session_gk20a *dbg_s, bool disable_powergate)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_set_powergate_params *p = &msg.params.set_powergate;
	int err = 0;
	u32 mode;

	gk20a_dbg_fn("");

	/* Just return if requested mode is the same as the session's mode */
	if (disable_powergate) {
		if (dbg_s->is_pg_disabled)
			return 0;
		dbg_s->is_pg_disabled = true;
		mode = TEGRA_VGPU_POWERGATE_MODE_DISABLE;
	} else {
		if (!dbg_s->is_pg_disabled)
			return 0;
		dbg_s->is_pg_disabled = false;
		mode = TEGRA_VGPU_POWERGATE_MODE_ENABLE;
	}

	msg.cmd = TEGRA_VGPU_CMD_SET_POWERGATE;
	msg.handle = vgpu_get_handle(dbg_s->g);
	p->mode = mode;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	return err;
}

static int vgpu_sendrecv_prof_cmd(struct dbg_session_gk20a *dbg_s, u32 mode)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_prof_mgt_params *p = &msg.params.prof_management;
	int err = 0;

	msg.cmd = TEGRA_VGPU_CMD_PROF_MGT;
	msg.handle = vgpu_get_handle(dbg_s->g);

	p->mode = mode;

	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	return err;
}

bool vgpu_check_and_set_global_reservation(
				struct dbg_session_gk20a *dbg_s,
				struct dbg_profiler_object_data *prof_obj)
{
	struct gk20a *g = dbg_s->g;

	if (g->profiler_reservation_count > 0)
		return false;

	/* Check that another guest OS doesn't already have a reservation */
	if (!vgpu_sendrecv_prof_cmd(dbg_s, TEGRA_VGPU_PROF_GET_GLOBAL)) {
		g->global_profiler_reservation_held = true;
		g->profiler_reservation_count = 1;
		dbg_s->has_profiler_reservation = true;
		prof_obj->has_reservation = true;
		return true;
	}
	return false;
}

bool vgpu_check_and_set_context_reservation(
				struct dbg_session_gk20a *dbg_s,
				struct dbg_profiler_object_data *prof_obj)
{
	struct gk20a *g = dbg_s->g;

	/* Assumes that we've already checked that no global reservation
	 * is in effect for this guest.
	 *
	 * If our reservation count is non-zero, then no other guest has the
	 * global reservation; if it is zero, need to check with RM server.
	 *
	 */
	if ((g->profiler_reservation_count != 0) ||
		!vgpu_sendrecv_prof_cmd(dbg_s, TEGRA_VGPU_PROF_GET_CONTEXT)) {
		g->profiler_reservation_count++;
		dbg_s->has_profiler_reservation = true;
		prof_obj->has_reservation = true;
		return true;
	}
	return false;
}

void vgpu_release_profiler_reservation(
				struct dbg_session_gk20a *dbg_s,
				struct dbg_profiler_object_data *prof_obj)
{
	struct gk20a *g = dbg_s->g;

	dbg_s->has_profiler_reservation = false;
	prof_obj->has_reservation = false;
	if (prof_obj->ch == NULL)
		g->global_profiler_reservation_held = false;

	/* If new reservation count is zero, notify server */
	g->profiler_reservation_count--;
	if (g->profiler_reservation_count == 0)
		vgpu_sendrecv_prof_cmd(dbg_s, TEGRA_VGPU_PROF_RELEASE);
}

static int vgpu_sendrecv_perfbuf_cmd(struct gk20a *g, u64 offset, u32 size)
{
	struct mm_gk20a *mm = &g->mm;
	struct vm_gk20a *vm = mm->perfbuf.vm;
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_perfbuf_mgt_params *p =
					&msg.params.perfbuf_management;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_PERFBUF_MGT;
	msg.handle = vgpu_get_handle(g);

	p->vm_handle = vm->handle;
	p->offset = offset;
	p->size = size;

	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	return err;
}

int vgpu_perfbuffer_enable(struct gk20a *g, u64 offset, u32 size)
{
	return vgpu_sendrecv_perfbuf_cmd(g, offset, size);
}

int vgpu_perfbuffer_disable(struct gk20a *g)
{
	return vgpu_sendrecv_perfbuf_cmd(g, 0, 0);
}
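Every function in the hunk above follows the same RPC idiom: fill a tegra_vgpu_cmd_msg, send it to the RM server with vgpu_comm_sendrecv(), then fold the transport error and the server's return code together. A standalone model of that idiom, not nvgpu source: the struct here is a reduced stand-in (the real one carries a params union), and the fake transport is invented for illustration.

/*
 * Model of the "err = err ? err : msg.ret" pattern used throughout
 * this commit. Compiles and runs on its own.
 */
#include <errno.h>
#include <stdint.h>
#include <stdio.h>
#include <string.h>

struct cmd_msg_model {
	uint32_t cmd;
	uint64_t handle;
	int ret;			/* filled in by the server side */
};

/* fake transport: pretend the server rejects cmd 0 and accepts the rest */
static int sendrecv_model(struct cmd_msg_model *msg)
{
	msg->ret = (msg->cmd == 0) ? -EINVAL : 0;
	return 0;			/* the transport itself succeeded */
}

int main(void)
{
	struct cmd_msg_model msg;
	int err;

	memset(&msg, 0, sizeof(msg));
	msg.cmd = 0x30;			/* arbitrary command id */
	msg.handle = 0x1;		/* stands in for vgpu_get_handle(g) */

	err = sendrecv_model(&msg);
	err = err ? err : msg.ret;	/* the idiom used throughout */

	printf("err = %d\n", err);
	return 0;
}

The two failure paths stay distinguishable: a nonzero transport error wins, and only when the transport succeeded does the server's verdict become the result.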
@@ -1,41 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _DBG_VGPU_H_
#define _DBG_VGPU_H_

struct dbg_session_gk20a;
struct nvgpu_dbg_reg_op;
struct dbg_profiler_object_data;
struct gk20a;

int vgpu_exec_regops(struct dbg_session_gk20a *dbg_s,
		struct nvgpu_dbg_reg_op *ops,
		u64 num_ops);
int vgpu_dbg_set_powergate(struct dbg_session_gk20a *dbg_s, bool disable_powergate);
bool vgpu_check_and_set_global_reservation(
				struct dbg_session_gk20a *dbg_s,
				struct dbg_profiler_object_data *prof_obj);
bool vgpu_check_and_set_context_reservation(
				struct dbg_session_gk20a *dbg_s,
				struct dbg_profiler_object_data *prof_obj);

void vgpu_release_profiler_reservation(
				struct dbg_session_gk20a *dbg_s,
				struct dbg_profiler_object_data *prof_obj);
int vgpu_perfbuffer_enable(struct gk20a *g, u64 offset, u32 size);
int vgpu_perfbuffer_disable(struct gk20a *g);
#endif
@@ -22,11 +22,11 @@
#include <nvgpu/ctxsw_trace.h>
#include <nvgpu/vgpu/vgpu_ivm.h>
#include <nvgpu/vgpu/tegra_vgpu.h>
#include <nvgpu/vgpu/vgpu.h>

#include "gk20a/gk20a.h"
#include "common/linux/os_linux.h"
#include "vgpu.h"
#include "fecs_trace_vgpu.h"
#include "vgpu/fecs_trace_vgpu.h"

struct vgpu_fecs_trace {
	struct tegra_hv_ivm_cookie *cookie;

@@ -1,41 +0,0 @@
/*
 * Copyright (c) 2016-2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __FECS_TRACE_VGPU_H
#define __FECS_TRACE_VGPU_H

#include <nvgpu/types.h>

struct gk20a;
struct vm_area_struct;
struct nvgpu_ctxsw_trace_filter;

void vgpu_fecs_trace_data_update(struct gk20a *g);
int vgpu_fecs_trace_init(struct gk20a *g);
int vgpu_fecs_trace_deinit(struct gk20a *g);
int vgpu_fecs_trace_enable(struct gk20a *g);
int vgpu_fecs_trace_disable(struct gk20a *g);
bool vgpu_fecs_trace_is_enabled(struct gk20a *g);
int vgpu_fecs_trace_poll(struct gk20a *g);
int vgpu_alloc_user_buffer(struct gk20a *g, void **buf, size_t *size);
int vgpu_free_user_buffer(struct gk20a *g);
int vgpu_mmap_user_buffer(struct gk20a *g, struct vm_area_struct *vma);
int vgpu_fecs_trace_max_entries(struct gk20a *g,
		struct nvgpu_ctxsw_trace_filter *filter);
int vgpu_fecs_trace_set_filter(struct gk20a *g,
		struct nvgpu_ctxsw_trace_filter *filter);

#endif /* __FECS_TRACE_VGPU_H */
@@ -1,764 +0,0 @@
/*
 * Virtualized GPU Fifo
 *
 * Copyright (c) 2014-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <trace/events/gk20a.h>

#include <nvgpu/kmem.h>
#include <nvgpu/dma.h>
#include <nvgpu/atomic.h>
#include <nvgpu/bug.h>
#include <nvgpu/barrier.h>
#include <nvgpu/error_notifier.h>
#include <nvgpu/vgpu/vgpu_ivc.h>

#include "gk20a/gk20a.h"
#include "vgpu.h"
#include "fifo_vgpu.h"

#include <nvgpu/hw/gk20a/hw_fifo_gk20a.h>
#include <nvgpu/hw/gk20a/hw_ram_gk20a.h>

void vgpu_channel_bind(struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_channel_config_params *p =
			&msg.params.channel_config;
	int err;

	gk20a_dbg_info("bind channel %d", ch->chid);

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_BIND;
	msg.handle = vgpu_get_handle(ch->g);
	p->handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);

	nvgpu_smp_wmb();
	nvgpu_atomic_set(&ch->bound, true);
}

void vgpu_channel_unbind(struct channel_gk20a *ch)
{

	gk20a_dbg_fn("");

	if (nvgpu_atomic_cmpxchg(&ch->bound, true, false)) {
		struct tegra_vgpu_cmd_msg msg;
		struct tegra_vgpu_channel_config_params *p =
				&msg.params.channel_config;
		int err;

		msg.cmd = TEGRA_VGPU_CMD_CHANNEL_UNBIND;
		msg.handle = vgpu_get_handle(ch->g);
		p->handle = ch->virt_ctx;
		err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
		WARN_ON(err || msg.ret);
	}

}

int vgpu_channel_alloc_inst(struct gk20a *g, struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_channel_hwctx_params *p = &msg.params.channel_hwctx;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_ALLOC_HWCTX;
	msg.handle = vgpu_get_handle(g);
	p->id = ch->chid;
	p->pid = (u64)current->tgid;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	if (err || msg.ret) {
		nvgpu_err(g, "fail");
		return -ENOMEM;
	}

	ch->virt_ctx = p->handle;
	gk20a_dbg_fn("done");
	return 0;
}

void vgpu_channel_free_inst(struct gk20a *g, struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_channel_hwctx_params *p = &msg.params.channel_hwctx;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_FREE_HWCTX;
	msg.handle = vgpu_get_handle(g);
	p->handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
}

void vgpu_channel_enable(struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_channel_config_params *p =
			&msg.params.channel_config;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_ENABLE;
	msg.handle = vgpu_get_handle(ch->g);
	p->handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
}

void vgpu_channel_disable(struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_channel_config_params *p =
			&msg.params.channel_config;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_DISABLE;
	msg.handle = vgpu_get_handle(ch->g);
	p->handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
}

int vgpu_channel_setup_ramfc(struct channel_gk20a *ch, u64 gpfifo_base,
		u32 gpfifo_entries,
		unsigned long acquire_timeout, u32 flags)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_ramfc_params *p = &msg.params.ramfc;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_SETUP_RAMFC;
	msg.handle = vgpu_get_handle(ch->g);
	p->handle = ch->virt_ctx;
	p->gpfifo_va = gpfifo_base;
	p->num_entries = gpfifo_entries;
	p->userd_addr = ch->userd_iova;
	p->iova = 0;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));

	return (err || msg.ret) ? -ENOMEM : 0;
}

int vgpu_fifo_init_engine_info(struct fifo_gk20a *f)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(f->g);
	struct tegra_vgpu_engines_info *engines = &priv->constants.engines_info;
	u32 i;

	gk20a_dbg_fn("");

	if (engines->num_engines > TEGRA_VGPU_MAX_ENGINES) {
		nvgpu_err(f->g, "num_engines %d larger than max %d",
			engines->num_engines, TEGRA_VGPU_MAX_ENGINES);
		return -EINVAL;
	}

	f->num_engines = engines->num_engines;
	for (i = 0; i < f->num_engines; i++) {
		struct fifo_engine_info_gk20a *info =
			&f->engine_info[engines->info[i].engine_id];

		if (engines->info[i].engine_id >= f->max_engines) {
			nvgpu_err(f->g, "engine id %d larger than max %d",
				engines->info[i].engine_id,
				f->max_engines);
			return -EINVAL;
		}

		info->intr_mask = engines->info[i].intr_mask;
		info->reset_mask = engines->info[i].reset_mask;
		info->runlist_id = engines->info[i].runlist_id;
		info->pbdma_id = engines->info[i].pbdma_id;
		info->inst_id = engines->info[i].inst_id;
		info->pri_base = engines->info[i].pri_base;
		info->engine_enum = engines->info[i].engine_enum;
		info->fault_id = engines->info[i].fault_id;
		f->active_engines_list[i] = engines->info[i].engine_id;
	}

	gk20a_dbg_fn("done");

	return 0;
}

static int init_runlist(struct gk20a *g, struct fifo_gk20a *f)
{
	struct fifo_runlist_info_gk20a *runlist;
	unsigned int runlist_id = -1;
	u32 i;
	u64 runlist_size;

	gk20a_dbg_fn("");

	f->max_runlists = g->ops.fifo.eng_runlist_base_size();
	f->runlist_info = nvgpu_kzalloc(g,
				sizeof(struct fifo_runlist_info_gk20a) *
				f->max_runlists);
	if (!f->runlist_info)
		goto clean_up_runlist;

	memset(f->runlist_info, 0, (sizeof(struct fifo_runlist_info_gk20a) *
		f->max_runlists));

	for (runlist_id = 0; runlist_id < f->max_runlists; runlist_id++) {
		runlist = &f->runlist_info[runlist_id];

		runlist->active_channels =
			nvgpu_kzalloc(g, DIV_ROUND_UP(f->num_channels,
						      BITS_PER_BYTE));
		if (!runlist->active_channels)
			goto clean_up_runlist;

		runlist_size = sizeof(u16) * f->num_channels;
		for (i = 0; i < MAX_RUNLIST_BUFFERS; i++) {
			int err = nvgpu_dma_alloc_sys(g, runlist_size,
						      &runlist->mem[i]);
			if (err) {
				nvgpu_err(g, "memory allocation failed");
				goto clean_up_runlist;
			}
		}
		nvgpu_mutex_init(&runlist->mutex);

		/* None of buffers is pinned if this value doesn't change.
		   Otherwise, one of them (cur_buffer) must have been pinned. */
		runlist->cur_buffer = MAX_RUNLIST_BUFFERS;
	}

	gk20a_dbg_fn("done");
	return 0;

clean_up_runlist:
	gk20a_fifo_delete_runlist(f);
	gk20a_dbg_fn("fail");
	return -ENOMEM;
}

static int vgpu_init_fifo_setup_sw(struct gk20a *g)
{
	struct fifo_gk20a *f = &g->fifo;
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);
	unsigned int chid;
	int err = 0;

	gk20a_dbg_fn("");

	if (f->sw_ready) {
		gk20a_dbg_fn("skip init");
		return 0;
	}

	f->g = g;
	f->num_channels = priv->constants.num_channels;
	f->max_engines = nvgpu_get_litter_value(g, GPU_LIT_HOST_NUM_ENGINES);

	f->userd_entry_size = 1 << ram_userd_base_shift_v();

	err = nvgpu_dma_alloc_sys(g, f->userd_entry_size * f->num_channels,
			&f->userd);
	if (err) {
		nvgpu_err(g, "memory allocation failed");
		goto clean_up;
	}

	/* bar1 va */
	if (g->ops.mm.is_bar1_supported(g)) {
		f->userd.gpu_va = vgpu_bar1_map(g, &f->userd);
		if (!f->userd.gpu_va) {
			nvgpu_err(g, "gmmu mapping failed");
			goto clean_up;
		}
		/* if reduced BAR1 range is specified, use offset of 0
		 * (server returns offset assuming full BAR1 range)
		 */
		if (vgpu_is_reduced_bar1(g))
			f->userd.gpu_va = 0;
	}

	gk20a_dbg(gpu_dbg_map_v, "userd bar1 va = 0x%llx", f->userd.gpu_va);

	f->channel = nvgpu_vzalloc(g, f->num_channels * sizeof(*f->channel));
	f->tsg = nvgpu_vzalloc(g, f->num_channels * sizeof(*f->tsg));
	f->engine_info = nvgpu_kzalloc(g, f->max_engines *
				sizeof(*f->engine_info));
	f->active_engines_list = nvgpu_kzalloc(g, f->max_engines * sizeof(u32));

	if (!(f->channel && f->tsg && f->engine_info && f->active_engines_list)) {
		err = -ENOMEM;
		goto clean_up;
	}
	memset(f->active_engines_list, 0xff, (f->max_engines * sizeof(u32)));

	g->ops.fifo.init_engine_info(f);

	init_runlist(g, f);

	nvgpu_init_list_node(&f->free_chs);
	nvgpu_mutex_init(&f->free_chs_mutex);

	for (chid = 0; chid < f->num_channels; chid++) {
		f->channel[chid].userd_iova =
			nvgpu_mem_get_addr(g, &f->userd) +
			chid * f->userd_entry_size;
		f->channel[chid].userd_gpu_va =
			f->userd.gpu_va + chid * f->userd_entry_size;

		gk20a_init_channel_support(g, chid);
		gk20a_init_tsg_support(g, chid);
	}
	nvgpu_mutex_init(&f->tsg_inuse_mutex);

	err = nvgpu_channel_worker_init(g);
	if (err)
		goto clean_up;

	f->deferred_reset_pending = false;
	nvgpu_mutex_init(&f->deferred_reset_mutex);

	f->channel_base = priv->constants.channel_base;

	f->sw_ready = true;

	gk20a_dbg_fn("done");
	return 0;

clean_up:
	gk20a_dbg_fn("fail");
	/* FIXME: unmap from bar1 */
	nvgpu_dma_free(g, &f->userd);

	memset(&f->userd, 0, sizeof(f->userd));

	nvgpu_vfree(g, f->channel);
	f->channel = NULL;
	nvgpu_vfree(g, f->tsg);
	f->tsg = NULL;
	nvgpu_kfree(g, f->engine_info);
	f->engine_info = NULL;
	nvgpu_kfree(g, f->active_engines_list);
	f->active_engines_list = NULL;

	return err;
}

int vgpu_init_fifo_setup_hw(struct gk20a *g)
{
	gk20a_dbg_fn("");

	/* test write, read through bar1 @ userd region before
	 * turning on the snooping */
	{
		struct fifo_gk20a *f = &g->fifo;
		u32 v, v1 = 0x33, v2 = 0x55;

		u32 bar1_vaddr = f->userd.gpu_va;
		volatile u32 *cpu_vaddr = f->userd.cpu_va;

		gk20a_dbg_info("test bar1 @ vaddr 0x%x",
			   bar1_vaddr);

		v = gk20a_bar1_readl(g, bar1_vaddr);

		*cpu_vaddr = v1;
		nvgpu_mb();

		if (v1 != gk20a_bar1_readl(g, bar1_vaddr)) {
			nvgpu_err(g, "bar1 broken @ gk20a!");
			return -EINVAL;
		}

		gk20a_bar1_writel(g, bar1_vaddr, v2);

		if (v2 != gk20a_bar1_readl(g, bar1_vaddr)) {
			nvgpu_err(g, "bar1 broken @ gk20a!");
			return -EINVAL;
		}

		/* is it visible to the cpu? */
		if (*cpu_vaddr != v2) {
			nvgpu_err(g, "cpu didn't see bar1 write @ %p!",
				cpu_vaddr);
		}

		/* put it back */
		gk20a_bar1_writel(g, bar1_vaddr, v);
	}

	gk20a_dbg_fn("done");

	return 0;
}

int vgpu_init_fifo_support(struct gk20a *g)
{
	u32 err;

	gk20a_dbg_fn("");

	err = vgpu_init_fifo_setup_sw(g);
	if (err)
		return err;

	if (g->ops.fifo.init_fifo_setup_hw)
		err = g->ops.fifo.init_fifo_setup_hw(g);
	return err;
}

int vgpu_fifo_preempt_channel(struct gk20a *g, u32 chid)
{
	struct fifo_gk20a *f = &g->fifo;
	struct channel_gk20a *ch = &f->channel[chid];
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_channel_config_params *p =
			&msg.params.channel_config;
	int err;

	gk20a_dbg_fn("");

	if (!nvgpu_atomic_read(&ch->bound))
		return 0;

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_PREEMPT;
	msg.handle = vgpu_get_handle(g);
	p->handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));

	if (err || msg.ret) {
		nvgpu_err(g,
			"preempt channel %d failed", chid);
		err = -ENOMEM;
	}

	return err;
}

int vgpu_fifo_preempt_tsg(struct gk20a *g, u32 tsgid)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_tsg_preempt_params *p =
			&msg.params.tsg_preempt;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_TSG_PREEMPT;
	msg.handle = vgpu_get_handle(g);
	p->tsg_id = tsgid;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;

	if (err) {
		nvgpu_err(g,
			"preempt tsg %u failed", tsgid);
	}

	return err;
}

static int vgpu_submit_runlist(struct gk20a *g, u64 handle, u8 runlist_id,
			       u16 *runlist, u32 num_entries)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_runlist_params *p;
	int err;
	void *oob_handle;
	void *oob;
	size_t size, oob_size;

	oob_handle = vgpu_ivc_oob_get_ptr(vgpu_ivc_get_server_vmid(),
					  TEGRA_VGPU_QUEUE_CMD,
					  &oob, &oob_size);
	if (!oob_handle)
		return -EINVAL;

	size = sizeof(*runlist) * num_entries;
	if (oob_size < size) {
		err = -ENOMEM;
		goto done;
	}

	msg.cmd = TEGRA_VGPU_CMD_SUBMIT_RUNLIST;
	msg.handle = handle;
	p = &msg.params.runlist;
	p->runlist_id = runlist_id;
	p->num_entries = num_entries;

	memcpy(oob, runlist, size);
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));

	err = (err || msg.ret) ? -1 : 0;

done:
	vgpu_ivc_oob_put_ptr(oob_handle);
	return err;
}

static int vgpu_fifo_update_runlist_locked(struct gk20a *g, u32 runlist_id,
					   u32 chid, bool add,
					   bool wait_for_finish)
{
	struct fifo_gk20a *f = &g->fifo;
	struct fifo_runlist_info_gk20a *runlist;
	u16 *runlist_entry = NULL;
	u32 count = 0;

	gk20a_dbg_fn("");

	runlist = &f->runlist_info[runlist_id];

	/* valid channel, add/remove it from active list.
	   Otherwise, keep active list untouched for suspend/resume. */
	if (chid != (u32)~0) {
		if (add) {
			if (test_and_set_bit(chid,
				runlist->active_channels) == 1)
				return 0;
		} else {
			if (test_and_clear_bit(chid,
				runlist->active_channels) == 0)
				return 0;
		}
	}

	if (chid != (u32)~0 || /* add/remove a valid channel */
	    add /* resume to add all channels back */) {
		u32 cid;

		runlist_entry = runlist->mem[0].cpu_va;
		for_each_set_bit(cid,
				runlist->active_channels, f->num_channels) {
			gk20a_dbg_info("add channel %d to runlist", cid);
			runlist_entry[0] = cid;
			runlist_entry++;
			count++;
		}
	} else /* suspend to remove all channels */
		count = 0;

	return vgpu_submit_runlist(g, vgpu_get_handle(g), runlist_id,
				   runlist->mem[0].cpu_va, count);
}

/* add/remove a channel from runlist
   special cases below: runlist->active_channels will NOT be changed.
   (chid == ~0 && !add) means remove all active channels from runlist.
   (chid == ~0 && add) means restore all active channels on runlist. */
int vgpu_fifo_update_runlist(struct gk20a *g, u32 runlist_id,
			     u32 chid, bool add, bool wait_for_finish)
{
	struct fifo_runlist_info_gk20a *runlist = NULL;
	struct fifo_gk20a *f = &g->fifo;
	u32 ret = 0;

	gk20a_dbg_fn("");

	runlist = &f->runlist_info[runlist_id];

	nvgpu_mutex_acquire(&runlist->mutex);

	ret = vgpu_fifo_update_runlist_locked(g, runlist_id, chid, add,
					wait_for_finish);

	nvgpu_mutex_release(&runlist->mutex);
	return ret;
}

int vgpu_fifo_wait_engine_idle(struct gk20a *g)
{
	gk20a_dbg_fn("");

	return 0;
}

int vgpu_fifo_set_runlist_interleave(struct gk20a *g,
					u32 id,
					u32 runlist_id,
					u32 new_level)
{
	struct tegra_vgpu_cmd_msg msg = {0};
	struct tegra_vgpu_tsg_runlist_interleave_params *p =
			&msg.params.tsg_interleave;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_TSG_SET_RUNLIST_INTERLEAVE;
	msg.handle = vgpu_get_handle(g);
	p->tsg_id = id;
	p->level = new_level;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
	return err ? err : msg.ret;
}

int vgpu_fifo_force_reset_ch(struct channel_gk20a *ch,
				u32 err_code, bool verbose)
{
	struct tsg_gk20a *tsg = NULL;
	struct channel_gk20a *ch_tsg = NULL;
	struct gk20a *g = ch->g;
	struct tegra_vgpu_cmd_msg msg = {0};
	struct tegra_vgpu_channel_config_params *p =
			&msg.params.channel_config;
	int err;

	gk20a_dbg_fn("");

	if (gk20a_is_channel_marked_as_tsg(ch)) {
		tsg = &g->fifo.tsg[ch->tsgid];

		nvgpu_rwsem_down_read(&tsg->ch_list_lock);

		nvgpu_list_for_each_entry(ch_tsg, &tsg->ch_list,
				channel_gk20a, ch_entry) {
			if (gk20a_channel_get(ch_tsg)) {
				nvgpu_set_error_notifier(ch_tsg, err_code);
				ch_tsg->has_timedout = true;
				gk20a_channel_put(ch_tsg);
			}
		}

		nvgpu_rwsem_up_read(&tsg->ch_list_lock);
	} else {
		nvgpu_set_error_notifier(ch, err_code);
		ch->has_timedout = true;
	}

	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_FORCE_RESET;
	msg.handle = vgpu_get_handle(ch->g);
	p->handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
	if (!err)
		gk20a_channel_abort(ch, false);
	return err ? err : msg.ret;
}

static void vgpu_fifo_set_ctx_mmu_error_ch(struct gk20a *g,
		struct channel_gk20a *ch)
{
	/*
	 * If error code is already set, this mmu fault
	 * was triggered as part of recovery from other
	 * error condition.
	 * Don't overwrite error flag.
	 */
	nvgpu_set_error_notifier_if_empty(ch,
		NVGPU_ERR_NOTIFIER_FIFO_ERROR_MMU_ERR_FLT);

	/* mark channel as faulted */
	ch->has_timedout = true;
	nvgpu_smp_wmb();
	/* unblock pending waits */
	nvgpu_cond_broadcast_interruptible(&ch->semaphore_wq);
	nvgpu_cond_broadcast_interruptible(&ch->notifier_wq);
}

static void vgpu_fifo_set_ctx_mmu_error_ch_tsg(struct gk20a *g,
		struct channel_gk20a *ch)
{
	struct tsg_gk20a *tsg = NULL;
	struct channel_gk20a *ch_tsg = NULL;

	if (gk20a_is_channel_marked_as_tsg(ch)) {
		tsg = &g->fifo.tsg[ch->tsgid];

		nvgpu_rwsem_down_read(&tsg->ch_list_lock);

		nvgpu_list_for_each_entry(ch_tsg, &tsg->ch_list,
				channel_gk20a, ch_entry) {
			if (gk20a_channel_get(ch_tsg)) {
				vgpu_fifo_set_ctx_mmu_error_ch(g, ch_tsg);
				gk20a_channel_put(ch_tsg);
			}
		}

		nvgpu_rwsem_up_read(&tsg->ch_list_lock);
	} else {
		vgpu_fifo_set_ctx_mmu_error_ch(g, ch);
	}
}

int vgpu_fifo_isr(struct gk20a *g, struct tegra_vgpu_fifo_intr_info *info)
{
	struct fifo_gk20a *f = &g->fifo;
	struct channel_gk20a *ch = gk20a_channel_get(&f->channel[info->chid]);

	gk20a_dbg_fn("");
	if (!ch)
		return 0;

	nvgpu_err(g, "fifo intr (%d) on ch %u",
		info->type, info->chid);

	trace_gk20a_channel_reset(ch->chid, ch->tsgid);

	switch (info->type) {
	case TEGRA_VGPU_FIFO_INTR_PBDMA:
		nvgpu_set_error_notifier(ch, NVGPU_ERR_NOTIFIER_PBDMA_ERROR);
		break;
	case TEGRA_VGPU_FIFO_INTR_CTXSW_TIMEOUT:
		nvgpu_set_error_notifier(ch,
			NVGPU_ERR_NOTIFIER_FIFO_ERROR_IDLE_TIMEOUT);
		break;
	case TEGRA_VGPU_FIFO_INTR_MMU_FAULT:
		vgpu_fifo_set_ctx_mmu_error_ch_tsg(g, ch);
		gk20a_channel_abort(ch, false);
		break;
	default:
		WARN_ON(1);
		break;
	}

	gk20a_channel_put(ch);
	return 0;
}

int vgpu_fifo_nonstall_isr(struct gk20a *g,
			struct tegra_vgpu_fifo_nonstall_intr_info *info)
{
	gk20a_dbg_fn("");

	switch (info->type) {
	case TEGRA_VGPU_FIFO_NONSTALL_INTR_CHANNEL:
		gk20a_channel_semaphore_wakeup(g, false);
		break;
	default:
		WARN_ON(1);
		break;
	}

	return 0;
}

u32 vgpu_fifo_default_timeslice_us(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	return priv->constants.default_timeslice_us;
}
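The runlist-update comment above explains the core data flow: active channels live in a per-runlist bitmap, and each submission packs the set bits into a dense u16 array handed to the server. A standalone model of just that computation, not nvgpu source; test_and_set() below is a plain-C stand-in for the kernel's test_and_set_bit() and the loop stands in for for_each_set_bit().

/*
 * Model of the bitmap-to-dense-runlist packing done by
 * vgpu_fifo_update_runlist_locked(). Compiles and runs on its own.
 */
#include <stdint.h>
#include <stdio.h>

#define NUM_CHANNELS 32u

static int test_and_set(uint32_t *bitmap, unsigned int bit)
{
	int was_set = (*bitmap >> bit) & 1u;

	*bitmap |= 1u << bit;
	return was_set;
}

int main(void)
{
	uint32_t active = 0;
	uint16_t runlist[NUM_CHANNELS];
	unsigned int count = 0, cid;

	/* "add" channels 3 and 7; re-adding 3 reports it was already
	 * present, which is where the real code returns early */
	test_and_set(&active, 3);
	test_and_set(&active, 7);
	if (test_and_set(&active, 3))
		printf("channel 3 already on the runlist, no rebuild\n");

	/* pack the set bits into the dense entry array, as the
	 * for_each_set_bit() loop in the diff does */
	for (cid = 0; cid < NUM_CHANNELS; cid++)
		if ((active >> cid) & 1u)
			runlist[count++] = (uint16_t)cid;

	printf("submitting %u entries, first = %u\n", count, runlist[0]);
	return 0;
}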
@@ -1,59 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _FIFO_VGPU_H_
#define _FIFO_VGPU_H_

#include <nvgpu/types.h>

struct gk20a;
struct channel_gk20a;
struct fifo_gk20a;
struct tsg_gk20a;

int vgpu_init_fifo_setup_hw(struct gk20a *g);
void vgpu_channel_bind(struct channel_gk20a *ch);
void vgpu_channel_unbind(struct channel_gk20a *ch);
int vgpu_channel_alloc_inst(struct gk20a *g, struct channel_gk20a *ch);
void vgpu_channel_free_inst(struct gk20a *g, struct channel_gk20a *ch);
void vgpu_channel_enable(struct channel_gk20a *ch);
void vgpu_channel_disable(struct channel_gk20a *ch);
int vgpu_channel_setup_ramfc(struct channel_gk20a *ch, u64 gpfifo_base,
		u32 gpfifo_entries,
		unsigned long acquire_timeout, u32 flags);
int vgpu_fifo_init_engine_info(struct fifo_gk20a *f);
int vgpu_fifo_preempt_channel(struct gk20a *g, u32 chid);
int vgpu_fifo_preempt_tsg(struct gk20a *g, u32 tsgid);
int vgpu_fifo_update_runlist(struct gk20a *g, u32 runlist_id,
		u32 chid, bool add, bool wait_for_finish);
int vgpu_fifo_wait_engine_idle(struct gk20a *g);
int vgpu_fifo_set_runlist_interleave(struct gk20a *g,
		u32 id,
		u32 runlist_id,
		u32 new_level);
int vgpu_channel_set_timeslice(struct channel_gk20a *ch, u32 timeslice);
int vgpu_fifo_force_reset_ch(struct channel_gk20a *ch,
		u32 err_code, bool verbose);
u32 vgpu_fifo_default_timeslice_us(struct gk20a *g);
int vgpu_tsg_open(struct tsg_gk20a *tsg);
void vgpu_tsg_release(struct tsg_gk20a *tsg);
int vgpu_tsg_bind_channel(struct tsg_gk20a *tsg,
		struct channel_gk20a *ch);
int vgpu_tsg_unbind_channel(struct channel_gk20a *ch);
int vgpu_tsg_set_timeslice(struct tsg_gk20a *tsg, u32 timeslice);
int vgpu_enable_tsg(struct tsg_gk20a *tsg);

#endif
@@ -1,42 +0,0 @@
/*
 * Copyright (c) 2015-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <nvgpu/enabled.h>

#include "gk20a/gk20a.h"
#include "gk20a/css_gr_gk20a.h"
#include "common/linux/vgpu/css_vgpu.h"
#include "vgpu_gr_gm20b.h"

void vgpu_gr_gm20b_init_cyclestats(struct gk20a *g)
{
#if defined(CONFIG_GK20A_CYCLE_STATS)
	bool snapshots_supported = true;

	/* cyclestats not supported on vgpu */
	__nvgpu_set_enabled(g, NVGPU_SUPPORT_CYCLE_STATS, false);

	g->gr.max_css_buffer_size = vgpu_css_get_buffer_size(g);

	/* snapshots not supported if the buffer size is 0 */
	if (g->gr.max_css_buffer_size == 0)
		snapshots_supported = false;

	__nvgpu_set_enabled(g, NVGPU_SUPPORT_CYCLE_STATS_SNAPSHOT,
			snapshots_supported);
#endif
}

@@ -1,24 +0,0 @@
/*
 * Copyright (c) 2015-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __VGPU_GR_GM20B_H__
#define __VGPU_GR_GM20B_H__

#include "gk20a/gk20a.h"

void vgpu_gr_gm20b_init_cyclestats(struct gk20a *g);

#endif
@@ -1,24 +0,0 @@
/*
 * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "vgpu_fifo_gp10b.h"

void vgpu_gp10b_init_fifo_ops(struct gpu_ops *gops)
{
	/* syncpoint protection not supported yet */
	gops->fifo.resetup_ramfc = NULL;
	gops->fifo.reschedule_runlist = NULL;
}
@@ -1,38 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */

#include <nvgpu/enabled.h>

#include "gk20a/gk20a.h"

int vgpu_gp10b_fuse_check_priv_security(struct gk20a *g)
{
	if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) {
		__nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false);
		__nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false);
	} else {
		__nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
		__nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true);
	}

	return 0;
}
@@ -1,30 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */

#ifndef _VGPU_GP10B_FUSE
#define _VGPU_GP10B_FUSE

struct gk20a;

int vgpu_gp10b_fuse_check_priv_security(struct gk20a *g);

#endif
@@ -1,302 +0,0 @@
|
||||
/*
|
||||
* Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved.
|
||||
*
|
||||
* This program is free software; you can redistribute it and/or modify it
|
||||
* under the terms and conditions of the GNU General Public License,
|
||||
* version 2, as published by the Free Software Foundation.
|
||||
*
|
||||
* This program is distributed in the hope it will be useful, but WITHOUT
|
||||
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
||||
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||
* more details.
|
||||
*
|
||||
* You should have received a copy of the GNU General Public License
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
*/
|
||||
|
||||
#include <nvgpu/kmem.h>
|
||||
#include <nvgpu/dma.h>
|
||||
#include <nvgpu/bug.h>
|
||||
|
||||
#include "common/linux/vgpu/vgpu.h"
|
||||
#include "common/linux/vgpu/gm20b/vgpu_gr_gm20b.h"
|
||||
|
||||
#include "gp10b/gr_gp10b.h"
|
||||
#include "vgpu_gr_gp10b.h"
|
||||
|
||||
#include <nvgpu/hw/gp10b/hw_gr_gp10b.h>
|
||||
|
||||
int vgpu_gr_gp10b_alloc_gr_ctx(struct gk20a *g,
|
||||
struct nvgpu_gr_ctx *gr_ctx,
|
||||
struct vm_gk20a *vm,
|
||||
u32 class,
|
||||
u32 flags)
|
||||
{
|
||||
u32 graphics_preempt_mode = 0;
|
||||
u32 compute_preempt_mode = 0;
|
||||
struct vgpu_priv_data *priv = vgpu_get_priv_data(g);
|
||||
int err;
|
||||
|
||||
gk20a_dbg_fn("");
|
||||
|
||||
err = vgpu_gr_alloc_gr_ctx(g, gr_ctx, vm, class, flags);
|
||||
if (err)
|
||||
return err;
|
||||
|
||||
if (flags & NVGPU_OBJ_CTX_FLAGS_SUPPORT_GFXP)
|
||||
graphics_preempt_mode = NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP;
|
||||
if (flags & NVGPU_OBJ_CTX_FLAGS_SUPPORT_CILP)
|
||||
compute_preempt_mode = NVGPU_PREEMPTION_MODE_COMPUTE_CILP;
|
||||
|
||||
if (priv->constants.force_preempt_mode && !graphics_preempt_mode &&
|
||||
!compute_preempt_mode) {
|
||||
graphics_preempt_mode = g->ops.gr.is_valid_gfx_class(g, class) ?
|
||||
NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP : 0;
|
||||
compute_preempt_mode =
|
||||
g->ops.gr.is_valid_compute_class(g, class) ?
|
||||
NVGPU_PREEMPTION_MODE_COMPUTE_CTA : 0;
|
||||
}
|
||||
|
||||
if (graphics_preempt_mode || compute_preempt_mode) {
|
||||
if (g->ops.gr.set_ctxsw_preemption_mode) {
|
||||
err = g->ops.gr.set_ctxsw_preemption_mode(g, gr_ctx, vm,
|
||||
class, graphics_preempt_mode, compute_preempt_mode);
|
||||
if (err) {
|
||||
nvgpu_err(g,
|
||||
"set_ctxsw_preemption_mode failed");
|
||||
goto fail;
|
||||
}
|
||||
} else {
|
||||
err = -ENOSYS;
|
||||
goto fail;
|
||||
}
|
||||
}
|
||||
|
||||
gk20a_dbg_fn("done");
|
||||
return err;
|
||||
|
||||
fail:
|
||||
vgpu_gr_free_gr_ctx(g, vm, gr_ctx);
|
||||
return err;
|
||||
}
|
||||
|
||||
int vgpu_gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g,
|
||||
struct nvgpu_gr_ctx *gr_ctx,
|
||||
struct vm_gk20a *vm, u32 class,
|
||||
u32 graphics_preempt_mode,
|
||||
u32 compute_preempt_mode)
|
||||
{
|
||||
struct tegra_vgpu_cmd_msg msg = {};
|
||||
struct tegra_vgpu_gr_bind_ctxsw_buffers_params *p =
|
||||
&msg.params.gr_bind_ctxsw_buffers;
|
||||
int err = 0;
|
||||
|
||||
if (g->ops.gr.is_valid_gfx_class(g, class) &&
|
||||
g->gr.ctx_vars.force_preemption_gfxp)
|
||||
graphics_preempt_mode = NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP;
|
||||
|
||||
if (g->ops.gr.is_valid_compute_class(g, class) &&
|
||||
g->gr.ctx_vars.force_preemption_cilp)
|
||||
compute_preempt_mode = NVGPU_PREEMPTION_MODE_COMPUTE_CILP;
|
||||
|
||||
/* check for invalid combinations */
|
||||
if ((graphics_preempt_mode == 0) && (compute_preempt_mode == 0))
|
||||
return -EINVAL;
|
||||
|
||||
if ((graphics_preempt_mode == NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP) &&
|
||||
(compute_preempt_mode == NVGPU_PREEMPTION_MODE_COMPUTE_CILP))
|
||||
return -EINVAL;
|
||||
|
||||
/* set preemption modes */
|
||||
switch (graphics_preempt_mode) {
|
||||
case NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP:
|
||||
{
|
||||
u32 spill_size =
|
||||
gr_gpc0_swdx_rm_spill_buffer_size_256b_default_v() *
|
||||
gr_gpc0_swdx_rm_spill_buffer_size_256b_byte_granularity_v();
|
||||
u32 pagepool_size = g->ops.gr.pagepool_default_size(g) *
|
||||
gr_scc_pagepool_total_pages_byte_granularity_v();
|
||||
u32 betacb_size = g->gr.attrib_cb_default_size +
|
||||
(gr_gpc0_ppc0_cbm_beta_cb_size_v_gfxp_v() -
|
||||
gr_gpc0_ppc0_cbm_beta_cb_size_v_default_v());
|
||||
u32 attrib_cb_size = (betacb_size + g->gr.alpha_cb_size) *
|
||||
gr_gpc0_ppc0_cbm_beta_cb_size_v_granularity_v() *
|
||||
g->gr.max_tpc_count;
|
||||
struct nvgpu_mem *desc;
|
||||
|
||||
attrib_cb_size = ALIGN(attrib_cb_size, 128);
|
||||
|
||||
gk20a_dbg_info("gfxp context preempt size=%d",
|
||||
g->gr.ctx_vars.preempt_image_size);
|
||||
gk20a_dbg_info("gfxp context spill size=%d", spill_size);
|
||||
gk20a_dbg_info("gfxp context pagepool size=%d", pagepool_size);
|
||||
gk20a_dbg_info("gfxp context attrib cb size=%d",
|
||||
attrib_cb_size);
|
||||
|
||||
err = gr_gp10b_alloc_buffer(vm,
|
||||
g->gr.ctx_vars.preempt_image_size,
|
||||
&gr_ctx->preempt_ctxsw_buffer);
|
||||
if (err) {
|
||||
err = -ENOMEM;
|
||||
goto fail;
|
||||
}
|
||||
desc = &gr_ctx->preempt_ctxsw_buffer;
|
||||
p->gpu_va[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_MAIN] = desc->gpu_va;
|
||||
p->size[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_MAIN] = desc->size;
|
||||
|
		err = gr_gp10b_alloc_buffer(vm,
				spill_size,
				&gr_ctx->spill_ctxsw_buffer);
		if (err) {
			err = -ENOMEM;
			goto fail;
		}
		desc = &gr_ctx->spill_ctxsw_buffer;
		p->gpu_va[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_SPILL] = desc->gpu_va;
		p->size[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_SPILL] = desc->size;

		err = gr_gp10b_alloc_buffer(vm,
				pagepool_size,
				&gr_ctx->pagepool_ctxsw_buffer);
		if (err) {
			err = -ENOMEM;
			goto fail;
		}
		desc = &gr_ctx->pagepool_ctxsw_buffer;
		p->gpu_va[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_PAGEPOOL] =
			desc->gpu_va;
		p->size[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_PAGEPOOL] = desc->size;

		err = gr_gp10b_alloc_buffer(vm,
				attrib_cb_size,
				&gr_ctx->betacb_ctxsw_buffer);
		if (err) {
			err = -ENOMEM;
			goto fail;
		}
		desc = &gr_ctx->betacb_ctxsw_buffer;
		p->gpu_va[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_BETACB] =
			desc->gpu_va;
		p->size[TEGRA_VGPU_GR_BIND_CTXSW_BUFFER_BETACB] = desc->size;

		gr_ctx->graphics_preempt_mode = NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP;
		p->mode = TEGRA_VGPU_GR_CTXSW_PREEMPTION_MODE_GFX_GFXP;
		break;
	}
	case NVGPU_PREEMPTION_MODE_GRAPHICS_WFI:
		gr_ctx->graphics_preempt_mode = graphics_preempt_mode;
		break;

	default:
		break;
	}

	if (g->ops.gr.is_valid_compute_class(g, class)) {
		switch (compute_preempt_mode) {
		case NVGPU_PREEMPTION_MODE_COMPUTE_WFI:
			gr_ctx->compute_preempt_mode =
				NVGPU_PREEMPTION_MODE_COMPUTE_WFI;
			p->mode = TEGRA_VGPU_GR_CTXSW_PREEMPTION_MODE_WFI;
			break;
		case NVGPU_PREEMPTION_MODE_COMPUTE_CTA:
			gr_ctx->compute_preempt_mode =
				NVGPU_PREEMPTION_MODE_COMPUTE_CTA;
			p->mode =
				TEGRA_VGPU_GR_CTXSW_PREEMPTION_MODE_COMPUTE_CTA;
			break;
		case NVGPU_PREEMPTION_MODE_COMPUTE_CILP:
			gr_ctx->compute_preempt_mode =
				NVGPU_PREEMPTION_MODE_COMPUTE_CILP;
			p->mode =
				TEGRA_VGPU_GR_CTXSW_PREEMPTION_MODE_COMPUTE_CILP;
			break;
		default:
			break;
		}
	}

	if (gr_ctx->graphics_preempt_mode || gr_ctx->compute_preempt_mode) {
		msg.cmd = TEGRA_VGPU_CMD_CHANNEL_BIND_GR_CTXSW_BUFFERS;
		msg.handle = vgpu_get_handle(g);
		p->gr_ctx_handle = gr_ctx->virt_ctx;
		err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
		if (err || msg.ret) {
			err = -ENOMEM;
			goto fail;
		}
	}

	return err;

fail:
	nvgpu_err(g, "%s failed %d", __func__, err);
	return err;
}

int vgpu_gr_gp10b_set_preemption_mode(struct channel_gk20a *ch,
				u32 graphics_preempt_mode,
				u32 compute_preempt_mode)
{
	struct nvgpu_gr_ctx *gr_ctx;
	struct gk20a *g = ch->g;
	struct tsg_gk20a *tsg;
	struct vm_gk20a *vm;
	u32 class;
	int err;

	class = ch->obj_class;
	if (!class)
		return -EINVAL;

	tsg = tsg_gk20a_from_ch(ch);
	if (!tsg)
		return -EINVAL;

	vm = tsg->vm;
	gr_ctx = &tsg->gr_ctx;

	/* skip setting anything if both modes are already set */
	if (graphics_preempt_mode &&
	    (graphics_preempt_mode == gr_ctx->graphics_preempt_mode))
		graphics_preempt_mode = 0;

	if (compute_preempt_mode &&
	    (compute_preempt_mode == gr_ctx->compute_preempt_mode))
		compute_preempt_mode = 0;

	if (graphics_preempt_mode == 0 && compute_preempt_mode == 0)
		return 0;

	if (g->ops.gr.set_ctxsw_preemption_mode) {
		err = g->ops.gr.set_ctxsw_preemption_mode(g, gr_ctx, vm, class,
						graphics_preempt_mode,
						compute_preempt_mode);
		if (err) {
			nvgpu_err(g, "set_ctxsw_preemption_mode failed");
			return err;
		}
	} else {
		err = -ENOSYS;
	}

	return err;
}

int vgpu_gr_gp10b_init_ctx_state(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);
	int err;

	gk20a_dbg_fn("");

	err = vgpu_gr_init_ctx_state(g);
	if (err)
		return err;

	g->gr.ctx_vars.preempt_image_size =
			priv->constants.preempt_ctx_size;
	if (!g->gr.ctx_vars.preempt_image_size)
		return -EINVAL;

	return 0;
}
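The entry point above is reached through g->ops.gr.set_preemption_mode. A minimal caller sketch (illustrative only; example_enable_cilp is a hypothetical helper, not part of this diff):

	static int example_enable_cilp(struct channel_gk20a *ch)
	{
		/* graphics mode 0 means "leave unchanged"; only compute changes */
		return vgpu_gr_gp10b_set_preemption_mode(ch, 0,
				NVGPU_PREEMPTION_MODE_COMPUTE_CILP);
	}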
@@ -1,37 +0,0 @@
/*
 * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __VGPU_GR_GP10B_H__
#define __VGPU_GR_GP10B_H__

#include "gk20a/gk20a.h"

int vgpu_gr_gp10b_alloc_gr_ctx(struct gk20a *g,
			struct nvgpu_gr_ctx *gr_ctx,
			struct vm_gk20a *vm,
			u32 class,
			u32 flags);
int vgpu_gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g,
			struct nvgpu_gr_ctx *gr_ctx,
			struct vm_gk20a *vm, u32 class,
			u32 graphics_preempt_mode,
			u32 compute_preempt_mode);
int vgpu_gr_gp10b_set_preemption_mode(struct channel_gk20a *ch,
			u32 graphics_preempt_mode,
			u32 compute_preempt_mode);
int vgpu_gr_gp10b_init_ctx_state(struct gk20a *g);

#endif
@@ -1,607 +0,0 @@
/*
 * Copyright (c) 2015-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "common/linux/vgpu/vgpu.h"
#include "common/linux/vgpu/fifo_vgpu.h"
#include "common/linux/vgpu/gr_vgpu.h"
#include "common/linux/vgpu/ltc_vgpu.h"
#include "common/linux/vgpu/mm_vgpu.h"
#include "common/linux/vgpu/dbg_vgpu.h"
#include "common/linux/vgpu/fecs_trace_vgpu.h"
#include "common/linux/vgpu/css_vgpu.h"
#include "gp10b/gp10b.h"
#include "gp10b/hal_gp10b.h"
#include "common/linux/vgpu/gm20b/vgpu_gr_gm20b.h"
#include "vgpu_gr_gp10b.h"
#include "vgpu_mm_gp10b.h"
#include "vgpu_fuse_gp10b.h"

#include "gk20a/bus_gk20a.h"
#include "gk20a/pramin_gk20a.h"
#include "gk20a/flcn_gk20a.h"
#include "gk20a/mc_gk20a.h"
#include "gk20a/fb_gk20a.h"

#include "gp10b/mc_gp10b.h"
#include "gp10b/ltc_gp10b.h"
#include "gp10b/mm_gp10b.h"
#include "gp10b/ce_gp10b.h"
#include "gp10b/fb_gp10b.h"
#include "gp10b/pmu_gp10b.h"
#include "gp10b/gr_gp10b.h"
#include "gp10b/gr_ctx_gp10b.h"
#include "gp10b/fifo_gp10b.h"
#include "gp10b/gp10b_gating_reglist.h"
#include "gp10b/regops_gp10b.h"
#include "gp10b/therm_gp10b.h"
#include "gp10b/priv_ring_gp10b.h"

#include "gm20b/ltc_gm20b.h"
#include "gm20b/gr_gm20b.h"
#include "gm20b/fifo_gm20b.h"
#include "gm20b/acr_gm20b.h"
#include "gm20b/pmu_gm20b.h"
#include "gm20b/fb_gm20b.h"
#include "gm20b/mm_gm20b.h"

#include <nvgpu/enabled.h>

#include <nvgpu/hw/gp10b/hw_fuse_gp10b.h>
#include <nvgpu/hw/gp10b/hw_fifo_gp10b.h>
#include <nvgpu/hw/gp10b/hw_ram_gp10b.h>
#include <nvgpu/hw/gp10b/hw_top_gp10b.h>
#include <nvgpu/hw/gp10b/hw_pram_gp10b.h>
#include <nvgpu/hw/gp10b/hw_pwr_gp10b.h>

static const struct gpu_ops vgpu_gp10b_ops = {
	.ltc = {
		.determine_L2_size_bytes = vgpu_determine_L2_size_bytes,
		.set_zbc_color_entry = gm20b_ltc_set_zbc_color_entry,
		.set_zbc_depth_entry = gm20b_ltc_set_zbc_depth_entry,
		.init_cbc = gm20b_ltc_init_cbc,
		.init_fs_state = vgpu_ltc_init_fs_state,
		.init_comptags = vgpu_ltc_init_comptags,
		.cbc_ctrl = NULL,
		.isr = gp10b_ltc_isr,
		.cbc_fix_config = gm20b_ltc_cbc_fix_config,
		.flush = gm20b_flush_ltc,
		.set_enabled = gp10b_ltc_set_enabled,
	},
	.ce2 = {
		.isr_stall = gp10b_ce_isr,
		.isr_nonstall = gp10b_ce_nonstall_isr,
		.get_num_pce = vgpu_ce_get_num_pce,
	},
	.gr = {
		.get_patch_slots = gr_gk20a_get_patch_slots,
		.init_gpc_mmu = gr_gm20b_init_gpc_mmu,
		.bundle_cb_defaults = gr_gm20b_bundle_cb_defaults,
		.cb_size_default = gr_gp10b_cb_size_default,
		.calc_global_ctx_buffer_size =
			gr_gp10b_calc_global_ctx_buffer_size,
		.commit_global_attrib_cb = gr_gp10b_commit_global_attrib_cb,
		.commit_global_bundle_cb = gr_gp10b_commit_global_bundle_cb,
		.commit_global_cb_manager = gr_gp10b_commit_global_cb_manager,
		.commit_global_pagepool = gr_gp10b_commit_global_pagepool,
		.handle_sw_method = gr_gp10b_handle_sw_method,
		.set_alpha_circular_buffer_size =
			gr_gp10b_set_alpha_circular_buffer_size,
		.set_circular_buffer_size = gr_gp10b_set_circular_buffer_size,
		.enable_hww_exceptions = gr_gk20a_enable_hww_exceptions,
		.is_valid_class = gr_gp10b_is_valid_class,
		.is_valid_gfx_class = gr_gp10b_is_valid_gfx_class,
		.is_valid_compute_class = gr_gp10b_is_valid_compute_class,
		.get_sm_dsm_perf_regs = gr_gm20b_get_sm_dsm_perf_regs,
		.get_sm_dsm_perf_ctrl_regs = gr_gm20b_get_sm_dsm_perf_ctrl_regs,
		.init_fs_state = vgpu_gr_init_fs_state,
		.set_hww_esr_report_mask = gr_gm20b_set_hww_esr_report_mask,
		.falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments,
		.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode,
		.set_gpc_tpc_mask = gr_gp10b_set_gpc_tpc_mask,
		.get_gpc_tpc_mask = vgpu_gr_get_gpc_tpc_mask,
		.alloc_obj_ctx = vgpu_gr_alloc_obj_ctx,
		.bind_ctxsw_zcull = vgpu_gr_bind_ctxsw_zcull,
		.get_zcull_info = vgpu_gr_get_zcull_info,
		.is_tpc_addr = gr_gm20b_is_tpc_addr,
		.get_tpc_num = gr_gm20b_get_tpc_num,
		.detect_sm_arch = vgpu_gr_detect_sm_arch,
		.add_zbc_color = gr_gp10b_add_zbc_color,
		.add_zbc_depth = gr_gp10b_add_zbc_depth,
		.zbc_set_table = vgpu_gr_add_zbc,
		.zbc_query_table = vgpu_gr_query_zbc,
		.pmu_save_zbc = gk20a_pmu_save_zbc,
		.add_zbc = gr_gk20a_add_zbc,
		.pagepool_default_size = gr_gp10b_pagepool_default_size,
		.init_ctx_state = vgpu_gr_gp10b_init_ctx_state,
		.alloc_gr_ctx = vgpu_gr_gp10b_alloc_gr_ctx,
		.free_gr_ctx = vgpu_gr_free_gr_ctx,
		.update_ctxsw_preemption_mode =
			gr_gp10b_update_ctxsw_preemption_mode,
		.dump_gr_regs = NULL,
		.update_pc_sampling = gr_gm20b_update_pc_sampling,
		.get_fbp_en_mask = vgpu_gr_get_fbp_en_mask,
		.get_max_ltc_per_fbp = vgpu_gr_get_max_ltc_per_fbp,
		.get_max_lts_per_ltc = vgpu_gr_get_max_lts_per_ltc,
		.get_rop_l2_en_mask = vgpu_gr_rop_l2_en_mask,
		.get_max_fbps_count = vgpu_gr_get_max_fbps_count,
		.init_sm_dsm_reg_info = gr_gm20b_init_sm_dsm_reg_info,
		.wait_empty = gr_gp10b_wait_empty,
		.init_cyclestats = vgpu_gr_gm20b_init_cyclestats,
		.set_sm_debug_mode = vgpu_gr_set_sm_debug_mode,
		.enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs,
		.bpt_reg_info = gr_gm20b_bpt_reg_info,
		.get_access_map = gr_gp10b_get_access_map,
		.handle_fecs_error = gr_gp10b_handle_fecs_error,
		.handle_sm_exception = gr_gp10b_handle_sm_exception,
		.handle_tex_exception = gr_gp10b_handle_tex_exception,
		.enable_gpc_exceptions = gk20a_gr_enable_gpc_exceptions,
		.enable_exceptions = gk20a_gr_enable_exceptions,
		.get_lrf_tex_ltc_dram_override = get_ecc_override_val,
		.update_smpc_ctxsw_mode = vgpu_gr_update_smpc_ctxsw_mode,
		.update_hwpm_ctxsw_mode = vgpu_gr_update_hwpm_ctxsw_mode,
		.record_sm_error_state = gm20b_gr_record_sm_error_state,
		.update_sm_error_state = gm20b_gr_update_sm_error_state,
		.clear_sm_error_state = vgpu_gr_clear_sm_error_state,
		.suspend_contexts = vgpu_gr_suspend_contexts,
		.resume_contexts = vgpu_gr_resume_contexts,
		.get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags,
		.init_sm_id_table = vgpu_gr_init_sm_id_table,
		.load_smid_config = gr_gp10b_load_smid_config,
		.program_sm_id_numbering = gr_gm20b_program_sm_id_numbering,
		.is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr,
		.is_ltcn_ltss_addr = gr_gm20b_is_ltcn_ltss_addr,
		.split_lts_broadcast_addr = gr_gm20b_split_lts_broadcast_addr,
		.split_ltc_broadcast_addr = gr_gm20b_split_ltc_broadcast_addr,
		.setup_rop_mapping = gr_gk20a_setup_rop_mapping,
		.program_zcull_mapping = gr_gk20a_program_zcull_mapping,
		.commit_global_timeslice = gr_gk20a_commit_global_timeslice,
		.commit_inst = vgpu_gr_commit_inst,
		.write_zcull_ptr = gr_gk20a_write_zcull_ptr,
		.write_pm_ptr = gr_gk20a_write_pm_ptr,
		.init_elcg_mode = gr_gk20a_init_elcg_mode,
		.load_tpc_mask = gr_gm20b_load_tpc_mask,
		.inval_icache = gr_gk20a_inval_icache,
		.trigger_suspend = gr_gk20a_trigger_suspend,
		.wait_for_pause = gr_gk20a_wait_for_pause,
		.resume_from_pause = gr_gk20a_resume_from_pause,
		.clear_sm_errors = gr_gk20a_clear_sm_errors,
		.tpc_enabled_exceptions = gr_gk20a_tpc_enabled_exceptions,
		.get_esr_sm_sel = gk20a_gr_get_esr_sm_sel,
		.sm_debugger_attached = gk20a_gr_sm_debugger_attached,
		.suspend_single_sm = gk20a_gr_suspend_single_sm,
		.suspend_all_sms = gk20a_gr_suspend_all_sms,
		.resume_single_sm = gk20a_gr_resume_single_sm,
		.resume_all_sms = gk20a_gr_resume_all_sms,
		.get_sm_hww_warp_esr = gp10b_gr_get_sm_hww_warp_esr,
		.get_sm_hww_global_esr = gk20a_gr_get_sm_hww_global_esr,
		.get_sm_no_lock_down_hww_global_esr_mask =
			gk20a_gr_get_sm_no_lock_down_hww_global_esr_mask,
		.lock_down_sm = gk20a_gr_lock_down_sm,
		.wait_for_sm_lock_down = gk20a_gr_wait_for_sm_lock_down,
		.clear_sm_hww = gm20b_gr_clear_sm_hww,
		.init_ovr_sm_dsm_perf = gk20a_gr_init_ovr_sm_dsm_perf,
		.get_ovr_perf_regs = gk20a_gr_get_ovr_perf_regs,
		.disable_rd_coalesce = gm20a_gr_disable_rd_coalesce,
		.set_boosted_ctx = NULL,
		.set_preemption_mode = vgpu_gr_gp10b_set_preemption_mode,
		.set_czf_bypass = gr_gp10b_set_czf_bypass,
		.init_czf_bypass = gr_gp10b_init_czf_bypass,
		.pre_process_sm_exception = gr_gp10b_pre_process_sm_exception,
		.set_preemption_buffer_va = gr_gp10b_set_preemption_buffer_va,
		.init_preemption_state = gr_gp10b_init_preemption_state,
		.update_boosted_ctx = NULL,
		.set_bes_crop_debug3 = gr_gp10b_set_bes_crop_debug3,
		.set_bes_crop_debug4 = gr_gp10b_set_bes_crop_debug4,
		.create_gr_sysfs = gr_gp10b_create_sysfs,
		.set_ctxsw_preemption_mode =
			vgpu_gr_gp10b_set_ctxsw_preemption_mode,
		.init_ctxsw_hdr_data = gr_gp10b_init_ctxsw_hdr_data,
		.init_gfxp_wfi_timeout_count =
			gr_gp10b_init_gfxp_wfi_timeout_count,
		.get_max_gfxp_wfi_timeout_count =
			gr_gp10b_get_max_gfxp_wfi_timeout_count,
	},
	.fb = {
		.reset = fb_gk20a_reset,
		.init_hw = gk20a_fb_init_hw,
		.init_fs_state = fb_gm20b_init_fs_state,
		.set_mmu_page_size = gm20b_fb_set_mmu_page_size,
		.set_use_full_comp_tag_line =
			gm20b_fb_set_use_full_comp_tag_line,
		.compression_page_size = gp10b_fb_compression_page_size,
		.compressible_page_size = gp10b_fb_compressible_page_size,
		.compression_align_mask = gm20b_fb_compression_align_mask,
		.vpr_info_fetch = gm20b_fb_vpr_info_fetch,
		.dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info,
		.read_wpr_info = gm20b_fb_read_wpr_info,
		.is_debug_mode_enabled = NULL,
		.set_debug_mode = vgpu_mm_mmu_set_debug_mode,
		.tlb_invalidate = vgpu_mm_tlb_invalidate,
	},
	.clock_gating = {
		.slcg_bus_load_gating_prod =
			gp10b_slcg_bus_load_gating_prod,
		.slcg_ce2_load_gating_prod =
			gp10b_slcg_ce2_load_gating_prod,
		.slcg_chiplet_load_gating_prod =
			gp10b_slcg_chiplet_load_gating_prod,
		.slcg_ctxsw_firmware_load_gating_prod =
			gp10b_slcg_ctxsw_firmware_load_gating_prod,
		.slcg_fb_load_gating_prod =
			gp10b_slcg_fb_load_gating_prod,
		.slcg_fifo_load_gating_prod =
			gp10b_slcg_fifo_load_gating_prod,
		.slcg_gr_load_gating_prod =
			gr_gp10b_slcg_gr_load_gating_prod,
		.slcg_ltc_load_gating_prod =
			ltc_gp10b_slcg_ltc_load_gating_prod,
		.slcg_perf_load_gating_prod =
			gp10b_slcg_perf_load_gating_prod,
		.slcg_priring_load_gating_prod =
			gp10b_slcg_priring_load_gating_prod,
		.slcg_pmu_load_gating_prod =
			gp10b_slcg_pmu_load_gating_prod,
		.slcg_therm_load_gating_prod =
			gp10b_slcg_therm_load_gating_prod,
		.slcg_xbar_load_gating_prod =
			gp10b_slcg_xbar_load_gating_prod,
		.blcg_bus_load_gating_prod =
			gp10b_blcg_bus_load_gating_prod,
		.blcg_ce_load_gating_prod =
			gp10b_blcg_ce_load_gating_prod,
		.blcg_ctxsw_firmware_load_gating_prod =
			gp10b_blcg_ctxsw_firmware_load_gating_prod,
		.blcg_fb_load_gating_prod =
			gp10b_blcg_fb_load_gating_prod,
		.blcg_fifo_load_gating_prod =
			gp10b_blcg_fifo_load_gating_prod,
		.blcg_gr_load_gating_prod =
			gp10b_blcg_gr_load_gating_prod,
		.blcg_ltc_load_gating_prod =
			gp10b_blcg_ltc_load_gating_prod,
		.blcg_pwr_csb_load_gating_prod =
			gp10b_blcg_pwr_csb_load_gating_prod,
		.blcg_pmu_load_gating_prod =
			gp10b_blcg_pmu_load_gating_prod,
		.blcg_xbar_load_gating_prod =
			gp10b_blcg_xbar_load_gating_prod,
		.pg_gr_load_gating_prod =
			gr_gp10b_pg_gr_load_gating_prod,
	},
	.fifo = {
		.init_fifo_setup_hw = vgpu_init_fifo_setup_hw,
		.bind_channel = vgpu_channel_bind,
		.unbind_channel = vgpu_channel_unbind,
		.disable_channel = vgpu_channel_disable,
		.enable_channel = vgpu_channel_enable,
		.alloc_inst = vgpu_channel_alloc_inst,
		.free_inst = vgpu_channel_free_inst,
		.setup_ramfc = vgpu_channel_setup_ramfc,
		.default_timeslice_us = vgpu_fifo_default_timeslice_us,
		.setup_userd = gk20a_fifo_setup_userd,
		.userd_gp_get = gk20a_fifo_userd_gp_get,
		.userd_gp_put = gk20a_fifo_userd_gp_put,
		.userd_pb_get = gk20a_fifo_userd_pb_get,
		.pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val,
		.preempt_channel = vgpu_fifo_preempt_channel,
		.preempt_tsg = vgpu_fifo_preempt_tsg,
		.enable_tsg = vgpu_enable_tsg,
		.disable_tsg = gk20a_disable_tsg,
		.tsg_verify_channel_status = NULL,
		.tsg_verify_status_ctx_reload = NULL,
		.reschedule_runlist = NULL,
		.update_runlist = vgpu_fifo_update_runlist,
		.trigger_mmu_fault = gm20b_fifo_trigger_mmu_fault,
		.get_mmu_fault_info = gp10b_fifo_get_mmu_fault_info,
		.wait_engine_idle = vgpu_fifo_wait_engine_idle,
		.get_num_fifos = gm20b_fifo_get_num_fifos,
		.get_pbdma_signature = gp10b_fifo_get_pbdma_signature,
		.set_runlist_interleave = vgpu_fifo_set_runlist_interleave,
		.tsg_set_timeslice = vgpu_tsg_set_timeslice,
		.tsg_open = vgpu_tsg_open,
		.force_reset_ch = vgpu_fifo_force_reset_ch,
		.engine_enum_from_type = gp10b_fifo_engine_enum_from_type,
		.device_info_data_parse = gp10b_device_info_data_parse,
		.eng_runlist_base_size = fifo_eng_runlist_base__size_1_v,
		.init_engine_info = vgpu_fifo_init_engine_info,
		.runlist_entry_size = ram_rl_entry_size_v,
		.get_tsg_runlist_entry = gk20a_get_tsg_runlist_entry,
		.get_ch_runlist_entry = gk20a_get_ch_runlist_entry,
		.is_fault_engine_subid_gpc = gk20a_is_fault_engine_subid_gpc,
		.dump_pbdma_status = gk20a_dump_pbdma_status,
		.dump_eng_status = gk20a_dump_eng_status,
		.dump_channel_status_ramfc = gk20a_dump_channel_status_ramfc,
		.intr_0_error_mask = gk20a_fifo_intr_0_error_mask,
		.is_preempt_pending = gk20a_fifo_is_preempt_pending,
		.init_pbdma_intr_descs = gp10b_fifo_init_pbdma_intr_descs,
		.reset_enable_hw = gk20a_init_fifo_reset_enable_hw,
		.teardown_ch_tsg = gk20a_fifo_teardown_ch_tsg,
		.handle_sched_error = gk20a_fifo_handle_sched_error,
		.handle_pbdma_intr_0 = gk20a_fifo_handle_pbdma_intr_0,
		.handle_pbdma_intr_1 = gk20a_fifo_handle_pbdma_intr_1,
		.tsg_bind_channel = vgpu_tsg_bind_channel,
		.tsg_unbind_channel = vgpu_tsg_unbind_channel,
#ifdef CONFIG_TEGRA_GK20A_NVHOST
		.alloc_syncpt_buf = gk20a_fifo_alloc_syncpt_buf,
		.free_syncpt_buf = gk20a_fifo_free_syncpt_buf,
		.add_syncpt_wait_cmd = gk20a_fifo_add_syncpt_wait_cmd,
		.get_syncpt_wait_cmd_size = gk20a_fifo_get_syncpt_wait_cmd_size,
		.add_syncpt_incr_cmd = gk20a_fifo_add_syncpt_incr_cmd,
		.get_syncpt_incr_cmd_size = gk20a_fifo_get_syncpt_incr_cmd_size,
		.get_sync_ro_map = NULL,
#endif
		.resetup_ramfc = NULL,
		.device_info_fault_id = top_device_info_data_fault_id_enum_v,
	},
	.gr_ctx = {
		.get_netlist_name = gr_gp10b_get_netlist_name,
		.is_fw_defined = gr_gp10b_is_firmware_defined,
	},
#ifdef CONFIG_GK20A_CTXSW_TRACE
	.fecs_trace = {
		.alloc_user_buffer = vgpu_alloc_user_buffer,
		.free_user_buffer = vgpu_free_user_buffer,
		.mmap_user_buffer = vgpu_mmap_user_buffer,
		.init = vgpu_fecs_trace_init,
		.deinit = vgpu_fecs_trace_deinit,
		.enable = vgpu_fecs_trace_enable,
		.disable = vgpu_fecs_trace_disable,
		.is_enabled = vgpu_fecs_trace_is_enabled,
		.reset = NULL,
		.flush = NULL,
		.poll = vgpu_fecs_trace_poll,
		.bind_channel = NULL,
		.unbind_channel = NULL,
		.max_entries = vgpu_fecs_trace_max_entries,
		.set_filter = vgpu_fecs_trace_set_filter,
	},
#endif /* CONFIG_GK20A_CTXSW_TRACE */
	.mm = {
		/* FIXME: add support for sparse mappings */
		.support_sparse = NULL,
		.gmmu_map = vgpu_gp10b_locked_gmmu_map,
		.gmmu_unmap = vgpu_locked_gmmu_unmap,
		.vm_bind_channel = vgpu_vm_bind_channel,
		.fb_flush = vgpu_mm_fb_flush,
		.l2_invalidate = vgpu_mm_l2_invalidate,
		.l2_flush = vgpu_mm_l2_flush,
		.cbc_clean = gk20a_mm_cbc_clean,
		.set_big_page_size = gm20b_mm_set_big_page_size,
		.get_big_page_sizes = gm20b_mm_get_big_page_sizes,
		.get_default_big_page_size = gp10b_mm_get_default_big_page_size,
		.gpu_phys_addr = gm20b_gpu_phys_addr,
		.get_iommu_bit = gk20a_mm_get_iommu_bit,
		.get_mmu_levels = gp10b_mm_get_mmu_levels,
		.init_pdb = gp10b_mm_init_pdb,
		.init_mm_setup_hw = vgpu_gp10b_init_mm_setup_hw,
		.is_bar1_supported = gm20b_mm_is_bar1_supported,
		.init_inst_block = gk20a_init_inst_block,
		.mmu_fault_pending = gk20a_fifo_mmu_fault_pending,
		.init_bar2_vm = gp10b_init_bar2_vm,
		.init_bar2_mm_hw_setup = gp10b_init_bar2_mm_hw_setup,
		.remove_bar2_vm = gp10b_remove_bar2_vm,
		.get_kind_invalid = gm20b_get_kind_invalid,
		.get_kind_pitch = gm20b_get_kind_pitch,
	},
	.pramin = {
		.enter = gk20a_pramin_enter,
		.exit = gk20a_pramin_exit,
		.data032_r = pram_data032_r,
	},
	.therm = {
		.init_therm_setup_hw = gp10b_init_therm_setup_hw,
		.elcg_init_idle_filters = gp10b_elcg_init_idle_filters,
	},
	.pmu = {
		.pmu_setup_elpg = gp10b_pmu_setup_elpg,
		.pmu_get_queue_head = pwr_pmu_queue_head_r,
		.pmu_get_queue_head_size = pwr_pmu_queue_head__size_1_v,
		.pmu_get_queue_tail = pwr_pmu_queue_tail_r,
		.pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v,
		.pmu_queue_head = gk20a_pmu_queue_head,
		.pmu_queue_tail = gk20a_pmu_queue_tail,
		.pmu_msgq_tail = gk20a_pmu_msgq_tail,
		.pmu_mutex_size = pwr_pmu_mutex__size_1_v,
		.pmu_mutex_acquire = gk20a_pmu_mutex_acquire,
		.pmu_mutex_release = gk20a_pmu_mutex_release,
		.write_dmatrfbase = gp10b_write_dmatrfbase,
		.pmu_elpg_statistics = gp10b_pmu_elpg_statistics,
		.pmu_init_perfmon = nvgpu_pmu_init_perfmon,
		.pmu_perfmon_start_sampling = nvgpu_pmu_perfmon_start_sampling,
		.pmu_perfmon_stop_sampling = nvgpu_pmu_perfmon_stop_sampling,
		.pmu_pg_init_param = gp10b_pg_gr_init,
		.pmu_pg_supported_engines_list = gk20a_pmu_pg_engines_list,
		.pmu_pg_engines_feature_list = gk20a_pmu_pg_feature_list,
		.dump_secure_fuses = pmu_dump_security_fuses_gp10b,
		.reset_engine = gk20a_pmu_engine_reset,
		.is_engine_in_reset = gk20a_pmu_is_engine_in_reset,
	},
	.regops = {
		.get_global_whitelist_ranges =
			gp10b_get_global_whitelist_ranges,
		.get_global_whitelist_ranges_count =
			gp10b_get_global_whitelist_ranges_count,
		.get_context_whitelist_ranges =
			gp10b_get_context_whitelist_ranges,
		.get_context_whitelist_ranges_count =
			gp10b_get_context_whitelist_ranges_count,
		.get_runcontrol_whitelist = gp10b_get_runcontrol_whitelist,
		.get_runcontrol_whitelist_count =
			gp10b_get_runcontrol_whitelist_count,
		.get_runcontrol_whitelist_ranges =
			gp10b_get_runcontrol_whitelist_ranges,
		.get_runcontrol_whitelist_ranges_count =
			gp10b_get_runcontrol_whitelist_ranges_count,
		.get_qctl_whitelist = gp10b_get_qctl_whitelist,
		.get_qctl_whitelist_count = gp10b_get_qctl_whitelist_count,
		.get_qctl_whitelist_ranges = gp10b_get_qctl_whitelist_ranges,
		.get_qctl_whitelist_ranges_count =
			gp10b_get_qctl_whitelist_ranges_count,
		.apply_smpc_war = gp10b_apply_smpc_war,
	},
	.mc = {
		.intr_enable = mc_gp10b_intr_enable,
		.intr_unit_config = mc_gp10b_intr_unit_config,
		.isr_stall = mc_gp10b_isr_stall,
		.intr_stall = mc_gp10b_intr_stall,
		.intr_stall_pause = mc_gp10b_intr_stall_pause,
		.intr_stall_resume = mc_gp10b_intr_stall_resume,
		.intr_nonstall = mc_gp10b_intr_nonstall,
		.intr_nonstall_pause = mc_gp10b_intr_nonstall_pause,
		.intr_nonstall_resume = mc_gp10b_intr_nonstall_resume,
		.enable = gk20a_mc_enable,
		.disable = gk20a_mc_disable,
		.reset = gk20a_mc_reset,
		.boot_0 = gk20a_mc_boot_0,
		.is_intr1_pending = mc_gp10b_is_intr1_pending,
	},
	.debug = {
		.show_dump = NULL,
	},
	.dbg_session_ops = {
		.exec_reg_ops = vgpu_exec_regops,
		.dbg_set_powergate = vgpu_dbg_set_powergate,
		.check_and_set_global_reservation =
			vgpu_check_and_set_global_reservation,
		.check_and_set_context_reservation =
			vgpu_check_and_set_context_reservation,
		.release_profiler_reservation =
			vgpu_release_profiler_reservation,
		.perfbuffer_enable = vgpu_perfbuffer_enable,
		.perfbuffer_disable = vgpu_perfbuffer_disable,
	},
	.bus = {
		.init_hw = gk20a_bus_init_hw,
		.isr = gk20a_bus_isr,
		.read_ptimer = vgpu_read_ptimer,
		.get_timestamps_zipper = vgpu_get_timestamps_zipper,
		.bar1_bind = gk20a_bus_bar1_bind,
	},
#if defined(CONFIG_GK20A_CYCLE_STATS)
	.css = {
		.enable_snapshot = vgpu_css_enable_snapshot_buffer,
		.disable_snapshot = vgpu_css_release_snapshot_buffer,
		.check_data_available = vgpu_css_flush_snapshots,
		.detach_snapshot = vgpu_css_detach,
		.set_handled_snapshots = NULL,
		.allocate_perfmon_ids = NULL,
		.release_perfmon_ids = NULL,
	},
#endif
	.falcon = {
		.falcon_hal_sw_init = gk20a_falcon_hal_sw_init,
	},
	.priv_ring = {
		.isr = gp10b_priv_ring_isr,
	},
	.fuse = {
		.check_priv_security = vgpu_gp10b_fuse_check_priv_security,
	},
	.chip_init_gpu_characteristics = vgpu_init_gpu_characteristics,
	.get_litter_value = gp10b_get_litter_value,
};

int vgpu_gp10b_init_hal(struct gk20a *g)
{
	struct gpu_ops *gops = &g->ops;

	gops->ltc = vgpu_gp10b_ops.ltc;
	gops->ce2 = vgpu_gp10b_ops.ce2;
	gops->gr = vgpu_gp10b_ops.gr;
	gops->fb = vgpu_gp10b_ops.fb;
	gops->clock_gating = vgpu_gp10b_ops.clock_gating;
	gops->fifo = vgpu_gp10b_ops.fifo;
	gops->gr_ctx = vgpu_gp10b_ops.gr_ctx;
#ifdef CONFIG_GK20A_CTXSW_TRACE
	gops->fecs_trace = vgpu_gp10b_ops.fecs_trace;
#endif
	gops->mm = vgpu_gp10b_ops.mm;
	gops->pramin = vgpu_gp10b_ops.pramin;
	gops->therm = vgpu_gp10b_ops.therm;
	gops->pmu = vgpu_gp10b_ops.pmu;
	gops->regops = vgpu_gp10b_ops.regops;
	gops->mc = vgpu_gp10b_ops.mc;
	gops->debug = vgpu_gp10b_ops.debug;
	gops->dbg_session_ops = vgpu_gp10b_ops.dbg_session_ops;
	gops->bus = vgpu_gp10b_ops.bus;
#if defined(CONFIG_GK20A_CYCLE_STATS)
	gops->css = vgpu_gp10b_ops.css;
#endif
	gops->falcon = vgpu_gp10b_ops.falcon;

	gops->priv_ring = vgpu_gp10b_ops.priv_ring;

	gops->fuse = vgpu_gp10b_ops.fuse;

	/* Lone Functions */
	gops->chip_init_gpu_characteristics =
		vgpu_gp10b_ops.chip_init_gpu_characteristics;
	gops->get_litter_value = vgpu_gp10b_ops.get_litter_value;

	__nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true);
	__nvgpu_set_enabled(g, NVGPU_PMU_PSTATE, false);

	/* Read fuses to check if gpu needs to boot in secure/non-secure mode */
	if (gops->fuse.check_priv_security(g))
		return -EINVAL; /* Do not boot gpu */

	/* priv security dependent ops */
	if (nvgpu_is_enabled(g, NVGPU_SEC_PRIVSECURITY)) {
		/* Add in ops from gm20b acr */
		gops->pmu.is_pmu_supported = gm20b_is_pmu_supported,
		gops->pmu.prepare_ucode = prepare_ucode_blob,
		gops->pmu.pmu_setup_hw_and_bootstrap = gm20b_bootstrap_hs_flcn,
		gops->pmu.is_lazy_bootstrap = gm20b_is_lazy_bootstrap,
		gops->pmu.is_priv_load = gm20b_is_priv_load,
		gops->pmu.get_wpr = gm20b_wpr_info,
		gops->pmu.alloc_blob_space = gm20b_alloc_blob_space,
		gops->pmu.pmu_populate_loader_cfg =
			gm20b_pmu_populate_loader_cfg,
		gops->pmu.flcn_populate_bl_dmem_desc =
			gm20b_flcn_populate_bl_dmem_desc,
		gops->pmu.falcon_wait_for_halt = pmu_wait_for_halt,
		gops->pmu.falcon_clear_halt_interrupt_status =
			clear_halt_interrupt_status,
		gops->pmu.init_falcon_setup_hw = gm20b_init_pmu_setup_hw1,

		gops->pmu.init_wpr_region = gm20b_pmu_init_acr;
		gops->pmu.load_lsfalcon_ucode = gp10b_load_falcon_ucode;
		gops->pmu.is_lazy_bootstrap = gp10b_is_lazy_bootstrap;
		gops->pmu.is_priv_load = gp10b_is_priv_load;

		gops->gr.load_ctxsw_ucode = gr_gm20b_load_ctxsw_ucode;
	} else {
		/* Inherit from gk20a */
		gops->pmu.is_pmu_supported = gk20a_is_pmu_supported,
		gops->pmu.prepare_ucode = nvgpu_pmu_prepare_ns_ucode_blob,
		gops->pmu.pmu_setup_hw_and_bootstrap = gk20a_init_pmu_setup_hw1,
		gops->pmu.pmu_nsbootstrap = pmu_bootstrap,

		gops->pmu.load_lsfalcon_ucode = NULL;
		gops->pmu.init_wpr_region = NULL;
		gops->pmu.pmu_setup_hw_and_bootstrap = gp10b_init_pmu_setup_hw1;

		gops->gr.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode;
	}

	__nvgpu_set_enabled(g, NVGPU_PMU_FECS_BOOTSTRAP_DONE, false);
	g->pmu_lsf_pmu_wpr_init_done = 0;
	g->bootstrap_owner = LSF_BOOTSTRAP_OWNER_DEFAULT;

	g->name = "gp10b";

	return 0;
}
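The file above follows nvgpu's usual HAL pattern: one chip-wide static ops table copied member-by-member into g->ops, then patched according to fuse and priv-security state. A sketch of how a probe path might select it (hypothetical fragment; the real dispatch lives in the HAL/platform init code, outside this diff):

	static int example_select_hal(struct gk20a *g, bool is_vgpu_gp10b)
	{
		/* hypothetical helper: pick the vGPU gp10b ops when virtualized */
		if (is_vgpu_gp10b)
			return vgpu_gp10b_init_hal(g);
		return -ENODEV;
	}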
@@ -1,200 +0,0 @@
/*
 * Virtualized GPU Memory Management
 *
 * Copyright (c) 2015-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "common/linux/vgpu/vgpu.h"
#include "vgpu_mm_gp10b.h"
#include "gk20a/mm_gk20a.h"

#include <nvgpu/bug.h>
#include <nvgpu/dma.h>
#include <nvgpu/vgpu/vgpu_ivc.h>

int vgpu_gp10b_init_mm_setup_hw(struct gk20a *g)
{
	g->mm.disable_bigpage = true;
	return 0;
}

static inline int add_mem_desc(struct tegra_vgpu_mem_desc *mem_desc,
		u64 addr, u64 size, size_t *oob_size)
{
	if (*oob_size < sizeof(*mem_desc))
		return -ENOMEM;

	mem_desc->addr = addr;
	mem_desc->length = size;
	*oob_size -= sizeof(*mem_desc);
	return 0;
}

u64 vgpu_gp10b_locked_gmmu_map(struct vm_gk20a *vm,
			u64 map_offset,
			struct nvgpu_sgt *sgt,
			u64 buffer_offset,
			u64 size,
			int pgsz_idx,
			u8 kind_v,
			u32 ctag_offset,
			u32 flags,
			int rw_flag,
			bool clear_ctags,
			bool sparse,
			bool priv,
			struct vm_gk20a_mapping_batch *batch,
			enum nvgpu_aperture aperture)
{
	int err = 0;
	struct gk20a *g = gk20a_from_vm(vm);
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_as_map_ex_params *p = &msg.params.as_map_ex;
	struct tegra_vgpu_mem_desc *mem_desc;
	u32 page_size = vm->gmmu_page_sizes[pgsz_idx];
	u64 buffer_size = PAGE_ALIGN(size);
	u64 space_to_skip = buffer_offset;
	u32 mem_desc_count = 0, i;
	void *handle = NULL;
	size_t oob_size;
	u8 prot;
	void *sgl;

	gk20a_dbg_fn("");

	/* FIXME: add support for sparse mappings */

	if (WARN_ON(!sgt) || WARN_ON(nvgpu_iommuable(g)))
		return 0;

	if (space_to_skip & (page_size - 1))
		return 0;

	memset(&msg, 0, sizeof(msg));

	/* Allocate (or validate when map_offset != 0) the virtual address. */
	if (!map_offset) {
		map_offset = __nvgpu_vm_alloc_va(vm, size, pgsz_idx);
		if (!map_offset) {
			nvgpu_err(g, "failed to allocate va space");
			err = -ENOMEM;
			goto fail;
		}
	}

	handle = vgpu_ivc_oob_get_ptr(vgpu_ivc_get_server_vmid(),
					TEGRA_VGPU_QUEUE_CMD,
					(void **)&mem_desc, &oob_size);
	if (!handle) {
		err = -EINVAL;
		goto fail;
	}
	sgl = sgt->sgl;
	while (sgl) {
		u64 phys_addr;
		u64 chunk_length;

		/*
		 * Cut out sgl ents for space_to_skip.
		 */
		if (space_to_skip &&
		    space_to_skip >= nvgpu_sgt_get_length(sgt, sgl)) {
			space_to_skip -= nvgpu_sgt_get_length(sgt, sgl);
			sgl = nvgpu_sgt_get_next(sgt, sgl);
			continue;
		}

		phys_addr = nvgpu_sgt_get_phys(sgt, sgl) + space_to_skip;
		chunk_length = min(size,
			nvgpu_sgt_get_length(sgt, sgl) - space_to_skip);

		if (add_mem_desc(&mem_desc[mem_desc_count++], phys_addr,
				chunk_length, &oob_size)) {
			err = -ENOMEM;
			goto fail;
		}

		space_to_skip = 0;
		size -= chunk_length;
		sgl = nvgpu_sgt_get_next(sgt, sgl);

		if (size == 0)
			break;
	}

	if (rw_flag == gk20a_mem_flag_read_only)
		prot = TEGRA_VGPU_MAP_PROT_READ_ONLY;
	else if (rw_flag == gk20a_mem_flag_write_only)
		prot = TEGRA_VGPU_MAP_PROT_WRITE_ONLY;
	else
		prot = TEGRA_VGPU_MAP_PROT_NONE;

	if (pgsz_idx == gmmu_page_size_kernel) {
		if (page_size == vm->gmmu_page_sizes[gmmu_page_size_small]) {
			pgsz_idx = gmmu_page_size_small;
		} else if (page_size ==
				vm->gmmu_page_sizes[gmmu_page_size_big]) {
			pgsz_idx = gmmu_page_size_big;
		} else {
			nvgpu_err(g, "invalid kernel page size %d",
				page_size);
			goto fail;
		}
	}

	msg.cmd = TEGRA_VGPU_CMD_AS_MAP_EX;
	msg.handle = vgpu_get_handle(g);
	p->handle = vm->handle;
	p->gpu_va = map_offset;
	p->size = buffer_size;
	p->mem_desc_count = mem_desc_count;
	p->pgsz_idx = pgsz_idx;
	p->iova = 0;
	p->kind = kind_v;
	if (flags & NVGPU_VM_MAP_CACHEABLE)
		p->flags = TEGRA_VGPU_MAP_CACHEABLE;
	if (flags & NVGPU_VM_MAP_IO_COHERENT)
		p->flags |= TEGRA_VGPU_MAP_IO_COHERENT;
	if (flags & NVGPU_VM_MAP_L3_ALLOC)
		p->flags |= TEGRA_VGPU_MAP_L3_ALLOC;
	p->prot = prot;
	p->ctag_offset = ctag_offset;
	p->clear_ctags = clear_ctags;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	if (err || msg.ret)
		goto fail;

	/* TLB invalidate handled on server side */

	vgpu_ivc_oob_put_ptr(handle);
	return map_offset;
fail:
	if (handle)
		vgpu_ivc_oob_put_ptr(handle);
	nvgpu_err(g, "Failed: err=%d, msg.ret=%d", err, msg.ret);
	nvgpu_err(g,
		  " Map: %-5s GPU virt %#-12llx +%#-9llx "
		  "phys offset: %#-4llx; pgsz: %3dkb perm=%-2s | "
		  "kind=%#02x APT=%-6s",
		  vm->name, map_offset, buffer_size, buffer_offset,
		  vm->gmmu_page_sizes[pgsz_idx] >> 10,
		  nvgpu_gmmu_perm_str(rw_flag),
		  kind_v, "SYSMEM");
	for (i = 0; i < mem_desc_count; i++)
		nvgpu_err(g, " > 0x%010llx + 0x%llx",
			  mem_desc[i].addr, mem_desc[i].length);

	return 0;
}
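The scatter-gather walk in vgpu_gp10b_locked_gmmu_map above reduces to one pattern: drop whole entries covered by buffer_offset, then emit (addr, length) chunks until size bytes are described. A standalone sketch of the same loop over a plain array (struct chunk and example_chunk_walk are hypothetical, for illustration only):

	struct chunk { u64 addr; u64 len; };

	/* returns the number of chunks written to out[] */
	static u32 example_chunk_walk(const struct chunk *in, u32 n,
				      u64 skip, u64 size, struct chunk *out)
	{
		u32 i, count = 0;

		for (i = 0; i < n && size != 0; i++) {
			if (skip >= in[i].len) {
				/* entry lies entirely inside the offset */
				skip -= in[i].len;
				continue;
			}
			out[count].addr = in[i].addr + skip;
			out[count].len = min(size, in[i].len - skip);
			size -= out[count].len;
			skip = 0;
			count++;
		}
		return count;
	}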
@@ -1,39 +0,0 @@
/*
 * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __VGPU_MM_GP10B_H__
#define __VGPU_MM_GP10B_H__

#include "gk20a/gk20a.h"

u64 vgpu_gp10b_locked_gmmu_map(struct vm_gk20a *vm,
			u64 map_offset,
			struct nvgpu_sgt *sgt,
			u64 buffer_offset,
			u64 size,
			int pgsz_idx,
			u8 kind_v,
			u32 ctag_offset,
			u32 flags,
			int rw_flag,
			bool clear_ctags,
			bool sparse,
			bool priv,
			struct vm_gk20a_mapping_batch *batch,
			enum nvgpu_aperture aperture);
int vgpu_gp10b_init_mm_setup_hw(struct gk20a *g);

#endif
File diff suppressed because it is too large
@@ -1,68 +0,0 @@
/*
 * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _GR_VGPU_H_
#define _GR_VGPU_H_

#include <nvgpu/types.h>

struct gk20a;
struct channel_gk20a;
struct gr_gk20a;
struct gr_zcull_info;
struct zbc_entry;
struct zbc_query_params;
struct dbg_session_gk20a;
struct tsg_gk20a;

void vgpu_gr_detect_sm_arch(struct gk20a *g);
void vgpu_gr_free_channel_ctx(struct channel_gk20a *c, bool is_tsg);
void vgpu_gr_free_tsg_ctx(struct tsg_gk20a *tsg);
int vgpu_gr_alloc_obj_ctx(struct channel_gk20a *c, u32 class_num, u32 flags);
int vgpu_gr_bind_ctxsw_zcull(struct gk20a *g, struct gr_gk20a *gr,
			struct channel_gk20a *c, u64 zcull_va,
			u32 mode);
int vgpu_gr_get_zcull_info(struct gk20a *g, struct gr_gk20a *gr,
			struct gr_zcull_info *zcull_params);
u32 vgpu_gr_get_gpc_tpc_mask(struct gk20a *g, u32 gpc_index);
u32 vgpu_gr_get_max_fbps_count(struct gk20a *g);
u32 vgpu_gr_get_fbp_en_mask(struct gk20a *g);
u32 vgpu_gr_get_max_ltc_per_fbp(struct gk20a *g);
u32 vgpu_gr_get_max_lts_per_ltc(struct gk20a *g);
u32 *vgpu_gr_rop_l2_en_mask(struct gk20a *g);
int vgpu_gr_add_zbc(struct gk20a *g, struct gr_gk20a *gr,
			struct zbc_entry *zbc_val);
int vgpu_gr_query_zbc(struct gk20a *g, struct gr_gk20a *gr,
			struct zbc_query_params *query_params);
int vgpu_gr_set_sm_debug_mode(struct gk20a *g,
			struct channel_gk20a *ch, u64 sms, bool enable);
int vgpu_gr_update_smpc_ctxsw_mode(struct gk20a *g,
			struct channel_gk20a *ch, bool enable);
int vgpu_gr_update_hwpm_ctxsw_mode(struct gk20a *g,
			struct channel_gk20a *ch, bool enable);
int vgpu_gr_clear_sm_error_state(struct gk20a *g,
			struct channel_gk20a *ch, u32 sm_id);
int vgpu_gr_suspend_contexts(struct gk20a *g,
			struct dbg_session_gk20a *dbg_s,
			int *ctx_resident_ch_fd);
int vgpu_gr_resume_contexts(struct gk20a *g,
			struct dbg_session_gk20a *dbg_s,
			int *ctx_resident_ch_fd);
int vgpu_gr_commit_inst(struct channel_gk20a *c, u64 gpu_va);
int vgpu_gr_init_sm_id_table(struct gk20a *g);
int vgpu_gr_init_fs_state(struct gk20a *g);

#endif
@@ -1,139 +0,0 @@
/*
 * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <gk20a/gk20a.h>

#include "common/linux/vgpu/vgpu.h"
#include "gv11b/fifo_gv11b.h"
#include <nvgpu/nvhost.h>
#include <nvgpu/vgpu/tegra_vgpu.h>

#ifdef CONFIG_TEGRA_GK20A_NVHOST

static int set_syncpt_ro_map_gpu_va_locked(struct vm_gk20a *vm)
{
	int err;
	struct gk20a *g = gk20a_from_vm(vm);
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_map_syncpt_params *p = &msg.params.map_syncpt;

	if (vm->syncpt_ro_map_gpu_va)
		return 0;

	vm->syncpt_ro_map_gpu_va = __nvgpu_vm_alloc_va(vm,
			g->syncpt_unit_size,
			gmmu_page_size_kernel);
	if (!vm->syncpt_ro_map_gpu_va) {
		nvgpu_err(g, "allocating read-only va space failed");
		return -ENOMEM;
	}

	msg.cmd = TEGRA_VGPU_CMD_MAP_SYNCPT;
	msg.handle = vgpu_get_handle(g);
	p->as_handle = vm->handle;
	p->gpu_va = vm->syncpt_ro_map_gpu_va;
	p->len = g->syncpt_unit_size;
	p->offset = 0;
	p->prot = TEGRA_VGPU_MAP_PROT_READ_ONLY;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(g,
			"mapping read-only va space failed err %d",
			err);
		__nvgpu_vm_free_va(vm, vm->syncpt_ro_map_gpu_va,
				gmmu_page_size_kernel);
		vm->syncpt_ro_map_gpu_va = 0;
		return err;
	}

	return 0;
}

int vgpu_gv11b_fifo_alloc_syncpt_buf(struct channel_gk20a *c,
			u32 syncpt_id, struct nvgpu_mem *syncpt_buf)
{
	int err;
	struct gk20a *g = c->g;
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_map_syncpt_params *p = &msg.params.map_syncpt;

	/*
	 * Add ro map for complete sync point shim range in vm.
	 * All channels sharing same vm will share same ro mapping.
	 * Create rw map for current channel sync point.
	 */
	nvgpu_mutex_acquire(&c->vm->syncpt_ro_map_lock);
	err = set_syncpt_ro_map_gpu_va_locked(c->vm);
	nvgpu_mutex_release(&c->vm->syncpt_ro_map_lock);
	if (err)
		return err;

	syncpt_buf->gpu_va = __nvgpu_vm_alloc_va(c->vm, g->syncpt_size,
			gmmu_page_size_kernel);
	if (!syncpt_buf->gpu_va) {
		nvgpu_err(g, "allocating syncpt va space failed");
		return -ENOMEM;
	}

	msg.cmd = TEGRA_VGPU_CMD_MAP_SYNCPT;
	msg.handle = vgpu_get_handle(g);
	p->as_handle = c->vm->handle;
	p->gpu_va = syncpt_buf->gpu_va;
	p->len = g->syncpt_size;
	p->offset =
		nvgpu_nvhost_syncpt_unit_interface_get_byte_offset(syncpt_id);
	p->prot = TEGRA_VGPU_MAP_PROT_NONE;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(g, "mapping syncpt va space failed err %d", err);
		__nvgpu_vm_free_va(c->vm, syncpt_buf->gpu_va,
				gmmu_page_size_kernel);
		return err;
	}

	return 0;
}

int vgpu_gv11b_fifo_get_sync_ro_map(struct vm_gk20a *vm,
			u64 *base_gpuva, u32 *sync_size)
{
	struct gk20a *g = gk20a_from_vm(vm);
	int err;

	nvgpu_mutex_acquire(&vm->syncpt_ro_map_lock);
	err = set_syncpt_ro_map_gpu_va_locked(vm);
	nvgpu_mutex_release(&vm->syncpt_ro_map_lock);
	if (err)
		return err;

	*base_gpuva = vm->syncpt_ro_map_gpu_va;
	*sync_size = g->syncpt_size;

	return 0;
}
#endif /* CONFIG_TEGRA_GK20A_NVHOST */

int vgpu_gv11b_init_fifo_setup_hw(struct gk20a *g)
{
	struct fifo_gk20a *f = &g->fifo;
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	f->max_subctx_count = priv->constants.max_subctx_count;

	return 0;
}
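The read-only syncpt mapping above is created lazily and shared by all channels on a VM; the per-VM syncpt_ro_map_lock makes the first caller's mapping race-free. A usage sketch (illustrative only):

	u64 base;
	u32 size;

	if (vgpu_gv11b_fifo_get_sync_ro_map(vm, &base, &size) == 0) {
		/* base..base+size now maps the whole syncpt shim read-only */
	}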
@@ -1,27 +0,0 @@
/*
 * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _VGPU_FIFO_GV11B_H_
#define _VGPU_FIFO_GV11B_H_

struct gk20a;

int vgpu_gv11b_init_fifo_setup_hw(struct gk20a *g);
int vgpu_gv11b_fifo_alloc_syncpt_buf(struct channel_gk20a *c,
			u32 syncpt_id, struct nvgpu_mem *syncpt_buf);
int vgpu_gv11b_fifo_get_sync_ro_map(struct vm_gk20a *vm,
			u64 *base_gpuva, u32 *sync_size);
#endif
@@ -1,34 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "gk20a/gk20a.h"
#include "common/linux/vgpu/gr_vgpu.h"
#include "vgpu_subctx_gv11b.h"

int vgpu_gr_gv11b_commit_inst(struct channel_gk20a *c, u64 gpu_va)
{
	int err;

	err = vgpu_gv11b_alloc_subctx_header(c);
	if (err)
		return err;

	err = vgpu_gr_commit_inst(c, gpu_va);
	if (err)
		vgpu_gv11b_free_subctx_header(c);

	return err;
}
@@ -1,24 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _VGPU_GR_GV11B_H_
#define _VGPU_GR_GV11B_H_

struct channel_gk20a;

int vgpu_gr_gv11b_commit_inst(struct channel_gk20a *c, u64 gpu_va);

#endif
@@ -1,42 +0,0 @@
/*
 * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "gk20a/gk20a.h"

#include <nvgpu/enabled.h>

#include "common/linux/vgpu/vgpu.h"
#include "vgpu_gv11b.h"

int vgpu_gv11b_init_gpu_characteristics(struct gk20a *g)
{
	int err;

	gk20a_dbg_fn("");

	err = vgpu_init_gpu_characteristics(g);
	if (err) {
		nvgpu_err(g, "vgpu_init_gpu_characteristics failed, err %d", err);
		return err;
	}

	__nvgpu_set_enabled(g, NVGPU_SUPPORT_TSG_SUBCONTEXTS, true);
	__nvgpu_set_enabled(g, NVGPU_SUPPORT_IO_COHERENCE, true);
	__nvgpu_set_enabled(g, NVGPU_SUPPORT_SCG, true);
	__nvgpu_set_enabled(g, NVGPU_SUPPORT_SYNCPOINT_ADDRESS, true);

	return 0;
}
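The capability bits set above are what the rest of the driver keys off via nvgpu_is_enabled(); a minimal sketch:

	if (nvgpu_is_enabled(g, NVGPU_SUPPORT_TSG_SUBCONTEXTS)) {
		/* the gv11b vGPU advertises TSG subcontext support */
	}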
@@ -1,24 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _VGPU_GV11B_H_
#define _VGPU_GV11B_H_

struct gk20a;

int vgpu_gv11b_init_gpu_characteristics(struct gk20a *g);

#endif
@@ -1,597 +0,0 @@
|
||||
/*
|
||||
* Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
|
||||
*
|
||||
* This program is free software; you can redistribute it and/or modify it
|
||||
* under the terms and conditions of the GNU General Public License,
|
||||
* version 2, as published by the Free Software Foundation.
|
||||
*
|
||||
* This program is distributed in the hope it will be useful, but WITHOUT
|
||||
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
||||
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
||||
* more details.
|
||||
*
|
||||
* You should have received a copy of the GNU General Public License
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
*/
|
||||
|
||||
#include <gk20a/gk20a.h>
|
||||
#include <gv11b/hal_gv11b.h>
|
||||
|
||||
#include "common/linux/vgpu/vgpu.h"
|
||||
#include "common/linux/vgpu/fifo_vgpu.h"
|
||||
#include "common/linux/vgpu/gr_vgpu.h"
|
||||
#include "common/linux/vgpu/ltc_vgpu.h"
|
||||
#include "common/linux/vgpu/mm_vgpu.h"
|
||||
#include "common/linux/vgpu/dbg_vgpu.h"
|
||||
#include "common/linux/vgpu/fecs_trace_vgpu.h"
|
||||
#include "common/linux/vgpu/css_vgpu.h"
|
||||
#include "common/linux/vgpu/gm20b/vgpu_gr_gm20b.h"
|
||||
#include "common/linux/vgpu/gp10b/vgpu_mm_gp10b.h"
|
||||
#include "common/linux/vgpu/gp10b/vgpu_gr_gp10b.h"
|
||||
|
||||
#include <gk20a/fb_gk20a.h>
|
||||
#include <gk20a/flcn_gk20a.h>
|
||||
#include <gk20a/bus_gk20a.h>
|
||||
#include <gk20a/mc_gk20a.h>
|
||||
|
||||
#include <gm20b/gr_gm20b.h>
|
||||
#include <gm20b/fb_gm20b.h>
|
||||
#include <gm20b/fifo_gm20b.h>
|
||||
#include <gm20b/pmu_gm20b.h>
|
||||
#include <gm20b/mm_gm20b.h>
|
||||
#include <gm20b/acr_gm20b.h>
|
||||
#include <gm20b/ltc_gm20b.h>
|
||||
|
||||
#include <gp10b/fb_gp10b.h>
|
||||
#include <gp10b/pmu_gp10b.h>
|
||||
#include <gp10b/mm_gp10b.h>
|
||||
#include <gp10b/mc_gp10b.h>
|
||||
#include <gp10b/ce_gp10b.h>
|
||||
#include "gp10b/gr_gp10b.h"
|
||||
#include <gp10b/fifo_gp10b.h>
|
||||
#include <gp10b/therm_gp10b.h>
|
||||
#include <gp10b/priv_ring_gp10b.h>
|
||||
#include <gp10b/ltc_gp10b.h>
|
||||
|
||||
#include <gp106/pmu_gp106.h>
|
||||
#include <gp106/acr_gp106.h>
|
||||
|
||||
#include <gv11b/fb_gv11b.h>
|
||||
#include <gv11b/pmu_gv11b.h>
|
||||
#include <gv11b/acr_gv11b.h>
|
||||
#include <gv11b/mm_gv11b.h>
|
||||
#include <gv11b/mc_gv11b.h>
|
||||
#include <gv11b/ce_gv11b.h>
|
||||
#include <gv11b/fifo_gv11b.h>
|
||||
#include <gv11b/therm_gv11b.h>
|
||||
#include <gv11b/regops_gv11b.h>
|
||||
#include <gv11b/gr_ctx_gv11b.h>
|
||||
#include <gv11b/ltc_gv11b.h>
|
||||
#include <gv11b/gv11b_gating_reglist.h>
|
||||
#include <gv11b/gr_gv11b.h>
|
||||
|
||||
#include <nvgpu/enabled.h>
|
||||
|
||||
#include "vgpu_gv11b.h"
|
||||
#include "vgpu_gr_gv11b.h"
|
||||
#include "vgpu_fifo_gv11b.h"
|
||||
#include "vgpu_subctx_gv11b.h"
|
||||
#include "vgpu_tsg_gv11b.h"
|
||||
|
||||
#include <nvgpu/hw/gv11b/hw_fuse_gv11b.h>
|
||||
#include <nvgpu/hw/gv11b/hw_fifo_gv11b.h>
|
||||
#include <nvgpu/hw/gv11b/hw_ram_gv11b.h>
|
||||
#include <nvgpu/hw/gv11b/hw_top_gv11b.h>
|
||||
#include <nvgpu/hw/gv11b/hw_pwr_gv11b.h>
|
||||
|
||||
static const struct gpu_ops vgpu_gv11b_ops = {
	.ltc = {
		.determine_L2_size_bytes = vgpu_determine_L2_size_bytes,
		.set_zbc_s_entry = gv11b_ltc_set_zbc_stencil_entry,
		.set_zbc_color_entry = gm20b_ltc_set_zbc_color_entry,
		.set_zbc_depth_entry = gm20b_ltc_set_zbc_depth_entry,
		.init_cbc = NULL,
		.init_fs_state = vgpu_ltc_init_fs_state,
		.init_comptags = vgpu_ltc_init_comptags,
		.cbc_ctrl = NULL,
		.isr = gv11b_ltc_isr,
		.flush = gm20b_flush_ltc,
		.set_enabled = gp10b_ltc_set_enabled,
	},
	.ce2 = {
		.isr_stall = gv11b_ce_isr,
		.isr_nonstall = gp10b_ce_nonstall_isr,
		.get_num_pce = vgpu_ce_get_num_pce,
	},
	.gr = {
		.init_gpc_mmu = gr_gv11b_init_gpc_mmu,
		.bundle_cb_defaults = gr_gv11b_bundle_cb_defaults,
		.cb_size_default = gr_gv11b_cb_size_default,
		.calc_global_ctx_buffer_size =
			gr_gv11b_calc_global_ctx_buffer_size,
		.commit_global_attrib_cb = gr_gv11b_commit_global_attrib_cb,
		.commit_global_bundle_cb = gr_gp10b_commit_global_bundle_cb,
		.commit_global_cb_manager = gr_gp10b_commit_global_cb_manager,
		.commit_global_pagepool = gr_gp10b_commit_global_pagepool,
		.handle_sw_method = gr_gv11b_handle_sw_method,
		.set_alpha_circular_buffer_size =
			gr_gv11b_set_alpha_circular_buffer_size,
		.set_circular_buffer_size = gr_gv11b_set_circular_buffer_size,
		.enable_hww_exceptions = gr_gv11b_enable_hww_exceptions,
		.is_valid_class = gr_gv11b_is_valid_class,
		.is_valid_gfx_class = gr_gv11b_is_valid_gfx_class,
		.is_valid_compute_class = gr_gv11b_is_valid_compute_class,
		.get_sm_dsm_perf_regs = gv11b_gr_get_sm_dsm_perf_regs,
		.get_sm_dsm_perf_ctrl_regs = gv11b_gr_get_sm_dsm_perf_ctrl_regs,
		.init_fs_state = vgpu_gr_init_fs_state,
		.set_hww_esr_report_mask = gv11b_gr_set_hww_esr_report_mask,
		.falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments,
		.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode,
		.set_gpc_tpc_mask = gr_gv11b_set_gpc_tpc_mask,
		.get_gpc_tpc_mask = vgpu_gr_get_gpc_tpc_mask,
		.alloc_obj_ctx = vgpu_gr_alloc_obj_ctx,
		.bind_ctxsw_zcull = vgpu_gr_bind_ctxsw_zcull,
		.get_zcull_info = vgpu_gr_get_zcull_info,
		.is_tpc_addr = gr_gm20b_is_tpc_addr,
		.get_tpc_num = gr_gm20b_get_tpc_num,
		.detect_sm_arch = vgpu_gr_detect_sm_arch,
		.add_zbc_color = gr_gp10b_add_zbc_color,
		.add_zbc_depth = gr_gp10b_add_zbc_depth,
		.zbc_set_table = vgpu_gr_add_zbc,
		.zbc_query_table = vgpu_gr_query_zbc,
		.pmu_save_zbc = gk20a_pmu_save_zbc,
		.add_zbc = gr_gk20a_add_zbc,
		.pagepool_default_size = gr_gv11b_pagepool_default_size,
		.init_ctx_state = vgpu_gr_gp10b_init_ctx_state,
		.alloc_gr_ctx = vgpu_gr_gp10b_alloc_gr_ctx,
		.free_gr_ctx = vgpu_gr_free_gr_ctx,
		.update_ctxsw_preemption_mode =
			gr_gp10b_update_ctxsw_preemption_mode,
		.dump_gr_regs = NULL,
		.update_pc_sampling = gr_gm20b_update_pc_sampling,
		.get_fbp_en_mask = vgpu_gr_get_fbp_en_mask,
		.get_max_ltc_per_fbp = vgpu_gr_get_max_ltc_per_fbp,
		.get_max_lts_per_ltc = vgpu_gr_get_max_lts_per_ltc,
		.get_rop_l2_en_mask = vgpu_gr_rop_l2_en_mask,
		.get_max_fbps_count = vgpu_gr_get_max_fbps_count,
		.init_sm_dsm_reg_info = gv11b_gr_init_sm_dsm_reg_info,
		.wait_empty = gr_gv11b_wait_empty,
		.init_cyclestats = vgpu_gr_gm20b_init_cyclestats,
		.set_sm_debug_mode = vgpu_gr_set_sm_debug_mode,
		.enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs,
		.bpt_reg_info = gv11b_gr_bpt_reg_info,
		.get_access_map = gr_gv11b_get_access_map,
		.handle_fecs_error = gr_gv11b_handle_fecs_error,
		.handle_sm_exception = gr_gk20a_handle_sm_exception,
		.handle_tex_exception = gr_gv11b_handle_tex_exception,
		.enable_gpc_exceptions = gr_gv11b_enable_gpc_exceptions,
		.enable_exceptions = gr_gv11b_enable_exceptions,
		.get_lrf_tex_ltc_dram_override = get_ecc_override_val,
		.update_smpc_ctxsw_mode = vgpu_gr_update_smpc_ctxsw_mode,
		.update_hwpm_ctxsw_mode = vgpu_gr_update_hwpm_ctxsw_mode,
		.record_sm_error_state = gv11b_gr_record_sm_error_state,
		.update_sm_error_state = gv11b_gr_update_sm_error_state,
		.clear_sm_error_state = vgpu_gr_clear_sm_error_state,
		.suspend_contexts = vgpu_gr_suspend_contexts,
		.resume_contexts = vgpu_gr_resume_contexts,
		.get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags,
		.init_sm_id_table = vgpu_gr_init_sm_id_table,
		.load_smid_config = gr_gv11b_load_smid_config,
		.program_sm_id_numbering = gr_gv11b_program_sm_id_numbering,
		.is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr,
		.is_ltcn_ltss_addr = gr_gm20b_is_ltcn_ltss_addr,
		.split_lts_broadcast_addr = gr_gm20b_split_lts_broadcast_addr,
		.split_ltc_broadcast_addr = gr_gm20b_split_ltc_broadcast_addr,
		.setup_rop_mapping = gr_gv11b_setup_rop_mapping,
		.program_zcull_mapping = gr_gv11b_program_zcull_mapping,
		.commit_global_timeslice = gr_gv11b_commit_global_timeslice,
		.commit_inst = vgpu_gr_gv11b_commit_inst,
		.write_zcull_ptr = gr_gv11b_write_zcull_ptr,
		.write_pm_ptr = gr_gv11b_write_pm_ptr,
		.init_elcg_mode = gr_gv11b_init_elcg_mode,
		.load_tpc_mask = gr_gv11b_load_tpc_mask,
		.inval_icache = gr_gk20a_inval_icache,
		.trigger_suspend = gv11b_gr_sm_trigger_suspend,
		.wait_for_pause = gr_gk20a_wait_for_pause,
		.resume_from_pause = gv11b_gr_resume_from_pause,
		.clear_sm_errors = gr_gk20a_clear_sm_errors,
		.tpc_enabled_exceptions = gr_gk20a_tpc_enabled_exceptions,
		.get_esr_sm_sel = gv11b_gr_get_esr_sm_sel,
		.sm_debugger_attached = gv11b_gr_sm_debugger_attached,
		.suspend_single_sm = gv11b_gr_suspend_single_sm,
		.suspend_all_sms = gv11b_gr_suspend_all_sms,
		.resume_single_sm = gv11b_gr_resume_single_sm,
		.resume_all_sms = gv11b_gr_resume_all_sms,
		.get_sm_hww_warp_esr = gv11b_gr_get_sm_hww_warp_esr,
		.get_sm_hww_global_esr = gv11b_gr_get_sm_hww_global_esr,
		.get_sm_no_lock_down_hww_global_esr_mask =
			gv11b_gr_get_sm_no_lock_down_hww_global_esr_mask,
		.lock_down_sm = gv11b_gr_lock_down_sm,
		.wait_for_sm_lock_down = gv11b_gr_wait_for_sm_lock_down,
		.clear_sm_hww = gv11b_gr_clear_sm_hww,
		.init_ovr_sm_dsm_perf = gv11b_gr_init_ovr_sm_dsm_perf,
		.get_ovr_perf_regs = gv11b_gr_get_ovr_perf_regs,
		.disable_rd_coalesce = gm20a_gr_disable_rd_coalesce,
		.set_boosted_ctx = NULL,
		.set_preemption_mode = vgpu_gr_gp10b_set_preemption_mode,
		.set_czf_bypass = NULL,
		.pre_process_sm_exception = gr_gv11b_pre_process_sm_exception,
		.set_preemption_buffer_va = gr_gv11b_set_preemption_buffer_va,
		.init_preemption_state = NULL,
		.update_boosted_ctx = NULL,
		.set_bes_crop_debug3 = gr_gp10b_set_bes_crop_debug3,
		.set_bes_crop_debug4 = gr_gp10b_set_bes_crop_debug4,
		.create_gr_sysfs = gr_gv11b_create_sysfs,
		.set_ctxsw_preemption_mode = vgpu_gr_gp10b_set_ctxsw_preemption_mode,
		.is_etpc_addr = gv11b_gr_pri_is_etpc_addr,
		.egpc_etpc_priv_addr_table = gv11b_gr_egpc_etpc_priv_addr_table,
		.handle_tpc_mpc_exception = gr_gv11b_handle_tpc_mpc_exception,
		.zbc_s_query_table = gr_gv11b_zbc_s_query_table,
		.load_zbc_s_default_tbl = gr_gv11b_load_stencil_default_tbl,
		.handle_gpc_gpcmmu_exception =
			gr_gv11b_handle_gpc_gpcmmu_exception,
		.add_zbc_type_s = gr_gv11b_add_zbc_type_s,
		.get_egpc_base = gv11b_gr_get_egpc_base,
		.get_egpc_etpc_num = gv11b_gr_get_egpc_etpc_num,
		.handle_gpc_gpccs_exception =
			gr_gv11b_handle_gpc_gpccs_exception,
		.load_zbc_s_tbl = gr_gv11b_load_stencil_tbl,
		.access_smpc_reg = gv11b_gr_access_smpc_reg,
		.is_egpc_addr = gv11b_gr_pri_is_egpc_addr,
		.add_zbc_s = gr_gv11b_add_zbc_stencil,
		.handle_gcc_exception = gr_gv11b_handle_gcc_exception,
		.init_sw_veid_bundle = gr_gv11b_init_sw_veid_bundle,
		.handle_tpc_sm_ecc_exception =
			gr_gv11b_handle_tpc_sm_ecc_exception,
		.decode_egpc_addr = gv11b_gr_decode_egpc_addr,
		.init_ctxsw_hdr_data = gr_gp10b_init_ctxsw_hdr_data,
		.init_gfxp_wfi_timeout_count =
			gr_gv11b_init_gfxp_wfi_timeout_count,
		.get_max_gfxp_wfi_timeout_count =
			gr_gv11b_get_max_gfxp_wfi_timeout_count,
	},
	.fb = {
		.reset = gv11b_fb_reset,
		.init_hw = gk20a_fb_init_hw,
		.init_fs_state = gv11b_fb_init_fs_state,
		.init_cbc = gv11b_fb_init_cbc,
		.set_mmu_page_size = gm20b_fb_set_mmu_page_size,
		.set_use_full_comp_tag_line =
			gm20b_fb_set_use_full_comp_tag_line,
		.compression_page_size = gp10b_fb_compression_page_size,
		.compressible_page_size = gp10b_fb_compressible_page_size,
		.compression_align_mask = gm20b_fb_compression_align_mask,
		.vpr_info_fetch = gm20b_fb_vpr_info_fetch,
		.dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info,
		.read_wpr_info = gm20b_fb_read_wpr_info,
		.is_debug_mode_enabled = NULL,
		.set_debug_mode = vgpu_mm_mmu_set_debug_mode,
		.tlb_invalidate = vgpu_mm_tlb_invalidate,
		.hub_isr = gv11b_fb_hub_isr,
	},
	.clock_gating = {
		.slcg_bus_load_gating_prod =
			gv11b_slcg_bus_load_gating_prod,
		.slcg_ce2_load_gating_prod =
			gv11b_slcg_ce2_load_gating_prod,
		.slcg_chiplet_load_gating_prod =
			gv11b_slcg_chiplet_load_gating_prod,
		.slcg_ctxsw_firmware_load_gating_prod =
			gv11b_slcg_ctxsw_firmware_load_gating_prod,
		.slcg_fb_load_gating_prod =
			gv11b_slcg_fb_load_gating_prod,
		.slcg_fifo_load_gating_prod =
			gv11b_slcg_fifo_load_gating_prod,
		.slcg_gr_load_gating_prod =
			gr_gv11b_slcg_gr_load_gating_prod,
		.slcg_ltc_load_gating_prod =
			ltc_gv11b_slcg_ltc_load_gating_prod,
		.slcg_perf_load_gating_prod =
			gv11b_slcg_perf_load_gating_prod,
		.slcg_priring_load_gating_prod =
			gv11b_slcg_priring_load_gating_prod,
		.slcg_pmu_load_gating_prod =
			gv11b_slcg_pmu_load_gating_prod,
		.slcg_therm_load_gating_prod =
			gv11b_slcg_therm_load_gating_prod,
		.slcg_xbar_load_gating_prod =
			gv11b_slcg_xbar_load_gating_prod,
		.blcg_bus_load_gating_prod =
			gv11b_blcg_bus_load_gating_prod,
		.blcg_ce_load_gating_prod =
			gv11b_blcg_ce_load_gating_prod,
		.blcg_ctxsw_firmware_load_gating_prod =
			gv11b_blcg_ctxsw_firmware_load_gating_prod,
		.blcg_fb_load_gating_prod =
			gv11b_blcg_fb_load_gating_prod,
		.blcg_fifo_load_gating_prod =
			gv11b_blcg_fifo_load_gating_prod,
		.blcg_gr_load_gating_prod =
			gv11b_blcg_gr_load_gating_prod,
		.blcg_ltc_load_gating_prod =
			gv11b_blcg_ltc_load_gating_prod,
		.blcg_pwr_csb_load_gating_prod =
			gv11b_blcg_pwr_csb_load_gating_prod,
		.blcg_pmu_load_gating_prod =
			gv11b_blcg_pmu_load_gating_prod,
		.blcg_xbar_load_gating_prod =
			gv11b_blcg_xbar_load_gating_prod,
		.pg_gr_load_gating_prod =
			gr_gv11b_pg_gr_load_gating_prod,
	},
	.fifo = {
		.init_fifo_setup_hw = vgpu_gv11b_init_fifo_setup_hw,
		.bind_channel = vgpu_channel_bind,
		.unbind_channel = vgpu_channel_unbind,
		.disable_channel = vgpu_channel_disable,
		.enable_channel = vgpu_channel_enable,
		.alloc_inst = vgpu_channel_alloc_inst,
		.free_inst = vgpu_channel_free_inst,
		.setup_ramfc = vgpu_channel_setup_ramfc,
		.default_timeslice_us = vgpu_fifo_default_timeslice_us,
		.setup_userd = gk20a_fifo_setup_userd,
		.userd_gp_get = gv11b_userd_gp_get,
		.userd_gp_put = gv11b_userd_gp_put,
		.userd_pb_get = gv11b_userd_pb_get,
		.pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val,
		.preempt_channel = vgpu_fifo_preempt_channel,
		.preempt_tsg = vgpu_fifo_preempt_tsg,
		.enable_tsg = vgpu_enable_tsg,
		.disable_tsg = gk20a_disable_tsg,
		.tsg_verify_channel_status = NULL,
		.tsg_verify_status_ctx_reload = NULL,
		/* TODO: implement it for CE fault */
		.tsg_verify_status_faulted = NULL,
		.update_runlist = vgpu_fifo_update_runlist,
		.trigger_mmu_fault = NULL,
		.get_mmu_fault_info = NULL,
		.wait_engine_idle = vgpu_fifo_wait_engine_idle,
		.get_num_fifos = gv11b_fifo_get_num_fifos,
		.get_pbdma_signature = gp10b_fifo_get_pbdma_signature,
		.set_runlist_interleave = vgpu_fifo_set_runlist_interleave,
		.tsg_set_timeslice = vgpu_tsg_set_timeslice,
		.tsg_open = vgpu_tsg_open,
		.tsg_release = vgpu_tsg_release,
		.force_reset_ch = vgpu_fifo_force_reset_ch,
		.engine_enum_from_type = gp10b_fifo_engine_enum_from_type,
		.device_info_data_parse = gp10b_device_info_data_parse,
		.eng_runlist_base_size = fifo_eng_runlist_base__size_1_v,
		.init_engine_info = vgpu_fifo_init_engine_info,
		.runlist_entry_size = ram_rl_entry_size_v,
		.get_tsg_runlist_entry = gv11b_get_tsg_runlist_entry,
		.get_ch_runlist_entry = gv11b_get_ch_runlist_entry,
		.is_fault_engine_subid_gpc = gv11b_is_fault_engine_subid_gpc,
		.dump_pbdma_status = gk20a_dump_pbdma_status,
		.dump_eng_status = gv11b_dump_eng_status,
		.dump_channel_status_ramfc = gv11b_dump_channel_status_ramfc,
		.intr_0_error_mask = gv11b_fifo_intr_0_error_mask,
		.is_preempt_pending = gv11b_fifo_is_preempt_pending,
		.init_pbdma_intr_descs = gv11b_fifo_init_pbdma_intr_descs,
		.reset_enable_hw = gv11b_init_fifo_reset_enable_hw,
		.teardown_ch_tsg = gv11b_fifo_teardown_ch_tsg,
		.handle_sched_error = gv11b_fifo_handle_sched_error,
		.handle_pbdma_intr_0 = gv11b_fifo_handle_pbdma_intr_0,
		.handle_pbdma_intr_1 = gv11b_fifo_handle_pbdma_intr_1,
		.init_eng_method_buffers = gv11b_fifo_init_eng_method_buffers,
		.deinit_eng_method_buffers =
			gv11b_fifo_deinit_eng_method_buffers,
		.tsg_bind_channel = vgpu_gv11b_tsg_bind_channel,
		.tsg_unbind_channel = vgpu_tsg_unbind_channel,
#ifdef CONFIG_TEGRA_GK20A_NVHOST
		.alloc_syncpt_buf = vgpu_gv11b_fifo_alloc_syncpt_buf,
		.free_syncpt_buf = gv11b_fifo_free_syncpt_buf,
		.add_syncpt_wait_cmd = gv11b_fifo_add_syncpt_wait_cmd,
		.get_syncpt_wait_cmd_size = gv11b_fifo_get_syncpt_wait_cmd_size,
		.add_syncpt_incr_cmd = gv11b_fifo_add_syncpt_incr_cmd,
		.get_syncpt_incr_cmd_size = gv11b_fifo_get_syncpt_incr_cmd_size,
		.get_sync_ro_map = vgpu_gv11b_fifo_get_sync_ro_map,
#endif
		.resetup_ramfc = NULL,
		.reschedule_runlist = NULL,
		.device_info_fault_id = top_device_info_data_fault_id_enum_v,
		.free_channel_ctx_header = vgpu_gv11b_free_subctx_header,
		.preempt_ch_tsg = gv11b_fifo_preempt_ch_tsg,
		.handle_ctxsw_timeout = gv11b_fifo_handle_ctxsw_timeout,
	},
	.gr_ctx = {
		.get_netlist_name = gr_gv11b_get_netlist_name,
		.is_fw_defined = gr_gv11b_is_firmware_defined,
	},
#ifdef CONFIG_GK20A_CTXSW_TRACE
	.fecs_trace = {
		.alloc_user_buffer = NULL,
		.free_user_buffer = NULL,
		.mmap_user_buffer = NULL,
		.init = NULL,
		.deinit = NULL,
		.enable = NULL,
		.disable = NULL,
		.is_enabled = NULL,
		.reset = NULL,
		.flush = NULL,
		.poll = NULL,
		.bind_channel = NULL,
		.unbind_channel = NULL,
		.max_entries = NULL,
	},
#endif /* CONFIG_GK20A_CTXSW_TRACE */
	.mm = {
		/* FIXME: add support for sparse mappings */
		.support_sparse = NULL,
		.gmmu_map = vgpu_gp10b_locked_gmmu_map,
		.gmmu_unmap = vgpu_locked_gmmu_unmap,
		.vm_bind_channel = vgpu_vm_bind_channel,
		.fb_flush = vgpu_mm_fb_flush,
		.l2_invalidate = vgpu_mm_l2_invalidate,
		.l2_flush = vgpu_mm_l2_flush,
		.cbc_clean = gk20a_mm_cbc_clean,
		.set_big_page_size = gm20b_mm_set_big_page_size,
		.get_big_page_sizes = gm20b_mm_get_big_page_sizes,
		.get_default_big_page_size = gp10b_mm_get_default_big_page_size,
		.gpu_phys_addr = gm20b_gpu_phys_addr,
		.get_iommu_bit = gk20a_mm_get_iommu_bit,
		.get_mmu_levels = gp10b_mm_get_mmu_levels,
		.init_pdb = gp10b_mm_init_pdb,
		.init_mm_setup_hw = vgpu_gp10b_init_mm_setup_hw,
		.is_bar1_supported = gv11b_mm_is_bar1_supported,
		.init_inst_block = gv11b_init_inst_block,
		.mmu_fault_pending = gv11b_mm_mmu_fault_pending,
		.get_kind_invalid = gm20b_get_kind_invalid,
		.get_kind_pitch = gm20b_get_kind_pitch,
		.init_bar2_vm = gp10b_init_bar2_vm,
		.init_bar2_mm_hw_setup = gv11b_init_bar2_mm_hw_setup,
		.remove_bar2_vm = gv11b_mm_remove_bar2_vm,
		.fault_info_mem_destroy = gv11b_mm_fault_info_mem_destroy,
	},
	.therm = {
		.init_therm_setup_hw = gp10b_init_therm_setup_hw,
		.elcg_init_idle_filters = gv11b_elcg_init_idle_filters,
	},
	.pmu = {
		.pmu_setup_elpg = gp10b_pmu_setup_elpg,
		.pmu_get_queue_head = pwr_pmu_queue_head_r,
		.pmu_get_queue_head_size = pwr_pmu_queue_head__size_1_v,
		.pmu_get_queue_tail = pwr_pmu_queue_tail_r,
		.pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v,
		.pmu_queue_head = gk20a_pmu_queue_head,
		.pmu_queue_tail = gk20a_pmu_queue_tail,
		.pmu_msgq_tail = gk20a_pmu_msgq_tail,
		.pmu_mutex_size = pwr_pmu_mutex__size_1_v,
		.pmu_mutex_acquire = gk20a_pmu_mutex_acquire,
		.pmu_mutex_release = gk20a_pmu_mutex_release,
		.write_dmatrfbase = gp10b_write_dmatrfbase,
		.pmu_elpg_statistics = gp106_pmu_elpg_statistics,
		.pmu_init_perfmon = nvgpu_pmu_init_perfmon_rpc,
		.pmu_perfmon_start_sampling = nvgpu_pmu_perfmon_start_sampling_rpc,
		.pmu_perfmon_stop_sampling = nvgpu_pmu_perfmon_stop_sampling_rpc,
		.pmu_perfmon_get_samples_rpc = nvgpu_pmu_perfmon_get_samples_rpc,
		.pmu_pg_init_param = gv11b_pg_gr_init,
		.pmu_pg_supported_engines_list = gk20a_pmu_pg_engines_list,
		.pmu_pg_engines_feature_list = gk20a_pmu_pg_feature_list,
		.dump_secure_fuses = pmu_dump_security_fuses_gp10b,
		.reset_engine = gp106_pmu_engine_reset,
		.is_engine_in_reset = gp106_pmu_is_engine_in_reset,
		.pmu_nsbootstrap = gv11b_pmu_bootstrap,
		.pmu_pg_set_sub_feature_mask = gv11b_pg_set_subfeature_mask,
		.is_pmu_supported = gv11b_is_pmu_supported,
	},
	.regops = {
		.get_global_whitelist_ranges =
			gv11b_get_global_whitelist_ranges,
		.get_global_whitelist_ranges_count =
			gv11b_get_global_whitelist_ranges_count,
		.get_context_whitelist_ranges =
			gv11b_get_context_whitelist_ranges,
		.get_context_whitelist_ranges_count =
			gv11b_get_context_whitelist_ranges_count,
		.get_runcontrol_whitelist = gv11b_get_runcontrol_whitelist,
		.get_runcontrol_whitelist_count =
			gv11b_get_runcontrol_whitelist_count,
		.get_runcontrol_whitelist_ranges =
			gv11b_get_runcontrol_whitelist_ranges,
		.get_runcontrol_whitelist_ranges_count =
			gv11b_get_runcontrol_whitelist_ranges_count,
		.get_qctl_whitelist = gv11b_get_qctl_whitelist,
		.get_qctl_whitelist_count = gv11b_get_qctl_whitelist_count,
		.get_qctl_whitelist_ranges = gv11b_get_qctl_whitelist_ranges,
		.get_qctl_whitelist_ranges_count =
			gv11b_get_qctl_whitelist_ranges_count,
		.apply_smpc_war = gv11b_apply_smpc_war,
	},
	.mc = {
		.intr_enable = mc_gv11b_intr_enable,
		.intr_unit_config = mc_gp10b_intr_unit_config,
		.isr_stall = mc_gp10b_isr_stall,
		.intr_stall = mc_gp10b_intr_stall,
		.intr_stall_pause = mc_gp10b_intr_stall_pause,
		.intr_stall_resume = mc_gp10b_intr_stall_resume,
		.intr_nonstall = mc_gp10b_intr_nonstall,
		.intr_nonstall_pause = mc_gp10b_intr_nonstall_pause,
		.intr_nonstall_resume = mc_gp10b_intr_nonstall_resume,
		.enable = gk20a_mc_enable,
		.disable = gk20a_mc_disable,
		.reset = gk20a_mc_reset,
		.boot_0 = gk20a_mc_boot_0,
		.is_intr1_pending = mc_gp10b_is_intr1_pending,
		.is_intr_hub_pending = gv11b_mc_is_intr_hub_pending,
	},
	.debug = {
		.show_dump = NULL,
	},
	.dbg_session_ops = {
		.exec_reg_ops = vgpu_exec_regops,
		.dbg_set_powergate = vgpu_dbg_set_powergate,
		.check_and_set_global_reservation =
			vgpu_check_and_set_global_reservation,
		.check_and_set_context_reservation =
			vgpu_check_and_set_context_reservation,
		.release_profiler_reservation =
			vgpu_release_profiler_reservation,
		.perfbuffer_enable = vgpu_perfbuffer_enable,
		.perfbuffer_disable = vgpu_perfbuffer_disable,
	},
	.bus = {
		.init_hw = gk20a_bus_init_hw,
		.isr = gk20a_bus_isr,
		.read_ptimer = vgpu_read_ptimer,
		.get_timestamps_zipper = vgpu_get_timestamps_zipper,
		.bar1_bind = NULL,
	},
#if defined(CONFIG_GK20A_CYCLE_STATS)
	.css = {
		.enable_snapshot = vgpu_css_enable_snapshot_buffer,
		.disable_snapshot = vgpu_css_release_snapshot_buffer,
		.check_data_available = vgpu_css_flush_snapshots,
		.detach_snapshot = vgpu_css_detach,
		.set_handled_snapshots = NULL,
		.allocate_perfmon_ids = NULL,
		.release_perfmon_ids = NULL,
	},
#endif
	.falcon = {
		.falcon_hal_sw_init = gk20a_falcon_hal_sw_init,
	},
	.priv_ring = {
		.isr = gp10b_priv_ring_isr,
	},
	.chip_init_gpu_characteristics = vgpu_gv11b_init_gpu_characteristics,
	.get_litter_value = gv11b_get_litter_value,
};

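/* Install the static table above into the live gpu_ops, one unit at a time. */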
int vgpu_gv11b_init_hal(struct gk20a *g)
{
	struct gpu_ops *gops = &g->ops;

	gops->ltc = vgpu_gv11b_ops.ltc;
	gops->ce2 = vgpu_gv11b_ops.ce2;
	gops->gr = vgpu_gv11b_ops.gr;
	gops->fb = vgpu_gv11b_ops.fb;
	gops->clock_gating = vgpu_gv11b_ops.clock_gating;
	gops->fifo = vgpu_gv11b_ops.fifo;
	gops->gr_ctx = vgpu_gv11b_ops.gr_ctx;
	gops->mm = vgpu_gv11b_ops.mm;
#ifdef CONFIG_GK20A_CTXSW_TRACE
	gops->fecs_trace = vgpu_gv11b_ops.fecs_trace;
#endif
	gops->therm = vgpu_gv11b_ops.therm;
	gops->pmu = vgpu_gv11b_ops.pmu;
	gops->regops = vgpu_gv11b_ops.regops;
	gops->mc = vgpu_gv11b_ops.mc;
	gops->debug = vgpu_gv11b_ops.debug;
	gops->dbg_session_ops = vgpu_gv11b_ops.dbg_session_ops;
	gops->bus = vgpu_gv11b_ops.bus;
#if defined(CONFIG_GK20A_CYCLE_STATS)
	gops->css = vgpu_gv11b_ops.css;
#endif
	gops->falcon = vgpu_gv11b_ops.falcon;
	gops->priv_ring = vgpu_gv11b_ops.priv_ring;

	/* Lone functions */
	gops->chip_init_gpu_characteristics =
		vgpu_gv11b_ops.chip_init_gpu_characteristics;
	gops->get_litter_value = vgpu_gv11b_ops.get_litter_value;

	g->name = "gv11b";

	return 0;
}
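/*
 * vgpu_gv11b_init_hal() is reached from the common vgpu_init_hal()
 * dispatcher (see vgpu.c further down in this change), which selects it
 * when the detected arch/impl pair matches NVGPU_GPUID_GV11B.
 */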
@@ -1,73 +0,0 @@
/*
 * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "gk20a/gk20a.h"
#include "common/linux/vgpu/vgpu.h"
#include <nvgpu/vgpu/tegra_vgpu.h>
#include <nvgpu/hw/gv11b/hw_ctxsw_prog_gv11b.h>

int vgpu_gv11b_alloc_subctx_header(struct channel_gk20a *c)
{
	struct ctx_header_desc *ctx = &c->ctx_header;
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_alloc_ctx_header_params *p =
			&msg.params.alloc_ctx_header;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_ALLOC_CTX_HEADER;
	msg.handle = vgpu_get_handle(c->g);
	p->ch_handle = c->virt_ctx;
	p->ctx_header_va = __nvgpu_vm_alloc_va(c->vm,
			ctxsw_prog_fecs_header_v(),
			gmmu_page_size_kernel);
	if (!p->ctx_header_va) {
		nvgpu_err(c->g, "alloc va failed for ctx_header");
		return -ENOMEM;
	}
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (unlikely(err)) {
		nvgpu_err(c->g, "alloc ctx_header failed err %d", err);
		__nvgpu_vm_free_va(c->vm, p->ctx_header_va,
			gmmu_page_size_kernel);
		return err;
	}
	ctx->mem.gpu_va = p->ctx_header_va;

	return err;
}

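/*
 * Both halves of the subctx header lifecycle share a split of work: the
 * guest allocates/frees the GPU VA locally with __nvgpu_vm_alloc_va()/
 * __nvgpu_vm_free_va(), while the RM server is asked over IVC to allocate
 * or free the backing context header at that VA.
 */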
void vgpu_gv11b_free_subctx_header(struct channel_gk20a *c)
{
	struct ctx_header_desc *ctx = &c->ctx_header;
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_free_ctx_header_params *p =
			&msg.params.free_ctx_header;
	int err;

	if (ctx->mem.gpu_va) {
		msg.cmd = TEGRA_VGPU_CMD_FREE_CTX_HEADER;
		msg.handle = vgpu_get_handle(c->g);
		p->ch_handle = c->virt_ctx;
		err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
		err = err ? err : msg.ret;
		if (unlikely(err))
			nvgpu_err(c->g, "free ctx_header failed err %d", err);
		__nvgpu_vm_free_va(c->vm, ctx->mem.gpu_va,
			gmmu_page_size_kernel);
		ctx->mem.gpu_va = 0;
	}
}
@@ -1,25 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _VGPU_SUBCTX_GV11B_H_
#define _VGPU_SUBCTX_GV11B_H_

struct channel_gk20a;

int vgpu_gv11b_alloc_subctx_header(struct channel_gk20a *c);
void vgpu_gv11b_free_subctx_header(struct channel_gk20a *c);

#endif
@@ -1,53 +0,0 @@
/*
 * Copyright (c) 2016-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <nvgpu/vgpu/tegra_vgpu.h>
#include "gk20a/gk20a.h"
#include "common/linux/vgpu/vgpu.h"

#include "vgpu_tsg_gv11b.h"

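/*
 * Unlike the plain TSG_BIND_CHANNEL RPC used on older chips (see
 * vgpu_tsg_bind_channel() later in this change), the gv11b "_EX" variant
 * also carries the channel's subctx_id and runqueue_sel in addition to the
 * TSG id and channel handle.
 */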
int vgpu_gv11b_tsg_bind_channel(struct tsg_gk20a *tsg,
			struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_tsg_bind_channel_ex_params *p =
			&msg.params.tsg_bind_channel_ex;
	int err;

	gk20a_dbg_fn("");

	err = gk20a_tsg_bind_channel(tsg, ch);
	if (err)
		return err;

	msg.cmd = TEGRA_VGPU_CMD_TSG_BIND_CHANNEL_EX;
	msg.handle = vgpu_get_handle(tsg->g);
	p->tsg_id = tsg->tsgid;
	p->ch_handle = ch->virt_ctx;
	p->subctx_id = ch->subctx_id;
	p->runqueue_sel = ch->runqueue_sel;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(tsg->g,
			"vgpu_gv11b_tsg_bind_channel failed, ch %d tsgid %d",
			ch->chid, tsg->tsgid);
		gk20a_tsg_unbind_channel(ch);
	}

	return err;
}
@@ -1,23 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _VGPU_TSG_GV11B_H_
#define _VGPU_TSG_GV11B_H_

int vgpu_gv11b_tsg_bind_channel(struct tsg_gk20a *tsg,
			struct channel_gk20a *ch);

#endif
@@ -1,62 +0,0 @@
/*
 * Virtualized GPU L2
 *
 * Copyright (c) 2014-2018 NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "gk20a/gk20a.h"
#include "vgpu.h"
#include "ltc_vgpu.h"

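/*
 * Everything below is answered from priv->constants, which
 * vgpu_get_constants() fetched from the RM server once at init; no
 * per-call RPC is needed for these queries.
 */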
int vgpu_determine_L2_size_bytes(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	gk20a_dbg_fn("");

	return priv->constants.l2_size;
}

int vgpu_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);
	u32 max_comptag_lines = 0;
	int err;

	gk20a_dbg_fn("");

	gr->cacheline_size = priv->constants.cacheline_size;
	gr->comptags_per_cacheline = priv->constants.comptags_per_cacheline;
	gr->slices_per_ltc = priv->constants.slices_per_ltc;
	max_comptag_lines = priv->constants.comptag_lines;

	if (max_comptag_lines < 2)
		return -ENXIO;

	err = gk20a_comptag_allocator_init(g, &gr->comp_tags, max_comptag_lines);
	if (err)
		return err;

	return 0;
}

void vgpu_ltc_init_fs_state(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	gk20a_dbg_fn("");

	g->ltc_count = priv->constants.ltc_count;
}
@@ -1,27 +0,0 @@
/*
 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _LTC_VGPU_H_
#define _LTC_VGPU_H_

struct gk20a;
struct gr_gk20a;

int vgpu_determine_L2_size_bytes(struct gk20a *g);
int vgpu_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr);
void vgpu_ltc_init_fs_state(struct gk20a *g);

#endif
@@ -1,272 +0,0 @@
/*
 * Virtualized GPU Memory Management
 *
 * Copyright (c) 2014-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <nvgpu/kmem.h>
#include <nvgpu/dma.h>
#include <nvgpu/bug.h>
#include <nvgpu/vm.h>
#include <nvgpu/vm_area.h>

#include <nvgpu/vgpu/vm.h>

#include <nvgpu/linux/vm.h>
#include <nvgpu/linux/nvgpu_mem.h>

#include "vgpu.h"
#include "mm_vgpu.h"
#include "gk20a/gk20a.h"
#include "gk20a/mm_gk20a.h"
#include "gm20b/mm_gm20b.h"

static int vgpu_init_mm_setup_sw(struct gk20a *g)
{
	struct mm_gk20a *mm = &g->mm;

	gk20a_dbg_fn("");

	if (mm->sw_ready) {
		gk20a_dbg_fn("skip init");
		return 0;
	}

	nvgpu_mutex_init(&mm->tlb_lock);
	nvgpu_mutex_init(&mm->priv_lock);

	mm->g = g;

	/*TBD: make channel vm size configurable */
	mm->channel.user_size = NV_MM_DEFAULT_USER_SIZE;
	mm->channel.kernel_size = NV_MM_DEFAULT_KERNEL_SIZE;

	gk20a_dbg_info("channel vm size: user %dMB kernel %dMB",
			(int)(mm->channel.user_size >> 20),
			(int)(mm->channel.kernel_size >> 20));

	mm->sw_ready = true;

	return 0;
}

int vgpu_init_mm_support(struct gk20a *g)
{
	int err;

	gk20a_dbg_fn("");

	err = vgpu_init_mm_setup_sw(g);
	if (err)
		return err;

	if (g->ops.mm.init_mm_setup_hw)
		err = g->ops.mm.init_mm_setup_hw(g);

	return err;
}

void vgpu_locked_gmmu_unmap(struct vm_gk20a *vm,
			u64 vaddr,
			u64 size,
			int pgsz_idx,
			bool va_allocated,
			int rw_flag,
			bool sparse,
			struct vm_gk20a_mapping_batch *batch)
{
	struct gk20a *g = gk20a_from_vm(vm);
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_as_map_params *p = &msg.params.as_map;
	int err;

	gk20a_dbg_fn("");

	if (va_allocated) {
		err = __nvgpu_vm_free_va(vm, vaddr, pgsz_idx);
		if (err) {
			nvgpu_err(g, "failed to free va");
			return;
		}
	}

	msg.cmd = TEGRA_VGPU_CMD_AS_UNMAP;
	msg.handle = vgpu_get_handle(g);
	p->handle = vm->handle;
	p->gpu_va = vaddr;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	if (err || msg.ret)
		nvgpu_err(g, "failed to update gmmu ptes on unmap");

	/* TLB invalidate handled on server side */
}

/*
 * This is called by the common VM init routine to handle vGPU specifics of
 * initializing a VM on a vGPU. This alone is not enough to init a VM. See
 * nvgpu_vm_init().
 */
int vgpu_vm_init(struct gk20a *g, struct vm_gk20a *vm)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_as_share_params *p = &msg.params.as_share;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_AS_ALLOC_SHARE;
	msg.handle = vgpu_get_handle(g);
	p->size = vm->va_limit;
	p->big_page_size = vm->big_page_size;

	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	if (err || msg.ret)
		return -ENOMEM;

	vm->handle = p->handle;

	return 0;
}

/*
 * Similar to vgpu_vm_init() this is called as part of the cleanup path for
 * VMs. This alone is not enough to remove a VM - see nvgpu_vm_remove().
 */
void vgpu_vm_remove(struct vm_gk20a *vm)
{
	struct gk20a *g = gk20a_from_vm(vm);
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_as_share_params *p = &msg.params.as_share;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_AS_FREE_SHARE;
	msg.handle = vgpu_get_handle(g);
	p->handle = vm->handle;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
}

u64 vgpu_bar1_map(struct gk20a *g, struct nvgpu_mem *mem)
{
	u64 addr = nvgpu_mem_get_addr(g, mem);
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_as_map_params *p = &msg.params.as_map;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_MAP_BAR1;
	msg.handle = vgpu_get_handle(g);
	p->addr = addr;
	p->size = mem->size;
	p->iova = 0;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	if (err || msg.ret)
		addr = 0;
	else
		addr = p->gpu_va;

	return addr;
}

int vgpu_vm_bind_channel(struct gk20a_as_share *as_share,
			struct channel_gk20a *ch)
{
	struct vm_gk20a *vm = as_share->vm;
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_as_bind_share_params *p = &msg.params.as_bind_share;
	int err;

	gk20a_dbg_fn("");

	ch->vm = vm;
	msg.cmd = TEGRA_VGPU_CMD_AS_BIND_SHARE;
	msg.handle = vgpu_get_handle(ch->g);
	p->as_handle = vm->handle;
	p->chan_handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));

	if (err || msg.ret) {
		ch->vm = NULL;
		err = -ENOMEM;
	}

	if (ch->vm)
		nvgpu_vm_get(ch->vm);

	return err;
}

static void vgpu_cache_maint(u64 handle, u8 op)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_cache_maint_params *p = &msg.params.cache_maint;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_CACHE_MAINT;
	msg.handle = handle;
	p->op = op;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
}

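/*
 * vgpu_cache_maint() above is the shared backend for the FB/L2 maintenance
 * ops below; the op byte selects which maintenance operation the RM server
 * performs.
 */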
int vgpu_mm_fb_flush(struct gk20a *g)
{
	gk20a_dbg_fn("");

	vgpu_cache_maint(vgpu_get_handle(g), TEGRA_VGPU_FB_FLUSH);
	return 0;
}

void vgpu_mm_l2_invalidate(struct gk20a *g)
{
	gk20a_dbg_fn("");

	vgpu_cache_maint(vgpu_get_handle(g), TEGRA_VGPU_L2_MAINT_INV);
}

void vgpu_mm_l2_flush(struct gk20a *g, bool invalidate)
{
	u8 op;

	gk20a_dbg_fn("");

	if (invalidate)
		op = TEGRA_VGPU_L2_MAINT_FLUSH_INV;
	else
		op = TEGRA_VGPU_L2_MAINT_FLUSH;

	vgpu_cache_maint(vgpu_get_handle(g), op);
}

void vgpu_mm_tlb_invalidate(struct gk20a *g, struct nvgpu_mem *pdb)
{
	gk20a_dbg_fn("");

	nvgpu_err(g, "call to RM server not supported");
}

void vgpu_mm_mmu_set_debug_mode(struct gk20a *g, bool enable)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_mmu_debug_mode *p = &msg.params.mmu_debug_mode;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_SET_MMU_DEBUG_MODE;
	msg.handle = vgpu_get_handle(g);
	p->enable = (u32)enable;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	WARN_ON(err || msg.ret);
}
@@ -1,40 +0,0 @@
/*
 * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef _MM_VGPU_H_
#define _MM_VGPU_H_

struct nvgpu_mem;
struct channel_gk20a;
struct vm_gk20a_mapping_batch;
struct gk20a_as_share;

void vgpu_locked_gmmu_unmap(struct vm_gk20a *vm,
			u64 vaddr,
			u64 size,
			int pgsz_idx,
			bool va_allocated,
			int rw_flag,
			bool sparse,
			struct vm_gk20a_mapping_batch *batch);
int vgpu_vm_bind_channel(struct gk20a_as_share *as_share,
			struct channel_gk20a *ch);
int vgpu_mm_fb_flush(struct gk20a *g);
void vgpu_mm_l2_invalidate(struct gk20a *g);
void vgpu_mm_l2_flush(struct gk20a *g, bool invalidate);
void vgpu_mm_tlb_invalidate(struct gk20a *g, struct nvgpu_mem *pdb);
void vgpu_mm_mmu_set_debug_mode(struct gk20a *g, bool enable);
#endif
@@ -15,8 +8,8 @@
 */

#include <linux/device.h>
#include <nvgpu/vgpu/vgpu.h>

#include "vgpu.h"
#include "common/linux/platform_gk20a.h"

static ssize_t vgpu_load_show(struct device *dev,
@@ -1,155 +0,0 @@
/*
 * Copyright (c) 2016-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "gk20a/gk20a.h"
#include "gk20a/channel_gk20a.h"
#include "gk20a/tsg_gk20a.h"
#include "common/linux/platform_gk20a.h"
#include "vgpu.h"
#include "fifo_vgpu.h"

#include <nvgpu/bug.h>
#include <nvgpu/vgpu/tegra_vgpu.h>

int vgpu_tsg_open(struct tsg_gk20a *tsg)
{
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_tsg_open_rel_params *p =
			&msg.params.tsg_open;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_TSG_OPEN;
	msg.handle = vgpu_get_handle(tsg->g);
	p->tsg_id = tsg->tsgid;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(tsg->g,
			"vgpu_tsg_open failed, tsgid %d", tsg->tsgid);
	}

	return err;
}

void vgpu_tsg_release(struct tsg_gk20a *tsg)
{
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_tsg_open_rel_params *p =
			&msg.params.tsg_release;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_TSG_RELEASE;
	msg.handle = vgpu_get_handle(tsg->g);
	p->tsg_id = tsg->tsgid;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(tsg->g,
			"vgpu_tsg_release failed, tsgid %d", tsg->tsgid);
	}
}

int vgpu_enable_tsg(struct tsg_gk20a *tsg)
{
	struct gk20a *g = tsg->g;
	struct channel_gk20a *ch;

	nvgpu_rwsem_down_read(&tsg->ch_list_lock);
	nvgpu_list_for_each_entry(ch, &tsg->ch_list, channel_gk20a, ch_entry)
		g->ops.fifo.enable_channel(ch);
	nvgpu_rwsem_up_read(&tsg->ch_list_lock);

	return 0;
}

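/*
 * Bind/unbind below perform the software-side operation locally first
 * (gk20a_tsg_bind_channel()/gk20a_fifo_tsg_unbind_channel()) and only then
 * mirror the change to the RM server; a failed bind RPC unwinds the local
 * bind.
 */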
int vgpu_tsg_bind_channel(struct tsg_gk20a *tsg,
			struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_tsg_bind_unbind_channel_params *p =
			&msg.params.tsg_bind_unbind_channel;
	int err;

	gk20a_dbg_fn("");

	err = gk20a_tsg_bind_channel(tsg, ch);
	if (err)
		return err;

	msg.cmd = TEGRA_VGPU_CMD_TSG_BIND_CHANNEL;
	msg.handle = vgpu_get_handle(tsg->g);
	p->tsg_id = tsg->tsgid;
	p->ch_handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(tsg->g,
			"vgpu_tsg_bind_channel failed, ch %d tsgid %d",
			ch->chid, tsg->tsgid);
		gk20a_tsg_unbind_channel(ch);
	}

	return err;
}

int vgpu_tsg_unbind_channel(struct channel_gk20a *ch)
{
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_tsg_bind_unbind_channel_params *p =
			&msg.params.tsg_bind_unbind_channel;
	int err;

	gk20a_dbg_fn("");

	err = gk20a_fifo_tsg_unbind_channel(ch);
	if (err)
		return err;

	msg.cmd = TEGRA_VGPU_CMD_TSG_UNBIND_CHANNEL;
	msg.handle = vgpu_get_handle(ch->g);
	p->ch_handle = ch->virt_ctx;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	WARN_ON(err);

	return err;
}

int vgpu_tsg_set_timeslice(struct tsg_gk20a *tsg, u32 timeslice)
{
	struct tegra_vgpu_cmd_msg msg = {0};
	struct tegra_vgpu_tsg_timeslice_params *p =
			&msg.params.tsg_timeslice;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_TSG_SET_TIMESLICE;
	msg.handle = vgpu_get_handle(tsg->g);
	p->tsg_id = tsg->tsgid;
	p->timeslice_us = timeslice;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	WARN_ON(err);
	if (!err)
		tsg->timeslice_us = timeslice;

	return err;
}
@@ -1,344 +0,0 @@
/*
 * Copyright (c) 2014-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include <nvgpu/enabled.h>
#include <nvgpu/bus.h>
#include <nvgpu/vgpu/vgpu_ivc.h>

#include "gk20a/gk20a.h"
#include "vgpu.h"
#include "fecs_trace_vgpu.h"

int vgpu_comm_init(struct gk20a *g)
{
	size_t queue_sizes[] = { TEGRA_VGPU_QUEUE_SIZES };

	return vgpu_ivc_init(g, 3, queue_sizes, TEGRA_VGPU_QUEUE_CMD,
				ARRAY_SIZE(queue_sizes));
}

void vgpu_comm_deinit(void)
{
	size_t queue_sizes[] = { TEGRA_VGPU_QUEUE_SIZES };

	vgpu_ivc_deinit(TEGRA_VGPU_QUEUE_CMD, ARRAY_SIZE(queue_sizes));
}

int vgpu_comm_sendrecv(struct tegra_vgpu_cmd_msg *msg, size_t size_in,
		size_t size_out)
{
	void *handle;
	size_t size = size_in;
	void *data = msg;
	int err;

	err = vgpu_ivc_sendrecv(vgpu_ivc_get_server_vmid(),
				TEGRA_VGPU_QUEUE_CMD, &handle, &data, &size);
	if (!err) {
		WARN_ON(size < size_out);
		memcpy(msg, data, size_out);
		vgpu_ivc_release(handle);
	}

	return err;
}

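/*
 * Nearly every vGPU entry point in this file layers the same
 * request/response idiom on top of vgpu_comm_sendrecv(). A minimal sketch
 * of that pattern (TEGRA_VGPU_CMD_EXAMPLE is a hypothetical placeholder,
 * not a real protocol command):
 *
 *	struct tegra_vgpu_cmd_msg msg = {};
 *	int err;
 *
 *	msg.cmd = TEGRA_VGPU_CMD_EXAMPLE;
 *	msg.handle = vgpu_get_handle(g);
 *	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
 *	err = err ? err : msg.ret;
 */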
u64 vgpu_connect(void)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_connect_params *p = &msg.params.connect;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_CONNECT;
	p->module = TEGRA_VGPU_MODULE_GPU;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));

	return (err || msg.ret) ? 0 : p->handle;
}

int vgpu_get_attribute(u64 handle, u32 attrib, u32 *value)
{
	struct tegra_vgpu_cmd_msg msg;
	struct tegra_vgpu_attrib_params *p = &msg.params.attrib;
	int err;

	msg.cmd = TEGRA_VGPU_CMD_GET_ATTRIBUTE;
	msg.handle = handle;
	p->attrib = attrib;
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));

	if (err || msg.ret)
		return -1;

	*value = p->value;
	return 0;
}

static void vgpu_handle_channel_event(struct gk20a *g,
			struct tegra_vgpu_channel_event_info *info)
{
	struct tsg_gk20a *tsg;

	if (!info->is_tsg) {
		nvgpu_err(g, "channel event posted");
		return;
	}

	if (info->id >= g->fifo.num_channels ||
		info->event_id >= TEGRA_VGPU_CHANNEL_EVENT_ID_MAX) {
		nvgpu_err(g, "invalid channel event");
		return;
	}

	tsg = &g->fifo.tsg[info->id];

	gk20a_tsg_event_id_post_event(tsg, info->event_id);
}

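/*
 * The interrupt thread below stands in for real interrupt lines: the RM
 * server forwards stall/nonstall interrupts and asynchronous events over
 * the TEGRA_VGPU_QUEUE_INTR IVC queue, and this thread demultiplexes them
 * into the same ISR paths a native GPU would take.
 */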
int vgpu_intr_thread(void *dev_id)
{
	struct gk20a *g = dev_id;
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	while (true) {
		struct tegra_vgpu_intr_msg *msg;
		u32 sender;
		void *handle;
		size_t size;
		int err;

		err = vgpu_ivc_recv(TEGRA_VGPU_QUEUE_INTR, &handle,
					(void **)&msg, &size, &sender);
		if (err == -ETIME)
			continue;
		if (WARN_ON(err))
			continue;

		if (msg->event == TEGRA_VGPU_EVENT_ABORT) {
			vgpu_ivc_release(handle);
			break;
		}

		switch (msg->event) {
		case TEGRA_VGPU_EVENT_INTR:
			if (msg->unit == TEGRA_VGPU_INTR_GR)
				vgpu_gr_isr(g, &msg->info.gr_intr);
			else if (msg->unit == TEGRA_VGPU_NONSTALL_INTR_GR)
				vgpu_gr_nonstall_isr(g,
					&msg->info.gr_nonstall_intr);
			else if (msg->unit == TEGRA_VGPU_INTR_FIFO)
				vgpu_fifo_isr(g, &msg->info.fifo_intr);
			else if (msg->unit == TEGRA_VGPU_NONSTALL_INTR_FIFO)
				vgpu_fifo_nonstall_isr(g,
					&msg->info.fifo_nonstall_intr);
			else if (msg->unit == TEGRA_VGPU_NONSTALL_INTR_CE2)
				vgpu_ce2_nonstall_isr(g,
					&msg->info.ce2_nonstall_intr);
			break;
#ifdef CONFIG_GK20A_CTXSW_TRACE
		case TEGRA_VGPU_EVENT_FECS_TRACE:
			vgpu_fecs_trace_data_update(g);
			break;
#endif
		case TEGRA_VGPU_EVENT_CHANNEL:
			vgpu_handle_channel_event(g, &msg->info.channel_event);
			break;
		case TEGRA_VGPU_EVENT_SM_ESR:
			vgpu_gr_handle_sm_esr_event(g, &msg->info.sm_esr);
			break;
		default:
			nvgpu_err(g, "unknown event %u", msg->event);
			break;
		}

		vgpu_ivc_release(handle);
	}

	while (!nvgpu_thread_should_stop(&priv->intr_handler))
		nvgpu_msleep(10);
	return 0;
}

void vgpu_remove_support_common(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);
	struct tegra_vgpu_intr_msg msg;
	int err;

	if (g->dbg_regops_tmp_buf)
		nvgpu_kfree(g, g->dbg_regops_tmp_buf);

	if (g->pmu.remove_support)
		g->pmu.remove_support(&g->pmu);

	if (g->gr.remove_support)
		g->gr.remove_support(&g->gr);

	if (g->fifo.remove_support)
		g->fifo.remove_support(&g->fifo);

	if (g->mm.remove_support)
		g->mm.remove_support(&g->mm);

	msg.event = TEGRA_VGPU_EVENT_ABORT;
	err = vgpu_ivc_send(vgpu_ivc_get_peer_self(), TEGRA_VGPU_QUEUE_INTR,
				&msg, sizeof(msg));
	WARN_ON(err);
	nvgpu_thread_stop(&priv->intr_handler);
}

void vgpu_detect_chip(struct gk20a *g)
{
	struct nvgpu_gpu_params *p = &g->params;
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	p->gpu_arch = priv->constants.arch;
	p->gpu_impl = priv->constants.impl;
	p->gpu_rev = priv->constants.rev;

	gk20a_dbg_info("arch: %x, impl: %x, rev: %x\n",
			p->gpu_arch,
			p->gpu_impl,
			p->gpu_rev);
}

int vgpu_init_gpu_characteristics(struct gk20a *g)
{
	int err;

	gk20a_dbg_fn("");

	err = gk20a_init_gpu_characteristics(g);
	if (err)
		return err;

	__nvgpu_set_enabled(g, NVGPU_SUPPORT_MAP_BUFFER_BATCH, false);

	/* features vgpu does not support */
	__nvgpu_set_enabled(g, NVGPU_SUPPORT_RESCHEDULE_RUNLIST, false);

	return 0;
}

int vgpu_read_ptimer(struct gk20a *g, u64 *value)
{
	struct tegra_vgpu_cmd_msg msg = {0};
	struct tegra_vgpu_read_ptimer_params *p = &msg.params.read_ptimer;
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_READ_PTIMER;
	msg.handle = vgpu_get_handle(g);

	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (!err)
		*value = p->time;
	else
		nvgpu_err(g, "vgpu read ptimer failed, err=%d", err);

	return err;
}

int vgpu_get_timestamps_zipper(struct gk20a *g,
		u32 source_id, u32 count,
		struct nvgpu_cpu_time_correlation_sample *samples)
{
	struct tegra_vgpu_cmd_msg msg = {0};
	struct tegra_vgpu_get_timestamps_zipper_params *p =
			&msg.params.get_timestamps_zipper;
	int err;
	u32 i;

	gk20a_dbg_fn("");

	if (count > TEGRA_VGPU_GET_TIMESTAMPS_ZIPPER_MAX_COUNT) {
		nvgpu_err(g, "count %u overflow", count);
		return -EINVAL;
	}

	msg.cmd = TEGRA_VGPU_CMD_GET_TIMESTAMPS_ZIPPER;
	msg.handle = vgpu_get_handle(g);
	p->source_id = TEGRA_VGPU_GET_TIMESTAMPS_ZIPPER_SRC_ID_TSC;
	p->count = count;

	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;
	if (err) {
		nvgpu_err(g, "vgpu get timestamps zipper failed, err=%d", err);
		return err;
	}

	for (i = 0; i < count; i++) {
		samples[i].cpu_timestamp = p->samples[i].cpu_timestamp;
		samples[i].gpu_timestamp = p->samples[i].gpu_timestamp;
	}

	return err;
}

int vgpu_init_hal(struct gk20a *g)
{
	u32 ver = g->params.gpu_arch + g->params.gpu_impl;
	int err;

	switch (ver) {
	case NVGPU_GPUID_GP10B:
		gk20a_dbg_info("gp10b detected");
		err = vgpu_gp10b_init_hal(g);
		break;
	case NVGPU_GPUID_GV11B:
		err = vgpu_gv11b_init_hal(g);
		break;
	default:
		nvgpu_err(g, "no support for %x", ver);
		err = -ENODEV;
		break;
	}

	return err;
}

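/*
 * vgpu_get_constants() below fills priv->constants once at boot; callbacks
 * such as vgpu_determine_L2_size_bytes(), vgpu_ltc_init_comptags() and
 * vgpu_ce_get_num_pce() then answer from this cache without another RPC.
 */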
int vgpu_get_constants(struct gk20a *g)
{
	struct tegra_vgpu_cmd_msg msg = {};
	struct tegra_vgpu_constants_params *p = &msg.params.constants;
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);
	int err;

	gk20a_dbg_fn("");

	msg.cmd = TEGRA_VGPU_CMD_GET_CONSTANTS;
	msg.handle = vgpu_get_handle(g);
	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
	err = err ? err : msg.ret;

	if (unlikely(err)) {
		nvgpu_err(g, "%s failed, err=%d", __func__, err);
		return err;
	}

	if (unlikely(p->gpc_count > TEGRA_VGPU_MAX_GPC_COUNT ||
		p->max_tpc_per_gpc_count > TEGRA_VGPU_MAX_TPC_COUNT_PER_GPC)) {
		nvgpu_err(g, "gpc_count %d max_tpc_per_gpc %d overflow",
			(int)p->gpc_count, (int)p->max_tpc_per_gpc_count);
		return -EINVAL;
	}

	priv->constants = *p;
	return 0;
}
@@ -1,104 +0,0 @@
/*
 * Copyright (c) 2014-2018, NVIDIA CORPORATION. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#ifndef __VGPU_COMMON_H__
#define __VGPU_COMMON_H__

#include <nvgpu/types.h>
#include <nvgpu/thread.h>
#include <nvgpu/log.h>
#include <nvgpu/vgpu/tegra_vgpu.h>

struct device;
struct tegra_vgpu_gr_intr_info;
struct tegra_vgpu_fifo_intr_info;
struct tegra_vgpu_cmd_msg;
struct nvgpu_mem;
struct gk20a;
struct vm_gk20a;
struct nvgpu_gr_ctx;
struct nvgpu_cpu_time_correlation_sample;

struct vgpu_priv_data {
	u64 virt_handle;
	struct nvgpu_thread intr_handler;
	struct tegra_vgpu_constants_params constants;
};

struct vgpu_priv_data *vgpu_get_priv_data(struct gk20a *g);

static inline u64 vgpu_get_handle(struct gk20a *g)
{
	struct vgpu_priv_data *priv = vgpu_get_priv_data(g);

	if (unlikely(!priv)) {
		nvgpu_err(g, "invalid vgpu_priv_data in %s", __func__);
		return INT_MAX;
	}

	return priv->virt_handle;
}

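/*
 * Returning INT_MAX above acts as a poison handle: an RPC issued with it
 * presumably fails on the server side, which is safer than dereferencing a
 * missing vgpu_priv_data in the guest (rationale inferred from the code,
 * not stated in the original).
 */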
int vgpu_comm_init(struct gk20a *g);
void vgpu_comm_deinit(void);
int vgpu_comm_sendrecv(struct tegra_vgpu_cmd_msg *msg, size_t size_in,
		size_t size_out);
u64 vgpu_connect(void);
int vgpu_get_attribute(u64 handle, u32 attrib, u32 *value);
int vgpu_intr_thread(void *dev_id);
void vgpu_remove_support_common(struct gk20a *g);
void vgpu_detect_chip(struct gk20a *g);
int vgpu_init_gpu_characteristics(struct gk20a *g);
int vgpu_read_ptimer(struct gk20a *g, u64 *value);
int vgpu_get_timestamps_zipper(struct gk20a *g,
		u32 source_id, u32 count,
		struct nvgpu_cpu_time_correlation_sample *samples);
int vgpu_init_hal(struct gk20a *g);
int vgpu_get_constants(struct gk20a *g);
u64 vgpu_bar1_map(struct gk20a *g, struct nvgpu_mem *mem);
int vgpu_gr_isr(struct gk20a *g, struct tegra_vgpu_gr_intr_info *info);
int vgpu_gr_nonstall_isr(struct gk20a *g,
			struct tegra_vgpu_gr_nonstall_intr_info *info);
int vgpu_gr_alloc_gr_ctx(struct gk20a *g,
			struct nvgpu_gr_ctx *gr_ctx,
			struct vm_gk20a *vm,
			u32 class,
			u32 flags);
void vgpu_gr_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm,
			struct nvgpu_gr_ctx *gr_ctx);
void vgpu_gr_handle_sm_esr_event(struct gk20a *g,
			struct tegra_vgpu_sm_esr_info *info);
int vgpu_gr_init_ctx_state(struct gk20a *g);
int vgpu_fifo_isr(struct gk20a *g, struct tegra_vgpu_fifo_intr_info *info);
int vgpu_fifo_nonstall_isr(struct gk20a *g,
			struct tegra_vgpu_fifo_nonstall_intr_info *info);
int vgpu_ce2_nonstall_isr(struct gk20a *g,
			struct tegra_vgpu_ce2_nonstall_intr_info *info);
u32 vgpu_ce_get_num_pce(struct gk20a *g);
int vgpu_init_mm_support(struct gk20a *g);
int vgpu_init_gr_support(struct gk20a *g);
int vgpu_init_fifo_support(struct gk20a *g);

int vgpu_gp10b_init_hal(struct gk20a *g);
int vgpu_gv11b_init_hal(struct gk20a *g);

int vgpu_read_ptimer(struct gk20a *g, u64 *value);
int vgpu_get_timestamps_zipper(struct gk20a *g,
		u32 source_id, u32 count,
		struct nvgpu_cpu_time_correlation_sample *samples);
bool vgpu_is_reduced_bar1(struct gk20a *g);

#endif
@@ -32,9 +8,8 @@
#include <nvgpu/ctxsw_trace.h>
#include <nvgpu/defaults.h>

#include "vgpu.h"
#include "vgpu_linux.h"
#include "fecs_trace_vgpu.h"
#include "vgpu/fecs_trace_vgpu.h"
#include "clk_vgpu.h"
#include "gk20a/tsg_gk20a.h"
#include "gk20a/channel_gk20a.h"

@@ -24,7 +24,7 @@ struct platform_device;

#ifdef CONFIG_TEGRA_GR_VIRTUALIZATION

#include "vgpu.h"
#include <nvgpu/vgpu/vgpu.h>

int vgpu_pm_prepare_poweroff(struct device *dev);
int vgpu_pm_finalize_poweron(struct device *dev);