Files
linux-nvgpu/drivers/gpu/nvgpu/hal/fifo/ramfc_ga10b_fusa.c
Rajesh Devaraj b9e771ecfc gpu: nvgpu: split capture_ram_dump api
This patch splits capture_ram_dump into two parts to separate out
NV_RAMFC_TOP_LEVEL_GET/NV_RAMFC_TOP_LEVEL_GET_HI into a new api. This
split helps in reducing duplication of capture_ram_dump in future chips.

JIRA NVGPU-9325

Change-Id: I4dba2db7c08406af1569e28037b2aa2f2abfc782
Signed-off-by: Rajesh Devaraj <rdevaraj@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2836197
Reviewed-by: svcacv <svcacv@nvidia.com>
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svc-mobile-misra <svc-mobile-misra@nvidia.com>
Reviewed-by: Seema Khowala <seemaj@nvidia.com>
GVS: Gerrit_Virtual_Submit <buildbot_gerritrpt@nvidia.com>
2023-01-05 05:45:15 -08:00

175 lines
5.8 KiB
C

/*
* Copyright (c) 2020-2023, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/log.h>
#include <nvgpu/log2.h>
#include <nvgpu/nvgpu_mem.h>
#include <nvgpu/io.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/channel.h>
#include <nvgpu/fifo.h>
#include <nvgpu/engines.h>
#include <nvgpu/runlist.h>
#include "hal/fifo/ramfc_ga10b.h"
#include <nvgpu/hw/ga10b/hw_ram_ga10b.h>
int ga10b_ramfc_setup(struct nvgpu_channel *ch, u64 gpfifo_base,
u32 gpfifo_entries, u64 pbdma_acquire_timeout, u32 flags)
{
struct gk20a *g = ch->g;
struct nvgpu_mem *mem = &ch->inst_block;
u32 data;
u32 engine_id = 0U;
u32 eng_intr_mask = 0U;
u32 eng_intr_vector = 0U;
u32 eng_bitmask = 0U;
(void)flags;
nvgpu_log_fn(g, " ");
/*
* ga10b can have max 3 engines on a runlist and only
* runlist 0 has more than 1 engine(gr0, grcopy0 and grcopy1).
* Since grcopy0 and grcopy1 can't schedule work directly, it
* is always safe to assume that first active engine on runlist
* will trigger pbdma intr notify.
* TODO: Add helper function to get active engine mask for
* runlist - NVGPU-5219
*/
eng_bitmask = ch->runlist->eng_bitmask;
engine_id = nvgpu_safe_sub_u32(
nvgpu_safe_cast_u64_to_u32(nvgpu_ffs(eng_bitmask)), 1U);
nvgpu_memset(g, mem, 0U, 0U, ram_fc_size_val_v());
nvgpu_log_info(g, "%llu %u", pbdma_acquire_timeout,
g->ops.pbdma.acquire_val(pbdma_acquire_timeout));
nvgpu_mem_wr32(g, mem, ram_fc_gp_base_w(),
g->ops.pbdma.get_gp_base(gpfifo_base));
nvgpu_mem_wr32(g, mem, ram_fc_gp_base_hi_w(),
g->ops.pbdma.get_gp_base_hi(gpfifo_base, gpfifo_entries));
nvgpu_mem_wr32(g, mem, ram_fc_signature_w(),
ch->g->ops.pbdma.get_signature(ch->g));
nvgpu_mem_wr32(g, mem, ram_fc_pb_header_w(),
g->ops.pbdma.get_fc_pb_header());
nvgpu_mem_wr32(g, mem, ram_fc_subdevice_w(),
g->ops.pbdma.get_fc_subdevice());
nvgpu_mem_wr32(g, mem, ram_fc_target_w(),
g->ops.pbdma.get_fc_target(
nvgpu_engine_get_active_eng_info(g, engine_id)));
nvgpu_mem_wr32(g, mem, ram_fc_acquire_w(),
g->ops.pbdma.acquire_val(pbdma_acquire_timeout));
data = nvgpu_mem_rd32(g, mem, ram_fc_set_channel_info_w());
data = data | (g->ops.pbdma.set_channel_info_veid(ch->subctx_id) |
g->ops.pbdma.set_channel_info_chid(ch->chid));
nvgpu_mem_wr32(g, mem, ram_fc_set_channel_info_w(), data);
nvgpu_mem_wr32(g, mem, ram_in_engine_wfi_veid_w(),
ram_in_engine_wfi_veid_f(ch->subctx_id));
/* get engine interrupt vector */
eng_intr_mask = nvgpu_engine_act_interrupt_mask(g, engine_id);
eng_intr_vector = nvgpu_safe_sub_u32(
nvgpu_safe_cast_u64_to_u32(nvgpu_ffs(eng_intr_mask)), 1U);
/*
* engine_intr_vector can be value between 0 and 255.
* For example, engine_intr_vector x translates to subtree x/64,
* leaf (x % 64)/32 and leaf entry interrupt bit(x % 64)%32.
* ga10b engine_intr_vectors are 0,1,2,3,4,5. They map to
* subtree_0 and leaf_0(Engine non-stall interrupts) interrupt
* bits.
*/
data = g->ops.pbdma.set_intr_notify(eng_intr_vector);
nvgpu_mem_wr32(g, mem, ram_fc_intr_notify_w(), data);
if (ch->is_privileged_channel) {
/* Set privilege level for channel */
nvgpu_mem_wr32(g, mem, ram_fc_config_w(),
g->ops.pbdma.get_config_auth_level_privileged());
/* Enable HCE priv mode for phys mode transfer */
nvgpu_mem_wr32(g, mem, ram_fc_hce_ctrl_w(),
g->ops.pbdma.get_ctrl_hce_priv_mode_yes());
}
/* Enable userd writeback */
data = nvgpu_mem_rd32(g, mem, ram_fc_config_w());
data = g->ops.pbdma.config_userd_writeback_enable(data);
nvgpu_mem_wr32(g, mem, ram_fc_config_w(), data);
return 0;
}
void ga10b_ramfc_capture_ram_dump_1(struct gk20a *g,
struct nvgpu_channel *ch, struct nvgpu_channel_dump_info *info)
{
struct nvgpu_mem *mem = &ch->inst_block;
info->inst.pb_top_level_get = nvgpu_mem_rd32_pair(g, mem,
ram_fc_pb_top_level_get_w(),
ram_fc_pb_top_level_get_hi_w());
}
void ga10b_ramfc_capture_ram_dump_2(struct gk20a *g,
struct nvgpu_channel *ch, struct nvgpu_channel_dump_info *info)
{
struct nvgpu_mem *mem = &ch->inst_block;
info->inst.pb_put = nvgpu_mem_rd32_pair(g, mem,
ram_fc_pb_put_w(),
ram_fc_pb_put_hi_w());
info->inst.pb_get = nvgpu_mem_rd32_pair(g, mem,
ram_fc_pb_get_w(),
ram_fc_pb_get_hi_w());
info->inst.pb_header = nvgpu_mem_rd32(g, mem,
ram_fc_pb_header_w());
info->inst.pb_count = nvgpu_mem_rd32(g, mem,
ram_fc_pb_count_w());
info->inst.sem_addr = nvgpu_mem_rd32_pair(g, mem,
ram_fc_sem_addr_lo_w(),
ram_fc_sem_addr_hi_w());
info->inst.sem_payload = nvgpu_mem_rd32_pair(g, mem,
ram_fc_sem_payload_lo_w(),
ram_fc_sem_payload_hi_w());
info->inst.sem_execute = nvgpu_mem_rd32(g, mem,
ram_fc_sem_execute_w());
}
void ga10b_ramfc_capture_ram_dump(struct gk20a *g, struct nvgpu_channel *ch,
struct nvgpu_channel_dump_info *info)
{
ga10b_ramfc_capture_ram_dump_1(g, ch, info);
ga10b_ramfc_capture_ram_dump_2(g, ch, info);
}