mirror of
git://nv-tegra.nvidia.com/linux-nvgpu.git
synced 2025-12-24 10:34:43 +03:00
Add clock arbiter skeleton with support of clock sessions, notifications on clock changes, request numbering, and asynchronous handling of clock requests. Provides minimum behaviour to allow unit tests implementation. Actual arbitration and clock settings will be done separately. For now, dummy arbiter keeps last requested target mhz. Actual arbiter may move to a lockless implementation. Jira DNVGPU-125 Change-Id: I6a8e443fb0d15dc5f1993e7260256d71acddd106 Signed-off-by: Thomas Fleury <tfleury@nvidia.com> Reviewed-on: http://git-master/r/1223476 (cherry picked from commit cb130825d84e4124d273bd443e2b62d493377461) Reviewed-on: http://git-master/r/1243105 GVS: Gerrit_Virtual_Submit Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
242 lines
6.2 KiB
C
242 lines
6.2 KiB
C
/*
|
|
* GP106 HAL interface
|
|
*
|
|
* Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms and conditions of the GNU General Public License,
|
|
* version 2, as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*/
|
|
|
|
#include <linux/types.h>
|
|
#include <linux/printk.h>
|
|
|
|
#include <linux/types.h>
|
|
|
|
#include "gk20a/gk20a.h"
|
|
|
|
#include "gp10b/gr_gp10b.h"
|
|
#include "gp10b/mc_gp10b.h"
|
|
#include "gp106/ltc_gp106.h"
|
|
#include "gp10b/mm_gp10b.h"
|
|
#include "gp10b/ce_gp10b.h"
|
|
#include "gp106/fifo_gp106.h"
|
|
#include "gp106/regops_gp106.h"
|
|
#include "gp10b/cde_gp10b.h"
|
|
#include "gp106/therm_gp106.h"
|
|
#include "gp106/xve_gp106.h"
|
|
|
|
#include "gp106/bios_gp106.h"
|
|
|
|
#include "gm20b/gr_gm20b.h"
|
|
#include "gm20b/fifo_gm20b.h"
|
|
#include "gm20b/pmu_gm20b.h"
|
|
#include "gp106/clk_gp106.h"
|
|
#include "gp106/clk_arb_gp106.h"
|
|
|
|
#include "gp106/mm_gp106.h"
|
|
#include "gp106/pmu_gp106.h"
|
|
#include "gp106/gr_ctx_gp106.h"
|
|
#include "gp106/gr_gp106.h"
|
|
#include "gp106/fb_gp106.h"
|
|
#include "gp106/gp106_gating_reglist.h"
|
|
#include "nvgpu_gpuid_t18x.h"
|
|
#include "hw_proj_gp106.h"
|
|
#include "gk20a/dbg_gpu_gk20a.h"
|
|
#include "gk20a/css_gr_gk20a.h"
|
|
|
|
static struct gpu_ops gp106_ops = {
|
|
.clock_gating = {
|
|
.slcg_bus_load_gating_prod =
|
|
gp106_slcg_bus_load_gating_prod,
|
|
.slcg_ce2_load_gating_prod =
|
|
gp106_slcg_ce2_load_gating_prod,
|
|
.slcg_chiplet_load_gating_prod =
|
|
gp106_slcg_chiplet_load_gating_prod,
|
|
.slcg_ctxsw_firmware_load_gating_prod =
|
|
gp106_slcg_ctxsw_firmware_load_gating_prod,
|
|
.slcg_fb_load_gating_prod =
|
|
gp106_slcg_fb_load_gating_prod,
|
|
.slcg_fifo_load_gating_prod =
|
|
gp106_slcg_fifo_load_gating_prod,
|
|
.slcg_gr_load_gating_prod =
|
|
gr_gp106_slcg_gr_load_gating_prod,
|
|
.slcg_ltc_load_gating_prod =
|
|
ltc_gp106_slcg_ltc_load_gating_prod,
|
|
.slcg_perf_load_gating_prod =
|
|
gp106_slcg_perf_load_gating_prod,
|
|
.slcg_priring_load_gating_prod =
|
|
gp106_slcg_priring_load_gating_prod,
|
|
.slcg_pmu_load_gating_prod =
|
|
gp106_slcg_pmu_load_gating_prod,
|
|
.slcg_therm_load_gating_prod =
|
|
gp106_slcg_therm_load_gating_prod,
|
|
.slcg_xbar_load_gating_prod =
|
|
gp106_slcg_xbar_load_gating_prod,
|
|
.blcg_bus_load_gating_prod =
|
|
gp106_blcg_bus_load_gating_prod,
|
|
.blcg_ce_load_gating_prod =
|
|
gp106_blcg_ce_load_gating_prod,
|
|
.blcg_fb_load_gating_prod =
|
|
gp106_blcg_fb_load_gating_prod,
|
|
.blcg_fifo_load_gating_prod =
|
|
gp106_blcg_fifo_load_gating_prod,
|
|
.blcg_gr_load_gating_prod =
|
|
gp106_blcg_gr_load_gating_prod,
|
|
.blcg_ltc_load_gating_prod =
|
|
gp106_blcg_ltc_load_gating_prod,
|
|
.blcg_pmu_load_gating_prod =
|
|
gp106_blcg_pmu_load_gating_prod,
|
|
.blcg_xbar_load_gating_prod =
|
|
gp106_blcg_xbar_load_gating_prod,
|
|
.pg_gr_load_gating_prod =
|
|
gr_gp106_pg_gr_load_gating_prod,
|
|
}
|
|
};
|
|
|
|
static int gp106_get_litter_value(struct gk20a *g, int value)
|
|
{
|
|
int ret = -EINVAL;
|
|
|
|
switch (value) {
|
|
case GPU_LIT_NUM_GPCS:
|
|
ret = proj_scal_litter_num_gpcs_v();
|
|
break;
|
|
case GPU_LIT_NUM_PES_PER_GPC:
|
|
ret = proj_scal_litter_num_pes_per_gpc_v();
|
|
break;
|
|
case GPU_LIT_NUM_ZCULL_BANKS:
|
|
ret = proj_scal_litter_num_zcull_banks_v();
|
|
break;
|
|
case GPU_LIT_NUM_TPC_PER_GPC:
|
|
ret = proj_scal_litter_num_tpc_per_gpc_v();
|
|
break;
|
|
case GPU_LIT_NUM_FBPS:
|
|
ret = proj_scal_litter_num_fbps_v();
|
|
break;
|
|
case GPU_LIT_GPC_BASE:
|
|
ret = proj_gpc_base_v();
|
|
break;
|
|
case GPU_LIT_GPC_STRIDE:
|
|
ret = proj_gpc_stride_v();
|
|
break;
|
|
case GPU_LIT_GPC_SHARED_BASE:
|
|
ret = proj_gpc_shared_base_v();
|
|
break;
|
|
case GPU_LIT_TPC_IN_GPC_BASE:
|
|
ret = proj_tpc_in_gpc_base_v();
|
|
break;
|
|
case GPU_LIT_TPC_IN_GPC_STRIDE:
|
|
ret = proj_tpc_in_gpc_stride_v();
|
|
break;
|
|
case GPU_LIT_TPC_IN_GPC_SHARED_BASE:
|
|
ret = proj_tpc_in_gpc_shared_base_v();
|
|
break;
|
|
case GPU_LIT_PPC_IN_GPC_BASE:
|
|
ret = proj_ppc_in_gpc_base_v();
|
|
break;
|
|
case GPU_LIT_PPC_IN_GPC_STRIDE:
|
|
ret = proj_ppc_in_gpc_stride_v();
|
|
break;
|
|
case GPU_LIT_PPC_IN_GPC_SHARED_BASE:
|
|
ret = proj_ppc_in_gpc_shared_base_v();
|
|
break;
|
|
case GPU_LIT_ROP_BASE:
|
|
ret = proj_rop_base_v();
|
|
break;
|
|
case GPU_LIT_ROP_STRIDE:
|
|
ret = proj_rop_stride_v();
|
|
break;
|
|
case GPU_LIT_ROP_SHARED_BASE:
|
|
ret = proj_rop_shared_base_v();
|
|
break;
|
|
case GPU_LIT_HOST_NUM_ENGINES:
|
|
ret = proj_host_num_engines_v();
|
|
break;
|
|
case GPU_LIT_HOST_NUM_PBDMA:
|
|
ret = proj_host_num_pbdma_v();
|
|
break;
|
|
case GPU_LIT_LTC_STRIDE:
|
|
ret = proj_ltc_stride_v();
|
|
break;
|
|
case GPU_LIT_LTS_STRIDE:
|
|
ret = proj_lts_stride_v();
|
|
break;
|
|
case GPU_LIT_NUM_FBPAS:
|
|
ret = proj_scal_litter_num_fbpas_v();
|
|
break;
|
|
case GPU_LIT_FBPA_SHARED_BASE:
|
|
ret = proj_fbpa_shared_base_v();
|
|
break;
|
|
case GPU_LIT_FBPA_BASE:
|
|
ret = proj_fbpa_base_v();
|
|
break;
|
|
case GPU_LIT_FBPA_STRIDE:
|
|
ret = proj_fbpa_stride_v();
|
|
break;
|
|
default:
|
|
BUG();
|
|
break;
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
int gp106_init_hal(struct gk20a *g)
|
|
{
|
|
struct gpu_ops *gops = &g->ops;
|
|
struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics;
|
|
|
|
gk20a_dbg_fn("");
|
|
|
|
*gops = gp106_ops;
|
|
|
|
gops->privsecurity = 1;
|
|
gops->securegpccs = 1;
|
|
gops->pmupstate = true;
|
|
gp10b_init_mc(gops);
|
|
gp106_init_gr(gops);
|
|
gp106_init_ltc(gops);
|
|
gp106_init_fb(gops);
|
|
gp106_init_fifo(gops);
|
|
gp10b_init_ce(gops);
|
|
gp106_init_gr_ctx(gops);
|
|
gp106_init_mm(gops);
|
|
gp106_init_pmu_ops(gops);
|
|
gk20a_init_debug_ops(gops);
|
|
gk20a_init_dbg_session_ops(gops);
|
|
gp106_init_clk_ops(gops);
|
|
gp106_init_clk_arb_ops(gops);
|
|
gp106_init_regops(gops);
|
|
gp10b_init_cde_ops(gops);
|
|
gk20a_init_tsg_ops(gops);
|
|
#if defined(CONFIG_GK20A_CYCLE_STATS)
|
|
gk20a_init_css_ops(gops);
|
|
#endif
|
|
gp106_init_bios(gops);
|
|
gp106_init_therm_ops(gops);
|
|
gp106_init_xve_ops(gops);
|
|
|
|
gops->name = "gp10x";
|
|
gops->get_litter_value = gp106_get_litter_value;
|
|
gops->chip_init_gpu_characteristics = gk20a_init_gpu_characteristics;
|
|
gops->gr_ctx.use_dma_for_fw_bootstrap = true;
|
|
gops->read_ptimer = gk20a_read_ptimer;
|
|
|
|
c->twod_class = FERMI_TWOD_A;
|
|
c->threed_class = PASCAL_B;
|
|
c->compute_class = PASCAL_COMPUTE_B;
|
|
c->gpfifo_class = PASCAL_CHANNEL_GPFIFO_A;
|
|
c->inline_to_memory_class = KEPLER_INLINE_TO_MEMORY_B;
|
|
c->dma_copy_class = PASCAL_DMA_COPY_A;
|
|
|
|
gk20a_dbg_fn("done");
|
|
|
|
return 0;
|
|
}
|