Files
linux-nvgpu/drivers/gpu/nvgpu/gp106/hal_gp106.c
Thomas Fleury 3d9c33c595 gpu: nvgpu: clk arbiter skeleton
Add clock arbiter skeleton with support of clock sessions,
notifications on clock changes, request numbering, and asynchronous
handling of clock requests. Provides minimum behaviour to allow
unit tests implementation. Actual arbitration and clock settings
will be done separately. For now, dummy arbiter keeps last
requested target mhz. Actual arbiter may move to a lockless
implementation.

Jira DNVGPU-125

Change-Id: I6a8e443fb0d15dc5f1993e7260256d71acddd106
Signed-off-by: Thomas Fleury <tfleury@nvidia.com>
Reviewed-on: http://git-master/r/1223476
(cherry picked from commit cb130825d84e4124d273bd443e2b62d493377461)
Reviewed-on: http://git-master/r/1243105
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
2016-12-27 15:26:51 +05:30

242 lines
6.2 KiB
C

/*
* GP106 HAL interface
*
* Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved.
*
* This program is free software; you can redistribute it and/or modify it
* under the terms and conditions of the GNU General Public License,
* version 2, as published by the Free Software Foundation.
*
* This program is distributed in the hope it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
* more details.
*/
#include <linux/types.h>
#include <linux/printk.h>
#include <linux/types.h>
#include "gk20a/gk20a.h"
#include "gp10b/gr_gp10b.h"
#include "gp10b/mc_gp10b.h"
#include "gp106/ltc_gp106.h"
#include "gp10b/mm_gp10b.h"
#include "gp10b/ce_gp10b.h"
#include "gp106/fifo_gp106.h"
#include "gp106/regops_gp106.h"
#include "gp10b/cde_gp10b.h"
#include "gp106/therm_gp106.h"
#include "gp106/xve_gp106.h"
#include "gp106/bios_gp106.h"
#include "gm20b/gr_gm20b.h"
#include "gm20b/fifo_gm20b.h"
#include "gm20b/pmu_gm20b.h"
#include "gp106/clk_gp106.h"
#include "gp106/clk_arb_gp106.h"
#include "gp106/mm_gp106.h"
#include "gp106/pmu_gp106.h"
#include "gp106/gr_ctx_gp106.h"
#include "gp106/gr_gp106.h"
#include "gp106/fb_gp106.h"
#include "gp106/gp106_gating_reglist.h"
#include "nvgpu_gpuid_t18x.h"
#include "hw_proj_gp106.h"
#include "gk20a/dbg_gpu_gk20a.h"
#include "gk20a/css_gr_gk20a.h"
static struct gpu_ops gp106_ops = {
.clock_gating = {
.slcg_bus_load_gating_prod =
gp106_slcg_bus_load_gating_prod,
.slcg_ce2_load_gating_prod =
gp106_slcg_ce2_load_gating_prod,
.slcg_chiplet_load_gating_prod =
gp106_slcg_chiplet_load_gating_prod,
.slcg_ctxsw_firmware_load_gating_prod =
gp106_slcg_ctxsw_firmware_load_gating_prod,
.slcg_fb_load_gating_prod =
gp106_slcg_fb_load_gating_prod,
.slcg_fifo_load_gating_prod =
gp106_slcg_fifo_load_gating_prod,
.slcg_gr_load_gating_prod =
gr_gp106_slcg_gr_load_gating_prod,
.slcg_ltc_load_gating_prod =
ltc_gp106_slcg_ltc_load_gating_prod,
.slcg_perf_load_gating_prod =
gp106_slcg_perf_load_gating_prod,
.slcg_priring_load_gating_prod =
gp106_slcg_priring_load_gating_prod,
.slcg_pmu_load_gating_prod =
gp106_slcg_pmu_load_gating_prod,
.slcg_therm_load_gating_prod =
gp106_slcg_therm_load_gating_prod,
.slcg_xbar_load_gating_prod =
gp106_slcg_xbar_load_gating_prod,
.blcg_bus_load_gating_prod =
gp106_blcg_bus_load_gating_prod,
.blcg_ce_load_gating_prod =
gp106_blcg_ce_load_gating_prod,
.blcg_fb_load_gating_prod =
gp106_blcg_fb_load_gating_prod,
.blcg_fifo_load_gating_prod =
gp106_blcg_fifo_load_gating_prod,
.blcg_gr_load_gating_prod =
gp106_blcg_gr_load_gating_prod,
.blcg_ltc_load_gating_prod =
gp106_blcg_ltc_load_gating_prod,
.blcg_pmu_load_gating_prod =
gp106_blcg_pmu_load_gating_prod,
.blcg_xbar_load_gating_prod =
gp106_blcg_xbar_load_gating_prod,
.pg_gr_load_gating_prod =
gr_gp106_pg_gr_load_gating_prod,
}
};
static int gp106_get_litter_value(struct gk20a *g, int value)
{
int ret = -EINVAL;
switch (value) {
case GPU_LIT_NUM_GPCS:
ret = proj_scal_litter_num_gpcs_v();
break;
case GPU_LIT_NUM_PES_PER_GPC:
ret = proj_scal_litter_num_pes_per_gpc_v();
break;
case GPU_LIT_NUM_ZCULL_BANKS:
ret = proj_scal_litter_num_zcull_banks_v();
break;
case GPU_LIT_NUM_TPC_PER_GPC:
ret = proj_scal_litter_num_tpc_per_gpc_v();
break;
case GPU_LIT_NUM_FBPS:
ret = proj_scal_litter_num_fbps_v();
break;
case GPU_LIT_GPC_BASE:
ret = proj_gpc_base_v();
break;
case GPU_LIT_GPC_STRIDE:
ret = proj_gpc_stride_v();
break;
case GPU_LIT_GPC_SHARED_BASE:
ret = proj_gpc_shared_base_v();
break;
case GPU_LIT_TPC_IN_GPC_BASE:
ret = proj_tpc_in_gpc_base_v();
break;
case GPU_LIT_TPC_IN_GPC_STRIDE:
ret = proj_tpc_in_gpc_stride_v();
break;
case GPU_LIT_TPC_IN_GPC_SHARED_BASE:
ret = proj_tpc_in_gpc_shared_base_v();
break;
case GPU_LIT_PPC_IN_GPC_BASE:
ret = proj_ppc_in_gpc_base_v();
break;
case GPU_LIT_PPC_IN_GPC_STRIDE:
ret = proj_ppc_in_gpc_stride_v();
break;
case GPU_LIT_PPC_IN_GPC_SHARED_BASE:
ret = proj_ppc_in_gpc_shared_base_v();
break;
case GPU_LIT_ROP_BASE:
ret = proj_rop_base_v();
break;
case GPU_LIT_ROP_STRIDE:
ret = proj_rop_stride_v();
break;
case GPU_LIT_ROP_SHARED_BASE:
ret = proj_rop_shared_base_v();
break;
case GPU_LIT_HOST_NUM_ENGINES:
ret = proj_host_num_engines_v();
break;
case GPU_LIT_HOST_NUM_PBDMA:
ret = proj_host_num_pbdma_v();
break;
case GPU_LIT_LTC_STRIDE:
ret = proj_ltc_stride_v();
break;
case GPU_LIT_LTS_STRIDE:
ret = proj_lts_stride_v();
break;
case GPU_LIT_NUM_FBPAS:
ret = proj_scal_litter_num_fbpas_v();
break;
case GPU_LIT_FBPA_SHARED_BASE:
ret = proj_fbpa_shared_base_v();
break;
case GPU_LIT_FBPA_BASE:
ret = proj_fbpa_base_v();
break;
case GPU_LIT_FBPA_STRIDE:
ret = proj_fbpa_stride_v();
break;
default:
BUG();
break;
}
return ret;
}
int gp106_init_hal(struct gk20a *g)
{
struct gpu_ops *gops = &g->ops;
struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics;
gk20a_dbg_fn("");
*gops = gp106_ops;
gops->privsecurity = 1;
gops->securegpccs = 1;
gops->pmupstate = true;
gp10b_init_mc(gops);
gp106_init_gr(gops);
gp106_init_ltc(gops);
gp106_init_fb(gops);
gp106_init_fifo(gops);
gp10b_init_ce(gops);
gp106_init_gr_ctx(gops);
gp106_init_mm(gops);
gp106_init_pmu_ops(gops);
gk20a_init_debug_ops(gops);
gk20a_init_dbg_session_ops(gops);
gp106_init_clk_ops(gops);
gp106_init_clk_arb_ops(gops);
gp106_init_regops(gops);
gp10b_init_cde_ops(gops);
gk20a_init_tsg_ops(gops);
#if defined(CONFIG_GK20A_CYCLE_STATS)
gk20a_init_css_ops(gops);
#endif
gp106_init_bios(gops);
gp106_init_therm_ops(gops);
gp106_init_xve_ops(gops);
gops->name = "gp10x";
gops->get_litter_value = gp106_get_litter_value;
gops->chip_init_gpu_characteristics = gk20a_init_gpu_characteristics;
gops->gr_ctx.use_dma_for_fw_bootstrap = true;
gops->read_ptimer = gk20a_read_ptimer;
c->twod_class = FERMI_TWOD_A;
c->threed_class = PASCAL_B;
c->compute_class = PASCAL_COMPUTE_B;
c->gpfifo_class = PASCAL_CHANNEL_GPFIFO_A;
c->inline_to_memory_class = KEPLER_INLINE_TO_MEMORY_B;
c->dma_copy_class = PASCAL_DMA_COPY_A;
gk20a_dbg_fn("done");
return 0;
}