mirror of
git://nv-tegra.nvidia.com/linux-nvgpu.git
synced 2025-12-23 09:57:08 +03:00
Add virtualized support for NUM_VSMS and VSMS_MAPPING ioctls. This requires adding an attribute request for the RM server, GPC0_TPC_COUNT JIRASW EVLR-253 Change-Id: Icaab4fadbbc9eab5d00cf78132928686944162df Signed-off-by: Peter Daifuku <pdaifuku@nvidia.com> Reviewed-on: http://git-master/r/1130615 (cherry picked from commit 78514079382b0de48457db340e3479e99a012040) Reviewed-on: http://git-master/r/1133865 (cherry picked from commit 27a8e645e2787a43d0073f0be6e8f64c0f183228) Reviewed-on: http://git-master/r/1122553 GVS: Gerrit_Virtual_Submit Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
80 lines
2.1 KiB
C
80 lines
2.1 KiB
C
/*
|
|
* Copyright (c) 2015-2016, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms and conditions of the GNU General Public License,
|
|
* version 2, as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*/
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include "gk20a/hw_gr_gk20a.h"
|
|
#include "gk20a/gk20a.h"
|
|
#include "vgpu/vgpu.h"
|
|
#include "vgpu_gr_gk20a.h"
|
|
|
|
static void vgpu_gk20a_detect_sm_arch(struct gk20a *g)
|
|
{
|
|
struct gk20a_platform *platform = gk20a_get_platform(g->dev);
|
|
u32 v = 0, raw_version, version = 0;
|
|
|
|
gk20a_dbg_fn("");
|
|
|
|
if (vgpu_get_attribute(platform->virt_handle,
|
|
TEGRA_VGPU_ATTRIB_GPC0_TPC0_SM_ARCH, &v))
|
|
gk20a_err(dev_from_gk20a(g), "failed to retrieve SM arch");
|
|
|
|
raw_version = gr_gpc0_tpc0_sm_arch_spa_version_v(v);
|
|
|
|
if (raw_version == gr_gpc0_tpc0_sm_arch_spa_version_smkepler_lp_v())
|
|
version = 0x320; /* SM 3.2 */
|
|
else
|
|
gk20a_err(dev_from_gk20a(g), "Unknown SM version 0x%x",
|
|
raw_version);
|
|
|
|
/* on Kepler, SM version == SPA version */
|
|
g->gpu_characteristics.sm_arch_spa_version = version;
|
|
g->gpu_characteristics.sm_arch_sm_version = version;
|
|
|
|
g->gpu_characteristics.sm_arch_warp_count =
|
|
gr_gpc0_tpc0_sm_arch_warp_count_v(v);
|
|
}
|
|
|
|
static int vgpu_gk20a_init_fs_state(struct gk20a *g)
|
|
{
|
|
struct gr_gk20a *gr = &g->gr;
|
|
u32 tpc_index, gpc_index;
|
|
u32 sm_id = 0;
|
|
|
|
gk20a_dbg_fn("");
|
|
|
|
for (tpc_index = 0; tpc_index < gr->max_tpc_per_gpc_count;
|
|
tpc_index++) {
|
|
for (gpc_index = 0; gpc_index < gr->gpc_count; gpc_index++) {
|
|
if (tpc_index < gr->gpc_tpc_count[gpc_index]) {
|
|
g->gr.sm_to_cluster[sm_id].tpc_index =
|
|
tpc_index;
|
|
g->gr.sm_to_cluster[sm_id].gpc_index =
|
|
gpc_index;
|
|
|
|
sm_id++;
|
|
}
|
|
}
|
|
}
|
|
|
|
gr->no_of_sm = sm_id;
|
|
|
|
return 0;
|
|
}
|
|
|
|
void vgpu_gk20a_init_gr_ops(struct gpu_ops *gops)
|
|
{
|
|
gops->gr.detect_sm_arch = vgpu_gk20a_detect_sm_arch;
|
|
gops->gr.init_fs_state = vgpu_gk20a_init_fs_state;
|
|
}
|