Files
linux-nvgpu/drivers/gpu/nvgpu/common/cic/mon/mon_init.c
Tejal Kudav 494dc19ee8 gpu: nvgpu: Err injection utility support
The HSI error injection utility is an on-bench debug and test utility
which can be used by customers and SQA to test end-to-end error
detection and reporting path.
Implement callback function to integrate with this utility and allow
injecting GPU HSI related errors.
As part of callback function hsierrrpt_inj(), invoke the driver's
error-reporting logic which uses the EPD MISC_EC APIs. In future,
we can enhance the callback function to trigger driver's error
handling logic incrementally for different errors.

Bug 3413214

Change-Id: I2d050b6c850d6151b40095f243a6733b4ba74f47
Signed-off-by: Tejal Kudav <tkudav@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2727198
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
2022-07-01 08:11:45 -07:00

137 lines
3.2 KiB
C

/*
* Copyright (c) 2021-2022, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/gk20a.h>
#include <nvgpu/kmem.h>
#include <nvgpu/log.h>
#include <nvgpu/cic_mon.h>
#include "cic_mon_priv.h"
/**
 * nvgpu_cic_mon_setup - allocate the CIC-MON state and attach it to @g.
 *
 * @g: GPU driver context; g->cic_mon is populated on success.
 *
 * If g->cic_mon is already set the call is a no-op. Otherwise a
 * struct nvgpu_cic_mon is obtained from nvgpu_kzalloc() and stored in
 * g->cic_mon. When CONFIG_NVGPU_FSI_ERR_INJECTION is defined, the error
 * injection callback is registered as well; a failure there is logged but
 * does not fail the setup.
 *
 * Return: 0 on success (including the already-initialized case),
 *         -ENOMEM if the allocation fails.
 */
int nvgpu_cic_mon_setup(struct gk20a *g)
{
	struct nvgpu_cic_mon *mon;

	if (g->cic_mon != NULL) {
		cic_dbg(g, "CIC_MON already initialized");
		return 0;
	}

	mon = nvgpu_kzalloc(g, sizeof(*mon));
	if (mon == NULL) {
		nvgpu_err(g, "Failed to allocate memory "
			"for struct nvgpu_cic_mon");
		return -ENOMEM;
	}

	g->cic_mon = mon;

#ifdef CONFIG_NVGPU_FSI_ERR_INJECTION
	{
		/*
		 * Error injection is a debug-only facility: report a
		 * registration failure but carry on with CIC init.
		 */
		int inj_status = nvgpu_cic_mon_reg_errinj_cb(g);

		if (inj_status != 0) {
			nvgpu_err(g,
				"Err inj callback registration failed: %d",
				inj_status);
		}
	}
#endif

	cic_dbg(g, "CIC_MON unit initialization done.");

	return 0;
}
/**
 * nvgpu_cic_mon_init_lut - run the chip-specific CIC-MON initialization.
 *
 * @g: GPU driver context; g->cic_mon must already be set up.
 *
 * When g->ops.cic_mon.init is provided it is invoked with the CIC-MON
 * state. When it is absent, err_lut is set to NULL and num_hw_modules to 0.
 *
 * If the chip-specific hook fails, the CIC-MON state is freed and
 * g->cic_mon is reset to NULL before the error is propagated.
 *
 * Return: 0 on success, -EINVAL if g->cic_mon is NULL, or the non-zero
 *         value returned by the chip-specific init hook.
 */
int nvgpu_cic_mon_init_lut(struct gk20a *g)
{
	struct nvgpu_cic_mon *mon = g->cic_mon;
	int status;

	if (mon == NULL) {
		nvgpu_err(g, "CIC_MON setup pending");
		return -EINVAL;
	}

	/* No chip hook: leave the unit with an empty lookup table. */
	if (g->ops.cic_mon.init == NULL) {
		mon->err_lut = NULL;
		mon->num_hw_modules = 0;
		return 0;
	}

	status = g->ops.cic_mon.init(g, mon);
	if (status == 0) {
		return 0;
	}

	nvgpu_err(g, "CIC MON chip specific "
		"initialization failed.");

	/* mon is known to be non-NULL here; tear the unit down. */
	nvgpu_kfree(g, mon);
	g->cic_mon = NULL;

	return status;
}
/**
 * nvgpu_cic_mon_remove - free the CIC-MON state attached to @g.
 *
 * @g: GPU driver context.
 *
 * Frees g->cic_mon with nvgpu_kfree() and resets the pointer to NULL.
 * Calling it when g->cic_mon is already NULL only emits a debug message.
 *
 * NOTE(review): the error injection callback registered in
 * nvgpu_cic_mon_setup() is not deregistered here - confirm whether a
 * matching deregistration is required.
 *
 * Return: always 0.
 */
int nvgpu_cic_mon_remove(struct gk20a *g)
{
	struct nvgpu_cic_mon *mon = g->cic_mon;

	if (mon != NULL) {
		nvgpu_kfree(g, mon);
		g->cic_mon = NULL;
	} else {
		cic_dbg(g, "CIC_MON already removed");
	}

	return 0;
}
/**
 * nvgpu_cic_mon_deinit_lut - detach the lookup table from the CIC-MON state.
 *
 * @g: GPU driver context.
 *
 * Sets err_lut to NULL and num_hw_modules to 0. Nothing is freed here.
 * If g->cic_mon is NULL only a debug message is emitted.
 *
 * Return: always 0.
 */
int nvgpu_cic_mon_deinit_lut(struct gk20a *g)
{
	struct nvgpu_cic_mon *mon = g->cic_mon;

	if (mon != NULL) {
		mon->num_hw_modules = 0;
		mon->err_lut = NULL;
	} else {
		cic_dbg(g, "CIC_MON and LUT removed");
	}

	return 0;
}
/**
 * nvgpu_cic_mon_deinit - top-level CIC-MON deinitialization entry point.
 *
 * @g: GPU driver context.
 *
 * Currently this only forwards to nvgpu_cic_mon_deinit_lut().
 *
 * Return: the value returned by nvgpu_cic_mon_deinit_lut().
 */
int nvgpu_cic_mon_deinit(struct gk20a *g)
{
	int status;

	/** More deinit calls might get added here as CIC grows. */
	status = nvgpu_cic_mon_deinit_lut(g);

	return status;
}