Files
linux-nvgpu/drivers/gpu/nvgpu/common/perf/perfbuf.c
Deepak Nibade 9e94e118fe gpu: nvgpu: ensure pma byte buffer address fits in 32 bits
Right now PMA byte buffer address is allocated in the range of
0x1ffc010000. The register that stores this address is only 32-bit and
there is no corresponding _hi() register, so the address must fit in
32 bits.

Update nvgpu_vm_init() parameters in nvgpu_perfbuf_init_vm() so that a
low_hole of only 4K is used. This allows the address to be allocated
in the range of 0x4000000.

Also map byte buffer before PMA stream buffer so that byte buffer always
gets lower address.

There is only one PMA stream buffer allowed to be mapped right now so
this works for now. But in future multiple buffers can be mapped and this
solution needs to be reworked.

Bug 2510974
Jira NVGPU-5360

Change-Id: Ief1a9ee54d554e3bc13c7a9567934dcbeaefbcc6
Signed-off-by: Deepak Nibade <dnibade@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2418520
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
2020-12-15 14:13:28 -06:00

157 lines
3.9 KiB
C

/*
* Copyright (c) 2018-2020, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include <nvgpu/mm.h>
#include <nvgpu/sizes.h>
#include <nvgpu/perfbuf.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/nvgpu_init.h>
int nvgpu_perfbuf_enable_locked(struct gk20a *g, u64 offset, u32 size)
{
int err;
err = gk20a_busy(g);
if (err != 0) {
nvgpu_err(g, "failed to poweron");
return err;
}
g->ops.perf.membuf_reset_streaming(g);
g->ops.perf.enable_membuf(g, size, offset);
gk20a_idle(g);
return 0;
}
int nvgpu_perfbuf_disable_locked(struct gk20a *g)
{
int err = gk20a_busy(g);
if (err != 0) {
nvgpu_err(g, "failed to poweron");
return err;
}
g->ops.perf.membuf_reset_streaming(g);
g->ops.perf.disable_membuf(g);
gk20a_idle(g);
return 0;
}
int nvgpu_perfbuf_init_inst_block(struct gk20a *g)
{
struct mm_gk20a *mm = &g->mm;
int err;
err = nvgpu_alloc_inst_block(g, &mm->perfbuf.inst_block);
if (err != 0) {
return err;
}
g->ops.mm.init_inst_block(&mm->perfbuf.inst_block, mm->perfbuf.vm, 0);
g->ops.perf.init_inst_block(g, &mm->perfbuf.inst_block);
return 0;
}
int nvgpu_perfbuf_init_vm(struct gk20a *g)
{
struct mm_gk20a *mm = &g->mm;
u32 big_page_size = g->ops.mm.gmmu.get_default_big_page_size();
int err;
mm->perfbuf.vm = nvgpu_vm_init(g, big_page_size, SZ_4K,
nvgpu_safe_sub_u64(NV_MM_DEFAULT_USER_SIZE, SZ_4K),
NV_MM_DEFAULT_KERNEL_SIZE,
false, false, false, "perfbuf");
if (mm->perfbuf.vm == NULL) {
return -ENOMEM;
}
err = g->ops.perfbuf.init_inst_block(g);
if (err != 0) {
nvgpu_vm_put(mm->perfbuf.vm);
return err;
}
return 0;
}
void nvgpu_perfbuf_deinit_inst_block(struct gk20a *g)
{
g->ops.perf.deinit_inst_block(g);
nvgpu_free_inst_block(g, &g->mm.perfbuf.inst_block);
}
void nvgpu_perfbuf_deinit_vm(struct gk20a *g)
{
g->ops.perfbuf.deinit_inst_block(g);
nvgpu_vm_put(g->mm.perfbuf.vm);
}
int nvgpu_perfbuf_update_get_put(struct gk20a *g, u64 bytes_consumed,
u64 *bytes_available, void *cpuva, bool wait,
u64 *put_ptr, bool *overflowed)
{
struct nvgpu_timeout timeout;
int err;
bool update_available_bytes = (bytes_available == NULL) ? false : true;
volatile u32 *available_bytes_va = (u32 *)cpuva;
if (update_available_bytes) {
*available_bytes_va = 0xffffffff;
}
err = g->ops.perf.update_get_put(g, bytes_consumed,
update_available_bytes, put_ptr, overflowed);
if (err != 0) {
return err;
}
if (update_available_bytes && wait) {
err = nvgpu_timeout_init(g, &timeout, 10000, NVGPU_TIMER_CPU_TIMER);
if (err != 0) {
nvgpu_err(g, "nvgpu_timeout_init() failed err=%d", err);
return err;
}
do {
if (*available_bytes_va != 0xffffffff) {
break;
}
nvgpu_msleep(10);
} while (nvgpu_timeout_expired(&timeout) == 0);
if (*available_bytes_va == 0xffffffff) {
return -ETIMEDOUT;
}
*bytes_available = *available_bytes_va;
}
return 0;
}