gpu: nvgpu: simplify gmmu map calls

Introduce nvgpu_gmmu_map_partial() to map a specific size of a buffer
represented by nvgpu_mem, or what nvgpu_gmmu_map() used to do. Delete
the size parameter from nvgpu_gmmu_map() such that it now maps the
entire buffer. The separate size parameter is a historical artifact from
when nvgpu_mem did not exist yet; the typical use is to map the entire
buffer.

Mapping at a certain address with nvgpu_gmmu_map_fixed() still takes the
size parameter.

The returned address still has to be stored somewhere, typically to
mem.gpu_va by the caller so that the matching unmap variant finds the
right address.

Change-Id: I7d67a0b15d741c6bcee1aecff1678e3216cc28d2
Signed-off-by: Konsta Hölttä <kholtta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/c/linux-nvgpu/+/2601788
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svc-mobile-misra <svc-mobile-misra@nvidia.com>
Reviewed-by: svc-mobile-cert <svc-mobile-cert@nvidia.com>
Reviewed-by: svcacv <svcacv@nvidia.com>
Reviewed-by: Alex Waterman <alexw@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
GVS: Gerrit_Virtual_Submit
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
This commit is contained in:
Konsta Hölttä
2021-09-28 09:24:17 +03:00
committed by mobile promotions
parent 6d38ae76ce
commit 1b1d183b9c
15 changed files with 50 additions and 24 deletions

View File

@@ -87,7 +87,6 @@ int nvgpu_gr_ctx_alloc(struct gk20a *g,
gr_ctx->mem.gpu_va = nvgpu_gmmu_map(vm, gr_ctx->mem.gpu_va = nvgpu_gmmu_map(vm,
&gr_ctx->mem, &gr_ctx->mem,
gr_ctx->mem.size,
0, /* not GPU-cacheable */ 0, /* not GPU-cacheable */
gk20a_mem_flag_none, true, gk20a_mem_flag_none, true,
gr_ctx->mem.aperture); gr_ctx->mem.aperture);
@@ -802,7 +801,7 @@ static int nvgpu_gr_ctx_alloc_ctxsw_buffer(struct vm_gk20a *vm, size_t size,
return err; return err;
} }
mem->gpu_va = nvgpu_gmmu_map(vm, mem->gpu_va = nvgpu_gmmu_map_partial(vm,
mem, mem,
mem->aligned_size, mem->aligned_size,
NVGPU_VM_MAP_CACHEABLE, NVGPU_VM_MAP_CACHEABLE,
@@ -1004,7 +1003,6 @@ int nvgpu_gr_ctx_alloc_pm_ctx(struct gk20a *g,
pm_ctx->mem.gpu_va = nvgpu_gmmu_map(vm, pm_ctx->mem.gpu_va = nvgpu_gmmu_map(vm,
&pm_ctx->mem, &pm_ctx->mem,
pm_ctx->mem.size,
NVGPU_VM_MAP_CACHEABLE, NVGPU_VM_MAP_CACHEABLE,
gk20a_mem_flag_none, true, gk20a_mem_flag_none, true,
pm_ctx->mem.aperture); pm_ctx->mem.aperture);

View File

@@ -326,7 +326,7 @@ u64 nvgpu_gr_global_ctx_buffer_map(struct nvgpu_gr_global_ctx_buffer_desc *desc,
return 0; return 0;
} }
gpu_va = nvgpu_gmmu_map(vm, &desc[index].mem, desc[index].mem.size, gpu_va = nvgpu_gmmu_map(vm, &desc[index].mem,
flags, gk20a_mem_flag_none, priv, flags, gk20a_mem_flag_none, priv,
desc[index].mem.aperture); desc[index].mem.aperture);
return gpu_va; return gpu_va;

View File

@@ -225,7 +225,6 @@ static int nvgpu_gr_falcon_init_ctxsw_ucode_vaspace(struct gk20a *g,
/* Map ucode surface to GMMU */ /* Map ucode surface to GMMU */
ucode_info->surface_desc.gpu_va = nvgpu_gmmu_map(vm, ucode_info->surface_desc.gpu_va = nvgpu_gmmu_map(vm,
&ucode_info->surface_desc, &ucode_info->surface_desc,
ucode_info->surface_desc.size,
0, /* flags */ 0, /* flags */
gk20a_mem_flag_read_only, gk20a_mem_flag_read_only,
false, false,

View File

@@ -51,7 +51,6 @@ struct nvgpu_gr_subctx *nvgpu_gr_subctx_alloc(struct gk20a *g,
subctx->ctx_header.gpu_va = nvgpu_gmmu_map(vm, subctx->ctx_header.gpu_va = nvgpu_gmmu_map(vm,
&subctx->ctx_header, &subctx->ctx_header,
subctx->ctx_header.size,
0, /* not GPU-cacheable */ 0, /* not GPU-cacheable */
gk20a_mem_flag_none, true, gk20a_mem_flag_none, true,
subctx->ctx_header.aperture); subctx->ctx_header.aperture);

View File

@@ -158,7 +158,7 @@ int nvgpu_dma_alloc_map_flags_sys(struct vm_gk20a *vm, unsigned long flags,
return err; return err;
} }
mem->gpu_va = nvgpu_gmmu_map(vm, mem, size, 0, mem->gpu_va = nvgpu_gmmu_map(vm, mem, 0,
gk20a_mem_flag_none, false, gk20a_mem_flag_none, false,
mem->aperture); mem->aperture);
if (mem->gpu_va == 0ULL) { if (mem->gpu_va == 0ULL) {
@@ -190,7 +190,7 @@ int nvgpu_dma_alloc_map_flags_vid(struct vm_gk20a *vm, unsigned long flags,
return err; return err;
} }
mem->gpu_va = nvgpu_gmmu_map(vm, mem, size, 0, mem->gpu_va = nvgpu_gmmu_map(vm, mem, 0,
gk20a_mem_flag_none, false, gk20a_mem_flag_none, false,
mem->aperture); mem->aperture);
if (mem->gpu_va == 0ULL) { if (mem->gpu_va == 0ULL) {

View File

@@ -131,7 +131,7 @@ static u64 nvgpu_gmmu_map_core(struct vm_gk20a *vm,
/* /*
* Map a nvgpu_mem into the GMMU. This is for kernel space to use. * Map a nvgpu_mem into the GMMU. This is for kernel space to use.
*/ */
u64 nvgpu_gmmu_map(struct vm_gk20a *vm, u64 nvgpu_gmmu_map_partial(struct vm_gk20a *vm,
struct nvgpu_mem *mem, struct nvgpu_mem *mem,
u64 size, u64 size,
u32 flags, u32 flags,
@@ -143,6 +143,20 @@ u64 nvgpu_gmmu_map(struct vm_gk20a *vm,
aperture); aperture);
} }
/*
* Map a nvgpu_mem into the GMMU. This is for kernel space to use.
*/
u64 nvgpu_gmmu_map(struct vm_gk20a *vm,
struct nvgpu_mem *mem,
u32 flags,
enum gk20a_mem_rw_flag rw_flag,
bool priv,
enum nvgpu_aperture aperture)
{
return nvgpu_gmmu_map_core(vm, mem, 0, mem->size, flags, rw_flag, priv,
aperture);
}
/* /*
* Like nvgpu_gmmu_map() except this can work on a fixed address. * Like nvgpu_gmmu_map() except this can work on a fixed address.
*/ */

View File

@@ -135,7 +135,7 @@ int nvgpu_semaphore_pool_map(struct nvgpu_semaphore_pool *p,
goto fail_unmap; goto fail_unmap;
} }
addr = nvgpu_gmmu_map(vm, &p->rw_mem, SZ_4K, 0, addr = nvgpu_gmmu_map_partial(vm, &p->rw_mem, SZ_4K, 0,
gk20a_mem_flag_none, 0, gk20a_mem_flag_none, 0,
p->rw_mem.aperture); p->rw_mem.aperture);

View File

@@ -42,7 +42,7 @@ static int set_syncpt_ro_map_gpu_va_locked(struct vm_gk20a *vm)
return 0; return 0;
} }
vm->syncpt_ro_map_gpu_va = nvgpu_gmmu_map(vm, vm->syncpt_ro_map_gpu_va = nvgpu_gmmu_map_partial(vm,
&g->syncpt_mem, g->syncpt_unit_size, &g->syncpt_mem, g->syncpt_unit_size,
0, gk20a_mem_flag_read_only, 0, gk20a_mem_flag_read_only,
false, APERTURE_SYSMEM); false, APERTURE_SYSMEM);
@@ -85,7 +85,7 @@ int gv11b_syncpt_alloc_buf(struct nvgpu_channel *c,
return err; return err;
} }
syncpt_buf->gpu_va = nvgpu_gmmu_map(c->vm, syncpt_buf, syncpt_buf->gpu_va = nvgpu_gmmu_map_partial(c->vm, syncpt_buf,
g->syncpt_size, 0, gk20a_mem_flag_none, g->syncpt_size, 0, gk20a_mem_flag_none,
false, APERTURE_SYSMEM); false, APERTURE_SYSMEM);

View File

@@ -281,8 +281,8 @@ int nvgpu_gmmu_init_page_table(struct vm_gk20a *vm);
* context on the GR, CE to access the given virtual address. * context on the GR, CE to access the given virtual address.
* *
* @param vm [in] Pointer to virtual memory structure. * @param vm [in] Pointer to virtual memory structure.
* @param mem [in] Structure for storing the memory informati on. * @param mem [in] The previously allocated buffer to map.
* @param size [in] Size of the buffer in bytes. * @param size [in] Size of the mapping in bytes.
* @param flags [in] Mapping flags. * @param flags [in] Mapping flags.
* - Min: NVGPU_VM_MAP_FIXED_OFFSET * - Min: NVGPU_VM_MAP_FIXED_OFFSET
* - Max: NVGPU_VM_MAP_PLATFORM_ATOMIC * - Max: NVGPU_VM_MAP_PLATFORM_ATOMIC
@@ -311,6 +311,8 @@ int nvgpu_gmmu_init_page_table(struct vm_gk20a *vm);
* Invalidates the GPU TLB, gm20b_fb_tlb_invalidate does the tlb invalidate. * Invalidates the GPU TLB, gm20b_fb_tlb_invalidate does the tlb invalidate.
* Release the VM GMMU lock. * Release the VM GMMU lock.
* *
* Note that mem->gpu_va is not updated.
*
* @return valid GMMU VA start address in case of success. * @return valid GMMU VA start address in case of success.
* @retval 0 in case of all possible failures. * @retval 0 in case of all possible failures.
* Possible Failure cases: * Possible Failure cases:
@@ -320,7 +322,7 @@ int nvgpu_gmmu_init_page_table(struct vm_gk20a *vm);
* - invalid inputs. * - invalid inputs.
* *
*/ */
u64 nvgpu_gmmu_map(struct vm_gk20a *vm, u64 nvgpu_gmmu_map_partial(struct vm_gk20a *vm,
struct nvgpu_mem *mem, struct nvgpu_mem *mem,
u64 size, u64 size,
u32 flags, u32 flags,
@@ -328,6 +330,19 @@ u64 nvgpu_gmmu_map(struct vm_gk20a *vm,
bool priv, bool priv,
enum nvgpu_aperture aperture); enum nvgpu_aperture aperture);
/**
* @brief Map a whole buffer into the GMMU.
*
* This is like nvgpu_gmmu_map_partial() but with the full requested size of
* the buffer in nvgpu_mem.size.
*/
u64 nvgpu_gmmu_map(struct vm_gk20a *vm,
struct nvgpu_mem *mem,
u32 flags,
enum gk20a_mem_rw_flag rw_flag,
bool priv,
enum nvgpu_aperture aperture);
/** /**
* @brief Map memory into the GMMU at a fixed address. This is required to * @brief Map memory into the GMMU at a fixed address. This is required to
* make the parrticular context on the GR, CE to access the given virtual * make the parrticular context on the GR, CE to access the given virtual

View File

@@ -1411,7 +1411,6 @@ static int gk20a_cde_load(struct gk20a_cde_ctx *cde_ctx)
/* map backing store to gpu virtual space */ /* map backing store to gpu virtual space */
vaddr = nvgpu_gmmu_map(ch->vm, &cbc->compbit_store.mem, vaddr = nvgpu_gmmu_map(ch->vm, &cbc->compbit_store.mem,
cbc->compbit_store.mem.size,
NVGPU_VM_MAP_CACHEABLE, NVGPU_VM_MAP_CACHEABLE,
gk20a_mem_flag_read_only, gk20a_mem_flag_read_only,
false, false,

View File

@@ -530,7 +530,7 @@ static int nvgpu_channel_alloc_usermode_buffers(struct nvgpu_channel *c,
} }
c->usermode_gpfifo.gpu_va = nvgpu_gmmu_map(c->vm, &c->usermode_gpfifo, c->usermode_gpfifo.gpu_va = nvgpu_gmmu_map(c->vm, &c->usermode_gpfifo,
c->usermode_gpfifo.size, 0, gk20a_mem_flag_read_only, 0, gk20a_mem_flag_read_only,
false, c->usermode_gpfifo.aperture); false, c->usermode_gpfifo.aperture);
if (c->usermode_gpfifo.gpu_va == 0) { if (c->usermode_gpfifo.gpu_va == 0) {

View File

@@ -406,8 +406,9 @@ nvgpu_get_pte
nvgpu_gmmu_default_big_page_size nvgpu_gmmu_default_big_page_size
nvgpu_gmmu_init_page_table nvgpu_gmmu_init_page_table
nvgpu_gmmu_map nvgpu_gmmu_map
nvgpu_gmmu_map_locked
nvgpu_gmmu_map_fixed nvgpu_gmmu_map_fixed
nvgpu_gmmu_map_locked
nvgpu_gmmu_map_partial
nvgpu_gmmu_unmap nvgpu_gmmu_unmap
nvgpu_gmmu_unmap_addr nvgpu_gmmu_unmap_addr
nvgpu_gmmu_unmap_locked nvgpu_gmmu_unmap_locked

View File

@@ -422,8 +422,9 @@ nvgpu_get_pte
nvgpu_gmmu_default_big_page_size nvgpu_gmmu_default_big_page_size
nvgpu_gmmu_init_page_table nvgpu_gmmu_init_page_table
nvgpu_gmmu_map nvgpu_gmmu_map
nvgpu_gmmu_map_locked
nvgpu_gmmu_map_fixed nvgpu_gmmu_map_fixed
nvgpu_gmmu_map_locked
nvgpu_gmmu_map_partial
nvgpu_gmmu_unmap nvgpu_gmmu_unmap
nvgpu_gmmu_unmap_addr nvgpu_gmmu_unmap_addr
nvgpu_gmmu_unmap_locked nvgpu_gmmu_unmap_locked

View File

@@ -479,7 +479,7 @@ int test_nvgpu_gmmu_map_unmap(struct unit_module *m, struct gk20a *g,
params->flags, params->rw_flag, params->priv, params->flags, params->rw_flag, params->priv,
params->aperture); params->aperture);
} else { } else {
mem.gpu_va = nvgpu_gmmu_map(g->mm.pmu.vm, &mem, mem.size, mem.gpu_va = nvgpu_gmmu_map(g->mm.pmu.vm, &mem,
params->flags, params->rw_flag, params->priv, params->flags, params->rw_flag, params->priv,
params->aperture); params->aperture);
} }
@@ -607,7 +607,7 @@ int test_nvgpu_gmmu_map_unmap_map_fail(struct unit_module *m, struct gk20a *g,
g->ops.fb.tlb_invalidate = hal_fb_tlb_invalidate_fail; g->ops.fb.tlb_invalidate = hal_fb_tlb_invalidate_fail;
} }
mem.gpu_va = nvgpu_gmmu_map(g->mm.pmu.vm, &mem, mem.size, mem.gpu_va = nvgpu_gmmu_map(g->mm.pmu.vm, &mem,
NVGPU_VM_MAP_CACHEABLE, gk20a_mem_flag_none, NVGPU_VM_MAP_CACHEABLE, gk20a_mem_flag_none,
true, APERTURE_SYSMEM); true, APERTURE_SYSMEM);
@@ -656,7 +656,7 @@ int test_nvgpu_gmmu_set_pte(struct unit_module *m, struct gk20a *g, void *args)
p->mm_is_iommuable = params->is_iommuable; p->mm_is_iommuable = params->is_iommuable;
mem.size = TEST_SIZE; mem.size = TEST_SIZE;
mem.cpu_va = (void *) TEST_PA_ADDRESS; mem.cpu_va = (void *) TEST_PA_ADDRESS;
mem.gpu_va = nvgpu_gmmu_map(g->mm.pmu.vm, &mem, mem.size, mem.gpu_va = nvgpu_gmmu_map(g->mm.pmu.vm, &mem,
params->flags, params->rw_flag, params->priv, params->flags, params->rw_flag, params->priv,
params->aperture); params->aperture);
@@ -1053,7 +1053,7 @@ int test_nvgpu_page_table_c1_full(struct unit_module *m, struct gk20a *g,
&test_iommu_sysmem, NULL, vm, mixed_sgt); &test_iommu_sysmem, NULL, vm, mixed_sgt);
} else { } else {
mem[mem_i].gpu_va = nvgpu_gmmu_map(vm, &mem[mem_i], mem[mem_i].gpu_va = nvgpu_gmmu_map(vm, &mem[mem_i],
mem[mem_i].size, NVGPU_VM_MAP_CACHEABLE, NVGPU_VM_MAP_CACHEABLE,
gk20a_mem_flag_none, true, APERTURE_SYSMEM); gk20a_mem_flag_none, true, APERTURE_SYSMEM);
} }

View File

@@ -348,7 +348,7 @@ int test_sync_get_ro_map(struct unit_module *m, struct gk20a *g, void *args)
for (branches = 0U; branches <= F_SYNC_GET_RO_MAP_MAX; branches++) { for (branches = 0U; branches <= F_SYNC_GET_RO_MAP_MAX; branches++) {
if (branches == F_SYNC_GET_RO_MAP_PRE_ALLOCATED) { if (branches == F_SYNC_GET_RO_MAP_PRE_ALLOCATED) {
ch->vm->syncpt_ro_map_gpu_va = nvgpu_gmmu_map(ch->vm, ch->vm->syncpt_ro_map_gpu_va = nvgpu_gmmu_map_partial(ch->vm,
&g->syncpt_mem, g->syncpt_unit_size, &g->syncpt_mem, g->syncpt_unit_size,
0, gk20a_mem_flag_read_only, 0, gk20a_mem_flag_read_only,
false, APERTURE_SYSMEM); false, APERTURE_SYSMEM);