mirror of
git://nv-tegra.nvidia.com/linux-nvgpu.git
synced 2025-12-22 17:36:20 +03:00
gk20a_busy() call in channel_syncpt_incr() and corresponding gk20a_idle() call in channel_update() are redundant since they are already encapsulated inside another pair of busy/idle calls This busy/idle pair will be called only from submit_gpfifo() and submit_gpfifo() already has its own busy/idle which it preserves for whole path and hence this redundant pair can be removed Also, this prevents a dead lock scenario while do_idle() is in progress as follows : - in submit_gpfifo() we call first gk20a_busy() which acquires busy read semaphore - in do_idle() we acquire busy write semaphore and wait for current jobs to finish - now submit_gpfifo() encounters second gk20a_busy() and requests busy read semaphore again - this results in dead lock where do_idle() is waiting for submit_gpfifo() to complete and submit_gpfifo() is waiting for busy lock held by do_idle() and hence it cannot complete bug 1529160 Change-Id: I96e4368352f693e93524f0f61689b4447e5331ea Signed-off-by: Deepak Nibade <dnibade@nvidia.com> Reviewed-on: http://git-master/r/434191 (cherry picked from commit c4315c6caa42bab72ba6017c7ded25f4e9363dec) Reviewed-on: http://git-master/r/435132 Reviewed-by: Sachin Nikam <snikam@nvidia.com> Tested-by: Sachin Nikam <snikam@nvidia.com>
791 lines
20 KiB
C
791 lines
20 KiB
C
/*
|
|
* drivers/video/tegra/host/gk20a/channel_sync_gk20a.c
|
|
*
|
|
* GK20A Channel Synchronization Abstraction
|
|
*
|
|
* Copyright (c) 2014, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms and conditions of the GNU General Public License,
|
|
* version 2, as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*/
|
|
|
|
#include <linux/gk20a.h>
|
|
|
|
#include "channel_sync_gk20a.h"
|
|
#include "gk20a.h"
|
|
#include "semaphore_gk20a.h"
|
|
#include "sync_gk20a.h"
|
|
#include "mm_gk20a.h"
|
|
|
|
#ifdef CONFIG_SYNC
|
|
#include "../../../staging/android/sync.h"
|
|
#endif
|
|
|
|
#ifdef CONFIG_TEGRA_GK20A
|
|
#include <linux/nvhost.h>
|
|
#endif
|
|
|
|
#ifdef CONFIG_TEGRA_GK20A
|
|
|
|
struct gk20a_channel_syncpt {
|
|
struct gk20a_channel_sync ops;
|
|
struct channel_gk20a *c;
|
|
struct platform_device *host1x_pdev;
|
|
u32 id;
|
|
};
|
|
|
|
static void add_wait_cmd(u32 *ptr, u32 id, u32 thresh)
|
|
{
|
|
/* syncpoint_a */
|
|
ptr[0] = 0x2001001C;
|
|
/* payload */
|
|
ptr[1] = thresh;
|
|
/* syncpoint_b */
|
|
ptr[2] = 0x2001001D;
|
|
/* syncpt_id, switch_en, wait */
|
|
ptr[3] = (id << 8) | 0x10;
|
|
}
|
|
|
|
int gk20a_channel_syncpt_wait_cpu(struct gk20a_channel_sync *s,
|
|
struct gk20a_channel_fence *fence,
|
|
int timeout)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
if (!fence->valid)
|
|
return 0;
|
|
return nvhost_syncpt_wait_timeout_ext(
|
|
sp->host1x_pdev, sp->id, fence->thresh,
|
|
timeout, NULL, NULL);
|
|
}
|
|
|
|
bool gk20a_channel_syncpt_is_expired(struct gk20a_channel_sync *s,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
if (!fence->valid)
|
|
return true;
|
|
return nvhost_syncpt_is_expired_ext(sp->host1x_pdev, sp->id,
|
|
fence->thresh);
|
|
}
|
|
|
|
int gk20a_channel_syncpt_wait_syncpt(struct gk20a_channel_sync *s, u32 id,
|
|
u32 thresh, struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
struct priv_cmd_entry *wait_cmd = NULL;
|
|
|
|
if (id >= nvhost_syncpt_nb_pts_ext(sp->host1x_pdev)) {
|
|
dev_warn(dev_from_gk20a(sp->c->g),
|
|
"invalid wait id in gpfifo submit, elided");
|
|
return 0;
|
|
}
|
|
|
|
if (nvhost_syncpt_is_expired_ext(sp->host1x_pdev, id, thresh))
|
|
return 0;
|
|
|
|
gk20a_channel_alloc_priv_cmdbuf(sp->c, 4, &wait_cmd);
|
|
if (wait_cmd == NULL) {
|
|
gk20a_err(dev_from_gk20a(sp->c->g),
|
|
"not enough priv cmd buffer space");
|
|
return -EAGAIN;
|
|
}
|
|
|
|
add_wait_cmd(&wait_cmd->ptr[0], id, thresh);
|
|
|
|
*entry = wait_cmd;
|
|
fence->valid = false;
|
|
return 0;
|
|
}
|
|
|
|
int gk20a_channel_syncpt_wait_fd(struct gk20a_channel_sync *s, int fd,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
#ifdef CONFIG_SYNC
|
|
int i;
|
|
int num_wait_cmds;
|
|
struct sync_pt *pt;
|
|
struct sync_fence *sync_fence;
|
|
struct priv_cmd_entry *wait_cmd = NULL;
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
struct channel_gk20a *c = sp->c;
|
|
|
|
sync_fence = nvhost_sync_fdget(fd);
|
|
if (!sync_fence)
|
|
return -EINVAL;
|
|
|
|
/* validate syncpt ids */
|
|
list_for_each_entry(pt, &sync_fence->pt_list_head, pt_list) {
|
|
u32 wait_id = nvhost_sync_pt_id(pt);
|
|
if (!wait_id ||
|
|
wait_id >= nvhost_syncpt_nb_pts_ext(sp->host1x_pdev)) {
|
|
sync_fence_put(sync_fence);
|
|
return -EINVAL;
|
|
}
|
|
}
|
|
|
|
num_wait_cmds = nvhost_sync_num_pts(sync_fence);
|
|
gk20a_channel_alloc_priv_cmdbuf(c, 4 * num_wait_cmds, &wait_cmd);
|
|
if (wait_cmd == NULL) {
|
|
gk20a_err(dev_from_gk20a(c->g),
|
|
"not enough priv cmd buffer space");
|
|
sync_fence_put(sync_fence);
|
|
return -EAGAIN;
|
|
}
|
|
|
|
i = 0;
|
|
list_for_each_entry(pt, &sync_fence->pt_list_head, pt_list) {
|
|
u32 wait_id = nvhost_sync_pt_id(pt);
|
|
u32 wait_value = nvhost_sync_pt_thresh(pt);
|
|
|
|
if (nvhost_syncpt_is_expired_ext(sp->host1x_pdev,
|
|
wait_id, wait_value)) {
|
|
wait_cmd->ptr[i * 4 + 0] = 0;
|
|
wait_cmd->ptr[i * 4 + 1] = 0;
|
|
wait_cmd->ptr[i * 4 + 2] = 0;
|
|
wait_cmd->ptr[i * 4 + 3] = 0;
|
|
} else
|
|
add_wait_cmd(&wait_cmd->ptr[i * 4], wait_id,
|
|
wait_value);
|
|
i++;
|
|
}
|
|
WARN_ON(i != num_wait_cmds);
|
|
sync_fence_put(sync_fence);
|
|
|
|
*entry = wait_cmd;
|
|
fence->valid = false;
|
|
return 0;
|
|
#else
|
|
return -ENODEV;
|
|
#endif
|
|
}
|
|
|
|
static void gk20a_channel_syncpt_update(void *priv, int nr_completed)
|
|
{
|
|
struct channel_gk20a *ch20a = priv;
|
|
gk20a_channel_update(ch20a, nr_completed);
|
|
}
|
|
|
|
static int __gk20a_channel_syncpt_incr(struct gk20a_channel_sync *s,
|
|
bool gfx_class, bool wfi_cmd,
|
|
bool register_irq,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
u32 thresh;
|
|
int incr_cmd_size;
|
|
int j = 0;
|
|
int err;
|
|
struct priv_cmd_entry *incr_cmd = NULL;
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
struct channel_gk20a *c = sp->c;
|
|
|
|
incr_cmd_size = 4;
|
|
if (wfi_cmd)
|
|
incr_cmd_size += 2;
|
|
|
|
gk20a_channel_alloc_priv_cmdbuf(c, incr_cmd_size, &incr_cmd);
|
|
if (incr_cmd == NULL) {
|
|
gk20a_err(dev_from_gk20a(c->g),
|
|
"not enough priv cmd buffer space");
|
|
return -EAGAIN;
|
|
}
|
|
|
|
if (gfx_class) {
|
|
WARN_ON(wfi_cmd); /* No sense to use gfx class + wfi. */
|
|
/* setobject KEPLER_C */
|
|
incr_cmd->ptr[j++] = 0x20010000;
|
|
incr_cmd->ptr[j++] = KEPLER_C;
|
|
/* syncpt incr */
|
|
incr_cmd->ptr[j++] = 0x200100B2;
|
|
incr_cmd->ptr[j++] = sp->id |
|
|
(0x1 << 20) | (0x1 << 16);
|
|
} else {
|
|
if (wfi_cmd) {
|
|
/* wfi */
|
|
incr_cmd->ptr[j++] = 0x2001001E;
|
|
/* handle, ignored */
|
|
incr_cmd->ptr[j++] = 0x00000000;
|
|
}
|
|
/* syncpoint_a */
|
|
incr_cmd->ptr[j++] = 0x2001001C;
|
|
/* payload, ignored */
|
|
incr_cmd->ptr[j++] = 0;
|
|
/* syncpoint_b */
|
|
incr_cmd->ptr[j++] = 0x2001001D;
|
|
/* syncpt_id, incr */
|
|
incr_cmd->ptr[j++] = (sp->id << 8) | 0x1;
|
|
}
|
|
WARN_ON(j != incr_cmd_size);
|
|
|
|
thresh = nvhost_syncpt_incr_max_ext(sp->host1x_pdev, sp->id, 1);
|
|
|
|
if (register_irq) {
|
|
err = nvhost_intr_register_notifier(sp->host1x_pdev,
|
|
sp->id, thresh,
|
|
gk20a_channel_syncpt_update, c);
|
|
|
|
/* Adding interrupt action should never fail. A proper error
|
|
* handling here would require us to decrement the syncpt max
|
|
* back to its original value. */
|
|
WARN(err, "failed to set submit complete interrupt");
|
|
}
|
|
|
|
fence->thresh = thresh;
|
|
fence->valid = true;
|
|
fence->wfi = wfi_cmd;
|
|
*entry = incr_cmd;
|
|
return 0;
|
|
}
|
|
|
|
int gk20a_channel_syncpt_incr_wfi(struct gk20a_channel_sync *s,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
return __gk20a_channel_syncpt_incr(s,
|
|
false /* use host class */,
|
|
true /* wfi */,
|
|
false /* no irq handler */,
|
|
entry, fence);
|
|
}
|
|
|
|
int gk20a_channel_syncpt_incr(struct gk20a_channel_sync *s,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
/* Don't put wfi cmd to this one since we're not returning
|
|
* a fence to user space. */
|
|
return __gk20a_channel_syncpt_incr(s,
|
|
sp->c->obj_class == KEPLER_C /* may use gfx class */,
|
|
false /* no wfi */,
|
|
true /* register irq */,
|
|
entry, fence);
|
|
}
|
|
|
|
int gk20a_channel_syncpt_incr_user_syncpt(struct gk20a_channel_sync *s,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence,
|
|
bool wfi,
|
|
u32 *id, u32 *thresh)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
/* Need to do 'host incr + wfi' or 'gfx incr' since we return the fence
|
|
* to user space. */
|
|
int err = __gk20a_channel_syncpt_incr(s,
|
|
wfi &&
|
|
sp->c->obj_class == KEPLER_C /* use gfx class? */,
|
|
wfi &&
|
|
sp->c->obj_class != KEPLER_C /* wfi if host class */,
|
|
true /* register irq */,
|
|
entry, fence);
|
|
if (err)
|
|
return err;
|
|
*id = sp->id;
|
|
*thresh = fence->thresh;
|
|
return 0;
|
|
}
|
|
|
|
int gk20a_channel_syncpt_incr_user_fd(struct gk20a_channel_sync *s,
|
|
int wait_fence_fd,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence,
|
|
bool wfi,
|
|
int *fd)
|
|
{
|
|
#ifdef CONFIG_SYNC
|
|
int err;
|
|
struct nvhost_ctrl_sync_fence_info pt;
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
err = gk20a_channel_syncpt_incr_user_syncpt(s, entry, fence, wfi,
|
|
&pt.id, &pt.thresh);
|
|
if (err)
|
|
return err;
|
|
return nvhost_sync_create_fence_fd(sp->host1x_pdev, &pt, 1,
|
|
"fence", fd);
|
|
#else
|
|
return -ENODEV;
|
|
#endif
|
|
}
|
|
|
|
void gk20a_channel_syncpt_set_min_eq_max(struct gk20a_channel_sync *s)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
nvhost_syncpt_set_min_eq_max_ext(sp->host1x_pdev, sp->id);
|
|
}
|
|
|
|
static void gk20a_channel_syncpt_destroy(struct gk20a_channel_sync *s)
|
|
{
|
|
struct gk20a_channel_syncpt *sp =
|
|
container_of(s, struct gk20a_channel_syncpt, ops);
|
|
nvhost_free_syncpt(sp->id);
|
|
kfree(sp);
|
|
}
|
|
|
|
static struct gk20a_channel_sync *
|
|
gk20a_channel_syncpt_create(struct channel_gk20a *c)
|
|
{
|
|
struct gk20a_channel_syncpt *sp;
|
|
|
|
sp = kzalloc(sizeof(*sp), GFP_KERNEL);
|
|
if (!sp)
|
|
return NULL;
|
|
|
|
sp->c = c;
|
|
sp->host1x_pdev = c->g->host1x_dev;
|
|
sp->id = nvhost_get_syncpt_host_managed(c->g->dev, c->hw_chid);
|
|
if (!sp->id) {
|
|
kfree(sp);
|
|
gk20a_err(&c->g->dev->dev, "failed to get free syncpt");
|
|
return NULL;
|
|
}
|
|
|
|
sp->ops.wait_cpu = gk20a_channel_syncpt_wait_cpu;
|
|
sp->ops.is_expired = gk20a_channel_syncpt_is_expired;
|
|
sp->ops.wait_syncpt = gk20a_channel_syncpt_wait_syncpt;
|
|
sp->ops.wait_fd = gk20a_channel_syncpt_wait_fd;
|
|
sp->ops.incr = gk20a_channel_syncpt_incr;
|
|
sp->ops.incr_wfi = gk20a_channel_syncpt_incr_wfi;
|
|
sp->ops.incr_user_syncpt = gk20a_channel_syncpt_incr_user_syncpt;
|
|
sp->ops.incr_user_fd = gk20a_channel_syncpt_incr_user_fd;
|
|
sp->ops.set_min_eq_max = gk20a_channel_syncpt_set_min_eq_max;
|
|
sp->ops.destroy = gk20a_channel_syncpt_destroy;
|
|
|
|
sp->ops.aggressive_destroy = true;
|
|
|
|
return &sp->ops;
|
|
}
|
|
#endif /* CONFIG_TEGRA_GK20A */
|
|
|
|
struct gk20a_channel_semaphore {
|
|
struct gk20a_channel_sync ops;
|
|
struct channel_gk20a *c;
|
|
|
|
/* A semaphore pool owned by this channel. */
|
|
struct gk20a_semaphore_pool *pool;
|
|
|
|
/* A sync timeline that advances when gpu completes work. */
|
|
struct sync_timeline *timeline;
|
|
};
|
|
|
|
#ifdef CONFIG_SYNC
|
|
struct wait_fence_work {
|
|
struct sync_fence_waiter waiter;
|
|
struct channel_gk20a *ch;
|
|
struct gk20a_semaphore *sema;
|
|
};
|
|
|
|
static void gk20a_channel_semaphore_launcher(
|
|
struct sync_fence *fence,
|
|
struct sync_fence_waiter *waiter)
|
|
{
|
|
int err;
|
|
struct wait_fence_work *w =
|
|
container_of(waiter, struct wait_fence_work, waiter);
|
|
struct gk20a *g = w->ch->g;
|
|
|
|
gk20a_dbg_info("waiting for pre fence %p '%s'",
|
|
fence, fence->name);
|
|
err = sync_fence_wait(fence, -1);
|
|
if (err < 0)
|
|
dev_err(&g->dev->dev, "error waiting pre-fence: %d\n", err);
|
|
|
|
gk20a_dbg_info(
|
|
"wait completed (%d) for fence %p '%s', triggering gpu work",
|
|
err, fence, fence->name);
|
|
sync_fence_put(fence);
|
|
gk20a_semaphore_release(w->sema);
|
|
gk20a_semaphore_put(w->sema);
|
|
kfree(w);
|
|
}
|
|
#endif
|
|
|
|
static int add_sema_cmd(u32 *ptr, u64 sema, u32 payload,
|
|
bool acquire, bool wfi)
|
|
{
|
|
int i = 0;
|
|
/* semaphore_a */
|
|
ptr[i++] = 0x20010004;
|
|
/* offset_upper */
|
|
ptr[i++] = (sema >> 32) & 0xff;
|
|
/* semaphore_b */
|
|
ptr[i++] = 0x20010005;
|
|
/* offset */
|
|
ptr[i++] = sema & 0xffffffff;
|
|
/* semaphore_c */
|
|
ptr[i++] = 0x20010006;
|
|
/* payload */
|
|
ptr[i++] = payload;
|
|
if (acquire) {
|
|
/* semaphore_d */
|
|
ptr[i++] = 0x20010007;
|
|
/* operation: acq_geq, switch_en */
|
|
ptr[i++] = 0x4 | (0x1 << 12);
|
|
} else {
|
|
/* semaphore_d */
|
|
ptr[i++] = 0x20010007;
|
|
/* operation: release, wfi */
|
|
ptr[i++] = 0x2 | ((wfi ? 0x0 : 0x1) << 20);
|
|
/* non_stall_int */
|
|
ptr[i++] = 0x20010008;
|
|
/* ignored */
|
|
ptr[i++] = 0;
|
|
}
|
|
return i;
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_wait_cpu(
|
|
struct gk20a_channel_sync *s,
|
|
struct gk20a_channel_fence *fence,
|
|
int timeout)
|
|
{
|
|
int remain;
|
|
struct gk20a_channel_semaphore *sp =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
if (!fence->valid || WARN_ON(!fence->semaphore))
|
|
return 0;
|
|
|
|
remain = wait_event_interruptible_timeout(
|
|
sp->c->semaphore_wq,
|
|
!gk20a_semaphore_is_acquired(fence->semaphore),
|
|
timeout);
|
|
if (remain == 0 && gk20a_semaphore_is_acquired(fence->semaphore))
|
|
return -ETIMEDOUT;
|
|
else if (remain < 0)
|
|
return remain;
|
|
return 0;
|
|
}
|
|
|
|
static bool gk20a_channel_semaphore_is_expired(
|
|
struct gk20a_channel_sync *s,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
bool expired;
|
|
struct gk20a_channel_semaphore *sp =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
if (!fence->valid || WARN_ON(!fence->semaphore))
|
|
return true;
|
|
|
|
expired = !gk20a_semaphore_is_acquired(fence->semaphore);
|
|
if (expired)
|
|
gk20a_sync_timeline_signal(sp->timeline);
|
|
return expired;
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_wait_syncpt(
|
|
struct gk20a_channel_sync *s, u32 id,
|
|
u32 thresh, struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
struct gk20a_channel_semaphore *sema =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
struct device *dev = dev_from_gk20a(sema->c->g);
|
|
gk20a_err(dev, "trying to use syncpoint synchronization");
|
|
return -ENODEV;
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_wait_fd(
|
|
struct gk20a_channel_sync *s, int fd,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
struct gk20a_channel_semaphore *sema =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
struct channel_gk20a *c = sema->c;
|
|
#ifdef CONFIG_SYNC
|
|
struct sync_fence *sync_fence;
|
|
struct priv_cmd_entry *wait_cmd = NULL;
|
|
struct wait_fence_work *w;
|
|
int written;
|
|
int err;
|
|
u64 va;
|
|
|
|
sync_fence = gk20a_sync_fence_fdget(fd);
|
|
if (!sync_fence)
|
|
return -EINVAL;
|
|
|
|
w = kzalloc(sizeof(*w), GFP_KERNEL);
|
|
if (!w) {
|
|
err = -ENOMEM;
|
|
goto fail;
|
|
}
|
|
sync_fence_waiter_init(&w->waiter, gk20a_channel_semaphore_launcher);
|
|
w->ch = c;
|
|
w->sema = gk20a_semaphore_alloc(sema->pool);
|
|
if (!w->sema) {
|
|
gk20a_err(dev_from_gk20a(c->g), "ran out of semaphores");
|
|
err = -EAGAIN;
|
|
goto fail;
|
|
}
|
|
|
|
gk20a_channel_alloc_priv_cmdbuf(c, 8, &wait_cmd);
|
|
if (wait_cmd == NULL) {
|
|
gk20a_err(dev_from_gk20a(c->g),
|
|
"not enough priv cmd buffer space");
|
|
err = -EAGAIN;
|
|
goto fail;
|
|
}
|
|
|
|
va = gk20a_semaphore_gpu_va(w->sema, c->vm);
|
|
/* GPU unblocked when when the semaphore value becomes 1. */
|
|
written = add_sema_cmd(wait_cmd->ptr, va, 1, true, false);
|
|
WARN_ON(written != wait_cmd->size);
|
|
sync_fence_wait_async(sync_fence, &w->waiter);
|
|
|
|
*entry = wait_cmd;
|
|
return 0;
|
|
fail:
|
|
if (w && w->sema)
|
|
gk20a_semaphore_put(w->sema);
|
|
kfree(w);
|
|
sync_fence_put(sync_fence);
|
|
return err;
|
|
#else
|
|
gk20a_err(dev_from_gk20a(c->g),
|
|
"trying to use sync fds with CONFIG_SYNC disabled");
|
|
return -ENODEV;
|
|
#endif
|
|
}
|
|
|
|
static int __gk20a_channel_semaphore_incr(
|
|
struct gk20a_channel_sync *s, bool wfi_cmd,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
u64 va;
|
|
int incr_cmd_size;
|
|
int written;
|
|
struct priv_cmd_entry *incr_cmd = NULL;
|
|
struct gk20a_channel_semaphore *sp =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
struct channel_gk20a *c = sp->c;
|
|
struct gk20a_semaphore *semaphore;
|
|
|
|
semaphore = gk20a_semaphore_alloc(sp->pool);
|
|
if (!semaphore) {
|
|
gk20a_err(dev_from_gk20a(c->g),
|
|
"ran out of semaphores");
|
|
return -EAGAIN;
|
|
}
|
|
|
|
incr_cmd_size = 10;
|
|
gk20a_channel_alloc_priv_cmdbuf(c, incr_cmd_size, &incr_cmd);
|
|
if (incr_cmd == NULL) {
|
|
gk20a_err(dev_from_gk20a(c->g),
|
|
"not enough priv cmd buffer space");
|
|
gk20a_semaphore_put(semaphore);
|
|
return -EAGAIN;
|
|
}
|
|
|
|
/* Release the completion semaphore. */
|
|
va = gk20a_semaphore_gpu_va(semaphore, c->vm);
|
|
written = add_sema_cmd(incr_cmd->ptr, va, 1, false, wfi_cmd);
|
|
WARN_ON(written != incr_cmd_size);
|
|
|
|
fence->valid = true;
|
|
fence->wfi = wfi_cmd;
|
|
fence->semaphore = semaphore;
|
|
*entry = incr_cmd;
|
|
return 0;
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_incr_wfi(
|
|
struct gk20a_channel_sync *s,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
return __gk20a_channel_semaphore_incr(s,
|
|
true /* wfi */,
|
|
entry, fence);
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_incr(
|
|
struct gk20a_channel_sync *s,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence)
|
|
{
|
|
/* Don't put wfi cmd to this one since we're not returning
|
|
* a fence to user space. */
|
|
return __gk20a_channel_semaphore_incr(s, false /* no wfi */,
|
|
entry, fence);
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_incr_user_syncpt(
|
|
struct gk20a_channel_sync *s,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence,
|
|
bool wfi,
|
|
u32 *id, u32 *thresh)
|
|
{
|
|
struct gk20a_channel_semaphore *sema =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
struct device *dev = dev_from_gk20a(sema->c->g);
|
|
gk20a_err(dev, "trying to use syncpoint synchronization");
|
|
return -ENODEV;
|
|
}
|
|
|
|
static int gk20a_channel_semaphore_incr_user_fd(
|
|
struct gk20a_channel_sync *s,
|
|
int wait_fence_fd,
|
|
struct priv_cmd_entry **entry,
|
|
struct gk20a_channel_fence *fence,
|
|
bool wfi,
|
|
int *fd)
|
|
{
|
|
struct gk20a_channel_semaphore *sema =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
#ifdef CONFIG_SYNC
|
|
struct sync_fence *dependency = NULL;
|
|
int err;
|
|
|
|
err = __gk20a_channel_semaphore_incr(s, wfi,
|
|
entry, fence);
|
|
if (err)
|
|
return err;
|
|
|
|
if (wait_fence_fd >= 0) {
|
|
dependency = gk20a_sync_fence_fdget(wait_fence_fd);
|
|
if (!dependency)
|
|
return -EINVAL;
|
|
}
|
|
|
|
*fd = gk20a_sync_fence_create(sema->timeline, fence->semaphore,
|
|
dependency, "fence");
|
|
if (*fd < 0) {
|
|
if (dependency)
|
|
sync_fence_put(dependency);
|
|
return *fd;
|
|
}
|
|
return 0;
|
|
#else
|
|
gk20a_err(dev_from_gk20a(sema->c->g),
|
|
"trying to use sync fds with CONFIG_SYNC disabled");
|
|
return -ENODEV;
|
|
#endif
|
|
}
|
|
|
|
static void gk20a_channel_semaphore_set_min_eq_max(struct gk20a_channel_sync *s)
|
|
{
|
|
/* Nothing to do. */
|
|
}
|
|
|
|
static void gk20a_channel_semaphore_destroy(struct gk20a_channel_sync *s)
|
|
{
|
|
struct gk20a_channel_semaphore *sema =
|
|
container_of(s, struct gk20a_channel_semaphore, ops);
|
|
if (sema->timeline)
|
|
gk20a_sync_timeline_destroy(sema->timeline);
|
|
if (sema->pool) {
|
|
gk20a_semaphore_pool_unmap(sema->pool, sema->c->vm);
|
|
gk20a_semaphore_pool_put(sema->pool);
|
|
}
|
|
kfree(sema);
|
|
}
|
|
|
|
static struct gk20a_channel_sync *
|
|
gk20a_channel_semaphore_create(struct channel_gk20a *c)
|
|
{
|
|
int err;
|
|
int asid = -1;
|
|
struct gk20a_channel_semaphore *sema;
|
|
char pool_name[20];
|
|
|
|
if (WARN_ON(!c->vm))
|
|
return NULL;
|
|
|
|
sema = kzalloc(sizeof(*sema), GFP_KERNEL);
|
|
if (!sema)
|
|
return NULL;
|
|
sema->c = c;
|
|
|
|
if (c->vm->as_share)
|
|
asid = c->vm->as_share->id;
|
|
|
|
/* A pool of 256 semaphores fits into one 4k page. */
|
|
sprintf(pool_name, "semaphore_pool-%d", c->hw_chid);
|
|
sema->pool = gk20a_semaphore_pool_alloc(dev_from_gk20a(c->g),
|
|
pool_name, 256);
|
|
if (!sema->pool)
|
|
goto clean_up;
|
|
|
|
/* Map the semaphore pool to the channel vm. Map as read-write to the
|
|
* owner channel (all other channels should map as read only!). */
|
|
err = gk20a_semaphore_pool_map(sema->pool, c->vm, gk20a_mem_flag_none);
|
|
if (err)
|
|
goto clean_up;
|
|
|
|
#ifdef CONFIG_SYNC
|
|
sema->timeline = gk20a_sync_timeline_create(
|
|
"gk20a_ch%d_as%d", c->hw_chid, asid);
|
|
if (!sema->timeline)
|
|
goto clean_up;
|
|
#endif
|
|
sema->ops.wait_cpu = gk20a_channel_semaphore_wait_cpu;
|
|
sema->ops.is_expired = gk20a_channel_semaphore_is_expired;
|
|
sema->ops.wait_syncpt = gk20a_channel_semaphore_wait_syncpt;
|
|
sema->ops.wait_fd = gk20a_channel_semaphore_wait_fd;
|
|
sema->ops.incr = gk20a_channel_semaphore_incr;
|
|
sema->ops.incr_wfi = gk20a_channel_semaphore_incr_wfi;
|
|
sema->ops.incr_user_syncpt = gk20a_channel_semaphore_incr_user_syncpt;
|
|
sema->ops.incr_user_fd = gk20a_channel_semaphore_incr_user_fd;
|
|
sema->ops.set_min_eq_max = gk20a_channel_semaphore_set_min_eq_max;
|
|
sema->ops.destroy = gk20a_channel_semaphore_destroy;
|
|
|
|
/* Aggressively destroying the semaphore sync would cause overhead
|
|
* since the pool needs to be mapped to GMMU. */
|
|
sema->ops.aggressive_destroy = false;
|
|
|
|
return &sema->ops;
|
|
clean_up:
|
|
gk20a_channel_semaphore_destroy(&sema->ops);
|
|
return NULL;
|
|
}
|
|
|
|
struct gk20a_channel_sync *gk20a_channel_sync_create(struct channel_gk20a *c)
|
|
{
|
|
#ifdef CONFIG_TEGRA_GK20A
|
|
if (gk20a_platform_has_syncpoints(c->g->dev))
|
|
return gk20a_channel_syncpt_create(c);
|
|
#endif
|
|
return gk20a_channel_semaphore_create(c);
|
|
}
|
|
|
|
static inline bool gk20a_channel_fence_is_closed(struct gk20a_channel_fence *f)
|
|
{
|
|
if (f->valid || f->semaphore)
|
|
return false;
|
|
return true;
|
|
}
|
|
|
|
void gk20a_channel_fence_close(struct gk20a_channel_fence *f)
|
|
{
|
|
if (f->semaphore)
|
|
gk20a_semaphore_put(f->semaphore);
|
|
memset(f, 0, sizeof(*f));
|
|
}
|
|
|
|
void gk20a_channel_fence_dup(struct gk20a_channel_fence *from,
|
|
struct gk20a_channel_fence *to)
|
|
{
|
|
WARN_ON(!gk20a_channel_fence_is_closed(to));
|
|
*to = *from;
|
|
if (to->semaphore)
|
|
gk20a_semaphore_get(to->semaphore);
|
|
}
|