mirror of
git://nv-tegra.nvidia.com/linux-nvgpu.git
synced 2025-12-23 09:57:08 +03:00
Add reference counting for channels, and wait for reference count to get to 0 in gk20a_channel_free() before actually freeing the channel. Also, change free channel tracking a bit by employing a list of free channels, which simplifies the procedure of finding available channels with reference counting. Each use of a channel must have a reference taken before use or held by the caller. Taking a reference of a wild channel pointer may fail, if the channel is either not opened or in a process of being closed. Also, add safeguards for protecting accidental use of closed channels, specifically, by setting ch->g = NULL in channel free. This will make it obvious if freed channel is attempted to be used. The last user of a channel might be the deferred interrupt handler, so wait for deferred interrupts to be processed twice in the channel free procedure: once for providing last notifications to the channel and once to make sure there are no stale pointers left after referencing to the channel has been denied. Finally, fix some races in channel and TSG force reset IOCTL path, by pausing the channel scheduler in gk20a_fifo_recover_ch() and gk20a_fifo_recover_tsg(), while the affected engines have been identified, the appropriate MMU faults triggered, and the MMU faults handled. In this case, make sure that the MMU fault does not attempt to query the hardware about the failing channel or TSG ids. This should make channel recovery more safe also in the regular (i.e., not in the interrupt handler) context. Bug 1530226 Bug 1597493 Bug 1625901 Bug 200076344 Bug 200071810 Change-Id: Ib274876908e18219c64ea41e50ca443df81d957b Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com> Signed-off-by: Konsta Holtta <kholtta@nvidia.com> Signed-off-by: Sami Kiminki <skiminki@nvidia.com> Reviewed-on: http://git-master/r/448463 (cherry picked from commit 3f03aeae64ef2af4829e06f5f63062e8ebd21353) Reviewed-on: http://git-master/r/755147 Reviewed-by: Automatic_Commit_Validation_User
182 lines
4.9 KiB
C
182 lines
4.9 KiB
C
/*
|
|
* drivers/video/tegra/host/gk20a/fifo_gk20a.h
|
|
*
|
|
* GK20A graphics fifo (gr host)
|
|
*
|
|
* Copyright (c) 2011-2015, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms and conditions of the GNU General Public License,
|
|
* version 2, as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along with
|
|
* this program; if not, write to the Free Software Foundation, Inc.,
|
|
* 51 Franklin St - Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*/
|
|
#ifndef __FIFO_GK20A_H__
|
|
#define __FIFO_GK20A_H__
|
|
|
|
#include "channel_gk20a.h"
|
|
#include "tsg_gk20a.h"
|
|
|
|
#define MAX_RUNLIST_BUFFERS 2
|
|
|
|
/* generally corresponds to the "pbdma" engine */
|
|
|
|
struct fifo_runlist_info_gk20a {
|
|
unsigned long *active_channels;
|
|
unsigned long *active_tsgs;
|
|
/* Each engine has its own SW and HW runlist buffer.*/
|
|
struct mem_desc mem[MAX_RUNLIST_BUFFERS];
|
|
u32 cur_buffer;
|
|
u32 total_entries;
|
|
bool stopped;
|
|
bool support_tsg;
|
|
struct mutex mutex; /* protect channel preempt and runlist upate */
|
|
};
|
|
|
|
/* so far gk20a has two engines: gr and ce2(gr_copy) */
|
|
enum {
|
|
ENGINE_GR_GK20A = 0,
|
|
ENGINE_CE2_GK20A = 1,
|
|
ENGINE_INVAL_GK20A
|
|
};
|
|
|
|
struct fifo_pbdma_exception_info_gk20a {
|
|
u32 status_r; /* raw register value from hardware */
|
|
u32 id, next_id;
|
|
u32 chan_status_v; /* raw value from hardware */
|
|
bool id_is_chid, next_id_is_chid;
|
|
bool chsw_in_progress;
|
|
};
|
|
|
|
struct fifo_engine_exception_info_gk20a {
|
|
u32 status_r; /* raw register value from hardware */
|
|
u32 id, next_id;
|
|
u32 ctx_status_v; /* raw value from hardware */
|
|
bool id_is_chid, next_id_is_chid;
|
|
bool faulted, idle, ctxsw_in_progress;
|
|
};
|
|
|
|
struct fifo_mmu_fault_info_gk20a {
|
|
u32 fault_info_v;
|
|
u32 fault_type_v;
|
|
u32 engine_subid_v;
|
|
u32 client_v;
|
|
u32 fault_hi_v;
|
|
u32 fault_lo_v;
|
|
u64 inst_ptr;
|
|
const char *fault_type_desc;
|
|
const char *engine_subid_desc;
|
|
const char *client_desc;
|
|
};
|
|
|
|
struct fifo_engine_info_gk20a {
|
|
u32 engine_id;
|
|
u32 runlist_id;
|
|
u32 intr_id;
|
|
u32 reset_id;
|
|
u32 pbdma_id;
|
|
struct fifo_pbdma_exception_info_gk20a pbdma_exception_info;
|
|
struct fifo_engine_exception_info_gk20a engine_exception_info;
|
|
struct fifo_mmu_fault_info_gk20a mmu_fault_info;
|
|
|
|
};
|
|
|
|
struct fifo_gk20a {
|
|
struct gk20a *g;
|
|
int num_channels;
|
|
|
|
int num_pbdma;
|
|
u32 *pbdma_map;
|
|
|
|
struct fifo_engine_info_gk20a *engine_info;
|
|
u32 max_engines;
|
|
u32 num_engines;
|
|
|
|
struct fifo_runlist_info_gk20a *runlist_info;
|
|
u32 max_runlists;
|
|
|
|
struct mem_desc userd;
|
|
u32 userd_entry_size;
|
|
|
|
struct channel_gk20a *channel;
|
|
/* zero-kref'd channels here */
|
|
struct list_head free_chs;
|
|
struct mutex free_chs_mutex;
|
|
|
|
struct tsg_gk20a *tsg;
|
|
struct mutex tsg_inuse_mutex;
|
|
|
|
void (*remove_support)(struct fifo_gk20a *);
|
|
bool sw_ready;
|
|
struct {
|
|
/* share info between isrs and non-isr code */
|
|
struct {
|
|
struct mutex mutex;
|
|
} isr;
|
|
struct {
|
|
u32 device_fatal_0;
|
|
u32 channel_fatal_0;
|
|
u32 restartable_0;
|
|
} pbdma;
|
|
struct {
|
|
|
|
} engine;
|
|
|
|
|
|
} intr;
|
|
|
|
u32 deferred_fault_engines;
|
|
bool deferred_reset_pending;
|
|
struct mutex deferred_reset_mutex;
|
|
};
|
|
|
|
int gk20a_init_fifo_support(struct gk20a *g);
|
|
|
|
void gk20a_fifo_isr(struct gk20a *g);
|
|
void gk20a_fifo_nonstall_isr(struct gk20a *g);
|
|
|
|
int gk20a_fifo_preempt_channel(struct gk20a *g, u32 hw_chid);
|
|
int gk20a_fifo_preempt_tsg(struct gk20a *g, u32 tsgid);
|
|
int gk20a_fifo_preempt(struct gk20a *g, struct channel_gk20a *ch);
|
|
|
|
int gk20a_fifo_enable_engine_activity(struct gk20a *g,
|
|
struct fifo_engine_info_gk20a *eng_info);
|
|
int gk20a_fifo_disable_engine_activity(struct gk20a *g,
|
|
struct fifo_engine_info_gk20a *eng_info,
|
|
bool wait_for_idle);
|
|
u32 gk20a_fifo_engines_on_ch(struct gk20a *g, u32 hw_chid);
|
|
|
|
int gk20a_fifo_update_runlist(struct gk20a *g, u32 engine_id, u32 hw_chid,
|
|
bool add, bool wait_for_finish);
|
|
|
|
int gk20a_fifo_suspend(struct gk20a *g);
|
|
|
|
bool gk20a_fifo_mmu_fault_pending(struct gk20a *g);
|
|
|
|
void gk20a_fifo_recover(struct gk20a *g,
|
|
u32 engine_ids, /* if zero, will be queried from HW */
|
|
u32 hw_id, /* if ~0, will be queried from HW */
|
|
bool hw_id_is_tsg, /* ignored if hw_id == ~0 */
|
|
bool verbose);
|
|
void gk20a_fifo_recover_ch(struct gk20a *g, u32 hw_chid, bool verbose);
|
|
void gk20a_fifo_recover_tsg(struct gk20a *g, u32 tsgid, bool verbose);
|
|
int gk20a_fifo_force_reset_ch(struct channel_gk20a *ch, bool verbose);
|
|
void gk20a_fifo_reset_engine(struct gk20a *g, u32 engine_id);
|
|
int gk20a_init_fifo_reset_enable_hw(struct gk20a *g);
|
|
void gk20a_init_fifo(struct gpu_ops *gops);
|
|
|
|
void fifo_gk20a_finish_mmu_fault_handling(struct gk20a *g,
|
|
unsigned long fault_id);
|
|
int gk20a_fifo_wait_engine_idle(struct gk20a *g);
|
|
u32 gk20a_fifo_engine_interrupt_mask(struct gk20a *g);
|
|
u32 gk20a_fifo_get_pbdma_signature(struct gk20a *g);
|
|
|
|
#endif /*__GR_GK20A_H__*/
|