mirror of
https://github.com/raspberrypi/linux.git
synced 2025-12-17 23:34:24 +00:00
When GuC support was added to error capture, the reference counting around the request object was broken. Fix it up. The context based search manages the spinlocking around the search internally. So it needs to grab the reference count internally as well. The execlist only request based search relies on external locking, so it needs an external reference count but within the spinlock not outside it. The only other caller of the context based search is the code for dumping engine state to debugfs. That code wasn't previously getting an explicit reference at all as it does everything while holding the execlist specific spinlock. So, that needs updaing as well as that spinlock doesn't help when using GuC submission. Rather than trying to conditionally get/put depending on submission model, just change it to always do the get/put. v2: Explicitly document adding an extra blank line in some dense code (Andy Shevchenko). Fix multiple potential null pointer derefs in case of no request found (some spotted by Tvrtko, but there was more!). Also fix a leaked request in case of !started and another in __guc_reset_context now that intel_context_find_active_request is actually reference counting the returned request. v3: Add a _get suffix to intel_context_find_active_request now that it grabs a reference (Daniele). v4: Split the intel_guc_find_hung_context change to a separate patch and rename intel_context_find_active_request_get to intel_context_get_active_request (Tvrtko). v5: s/locking/reference counting/ in commit message (Tvrtko) Fixes:dc0dad365c("drm/i915/guc: Fix for error capture after full GPU reset with GuC") Fixes:573ba126ae("drm/i915/guc: Capture error state on context reset") Signed-off-by: John Harrison <John.C.Harrison@Intel.com> Reviewed-by: Daniele Ceraolo Spurio <daniele.ceraolospurio@intel.com> Acked-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com> Cc: Matthew Brost <matthew.brost@intel.com> Cc: Jani Nikula <jani.nikula@linux.intel.com> Cc: Joonas Lahtinen <joonas.lahtinen@linux.intel.com> Cc: Rodrigo Vivi <rodrigo.vivi@intel.com> Cc: Andrzej Hajda <andrzej.hajda@intel.com> Cc: Matthew Auld <matthew.auld@intel.com> Cc: Matt Roper <matthew.d.roper@intel.com> Cc: Umesh Nerlige Ramappa <umesh.nerlige.ramappa@intel.com> Cc: Michael Cheng <michael.cheng@intel.com> Cc: Lucas De Marchi <lucas.demarchi@intel.com> Cc: Tejas Upadhyay <tejaskumarx.surendrakumar.upadhyay@intel.com> Cc: Andy Shevchenko <andriy.shevchenko@linux.intel.com> Cc: Aravind Iddamsetty <aravind.iddamsetty@intel.com> Cc: Alan Previn <alan.previn.teres.alexis@intel.com> Cc: Bruce Chang <yu.bruce.chang@intel.com> Link: https://patchwork.freedesktop.org/patch/msgid/20230127002842.3169194-3-John.C.Harrison@Intel.com (cherry picked from commit3700e35378) Signed-off-by: Rodrigo Vivi <rodrigo.vivi@intel.com>
381 lines
9.8 KiB
C
381 lines
9.8 KiB
C
/* SPDX-License-Identifier: MIT */
|
|
/*
|
|
* Copyright © 2019 Intel Corporation
|
|
*/
|
|
|
|
#ifndef __INTEL_CONTEXT_H__
|
|
#define __INTEL_CONTEXT_H__
|
|
|
|
#include <linux/bitops.h>
|
|
#include <linux/lockdep.h>
|
|
#include <linux/types.h>
|
|
|
|
#include "i915_active.h"
|
|
#include "i915_drv.h"
|
|
#include "intel_context_types.h"
|
|
#include "intel_engine_types.h"
|
|
#include "intel_ring_types.h"
|
|
#include "intel_timeline_types.h"
|
|
#include "i915_trace.h"
|
|
|
|
#define CE_TRACE(ce, fmt, ...) do { \
|
|
const struct intel_context *ce__ = (ce); \
|
|
ENGINE_TRACE(ce__->engine, "context:%llx " fmt, \
|
|
ce__->timeline->fence_context, \
|
|
##__VA_ARGS__); \
|
|
} while (0)
|
|
|
|
#define INTEL_CONTEXT_BANNED_PREEMPT_TIMEOUT_MS (1)
|
|
|
|
struct i915_gem_ww_ctx;
|
|
|
|
void intel_context_init(struct intel_context *ce,
|
|
struct intel_engine_cs *engine);
|
|
void intel_context_fini(struct intel_context *ce);
|
|
|
|
void i915_context_module_exit(void);
|
|
int i915_context_module_init(void);
|
|
|
|
struct intel_context *
|
|
intel_context_create(struct intel_engine_cs *engine);
|
|
|
|
int intel_context_alloc_state(struct intel_context *ce);
|
|
|
|
void intel_context_free(struct intel_context *ce);
|
|
|
|
int intel_context_reconfigure_sseu(struct intel_context *ce,
|
|
const struct intel_sseu sseu);
|
|
|
|
#define PARENT_SCRATCH_SIZE PAGE_SIZE
|
|
|
|
static inline bool intel_context_is_child(struct intel_context *ce)
|
|
{
|
|
return !!ce->parallel.parent;
|
|
}
|
|
|
|
static inline bool intel_context_is_parent(struct intel_context *ce)
|
|
{
|
|
return !!ce->parallel.number_children;
|
|
}
|
|
|
|
static inline bool intel_context_is_pinned(struct intel_context *ce);
|
|
|
|
static inline struct intel_context *
|
|
intel_context_to_parent(struct intel_context *ce)
|
|
{
|
|
if (intel_context_is_child(ce)) {
|
|
/*
|
|
* The parent holds ref count to the child so it is always safe
|
|
* for the parent to access the child, but the child has a
|
|
* pointer to the parent without a ref. To ensure this is safe
|
|
* the child should only access the parent pointer while the
|
|
* parent is pinned.
|
|
*/
|
|
GEM_BUG_ON(!intel_context_is_pinned(ce->parallel.parent));
|
|
|
|
return ce->parallel.parent;
|
|
} else {
|
|
return ce;
|
|
}
|
|
}
|
|
|
|
static inline bool intel_context_is_parallel(struct intel_context *ce)
|
|
{
|
|
return intel_context_is_child(ce) || intel_context_is_parent(ce);
|
|
}
|
|
|
|
void intel_context_bind_parent_child(struct intel_context *parent,
|
|
struct intel_context *child);
|
|
|
|
#define for_each_child(parent, ce)\
|
|
list_for_each_entry(ce, &(parent)->parallel.child_list,\
|
|
parallel.child_link)
|
|
#define for_each_child_safe(parent, ce, cn)\
|
|
list_for_each_entry_safe(ce, cn, &(parent)->parallel.child_list,\
|
|
parallel.child_link)
|
|
|
|
/**
|
|
* intel_context_lock_pinned - Stablises the 'pinned' status of the HW context
|
|
* @ce - the context
|
|
*
|
|
* Acquire a lock on the pinned status of the HW context, such that the context
|
|
* can neither be bound to the GPU or unbound whilst the lock is held, i.e.
|
|
* intel_context_is_pinned() remains stable.
|
|
*/
|
|
static inline int intel_context_lock_pinned(struct intel_context *ce)
|
|
__acquires(ce->pin_mutex)
|
|
{
|
|
return mutex_lock_interruptible(&ce->pin_mutex);
|
|
}
|
|
|
|
/**
|
|
* intel_context_is_pinned - Reports the 'pinned' status
|
|
* @ce - the context
|
|
*
|
|
* While in use by the GPU, the context, along with its ring and page
|
|
* tables is pinned into memory and the GTT.
|
|
*
|
|
* Returns: true if the context is currently pinned for use by the GPU.
|
|
*/
|
|
static inline bool
|
|
intel_context_is_pinned(struct intel_context *ce)
|
|
{
|
|
return atomic_read(&ce->pin_count);
|
|
}
|
|
|
|
static inline void intel_context_cancel_request(struct intel_context *ce,
|
|
struct i915_request *rq)
|
|
{
|
|
GEM_BUG_ON(!ce->ops->cancel_request);
|
|
return ce->ops->cancel_request(ce, rq);
|
|
}
|
|
|
|
/**
|
|
* intel_context_unlock_pinned - Releases the earlier locking of 'pinned' status
|
|
* @ce - the context
|
|
*
|
|
* Releases the lock earlier acquired by intel_context_unlock_pinned().
|
|
*/
|
|
static inline void intel_context_unlock_pinned(struct intel_context *ce)
|
|
__releases(ce->pin_mutex)
|
|
{
|
|
mutex_unlock(&ce->pin_mutex);
|
|
}
|
|
|
|
int __intel_context_do_pin(struct intel_context *ce);
|
|
int __intel_context_do_pin_ww(struct intel_context *ce,
|
|
struct i915_gem_ww_ctx *ww);
|
|
|
|
static inline bool intel_context_pin_if_active(struct intel_context *ce)
|
|
{
|
|
return atomic_inc_not_zero(&ce->pin_count);
|
|
}
|
|
|
|
static inline int intel_context_pin(struct intel_context *ce)
|
|
{
|
|
if (likely(intel_context_pin_if_active(ce)))
|
|
return 0;
|
|
|
|
return __intel_context_do_pin(ce);
|
|
}
|
|
|
|
static inline int intel_context_pin_ww(struct intel_context *ce,
|
|
struct i915_gem_ww_ctx *ww)
|
|
{
|
|
if (likely(intel_context_pin_if_active(ce)))
|
|
return 0;
|
|
|
|
return __intel_context_do_pin_ww(ce, ww);
|
|
}
|
|
|
|
static inline void __intel_context_pin(struct intel_context *ce)
|
|
{
|
|
GEM_BUG_ON(!intel_context_is_pinned(ce));
|
|
atomic_inc(&ce->pin_count);
|
|
}
|
|
|
|
void __intel_context_do_unpin(struct intel_context *ce, int sub);
|
|
|
|
static inline void intel_context_sched_disable_unpin(struct intel_context *ce)
|
|
{
|
|
__intel_context_do_unpin(ce, 2);
|
|
}
|
|
|
|
static inline void intel_context_unpin(struct intel_context *ce)
|
|
{
|
|
if (!ce->ops->sched_disable) {
|
|
__intel_context_do_unpin(ce, 1);
|
|
} else {
|
|
/*
|
|
* Move ownership of this pin to the scheduling disable which is
|
|
* an async operation. When that operation completes the above
|
|
* intel_context_sched_disable_unpin is called potentially
|
|
* unpinning the context.
|
|
*/
|
|
while (!atomic_add_unless(&ce->pin_count, -1, 1)) {
|
|
if (atomic_cmpxchg(&ce->pin_count, 1, 2) == 1) {
|
|
ce->ops->sched_disable(ce);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void intel_context_enter_engine(struct intel_context *ce);
|
|
void intel_context_exit_engine(struct intel_context *ce);
|
|
|
|
static inline void intel_context_enter(struct intel_context *ce)
|
|
{
|
|
lockdep_assert_held(&ce->timeline->mutex);
|
|
if (!ce->active_count++)
|
|
ce->ops->enter(ce);
|
|
}
|
|
|
|
static inline void intel_context_mark_active(struct intel_context *ce)
|
|
{
|
|
lockdep_assert(lockdep_is_held(&ce->timeline->mutex) ||
|
|
test_bit(CONTEXT_IS_PARKING, &ce->flags));
|
|
++ce->active_count;
|
|
}
|
|
|
|
static inline void intel_context_exit(struct intel_context *ce)
|
|
{
|
|
lockdep_assert_held(&ce->timeline->mutex);
|
|
GEM_BUG_ON(!ce->active_count);
|
|
if (!--ce->active_count)
|
|
ce->ops->exit(ce);
|
|
}
|
|
|
|
static inline struct intel_context *intel_context_get(struct intel_context *ce)
|
|
{
|
|
kref_get(&ce->ref);
|
|
return ce;
|
|
}
|
|
|
|
static inline void intel_context_put(struct intel_context *ce)
|
|
{
|
|
kref_put(&ce->ref, ce->ops->destroy);
|
|
}
|
|
|
|
static inline struct intel_timeline *__must_check
|
|
intel_context_timeline_lock(struct intel_context *ce)
|
|
__acquires(&ce->timeline->mutex)
|
|
{
|
|
struct intel_timeline *tl = ce->timeline;
|
|
int err;
|
|
|
|
if (intel_context_is_parent(ce))
|
|
err = mutex_lock_interruptible_nested(&tl->mutex, 0);
|
|
else if (intel_context_is_child(ce))
|
|
err = mutex_lock_interruptible_nested(&tl->mutex,
|
|
ce->parallel.child_index + 1);
|
|
else
|
|
err = mutex_lock_interruptible(&tl->mutex);
|
|
if (err)
|
|
return ERR_PTR(err);
|
|
|
|
return tl;
|
|
}
|
|
|
|
static inline void intel_context_timeline_unlock(struct intel_timeline *tl)
|
|
__releases(&tl->mutex)
|
|
{
|
|
mutex_unlock(&tl->mutex);
|
|
}
|
|
|
|
int intel_context_prepare_remote_request(struct intel_context *ce,
|
|
struct i915_request *rq);
|
|
|
|
struct i915_request *intel_context_create_request(struct intel_context *ce);
|
|
|
|
struct i915_request *intel_context_get_active_request(struct intel_context *ce);
|
|
|
|
static inline bool intel_context_is_barrier(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_BARRIER_BIT, &ce->flags);
|
|
}
|
|
|
|
static inline void intel_context_close(struct intel_context *ce)
|
|
{
|
|
set_bit(CONTEXT_CLOSED_BIT, &ce->flags);
|
|
|
|
if (ce->ops->close)
|
|
ce->ops->close(ce);
|
|
}
|
|
|
|
static inline bool intel_context_is_closed(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_CLOSED_BIT, &ce->flags);
|
|
}
|
|
|
|
static inline bool intel_context_has_inflight(const struct intel_context *ce)
|
|
{
|
|
return test_bit(COPS_HAS_INFLIGHT_BIT, &ce->ops->flags);
|
|
}
|
|
|
|
static inline bool intel_context_use_semaphores(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_USE_SEMAPHORES, &ce->flags);
|
|
}
|
|
|
|
static inline void intel_context_set_use_semaphores(struct intel_context *ce)
|
|
{
|
|
set_bit(CONTEXT_USE_SEMAPHORES, &ce->flags);
|
|
}
|
|
|
|
static inline void intel_context_clear_use_semaphores(struct intel_context *ce)
|
|
{
|
|
clear_bit(CONTEXT_USE_SEMAPHORES, &ce->flags);
|
|
}
|
|
|
|
static inline bool intel_context_is_banned(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_BANNED, &ce->flags);
|
|
}
|
|
|
|
static inline bool intel_context_set_banned(struct intel_context *ce)
|
|
{
|
|
return test_and_set_bit(CONTEXT_BANNED, &ce->flags);
|
|
}
|
|
|
|
bool intel_context_ban(struct intel_context *ce, struct i915_request *rq);
|
|
|
|
static inline bool intel_context_is_schedulable(const struct intel_context *ce)
|
|
{
|
|
return !test_bit(CONTEXT_EXITING, &ce->flags) &&
|
|
!test_bit(CONTEXT_BANNED, &ce->flags);
|
|
}
|
|
|
|
static inline bool intel_context_is_exiting(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_EXITING, &ce->flags);
|
|
}
|
|
|
|
static inline bool intel_context_set_exiting(struct intel_context *ce)
|
|
{
|
|
return test_and_set_bit(CONTEXT_EXITING, &ce->flags);
|
|
}
|
|
|
|
bool intel_context_revoke(struct intel_context *ce);
|
|
|
|
static inline bool
|
|
intel_context_force_single_submission(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_FORCE_SINGLE_SUBMISSION, &ce->flags);
|
|
}
|
|
|
|
static inline void
|
|
intel_context_set_single_submission(struct intel_context *ce)
|
|
{
|
|
__set_bit(CONTEXT_FORCE_SINGLE_SUBMISSION, &ce->flags);
|
|
}
|
|
|
|
static inline bool
|
|
intel_context_nopreempt(const struct intel_context *ce)
|
|
{
|
|
return test_bit(CONTEXT_NOPREEMPT, &ce->flags);
|
|
}
|
|
|
|
static inline void
|
|
intel_context_set_nopreempt(struct intel_context *ce)
|
|
{
|
|
set_bit(CONTEXT_NOPREEMPT, &ce->flags);
|
|
}
|
|
|
|
static inline void
|
|
intel_context_clear_nopreempt(struct intel_context *ce)
|
|
{
|
|
clear_bit(CONTEXT_NOPREEMPT, &ce->flags);
|
|
}
|
|
|
|
u64 intel_context_get_total_runtime_ns(const struct intel_context *ce);
|
|
u64 intel_context_get_avg_runtime_ns(struct intel_context *ce);
|
|
|
|
static inline u64 intel_context_clock(void)
|
|
{
|
|
/* As we mix CS cycles with CPU clocks, use the raw monotonic clock. */
|
|
return ktime_get_raw_fast_ns();
|
|
}
|
|
|
|
#endif /* __INTEL_CONTEXT_H__ */
|