mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-22 15:45:09 +07:00
f911e7234f
lockdep insists that if we give a lock a subclass, it must be used. Failure to do so triggers a self-consistency check when reading lockdep_stats: [ 49.902002] DEBUG_LOCKS_WARN_ON(debug_atomic_read(nr_unused_locks) != nr_unused) [ 49.902009] WARNING: CPU: 3 PID: 383 at kernel/locking/lockdep_proc.c:249 lockdep_stats_show+0x984/0xa10 [ 49.902026] Modules linked in: nls_ascii nls_cp437 vfat fat crct10dif_pclmul crc32_pclmul crc32c_intel aesni_intel aes_x86_64 crypto_simd cryptd glue_helper intel_cstate intel_uncore intel_rapl_perf intel_gtt efivars prime_numbers ahci libahci i2c_i801 video button efivarfs [last unloaded: drm_kms_helper] [ 49.902059] CPU: 3 PID: 383 Comm: cat Tainted: G U 4.20.0-rc2+ #304 [ 49.902068] Hardware name: Intel Corporation NUC7i5BNK/NUC7i5BNB, BIOS BNKBL357.86A.0052.2017.0918.1346 09/18/2017 [ 49.902079] RIP: 0010:lockdep_stats_show+0x984/0xa10 [ 49.902086] Code: 00 85 c0 0f 84 aa f8 ff ff 8b 05 77 37 e2 00 85 c0 0f 85 9c f8 ff ff 48 c7 c6 e0 57 bc 81 48 c7 c7 28 30 bb 81 e8 6b 77 fa ff <0f> 0b e9 82 f8 ff ff 48 c7 44 24 50 00 00 00 00 45 31 e4 31 db 31 [ 49.902103] RSP: 0018:ffffc90000247d58 EFLAGS: 00010292 [ 49.902110] RAX: 0000000000000044 RBX: 00000000000002f0 RCX: 0000000000000000 [ 49.902118] RDX: 0000000000000002 RSI: 0000000000000001 RDI: ffffffff810b3464 [ 49.902126] RBP: 0000000000000039 R08: 0000000000000002 R09: 0000000000000000 [ 49.902133] R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000007ead [ 49.902141] R13: 0000000000000001 R14: ffff88884c021000 R15: 0000000000000097 [ 49.902150] FS: 00007fb347e66540(0000) GS:ffff88885e600000(0000) knlGS:0000000000000000 [ 49.902159] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 [ 49.902165] CR2: 00007fb347aeb000 CR3: 00000008544bd005 CR4: 00000000001606e0 Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk> Cc: Tvrtko Ursulin <tvrtko.ursulin@intel.com> Cc: Michał Winiarski <michal.winiarski@intel.com> Cc: Matthew Auld <matthew.auld@intel.com> Reviewed-by: Matthew Auld 
<matthew.auld@intel.com> Link: https://patchwork.freedesktop.org/patch/msgid/20181115203851.25739-1-chris@chris-wilson.co.uk
148 lines
4.6 KiB
C
148 lines
4.6 KiB
C
/*
|
|
* Copyright © 2016 Intel Corporation
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
|
* IN THE SOFTWARE.
|
|
*
|
|
*/
|
|
|
|
#ifndef I915_TIMELINE_H
|
|
#define I915_TIMELINE_H
|
|
|
|
#include <linux/list.h>
|
|
#include <linux/kref.h>
|
|
|
|
#include "i915_request.h"
|
|
#include "i915_syncmap.h"
|
|
#include "i915_utils.h"
|
|
|
|
struct i915_timeline {
|
|
u64 fence_context;
|
|
u32 seqno;
|
|
|
|
spinlock_t lock;
|
|
#define TIMELINE_CLIENT 0 /* default subclass */
|
|
#define TIMELINE_ENGINE 1
|
|
|
|
/**
|
|
* List of breadcrumbs associated with GPU requests currently
|
|
* outstanding.
|
|
*/
|
|
struct list_head requests;
|
|
|
|
/* Contains an RCU guarded pointer to the last request. No reference is
|
|
* held to the request, users must carefully acquire a reference to
|
|
* the request using i915_gem_active_get_request_rcu(), or hold the
|
|
* struct_mutex.
|
|
*/
|
|
struct i915_gem_active last_request;
|
|
|
|
/**
|
|
* We track the most recent seqno that we wait on in every context so
|
|
* that we only have to emit a new await and dependency on a more
|
|
* recent sync point. As the contexts may be executed out-of-order, we
|
|
* have to track each individually and can not rely on an absolute
|
|
* global_seqno. When we know that all tracked fences are completed
|
|
* (i.e. when the driver is idle), we know that the syncmap is
|
|
* redundant and we can discard it without loss of generality.
|
|
*/
|
|
struct i915_syncmap *sync;
|
|
/**
|
|
* Separately to the inter-context seqno map above, we track the last
|
|
* barrier (e.g. semaphore wait) to the global engine timelines. Note
|
|
* that this tracks global_seqno rather than the context.seqno, and
|
|
* so it is subject to the limitations of hw wraparound and that we
|
|
* may need to revoke global_seqno (on pre-emption).
|
|
*/
|
|
u32 global_sync[I915_NUM_ENGINES];
|
|
|
|
struct list_head link;
|
|
const char *name;
|
|
|
|
struct kref kref;
|
|
};
|
|
|
|
/*
 * Set up / tear down a timeline whose storage is supplied by the caller.
 * Both are defined outside this header.
 * NOTE(review): the exact init/fini contract (e.g. whether fini expects an
 * idle timeline) is not visible from here; check i915_timeline.c.
 */
void i915_timeline_init(struct drm_i915_private *i915,
			struct i915_timeline *tl,
			const char *name);
void i915_timeline_fini(struct i915_timeline *tl);
|
|
|
|
static inline void
|
|
i915_timeline_set_subclass(struct i915_timeline *timeline,
|
|
unsigned int subclass)
|
|
{
|
|
lockdep_set_subclass(&timeline->lock, subclass);
|
|
|
|
/*
|
|
* Due to an interesting quirk in lockdep's internal debug tracking,
|
|
* after setting a subclass we must ensure the lock is used. Otherwise,
|
|
* nr_unused_locks is incremented once too often.
|
|
*/
|
|
#ifdef CONFIG_DEBUG_LOCK_ALLOC
|
|
local_irq_disable();
|
|
lock_map_acquire(&timeline->lock.dep_map);
|
|
lock_map_release(&timeline->lock.dep_map);
|
|
local_irq_enable();
|
|
#endif
|
|
}
|
|
|
|
/*
 * Returns a pointer to a timeline for @i915 labelled @name; defined outside
 * this header.
 * NOTE(review): presumably allocates a refcounted timeline that is released
 * with i915_timeline_put(); the error-return convention (NULL vs ERR_PTR)
 * is not visible here and must be checked at the definition.
 */
struct i915_timeline *
i915_timeline_create(struct drm_i915_private *i915, const char *name);
|
|
|
|
static inline struct i915_timeline *
|
|
i915_timeline_get(struct i915_timeline *timeline)
|
|
{
|
|
kref_get(&timeline->kref);
|
|
return timeline;
|
|
}
|
|
|
|
void __i915_timeline_free(struct kref *kref);
|
|
static inline void i915_timeline_put(struct i915_timeline *timeline)
|
|
{
|
|
kref_put(&timeline->kref, __i915_timeline_free);
|
|
}
|
|
|
|
static inline int __i915_timeline_sync_set(struct i915_timeline *tl,
|
|
u64 context, u32 seqno)
|
|
{
|
|
return i915_syncmap_set(&tl->sync, context, seqno);
|
|
}
|
|
|
|
static inline int i915_timeline_sync_set(struct i915_timeline *tl,
|
|
const struct dma_fence *fence)
|
|
{
|
|
return __i915_timeline_sync_set(tl, fence->context, fence->seqno);
|
|
}
|
|
|
|
static inline bool __i915_timeline_sync_is_later(struct i915_timeline *tl,
|
|
u64 context, u32 seqno)
|
|
{
|
|
return i915_syncmap_is_later(&tl->sync, context, seqno);
|
|
}
|
|
|
|
static inline bool i915_timeline_sync_is_later(struct i915_timeline *tl,
|
|
const struct dma_fence *fence)
|
|
{
|
|
return __i915_timeline_sync_is_later(tl, fence->context, fence->seqno);
|
|
}
|
|
|
|
/*
 * Defined outside this header.
 * NOTE(review): presumably called when the driver goes idle to drop the
 * per-timeline sync tracking; confirm at the definition.
 */
void i915_timelines_park(struct drm_i915_private *i915);
|
|
|
|
#endif
|