mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-27 15:25:02 +07:00
72aabfb862
This adds mutex to guard against update of global ppgtt mm LRU list. To resolve error found as below warning. [73130.012162] ------------[ cut here ]------------ [73130.012168] list_add corruption. prev->next should be next (ffff995f970cca50), but was 0000000000000000. (prev=ffff995f0dc5bdf8). [73130.012181] WARNING: CPU: 3 PID: 82 at lib/list_debug.c:28 __list_add_valid+0x4d/0x70 [73130.012183] Modules linked in: btrfs(E) xor(E) zstd_decompress(E) zstd_compress(E) raid6_pq(E) dm_mod(E) kvmgt(E) fuse(E) xt_addrtype(E) nft_compat(E) xt_conntrack(E) nf_nat(E) nf_conntrack(E) nf_defrag_ipv6(E) nf_defrag_ipv4(E) libcrc32c(E) br_netfilter(E) bridge(E) stp(E) llc(E) overlay(E) devlink(E) nf_tables(E) nfnetlink(E) loop(E) x86_pkg_temp_thermal(E) intel_powerclamp(E) coretemp(E) crct10dif_pclmul(E) crc32_pclmul(E) ghash_clmulni_intel(E) mei_me(E) aesni_intel(E) aes_x86_64(E) crypto_simd(E) cryptd(E) glue_helper(E) intel_cstate(E) intel_uncore(E) mei(E) intel_pch_thermal(E) intel_rapl_perf(E) pcspkr(E) iTCO_wdt(E) iTCO_vendor_support(E) idma64(E) sg(E) virt_dma(E) acpi_pad(E) evdev(E) binfmt_misc(E) ip_tables(E) x_tables(E) ipv6(E) autofs4(E) hid_generic(E) usbhid(E) hid(E) ext4(E) crc32c_generic(E) crc16(E) mbcache(E) jbd2(E) fscrypto(E) xhci_pci(E) sdhci_pci(E) cqhci(E) intel_lpss_pci(E) intel_lpss(E) crc32c_intel(E) xhci_hcd(E) sdhci(E) i2c_i801(E) e1000e(E) mmc_core(E) [73130.012218] ptp(E) pps_core(E) usbcore(E) mfd_core(E) sd_mod(E) fan(E) thermal(E) [73130.012227] CPU: 3 PID: 82 Comm: gvt workload 0 Tainted: G W E 5.0.0-rc7-staging-190226+ #282 [73130.012228] Hardware name: /NUC6i5SYB, BIOS SYSKLi35.86A.0039.2016.0316.1747 03/16/2016 [73130.012232] RIP: 0010:__list_add_valid+0x4d/0x70 [73130.012234] Code: c3 48 89 d1 48 c7 c7 e0 82 91 bb 48 89 c2 e8 44 8a cc ff 0f 0b 31 c0 c3 48 89 c1 4c 89 c6 48 c7 c7 30 83 91 bb e8 2d 8a cc ff <0f> 0b 31 c0 c3 48 89 f2 4c 89 c1 48 89 fe 48 c7 c7 80 83 91 bb e8 [73130.012236] RSP: 0018:ffffa4924107fdd0 EFLAGS: 00010286 [73130.012238] RAX: 0000000000000000 RBX: ffff995d8a5ccf00 RCX: 0000000000000006 [73130.012240] RDX: 0000000000000007 RSI: 0000000000000086 RDI: ffff995faad96680 [73130.012241] RBP: 0000000000000000 R08: 0000000000213a28 R09: 0000000000000084 [73130.012243] R10: 0000000000000000 R11: ffffa4924107fc70 R12: ffff995d8a5ccf78 [73130.012245] R13: ffff995f970c8000 R14: ffff995f0dc5bdf8 R15: ffff995f970cca50 [73130.012247] FS: 0000000000000000(0000) GS:ffff995faad80000(0000) knlGS:0000000000000000 [73130.012249] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 [73130.012250] CR2: 00000222e1891000 CR3: 0000000116848002 CR4: 00000000003626e0 [73130.012252] Call Trace: [73130.012258] intel_vgpu_pin_mm+0x7a/0xa0 [73130.012262] workload_thread+0x683/0x12a0 [73130.012266] ? do_wait_intr_irq+0xb0/0xb0 [73130.012269] ? finish_wait+0x80/0x80 [73130.012271] ? intel_vgpu_clean_workloads+0x110/0x110 [73130.012274] kthread+0x116/0x130 [73130.012276] ? kthread_bind+0x30/0x30 [73130.012280] ret_from_fork+0x35/0x40 [73130.012285] WARNING: CPU: 3 PID: 82 at lib/list_debug.c:28 __list_add_valid+0x4d/0x70 [73130.012286] ---[ end trace 458a2e792eec21c0 ]--- v2: - simplify lock handling Reviewed-by: Xiong Zhang <xiong.y.zhang@intel.com> Cc: Xiong Zhang <xiong.y.zhang@intel.com> Signed-off-by: Zhenyu Wang <zhenyuw@linux.intel.com>
281 lines
7.7 KiB
C
281 lines
7.7 KiB
C
/*
|
|
* Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
* SOFTWARE.
|
|
*
|
|
* Authors:
|
|
* Zhi Wang <zhi.a.wang@intel.com>
|
|
* Zhenyu Wang <zhenyuw@linux.intel.com>
|
|
* Xiao Zheng <xiao.zheng@intel.com>
|
|
*
|
|
* Contributors:
|
|
* Min He <min.he@intel.com>
|
|
* Bing Niu <bing.niu@intel.com>
|
|
*
|
|
*/
|
|
|
|
#ifndef _GVT_GTT_H_
|
|
#define _GVT_GTT_H_
|
|
|
|
#define I915_GTT_PAGE_SHIFT 12
|
|
|
|
struct intel_vgpu_mm;
|
|
|
|
#define INTEL_GVT_INVALID_ADDR (~0UL)
|
|
|
|
struct intel_gvt_gtt_entry {
|
|
u64 val64;
|
|
int type;
|
|
};
|
|
|
|
struct intel_gvt_gtt_pte_ops {
|
|
int (*get_entry)(void *pt,
|
|
struct intel_gvt_gtt_entry *e,
|
|
unsigned long index,
|
|
bool hypervisor_access,
|
|
unsigned long gpa,
|
|
struct intel_vgpu *vgpu);
|
|
int (*set_entry)(void *pt,
|
|
struct intel_gvt_gtt_entry *e,
|
|
unsigned long index,
|
|
bool hypervisor_access,
|
|
unsigned long gpa,
|
|
struct intel_vgpu *vgpu);
|
|
bool (*test_present)(struct intel_gvt_gtt_entry *e);
|
|
void (*clear_present)(struct intel_gvt_gtt_entry *e);
|
|
void (*set_present)(struct intel_gvt_gtt_entry *e);
|
|
bool (*test_pse)(struct intel_gvt_gtt_entry *e);
|
|
void (*clear_pse)(struct intel_gvt_gtt_entry *e);
|
|
bool (*test_ips)(struct intel_gvt_gtt_entry *e);
|
|
void (*clear_ips)(struct intel_gvt_gtt_entry *e);
|
|
bool (*test_64k_splited)(struct intel_gvt_gtt_entry *e);
|
|
void (*clear_64k_splited)(struct intel_gvt_gtt_entry *e);
|
|
void (*set_64k_splited)(struct intel_gvt_gtt_entry *e);
|
|
void (*set_pfn)(struct intel_gvt_gtt_entry *e, unsigned long pfn);
|
|
unsigned long (*get_pfn)(struct intel_gvt_gtt_entry *e);
|
|
};
|
|
|
|
struct intel_gvt_gtt_gma_ops {
|
|
unsigned long (*gma_to_ggtt_pte_index)(unsigned long gma);
|
|
unsigned long (*gma_to_pte_index)(unsigned long gma);
|
|
unsigned long (*gma_to_pde_index)(unsigned long gma);
|
|
unsigned long (*gma_to_l3_pdp_index)(unsigned long gma);
|
|
unsigned long (*gma_to_l4_pdp_index)(unsigned long gma);
|
|
unsigned long (*gma_to_pml4_index)(unsigned long gma);
|
|
};
|
|
|
|
struct intel_gvt_gtt {
|
|
struct intel_gvt_gtt_pte_ops *pte_ops;
|
|
struct intel_gvt_gtt_gma_ops *gma_ops;
|
|
int (*mm_alloc_page_table)(struct intel_vgpu_mm *mm);
|
|
void (*mm_free_page_table)(struct intel_vgpu_mm *mm);
|
|
struct list_head oos_page_use_list_head;
|
|
struct list_head oos_page_free_list_head;
|
|
struct mutex ppgtt_mm_lock;
|
|
struct list_head ppgtt_mm_lru_list_head;
|
|
|
|
struct page *scratch_page;
|
|
unsigned long scratch_mfn;
|
|
};
|
|
|
|
typedef enum {
|
|
GTT_TYPE_INVALID = -1,
|
|
|
|
GTT_TYPE_GGTT_PTE,
|
|
|
|
GTT_TYPE_PPGTT_PTE_4K_ENTRY,
|
|
GTT_TYPE_PPGTT_PTE_64K_ENTRY,
|
|
GTT_TYPE_PPGTT_PTE_2M_ENTRY,
|
|
GTT_TYPE_PPGTT_PTE_1G_ENTRY,
|
|
|
|
GTT_TYPE_PPGTT_PTE_ENTRY,
|
|
|
|
GTT_TYPE_PPGTT_PDE_ENTRY,
|
|
GTT_TYPE_PPGTT_PDP_ENTRY,
|
|
GTT_TYPE_PPGTT_PML4_ENTRY,
|
|
|
|
GTT_TYPE_PPGTT_ROOT_ENTRY,
|
|
|
|
GTT_TYPE_PPGTT_ROOT_L3_ENTRY,
|
|
GTT_TYPE_PPGTT_ROOT_L4_ENTRY,
|
|
|
|
GTT_TYPE_PPGTT_ENTRY,
|
|
|
|
GTT_TYPE_PPGTT_PTE_PT,
|
|
GTT_TYPE_PPGTT_PDE_PT,
|
|
GTT_TYPE_PPGTT_PDP_PT,
|
|
GTT_TYPE_PPGTT_PML4_PT,
|
|
|
|
GTT_TYPE_MAX,
|
|
} intel_gvt_gtt_type_t;
|
|
|
|
enum intel_gvt_mm_type {
|
|
INTEL_GVT_MM_GGTT,
|
|
INTEL_GVT_MM_PPGTT,
|
|
};
|
|
|
|
#define GVT_RING_CTX_NR_PDPS GEN8_3LVL_PDPES
|
|
|
|
struct intel_gvt_partial_pte {
|
|
unsigned long offset;
|
|
u64 data;
|
|
struct list_head list;
|
|
};
|
|
|
|
struct intel_vgpu_mm {
|
|
enum intel_gvt_mm_type type;
|
|
struct intel_vgpu *vgpu;
|
|
|
|
struct kref ref;
|
|
atomic_t pincount;
|
|
|
|
union {
|
|
struct {
|
|
intel_gvt_gtt_type_t root_entry_type;
|
|
/*
|
|
* The 4 PDPs in ring context. For 48bit addressing,
|
|
* only PDP0 is valid and point to PML4. For 32it
|
|
* addressing, all 4 are used as true PDPs.
|
|
*/
|
|
u64 guest_pdps[GVT_RING_CTX_NR_PDPS];
|
|
u64 shadow_pdps[GVT_RING_CTX_NR_PDPS];
|
|
bool shadowed;
|
|
|
|
struct list_head list;
|
|
struct list_head lru_list;
|
|
} ppgtt_mm;
|
|
struct {
|
|
void *virtual_ggtt;
|
|
struct list_head partial_pte_list;
|
|
} ggtt_mm;
|
|
};
|
|
};
|
|
|
|
struct intel_vgpu_mm *intel_vgpu_create_ppgtt_mm(struct intel_vgpu *vgpu,
|
|
intel_gvt_gtt_type_t root_entry_type, u64 pdps[]);
|
|
|
|
static inline void intel_vgpu_mm_get(struct intel_vgpu_mm *mm)
|
|
{
|
|
kref_get(&mm->ref);
|
|
}
|
|
|
|
void _intel_vgpu_mm_release(struct kref *mm_ref);
|
|
|
|
static inline void intel_vgpu_mm_put(struct intel_vgpu_mm *mm)
|
|
{
|
|
kref_put(&mm->ref, _intel_vgpu_mm_release);
|
|
}
|
|
|
|
static inline void intel_vgpu_destroy_mm(struct intel_vgpu_mm *mm)
|
|
{
|
|
intel_vgpu_mm_put(mm);
|
|
}
|
|
|
|
struct intel_vgpu_guest_page;
|
|
|
|
struct intel_vgpu_scratch_pt {
|
|
struct page *page;
|
|
unsigned long page_mfn;
|
|
};
|
|
|
|
struct intel_vgpu_gtt {
|
|
struct intel_vgpu_mm *ggtt_mm;
|
|
unsigned long active_ppgtt_mm_bitmap;
|
|
struct list_head ppgtt_mm_list_head;
|
|
struct radix_tree_root spt_tree;
|
|
struct list_head oos_page_list_head;
|
|
struct list_head post_shadow_list_head;
|
|
struct intel_vgpu_scratch_pt scratch_pt[GTT_TYPE_MAX];
|
|
};
|
|
|
|
extern int intel_vgpu_init_gtt(struct intel_vgpu *vgpu);
|
|
extern void intel_vgpu_clean_gtt(struct intel_vgpu *vgpu);
|
|
void intel_vgpu_reset_ggtt(struct intel_vgpu *vgpu, bool invalidate_old);
|
|
void intel_vgpu_invalidate_ppgtt(struct intel_vgpu *vgpu);
|
|
|
|
extern int intel_gvt_init_gtt(struct intel_gvt *gvt);
|
|
void intel_vgpu_reset_gtt(struct intel_vgpu *vgpu);
|
|
extern void intel_gvt_clean_gtt(struct intel_gvt *gvt);
|
|
|
|
extern struct intel_vgpu_mm *intel_gvt_find_ppgtt_mm(struct intel_vgpu *vgpu,
|
|
int page_table_level, void *root_entry);
|
|
|
|
struct intel_vgpu_oos_page {
|
|
struct intel_vgpu_ppgtt_spt *spt;
|
|
struct list_head list;
|
|
struct list_head vm_list;
|
|
int id;
|
|
unsigned char mem[I915_GTT_PAGE_SIZE];
|
|
};
|
|
|
|
#define GTT_ENTRY_NUM_IN_ONE_PAGE 512
|
|
|
|
/* Represent a vgpu shadow page table. */
|
|
struct intel_vgpu_ppgtt_spt {
|
|
atomic_t refcount;
|
|
struct intel_vgpu *vgpu;
|
|
|
|
struct {
|
|
intel_gvt_gtt_type_t type;
|
|
bool pde_ips; /* for 64KB PTEs */
|
|
void *vaddr;
|
|
struct page *page;
|
|
unsigned long mfn;
|
|
} shadow_page;
|
|
|
|
struct {
|
|
intel_gvt_gtt_type_t type;
|
|
bool pde_ips; /* for 64KB PTEs */
|
|
unsigned long gfn;
|
|
unsigned long write_cnt;
|
|
struct intel_vgpu_oos_page *oos_page;
|
|
} guest_page;
|
|
|
|
DECLARE_BITMAP(post_shadow_bitmap, GTT_ENTRY_NUM_IN_ONE_PAGE);
|
|
struct list_head post_shadow_list;
|
|
};
|
|
|
|
int intel_vgpu_sync_oos_pages(struct intel_vgpu *vgpu);
|
|
|
|
int intel_vgpu_flush_post_shadow(struct intel_vgpu *vgpu);
|
|
|
|
int intel_vgpu_pin_mm(struct intel_vgpu_mm *mm);
|
|
|
|
void intel_vgpu_unpin_mm(struct intel_vgpu_mm *mm);
|
|
|
|
unsigned long intel_vgpu_gma_to_gpa(struct intel_vgpu_mm *mm,
|
|
unsigned long gma);
|
|
|
|
struct intel_vgpu_mm *intel_vgpu_find_ppgtt_mm(struct intel_vgpu *vgpu,
|
|
u64 pdps[]);
|
|
|
|
struct intel_vgpu_mm *intel_vgpu_get_ppgtt_mm(struct intel_vgpu *vgpu,
|
|
intel_gvt_gtt_type_t root_entry_type, u64 pdps[]);
|
|
|
|
int intel_vgpu_put_ppgtt_mm(struct intel_vgpu *vgpu, u64 pdps[]);
|
|
|
|
int intel_vgpu_emulate_ggtt_mmio_read(struct intel_vgpu *vgpu,
|
|
unsigned int off, void *p_data, unsigned int bytes);
|
|
|
|
int intel_vgpu_emulate_ggtt_mmio_write(struct intel_vgpu *vgpu,
|
|
unsigned int off, void *p_data, unsigned int bytes);
|
|
|
|
#endif /* _GVT_GTT_H_ */
|