mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2025-01-27 18:41:56 +07:00
bb620c3d39
In iperf experiments running linux as the Tx side (TCP client) with 10 threads results in a severe performance drop when TSO is disabled, indicating a weakness in the software that can be avoided by using the scalable IOMMU arena DMA allocation. Baseline numbers before this patch: with default settings (TSO enabled) : 9-9.5 Gbps Disable TSO using ethtool- drops badly: 2-3 Gbps. After this patch, iperf client with 10 threads, can give a throughput of at least 8.5 Gbps, even when TSO is disabled. Signed-off-by: Sowmini Varadhan <sowmini.varadhan@oracle.com> Acked-by: Benjamin Herrenschmidt <benh@kernel.crashing.org> Signed-off-by: David S. Miller <davem@davemloft.net>
65 lines
1.8 KiB
C
65 lines
1.8 KiB
C
/* iommu.h: Definitions for the sun5 IOMMU.
|
|
*
|
|
* Copyright (C) 1996, 1999, 2007 David S. Miller (davem@davemloft.net)
|
|
*/
|
|
#ifndef _SPARC64_IOMMU_H
|
|
#define _SPARC64_IOMMU_H
|
|
|
|
/* The format of an iopte in the page tables. */
|
|
#define IOPTE_VALID 0x8000000000000000UL
|
|
#define IOPTE_64K 0x2000000000000000UL
|
|
#define IOPTE_STBUF 0x1000000000000000UL
|
|
#define IOPTE_INTRA 0x0800000000000000UL
|
|
#define IOPTE_CONTEXT 0x07ff800000000000UL
|
|
#define IOPTE_PAGE 0x00007fffffffe000UL
|
|
#define IOPTE_CACHE 0x0000000000000010UL
|
|
#define IOPTE_WRITE 0x0000000000000002UL
|
|
|
|
#define IOMMU_NUM_CTXS 4096
|
|
#include <linux/iommu-common.h>
|
|
|
|
struct iommu_arena {
|
|
unsigned long *map;
|
|
unsigned int hint;
|
|
unsigned int limit;
|
|
};
|
|
|
|
struct iommu {
|
|
struct iommu_map_table tbl;
|
|
spinlock_t lock;
|
|
u32 dma_addr_mask;
|
|
iopte_t *page_table;
|
|
unsigned long iommu_control;
|
|
unsigned long iommu_tsbbase;
|
|
unsigned long iommu_flush;
|
|
unsigned long iommu_flushinv;
|
|
unsigned long iommu_tags;
|
|
unsigned long iommu_ctxflush;
|
|
unsigned long write_complete_reg;
|
|
unsigned long dummy_page;
|
|
unsigned long dummy_page_pa;
|
|
unsigned long ctx_lowest_free;
|
|
DECLARE_BITMAP(ctx_bitmap, IOMMU_NUM_CTXS);
|
|
};
|
|
|
|
struct strbuf {
|
|
int strbuf_enabled;
|
|
unsigned long strbuf_control;
|
|
unsigned long strbuf_pflush;
|
|
unsigned long strbuf_fsync;
|
|
unsigned long strbuf_err_stat;
|
|
unsigned long strbuf_tag_diag;
|
|
unsigned long strbuf_line_diag;
|
|
unsigned long strbuf_ctxflush;
|
|
unsigned long strbuf_ctxmatch_base;
|
|
unsigned long strbuf_flushflag_pa;
|
|
volatile unsigned long *strbuf_flushflag;
|
|
volatile unsigned long __flushflag_buf[(64+(64-1)) / sizeof(long)];
|
|
};
|
|
|
|
int iommu_table_init(struct iommu *iommu, int tsbsize,
|
|
u32 dma_offset, u32 dma_addr_mask,
|
|
int numa_node);
|
|
|
|
#endif /* !(_SPARC64_IOMMU_H) */
|