mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-27 21:26:27 +07:00
ece276de2a
MAC2008 means the processor implemented IEEE754 style Fused MADD instruction. It was introduced in Release3 but removed in Release5. The toolchain support of MAC2008 have never landed except for Loongson processors. This patch aimed to disabled the MAC2008 if it's optional. For MAC2008 only processors, we corrected math-emu behavior to align with actual hardware behavior. Signed-off-by: Jiaxun Yang <jiaxun.yang@flygoat.com> [paulburton@kernel.org: Fixup MIPSr2-r5 check in cpu_set_fpu_2008.] Signed-off-by: Paul Burton <paulburton@kernel.org> Cc: linux-mips@vger.kernel.org Cc: chenhc@lemote.com Cc: paul.burton@mips.com Cc: linux-kernel@vger.kernel.org
312 lines
9.8 KiB
C
312 lines
9.8 KiB
C
/* SPDX-License-Identifier: GPL-2.0-only */
|
|
/*
|
|
* MIPS floating point support
|
|
* Copyright (C) 1994-2000 Algorithmics Ltd.
|
|
*
|
|
* Nov 7, 2000
|
|
* Modification to allow integration with Linux kernel
|
|
*
|
|
* Kevin D. Kissell, kevink@mips.com and Carsten Langgard, carstenl@mips.com
|
|
* Copyright (C) 2000 MIPS Technologies, Inc. All rights reserved.
|
|
*/
|
|
#ifndef __ARCH_MIPS_MATH_EMU_IEEE754_H
|
|
#define __ARCH_MIPS_MATH_EMU_IEEE754_H
|
|
|
|
#include <linux/compiler.h>
|
|
#include <asm/byteorder.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/types.h>
|
|
#include <linux/sched.h>
|
|
#include <asm/bitfield.h>
|
|
|
|
union ieee754dp {
|
|
struct {
|
|
__BITFIELD_FIELD(unsigned int sign:1,
|
|
__BITFIELD_FIELD(unsigned int bexp:11,
|
|
__BITFIELD_FIELD(u64 mant:52,
|
|
;)))
|
|
};
|
|
u64 bits;
|
|
};
|
|
|
|
union ieee754sp {
|
|
struct {
|
|
__BITFIELD_FIELD(unsigned sign:1,
|
|
__BITFIELD_FIELD(unsigned bexp:8,
|
|
__BITFIELD_FIELD(unsigned mant:23,
|
|
;)))
|
|
};
|
|
u32 bits;
|
|
};
|
|
|
|
/*
|
|
* single precision (often aka float)
|
|
*/
|
|
int ieee754sp_class(union ieee754sp x);
|
|
|
|
union ieee754sp ieee754sp_abs(union ieee754sp x);
|
|
union ieee754sp ieee754sp_neg(union ieee754sp x);
|
|
|
|
union ieee754sp ieee754sp_add(union ieee754sp x, union ieee754sp y);
|
|
union ieee754sp ieee754sp_sub(union ieee754sp x, union ieee754sp y);
|
|
union ieee754sp ieee754sp_mul(union ieee754sp x, union ieee754sp y);
|
|
union ieee754sp ieee754sp_div(union ieee754sp x, union ieee754sp y);
|
|
|
|
union ieee754sp ieee754sp_fint(int x);
|
|
union ieee754sp ieee754sp_flong(s64 x);
|
|
union ieee754sp ieee754sp_fdp(union ieee754dp x);
|
|
union ieee754sp ieee754sp_rint(union ieee754sp x);
|
|
|
|
int ieee754sp_tint(union ieee754sp x);
|
|
s64 ieee754sp_tlong(union ieee754sp x);
|
|
|
|
int ieee754sp_cmp(union ieee754sp x, union ieee754sp y, int cop, int sig);
|
|
|
|
union ieee754sp ieee754sp_sqrt(union ieee754sp x);
|
|
|
|
union ieee754sp ieee754sp_maddf(union ieee754sp z, union ieee754sp x,
|
|
union ieee754sp y);
|
|
union ieee754sp ieee754sp_msubf(union ieee754sp z, union ieee754sp x,
|
|
union ieee754sp y);
|
|
union ieee754sp ieee754sp_madd(union ieee754sp z, union ieee754sp x,
|
|
union ieee754sp y);
|
|
union ieee754sp ieee754sp_msub(union ieee754sp z, union ieee754sp x,
|
|
union ieee754sp y);
|
|
union ieee754sp ieee754sp_nmadd(union ieee754sp z, union ieee754sp x,
|
|
union ieee754sp y);
|
|
union ieee754sp ieee754sp_nmsub(union ieee754sp z, union ieee754sp x,
|
|
union ieee754sp y);
|
|
int ieee754sp_2008class(union ieee754sp x);
|
|
union ieee754sp ieee754sp_fmin(union ieee754sp x, union ieee754sp y);
|
|
union ieee754sp ieee754sp_fmina(union ieee754sp x, union ieee754sp y);
|
|
union ieee754sp ieee754sp_fmax(union ieee754sp x, union ieee754sp y);
|
|
union ieee754sp ieee754sp_fmaxa(union ieee754sp x, union ieee754sp y);
|
|
|
|
/*
|
|
* double precision (often aka double)
|
|
*/
|
|
int ieee754dp_class(union ieee754dp x);
|
|
|
|
union ieee754dp ieee754dp_add(union ieee754dp x, union ieee754dp y);
|
|
union ieee754dp ieee754dp_sub(union ieee754dp x, union ieee754dp y);
|
|
union ieee754dp ieee754dp_mul(union ieee754dp x, union ieee754dp y);
|
|
union ieee754dp ieee754dp_div(union ieee754dp x, union ieee754dp y);
|
|
|
|
union ieee754dp ieee754dp_abs(union ieee754dp x);
|
|
union ieee754dp ieee754dp_neg(union ieee754dp x);
|
|
|
|
union ieee754dp ieee754dp_fint(int x);
|
|
union ieee754dp ieee754dp_flong(s64 x);
|
|
union ieee754dp ieee754dp_fsp(union ieee754sp x);
|
|
union ieee754dp ieee754dp_rint(union ieee754dp x);
|
|
|
|
int ieee754dp_tint(union ieee754dp x);
|
|
s64 ieee754dp_tlong(union ieee754dp x);
|
|
|
|
int ieee754dp_cmp(union ieee754dp x, union ieee754dp y, int cop, int sig);
|
|
|
|
union ieee754dp ieee754dp_sqrt(union ieee754dp x);
|
|
|
|
union ieee754dp ieee754dp_maddf(union ieee754dp z, union ieee754dp x,
|
|
union ieee754dp y);
|
|
union ieee754dp ieee754dp_msubf(union ieee754dp z, union ieee754dp x,
|
|
union ieee754dp y);
|
|
union ieee754dp ieee754dp_madd(union ieee754dp z, union ieee754dp x,
|
|
union ieee754dp y);
|
|
union ieee754dp ieee754dp_msub(union ieee754dp z, union ieee754dp x,
|
|
union ieee754dp y);
|
|
union ieee754dp ieee754dp_nmadd(union ieee754dp z, union ieee754dp x,
|
|
union ieee754dp y);
|
|
union ieee754dp ieee754dp_nmsub(union ieee754dp z, union ieee754dp x,
|
|
union ieee754dp y);
|
|
int ieee754dp_2008class(union ieee754dp x);
|
|
union ieee754dp ieee754dp_fmin(union ieee754dp x, union ieee754dp y);
|
|
union ieee754dp ieee754dp_fmina(union ieee754dp x, union ieee754dp y);
|
|
union ieee754dp ieee754dp_fmax(union ieee754dp x, union ieee754dp y);
|
|
union ieee754dp ieee754dp_fmaxa(union ieee754dp x, union ieee754dp y);
|
|
|
|
|
|
/* 5 types of floating point number
|
|
*/
|
|
enum {
|
|
IEEE754_CLASS_NORM = 0x00,
|
|
IEEE754_CLASS_ZERO = 0x01,
|
|
IEEE754_CLASS_DNORM = 0x02,
|
|
IEEE754_CLASS_INF = 0x03,
|
|
IEEE754_CLASS_SNAN = 0x04,
|
|
IEEE754_CLASS_QNAN = 0x05,
|
|
};
|
|
|
|
/* exception numbers */
|
|
#define IEEE754_INEXACT 0x01
|
|
#define IEEE754_UNDERFLOW 0x02
|
|
#define IEEE754_OVERFLOW 0x04
|
|
#define IEEE754_ZERO_DIVIDE 0x08
|
|
#define IEEE754_INVALID_OPERATION 0x10
|
|
|
|
/* cmp operators
|
|
*/
|
|
#define IEEE754_CLT 0x01
|
|
#define IEEE754_CEQ 0x02
|
|
#define IEEE754_CGT 0x04
|
|
#define IEEE754_CUN 0x08
|
|
|
|
/*
|
|
* The control status register
|
|
*/
|
|
struct _ieee754_csr {
|
|
__BITFIELD_FIELD(unsigned fcc:7, /* condition[7:1] */
|
|
__BITFIELD_FIELD(unsigned nod:1, /* set 1 for no denormals */
|
|
__BITFIELD_FIELD(unsigned c:1, /* condition[0] */
|
|
__BITFIELD_FIELD(unsigned pad0:3,
|
|
__BITFIELD_FIELD(unsigned abs2008:1, /* IEEE 754-2008 ABS/NEG.fmt */
|
|
__BITFIELD_FIELD(unsigned nan2008:1, /* IEEE 754-2008 NaN mode */
|
|
__BITFIELD_FIELD(unsigned cx:6, /* exceptions this operation */
|
|
__BITFIELD_FIELD(unsigned mx:5, /* exception enable mask */
|
|
__BITFIELD_FIELD(unsigned sx:5, /* exceptions total */
|
|
__BITFIELD_FIELD(unsigned rm:2, /* current rounding mode */
|
|
;))))))))))
|
|
};
|
|
#define ieee754_csr (*(struct _ieee754_csr *)(¤t->thread.fpu.fcr31))
|
|
|
|
static inline unsigned int ieee754_getrm(void)
|
|
{
|
|
return (ieee754_csr.rm);
|
|
}
|
|
|
|
static inline unsigned int ieee754_setrm(unsigned int rm)
|
|
{
|
|
return (ieee754_csr.rm = rm);
|
|
}
|
|
|
|
/*
|
|
* get current exceptions
|
|
*/
|
|
static inline unsigned int ieee754_getcx(void)
|
|
{
|
|
return (ieee754_csr.cx);
|
|
}
|
|
|
|
/* test for current exception condition
|
|
*/
|
|
static inline int ieee754_cxtest(unsigned int n)
|
|
{
|
|
return (ieee754_csr.cx & n);
|
|
}
|
|
|
|
/*
|
|
* get sticky exceptions
|
|
*/
|
|
static inline unsigned int ieee754_getsx(void)
|
|
{
|
|
return (ieee754_csr.sx);
|
|
}
|
|
|
|
/* clear sticky conditions
|
|
*/
|
|
static inline unsigned int ieee754_clrsx(void)
|
|
{
|
|
return (ieee754_csr.sx = 0);
|
|
}
|
|
|
|
/* test for sticky exception condition
|
|
*/
|
|
static inline int ieee754_sxtest(unsigned int n)
|
|
{
|
|
return (ieee754_csr.sx & n);
|
|
}
|
|
|
|
/* debugging */
|
|
union ieee754sp ieee754sp_dump(char *s, union ieee754sp x);
|
|
union ieee754dp ieee754dp_dump(char *s, union ieee754dp x);
|
|
|
|
#define IEEE754_SPCVAL_PZERO 0 /* +0.0 */
|
|
#define IEEE754_SPCVAL_NZERO 1 /* -0.0 */
|
|
#define IEEE754_SPCVAL_PONE 2 /* +1.0 */
|
|
#define IEEE754_SPCVAL_NONE 3 /* -1.0 */
|
|
#define IEEE754_SPCVAL_PTEN 4 /* +10.0 */
|
|
#define IEEE754_SPCVAL_NTEN 5 /* -10.0 */
|
|
#define IEEE754_SPCVAL_PINFINITY 6 /* +inf */
|
|
#define IEEE754_SPCVAL_NINFINITY 7 /* -inf */
|
|
#define IEEE754_SPCVAL_INDEF_LEG 8 /* legacy quiet NaN */
|
|
#define IEEE754_SPCVAL_INDEF_2008 9 /* IEEE 754-2008 quiet NaN */
|
|
#define IEEE754_SPCVAL_PMAX 10 /* +max norm */
|
|
#define IEEE754_SPCVAL_NMAX 11 /* -max norm */
|
|
#define IEEE754_SPCVAL_PMIN 12 /* +min norm */
|
|
#define IEEE754_SPCVAL_NMIN 13 /* -min norm */
|
|
#define IEEE754_SPCVAL_PMIND 14 /* +min denorm */
|
|
#define IEEE754_SPCVAL_NMIND 15 /* -min denorm */
|
|
#define IEEE754_SPCVAL_P1E31 16 /* + 1.0e31 */
|
|
#define IEEE754_SPCVAL_P1E63 17 /* + 1.0e63 */
|
|
|
|
extern const union ieee754dp __ieee754dp_spcvals[];
|
|
extern const union ieee754sp __ieee754sp_spcvals[];
|
|
#define ieee754dp_spcvals ((const union ieee754dp *)__ieee754dp_spcvals)
|
|
#define ieee754sp_spcvals ((const union ieee754sp *)__ieee754sp_spcvals)
|
|
|
|
/*
|
|
* Return infinity with given sign
|
|
*/
|
|
#define ieee754dp_inf(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
|
|
#define ieee754dp_zero(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
|
|
#define ieee754dp_one(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
|
|
#define ieee754dp_ten(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
|
|
#define ieee754dp_indef() (ieee754dp_spcvals[IEEE754_SPCVAL_INDEF_LEG + \
|
|
ieee754_csr.nan2008])
|
|
#define ieee754dp_max(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
|
|
#define ieee754dp_min(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
|
|
#define ieee754dp_mind(sn) (ieee754dp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
|
|
#define ieee754dp_1e31() (ieee754dp_spcvals[IEEE754_SPCVAL_P1E31])
|
|
#define ieee754dp_1e63() (ieee754dp_spcvals[IEEE754_SPCVAL_P1E63])
|
|
|
|
#define ieee754sp_inf(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
|
|
#define ieee754sp_zero(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
|
|
#define ieee754sp_one(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
|
|
#define ieee754sp_ten(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
|
|
#define ieee754sp_indef() (ieee754sp_spcvals[IEEE754_SPCVAL_INDEF_LEG + \
|
|
ieee754_csr.nan2008])
|
|
#define ieee754sp_max(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
|
|
#define ieee754sp_min(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
|
|
#define ieee754sp_mind(sn) (ieee754sp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
|
|
#define ieee754sp_1e31() (ieee754sp_spcvals[IEEE754_SPCVAL_P1E31])
|
|
#define ieee754sp_1e63() (ieee754sp_spcvals[IEEE754_SPCVAL_P1E63])
|
|
|
|
/*
|
|
* Indefinite integer value
|
|
*/
|
|
static inline int ieee754si_indef(void)
|
|
{
|
|
return ieee754_csr.nan2008 ? 0 : INT_MAX;
|
|
}
|
|
|
|
static inline s64 ieee754di_indef(void)
|
|
{
|
|
return ieee754_csr.nan2008 ? 0 : S64_MAX;
|
|
}
|
|
|
|
/*
|
|
* Overflow integer value
|
|
*/
|
|
static inline int ieee754si_overflow(int xs)
|
|
{
|
|
return ieee754_csr.nan2008 && xs ? INT_MIN : INT_MAX;
|
|
}
|
|
|
|
static inline s64 ieee754di_overflow(int xs)
|
|
{
|
|
return ieee754_csr.nan2008 && xs ? S64_MIN : S64_MAX;
|
|
}
|
|
|
|
/* result types for xctx.rt */
|
|
#define IEEE754_RT_SP 0
|
|
#define IEEE754_RT_DP 1
|
|
#define IEEE754_RT_XP 2
|
|
#define IEEE754_RT_SI 3
|
|
#define IEEE754_RT_DI 4
|
|
|
|
/* compat */
|
|
#define ieee754dp_fix(x) ieee754dp_tint(x)
|
|
#define ieee754sp_fix(x) ieee754sp_tint(x)
|
|
|
|
#endif /* __ARCH_MIPS_MATH_EMU_IEEE754_H */
|