mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-25 15:00:17 +07:00
479 lines
11 KiB
ArmAsm
479 lines
11 KiB
ArmAsm
|
/*
|
||
|
* fp_scan.S
|
||
|
*
|
||
|
* Copyright Roman Zippel, 1997. All rights reserved.
|
||
|
*
|
||
|
* Redistribution and use in source and binary forms, with or without
|
||
|
* modification, are permitted provided that the following conditions
|
||
|
* are met:
|
||
|
* 1. Redistributions of source code must retain the above copyright
|
||
|
* notice, and the entire permission notice in its entirety,
|
||
|
* including the disclaimer of warranties.
|
||
|
* 2. Redistributions in binary form must reproduce the above copyright
|
||
|
* notice, this list of conditions and the following disclaimer in the
|
||
|
* documentation and/or other materials provided with the distribution.
|
||
|
* 3. The name of the author may not be used to endorse or promote
|
||
|
* products derived from this software without specific prior
|
||
|
* written permission.
|
||
|
*
|
||
|
* ALTERNATIVELY, this product may be distributed under the terms of
|
||
|
* the GNU General Public License, in which case the provisions of the GPL are
|
||
|
* required INSTEAD OF the above restrictions. (This clause is
|
||
|
* necessary due to a potential bad interaction between the GPL and
|
||
|
* the restrictions contained in a BSD-style copyright.)
|
||
|
*
|
||
|
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
|
||
|
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
||
|
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||
|
* DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
|
||
|
* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
||
|
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
||
|
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
||
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
|
||
|
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
||
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
|
||
|
* OF THE POSSIBILITY OF SUCH DAMAGE.
|
||
|
*/
|
||
|
|
||
|
#include "fp_emu.h"
|
||
|
#include "fp_decode.h"
|
||
|
|
||
|
.globl fp_scan, fp_datasize
|
||
|
|
||
|
.data
|
||
|
|
||
|
| %d2 - first two instr words
|
||
|
| %d1 - operand size
|
||
|
|
||
|
/* operand formats are:
|
||
|
|
||
|
Long = 0, i.e. fmove.l
|
||
|
Single, i.e. fmove.s
|
||
|
Extended, i.e. fmove.x
|
||
|
Packed-BCD, i.e. fmove.p
|
||
|
Word, i.e. fmove.w
|
||
|
Double, i.e. fmove.d
|
||
|
*/
|
||
|
|
||
|
.text
|
||
|
|
||
|
| On entry:
|
||
|
| FPDATA - base of emulated FPU registers
|
||
|
|
||
|
fp_scan:
|
||
|
| normal fpu instruction? (this excludes fsave/frestore)
|
||
|
fp_get_pc %a0
|
||
|
printf PDECODE,"%08x: ",1,%a0
|
||
|
getuser.b (%a0),%d0,fp_err_ua1,%a0
|
||
|
#if 1
|
||
|
cmp.b #0xf2,%d0 | cpid = 1
|
||
|
#else
|
||
|
cmp.b #0xfc,%d0 | cpid = 6
|
||
|
#endif
|
||
|
jne fp_nonstd
|
||
|
| first two instruction words are kept in %d2
|
||
|
getuser.l (%a0)+,%d2,fp_err_ua1,%a0
|
||
|
fp_put_pc %a0
|
||
|
fp_decode_cond: | separate conditional instr
|
||
|
fp_decode_cond_instr_type
|
||
|
|
||
|
.long fp_decode_move, fp_fscc
|
||
|
.long fp_fbccw, fp_fbccl
|
||
|
|
||
|
fp_decode_move: | separate move instr
|
||
|
fp_decode_move_instr_type
|
||
|
|
||
|
.long fp_fgen_fp, fp_ill
|
||
|
.long fp_fgen_ea, fp_fmove_fp2mem
|
||
|
.long fp_fmovem_cr, fp_fmovem_cr
|
||
|
.long fp_fmovem_fp, fp_fmovem_fp
|
||
|
|
||
|
| now all arithmetic instr and a few move instr are left
|
||
|
fp_fgen_fp: | source is a fpu register
|
||
|
clr.b (FPD_FPSR+2,FPDATA) | clear the exception byte
|
||
|
fp_decode_sourcespec
|
||
|
printf PDECODE,"f<op>.x fp%d",1,%d0
|
||
|
fp_get_fp_reg
|
||
|
lea (FPD_TEMPFP1,FPDATA),%a1 | copy src into a temp location
|
||
|
move.l (%a0)+,(%a1)+
|
||
|
move.l (%a0)+,(%a1)+
|
||
|
move.l (%a0),(%a1)
|
||
|
lea (-8,%a1),%a0
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_fgen_ea: | source is <ea>
|
||
|
clr.b (FPD_FPSR+2,FPDATA) | clear the exception byte
|
||
|
| sort out fmovecr, keep data size in %d1
|
||
|
fp_decode_sourcespec
|
||
|
cmp.w #7,%d0
|
||
|
jeq fp_fmovecr
|
||
|
move.w %d0,%d1 | store data size twice in %d1
|
||
|
swap %d1 | one can be trashed below
|
||
|
move.w %d0,%d1
|
||
|
#ifdef FPU_EMU_DEBUG
|
||
|
lea 0f,%a0
|
||
|
clr.l %d0
|
||
|
move.b (%a0,%d1.w),%d0
|
||
|
printf PDECODE,"f<op>.%c ",1,%d0
|
||
|
|
||
|
.data
|
||
|
0: .byte 'l','s','x','p','w','d','b',0
|
||
|
.previous
|
||
|
#endif
|
||
|
|
||
|
/*
|
||
|
fp_getsource, fp_getdest
|
||
|
|
||
|
basically, we end up with a pointer to the source operand in
|
||
|
%a1, and a pointer to the destination operand in %a0. both
|
||
|
are, of course, 96-bit extended floating point numbers.
|
||
|
*/
|
||
|
|
||
|
fp_getsource:
|
||
|
| decode addressing mode for source
|
||
|
fp_decode_addr_mode
|
||
|
|
||
|
.long fp_data, fp_ill
|
||
|
.long fp_indirect, fp_postinc
|
||
|
.long fp_predecr, fp_disp16
|
||
|
.long fp_extmode0, fp_extmode1
|
||
|
|
||
|
| addressing mode: data register direct
|
||
|
fp_data:
|
||
|
fp_mode_data_direct
|
||
|
jsr fp_get_data_reg
|
||
|
lea (FPD_TEMPFP1,FPDATA),%a0
|
||
|
jmp ([0f:w,%pc,%d1.w*4])
|
||
|
|
||
|
.align 4
|
||
|
0:
|
||
|
.long fp_data_long, fp_data_single
|
||
|
.long fp_ill, fp_ill
|
||
|
.long fp_data_word, fp_ill
|
||
|
.long fp_data_byte, fp_ill
|
||
|
|
||
|
| data types that fit in an integer data register
|
||
|
fp_data_byte:
|
||
|
extb.l %d0
|
||
|
jra fp_data_long
|
||
|
|
||
|
fp_data_word:
|
||
|
ext.l %d0
|
||
|
|
||
|
fp_data_long:
|
||
|
jsr fp_conv_long2ext
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_data_single:
|
||
|
jsr fp_conv_single2ext
|
||
|
jra fp_getdest
|
||
|
|
||
|
| addressing mode: address register indirect
|
||
|
fp_indirect:
|
||
|
fp_mode_addr_indirect
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| addressing mode: address register indirect with postincrement
|
||
|
fp_postinc:
|
||
|
fp_mode_addr_indirect_postinc
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| addressing mode: address register indirect with predecrement
|
||
|
fp_predecr:
|
||
|
fp_mode_addr_indirect_predec
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| addressing mode: address register/programm counter indirect
|
||
|
| with 16bit displacement
|
||
|
fp_disp16:
|
||
|
fp_mode_addr_indirect_disp16
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| all other indirect addressing modes will finally end up here
|
||
|
fp_extmode0:
|
||
|
fp_mode_addr_indirect_extmode0
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| all pc relative addressing modes and immediate/absolute modes end up here
|
||
|
| the first ones are sent to fp_extmode0 or fp_disp16
|
||
|
| and only the latter are handled here
|
||
|
fp_extmode1:
|
||
|
fp_decode_addr_reg
|
||
|
jmp ([0f:w,%pc,%d0*4])
|
||
|
|
||
|
.align 4
|
||
|
0:
|
||
|
.long fp_abs_short, fp_abs_long
|
||
|
.long fp_disp16, fp_extmode0
|
||
|
.long fp_immediate, fp_ill
|
||
|
.long fp_ill, fp_ill
|
||
|
|
||
|
| addressing mode: absolute short
|
||
|
fp_abs_short:
|
||
|
fp_mode_abs_short
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| addressing mode: absolute long
|
||
|
fp_abs_long:
|
||
|
fp_mode_abs_long
|
||
|
jra fp_fetchsource
|
||
|
|
||
|
| addressing mode: immediate data
|
||
|
fp_immediate:
|
||
|
printf PDECODE,"#"
|
||
|
fp_get_pc %a0
|
||
|
move.w (fp_datasize,%d1.w*2),%d0
|
||
|
addq.w #1,%d0
|
||
|
and.w #-2,%d0
|
||
|
#ifdef FPU_EMU_DEBUG
|
||
|
movem.l %d0/%d1,-(%sp)
|
||
|
movel %a0,%a1
|
||
|
clr.l %d1
|
||
|
jra 2f
|
||
|
1: getuser.b (%a1)+,%d1,fp_err_ua1,%a1
|
||
|
printf PDECODE,"%02x",1,%d1
|
||
|
2: dbra %d0,1b
|
||
|
movem.l (%sp)+,%d0/%d1
|
||
|
#endif
|
||
|
lea (%a0,%d0.w),%a1
|
||
|
fp_put_pc %a1
|
||
|
| jra fp_fetchsource
|
||
|
|
||
|
fp_fetchsource:
|
||
|
move.l %a0,%a1
|
||
|
swap %d1
|
||
|
lea (FPD_TEMPFP1,FPDATA),%a0
|
||
|
jmp ([0f:w,%pc,%d1.w*4])
|
||
|
|
||
|
.align 4
|
||
|
0: .long fp_long, fp_single
|
||
|
.long fp_ext, fp_pack
|
||
|
.long fp_word, fp_double
|
||
|
.long fp_byte, fp_ill
|
||
|
|
||
|
fp_long:
|
||
|
getuser.l (%a1),%d0,fp_err_ua1,%a1
|
||
|
jsr fp_conv_long2ext
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_single:
|
||
|
getuser.l (%a1),%d0,fp_err_ua1,%a1
|
||
|
jsr fp_conv_single2ext
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_ext:
|
||
|
getuser.l (%a1)+,%d0,fp_err_ua1,%a1
|
||
|
lsr.l #8,%d0
|
||
|
lsr.l #7,%d0
|
||
|
lsr.w #1,%d0
|
||
|
move.l %d0,(%a0)+
|
||
|
getuser.l (%a1)+,%d0,fp_err_ua1,%a1
|
||
|
move.l %d0,(%a0)+
|
||
|
getuser.l (%a1),%d0,fp_err_ua1,%a1
|
||
|
move.l %d0,(%a0)
|
||
|
subq.l #8,%a0
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_pack:
|
||
|
/* not supported yet */
|
||
|
jra fp_ill
|
||
|
|
||
|
fp_word:
|
||
|
getuser.w (%a1),%d0,fp_err_ua1,%a1
|
||
|
ext.l %d0
|
||
|
jsr fp_conv_long2ext
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_double:
|
||
|
jsr fp_conv_double2ext
|
||
|
jra fp_getdest
|
||
|
|
||
|
fp_byte:
|
||
|
getuser.b (%a1),%d0,fp_err_ua1,%a1
|
||
|
extb.l %d0
|
||
|
jsr fp_conv_long2ext
|
||
|
| jra fp_getdest
|
||
|
|
||
|
fp_getdest:
|
||
|
move.l %a0,%a1
|
||
|
bfextu %d2{#22,#3},%d0
|
||
|
printf PDECODE,",fp%d\n",1,%d0
|
||
|
fp_get_fp_reg
|
||
|
movem.l %a0/%a1,-(%sp)
|
||
|
pea fp_finalrounding
|
||
|
bfextu %d2{#25,#7},%d0
|
||
|
jmp ([0f:w,%pc,%d0*4])
|
||
|
|
||
|
.align 4
|
||
|
0:
|
||
|
.long fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz
|
||
|
.long fp_fsqrt, fp_ill, fp_flognp1, fp_ill
|
||
|
.long fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill
|
||
|
.long fp_fasin, fp_fatanh, fp_fsin, fp_ftan
|
||
|
.long fp_fetox, fp_ftwotox, fp_ftentox, fp_ill
|
||
|
.long fp_flogn, fp_flog10, fp_flog2, fp_ill
|
||
|
.long fp_fabs, fp_fcosh, fp_fneg, fp_ill
|
||
|
.long fp_facos, fp_fcos, fp_fgetexp, fp_fgetman
|
||
|
.long fp_fdiv, fp_fmod, fp_fadd, fp_fmul
|
||
|
.long fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul
|
||
|
.long fp_fsub, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3
|
||
|
.long fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7
|
||
|
.long fp_fcmp, fp_ill, fp_ftst, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_fsmove, fp_fssqrt, fp_ill, fp_ill
|
||
|
.long fp_fdmove, fp_fdsqrt, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_fsabs, fp_ill, fp_fsneg, fp_ill
|
||
|
.long fp_fdabs, fp_ill, fp_fdneg, fp_ill
|
||
|
.long fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul
|
||
|
.long fp_fddiv, fp_ill, fp_fdadd, fp_fdmul
|
||
|
.long fp_fssub, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_fdsub, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
.long fp_ill, fp_ill, fp_ill, fp_ill
|
||
|
|
||
|
| Instructions follow
|
||
|
|
||
|
| Move an (emulated) ROM constant
|
||
|
fp_fmovecr:
|
||
|
bfextu %d2{#27,#5},%d0
|
||
|
printf PINSTR,"fp_fmovecr #%d",1,%d0
|
||
|
move.l %d0,%d1
|
||
|
add.l %d0,%d0
|
||
|
add.l %d1,%d0
|
||
|
lea (fp_constants,%d0*4),%a0
|
||
|
move.l #0x801cc0ff,%d0
|
||
|
addq.l #1,%d1
|
||
|
lsl.l %d1,%d0
|
||
|
jcc 1f
|
||
|
fp_set_sr FPSR_EXC_INEX2 | INEX2 exception
|
||
|
1: moveq #-128,%d0 | continue with fmove
|
||
|
and.l %d0,%d2
|
||
|
jra fp_getdest
|
||
|
|
||
|
.data
|
||
|
.align 4
|
||
|
fp_constants:
|
||
|
.long 0x00004000,0xc90fdaa2,0x2168c235 | pi
|
||
|
.extend 0,0,0,0,0,0,0,0,0,0
|
||
|
.long 0x00003ffd,0x9a209a84,0xfbcff798 | log10(2)
|
||
|
.long 0x00004000,0xadf85458,0xa2bb4a9a | e
|
||
|
.long 0x00003fff,0xb8aa3b29,0x5c17f0bc | log2(e)
|
||
|
.long 0x00003ffd,0xde5bd8a9,0x37287195 | log10(e)
|
||
|
.long 0x00000000,0x00000000,0x00000000 | 0.0
|
||
|
.long 0x00003ffe,0xb17217f7,0xd1cf79ac | 1n(2)
|
||
|
.long 0x00004000,0x935d8ddd,0xaaa8ac17 | 1n(10)
|
||
|
| read this as "1.0 * 2^0" - note the high bit in the mantissa
|
||
|
.long 0x00003fff,0x80000000,0x00000000 | 10^0
|
||
|
.long 0x00004002,0xa0000000,0x00000000 | 10^1
|
||
|
.long 0x00004005,0xc8000000,0x00000000 | 10^2
|
||
|
.long 0x0000400c,0x9c400000,0x00000000 | 10^4
|
||
|
.long 0x00004019,0xbebc2000,0x00000000 | 10^8
|
||
|
.long 0x00004034,0x8e1bc9bf,0x04000000 | 10^16
|
||
|
.long 0x00004069,0x9dc5ada8,0x2b70b59e | 10^32
|
||
|
.long 0x000040d3,0xc2781f49,0xffcfa6d5 | 10^64
|
||
|
.long 0x000041a8,0x93ba47c9,0x80e98ce0 | 10^128
|
||
|
.long 0x00004351,0xaa7eebfb,0x9df9de8e | 10^256
|
||
|
.long 0x000046a3,0xe319a0ae,0xa60e91c7 | 10^512
|
||
|
.long 0x00004d48,0xc9767586,0x81750c17 | 10^1024
|
||
|
.long 0x00005a92,0x9e8b3b5d,0xc53d5de5 | 10^2048
|
||
|
.long 0x00007525,0xc4605202,0x8a20979b | 10^4096
|
||
|
.previous
|
||
|
|
||
|
fp_fmove_mem2fp:
|
||
|
printf PINSTR,"fmove %p,%p\n",2,%a0,%a1
|
||
|
move.l (%a1)+,(%a0)+
|
||
|
move.l (%a1)+,(%a0)+
|
||
|
move.l (%a1),(%a0)
|
||
|
subq.l #8,%a0
|
||
|
rts
|
||
|
|
||
|
fpa_fsglmul:
|
||
|
move.l #fp_finalrounding_single_fast,(%sp)
|
||
|
jra fp_fsglmul
|
||
|
|
||
|
fpa_fsgldiv:
|
||
|
move.l #fp_finalrounding_single_fast,(%sp)
|
||
|
jra fp_fsgldiv
|
||
|
|
||
|
.macro fp_dosingleprec instr
|
||
|
printf PINSTR,"single "
|
||
|
move.l #fp_finalrounding_single,(%sp)
|
||
|
jra \instr
|
||
|
.endm
|
||
|
|
||
|
.macro fp_dodoubleprec instr
|
||
|
printf PINSTR,"double "
|
||
|
move.l #fp_finalrounding_double,(%sp)
|
||
|
jra \instr
|
||
|
.endm
|
||
|
|
||
|
fp_fsmove:
|
||
|
fp_dosingleprec fp_fmove_mem2fp
|
||
|
|
||
|
fp_fssqrt:
|
||
|
fp_dosingleprec fp_fsqrt
|
||
|
|
||
|
fp_fdmove:
|
||
|
fp_dodoubleprec fp_fmove_mem2fp
|
||
|
|
||
|
fp_fdsqrt:
|
||
|
fp_dodoubleprec fp_fsqrt
|
||
|
|
||
|
fp_fsabs:
|
||
|
fp_dosingleprec fp_fabs
|
||
|
|
||
|
fp_fsneg:
|
||
|
fp_dosingleprec fp_fneg
|
||
|
|
||
|
fp_fdabs:
|
||
|
fp_dodoubleprec fp_fabs
|
||
|
|
||
|
fp_fdneg:
|
||
|
fp_dodoubleprec fp_fneg
|
||
|
|
||
|
fp_fsdiv:
|
||
|
fp_dosingleprec fp_fdiv
|
||
|
|
||
|
fp_fsadd:
|
||
|
fp_dosingleprec fp_fadd
|
||
|
|
||
|
fp_fsmul:
|
||
|
fp_dosingleprec fp_fmul
|
||
|
|
||
|
fp_fddiv:
|
||
|
fp_dodoubleprec fp_fdiv
|
||
|
|
||
|
fp_fdadd:
|
||
|
fp_dodoubleprec fp_fadd
|
||
|
|
||
|
fp_fdmul:
|
||
|
fp_dodoubleprec fp_fmul
|
||
|
|
||
|
fp_fssub:
|
||
|
fp_dosingleprec fp_fsub
|
||
|
|
||
|
fp_fdsub:
|
||
|
fp_dodoubleprec fp_fsub
|
||
|
|
||
|
fp_nonstd:
|
||
|
fp_get_pc %a0
|
||
|
getuser.l (%a0),%d0,fp_err_ua1,%a0
|
||
|
printf ,"nonstd ((%08x)=%08x)\n",2,%a0,%d0
|
||
|
moveq #-1,%d0
|
||
|
rts
|
||
|
|
||
|
.data
|
||
|
.align 4
|
||
|
|
||
|
| data sizes corresponding to the operand formats
|
||
|
fp_datasize:
|
||
|
.word 4, 4, 12, 12, 2, 8, 1, 0
|