OpenCloudOS-Kernel/arch/m68k/math-emu/fp_scan.S

/*
 * fp_scan.S
 *
 * Copyright Roman Zippel, 1997.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, and the entire permission notice in its entirety,
 *    including the disclaimer of warranties.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. The name of the author may not be used to endorse or promote
 *    products derived from this software without specific prior
 *    written permission.
 *
 * ALTERNATIVELY, this product may be distributed under the terms of
 * the GNU General Public License, in which case the provisions of the GPL are
 * required INSTEAD OF the above restrictions.  (This clause is
 * necessary due to a potential bad interaction between the GPL and
 * the restrictions contained in a BSD-style copyright.)
 *
 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
 * OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "fp_emu.h"
#include "fp_decode.h"

	.globl	fp_scan, fp_datasize

	.data

| %d2 - first two instr words
| %d1 - operand size

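/* operand formats are:

	Long = 0,		i.e. fmove.l
	Single,			i.e. fmove.s
	Extended,		i.e. fmove.x
	Packed-BCD,		i.e. fmove.p
	Word,			i.e. fmove.w
	Double,			i.e. fmove.d
	Byte,			i.e. fmove.b

   The value 7 is not an operand format; fp_fgen_ea treats it as
   the selector for fmovecr.
*/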

	.text

| fp_scan - entry point of the instruction decoder
|
| On entry:
| FPDATA - base of emulated FPU registers
|
| Fetches the instruction at the emulated PC, checks that it is a
| general FPU instruction and dispatches on its type.  The helper
| macros used here (fp_get_pc, fp_put_pc, getuser, printf and the
| fp_decode_* family) come from the included headers; getuser
| presumably branches to fp_err_ua1 when the user access faults
| (confirm in fp_emu.h).

fp_scan:
| normal fpu instruction? (this excludes fsave/frestore)
	fp_get_pc %a0
	printf	PDECODE,"%08x: ",1,%a0
	getuser.b (%a0),%d0,fp_err_ua1,%a0
| Only the high byte of the opcode word is tested: 0xf2 is an F-line
| opcode with coprocessor id 1 and the top bit of the type field clear.
#if 1
	cmp.b	#0xf2,%d0		| cpid = 1
#else
	cmp.b	#0xfc,%d0		| cpid = 6
#endif
	jne	fp_nonstd
| first two instruction words are kept in %d2
	getuser.l (%a0)+,%d2,fp_err_ua1,%a0
	fp_put_pc %a0			| store back the PC, now past both words
| The decode macro below is followed directly by its jump table
| (presumably it ends in an indexed jump through that table - confirm
| in fp_decode.h), so macro and table must stay adjacent.
fp_decode_cond:				| separate conditional instr
	fp_decode_cond_instr_type

	.long	fp_decode_move, fp_fscc
	.long	fp_fbccw, fp_fbccl

| Second level of dispatch for the non-conditional instructions; again
| the table must directly follow the macro.
fp_decode_move:				| separate move instr
	fp_decode_move_instr_type

	.long	fp_fgen_fp, fp_ill
	.long	fp_fgen_ea, fp_fmove_fp2mem
	.long	fp_fmovem_cr, fp_fmovem_cr
	.long	fp_fmovem_fp, fp_fmovem_fp

| now all arithmetic instr and a few move instr are left
|
| fp_fgen_fp - general instruction whose source is an FPU register.
| The source register is copied into FPD_TEMPFP1 and fp_getdest is
| entered with %a0 pointing at that 12-byte copy.
fp_fgen_fp:				| source is a fpu register
	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
	fp_decode_sourcespec		| result in %d0 (printed below as the fp register number)
	printf	PDECODE,"f<op>.x fp%d",1,%d0
	fp_get_fp_reg			| presumably sets %a0 to the register selected by %d0 (confirm in fp_decode.h)
	lea	(FPD_TEMPFP1,FPDATA),%a1 | copy src into a temp location
	move.l	(%a0)+,(%a1)+
	move.l	(%a0)+,(%a1)+
	move.l	(%a0),(%a1)
	lea	(-8,%a1),%a0		| %a1 is 8 bytes in; %a0 = start of the copy
	jra	fp_getdest

| fp_fgen_ea - general instruction whose source is an effective address.
| Leaves the operand format in both halves of %d1 and falls through
| into fp_getsource.  A source specifier of 7 is diverted to fp_fmovecr.
fp_fgen_ea:				| source is <ea>
	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
	| sort out fmovecr, keep data size in %d1
	fp_decode_sourcespec
	cmp.w	#7,%d0
	jeq	fp_fmovecr
	move.w	%d0,%d1			| store data size twice in %d1
	swap	%d1			| one can be trashed below
	move.w	%d0,%d1
#ifdef FPU_EMU_DEBUG
	| debug only: print the size suffix letter for the operand format
	lea	0f,%a0
	clr.l	%d0
	move.b	(%a0,%d1.w),%d0
	printf	PDECODE,"f<op>.%c ",1,%d0

	.data
0:	.byte	'l','s','x','p','w','d','b',0
	.previous
#endif

/*
	fp_getsource, fp_getdest

	basically, we end up with a pointer to the source operand in
	%a1, and a pointer to the destination operand in %a0.  both
	are, of course, 96-bit extended floating point numbers.

	fp_getsource is entered by fall-through from fp_fgen_ea with
	the operand format in both halves of %d1.  The eight table
	entries below correspond to the eight addressing mode values;
	the table must directly follow the decode macro.
*/

fp_getsource:
	| decode addressing mode for source
	fp_decode_addr_mode

	.long	fp_data, fp_ill
	.long	fp_indirect, fp_postinc
	.long	fp_predecr, fp_disp16
	.long	fp_extmode0, fp_extmode1

	| addressing mode: data register direct
	|
	| The operand value is taken from a data register (in %d0 after
	| fp_get_data_reg, judging by the handlers below) and converted
	| into FPD_TEMPFP1, which %a0 points at.  Dispatch is on the
	| operand format in the low word of %d1; only long, single, word
	| and byte are accepted here, everything else goes to fp_ill.
fp_data:
	fp_mode_data_direct
	jsr	fp_get_data_reg
	lea	(FPD_TEMPFP1,FPDATA),%a0
	jmp	([0f:w,%pc,%d1.w*4])

	.align	4
0:
	.long	fp_data_long, fp_data_single
	.long	fp_ill, fp_ill
	.long	fp_data_word, fp_ill
	.long	fp_data_byte, fp_ill

	| data types that fit in an integer data register
fp_data_byte:
	extb.l	%d0			| sign-extend byte to long
	jra	fp_data_long

fp_data_word:
	ext.l	%d0			| sign-extend word to long, then fall through

fp_data_long:
	jsr	fp_conv_long2ext
	jra	fp_getdest

fp_data_single:
	jsr	fp_conv_single2ext
	jra	fp_getdest

	| The handlers below each expand one addressing mode macro from
	| the included headers and then continue at fp_fetchsource, which
	| expects the operand address in %a0.

	| addressing mode: address register indirect
fp_indirect:
	fp_mode_addr_indirect
	jra	fp_fetchsource

	| addressing mode: address register indirect with postincrement
fp_postinc:
	fp_mode_addr_indirect_postinc
	jra	fp_fetchsource

	| addressing mode: address register indirect with predecrement
fp_predecr:
	fp_mode_addr_indirect_predec
	jra	fp_fetchsource

	| addressing mode: address register/program counter indirect
	|		   with 16bit displacement
fp_disp16:
	fp_mode_addr_indirect_disp16
	jra	fp_fetchsource

	| all other indirect addressing modes will finally end up here
fp_extmode0:
	fp_mode_addr_indirect_extmode0
	jra	fp_fetchsource

| all pc relative addressing modes and immediate/absolute modes end up here
| the first ones are sent to fp_extmode0 or fp_disp16
| and only the latter are handled here
|
| Dispatch is on the value left in %d0 by fp_decode_addr_reg; the table
| must stay directly after the jmp because it is addressed pc-relative.
fp_extmode1:
	fp_decode_addr_reg
	jmp	([0f:w,%pc,%d0*4])

	.align	4
0:
	.long	fp_abs_short, fp_abs_long
	.long	fp_disp16, fp_extmode0
	.long	fp_immediate, fp_ill
	.long	fp_ill, fp_ill

	| addressing mode: absolute short
fp_abs_short:
	fp_mode_abs_short
	jra	fp_fetchsource

	| addressing mode: absolute long
fp_abs_long:
	fp_mode_abs_long
	jra	fp_fetchsource

	| addressing mode: immediate data
	|
	| The operand follows the instruction words, so its address is
	| the current emulated PC.  The PC is advanced past the operand
	| (size taken from fp_datasize and rounded up to an even number
	| of bytes) and control falls through into fp_fetchsource with
	| %a0 still pointing at the immediate data.
	|
	| NOTE(review): for a byte operand the rounded size is 2 and %a0
	| points at the first byte of that word, which is what fp_byte
	| then reads - confirm this is the byte that carries the data.
fp_immediate:
	printf	PDECODE,"#"
	fp_get_pc %a0
	move.w	(fp_datasize,%d1.w*2),%d0	| operand size in bytes
	addq.w	#1,%d0				| round up to the next
	and.w	#-2,%d0				| even byte count
#ifdef FPU_EMU_DEBUG
	| debug only: hex dump the immediate bytes; %d0/%d1 are saved
	| around the loop and %a1 is used as a scratch pointer
	movem.l	%d0/%d1,-(%sp)
	move.l	%a0,%a1
	clr.l	%d1
	jra	2f
1:	getuser.b (%a1)+,%d1,fp_err_ua1,%a1
	printf	PDECODE,"%02x",1,%d1
2:	dbra	%d0,1b
	movem.l	(%sp)+,%d0/%d1
#endif
	lea	(%a0,%d0.w),%a1			| address just past the operand
	fp_put_pc %a1
|	jra	fp_fetchsource

| fp_fetchsource - common tail of all memory addressing modes.
| In:  %a0 = address of the source operand
|      %d1 = operand format, stored in both halves (see fp_fgen_ea)
| Out: %a1 = address of the source operand, %a0 = FPD_TEMPFP1, then
|      dispatches to the per-format handler through the table below.
| The swap selects the copy of the format that was kept in the high
| word of %d1.
fp_fetchsource:
	move.l	%a0,%a1
	swap	%d1
	lea	(FPD_TEMPFP1,FPDATA),%a0
	jmp	([0f:w,%pc,%d1.w*4])

	.align	4
0:	.long	fp_long, fp_single
	.long	fp_ext, fp_pack
	.long	fp_word, fp_double
	.long	fp_byte, fp_ill

| Per-format source fetch handlers, entered from fp_fetchsource with
| %a1 = operand address and %a0 = FPD_TEMPFP1.  Each one ends up in
| fp_getdest; the integer and single/double formats go through the
| fp_conv_* helpers first.

fp_long:
	getuser.l (%a1),%d0,fp_err_ua1,%a1
	jsr	fp_conv_long2ext
	jra	fp_getdest

fp_single:
	getuser.l (%a1),%d0,fp_err_ua1,%a1
	jsr	fp_conv_single2ext
	jra	fp_getdest

| Extended operands are copied as three longs.  The first long is
| repacked on the way: the two long shifts (15 bits in total) move bit 31
| down to bit 16, and the word shift then leaves bits 30-16 of the
| original value in bits 14-0.
fp_ext:
	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
	lsr.l	#8,%d0
	lsr.l	#7,%d0
	lsr.w	#1,%d0
	move.l	%d0,(%a0)+
	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
	move.l	%d0,(%a0)+
	getuser.l (%a1),%d0,fp_err_ua1,%a1
	move.l	%d0,(%a0)
	subq.l	#8,%a0			| back to the start of FPD_TEMPFP1
	jra	fp_getdest

fp_pack:
	/* not supported yet */
	jra	fp_ill

fp_word:
	getuser.w (%a1),%d0,fp_err_ua1,%a1
	ext.l	%d0			| sign-extend word to long
	jsr	fp_conv_long2ext
	jra	fp_getdest

| No getuser here: presumably fp_conv_double2ext fetches the operand
| through %a1 itself (confirm at its definition).
fp_double:
	jsr	fp_conv_double2ext
	jra	fp_getdest

fp_byte:
	getuser.b (%a1),%d0,fp_err_ua1,%a1
	extb.l	%d0			| sign-extend byte to long
	jsr	fp_conv_long2ext
|	jra	fp_getdest

| fp_getdest - select the destination register and dispatch the operation.
| In:  %a0 = address of the (converted) source operand
|      %d2 = first two instruction words
| The source pointer is moved to %a1 and a three-bit field of %d2 (bit
| field offset 22) selects the destination register for fp_get_fp_reg.
| Both pointers are pushed, followed by the address of fp_finalrounding
| as the return address, so that the rts of the selected handler
| continues there.  The handler is chosen by the low seven bits of %d2
| (bit field offset 25, width 7), which index the 128-entry table below;
| the trailing comments give the index of the first entry on each line.
fp_getdest:
	move.l	%a0,%a1
	bfextu	%d2{#22,#3},%d0
	printf	PDECODE,",fp%d\n",1,%d0
	fp_get_fp_reg
	movem.l	%a0/%a1,-(%sp)
	pea	fp_finalrounding
	bfextu	%d2{#25,#7},%d0
	jmp	([0f:w,%pc,%d0*4])

	.align	4
0:
	.long	fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz	| 0x00
	.long	fp_fsqrt, fp_ill, fp_flognp1, fp_ill	| 0x04
	.long	fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill	| 0x08
	.long	fp_fasin, fp_fatanh, fp_fsin, fp_ftan	| 0x0c
	.long	fp_fetox, fp_ftwotox, fp_ftentox, fp_ill	| 0x10
	.long	fp_flogn, fp_flog10, fp_flog2, fp_ill	| 0x14
	.long	fp_fabs, fp_fcosh, fp_fneg, fp_ill	| 0x18
	.long	fp_facos, fp_fcos, fp_fgetexp, fp_fgetman	| 0x1c
	.long	fp_fdiv, fp_fmod, fp_fadd, fp_fmul	| 0x20
	.long	fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul	| 0x24
	.long	fp_fsub, fp_ill, fp_ill, fp_ill	| 0x28
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x2c
	.long	fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3	| 0x30
	.long	fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7	| 0x34
	.long	fp_fcmp, fp_ill, fp_ftst, fp_ill	| 0x38
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x3c
	.long	fp_fsmove, fp_fssqrt, fp_ill, fp_ill	| 0x40
	.long	fp_fdmove, fp_fdsqrt, fp_ill, fp_ill	| 0x44
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x48
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x4c
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x50
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x54
	.long	fp_fsabs, fp_ill, fp_fsneg, fp_ill	| 0x58
	.long	fp_fdabs, fp_ill, fp_fdneg, fp_ill	| 0x5c
	.long	fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul	| 0x60
	.long	fp_fddiv, fp_ill, fp_fdadd, fp_fdmul	| 0x64
	.long	fp_fssub, fp_ill, fp_ill, fp_ill	| 0x68
	.long	fp_fdsub, fp_ill, fp_ill, fp_ill	| 0x6c
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x70
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x74
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x78
	.long	fp_ill, fp_ill, fp_ill, fp_ill	| 0x7c

	| Instructions follow

	| Move an (emulated) ROM constant
	|
	| Only the low five bits of %d2 are used as the constant number,
	| so fp_constants holds 32 entries of 12 bytes each.  %a0 is set
	| to the selected entry and the instruction is then finished as a
	| plain fmove: the low seven bits of %d2 are cleared so that
	| fp_getdest dispatches to table entry 0 (fp_fmove_mem2fp).
	|
	| 0x801cc0ff is a per-constant bitmap read from the top: shifting
	| it left by (number + 1) moves the bit for that constant into the
	| carry flag.  A set bit raises INEX2; the set bits cover constants
	| 0, 11-13, 16-17 and 24-31.
fp_fmovecr:
	bfextu	%d2{#27,#5},%d0
	printf	PINSTR,"fp_fmovecr #%d",1,%d0
	move.l	%d0,%d1			| keep the constant number for the shift below
	add.l	%d0,%d0
	add.l	%d1,%d0			| %d0 = number * 3, scaled by 4 in the lea
	lea	(fp_constants,%d0*4),%a0
	move.l	#0x801cc0ff,%d0
	addq.l	#1,%d1
	lsl.l	%d1,%d0
	jcc	1f
	fp_set_sr FPSR_EXC_INEX2			| INEX2 exception
1:	moveq	#-128,%d0				| continue with fmove
	and.l	%d0,%d2
	jra	fp_getdest

	.data
	.align	4
	| Constant table for fp_fmovecr: 32 entries, indexed by the low
	| five bits of the constant number with a stride of 12 bytes.
	| Each entry is three longs; the first long holds the exponent in
	| its low word, the other two hold the mantissa.
fp_constants:
	.long	0x00004000,0xc90fdaa2,0x2168c235	| pi
	| ten zero entries for numbers 1-10; the 12-byte stride relies on
	| each .extend value occupying 12 bytes
	.extend	0,0,0,0,0,0,0,0,0,0
	.long	0x00003ffd,0x9a209a84,0xfbcff798	| log10(2)
	.long	0x00004000,0xadf85458,0xa2bb4a9a	| e
	.long	0x00003fff,0xb8aa3b29,0x5c17f0bc	| log2(e)
	.long	0x00003ffd,0xde5bd8a9,0x37287195	| log10(e)
	.long	0x00000000,0x00000000,0x00000000	| 0.0
	| entries from here on are numbers 16-31 (presumably ROM offsets
	| 0x30-0x3f on the real coprocessor - confirm against the manual)
	.long	0x00003ffe,0xb17217f7,0xd1cf79ac	| ln(2)
	.long	0x00004000,0x935d8ddd,0xaaa8ac17	| ln(10)
	| read this as "1.0 * 2^0" - note the high bit in the mantissa
	.long	0x00003fff,0x80000000,0x00000000	| 10^0
	.long	0x00004002,0xa0000000,0x00000000	| 10^1
	.long	0x00004005,0xc8000000,0x00000000	| 10^2
	.long	0x0000400c,0x9c400000,0x00000000	| 10^4
	.long	0x00004019,0xbebc2000,0x00000000	| 10^8
	.long	0x00004034,0x8e1bc9bf,0x04000000	| 10^16
	.long	0x00004069,0x9dc5ada8,0x2b70b59e	| 10^32
	.long	0x000040d3,0xc2781f49,0xffcfa6d5	| 10^64
	.long	0x000041a8,0x93ba47c9,0x80e98ce0	| 10^128
	.long	0x00004351,0xaa7eebfb,0x9df9de8e	| 10^256
	.long	0x000046a3,0xe319a0ae,0xa60e91c7	| 10^512
	.long	0x00004d48,0xc9767586,0x81750c17	| 10^1024
	.long	0x00005a92,0x9e8b3b5d,0xc53d5de5	| 10^2048
	.long	0x00007525,0xc4605202,0x8a20979b	| 10^4096
	.previous

| fp_fmove_mem2fp - copy a 12-byte extended value.
| In:  %a1 = source, %a0 = destination
| Out: %a0 = destination (restored to its start); %a1 is left 8 bytes
|      past the start of the source.
| Returns with rts to whatever address fp_getdest (or one of the
| precision wrappers) left on the stack.
fp_fmove_mem2fp:
	printf	PINSTR,"fmove %p,%p\n",2,%a0,%a1
	move.l	(%a1)+,(%a0)+
	move.l	(%a1)+,(%a0)+
	move.l	(%a1),(%a0)
	subq.l	#8,%a0
	rts

| Wrappers for fsglmul/fsgldiv.  Both are reached from the fp_getdest
| table with the return address pushed there on top of the stack; they
| replace it with fp_finalrounding_single_fast before jumping to the
| real handler.

fpa_fsglmul:
	move.l	#fp_finalrounding_single_fast,(%sp)
	jra	fp_fsglmul

fpa_fsgldiv:
	move.l	#fp_finalrounding_single_fast,(%sp)
	jra	fp_fsgldiv

| fp_dosingleprec instr - body of a single precision variant of instr.
| Overwrites the return address on top of the stack with
| fp_finalrounding_single and jumps to the handler named by instr.
.macro	fp_dosingleprec instr
	printf	PINSTR,"single "
	move.l	#fp_finalrounding_single,(%sp)
	jra	\instr
.endm

| fp_dodoubleprec instr - same as above for the double precision
| variants, using fp_finalrounding_double as the return address.
.macro	fp_dodoubleprec instr
	printf	PINSTR,"double "
	move.l	#fp_finalrounding_double,(%sp)
	jra	\instr
.endm

| Entry points for the instructions with a fixed result precision.
| Each label is referenced from the fp_getdest table and consists only
| of one of the two macros above, i.e. it swaps the final rounding
| routine and continues in the handler of the base instruction.

fp_fsmove:
	fp_dosingleprec fp_fmove_mem2fp

fp_fssqrt:
	fp_dosingleprec fp_fsqrt

fp_fdmove:
	fp_dodoubleprec fp_fmove_mem2fp

fp_fdsqrt:
	fp_dodoubleprec fp_fsqrt

fp_fsabs:
	fp_dosingleprec fp_fabs

fp_fsneg:
	fp_dosingleprec fp_fneg

fp_fdabs:
	fp_dodoubleprec fp_fabs

fp_fdneg:
	fp_dodoubleprec fp_fneg

fp_fsdiv:
	fp_dosingleprec fp_fdiv

fp_fsadd:
	fp_dosingleprec fp_fadd

fp_fsmul:
	fp_dosingleprec fp_fmul

fp_fddiv:
	fp_dodoubleprec fp_fdiv

fp_fdadd:
	fp_dodoubleprec fp_fadd

fp_fdmul:
	fp_dodoubleprec fp_fmul

fp_fssub:
	fp_dosingleprec fp_fsub

fp_fdsub:
	fp_dodoubleprec fp_fsub

| fp_nonstd - reached from fp_scan when the first opcode byte does not
| match the expected value.  Logs the long at the emulated PC (the
| printf has an empty first argument, unlike the PDECODE/PINSTR calls
| elsewhere) and returns with %d0 = -1.
fp_nonstd:
	fp_get_pc %a0
	getuser.l (%a0),%d0,fp_err_ua1,%a0
	printf	,"nonstd ((%08x)=%08x)\n",2,%a0,%d0
	moveq	#-1,%d0
	rts

	.data
	.align	4

	| data sizes corresponding to the operand formats
	| (in bytes, one word per format, indexed by the format number:
	| long, single, extended, packed, word, double, byte, unused)
fp_datasize:
	.word	4, 4, 12, 12, 2, 8, 1, 0
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 06:20:36 +08:00			`/*`
			`* fp_scan.S`
			`*`
			`* Copyright Roman Zippel, 1997. All rights reserved.`
			`*`
			`* Redistribution and use in source and binary forms, with or without`
			`* modification, are permitted provided that the following conditions`
			`* are met:`
			`* 1. Redistributions of source code must retain the above copyright`
			`* notice, and the entire permission notice in its entirety,`
			`* including the disclaimer of warranties.`
			`* 2. Redistributions in binary form must reproduce the above copyright`
			`* notice, this list of conditions and the following disclaimer in the`
			`* documentation and/or other materials provided with the distribution.`
			`* 3. The name of the author may not be used to endorse or promote`
			`* products derived from this software without specific prior`
			`* written permission.`
			`*`
			`* ALTERNATIVELY, this product may be distributed under the terms of`
			`* the GNU General Public License, in which case the provisions of the GPL are`
			`* required INSTEAD OF the above restrictions. (This clause is`
			`* necessary due to a potential bad interaction between the GPL and`
			`* the restrictions contained in a BSD-style copyright.)`
			`*`
			* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
			`* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES`
			`* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE`
			`* DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,`
			`* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES`
			`* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR`
			`* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)`
			`* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,`
			`* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)`
			`* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED`
			`* OF THE POSSIBILITY OF SUCH DAMAGE.`
			`*/`

			`#include "fp_emu.h"`
			`#include "fp_decode.h"`

			`.globl fp_scan, fp_datasize`

			`.data`

			`\| %d2 - first two instr words`
			`\| %d1 - operand size`

			`/* operand formats are:`

			`Long = 0, i.e. fmove.l`
			`Single, i.e. fmove.s`
			`Extended, i.e. fmove.x`
			`Packed-BCD, i.e. fmove.p`
			`Word, i.e. fmove.w`
			`Double, i.e. fmove.d`
			`*/`

			`.text`

			`\| On entry:`
			`\| FPDATA - base of emulated FPU registers`

			`fp_scan:`
			`\| normal fpu instruction? (this excludes fsave/frestore)`
			`fp_get_pc %a0`
			`printf PDECODE,"%08x: ",1,%a0`
			`getuser.b (%a0),%d0,fp_err_ua1,%a0`
			`#if 1`
			`cmp.b #0xf2,%d0 \| cpid = 1`
			`#else`
			`cmp.b #0xfc,%d0 \| cpid = 6`
			`#endif`
			`jne fp_nonstd`
			`\| first two instruction words are kept in %d2`
			`getuser.l (%a0)+,%d2,fp_err_ua1,%a0`
			`fp_put_pc %a0`
			`fp_decode_cond: \| separate conditional instr`
			`fp_decode_cond_instr_type`

			`.long fp_decode_move, fp_fscc`
			`.long fp_fbccw, fp_fbccl`

			`fp_decode_move: \| separate move instr`
			`fp_decode_move_instr_type`

			`.long fp_fgen_fp, fp_ill`
			`.long fp_fgen_ea, fp_fmove_fp2mem`
			`.long fp_fmovem_cr, fp_fmovem_cr`
			`.long fp_fmovem_fp, fp_fmovem_fp`

			`\| now all arithmetic instr and a few move instr are left`
			`fp_fgen_fp: \| source is a fpu register`
			`clr.b (FPD_FPSR+2,FPDATA) \| clear the exception byte`
			`fp_decode_sourcespec`
			`printf PDECODE,"f<op>.x fp%d",1,%d0`
			`fp_get_fp_reg`
			`lea (FPD_TEMPFP1,FPDATA),%a1 \| copy src into a temp location`
			`move.l (%a0)+,(%a1)+`
			`move.l (%a0)+,(%a1)+`
			`move.l (%a0),(%a1)`
			`lea (-8,%a1),%a0`
			`jra fp_getdest`

			`fp_fgen_ea: \| source is <ea>`
			`clr.b (FPD_FPSR+2,FPDATA) \| clear the exception byte`
			`\| sort out fmovecr, keep data size in %d1`
			`fp_decode_sourcespec`
			`cmp.w #7,%d0`
			`jeq fp_fmovecr`
			`move.w %d0,%d1 \| store data size twice in %d1`
			`swap %d1 \| one can be trashed below`
			`move.w %d0,%d1`
			`#ifdef FPU_EMU_DEBUG`
			`lea 0f,%a0`
			`clr.l %d0`
			`move.b (%a0,%d1.w),%d0`
			`printf PDECODE,"f<op>.%c ",1,%d0`

			`.data`
			`0: .byte 'l','s','x','p','w','d','b',0`
			`.previous`
			`#endif`

			`/*`
			`fp_getsource, fp_getdest`

			`basically, we end up with a pointer to the source operand in`
			`%a1, and a pointer to the destination operand in %a0. both`
			`are, of course, 96-bit extended floating point numbers.`
			`*/`

			`fp_getsource:`
			`\| decode addressing mode for source`
			`fp_decode_addr_mode`

			`.long fp_data, fp_ill`
			`.long fp_indirect, fp_postinc`
			`.long fp_predecr, fp_disp16`
			`.long fp_extmode0, fp_extmode1`

			`\| addressing mode: data register direct`
			`fp_data:`
			`fp_mode_data_direct`
			`jsr fp_get_data_reg`
			`lea (FPD_TEMPFP1,FPDATA),%a0`
			`jmp ([0f:w,%pc,%d1.w*4])`

			`.align 4`
			`0:`
			`.long fp_data_long, fp_data_single`
			`.long fp_ill, fp_ill`
			`.long fp_data_word, fp_ill`
			`.long fp_data_byte, fp_ill`

			`\| data types that fit in an integer data register`
			`fp_data_byte:`
			`extb.l %d0`
			`jra fp_data_long`

			`fp_data_word:`
			`ext.l %d0`

			`fp_data_long:`
			`jsr fp_conv_long2ext`
			`jra fp_getdest`

			`fp_data_single:`
			`jsr fp_conv_single2ext`
			`jra fp_getdest`

			`\| addressing mode: address register indirect`
			`fp_indirect:`
			`fp_mode_addr_indirect`
			`jra fp_fetchsource`

			`\| addressing mode: address register indirect with postincrement`
			`fp_postinc:`
			`fp_mode_addr_indirect_postinc`
			`jra fp_fetchsource`

			`\| addressing mode: address register indirect with predecrement`
			`fp_predecr:`
			`fp_mode_addr_indirect_predec`
			`jra fp_fetchsource`

			`\| addressing mode: address register/programm counter indirect`
			`\| with 16bit displacement`
			`fp_disp16:`
			`fp_mode_addr_indirect_disp16`
			`jra fp_fetchsource`

			`\| all other indirect addressing modes will finally end up here`
			`fp_extmode0:`
			`fp_mode_addr_indirect_extmode0`
			`jra fp_fetchsource`

			`\| all pc relative addressing modes and immediate/absolute modes end up here`
			`\| the first ones are sent to fp_extmode0 or fp_disp16`
			`\| and only the latter are handled here`
			`fp_extmode1:`
			`fp_decode_addr_reg`
			`jmp ([0f:w,%pc,%d0*4])`

			`.align 4`
			`0:`
			`.long fp_abs_short, fp_abs_long`
			`.long fp_disp16, fp_extmode0`
			`.long fp_immediate, fp_ill`
			`.long fp_ill, fp_ill`

			`\| addressing mode: absolute short`
			`fp_abs_short:`
			`fp_mode_abs_short`
			`jra fp_fetchsource`

			`\| addressing mode: absolute long`
			`fp_abs_long:`
			`fp_mode_abs_long`
			`jra fp_fetchsource`

			`\| addressing mode: immediate data`
			`fp_immediate:`
			`printf PDECODE,"#"`
			`fp_get_pc %a0`
			`move.w (fp_datasize,%d1.w*2),%d0`
			`addq.w #1,%d0`
			`and.w #-2,%d0`
			`#ifdef FPU_EMU_DEBUG`
			`movem.l %d0/%d1,-(%sp)`
			`movel %a0,%a1`
			`clr.l %d1`
			`jra 2f`
			`1: getuser.b (%a1)+,%d1,fp_err_ua1,%a1`
			`printf PDECODE,"%02x",1,%d1`
			`2: dbra %d0,1b`
			`movem.l (%sp)+,%d0/%d1`
			`#endif`
			`lea (%a0,%d0.w),%a1`
			`fp_put_pc %a1`
			`\| jra fp_fetchsource`

			`fp_fetchsource:`
			`move.l %a0,%a1`
			`swap %d1`
			`lea (FPD_TEMPFP1,FPDATA),%a0`
			`jmp ([0f:w,%pc,%d1.w*4])`

			`.align 4`
			`0: .long fp_long, fp_single`
			`.long fp_ext, fp_pack`
			`.long fp_word, fp_double`
			`.long fp_byte, fp_ill`

			`fp_long:`
			`getuser.l (%a1),%d0,fp_err_ua1,%a1`
			`jsr fp_conv_long2ext`
			`jra fp_getdest`

			`fp_single:`
			`getuser.l (%a1),%d0,fp_err_ua1,%a1`
			`jsr fp_conv_single2ext`
			`jra fp_getdest`

			`fp_ext:`
			`getuser.l (%a1)+,%d0,fp_err_ua1,%a1`
			`lsr.l #8,%d0`
			`lsr.l #7,%d0`
			`lsr.w #1,%d0`
			`move.l %d0,(%a0)+`
			`getuser.l (%a1)+,%d0,fp_err_ua1,%a1`
			`move.l %d0,(%a0)+`
			`getuser.l (%a1),%d0,fp_err_ua1,%a1`
			`move.l %d0,(%a0)`
			`subq.l #8,%a0`
			`jra fp_getdest`

			`fp_pack:`
			`/* not supported yet */`
			`jra fp_ill`

			`fp_word:`
			`getuser.w (%a1),%d0,fp_err_ua1,%a1`
			`ext.l %d0`
			`jsr fp_conv_long2ext`
			`jra fp_getdest`

			`fp_double:`
			`jsr fp_conv_double2ext`
			`jra fp_getdest`

			`fp_byte:`
			`getuser.b (%a1),%d0,fp_err_ua1,%a1`
			`extb.l %d0`
			`jsr fp_conv_long2ext`
			`\| jra fp_getdest`

			`fp_getdest:`
			`move.l %a0,%a1`
			`bfextu %d2{#22,#3},%d0`
			`printf PDECODE,",fp%d\n",1,%d0`
			`fp_get_fp_reg`
			`movem.l %a0/%a1,-(%sp)`
			`pea fp_finalrounding`
			`bfextu %d2{#25,#7},%d0`
			`jmp ([0f:w,%pc,%d0*4])`

			`.align 4`
			`0:`
			`.long fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz`
			`.long fp_fsqrt, fp_ill, fp_flognp1, fp_ill`
			`.long fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill`
			`.long fp_fasin, fp_fatanh, fp_fsin, fp_ftan`
			`.long fp_fetox, fp_ftwotox, fp_ftentox, fp_ill`
			`.long fp_flogn, fp_flog10, fp_flog2, fp_ill`
			`.long fp_fabs, fp_fcosh, fp_fneg, fp_ill`
			`.long fp_facos, fp_fcos, fp_fgetexp, fp_fgetman`
			`.long fp_fdiv, fp_fmod, fp_fadd, fp_fmul`
			`.long fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul`
			`.long fp_fsub, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3`
			`.long fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7`
			`.long fp_fcmp, fp_ill, fp_ftst, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_fsmove, fp_fssqrt, fp_ill, fp_ill`
			`.long fp_fdmove, fp_fdsqrt, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_fsabs, fp_ill, fp_fsneg, fp_ill`
			`.long fp_fdabs, fp_ill, fp_fdneg, fp_ill`
			`.long fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul`
			`.long fp_fddiv, fp_ill, fp_fdadd, fp_fdmul`
			`.long fp_fssub, fp_ill, fp_ill, fp_ill`
			`.long fp_fdsub, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`
			`.long fp_ill, fp_ill, fp_ill, fp_ill`

			`\| Instructions follow`

			`\| Move an (emulated) ROM constant`
			`fp_fmovecr:`
			`bfextu %d2{#27,#5},%d0`
			`printf PINSTR,"fp_fmovecr #%d",1,%d0`
			`move.l %d0,%d1`
			`add.l %d0,%d0`
			`add.l %d1,%d0`
			`lea (fp_constants,%d0*4),%a0`
			`move.l #0x801cc0ff,%d0`
			`addq.l #1,%d1`
			`lsl.l %d1,%d0`
			`jcc 1f`
			`fp_set_sr FPSR_EXC_INEX2 \| INEX2 exception`
			`1: moveq #-128,%d0 \| continue with fmove`
			`and.l %d0,%d2`
			`jra fp_getdest`

			`.data`
			`.align 4`
			`fp_constants:`
			`.long 0x00004000,0xc90fdaa2,0x2168c235 \| pi`
			`.extend 0,0,0,0,0,0,0,0,0,0`
			`.long 0x00003ffd,0x9a209a84,0xfbcff798 \| log10(2)`
			`.long 0x00004000,0xadf85458,0xa2bb4a9a \| e`
			`.long 0x00003fff,0xb8aa3b29,0x5c17f0bc \| log2(e)`
			`.long 0x00003ffd,0xde5bd8a9,0x37287195 \| log10(e)`
			`.long 0x00000000,0x00000000,0x00000000 \| 0.0`
			`.long 0x00003ffe,0xb17217f7,0xd1cf79ac \| 1n(2)`
			`.long 0x00004000,0x935d8ddd,0xaaa8ac17 \| 1n(10)`
			`\| read this as "1.0 * 2^0" - note the high bit in the mantissa`
			`.long 0x00003fff,0x80000000,0x00000000 \| 10^0`
			`.long 0x00004002,0xa0000000,0x00000000 \| 10^1`
			`.long 0x00004005,0xc8000000,0x00000000 \| 10^2`
			`.long 0x0000400c,0x9c400000,0x00000000 \| 10^4`
			`.long 0x00004019,0xbebc2000,0x00000000 \| 10^8`
			`.long 0x00004034,0x8e1bc9bf,0x04000000 \| 10^16`
			`.long 0x00004069,0x9dc5ada8,0x2b70b59e \| 10^32`
			`.long 0x000040d3,0xc2781f49,0xffcfa6d5 \| 10^64`
			`.long 0x000041a8,0x93ba47c9,0x80e98ce0 \| 10^128`
			`.long 0x00004351,0xaa7eebfb,0x9df9de8e \| 10^256`
			`.long 0x000046a3,0xe319a0ae,0xa60e91c7 \| 10^512`
			`.long 0x00004d48,0xc9767586,0x81750c17 \| 10^1024`
			`.long 0x00005a92,0x9e8b3b5d,0xc53d5de5 \| 10^2048`
			`.long 0x00007525,0xc4605202,0x8a20979b \| 10^4096`
			`.previous`

			`fp_fmove_mem2fp:`
			`printf PINSTR,"fmove %p,%p\n",2,%a0,%a1`
			`move.l (%a1)+,(%a0)+`
			`move.l (%a1)+,(%a0)+`
			`move.l (%a1),(%a0)`
			`subq.l #8,%a0`
			`rts`

			`fpa_fsglmul:`
			`move.l #fp_finalrounding_single_fast,(%sp)`
			`jra fp_fsglmul`

			`fpa_fsgldiv:`
			`move.l #fp_finalrounding_single_fast,(%sp)`
			`jra fp_fsgldiv`

			`.macro fp_dosingleprec instr`
			`printf PINSTR,"single "`
			`move.l #fp_finalrounding_single,(%sp)`
			`jra \instr`
			`.endm`

			`.macro fp_dodoubleprec instr`
			`printf PINSTR,"double "`
			`move.l #fp_finalrounding_double,(%sp)`
			`jra \instr`
			`.endm`

			`fp_fsmove:`
			`fp_dosingleprec fp_fmove_mem2fp`

			`fp_fssqrt:`
			`fp_dosingleprec fp_fsqrt`

			`fp_fdmove:`
			`fp_dodoubleprec fp_fmove_mem2fp`

			`fp_fdsqrt:`
			`fp_dodoubleprec fp_fsqrt`

			`fp_fsabs:`
			`fp_dosingleprec fp_fabs`

			`fp_fsneg:`
			`fp_dosingleprec fp_fneg`

			`fp_fdabs:`
			`fp_dodoubleprec fp_fabs`

			`fp_fdneg:`
			`fp_dodoubleprec fp_fneg`

			`fp_fsdiv:`
			`fp_dosingleprec fp_fdiv`

			`fp_fsadd:`
			`fp_dosingleprec fp_fadd`

			`fp_fsmul:`
			`fp_dosingleprec fp_fmul`

			`fp_fddiv:`
			`fp_dodoubleprec fp_fdiv`

			`fp_fdadd:`
			`fp_dodoubleprec fp_fadd`

			`fp_fdmul:`
			`fp_dodoubleprec fp_fmul`

			`fp_fssub:`
			`fp_dosingleprec fp_fsub`

			`fp_fdsub:`
			`fp_dodoubleprec fp_fsub`

			`fp_nonstd:`
			`fp_get_pc %a0`
			`getuser.l (%a0),%d0,fp_err_ua1,%a0`
			`printf ,"nonstd ((%08x)=%08x)\n",2,%a0,%d0`
			`moveq #-1,%d0`
			`rts`

			`.data`
			`.align 4`

			`\| data sizes corresponding to the operand formats`
			`fp_datasize:`
			`.word 4, 4, 12, 12, 2, 8, 1, 0`