Blame - arch/m68k/math-emu/fp_scan.S - kernel/msm-4.9

blob: e4146ed574db92c2ffe31734f6f9c71c346a2177 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
				2	* fp_scan.S
				3	*
				4	* Copyright Roman Zippel, 1997. All rights reserved.
				5	*
				6	* Redistribution and use in source and binary forms, with or without
				7	* modification, are permitted provided that the following conditions
				8	* are met:
				9	* 1. Redistributions of source code must retain the above copyright
				10	* notice, and the entire permission notice in its entirety,
				11	* including the disclaimer of warranties.
				12	* 2. Redistributions in binary form must reproduce the above copyright
				13	* notice, this list of conditions and the following disclaimer in the
				14	* documentation and/or other materials provided with the distribution.
				15	* 3. The name of the author may not be used to endorse or promote
				16	* products derived from this software without specific prior
				17	* written permission.
				18	*
				19	* ALTERNATIVELY, this product may be distributed under the terms of
				20	* the GNU General Public License, in which case the provisions of the GPL are
				21	* required INSTEAD OF the above restrictions. (This clause is
				22	* necessary due to a potential bad interaction between the GPL and
				23	* the restrictions contained in a BSD-style copyright.)
				24	*
				25	* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
				26	* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
				27	* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
				28	* DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
				29	* INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
				30	* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
				31	* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
				32	* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
				33	* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
				34	* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
				35	* OF THE POSSIBILITY OF SUCH DAMAGE.
				36	*/
				37
				38	#include "fp_emu.h"
				39	#include "fp_decode.h"
				40
				41	.globl fp_scan, fp_datasize
				42
				43	.data
				44
				45	\| %d2 - first two instr words
				46	\| %d1 - operand size
				47
				48	/* operand formats are:
				49
				50	Long = 0, i.e. fmove.l
				51	Single = 1, i.e. fmove.s
				52	Extended = 2, i.e. fmove.x
				53	Packed-BCD = 3, i.e. fmove.p
				54	Word = 4, i.e. fmove.w
				55	Double = 5, i.e. fmove.d
					Byte = 6, i.e. fmove.b
				56	*/
				57
				58	.text
				59
				60	\| On entry:
				61	\| FPDATA - base of emulated FPU registers
				62
				63	fp_scan:
					/*
					 * Entry point of the decoder.  Fetches the byte at the emulated
					 * PC and only carries on when it equals 0xf2; any other value is
					 * passed to fp_nonstd.  On the normal path the first two
					 * instruction words are loaded into %d2, the post-incremented
					 * address is written back with fp_put_pc, and control falls
					 * through into fp_decode_cond.
					 * NOTE(review): fp_get_pc, fp_put_pc, getuser and printf are
					 * macros defined outside this file; fp_err_ua1 is presumably the
					 * label taken when the user access faults - confirm.
					 */
				64	\| normal fpu instruction? (this excludes fsave/frestore)
				65	fp_get_pc %a0
				66	printf PDECODE,"%08x: ",1,%a0
				67	getuser.b (%a0),%d0,fp_err_ua1,%a0
				68	#if 1
				69	cmp.b #0xf2,%d0 \| cpid = 1
				70	#else
				71	cmp.b #0xfc,%d0 \| cpid = 6
				72	#endif
				73	jne fp_nonstd
				74	\| first two instruction words are kept in %d2
				75	getuser.l (%a0)+,%d2,fp_err_ua1,%a0
				76	fp_put_pc %a0
				77	fp_decode_cond: \| separate conditional instr
					/*
					 * The fp_decode_cond_instr_type macro (defined outside this file)
					 * is directly followed by a four-entry handler table: entry 0 is
					 * fp_decode_move, the remaining entries are fp_fscc, fp_fbccw and
					 * fp_fbccl.
					 * NOTE(review): presumably the macro ends in an indexed jump
					 * through this table, so the table has to stay right behind it -
					 * confirm against the macro definition.
					 */
				78	fp_decode_cond_instr_type
				79
				80	.long fp_decode_move, fp_fscc
				81	.long fp_fbccw, fp_fbccl
				82
				83	fp_decode_move: \| separate move instr
					/*
					 * Second dispatch level: the fp_decode_move_instr_type macro
					 * (defined outside this file) is followed by an eight-entry table.
					 * Arithmetic instructions continue at fp_fgen_fp (source is an FPU
					 * register) or fp_fgen_ea (source is an effective address); the
					 * other entries are fp_ill, fp_fmove_fp2mem, fp_fmovem_cr and
					 * fp_fmovem_fp, none of which are defined in this file.
					 * NOTE(review): presumably the macro jumps through this table -
					 * confirm against the macro definition.
					 */
				84	fp_decode_move_instr_type
				85
				86	.long fp_fgen_fp, fp_ill
				87	.long fp_fgen_ea, fp_fmove_fp2mem
				88	.long fp_fmovem_cr, fp_fmovem_cr
				89	.long fp_fmovem_fp, fp_fmovem_fp
				90
				91	\| now all arithmetic instr and a few move instr are left
				92	fp_fgen_fp: \| source is a fpu register
					/*
					 * Copies the three longwords of the source register into the
					 * scratch slot FPD_TEMPFP1 so that the operation works on a copy,
					 * then continues at fp_getdest with %a0 pointing at that copy.
					 * NOTE(review): fp_decode_sourcespec and fp_get_fp_reg are macros
					 * defined outside this file; the code below relies on them leaving
					 * the register number in %d0 and the register address in %a0.
					 */
				93	clr.b (FPD_FPSR+2,FPDATA) \| clear the exception byte
				94	fp_decode_sourcespec
				95	printf PDECODE,"f<op>.x fp%d",1,%d0
				96	fp_get_fp_reg
				97	lea (FPD_TEMPFP1,FPDATA),%a1 \| copy src into a temp location
				98	move.l (%a0)+,(%a1)+
				99	move.l (%a0)+,(%a1)+
				100	move.l (%a0),(%a1)
				101	lea (-8,%a1),%a0 /* %a1 advanced by 8 above; step back to the start of the copy */
				102	jra fp_getdest
				103
				104	fp_fgen_ea: \| source is <ea>
					/*
					 * Source operand comes from an effective address.  The source
					 * specifier left in %d0 is used as the operand format; the value
					 * 7 selects fp_fmovecr instead.  The format is stored in both
					 * halves of %d1 and control then falls through into fp_getsource.
					 * NOTE(review): fp_decode_sourcespec is a macro defined outside
					 * this file.
					 */
				105	clr.b (FPD_FPSR+2,FPDATA) \| clear the exception byte
				106	\| sort out fmovecr, keep data size in %d1
				107	fp_decode_sourcespec
				108	cmp.w #7,%d0
				109	jeq fp_fmovecr
				110	move.w %d0,%d1 \| store data size twice in %d1
				111	swap %d1 \| one can be trashed below
				112	move.w %d0,%d1
				113	#ifdef FPU_EMU_DEBUG
				114	lea 0f,%a0 /* debug only: look up the format letter for the trace output */
				115	clr.l %d0
				116	move.b (%a0,%d1.w),%d0
				117	printf PDECODE,"f<op>.%c ",1,%d0
				118
				119	.data
				120	0: .byte 'l','s','x','p','w','d','b',0
				121	.previous
				122	#endif
				123
				124	/*
				125	fp_getsource, fp_getdest
				126
				127	basically, we end up with a pointer to the source operand in
				128	%a1, and a pointer to the destination operand in %a0. both
				129	are, of course, 96-bit extended floating point numbers.
				130	*/
				131
				132	fp_getsource:
					/*
					 * Dispatch on the addressing mode of the source operand.  The
					 * fp_decode_addr_mode macro (defined outside this file) is followed
					 * by an eight-entry handler table; entry 1 is fp_ill, all other
					 * entries are handlers defined further down in this file.
					 * NOTE(review): presumably the macro jumps through this table -
					 * confirm against the macro definition.
					 */
				133	\| decode addressing mode for source
				134	fp_decode_addr_mode
				135
				136	.long fp_data, fp_ill
				137	.long fp_indirect, fp_postinc
				138	.long fp_predecr, fp_disp16
				139	.long fp_extmode0, fp_extmode1
				140
				141	\| addressing mode: data register direct
				142	fp_data:
					/*
					 * Source is a data register.  After fetching the register the
					 * operand format in %d1.w selects a conversion routine; formats
					 * with no entry here (indices 2, 3, 5 and 7) end in fp_ill.
					 * %a0 is pointed at FPD_TEMPFP1 before the jump.
					 * NOTE(review): fp_mode_data_direct and fp_get_data_reg are defined
					 * outside this file; the handlers operate on %d0, so the register
					 * contents are presumably returned there - confirm.
					 */
				143	fp_mode_data_direct
				144	jsr fp_get_data_reg
				145	lea (FPD_TEMPFP1,FPDATA),%a0
				146	jmp ([0f:w,%pc,%d1.w*4]) /* indexed jump through the longword table at 0: below */
				147
				148	.align 4
				149	0:
				150	.long fp_data_long, fp_data_single
				151	.long fp_ill, fp_ill
				152	.long fp_data_word, fp_ill
				153	.long fp_data_byte, fp_ill
				154
				155	\| data types that fit in an integer data register
				156	fp_data_byte:
					/*
					 * Conversion of a data-register operand held in %d0.  Byte and
					 * word values are sign-extended to a longword first and then share
					 * the long path; every path ends at fp_getdest.
					 * NOTE(review): fp_conv_long2ext and fp_conv_single2ext are defined
					 * outside this file; %a0 was set to FPD_TEMPFP1 by the caller, so
					 * they presumably write the converted value there - confirm.
					 */
				157	extb.l %d0 /* sign-extend byte to longword */
				158	jra fp_data_long
				159
				160	fp_data_word:
				161	ext.l %d0 /* sign-extend word to longword, then fall through */
				162
				163	fp_data_long:
				164	jsr fp_conv_long2ext
				165	jra fp_getdest
				166
				167	fp_data_single:
				168	jsr fp_conv_single2ext
				169	jra fp_getdest
				170
				171	\| addressing mode: address register indirect
				172	fp_indirect:
					/*
					 * This handler and the four after it each expand one
					 * addressing-mode macro (defined outside this file) and then share
					 * fp_fetchsource.
					 * NOTE(review): fp_fetchsource takes the operand address from %a0,
					 * so the macros presumably leave it there - confirm.
					 */
				173	fp_mode_addr_indirect
				174	jra fp_fetchsource
				175
				176	\| addressing mode: address register indirect with postincrement
				177	fp_postinc:
				178	fp_mode_addr_indirect_postinc
				179	jra fp_fetchsource
				180
				181	\| addressing mode: address register indirect with predecrement
				182	fp_predecr:
				183	fp_mode_addr_indirect_predec
				184	jra fp_fetchsource
				185
				186	\| addressing mode: address register/program counter indirect
				187	\| with 16bit displacement
				188	fp_disp16:
				189	fp_mode_addr_indirect_disp16
				190	jra fp_fetchsource
				191
				192	\| all other indirect addressing modes will finally end up here
				193	fp_extmode0:
				194	fp_mode_addr_indirect_extmode0
				195	jra fp_fetchsource
				196
				197	\| all pc relative addressing modes and immediate/absolute modes end up here
				198	\| the first ones are sent to fp_extmode0 or fp_disp16
				199	\| and only the latter are handled here
				200	fp_extmode1:
					/*
					 * Sub-dispatch on the value left in %d0 by fp_decode_addr_reg (a
					 * macro defined outside this file): 0 and 1 are the absolute
					 * modes, 2 and 3 reuse fp_disp16 and fp_extmode0, 4 is immediate
					 * data and 5-7 end in fp_ill.
					 */
				201	fp_decode_addr_reg
				202	jmp ([0f:w,%pc,%d0*4]) /* indexed jump through the longword table at 0: below */
				203
				204	.align 4
				205	0:
				206	.long fp_abs_short, fp_abs_long
				207	.long fp_disp16, fp_extmode0
				208	.long fp_immediate, fp_ill
				209	.long fp_ill, fp_ill
				210
				211	\| addressing mode: absolute short
				212	fp_abs_short:
					/*
					 * Both absolute handlers expand their addressing-mode macro
					 * (defined outside this file) and continue at fp_fetchsource.
					 * NOTE(review): the macros presumably leave the operand address in
					 * %a0, which is where fp_fetchsource reads it from - confirm.
					 */
				213	fp_mode_abs_short
				214	jra fp_fetchsource
				215
				216	\| addressing mode: absolute long
				217	fp_abs_long:
				218	fp_mode_abs_long
				219	jra fp_fetchsource
				220
				221	\| addressing mode: immediate data
				222	fp_immediate:
					/*
					 * The operand address is the current emulated PC.  The operand
					 * size is looked up in fp_datasize (indexed by the format in
					 * %d1.w), rounded up to an even number of bytes, and the PC is
					 * advanced by that amount.  Control then falls through into
					 * fp_fetchsource with %a0 still pointing at the operand.
					 * NOTE(review): for the byte format the size is rounded from 1 to
					 * 2, but fp_byte later reads the byte at the unadjusted address,
					 * i.e. the first byte of the extension word.  m68k normally keeps
					 * a byte immediate in the low-order (second) byte of that word -
					 * confirm whether byte immediates are decoded correctly.
					 */
				223	printf PDECODE,"#"
				224	fp_get_pc %a0
				225	move.w (fp_datasize,%d1.w*2),%d0 /* table entries are words, hence the *2 scale */
				226	addq.w #1,%d0 /* round the size up ... */
				227	and.w #-2,%d0 /* ... to an even byte count */
				228	#ifdef FPU_EMU_DEBUG
				229	movem.l %d0/%d1,-(%sp) /* debug only: dump the operand bytes as hex */
				230	movel %a0,%a1
				231	clr.l %d1
				232	jra 2f /* enter at the dbra so that the body runs %d0 times */
				233	1: getuser.b (%a1)+,%d1,fp_err_ua1,%a1
				234	printf PDECODE,"%02x",1,%d1
				235	2: dbra %d0,1b
				236	movem.l (%sp)+,%d0/%d1
				237	#endif
				238	lea (%a0,%d0.w),%a1 /* address just behind the operand */
				239	fp_put_pc %a1
				240	\| jra fp_fetchsource
				241
				242	fp_fetchsource:
					/*
					 * Common fetch stage for memory operands.  On entry %a0 holds the
					 * operand address; it is moved to %a1 and %a0 is pointed at the
					 * scratch slot FPD_TEMPFP1.  The handler is then selected by the
					 * operand format; index 7 ends in fp_ill.
					 */
				243	move.l %a0,%a1
				244	swap %d1 /* use the second copy of the format that fp_fgen_ea kept in the upper half */
				245	lea (FPD_TEMPFP1,FPDATA),%a0
				246	jmp ([0f:w,%pc,%d1.w*4]) /* indexed jump through the longword table at 0: below */
				247
				248	.align 4
				249	0: .long fp_long, fp_single
				250	.long fp_ext, fp_pack
				251	.long fp_word, fp_double
				252	.long fp_byte, fp_ill
				253
				254	fp_long:
					/*
					 * Long and single operands: load one longword from the operand
					 * address in %a1 into %d0, convert it, and continue at fp_getdest.
					 * NOTE(review): getuser, fp_conv_long2ext and fp_conv_single2ext
					 * are defined outside this file; %a0 points at FPD_TEMPFP1 here, so
					 * the converted value is presumably written there - confirm.
					 */
				255	getuser.l (%a1),%d0,fp_err_ua1,%a1
				256	jsr fp_conv_long2ext
				257	jra fp_getdest
				258
				259	fp_single:
				260	getuser.l (%a1),%d0,fp_err_ua1,%a1
				261	jsr fp_conv_single2ext
				262	jra fp_getdest
				263
				264	fp_ext:
					/*
					 * Extended operand: three longwords are read from the operand
					 * address in %a1 and stored at (%a0).  The first longword is
					 * repacked on the way: bit 31 ends up in bit 16 and bits 30..16
					 * end up in bits 14..0.  The other two longwords are copied
					 * unchanged.  %a0 is restored to the start of the stored value
					 * before continuing at fp_getdest.
					 */
				265	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
				266	lsr.l #8,%d0 /* immediate shift counts stop at 8 on m68k, so shift by 15 in two steps */
				267	lsr.l #7,%d0
				268	lsr.w #1,%d0 /* one more bit on the low word only; bit 16 stays where it is */
				269	move.l %d0,(%a0)+
				270	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
				271	move.l %d0,(%a0)+
				272	getuser.l (%a1),%d0,fp_err_ua1,%a1
				273	move.l %d0,(%a0)
				274	subq.l #8,%a0 /* undo the two post-increments */
				275	jra fp_getdest
				276
				277	fp_pack:
					/*
					 * Remaining fetch handlers.  Packed operands are rejected through
					 * fp_ill.  Word and byte operands are read from the operand
					 * address in %a1, sign-extended to a longword and converted like a
					 * long.  fp_byte has no jump at its end and falls through into
					 * fp_getdest.
					 */
				278	/* not supported yet */
				279	jra fp_ill
				280
				281	fp_word:
				282	getuser.w (%a1),%d0,fp_err_ua1,%a1
				283	ext.l %d0 /* sign-extend word to longword */
				284	jsr fp_conv_long2ext
				285	jra fp_getdest
				286
				287	fp_double:
					/*
					 * NOTE(review): no getuser here; fp_conv_double2ext (defined
					 * outside this file) is called with %a1 still holding the operand
					 * address, so it presumably reads the operand itself - confirm.
					 */
				288	jsr fp_conv_double2ext
				289	jra fp_getdest
				290
				291	fp_byte:
				292	getuser.b (%a1),%d0,fp_err_ua1,%a1
				293	extb.l %d0 /* sign-extend byte to longword */
				294	jsr fp_conv_long2ext
				295	\| jra fp_getdest
				296
				297	fp_getdest:
					/*
					 * Common tail of the source decoding.  %a0 points at the source
					 * operand on entry and is moved to %a1.  The destination register
					 * number is the 3-bit field at bit offset 22 of %d2 (bits 9..7)
					 * and the operation code is the 7-bit field at offset 25 (bits
					 * 6..0).  %a0/%a1 are pushed, followed by the address of
					 * fp_finalrounding, so a handler that ends in rts (as
					 * fp_fmove_mem2fp does) returns into fp_finalrounding.  The
					 * handler is reached through the 128-entry table below; the
					 * trailing comments give the operation code of the first entry in
					 * each row.
					 * NOTE(review): fp_get_fp_reg is a macro defined outside this file;
					 * it presumably leaves the address of the destination register in
					 * %a0 - confirm.
					 */
				298	move.l %a0,%a1
				299	bfextu %d2{#22,#3},%d0
				300	printf PDECODE,",fp%d\n",1,%d0
				301	fp_get_fp_reg
				302	movem.l %a0/%a1,-(%sp)
				303	pea fp_finalrounding /* becomes the return address of the handler */
				304	bfextu %d2{#25,#7},%d0
				305	jmp ([0f:w,%pc,%d0*4]) /* indexed jump through the longword table at 0: below */
				306
				307	.align 4
				308	0:
				309	.long fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz /* 0x00 */
				310	.long fp_fsqrt, fp_ill, fp_flognp1, fp_ill /* 0x04 */
				311	.long fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill /* 0x08 */
				312	.long fp_fasin, fp_fatanh, fp_fsin, fp_ftan /* 0x0c */
				313	.long fp_fetox, fp_ftwotox, fp_ftentox, fp_ill /* 0x10 */
				314	.long fp_flogn, fp_flog10, fp_flog2, fp_ill /* 0x14 */
				315	.long fp_fabs, fp_fcosh, fp_fneg, fp_ill /* 0x18 */
				316	.long fp_facos, fp_fcos, fp_fgetexp, fp_fgetman /* 0x1c */
				317	.long fp_fdiv, fp_fmod, fp_fadd, fp_fmul /* 0x20 */
				318	.long fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul /* 0x24 */
				319	.long fp_fsub, fp_ill, fp_ill, fp_ill /* 0x28 */
				320	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x2c */
				321	.long fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3 /* 0x30 */
				322	.long fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7 /* 0x34 */
				323	.long fp_fcmp, fp_ill, fp_ftst, fp_ill /* 0x38 */
				324	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x3c */
				325	.long fp_fsmove, fp_fssqrt, fp_ill, fp_ill /* 0x40 */
				326	.long fp_fdmove, fp_fdsqrt, fp_ill, fp_ill /* 0x44 */
				327	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x48 */
				328	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x4c */
				329	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x50 */
				330	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x54 */
				331	.long fp_fsabs, fp_ill, fp_fsneg, fp_ill /* 0x58 */
				332	.long fp_fdabs, fp_ill, fp_fdneg, fp_ill /* 0x5c */
				333	.long fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul /* 0x60 */
				334	.long fp_fddiv, fp_ill, fp_fdadd, fp_fdmul /* 0x64 */
				335	.long fp_fssub, fp_ill, fp_ill, fp_ill /* 0x68 */
				336	.long fp_fdsub, fp_ill, fp_ill, fp_ill /* 0x6c */
				337	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x70 */
				338	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x74 */
				339	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x78 */
				340	.long fp_ill, fp_ill, fp_ill, fp_ill /* 0x7c */
				341
				342	\| Instructions follow
				343
				344	\| Move an (emulated) ROM constant
				345	fp_fmovecr:
					/*
					 * Loads a constant from fp_constants.  Only the low five bits of
					 * %d2 are used as the index, and each table entry is 12 bytes.
					 * The mask 0x801cc0ff holds one bit per entry, bit 31 belonging to
					 * index 0; when the bit for the selected entry is set, INEX2 is
					 * raised.  Finally the low seven bits of %d2 are cleared so that
					 * fp_getdest dispatches to the first entry of its table,
					 * fp_fmove_mem2fp, with %a0 pointing at the constant.
					 * NOTE(review): fp_set_sr is a macro defined outside this file.
					 */
				346	bfextu %d2{#27,#5},%d0
				347	printf PINSTR,"fp_fmovecr #%d",1,%d0
				348	move.l %d0,%d1 /* keep the index for the shift count below */
				349	add.l %d0,%d0
				350	add.l %d1,%d0 /* %d0 = 3 * index */
				351	lea (fp_constants,%d0*4),%a0 /* 3 * index * 4 = 12 bytes per entry */
				352	move.l #0x801cc0ff,%d0
				353	addq.l #1,%d1
				354	lsl.l %d1,%d0 /* shifting by index + 1 moves the bit of this entry into the carry */
				355	jcc 1f
				356	fp_set_sr FPSR_EXC_INEX2 \| INEX2 exception
				357	1: moveq #-128,%d0 \| continue with fmove
				358	and.l %d0,%d2
				359	jra fp_getdest
				360
				361	.data
				362	.align 4
				363	fp_constants:
					/*
					 * Constant table read by fp_fmovecr, which addresses it in steps
					 * of 12 bytes (three longwords per entry).  In each entry written
					 * as .long the first longword carries the exponent in its low
					 * word and the next two longwords carry the mantissa.
					 * NOTE(review): the .extend line presumably emits ten zero
					 * entries of 12 bytes each so that the entries after pi keep their
					 * index - confirm the size emitted by the assembler.
					 */
				364	.long 0x00004000,0xc90fdaa2,0x2168c235 \| pi
				365	.extend 0,0,0,0,0,0,0,0,0,0
				366	.long 0x00003ffd,0x9a209a84,0xfbcff798 \| log10(2)
				367	.long 0x00004000,0xadf85458,0xa2bb4a9a \| e
				368	.long 0x00003fff,0xb8aa3b29,0x5c17f0bc \| log2(e)
				369	.long 0x00003ffd,0xde5bd8a9,0x37287195 \| log10(e)
				370	.long 0x00000000,0x00000000,0x00000000 \| 0.0
				371	.long 0x00003ffe,0xb17217f7,0xd1cf79ac \| ln(2)
				372	.long 0x00004000,0x935d8ddd,0xaaa8ac17 \| ln(10)
				373	\| read this as "1.0 * 2^0" - note the high bit in the mantissa
				374	.long 0x00003fff,0x80000000,0x00000000 \| 10^0
				375	.long 0x00004002,0xa0000000,0x00000000 \| 10^1
				376	.long 0x00004005,0xc8000000,0x00000000 \| 10^2
				377	.long 0x0000400c,0x9c400000,0x00000000 \| 10^4
				378	.long 0x00004019,0xbebc2000,0x00000000 \| 10^8
				379	.long 0x00004034,0x8e1bc9bf,0x04000000 \| 10^16
				380	.long 0x00004069,0x9dc5ada8,0x2b70b59e \| 10^32
				381	.long 0x000040d3,0xc2781f49,0xffcfa6d5 \| 10^64
				382	.long 0x000041a8,0x93ba47c9,0x80e98ce0 \| 10^128
				383	.long 0x00004351,0xaa7eebfb,0x9df9de8e \| 10^256
				384	.long 0x000046a3,0xe319a0ae,0xa60e91c7 \| 10^512
				385	.long 0x00004d48,0xc9767586,0x81750c17 \| 10^1024
				386	.long 0x00005a92,0x9e8b3b5d,0xc53d5de5 \| 10^2048
				387	.long 0x00007525,0xc4605202,0x8a20979b \| 10^4096
				388	.previous
				389
				390	fp_fmove_mem2fp:
					/*
					 * Copies three longwords (12 bytes) from (%a1) to (%a0) and
					 * returns with %a0 pointing at the start of the copy again.
					 * %a1 is left advanced by 8.
					 */
				391	printf PINSTR,"fmove %p,%p\n",2,%a0,%a1
				392	move.l (%a1)+,(%a0)+
				393	move.l (%a1)+,(%a0)+
				394	move.l (%a1),(%a0)
				395	subq.l #8,%a0 /* undo the two post-increments on %a0 */
				396	rts
				397
				398	fpa_fsglmul:
					/*
					 * Front ends for fp_fsglmul and fp_fsgldiv (both defined outside
					 * this file).  They are reached through the fp_getdest table, so
					 * (%sp) holds the return address pushed there; it is replaced by
					 * fp_finalrounding_single_fast before jumping to the real handler.
					 */
				399	move.l #fp_finalrounding_single_fast,(%sp)
				400	jra fp_fsglmul
				401
				402	fpa_fsgldiv:
				403	move.l #fp_finalrounding_single_fast,(%sp)
				404	jra fp_fsgldiv
				405
				406	.macro fp_dosingleprec instr
					/*
					 * fp_dosingleprec instr / fp_dodoubleprec instr: overwrite the
					 * longword at (%sp) with fp_finalrounding_single or
					 * fp_finalrounding_double and jump to the handler \instr.  The
					 * users of these macros are reached through the fp_getdest table,
					 * where (%sp) holds the return address of the handler.
					 */
				407	printf PINSTR,"single "
				408	move.l #fp_finalrounding_single,(%sp)
				409	jra \instr
				410	.endm
				411
				412	.macro fp_dodoubleprec instr
				413	printf PINSTR,"double "
				414	move.l #fp_finalrounding_double,(%sp)
				415	jra \instr
				416	.endm
				417
				418	fp_fsmove:
					/*
					 * Single- and double-precision variants of the move, sqrt, abs,
					 * neg, div, add, mul and sub handlers.  Each label expands
					 * fp_dosingleprec or fp_dodoubleprec with the handler it shares.
					 */
				419	fp_dosingleprec fp_fmove_mem2fp
				420
				421	fp_fssqrt:
				422	fp_dosingleprec fp_fsqrt
				423
				424	fp_fdmove:
				425	fp_dodoubleprec fp_fmove_mem2fp
				426
				427	fp_fdsqrt:
				428	fp_dodoubleprec fp_fsqrt
				429
				430	fp_fsabs:
				431	fp_dosingleprec fp_fabs
				432
				433	fp_fsneg:
				434	fp_dosingleprec fp_fneg
				435
				436	fp_fdabs:
				437	fp_dodoubleprec fp_fabs
				438
				439	fp_fdneg:
				440	fp_dodoubleprec fp_fneg
				441
				442	fp_fsdiv:
				443	fp_dosingleprec fp_fdiv
				444
				445	fp_fsadd:
				446	fp_dosingleprec fp_fadd
				447
				448	fp_fsmul:
				449	fp_dosingleprec fp_fmul
				450
				451	fp_fddiv:
				452	fp_dodoubleprec fp_fdiv
				453
				454	fp_fdadd:
				455	fp_dodoubleprec fp_fadd
				456
				457	fp_fdmul:
				458	fp_dodoubleprec fp_fmul
				459
				460	fp_fssub:
				461	fp_dosingleprec fp_fsub
				462
				463	fp_fdsub:
				464	fp_dodoubleprec fp_fsub
				465
				466	fp_nonstd:
					/*
					 * Reached from fp_scan when the first opcode byte is not 0xf2.
					 * Reads the longword at the emulated PC for the trace output and
					 * returns with %d0 = -1.
					 * NOTE(review): the first printf argument, which is a name such as
					 * PDECODE or PINSTR elsewhere in this file, is empty here -
					 * confirm that this is intended.
					 */
				467	fp_get_pc %a0
				468	getuser.l (%a0),%d0,fp_err_ua1,%a0
				469	printf ,"nonstd ((%08x)=%08x)\n",2,%a0,%d0
				470	moveq #-1,%d0
				471	rts
				472
				473	.data
				474	.align 4
				475
				476	\| data sizes corresponding to the operand formats
				477	fp_datasize:
				478	.word 4, 4, 12, 12, 2, 8, 1, 0 /* bytes for long, single, extended, packed, word, double, byte; index 7 has no format */