1 /*
2  * fp_scan.S
3  *
4  * Copyright Roman Zippel, 1997.  All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions
8  * are met:
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, and the entire permission notice in its entirety,
11  *    including the disclaimer of warranties.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  * 3. The name of the author may not be used to endorse or promote
16  *    products derived from this software without specific prior
17  *    written permission.
18  *
19  * ALTERNATIVELY, this product may be distributed under the terms of
20  * the GNU General Public License, in which case the provisions of the GPL are
21  * required INSTEAD OF the above restrictions.  (This clause is
22  * necessary due to a potential bad interaction between the GPL and
23  * the restrictions contained in a BSD-style copyright.)
24  *
25  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
26  * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
27  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
28  * DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
29  * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
30  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
31  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
32  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
33  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
34  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
35  * OF THE POSSIBILITY OF SUCH DAMAGE.
36  */
37 
38 #include "fp_emu.h"
39 #include "fp_decode.h"
40 
41 	.globl	fp_scan, fp_datasize
42 
43 	.data
44 
45 | %d2 - first two instr words
46 | %d1 - operand size
47 
48 /* operand formats are:
49 
50 	Long = 0,		i.e. fmove.l
51 	Single,			i.e. fmove.s
52 	Extended,		i.e. fmove.x
53 	Packed-BCD,		i.e. fmove.p
54 	Word,			i.e. fmove.w
55 	Double,			i.e. fmove.d
56 */
57 
58 	.text
59 
60 | On entry:
61 | FPDATA - base of emulated FPU registers
62 
63 fp_scan:
64 | normal fpu instruction? (this excludes fsave/frestore)
65 	fp_get_pc %a0
66 	printf	PDECODE,"%08x: ",1,%a0
67 	getuser.b (%a0),%d0,fp_err_ua1,%a0
68 #if 1
69 	cmp.b	#0xf2,%d0		| cpid = 1
70 #else
71 	cmp.b	#0xfc,%d0		| cpid = 6
72 #endif
73 	jne	fp_nonstd
74 | first two instruction words are kept in %d2
75 	getuser.l (%a0)+,%d2,fp_err_ua1,%a0
76 	fp_put_pc %a0
77 fp_decode_cond:				| separate conditional instr
78 	fp_decode_cond_instr_type
79 
80 	.long	fp_decode_move, fp_fscc
81 	.long	fp_fbccw, fp_fbccl
82 
83 fp_decode_move:				| separate move instr
84 	fp_decode_move_instr_type
85 
86 	.long	fp_fgen_fp, fp_ill
87 	.long	fp_fgen_ea, fp_fmove_fp2mem
88 	.long	fp_fmovem_cr, fp_fmovem_cr
89 	.long	fp_fmovem_fp, fp_fmovem_fp
90 
91 | now all arithmetic instr and a few move instr are left
92 fp_fgen_fp:				| source is a fpu register
93 	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
94 	fp_decode_sourcespec
95 	printf	PDECODE,"f<op>.x fp%d",1,%d0
96 	fp_get_fp_reg
97 	lea	(FPD_TEMPFP1,FPDATA),%a1 | copy src into a temp location
98 	move.l	(%a0)+,(%a1)+
99 	move.l	(%a0)+,(%a1)+
100 	move.l	(%a0),(%a1)
101 	lea	(-8,%a1),%a0
102 	jra	fp_getdest
103 
104 fp_fgen_ea:				| source is <ea>
105 	clr.b	(FPD_FPSR+2,FPDATA)	| clear the exception byte
106 	| sort out fmovecr, keep data size in %d1
107 	fp_decode_sourcespec
108 	cmp.w	#7,%d0
109 	jeq	fp_fmovecr
110 	move.w	%d0,%d1			| store data size twice in %d1
111 	swap	%d1			| one can be trashed below
112 	move.w	%d0,%d1
113 #ifdef FPU_EMU_DEBUG
114 	lea	0f,%a0
115 	clr.l	%d0
116 	move.b	(%a0,%d1.w),%d0
117 	printf	PDECODE,"f<op>.%c ",1,%d0
118 
119 	.data
120 0:	.byte	'l','s','x','p','w','d','b',0
121 	.previous
122 #endif
123 
124 /*
125 	fp_getsource, fp_getdest
126 
127 	basically, we end up with a pointer to the source operand in
128 	%a1, and a pointer to the destination operand in %a0.  both
129 	are, of course, 96-bit extended floating point numbers.
130 */
131 
132 fp_getsource:
133 	| decode addressing mode for source
134 	fp_decode_addr_mode
135 
136 	.long	fp_data, fp_ill
137 	.long	fp_indirect, fp_postinc
138 	.long	fp_predecr, fp_disp16
139 	.long	fp_extmode0, fp_extmode1
140 
141 	| addressing mode: data register direct
142 fp_data:
143 	fp_mode_data_direct
144 	jsr	fp_get_data_reg
145 	lea	(FPD_TEMPFP1,FPDATA),%a0
146 	jmp	([0f:w,%pc,%d1.w*4])
147 
148 	.align	4
149 0:
150 	.long	fp_data_long, fp_data_single
151 	.long	fp_ill, fp_ill
152 	.long	fp_data_word, fp_ill
153 	.long	fp_data_byte, fp_ill
154 
155 	| data types that fit in an integer data register
156 fp_data_byte:
157 	extb.l	%d0
158 	jra	fp_data_long
159 
160 fp_data_word:
161 	ext.l	%d0
162 
163 fp_data_long:
164 	jsr	fp_conv_long2ext
165 	jra	fp_getdest
166 
167 fp_data_single:
168 	jsr	fp_conv_single2ext
169 	jra	fp_getdest
170 
171 	| addressing mode: address register indirect
172 fp_indirect:
173 	fp_mode_addr_indirect
174 	jra	fp_fetchsource
175 
176 	| addressing mode: address register indirect with postincrement
177 fp_postinc:
178 	fp_mode_addr_indirect_postinc
179 	jra	fp_fetchsource
180 
181 	| addressing mode: address register indirect with predecrement
182 fp_predecr:
183 	fp_mode_addr_indirect_predec
184 	jra	fp_fetchsource
185 
186 	| addressing mode: address register/programm counter indirect
187 	|		   with 16bit displacement
188 fp_disp16:
189 	fp_mode_addr_indirect_disp16
190 	jra	fp_fetchsource
191 
192 	| all other indirect addressing modes will finally end up here
193 fp_extmode0:
194 	fp_mode_addr_indirect_extmode0
195 	jra	fp_fetchsource
196 
197 | all pc relative addressing modes and immediate/absolute modes end up here
198 | the first ones are sent to fp_extmode0 or fp_disp16
199 | and only the latter are handled here
200 fp_extmode1:
201 	fp_decode_addr_reg
202 	jmp	([0f:w,%pc,%d0*4])
203 
204 	.align	4
205 0:
206 	.long	fp_abs_short, fp_abs_long
207 	.long	fp_disp16, fp_extmode0
208 	.long	fp_immediate, fp_ill
209 	.long	fp_ill, fp_ill
210 
211 	| addressing mode: absolute short
212 fp_abs_short:
213 	fp_mode_abs_short
214 	jra	fp_fetchsource
215 
216 	| addressing mode: absolute long
217 fp_abs_long:
218 	fp_mode_abs_long
219 	jra	fp_fetchsource
220 
221 	| addressing mode: immediate data
222 fp_immediate:
223 	printf	PDECODE,"#"
224 	fp_get_pc %a0
225 	move.w	(fp_datasize,%d1.w*2),%d0
226 	addq.w	#1,%d0
227 	and.w	#-2,%d0
228 #ifdef FPU_EMU_DEBUG
229 	movem.l	%d0/%d1,-(%sp)
230 	movel	%a0,%a1
231 	clr.l	%d1
232 	jra	2f
233 1:	getuser.b (%a1)+,%d1,fp_err_ua1,%a1
234 	printf	PDECODE,"%02x",1,%d1
235 2:	dbra	%d0,1b
236 	movem.l	(%sp)+,%d0/%d1
237 #endif
238 	lea	(%a0,%d0.w),%a1
239 	fp_put_pc %a1
240 |	jra	fp_fetchsource
241 
242 fp_fetchsource:
243 	move.l	%a0,%a1
244 	swap	%d1
245 	lea	(FPD_TEMPFP1,FPDATA),%a0
246 	jmp	([0f:w,%pc,%d1.w*4])
247 
248 	.align	4
249 0:	.long	fp_long, fp_single
250 	.long	fp_ext, fp_pack
251 	.long	fp_word, fp_double
252 	.long	fp_byte, fp_ill
253 
254 fp_long:
255 	getuser.l (%a1),%d0,fp_err_ua1,%a1
256 	jsr	fp_conv_long2ext
257 	jra	fp_getdest
258 
259 fp_single:
260 	getuser.l (%a1),%d0,fp_err_ua1,%a1
261 	jsr	fp_conv_single2ext
262 	jra	fp_getdest
263 
264 fp_ext:
265 	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
266 	lsr.l	#8,%d0
267 	lsr.l	#7,%d0
268 	lsr.w	#1,%d0
269 	move.l	%d0,(%a0)+
270 	getuser.l (%a1)+,%d0,fp_err_ua1,%a1
271 	move.l	%d0,(%a0)+
272 	getuser.l (%a1),%d0,fp_err_ua1,%a1
273 	move.l	%d0,(%a0)
274 	subq.l	#8,%a0
275 	jra	fp_getdest
276 
277 fp_pack:
278 	/* not supported yet */
279 	jra	fp_ill
280 
281 fp_word:
282 	getuser.w (%a1),%d0,fp_err_ua1,%a1
283 	ext.l	%d0
284 	jsr	fp_conv_long2ext
285 	jra	fp_getdest
286 
287 fp_double:
288 	jsr	fp_conv_double2ext
289 	jra	fp_getdest
290 
291 fp_byte:
292 	getuser.b (%a1),%d0,fp_err_ua1,%a1
293 	extb.l	%d0
294 	jsr	fp_conv_long2ext
295 |	jra	fp_getdest
296 
297 fp_getdest:
298 	move.l	%a0,%a1
299 	bfextu	%d2{#22,#3},%d0
300 	printf	PDECODE,",fp%d\n",1,%d0
301 	fp_get_fp_reg
302 	movem.l	%a0/%a1,-(%sp)
303 	pea	fp_finalrounding
304 	bfextu	%d2{#25,#7},%d0
305 	jmp	([0f:w,%pc,%d0*4])
306 
307 	.align	4
308 0:
309 	.long	fp_fmove_mem2fp, fp_fint, fp_fsinh, fp_fintrz
310 	.long	fp_fsqrt, fp_ill, fp_flognp1, fp_ill
311 	.long	fp_fetoxm1, fp_ftanh, fp_fatan, fp_ill
312 	.long	fp_fasin, fp_fatanh, fp_fsin, fp_ftan
313 	.long	fp_fetox, fp_ftwotox, fp_ftentox, fp_ill
314 	.long	fp_flogn, fp_flog10, fp_flog2, fp_ill
315 	.long	fp_fabs, fp_fcosh, fp_fneg, fp_ill
316 	.long	fp_facos, fp_fcos, fp_fgetexp, fp_fgetman
317 	.long	fp_fdiv, fp_fmod, fp_fadd, fp_fmul
318 	.long	fpa_fsgldiv, fp_frem, fp_fscale, fpa_fsglmul
319 	.long	fp_fsub, fp_ill, fp_ill, fp_ill
320 	.long	fp_ill, fp_ill, fp_ill, fp_ill
321 	.long	fp_fsincos0, fp_fsincos1, fp_fsincos2, fp_fsincos3
322 	.long	fp_fsincos4, fp_fsincos5, fp_fsincos6, fp_fsincos7
323 	.long	fp_fcmp, fp_ill, fp_ftst, fp_ill
324 	.long	fp_ill, fp_ill, fp_ill, fp_ill
325 	.long	fp_fsmove, fp_fssqrt, fp_ill, fp_ill
326 	.long	fp_fdmove, fp_fdsqrt, fp_ill, fp_ill
327 	.long	fp_ill, fp_ill, fp_ill, fp_ill
328 	.long	fp_ill, fp_ill, fp_ill, fp_ill
329 	.long	fp_ill, fp_ill, fp_ill, fp_ill
330 	.long	fp_ill, fp_ill, fp_ill, fp_ill
331 	.long	fp_fsabs, fp_ill, fp_fsneg, fp_ill
332 	.long	fp_fdabs, fp_ill, fp_fdneg, fp_ill
333 	.long	fp_fsdiv, fp_ill, fp_fsadd, fp_fsmul
334 	.long	fp_fddiv, fp_ill, fp_fdadd, fp_fdmul
335 	.long	fp_fssub, fp_ill, fp_ill, fp_ill
336 	.long	fp_fdsub, fp_ill, fp_ill, fp_ill
337 	.long	fp_ill, fp_ill, fp_ill, fp_ill
338 	.long	fp_ill, fp_ill, fp_ill, fp_ill
339 	.long	fp_ill, fp_ill, fp_ill, fp_ill
340 	.long	fp_ill, fp_ill, fp_ill, fp_ill
341 
342 	| Instructions follow
343 
344 	| Move an (emulated) ROM constant
345 fp_fmovecr:
346 	bfextu	%d2{#27,#5},%d0
347 	printf	PINSTR,"fp_fmovecr #%d",1,%d0
348 	move.l	%d0,%d1
349 	add.l	%d0,%d0
350 	add.l	%d1,%d0
351 	lea	(fp_constants,%d0*4),%a0
352 	move.l	#0x801cc0ff,%d0
353 	addq.l	#1,%d1
354 	lsl.l	%d1,%d0
355 	jcc	1f
356 	fp_set_sr FPSR_EXC_INEX2			| INEX2 exception
357 1:	moveq	#-128,%d0				| continue with fmove
358 	and.l	%d0,%d2
359 	jra	fp_getdest
360 
361 	.data
362 	.align	4
363 fp_constants:
364 	.long	0x00004000,0xc90fdaa2,0x2168c235	| pi
365 	.extend	0,0,0,0,0,0,0,0,0,0
366 	.long	0x00003ffd,0x9a209a84,0xfbcff798	| log10(2)
367 	.long	0x00004000,0xadf85458,0xa2bb4a9a	| e
368 	.long	0x00003fff,0xb8aa3b29,0x5c17f0bc	| log2(e)
369 	.long	0x00003ffd,0xde5bd8a9,0x37287195	| log10(e)
370 	.long	0x00000000,0x00000000,0x00000000	| 0.0
371 	.long	0x00003ffe,0xb17217f7,0xd1cf79ac	| 1n(2)
372 	.long	0x00004000,0x935d8ddd,0xaaa8ac17	| 1n(10)
373 	| read this as "1.0 * 2^0" - note the high bit in the mantissa
374 	.long	0x00003fff,0x80000000,0x00000000	| 10^0
375 	.long	0x00004002,0xa0000000,0x00000000	| 10^1
376 	.long	0x00004005,0xc8000000,0x00000000	| 10^2
377 	.long	0x0000400c,0x9c400000,0x00000000	| 10^4
378 	.long	0x00004019,0xbebc2000,0x00000000	| 10^8
379 	.long	0x00004034,0x8e1bc9bf,0x04000000	| 10^16
380 	.long	0x00004069,0x9dc5ada8,0x2b70b59e	| 10^32
381 	.long	0x000040d3,0xc2781f49,0xffcfa6d5	| 10^64
382 	.long	0x000041a8,0x93ba47c9,0x80e98ce0	| 10^128
383 	.long	0x00004351,0xaa7eebfb,0x9df9de8e	| 10^256
384 	.long	0x000046a3,0xe319a0ae,0xa60e91c7	| 10^512
385 	.long	0x00004d48,0xc9767586,0x81750c17	| 10^1024
386 	.long	0x00005a92,0x9e8b3b5d,0xc53d5de5	| 10^2048
387 	.long	0x00007525,0xc4605202,0x8a20979b	| 10^4096
388 	.previous
389 
390 fp_fmove_mem2fp:
391 	printf	PINSTR,"fmove %p,%p\n",2,%a0,%a1
392 	move.l	(%a1)+,(%a0)+
393 	move.l	(%a1)+,(%a0)+
394 	move.l	(%a1),(%a0)
395 	subq.l	#8,%a0
396 	rts
397 
398 fpa_fsglmul:
399 	move.l	#fp_finalrounding_single_fast,(%sp)
400 	jra	fp_fsglmul
401 
402 fpa_fsgldiv:
403 	move.l	#fp_finalrounding_single_fast,(%sp)
404 	jra	fp_fsgldiv
405 
406 .macro	fp_dosingleprec instr
407 	printf	PINSTR,"single "
408 	move.l	#fp_finalrounding_single,(%sp)
409 	jra	\instr
410 .endm
411 
412 .macro	fp_dodoubleprec instr
413 	printf	PINSTR,"double "
414 	move.l	#fp_finalrounding_double,(%sp)
415 	jra	\instr
416 .endm
417 
418 fp_fsmove:
419 	fp_dosingleprec fp_fmove_mem2fp
420 
421 fp_fssqrt:
422 	fp_dosingleprec fp_fsqrt
423 
424 fp_fdmove:
425 	fp_dodoubleprec fp_fmove_mem2fp
426 
427 fp_fdsqrt:
428 	fp_dodoubleprec fp_fsqrt
429 
430 fp_fsabs:
431 	fp_dosingleprec fp_fabs
432 
433 fp_fsneg:
434 	fp_dosingleprec fp_fneg
435 
436 fp_fdabs:
437 	fp_dodoubleprec fp_fabs
438 
439 fp_fdneg:
440 	fp_dodoubleprec fp_fneg
441 
442 fp_fsdiv:
443 	fp_dosingleprec fp_fdiv
444 
445 fp_fsadd:
446 	fp_dosingleprec fp_fadd
447 
448 fp_fsmul:
449 	fp_dosingleprec fp_fmul
450 
451 fp_fddiv:
452 	fp_dodoubleprec fp_fdiv
453 
454 fp_fdadd:
455 	fp_dodoubleprec fp_fadd
456 
457 fp_fdmul:
458 	fp_dodoubleprec fp_fmul
459 
460 fp_fssub:
461 	fp_dosingleprec fp_fsub
462 
463 fp_fdsub:
464 	fp_dodoubleprec fp_fsub
465 
466 fp_nonstd:
467 	fp_get_pc %a0
468 	getuser.l (%a0),%d0,fp_err_ua1,%a0
469 	printf	,"nonstd ((%08x)=%08x)\n",2,%a0,%d0
470 	moveq	#-1,%d0
471 	rts
472 
473 	.data
474 	.align	4
475 
476 	| data sizes corresponding to the operand formats
477 fp_datasize:
478 	.word	4, 4, 12, 12, 2, 8, 1, 0
479