18c2ecf20Sopenharmony_ci|
28c2ecf20Sopenharmony_ci|	slog2.sa 3.1 12/10/90
38c2ecf20Sopenharmony_ci|
48c2ecf20Sopenharmony_ci|       The entry point slog10 computes the base-10
58c2ecf20Sopenharmony_ci|	logarithm of an input argument X.
68c2ecf20Sopenharmony_ci|	slog10d does the same except the input value is a
78c2ecf20Sopenharmony_ci|	denormalized number.
88c2ecf20Sopenharmony_ci|	sLog2 and sLog2d are the base-2 analogues.
98c2ecf20Sopenharmony_ci|
108c2ecf20Sopenharmony_ci|       INPUT:	Double-extended value in memory location pointed to
118c2ecf20Sopenharmony_ci|		by address register a0.
128c2ecf20Sopenharmony_ci|
138c2ecf20Sopenharmony_ci|       OUTPUT: log_10(X) or log_2(X) returned in floating-point
148c2ecf20Sopenharmony_ci|		register fp0.
158c2ecf20Sopenharmony_ci|
168c2ecf20Sopenharmony_ci|       ACCURACY and MONOTONICITY: The returned result is within 1.7
178c2ecf20Sopenharmony_ci|		ulps in 64 significant bit, i.e. within 0.5003 ulp
188c2ecf20Sopenharmony_ci|		to 53 bits if the result is subsequently rounded
198c2ecf20Sopenharmony_ci|		to double precision. The result is provably monotonic
208c2ecf20Sopenharmony_ci|		in double precision.
218c2ecf20Sopenharmony_ci|
228c2ecf20Sopenharmony_ci|       SPEED:	Two timings are measured, both in the copy-back mode.
238c2ecf20Sopenharmony_ci|		The first one is measured when the function is invoked
248c2ecf20Sopenharmony_ci|		the first time (so the instructions and data are not
258c2ecf20Sopenharmony_ci|		in cache), and the second one is measured when the
268c2ecf20Sopenharmony_ci|		function is reinvoked at the same input argument.
278c2ecf20Sopenharmony_ci|
288c2ecf20Sopenharmony_ci|       ALGORITHM and IMPLEMENTATION NOTES:
298c2ecf20Sopenharmony_ci|
308c2ecf20Sopenharmony_ci|       slog10d:
318c2ecf20Sopenharmony_ci|
328c2ecf20Sopenharmony_ci|       Step 0.   If X < 0, create a NaN and raise the invalid operation
338c2ecf20Sopenharmony_ci|                 flag. Otherwise, save FPCR in D1; set FpCR to default.
348c2ecf20Sopenharmony_ci|       Notes:    Default means round-to-nearest mode, no floating-point
358c2ecf20Sopenharmony_ci|                 traps, and precision control = double extended.
368c2ecf20Sopenharmony_ci|
378c2ecf20Sopenharmony_ci|       Step 1.   Call slognd to obtain Y = log(X), the natural log of X.
388c2ecf20Sopenharmony_ci|       Notes:    Even if X is denormalized, log(X) is always normalized.
398c2ecf20Sopenharmony_ci|
408c2ecf20Sopenharmony_ci|       Step 2.   Compute log_10(X) = log(X) * (1/log(10)).
418c2ecf20Sopenharmony_ci|            2.1  Restore the user FPCR
428c2ecf20Sopenharmony_ci|            2.2  Return ans := Y * INV_L10.
438c2ecf20Sopenharmony_ci|
448c2ecf20Sopenharmony_ci|
458c2ecf20Sopenharmony_ci|       slog10:
468c2ecf20Sopenharmony_ci|
478c2ecf20Sopenharmony_ci|       Step 0.   If X < 0, create a NaN and raise the invalid operation
488c2ecf20Sopenharmony_ci|                 flag. Otherwise, save FPCR in D1; set FpCR to default.
498c2ecf20Sopenharmony_ci|       Notes:    Default means round-to-nearest mode, no floating-point
508c2ecf20Sopenharmony_ci|                 traps, and precision control = double extended.
518c2ecf20Sopenharmony_ci|
528c2ecf20Sopenharmony_ci|       Step 1.   Call sLogN to obtain Y = log(X), the natural log of X.
538c2ecf20Sopenharmony_ci|
548c2ecf20Sopenharmony_ci|       Step 2.   Compute log_10(X) = log(X) * (1/log(10)).
558c2ecf20Sopenharmony_ci|            2.1  Restore the user FPCR
568c2ecf20Sopenharmony_ci|            2.2  Return ans := Y * INV_L10.
578c2ecf20Sopenharmony_ci|
588c2ecf20Sopenharmony_ci|
598c2ecf20Sopenharmony_ci|       sLog2d:
608c2ecf20Sopenharmony_ci|
618c2ecf20Sopenharmony_ci|       Step 0.   If X < 0, create a NaN and raise the invalid operation
628c2ecf20Sopenharmony_ci|                 flag. Otherwise, save FPCR in D1; set FpCR to default.
638c2ecf20Sopenharmony_ci|       Notes:    Default means round-to-nearest mode, no floating-point
648c2ecf20Sopenharmony_ci|                 traps, and precision control = double extended.
658c2ecf20Sopenharmony_ci|
668c2ecf20Sopenharmony_ci|       Step 1.   Call slognd to obtain Y = log(X), the natural log of X.
678c2ecf20Sopenharmony_ci|       Notes:    Even if X is denormalized, log(X) is always normalized.
688c2ecf20Sopenharmony_ci|
698c2ecf20Sopenharmony_ci|       Step 2.   Compute log_10(X) = log(X) * (1/log(2)).
708c2ecf20Sopenharmony_ci|            2.1  Restore the user FPCR
718c2ecf20Sopenharmony_ci|            2.2  Return ans := Y * INV_L2.
728c2ecf20Sopenharmony_ci|
738c2ecf20Sopenharmony_ci|
748c2ecf20Sopenharmony_ci|       sLog2:
758c2ecf20Sopenharmony_ci|
768c2ecf20Sopenharmony_ci|       Step 0.   If X < 0, create a NaN and raise the invalid operation
778c2ecf20Sopenharmony_ci|                 flag. Otherwise, save FPCR in D1; set FpCR to default.
788c2ecf20Sopenharmony_ci|       Notes:    Default means round-to-nearest mode, no floating-point
798c2ecf20Sopenharmony_ci|                 traps, and precision control = double extended.
808c2ecf20Sopenharmony_ci|
818c2ecf20Sopenharmony_ci|       Step 1.   If X is not an integer power of two, i.e., X != 2^k,
828c2ecf20Sopenharmony_ci|                 go to Step 3.
838c2ecf20Sopenharmony_ci|
848c2ecf20Sopenharmony_ci|       Step 2.   Return k.
858c2ecf20Sopenharmony_ci|            2.1  Get integer k, X = 2^k.
868c2ecf20Sopenharmony_ci|            2.2  Restore the user FPCR.
878c2ecf20Sopenharmony_ci|            2.3  Return ans := convert-to-double-extended(k).
888c2ecf20Sopenharmony_ci|
898c2ecf20Sopenharmony_ci|       Step 3.   Call sLogN to obtain Y = log(X), the natural log of X.
908c2ecf20Sopenharmony_ci|
918c2ecf20Sopenharmony_ci|       Step 4.   Compute log_2(X) = log(X) * (1/log(2)).
928c2ecf20Sopenharmony_ci|            4.1  Restore the user FPCR
938c2ecf20Sopenharmony_ci|            4.2  Return ans := Y * INV_L2.
948c2ecf20Sopenharmony_ci|
958c2ecf20Sopenharmony_ci
968c2ecf20Sopenharmony_ci|		Copyright (C) Motorola, Inc. 1990
978c2ecf20Sopenharmony_ci|			All Rights Reserved
988c2ecf20Sopenharmony_ci|
998c2ecf20Sopenharmony_ci|       For details on the license for this file, please see the
1008c2ecf20Sopenharmony_ci|       file, README, in this same directory.
1018c2ecf20Sopenharmony_ci
1028c2ecf20Sopenharmony_ci|SLOG2    idnt    2,1 | Motorola 040 Floating Point Software Package
1038c2ecf20Sopenharmony_ci
1048c2ecf20Sopenharmony_ci	|section	8
1058c2ecf20Sopenharmony_ci
1068c2ecf20Sopenharmony_ci	|xref	t_frcinx
1078c2ecf20Sopenharmony_ci	|xref	t_operr
1088c2ecf20Sopenharmony_ci	|xref	slogn
1098c2ecf20Sopenharmony_ci	|xref	slognd
1108c2ecf20Sopenharmony_ci
1118c2ecf20Sopenharmony_ciINV_L10:  .long 0x3FFD0000,0xDE5BD8A9,0x37287195,0x00000000
1128c2ecf20Sopenharmony_ci
1138c2ecf20Sopenharmony_ciINV_L2:   .long 0x3FFF0000,0xB8AA3B29,0x5C17F0BC,0x00000000
1148c2ecf20Sopenharmony_ci
1158c2ecf20Sopenharmony_ci	.global	slog10d
1168c2ecf20Sopenharmony_cislog10d:
1178c2ecf20Sopenharmony_ci|--entry point for Log10(X), X is denormalized
1188c2ecf20Sopenharmony_ci	movel		(%a0),%d0
1198c2ecf20Sopenharmony_ci	blt		invalid
1208c2ecf20Sopenharmony_ci	movel		%d1,-(%sp)
1218c2ecf20Sopenharmony_ci	clrl		%d1
1228c2ecf20Sopenharmony_ci	bsr		slognd			| ...log(X), X denorm.
1238c2ecf20Sopenharmony_ci	fmovel		(%sp)+,%fpcr
1248c2ecf20Sopenharmony_ci	fmulx		INV_L10,%fp0
1258c2ecf20Sopenharmony_ci	bra		t_frcinx
1268c2ecf20Sopenharmony_ci
1278c2ecf20Sopenharmony_ci	.global	slog10
1288c2ecf20Sopenharmony_cislog10:
1298c2ecf20Sopenharmony_ci|--entry point for Log10(X), X is normalized
1308c2ecf20Sopenharmony_ci
1318c2ecf20Sopenharmony_ci	movel		(%a0),%d0
1328c2ecf20Sopenharmony_ci	blt		invalid
1338c2ecf20Sopenharmony_ci	movel		%d1,-(%sp)
1348c2ecf20Sopenharmony_ci	clrl		%d1
1358c2ecf20Sopenharmony_ci	bsr		slogn			| ...log(X), X normal.
1368c2ecf20Sopenharmony_ci	fmovel		(%sp)+,%fpcr
1378c2ecf20Sopenharmony_ci	fmulx		INV_L10,%fp0
1388c2ecf20Sopenharmony_ci	bra		t_frcinx
1398c2ecf20Sopenharmony_ci
1408c2ecf20Sopenharmony_ci
1418c2ecf20Sopenharmony_ci	.global	slog2d
1428c2ecf20Sopenharmony_cislog2d:
1438c2ecf20Sopenharmony_ci|--entry point for Log2(X), X is denormalized
1448c2ecf20Sopenharmony_ci
1458c2ecf20Sopenharmony_ci	movel		(%a0),%d0
1468c2ecf20Sopenharmony_ci	blt		invalid
1478c2ecf20Sopenharmony_ci	movel		%d1,-(%sp)
1488c2ecf20Sopenharmony_ci	clrl		%d1
1498c2ecf20Sopenharmony_ci	bsr		slognd			| ...log(X), X denorm.
1508c2ecf20Sopenharmony_ci	fmovel		(%sp)+,%fpcr
1518c2ecf20Sopenharmony_ci	fmulx		INV_L2,%fp0
1528c2ecf20Sopenharmony_ci	bra		t_frcinx
1538c2ecf20Sopenharmony_ci
1548c2ecf20Sopenharmony_ci	.global	slog2
1558c2ecf20Sopenharmony_cislog2:
1568c2ecf20Sopenharmony_ci|--entry point for Log2(X), X is normalized
1578c2ecf20Sopenharmony_ci	movel		(%a0),%d0
1588c2ecf20Sopenharmony_ci	blt		invalid
1598c2ecf20Sopenharmony_ci
1608c2ecf20Sopenharmony_ci	movel		8(%a0),%d0
1618c2ecf20Sopenharmony_ci	bnes		continue		| ...X is not 2^k
1628c2ecf20Sopenharmony_ci
1638c2ecf20Sopenharmony_ci	movel		4(%a0),%d0
1648c2ecf20Sopenharmony_ci	andl		#0x7FFFFFFF,%d0
1658c2ecf20Sopenharmony_ci	tstl		%d0
1668c2ecf20Sopenharmony_ci	bnes		continue
1678c2ecf20Sopenharmony_ci
1688c2ecf20Sopenharmony_ci|--X = 2^k.
1698c2ecf20Sopenharmony_ci	movew		(%a0),%d0
1708c2ecf20Sopenharmony_ci	andl		#0x00007FFF,%d0
1718c2ecf20Sopenharmony_ci	subl		#0x3FFF,%d0
1728c2ecf20Sopenharmony_ci	fmovel		%d1,%fpcr
1738c2ecf20Sopenharmony_ci	fmovel		%d0,%fp0
1748c2ecf20Sopenharmony_ci	bra		t_frcinx
1758c2ecf20Sopenharmony_ci
1768c2ecf20Sopenharmony_cicontinue:
1778c2ecf20Sopenharmony_ci	movel		%d1,-(%sp)
1788c2ecf20Sopenharmony_ci	clrl		%d1
1798c2ecf20Sopenharmony_ci	bsr		slogn			| ...log(X), X normal.
1808c2ecf20Sopenharmony_ci	fmovel		(%sp)+,%fpcr
1818c2ecf20Sopenharmony_ci	fmulx		INV_L2,%fp0
1828c2ecf20Sopenharmony_ci	bra		t_frcinx
1838c2ecf20Sopenharmony_ci
1848c2ecf20Sopenharmony_ciinvalid:
1858c2ecf20Sopenharmony_ci	bra		t_operr
1868c2ecf20Sopenharmony_ci
1878c2ecf20Sopenharmony_ci	|end
188