aha/arch/m68k/fpsp040/slog2.S
Matt Waddel e00d82d07f [PATCH] Add wording to m68k .S files to help clarify license info
Acked-by: Alan Cox <alan@redhat.com>
Signed-off-by: Matt Waddel <Matt.Waddel@freescale.com>
Cc: Roman Zippel <zippel@linux-m68k.org>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-02-11 21:41:11 -08:00

187 lines
5.1 KiB
ArmAsm

|
| slog2.sa 3.1 12/10/90
|
| The entry point slog10 computes the base-10
| logarithm of an input argument X.
| slog10d does the same except the input value is a
| denormalized number.
| sLog2 and sLog2d are the base-2 analogues.
|
| INPUT: Double-extended value in memory location pointed to
| by address register a0.
|
| OUTPUT: log_10(X) or log_2(X) returned in floating-point
| register fp0.
|
| ACCURACY and MONOTONICITY: The returned result is within 1.7
| ulps in 64 significant bit, i.e. within 0.5003 ulp
| to 53 bits if the result is subsequently rounded
| to double precision. The result is provably monotonic
| in double precision.
|
| SPEED: Two timings are measured, both in the copy-back mode.
| The first one is measured when the function is invoked
| the first time (so the instructions and data are not
| in cache), and the second one is measured when the
| function is reinvoked at the same input argument.
|
| ALGORITHM and IMPLEMENTATION NOTES:
|
| slog10d:
|
| Step 0. If X < 0, create a NaN and raise the invalid operation
| flag. Otherwise, save FPCR in D1; set FpCR to default.
| Notes: Default means round-to-nearest mode, no floating-point
| traps, and precision control = double extended.
|
| Step 1. Call slognd to obtain Y = log(X), the natural log of X.
| Notes: Even if X is denormalized, log(X) is always normalized.
|
| Step 2. Compute log_10(X) = log(X) * (1/log(10)).
| 2.1 Restore the user FPCR
| 2.2 Return ans := Y * INV_L10.
|
|
| slog10:
|
| Step 0. If X < 0, create a NaN and raise the invalid operation
| flag. Otherwise, save FPCR in D1; set FpCR to default.
| Notes: Default means round-to-nearest mode, no floating-point
| traps, and precision control = double extended.
|
| Step 1. Call sLogN to obtain Y = log(X), the natural log of X.
|
| Step 2. Compute log_10(X) = log(X) * (1/log(10)).
| 2.1 Restore the user FPCR
| 2.2 Return ans := Y * INV_L10.
|
|
| sLog2d:
|
| Step 0. If X < 0, create a NaN and raise the invalid operation
| flag. Otherwise, save FPCR in D1; set FpCR to default.
| Notes: Default means round-to-nearest mode, no floating-point
| traps, and precision control = double extended.
|
| Step 1. Call slognd to obtain Y = log(X), the natural log of X.
| Notes: Even if X is denormalized, log(X) is always normalized.
|
| Step 2. Compute log_10(X) = log(X) * (1/log(2)).
| 2.1 Restore the user FPCR
| 2.2 Return ans := Y * INV_L2.
|
|
| sLog2:
|
| Step 0. If X < 0, create a NaN and raise the invalid operation
| flag. Otherwise, save FPCR in D1; set FpCR to default.
| Notes: Default means round-to-nearest mode, no floating-point
| traps, and precision control = double extended.
|
| Step 1. If X is not an integer power of two, i.e., X != 2^k,
| go to Step 3.
|
| Step 2. Return k.
| 2.1 Get integer k, X = 2^k.
| 2.2 Restore the user FPCR.
| 2.3 Return ans := convert-to-double-extended(k).
|
| Step 3. Call sLogN to obtain Y = log(X), the natural log of X.
|
| Step 4. Compute log_2(X) = log(X) * (1/log(2)).
| 4.1 Restore the user FPCR
| 4.2 Return ans := Y * INV_L2.
|
| Copyright (C) Motorola, Inc. 1990
| All Rights Reserved
|
| For details on the license for this file, please see the
| file, README, in this same directory.
|SLOG2 idnt 2,1 | Motorola 040 Floating Point Software Package
|section 8
|xref t_frcinx
|xref t_operr
|xref slogn
|xref slognd
INV_L10: .long 0x3FFD0000,0xDE5BD8A9,0x37287195,0x00000000
INV_L2: .long 0x3FFF0000,0xB8AA3B29,0x5C17F0BC,0x00000000
.global slog10d
slog10d:
|--entry point for Log10(X), X is denormalized
movel (%a0),%d0
blt invalid
movel %d1,-(%sp)
clrl %d1
bsr slognd | ...log(X), X denorm.
fmovel (%sp)+,%fpcr
fmulx INV_L10,%fp0
bra t_frcinx
.global slog10
slog10:
|--entry point for Log10(X), X is normalized
movel (%a0),%d0
blt invalid
movel %d1,-(%sp)
clrl %d1
bsr slogn | ...log(X), X normal.
fmovel (%sp)+,%fpcr
fmulx INV_L10,%fp0
bra t_frcinx
.global slog2d
slog2d:
|--entry point for Log2(X), X is denormalized
movel (%a0),%d0
blt invalid
movel %d1,-(%sp)
clrl %d1
bsr slognd | ...log(X), X denorm.
fmovel (%sp)+,%fpcr
fmulx INV_L2,%fp0
bra t_frcinx
.global slog2
slog2:
|--entry point for Log2(X), X is normalized
movel (%a0),%d0
blt invalid
movel 8(%a0),%d0
bnes continue | ...X is not 2^k
movel 4(%a0),%d0
andl #0x7FFFFFFF,%d0
tstl %d0
bnes continue
|--X = 2^k.
movew (%a0),%d0
andl #0x00007FFF,%d0
subl #0x3FFF,%d0
fmovel %d1,%fpcr
fmovel %d0,%fp0
bra t_frcinx
continue:
movel %d1,-(%sp)
clrl %d1
bsr slogn | ...log(X), X normal.
fmovel (%sp)+,%fpcr
fmulx INV_L2,%fp0
bra t_frcinx
invalid:
bra t_operr
|end