Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | | |
| 2 | | sacos.sa 3.3 12/19/90 |
| 3 | | |
| 4 | | Description: The entry point sAcos computes the inverse cosine of |
| 5 | | an input argument; sAcosd does the same except for denormalized |
| 6 | | input. |
| 7 | | |
| 8 | | Input: Double-extended number X in location pointed to |
| 9 | | by address register a0. |
| 10 | | |
| 11 | | Output: The value arccos(X) returned in floating-point register Fp0. |
| 12 | | |
| 13 | | Accuracy and Monotonicity: The returned result is within 3 ulps in |
| 14 | | 64 significant bits, i.e. within 0.5001 ulp to 53 bits if the |
| 15 | | result is subsequently rounded to double precision. The |
| 16 | | result is provably monotonic in double precision. |
| 17 | | |
| 18 | | Speed: The program sACOS takes approximately 310 cycles. |
| 19 | | |
| 20 | | Algorithm: |
| 21 | | |
| 22 | | ACOS |
| 23 | | 1. If |X| >= 1, go to 3. |
| 24 | | |
| 25 | | 2. (|X| < 1) Calculate acos(X) by |
| 26 | | z := (1-X) / (1+X) |
| 27 | | acos(X) = 2 * atan( sqrt(z) ). |
| 28 | | Exit. |
| 29 | | |
| 30 | | 3. If |X| > 1, go to 5. |
| 31 | | |
| 32 | | 4. (|X| = 1) If X > 0, return 0. Otherwise, return Pi. Exit. |
| 33 | | |
| 34 | | 5. (|X| > 1) Generate an invalid operation by 0 * infinity. |
| 35 | | Exit. |
| 36 | | |
| 37 | |
| 38 | | Copyright (C) Motorola, Inc. 1990 |
| 39 | | All Rights Reserved |
| 40 | | |
Matt Waddel | e00d82d | 2006-02-11 17:55:48 -0800 | [diff] [blame] | 41 | | For details on the license for this file, please see the |
| 42 | | file, README, in this same directory. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 43 | |
| 44 | |SACOS idnt 2,1 | Motorola 040 Floating Point Software Package |
| 45 | |
| 46 | |section 8 |
| 47 | |
|--Extended-precision constants loaded with fmovex.  Each entry is four
|--longs: sign/exponent in the upper half of the first long, the 64-bit
|--mantissa in the next two longs, and one long of zero padding.
PI:	.long	0x40000000		| pi:   exponent 0x4000 (2^1)
	.long	0xC90FDAA2,0x2168C235	|       mantissa
	.long	0x00000000		|       padding
PIBY2:	.long	0x3FFF0000		| pi/2: exponent 0x3FFF (2^0)
	.long	0xC90FDAA2,0x2168C235	|       mantissa (same as pi)
	.long	0x00000000		|       padding
| 50 | |
| 51 | |xref t_operr |
| 52 | |xref t_frcinx |
| 53 | |xref satan |
| 54 | |
|
|	sacosd --- arccos(X) entry point for denormalized X
|
|	Input:	d1 = user's fpcr (rounding mode/precision).
|	Output:	fp0 = pi/2, rounded according to the user's fpcr.
|	Exit:	branches to t_frcinx.
|
	.global	sacosd
sacosd:
|--For denormalized X, acos(X) is returned as pi/2.
	fmovel	%d1,%fpcr		| install user's rounding mode/precision
					| first, so the load below rounds with it
	fmovex	PIBY2,%fp0		| fp0 = pi/2
	bra	t_frcinx
| 61 | |
|
|	sacos --- arccos(X) for an extended-precision X
|
|	Input:	a0 = address of X.  The memory at (a0) is overwritten
|		on the |X| < 1 path.
|		d1 = user's fpcr (rounding mode/precision).
|	Output:	fp0 = arccos(X).
|	Exits:	t_frcinx for the inexact results,
|		t_operr  when |X| > 1,
|		rts      for acos(+1) = 0, which is exact.
|	Scratch: d0, fp1 (satan may use more -- not visible from here).
|
	.global	sacos
sacos:
	fmovex	(%a0),%fp0		| fp0 = X

|--Build a 32-bit key in d0: sign/exponent in the high word, the top
|--16 mantissa bits in the low word.  With the sign bit cleared, a
|--single integer compare against 0x3FFF8000 (the key of 1.0) tells
|--whether |X| >= 1.
	movel	(%a0),%d0		| high word = sign/exponent
	movew	4(%a0),%d0		| low word  = upper 16 mantissa bits
	andil	#0x7FFFFFFF,%d0		| drop the sign
	cmpil	#0x3FFF8000,%d0
	bges	ACOSBIG			| |X| >= 1

|--Usual case, |X| < 1:
|--	acos(X) = 2 * atan( sqrt( (1-X)/(1+X) ) )

	fmoves	#0x3F800000,%fp1	| fp1 = 1.0 (single-precision image)
	faddx	%fp0,%fp1		| fp1 = 1+X
	fnegx	%fp0			| fp0 = -X
	fadds	#0x3F800000,%fp0	| fp0 = 1-X
	fdivx	%fp1,%fp0		| fp0 = (1-X)/(1+X)
	fsqrtx	%fp0			| fp0 = sqrt((1-X)/(1+X))
	fmovemx	%fp0-%fp0,(%a0)		| overwrite the input at (a0)
	movel	%d1,-(%sp)		| keep the user's fpcr across the call
	moveq	#0,%d1			| satan is entered with d1 = 0
	bsr	satan			| fp0 = atan(sqrt((1-X)/(1+X)))
	fmovel	(%sp)+,%fpcr		| pop the saved value straight into fpcr
	faddx	%fp0,%fp0		| fp0 = 2 * atan(...)
	bra	t_frcinx

ACOSBIG:
|--|X| >= 1 by the integer key; decide between |X| > 1 and |X| = 1.
	fabsx	%fp0			| fp0 = |X|
	fcmps	#0x3F800000,%fp0	| compare |X| with 1.0
	fbgt	t_operr			| |X| > 1: operand error

|--|X| = 1: the sign of X selects the result, 0 or PI.
	movel	(%a0),%d0		| rebuild the key with its sign bit
	movew	4(%a0),%d0		| (d0 was masked above)
	tstl	%d0
	bgts	ACOSP1			| positive: X = +1

|--X = -1: return PI and signal inexact.
	fmovex	PI,%fp0
	fmovel	%d1,%fpcr		| user's rounding mode/precision
	fadds	#0x00800000,%fp0	| adding a tiny single puts an inexact
					| exception into the 040; it will not
					| trap until the next fp instruction
	bra	t_frcinx

ACOSP1:
|--X = +1: acos(+1) = 0 is exact, so return without going through
|--t_frcinx.
	fmovel	%d1,%fpcr
	fmoves	#0x00000000,%fp0	| fp0 = +0.0
	rts
| 113 | |
| 114 | |end |