fpu_trig.c 38 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643
  1. /*---------------------------------------------------------------------------+
  2. | fpu_trig.c |
  3. | |
  4. | Implementation of the FPU "transcendental" functions. |
  5. | |
  6. | Copyright (C) 1992,1993,1994,1997,1999 |
  7. | W. Metzenthen, 22 Parker St, Ormond, Vic 3163, |
  8. | Australia. E-mail [email protected] |
  9. | |
  10. | |
  11. +---------------------------------------------------------------------------*/
  12. #include "fpu_system.h"
  13. #include "exception.h"
  14. #include "fpu_emu.h"
  15. #include "status_w.h"
  16. #include "control_w.h"
  17. #include "reg_constant.h"
  18. static void rem_kernel(unsigned long long st0, unsigned long long *y,
  19. unsigned long long st1, unsigned long long q, int n);
  20. #define BETTER_THAN_486
  21. #define FCOS 4
  22. /* Used only by fptan, fsin, fcos, and fsincos. */
  23. /* This routine produces very accurate results, similar to
  24. using a value of pi with more than 128 bits precision. */
  25. /* Limited measurements show no results worse than 64 bit precision
  26. except for the results for arguments close to 2^63, where the
  27. precision of the result sometimes degrades to about 63.9 bits */
  28. static int trig_arg(FPU_REG *st0_ptr, int even)
  29. {
  30. FPU_REG tmp;
  31. u_char tmptag;
  32. unsigned long long q;
  33. int old_cw = control_word, saved_status = partial_status;
  34. int tag, st0_tag = TAG_Valid;
  35. if (exponent(st0_ptr) >= 63) {
  36. partial_status |= SW_C2; /* Reduction incomplete. */
  37. return -1;
  38. }
  39. control_word &= ~CW_RC;
  40. control_word |= RC_CHOP;
  41. setpositive(st0_ptr);
  42. tag = FPU_u_div(st0_ptr, &CONST_PI2, &tmp, PR_64_BITS | RC_CHOP | 0x3f,
  43. SIGN_POS);
  44. FPU_round_to_int(&tmp, tag); /* Fortunately, this can't overflow
  45. to 2^64 */
  46. q = significand(&tmp);
  47. if (q) {
  48. rem_kernel(significand(st0_ptr),
  49. &significand(&tmp),
  50. significand(&CONST_PI2),
  51. q, exponent(st0_ptr) - exponent(&CONST_PI2));
  52. setexponent16(&tmp, exponent(&CONST_PI2));
  53. st0_tag = FPU_normalize(&tmp);
  54. FPU_copy_to_reg0(&tmp, st0_tag);
  55. }
  56. if ((even && !(q & 1)) || (!even && (q & 1))) {
  57. st0_tag =
  58. FPU_sub(REV | LOADED | TAG_Valid, (int)&CONST_PI2,
  59. FULL_PRECISION);
  60. #ifdef BETTER_THAN_486
  61. /* So far, the results are exact but based upon a 64 bit
  62. precision approximation to pi/2. The technique used
  63. now is equivalent to using an approximation to pi/2 which
  64. is accurate to about 128 bits. */
  65. if ((exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64)
  66. || (q > 1)) {
  67. /* This code gives the effect of having pi/2 to better than
  68. 128 bits precision. */
  69. significand(&tmp) = q + 1;
  70. setexponent16(&tmp, 63);
  71. FPU_normalize(&tmp);
  72. tmptag =
  73. FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
  74. FULL_PRECISION, SIGN_POS,
  75. exponent(&CONST_PI2extra) +
  76. exponent(&tmp));
  77. setsign(&tmp, getsign(&CONST_PI2extra));
  78. st0_tag = FPU_add(&tmp, tmptag, 0, FULL_PRECISION);
  79. if (signnegative(st0_ptr)) {
  80. /* CONST_PI2extra is negative, so the result of the addition
  81. can be negative. This means that the argument is actually
  82. in a different quadrant. The correction is always < pi/2,
  83. so it can't overflow into yet another quadrant. */
  84. setpositive(st0_ptr);
  85. q++;
  86. }
  87. }
  88. #endif /* BETTER_THAN_486 */
  89. }
  90. #ifdef BETTER_THAN_486
  91. else {
  92. /* So far, the results are exact but based upon a 64 bit
  93. precision approximation to pi/2. The technique used
  94. now is equivalent to using an approximation to pi/2 which
  95. is accurate to about 128 bits. */
  96. if (((q > 0)
  97. && (exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64))
  98. || (q > 1)) {
  99. /* This code gives the effect of having p/2 to better than
  100. 128 bits precision. */
  101. significand(&tmp) = q;
  102. setexponent16(&tmp, 63);
  103. FPU_normalize(&tmp); /* This must return TAG_Valid */
  104. tmptag =
  105. FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
  106. FULL_PRECISION, SIGN_POS,
  107. exponent(&CONST_PI2extra) +
  108. exponent(&tmp));
  109. setsign(&tmp, getsign(&CONST_PI2extra));
  110. st0_tag = FPU_sub(LOADED | (tmptag & 0x0f), (int)&tmp,
  111. FULL_PRECISION);
  112. if ((exponent(st0_ptr) == exponent(&CONST_PI2)) &&
  113. ((st0_ptr->sigh > CONST_PI2.sigh)
  114. || ((st0_ptr->sigh == CONST_PI2.sigh)
  115. && (st0_ptr->sigl > CONST_PI2.sigl)))) {
  116. /* CONST_PI2extra is negative, so the result of the
  117. subtraction can be larger than pi/2. This means
  118. that the argument is actually in a different quadrant.
  119. The correction is always < pi/2, so it can't overflow
  120. into yet another quadrant. */
  121. st0_tag =
  122. FPU_sub(REV | LOADED | TAG_Valid,
  123. (int)&CONST_PI2, FULL_PRECISION);
  124. q++;
  125. }
  126. }
  127. }
  128. #endif /* BETTER_THAN_486 */
  129. FPU_settag0(st0_tag);
  130. control_word = old_cw;
  131. partial_status = saved_status & ~SW_C2; /* Reduction complete. */
  132. return (q & 3) | even;
  133. }
  134. /* Convert a long to register */
  135. static void convert_l2reg(long const *arg, int deststnr)
  136. {
  137. int tag;
  138. long num = *arg;
  139. u_char sign;
  140. FPU_REG *dest = &st(deststnr);
  141. if (num == 0) {
  142. FPU_copy_to_regi(&CONST_Z, TAG_Zero, deststnr);
  143. return;
  144. }
  145. if (num > 0) {
  146. sign = SIGN_POS;
  147. } else {
  148. num = -num;
  149. sign = SIGN_NEG;
  150. }
  151. dest->sigh = num;
  152. dest->sigl = 0;
  153. setexponent16(dest, 31);
  154. tag = FPU_normalize(dest);
  155. FPU_settagi(deststnr, tag);
  156. setsign(dest, sign);
  157. return;
  158. }
  159. static void single_arg_error(FPU_REG *st0_ptr, u_char st0_tag)
  160. {
  161. if (st0_tag == TAG_Empty)
  162. FPU_stack_underflow(); /* Puts a QNaN in st(0) */
  163. else if (st0_tag == TW_NaN)
  164. real_1op_NaN(st0_ptr); /* return with a NaN in st(0) */
  165. #ifdef PARANOID
  166. else
  167. EXCEPTION(EX_INTERNAL | 0x0112);
  168. #endif /* PARANOID */
  169. }
  170. static void single_arg_2_error(FPU_REG *st0_ptr, u_char st0_tag)
  171. {
  172. int isNaN;
  173. switch (st0_tag) {
  174. case TW_NaN:
  175. isNaN = (exponent(st0_ptr) == EXP_OVER)
  176. && (st0_ptr->sigh & 0x80000000);
  177. if (isNaN && !(st0_ptr->sigh & 0x40000000)) { /* Signaling ? */
  178. EXCEPTION(EX_Invalid);
  179. if (control_word & CW_Invalid) {
  180. /* The masked response */
  181. /* Convert to a QNaN */
  182. st0_ptr->sigh |= 0x40000000;
  183. push();
  184. FPU_copy_to_reg0(st0_ptr, TAG_Special);
  185. }
  186. } else if (isNaN) {
  187. /* A QNaN */
  188. push();
  189. FPU_copy_to_reg0(st0_ptr, TAG_Special);
  190. } else {
  191. /* pseudoNaN or other unsupported */
  192. EXCEPTION(EX_Invalid);
  193. if (control_word & CW_Invalid) {
  194. /* The masked response */
  195. FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
  196. push();
  197. FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
  198. }
  199. }
  200. break; /* return with a NaN in st(0) */
  201. #ifdef PARANOID
  202. default:
  203. EXCEPTION(EX_INTERNAL | 0x0112);
  204. #endif /* PARANOID */
  205. }
  206. }
  207. /*---------------------------------------------------------------------------*/
  208. static void f2xm1(FPU_REG *st0_ptr, u_char tag)
  209. {
  210. FPU_REG a;
  211. clear_C1();
  212. if (tag == TAG_Valid) {
  213. /* For an 80486 FPU, the result is undefined if the arg is >= 1.0 */
  214. if (exponent(st0_ptr) < 0) {
  215. denormal_arg:
  216. FPU_to_exp16(st0_ptr, &a);
  217. /* poly_2xm1(x) requires 0 < st(0) < 1. */
  218. poly_2xm1(getsign(st0_ptr), &a, st0_ptr);
  219. }
  220. set_precision_flag_up(); /* 80486 appears to always do this */
  221. return;
  222. }
  223. if (tag == TAG_Zero)
  224. return;
  225. if (tag == TAG_Special)
  226. tag = FPU_Special(st0_ptr);
  227. switch (tag) {
  228. case TW_Denormal:
  229. if (denormal_operand() < 0)
  230. return;
  231. goto denormal_arg;
  232. case TW_Infinity:
  233. if (signnegative(st0_ptr)) {
  234. /* -infinity gives -1 (p16-10) */
  235. FPU_copy_to_reg0(&CONST_1, TAG_Valid);
  236. setnegative(st0_ptr);
  237. }
  238. return;
  239. default:
  240. single_arg_error(st0_ptr, tag);
  241. }
  242. }
  243. static void fptan(FPU_REG *st0_ptr, u_char st0_tag)
  244. {
  245. FPU_REG *st_new_ptr;
  246. int q;
  247. u_char arg_sign = getsign(st0_ptr);
  248. /* Stack underflow has higher priority */
  249. if (st0_tag == TAG_Empty) {
  250. FPU_stack_underflow(); /* Puts a QNaN in st(0) */
  251. if (control_word & CW_Invalid) {
  252. st_new_ptr = &st(-1);
  253. push();
  254. FPU_stack_underflow(); /* Puts a QNaN in the new st(0) */
  255. }
  256. return;
  257. }
  258. if (STACK_OVERFLOW) {
  259. FPU_stack_overflow();
  260. return;
  261. }
  262. if (st0_tag == TAG_Valid) {
  263. if (exponent(st0_ptr) > -40) {
  264. if ((q = trig_arg(st0_ptr, 0)) == -1) {
  265. /* Operand is out of range */
  266. return;
  267. }
  268. poly_tan(st0_ptr);
  269. setsign(st0_ptr, (q & 1) ^ (arg_sign != 0));
  270. set_precision_flag_up(); /* We do not really know if up or down */
  271. } else {
  272. /* For a small arg, the result == the argument */
  273. /* Underflow may happen */
  274. denormal_arg:
  275. FPU_to_exp16(st0_ptr, st0_ptr);
  276. st0_tag =
  277. FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
  278. FPU_settag0(st0_tag);
  279. }
  280. push();
  281. FPU_copy_to_reg0(&CONST_1, TAG_Valid);
  282. return;
  283. }
  284. if (st0_tag == TAG_Zero) {
  285. push();
  286. FPU_copy_to_reg0(&CONST_1, TAG_Valid);
  287. setcc(0);
  288. return;
  289. }
  290. if (st0_tag == TAG_Special)
  291. st0_tag = FPU_Special(st0_ptr);
  292. if (st0_tag == TW_Denormal) {
  293. if (denormal_operand() < 0)
  294. return;
  295. goto denormal_arg;
  296. }
  297. if (st0_tag == TW_Infinity) {
  298. /* The 80486 treats infinity as an invalid operand */
  299. if (arith_invalid(0) >= 0) {
  300. st_new_ptr = &st(-1);
  301. push();
  302. arith_invalid(0);
  303. }
  304. return;
  305. }
  306. single_arg_2_error(st0_ptr, st0_tag);
  307. }
  308. static void fxtract(FPU_REG *st0_ptr, u_char st0_tag)
  309. {
  310. FPU_REG *st_new_ptr;
  311. u_char sign;
  312. register FPU_REG *st1_ptr = st0_ptr; /* anticipate */
  313. if (STACK_OVERFLOW) {
  314. FPU_stack_overflow();
  315. return;
  316. }
  317. clear_C1();
  318. if (st0_tag == TAG_Valid) {
  319. long e;
  320. push();
  321. sign = getsign(st1_ptr);
  322. reg_copy(st1_ptr, st_new_ptr);
  323. setexponent16(st_new_ptr, exponent(st_new_ptr));
  324. denormal_arg:
  325. e = exponent16(st_new_ptr);
  326. convert_l2reg(&e, 1);
  327. setexponentpos(st_new_ptr, 0);
  328. setsign(st_new_ptr, sign);
  329. FPU_settag0(TAG_Valid); /* Needed if arg was a denormal */
  330. return;
  331. } else if (st0_tag == TAG_Zero) {
  332. sign = getsign(st0_ptr);
  333. if (FPU_divide_by_zero(0, SIGN_NEG) < 0)
  334. return;
  335. push();
  336. FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
  337. setsign(st_new_ptr, sign);
  338. return;
  339. }
  340. if (st0_tag == TAG_Special)
  341. st0_tag = FPU_Special(st0_ptr);
  342. if (st0_tag == TW_Denormal) {
  343. if (denormal_operand() < 0)
  344. return;
  345. push();
  346. sign = getsign(st1_ptr);
  347. FPU_to_exp16(st1_ptr, st_new_ptr);
  348. goto denormal_arg;
  349. } else if (st0_tag == TW_Infinity) {
  350. sign = getsign(st0_ptr);
  351. setpositive(st0_ptr);
  352. push();
  353. FPU_copy_to_reg0(&CONST_INF, TAG_Special);
  354. setsign(st_new_ptr, sign);
  355. return;
  356. } else if (st0_tag == TW_NaN) {
  357. if (real_1op_NaN(st0_ptr) < 0)
  358. return;
  359. push();
  360. FPU_copy_to_reg0(st0_ptr, TAG_Special);
  361. return;
  362. } else if (st0_tag == TAG_Empty) {
  363. /* Is this the correct behaviour? */
  364. if (control_word & EX_Invalid) {
  365. FPU_stack_underflow();
  366. push();
  367. FPU_stack_underflow();
  368. } else
  369. EXCEPTION(EX_StackUnder);
  370. }
  371. #ifdef PARANOID
  372. else
  373. EXCEPTION(EX_INTERNAL | 0x119);
  374. #endif /* PARANOID */
  375. }
  376. static void fdecstp(void)
  377. {
  378. clear_C1();
  379. top--;
  380. }
  381. static void fincstp(void)
  382. {
  383. clear_C1();
  384. top++;
  385. }
  386. static void fsqrt_(FPU_REG *st0_ptr, u_char st0_tag)
  387. {
  388. int expon;
  389. clear_C1();
  390. if (st0_tag == TAG_Valid) {
  391. u_char tag;
  392. if (signnegative(st0_ptr)) {
  393. arith_invalid(0); /* sqrt(negative) is invalid */
  394. return;
  395. }
  396. /* make st(0) in [1.0 .. 4.0) */
  397. expon = exponent(st0_ptr);
  398. denormal_arg:
  399. setexponent16(st0_ptr, (expon & 1));
  400. /* Do the computation, the sign of the result will be positive. */
  401. tag = wm_sqrt(st0_ptr, 0, 0, control_word, SIGN_POS);
  402. addexponent(st0_ptr, expon >> 1);
  403. FPU_settag0(tag);
  404. return;
  405. }
  406. if (st0_tag == TAG_Zero)
  407. return;
  408. if (st0_tag == TAG_Special)
  409. st0_tag = FPU_Special(st0_ptr);
  410. if (st0_tag == TW_Infinity) {
  411. if (signnegative(st0_ptr))
  412. arith_invalid(0); /* sqrt(-Infinity) is invalid */
  413. return;
  414. } else if (st0_tag == TW_Denormal) {
  415. if (signnegative(st0_ptr)) {
  416. arith_invalid(0); /* sqrt(negative) is invalid */
  417. return;
  418. }
  419. if (denormal_operand() < 0)
  420. return;
  421. FPU_to_exp16(st0_ptr, st0_ptr);
  422. expon = exponent16(st0_ptr);
  423. goto denormal_arg;
  424. }
  425. single_arg_error(st0_ptr, st0_tag);
  426. }
  427. static void frndint_(FPU_REG *st0_ptr, u_char st0_tag)
  428. {
  429. int flags, tag;
  430. if (st0_tag == TAG_Valid) {
  431. u_char sign;
  432. denormal_arg:
  433. sign = getsign(st0_ptr);
  434. if (exponent(st0_ptr) > 63)
  435. return;
  436. if (st0_tag == TW_Denormal) {
  437. if (denormal_operand() < 0)
  438. return;
  439. }
  440. /* Fortunately, this can't overflow to 2^64 */
  441. if ((flags = FPU_round_to_int(st0_ptr, st0_tag)))
  442. set_precision_flag(flags);
  443. setexponent16(st0_ptr, 63);
  444. tag = FPU_normalize(st0_ptr);
  445. setsign(st0_ptr, sign);
  446. FPU_settag0(tag);
  447. return;
  448. }
  449. if (st0_tag == TAG_Zero)
  450. return;
  451. if (st0_tag == TAG_Special)
  452. st0_tag = FPU_Special(st0_ptr);
  453. if (st0_tag == TW_Denormal)
  454. goto denormal_arg;
  455. else if (st0_tag == TW_Infinity)
  456. return;
  457. else
  458. single_arg_error(st0_ptr, st0_tag);
  459. }
  460. static int fsin(FPU_REG *st0_ptr, u_char tag)
  461. {
  462. u_char arg_sign = getsign(st0_ptr);
  463. if (tag == TAG_Valid) {
  464. int q;
  465. if (exponent(st0_ptr) > -40) {
  466. if ((q = trig_arg(st0_ptr, 0)) == -1) {
  467. /* Operand is out of range */
  468. return 1;
  469. }
  470. poly_sine(st0_ptr);
  471. if (q & 2)
  472. changesign(st0_ptr);
  473. setsign(st0_ptr, getsign(st0_ptr) ^ arg_sign);
  474. /* We do not really know if up or down */
  475. set_precision_flag_up();
  476. return 0;
  477. } else {
  478. /* For a small arg, the result == the argument */
  479. set_precision_flag_up(); /* Must be up. */
  480. return 0;
  481. }
  482. }
  483. if (tag == TAG_Zero) {
  484. setcc(0);
  485. return 0;
  486. }
  487. if (tag == TAG_Special)
  488. tag = FPU_Special(st0_ptr);
  489. if (tag == TW_Denormal) {
  490. if (denormal_operand() < 0)
  491. return 1;
  492. /* For a small arg, the result == the argument */
  493. /* Underflow may happen */
  494. FPU_to_exp16(st0_ptr, st0_ptr);
  495. tag = FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
  496. FPU_settag0(tag);
  497. return 0;
  498. } else if (tag == TW_Infinity) {
  499. /* The 80486 treats infinity as an invalid operand */
  500. arith_invalid(0);
  501. return 1;
  502. } else {
  503. single_arg_error(st0_ptr, tag);
  504. return 1;
  505. }
  506. }
  507. static int f_cos(FPU_REG *st0_ptr, u_char tag)
  508. {
  509. u_char st0_sign;
  510. st0_sign = getsign(st0_ptr);
  511. if (tag == TAG_Valid) {
  512. int q;
  513. if (exponent(st0_ptr) > -40) {
  514. if ((exponent(st0_ptr) < 0)
  515. || ((exponent(st0_ptr) == 0)
  516. && (significand(st0_ptr) <=
  517. 0xc90fdaa22168c234LL))) {
  518. poly_cos(st0_ptr);
  519. /* We do not really know if up or down */
  520. set_precision_flag_down();
  521. return 0;
  522. } else if ((q = trig_arg(st0_ptr, FCOS)) != -1) {
  523. poly_sine(st0_ptr);
  524. if ((q + 1) & 2)
  525. changesign(st0_ptr);
  526. /* We do not really know if up or down */
  527. set_precision_flag_down();
  528. return 0;
  529. } else {
  530. /* Operand is out of range */
  531. return 1;
  532. }
  533. } else {
  534. denormal_arg:
  535. setcc(0);
  536. FPU_copy_to_reg0(&CONST_1, TAG_Valid);
  537. #ifdef PECULIAR_486
  538. set_precision_flag_down(); /* 80486 appears to do this. */
  539. #else
  540. set_precision_flag_up(); /* Must be up. */
  541. #endif /* PECULIAR_486 */
  542. return 0;
  543. }
  544. } else if (tag == TAG_Zero) {
  545. FPU_copy_to_reg0(&CONST_1, TAG_Valid);
  546. setcc(0);
  547. return 0;
  548. }
  549. if (tag == TAG_Special)
  550. tag = FPU_Special(st0_ptr);
  551. if (tag == TW_Denormal) {
  552. if (denormal_operand() < 0)
  553. return 1;
  554. goto denormal_arg;
  555. } else if (tag == TW_Infinity) {
  556. /* The 80486 treats infinity as an invalid operand */
  557. arith_invalid(0);
  558. return 1;
  559. } else {
  560. single_arg_error(st0_ptr, tag); /* requires st0_ptr == &st(0) */
  561. return 1;
  562. }
  563. }
  564. static void fcos(FPU_REG *st0_ptr, u_char st0_tag)
  565. {
  566. f_cos(st0_ptr, st0_tag);
  567. }
  568. static void fsincos(FPU_REG *st0_ptr, u_char st0_tag)
  569. {
  570. FPU_REG *st_new_ptr;
  571. FPU_REG arg;
  572. u_char tag;
  573. /* Stack underflow has higher priority */
  574. if (st0_tag == TAG_Empty) {
  575. FPU_stack_underflow(); /* Puts a QNaN in st(0) */
  576. if (control_word & CW_Invalid) {
  577. st_new_ptr = &st(-1);
  578. push();
  579. FPU_stack_underflow(); /* Puts a QNaN in the new st(0) */
  580. }
  581. return;
  582. }
  583. if (STACK_OVERFLOW) {
  584. FPU_stack_overflow();
  585. return;
  586. }
  587. if (st0_tag == TAG_Special)
  588. tag = FPU_Special(st0_ptr);
  589. else
  590. tag = st0_tag;
  591. if (tag == TW_NaN) {
  592. single_arg_2_error(st0_ptr, TW_NaN);
  593. return;
  594. } else if (tag == TW_Infinity) {
  595. /* The 80486 treats infinity as an invalid operand */
  596. if (arith_invalid(0) >= 0) {
  597. /* Masked response */
  598. push();
  599. arith_invalid(0);
  600. }
  601. return;
  602. }
  603. reg_copy(st0_ptr, &arg);
  604. if (!fsin(st0_ptr, st0_tag)) {
  605. push();
  606. FPU_copy_to_reg0(&arg, st0_tag);
  607. f_cos(&st(0), st0_tag);
  608. } else {
  609. /* An error, so restore st(0) */
  610. FPU_copy_to_reg0(&arg, st0_tag);
  611. }
  612. }
  613. /*---------------------------------------------------------------------------*/
  614. /* The following all require two arguments: st(0) and st(1) */
  615. /* A lean, mean kernel for the fprem instructions. This relies upon
  616. the division and rounding to an integer in do_fprem giving an
  617. exact result. Because of this, rem_kernel() needs to deal only with
  618. the least significant 64 bits, the more significant bits of the
  619. result must be zero.
  620. */
  621. static void rem_kernel(unsigned long long st0, unsigned long long *y,
  622. unsigned long long st1, unsigned long long q, int n)
  623. {
  624. int dummy;
  625. unsigned long long x;
  626. x = st0 << n;
  627. /* Do the required multiplication and subtraction in the one operation */
  628. /* lsw x -= lsw st1 * lsw q */
  629. asm volatile ("mull %4; subl %%eax,%0; sbbl %%edx,%1":"=m"
  630. (((unsigned *)&x)[0]), "=m"(((unsigned *)&x)[1]),
  631. "=a"(dummy)
  632. :"2"(((unsigned *)&st1)[0]), "m"(((unsigned *)&q)[0])
  633. :"%dx");
  634. /* msw x -= msw st1 * lsw q */
  635. asm volatile ("mull %3; subl %%eax,%0":"=m" (((unsigned *)&x)[1]),
  636. "=a"(dummy)
  637. :"1"(((unsigned *)&st1)[1]), "m"(((unsigned *)&q)[0])
  638. :"%dx");
  639. /* msw x -= lsw st1 * msw q */
  640. asm volatile ("mull %3; subl %%eax,%0":"=m" (((unsigned *)&x)[1]),
  641. "=a"(dummy)
  642. :"1"(((unsigned *)&st1)[0]), "m"(((unsigned *)&q)[1])
  643. :"%dx");
  644. *y = x;
  645. }
  646. /* Remainder of st(0) / st(1) */
  647. /* This routine produces exact results, i.e. there is never any
  648. rounding or truncation, etc of the result. */
  649. static void do_fprem(FPU_REG *st0_ptr, u_char st0_tag, int round)
  650. {
  651. FPU_REG *st1_ptr = &st(1);
  652. u_char st1_tag = FPU_gettagi(1);
  653. if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
  654. FPU_REG tmp, st0, st1;
  655. u_char st0_sign, st1_sign;
  656. u_char tmptag;
  657. int tag;
  658. int old_cw;
  659. int expdif;
  660. long long q;
  661. unsigned short saved_status;
  662. int cc;
  663. fprem_valid:
  664. /* Convert registers for internal use. */
  665. st0_sign = FPU_to_exp16(st0_ptr, &st0);
  666. st1_sign = FPU_to_exp16(st1_ptr, &st1);
  667. expdif = exponent16(&st0) - exponent16(&st1);
  668. old_cw = control_word;
  669. cc = 0;
  670. /* We want the status following the denorm tests, but don't want
  671. the status changed by the arithmetic operations. */
  672. saved_status = partial_status;
  673. control_word &= ~CW_RC;
  674. control_word |= RC_CHOP;
  675. if (expdif < 64) {
  676. /* This should be the most common case */
  677. if (expdif > -2) {
  678. u_char sign = st0_sign ^ st1_sign;
  679. tag = FPU_u_div(&st0, &st1, &tmp,
  680. PR_64_BITS | RC_CHOP | 0x3f,
  681. sign);
  682. setsign(&tmp, sign);
  683. if (exponent(&tmp) >= 0) {
  684. FPU_round_to_int(&tmp, tag); /* Fortunately, this can't
  685. overflow to 2^64 */
  686. q = significand(&tmp);
  687. rem_kernel(significand(&st0),
  688. &significand(&tmp),
  689. significand(&st1),
  690. q, expdif);
  691. setexponent16(&tmp, exponent16(&st1));
  692. } else {
  693. reg_copy(&st0, &tmp);
  694. q = 0;
  695. }
  696. if ((round == RC_RND)
  697. && (tmp.sigh & 0xc0000000)) {
  698. /* We may need to subtract st(1) once more,
  699. to get a result <= 1/2 of st(1). */
  700. unsigned long long x;
  701. expdif =
  702. exponent16(&st1) - exponent16(&tmp);
  703. if (expdif <= 1) {
  704. if (expdif == 0)
  705. x = significand(&st1) -
  706. significand(&tmp);
  707. else /* expdif is 1 */
  708. x = (significand(&st1)
  709. << 1) -
  710. significand(&tmp);
  711. if ((x < significand(&tmp)) ||
  712. /* or equi-distant (from 0 & st(1)) and q is odd */
  713. ((x == significand(&tmp))
  714. && (q & 1))) {
  715. st0_sign = !st0_sign;
  716. significand(&tmp) = x;
  717. q++;
  718. }
  719. }
  720. }
  721. if (q & 4)
  722. cc |= SW_C0;
  723. if (q & 2)
  724. cc |= SW_C3;
  725. if (q & 1)
  726. cc |= SW_C1;
  727. } else {
  728. control_word = old_cw;
  729. setcc(0);
  730. return;
  731. }
  732. } else {
  733. /* There is a large exponent difference ( >= 64 ) */
  734. /* To make much sense, the code in this section should
  735. be done at high precision. */
  736. int exp_1, N;
  737. u_char sign;
  738. /* prevent overflow here */
  739. /* N is 'a number between 32 and 63' (p26-113) */
  740. reg_copy(&st0, &tmp);
  741. tmptag = st0_tag;
  742. N = (expdif & 0x0000001f) + 32; /* This choice gives results
  743. identical to an AMD 486 */
  744. setexponent16(&tmp, N);
  745. exp_1 = exponent16(&st1);
  746. setexponent16(&st1, 0);
  747. expdif -= N;
  748. sign = getsign(&tmp) ^ st1_sign;
  749. tag =
  750. FPU_u_div(&tmp, &st1, &tmp,
  751. PR_64_BITS | RC_CHOP | 0x3f, sign);
  752. setsign(&tmp, sign);
  753. FPU_round_to_int(&tmp, tag); /* Fortunately, this can't
  754. overflow to 2^64 */
  755. rem_kernel(significand(&st0),
  756. &significand(&tmp),
  757. significand(&st1),
  758. significand(&tmp), exponent(&tmp)
  759. );
  760. setexponent16(&tmp, exp_1 + expdif);
  761. /* It is possible for the operation to be complete here.
  762. What does the IEEE standard say? The Intel 80486 manual
  763. implies that the operation will never be completed at this
  764. point, and the behaviour of a real 80486 confirms this.
  765. */
  766. if (!(tmp.sigh | tmp.sigl)) {
  767. /* The result is zero */
  768. control_word = old_cw;
  769. partial_status = saved_status;
  770. FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
  771. setsign(&st0, st0_sign);
  772. #ifdef PECULIAR_486
  773. setcc(SW_C2);
  774. #else
  775. setcc(0);
  776. #endif /* PECULIAR_486 */
  777. return;
  778. }
  779. cc = SW_C2;
  780. }
  781. control_word = old_cw;
  782. partial_status = saved_status;
  783. tag = FPU_normalize_nuo(&tmp);
  784. reg_copy(&tmp, st0_ptr);
  785. /* The only condition to be looked for is underflow,
  786. and it can occur here only if underflow is unmasked. */
  787. if ((exponent16(&tmp) <= EXP_UNDER) && (tag != TAG_Zero)
  788. && !(control_word & CW_Underflow)) {
  789. setcc(cc);
  790. tag = arith_underflow(st0_ptr);
  791. setsign(st0_ptr, st0_sign);
  792. FPU_settag0(tag);
  793. return;
  794. } else if ((exponent16(&tmp) > EXP_UNDER) || (tag == TAG_Zero)) {
  795. stdexp(st0_ptr);
  796. setsign(st0_ptr, st0_sign);
  797. } else {
  798. tag =
  799. FPU_round(st0_ptr, 0, 0, FULL_PRECISION, st0_sign);
  800. }
  801. FPU_settag0(tag);
  802. setcc(cc);
  803. return;
  804. }
  805. if (st0_tag == TAG_Special)
  806. st0_tag = FPU_Special(st0_ptr);
  807. if (st1_tag == TAG_Special)
  808. st1_tag = FPU_Special(st1_ptr);
  809. if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
  810. || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
  811. || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
  812. if (denormal_operand() < 0)
  813. return;
  814. goto fprem_valid;
  815. } else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
  816. FPU_stack_underflow();
  817. return;
  818. } else if (st0_tag == TAG_Zero) {
  819. if (st1_tag == TAG_Valid) {
  820. setcc(0);
  821. return;
  822. } else if (st1_tag == TW_Denormal) {
  823. if (denormal_operand() < 0)
  824. return;
  825. setcc(0);
  826. return;
  827. } else if (st1_tag == TAG_Zero) {
  828. arith_invalid(0);
  829. return;
  830. } /* fprem(?,0) always invalid */
  831. else if (st1_tag == TW_Infinity) {
  832. setcc(0);
  833. return;
  834. }
  835. } else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
  836. if (st1_tag == TAG_Zero) {
  837. arith_invalid(0); /* fprem(Valid,Zero) is invalid */
  838. return;
  839. } else if (st1_tag != TW_NaN) {
  840. if (((st0_tag == TW_Denormal)
  841. || (st1_tag == TW_Denormal))
  842. && (denormal_operand() < 0))
  843. return;
  844. if (st1_tag == TW_Infinity) {
  845. /* fprem(Valid,Infinity) is o.k. */
  846. setcc(0);
  847. return;
  848. }
  849. }
  850. } else if (st0_tag == TW_Infinity) {
  851. if (st1_tag != TW_NaN) {
  852. arith_invalid(0); /* fprem(Infinity,?) is invalid */
  853. return;
  854. }
  855. }
  856. /* One of the registers must contain a NaN if we got here. */
  857. #ifdef PARANOID
  858. if ((st0_tag != TW_NaN) && (st1_tag != TW_NaN))
  859. EXCEPTION(EX_INTERNAL | 0x118);
  860. #endif /* PARANOID */
  861. real_2op_NaN(st1_ptr, st1_tag, 0, st1_ptr);
  862. }
  863. /* ST(1) <- ST(1) * log ST; pop ST */
  864. static void fyl2x(FPU_REG *st0_ptr, u_char st0_tag)
  865. {
  866. FPU_REG *st1_ptr = &st(1), exponent;
  867. u_char st1_tag = FPU_gettagi(1);
  868. u_char sign;
  869. int e, tag;
  870. clear_C1();
  871. if ((st0_tag == TAG_Valid) && (st1_tag == TAG_Valid)) {
  872. both_valid:
  873. /* Both regs are Valid or Denormal */
  874. if (signpositive(st0_ptr)) {
  875. if (st0_tag == TW_Denormal)
  876. FPU_to_exp16(st0_ptr, st0_ptr);
  877. else
  878. /* Convert st(0) for internal use. */
  879. setexponent16(st0_ptr, exponent(st0_ptr));
  880. if ((st0_ptr->sigh == 0x80000000)
  881. && (st0_ptr->sigl == 0)) {
  882. /* Special case. The result can be precise. */
  883. u_char esign;
  884. e = exponent16(st0_ptr);
  885. if (e >= 0) {
  886. exponent.sigh = e;
  887. esign = SIGN_POS;
  888. } else {
  889. exponent.sigh = -e;
  890. esign = SIGN_NEG;
  891. }
  892. exponent.sigl = 0;
  893. setexponent16(&exponent, 31);
  894. tag = FPU_normalize_nuo(&exponent);
  895. stdexp(&exponent);
  896. setsign(&exponent, esign);
  897. tag =
  898. FPU_mul(&exponent, tag, 1, FULL_PRECISION);
  899. if (tag >= 0)
  900. FPU_settagi(1, tag);
  901. } else {
  902. /* The usual case */
  903. sign = getsign(st1_ptr);
  904. if (st1_tag == TW_Denormal)
  905. FPU_to_exp16(st1_ptr, st1_ptr);
  906. else
  907. /* Convert st(1) for internal use. */
  908. setexponent16(st1_ptr,
  909. exponent(st1_ptr));
  910. poly_l2(st0_ptr, st1_ptr, sign);
  911. }
  912. } else {
  913. /* negative */
  914. if (arith_invalid(1) < 0)
  915. return;
  916. }
  917. FPU_pop();
  918. return;
  919. }
  920. if (st0_tag == TAG_Special)
  921. st0_tag = FPU_Special(st0_ptr);
  922. if (st1_tag == TAG_Special)
  923. st1_tag = FPU_Special(st1_ptr);
  924. if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
  925. FPU_stack_underflow_pop(1);
  926. return;
  927. } else if ((st0_tag <= TW_Denormal) && (st1_tag <= TW_Denormal)) {
  928. if (st0_tag == TAG_Zero) {
  929. if (st1_tag == TAG_Zero) {
  930. /* Both args zero is invalid */
  931. if (arith_invalid(1) < 0)
  932. return;
  933. } else {
  934. u_char sign;
  935. sign = getsign(st1_ptr) ^ SIGN_NEG;
  936. if (FPU_divide_by_zero(1, sign) < 0)
  937. return;
  938. setsign(st1_ptr, sign);
  939. }
  940. } else if (st1_tag == TAG_Zero) {
  941. /* st(1) contains zero, st(0) valid <> 0 */
  942. /* Zero is the valid answer */
  943. sign = getsign(st1_ptr);
  944. if (signnegative(st0_ptr)) {
  945. /* log(negative) */
  946. if (arith_invalid(1) < 0)
  947. return;
  948. } else if ((st0_tag == TW_Denormal)
  949. && (denormal_operand() < 0))
  950. return;
  951. else {
  952. if (exponent(st0_ptr) < 0)
  953. sign ^= SIGN_NEG;
  954. FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
  955. setsign(st1_ptr, sign);
  956. }
  957. } else {
  958. /* One or both operands are denormals. */
  959. if (denormal_operand() < 0)
  960. return;
  961. goto both_valid;
  962. }
  963. } else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
  964. if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
  965. return;
  966. }
  967. /* One or both arg must be an infinity */
  968. else if (st0_tag == TW_Infinity) {
  969. if ((signnegative(st0_ptr)) || (st1_tag == TAG_Zero)) {
  970. /* log(-infinity) or 0*log(infinity) */
  971. if (arith_invalid(1) < 0)
  972. return;
  973. } else {
  974. u_char sign = getsign(st1_ptr);
  975. if ((st1_tag == TW_Denormal)
  976. && (denormal_operand() < 0))
  977. return;
  978. FPU_copy_to_reg1(&CONST_INF, TAG_Special);
  979. setsign(st1_ptr, sign);
  980. }
  981. }
  982. /* st(1) must be infinity here */
  983. else if (((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal))
  984. && (signpositive(st0_ptr))) {
  985. if (exponent(st0_ptr) >= 0) {
  986. if ((exponent(st0_ptr) == 0) &&
  987. (st0_ptr->sigh == 0x80000000) &&
  988. (st0_ptr->sigl == 0)) {
  989. /* st(0) holds 1.0 */
  990. /* infinity*log(1) */
  991. if (arith_invalid(1) < 0)
  992. return;
  993. }
  994. /* else st(0) is positive and > 1.0 */
  995. } else {
  996. /* st(0) is positive and < 1.0 */
  997. if ((st0_tag == TW_Denormal)
  998. && (denormal_operand() < 0))
  999. return;
  1000. changesign(st1_ptr);
  1001. }
  1002. } else {
  1003. /* st(0) must be zero or negative */
  1004. if (st0_tag == TAG_Zero) {
  1005. /* This should be invalid, but a real 80486 is happy with it. */
  1006. #ifndef PECULIAR_486
  1007. sign = getsign(st1_ptr);
  1008. if (FPU_divide_by_zero(1, sign) < 0)
  1009. return;
  1010. #endif /* PECULIAR_486 */
  1011. changesign(st1_ptr);
  1012. } else if (arith_invalid(1) < 0) /* log(negative) */
  1013. return;
  1014. }
  1015. FPU_pop();
  1016. }
  1017. static void fpatan(FPU_REG *st0_ptr, u_char st0_tag)
  1018. {
  1019. FPU_REG *st1_ptr = &st(1);
  1020. u_char st1_tag = FPU_gettagi(1);
  1021. int tag;
  1022. clear_C1();
  1023. if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
  1024. valid_atan:
  1025. poly_atan(st0_ptr, st0_tag, st1_ptr, st1_tag);
  1026. FPU_pop();
  1027. return;
  1028. }
  1029. if (st0_tag == TAG_Special)
  1030. st0_tag = FPU_Special(st0_ptr);
  1031. if (st1_tag == TAG_Special)
  1032. st1_tag = FPU_Special(st1_ptr);
  1033. if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
  1034. || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
  1035. || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
  1036. if (denormal_operand() < 0)
  1037. return;
  1038. goto valid_atan;
  1039. } else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
  1040. FPU_stack_underflow_pop(1);
  1041. return;
  1042. } else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
  1043. if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) >= 0)
  1044. FPU_pop();
  1045. return;
  1046. } else if ((st0_tag == TW_Infinity) || (st1_tag == TW_Infinity)) {
  1047. u_char sign = getsign(st1_ptr);
  1048. if (st0_tag == TW_Infinity) {
  1049. if (st1_tag == TW_Infinity) {
  1050. if (signpositive(st0_ptr)) {
  1051. FPU_copy_to_reg1(&CONST_PI4, TAG_Valid);
  1052. } else {
  1053. setpositive(st1_ptr);
  1054. tag =
  1055. FPU_u_add(&CONST_PI4, &CONST_PI2,
  1056. st1_ptr, FULL_PRECISION,
  1057. SIGN_POS,
  1058. exponent(&CONST_PI4),
  1059. exponent(&CONST_PI2));
  1060. if (tag >= 0)
  1061. FPU_settagi(1, tag);
  1062. }
  1063. } else {
  1064. if ((st1_tag == TW_Denormal)
  1065. && (denormal_operand() < 0))
  1066. return;
  1067. if (signpositive(st0_ptr)) {
  1068. FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
  1069. setsign(st1_ptr, sign); /* An 80486 preserves the sign */
  1070. FPU_pop();
  1071. return;
  1072. } else {
  1073. FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
  1074. }
  1075. }
  1076. } else {
  1077. /* st(1) is infinity, st(0) not infinity */
  1078. if ((st0_tag == TW_Denormal)
  1079. && (denormal_operand() < 0))
  1080. return;
  1081. FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
  1082. }
  1083. setsign(st1_ptr, sign);
  1084. } else if (st1_tag == TAG_Zero) {
  1085. /* st(0) must be valid or zero */
  1086. u_char sign = getsign(st1_ptr);
  1087. if ((st0_tag == TW_Denormal) && (denormal_operand() < 0))
  1088. return;
  1089. if (signpositive(st0_ptr)) {
  1090. /* An 80486 preserves the sign */
  1091. FPU_pop();
  1092. return;
  1093. }
  1094. FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
  1095. setsign(st1_ptr, sign);
  1096. } else if (st0_tag == TAG_Zero) {
  1097. /* st(1) must be TAG_Valid here */
  1098. u_char sign = getsign(st1_ptr);
  1099. if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
  1100. return;
  1101. FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
  1102. setsign(st1_ptr, sign);
  1103. }
  1104. #ifdef PARANOID
  1105. else
  1106. EXCEPTION(EX_INTERNAL | 0x125);
  1107. #endif /* PARANOID */
  1108. FPU_pop();
  1109. set_precision_flag_up(); /* We do not really know if up or down */
  1110. }
  1111. static void fprem(FPU_REG *st0_ptr, u_char st0_tag)
  1112. {
  1113. do_fprem(st0_ptr, st0_tag, RC_CHOP);
  1114. }
  1115. static void fprem1(FPU_REG *st0_ptr, u_char st0_tag)
  1116. {
  1117. do_fprem(st0_ptr, st0_tag, RC_RND);
  1118. }
  1119. static void fyl2xp1(FPU_REG *st0_ptr, u_char st0_tag)
  1120. {
  1121. u_char sign, sign1;
  1122. FPU_REG *st1_ptr = &st(1), a, b;
  1123. u_char st1_tag = FPU_gettagi(1);
  1124. clear_C1();
  1125. if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
  1126. valid_yl2xp1:
  1127. sign = getsign(st0_ptr);
  1128. sign1 = getsign(st1_ptr);
  1129. FPU_to_exp16(st0_ptr, &a);
  1130. FPU_to_exp16(st1_ptr, &b);
  1131. if (poly_l2p1(sign, sign1, &a, &b, st1_ptr))
  1132. return;
  1133. FPU_pop();
  1134. return;
  1135. }
  1136. if (st0_tag == TAG_Special)
  1137. st0_tag = FPU_Special(st0_ptr);
  1138. if (st1_tag == TAG_Special)
  1139. st1_tag = FPU_Special(st1_ptr);
  1140. if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
  1141. || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
  1142. || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
  1143. if (denormal_operand() < 0)
  1144. return;
  1145. goto valid_yl2xp1;
  1146. } else if ((st0_tag == TAG_Empty) | (st1_tag == TAG_Empty)) {
  1147. FPU_stack_underflow_pop(1);
  1148. return;
  1149. } else if (st0_tag == TAG_Zero) {
  1150. switch (st1_tag) {
  1151. case TW_Denormal:
  1152. if (denormal_operand() < 0)
  1153. return;
  1154. case TAG_Zero:
  1155. case TAG_Valid:
  1156. setsign(st0_ptr, getsign(st0_ptr) ^ getsign(st1_ptr));
  1157. FPU_copy_to_reg1(st0_ptr, st0_tag);
  1158. break;
  1159. case TW_Infinity:
  1160. /* Infinity*log(1) */
  1161. if (arith_invalid(1) < 0)
  1162. return;
  1163. break;
  1164. case TW_NaN:
  1165. if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
  1166. return;
  1167. break;
  1168. default:
  1169. #ifdef PARANOID
  1170. EXCEPTION(EX_INTERNAL | 0x116);
  1171. return;
  1172. #endif /* PARANOID */
  1173. break;
  1174. }
  1175. } else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
  1176. switch (st1_tag) {
  1177. case TAG_Zero:
  1178. if (signnegative(st0_ptr)) {
  1179. if (exponent(st0_ptr) >= 0) {
  1180. /* st(0) holds <= -1.0 */
  1181. #ifdef PECULIAR_486 /* Stupid 80486 doesn't worry about log(negative). */
  1182. changesign(st1_ptr);
  1183. #else
  1184. if (arith_invalid(1) < 0)
  1185. return;
  1186. #endif /* PECULIAR_486 */
  1187. } else if ((st0_tag == TW_Denormal)
  1188. && (denormal_operand() < 0))
  1189. return;
  1190. else
  1191. changesign(st1_ptr);
  1192. } else if ((st0_tag == TW_Denormal)
  1193. && (denormal_operand() < 0))
  1194. return;
  1195. break;
  1196. case TW_Infinity:
  1197. if (signnegative(st0_ptr)) {
  1198. if ((exponent(st0_ptr) >= 0) &&
  1199. !((st0_ptr->sigh == 0x80000000) &&
  1200. (st0_ptr->sigl == 0))) {
  1201. /* st(0) holds < -1.0 */
  1202. #ifdef PECULIAR_486 /* Stupid 80486 doesn't worry about log(negative). */
  1203. changesign(st1_ptr);
  1204. #else
  1205. if (arith_invalid(1) < 0)
  1206. return;
  1207. #endif /* PECULIAR_486 */
  1208. } else if ((st0_tag == TW_Denormal)
  1209. && (denormal_operand() < 0))
  1210. return;
  1211. else
  1212. changesign(st1_ptr);
  1213. } else if ((st0_tag == TW_Denormal)
  1214. && (denormal_operand() < 0))
  1215. return;
  1216. break;
  1217. case TW_NaN:
  1218. if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
  1219. return;
  1220. }
  1221. } else if (st0_tag == TW_NaN) {
  1222. if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
  1223. return;
  1224. } else if (st0_tag == TW_Infinity) {
  1225. if (st1_tag == TW_NaN) {
  1226. if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
  1227. return;
  1228. } else if (signnegative(st0_ptr)) {
  1229. #ifndef PECULIAR_486
  1230. /* This should have higher priority than denormals, but... */
  1231. if (arith_invalid(1) < 0) /* log(-infinity) */
  1232. return;
  1233. #endif /* PECULIAR_486 */
  1234. if ((st1_tag == TW_Denormal)
  1235. && (denormal_operand() < 0))
  1236. return;
  1237. #ifdef PECULIAR_486
  1238. /* Denormal operands actually get higher priority */
  1239. if (arith_invalid(1) < 0) /* log(-infinity) */
  1240. return;
  1241. #endif /* PECULIAR_486 */
  1242. } else if (st1_tag == TAG_Zero) {
  1243. /* log(infinity) */
  1244. if (arith_invalid(1) < 0)
  1245. return;
  1246. }
  1247. /* st(1) must be valid here. */
  1248. else if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
  1249. return;
  1250. /* The Manual says that log(Infinity) is invalid, but a real
  1251. 80486 sensibly says that it is o.k. */
  1252. else {
  1253. u_char sign = getsign(st1_ptr);
  1254. FPU_copy_to_reg1(&CONST_INF, TAG_Special);
  1255. setsign(st1_ptr, sign);
  1256. }
  1257. }
  1258. #ifdef PARANOID
  1259. else {
  1260. EXCEPTION(EX_INTERNAL | 0x117);
  1261. return;
  1262. }
  1263. #endif /* PARANOID */
  1264. FPU_pop();
  1265. return;
  1266. }
  1267. static void fscale(FPU_REG *st0_ptr, u_char st0_tag)
  1268. {
  1269. FPU_REG *st1_ptr = &st(1);
  1270. u_char st1_tag = FPU_gettagi(1);
  1271. int old_cw = control_word;
  1272. u_char sign = getsign(st0_ptr);
  1273. clear_C1();
  1274. if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
  1275. long scale;
  1276. FPU_REG tmp;
  1277. /* Convert register for internal use. */
  1278. setexponent16(st0_ptr, exponent(st0_ptr));
  1279. valid_scale:
  1280. if (exponent(st1_ptr) > 30) {
  1281. /* 2^31 is far too large, would require 2^(2^30) or 2^(-2^30) */
  1282. if (signpositive(st1_ptr)) {
  1283. EXCEPTION(EX_Overflow);
  1284. FPU_copy_to_reg0(&CONST_INF, TAG_Special);
  1285. } else {
  1286. EXCEPTION(EX_Underflow);
  1287. FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
  1288. }
  1289. setsign(st0_ptr, sign);
  1290. return;
  1291. }
  1292. control_word &= ~CW_RC;
  1293. control_word |= RC_CHOP;
  1294. reg_copy(st1_ptr, &tmp);
  1295. FPU_round_to_int(&tmp, st1_tag); /* This can never overflow here */
  1296. control_word = old_cw;
  1297. scale = signnegative(st1_ptr) ? -tmp.sigl : tmp.sigl;
  1298. scale += exponent16(st0_ptr);
  1299. setexponent16(st0_ptr, scale);
  1300. /* Use FPU_round() to properly detect under/overflow etc */
  1301. FPU_round(st0_ptr, 0, 0, control_word, sign);
  1302. return;
  1303. }
  1304. if (st0_tag == TAG_Special)
  1305. st0_tag = FPU_Special(st0_ptr);
  1306. if (st1_tag == TAG_Special)
  1307. st1_tag = FPU_Special(st1_ptr);
  1308. if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
  1309. switch (st1_tag) {
  1310. case TAG_Valid:
  1311. /* st(0) must be a denormal */
  1312. if ((st0_tag == TW_Denormal)
  1313. && (denormal_operand() < 0))
  1314. return;
  1315. FPU_to_exp16(st0_ptr, st0_ptr); /* Will not be left on stack */
  1316. goto valid_scale;
  1317. case TAG_Zero:
  1318. if (st0_tag == TW_Denormal)
  1319. denormal_operand();
  1320. return;
  1321. case TW_Denormal:
  1322. denormal_operand();
  1323. return;
  1324. case TW_Infinity:
  1325. if ((st0_tag == TW_Denormal)
  1326. && (denormal_operand() < 0))
  1327. return;
  1328. if (signpositive(st1_ptr))
  1329. FPU_copy_to_reg0(&CONST_INF, TAG_Special);
  1330. else
  1331. FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
  1332. setsign(st0_ptr, sign);
  1333. return;
  1334. case TW_NaN:
  1335. real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
  1336. return;
  1337. }
  1338. } else if (st0_tag == TAG_Zero) {
  1339. switch (st1_tag) {
  1340. case TAG_Valid:
  1341. case TAG_Zero:
  1342. return;
  1343. case TW_Denormal:
  1344. denormal_operand();
  1345. return;
  1346. case TW_Infinity:
  1347. if (signpositive(st1_ptr))
  1348. arith_invalid(0); /* Zero scaled by +Infinity */
  1349. return;
  1350. case TW_NaN:
  1351. real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
  1352. return;
  1353. }
  1354. } else if (st0_tag == TW_Infinity) {
  1355. switch (st1_tag) {
  1356. case TAG_Valid:
  1357. case TAG_Zero:
  1358. return;
  1359. case TW_Denormal:
  1360. denormal_operand();
  1361. return;
  1362. case TW_Infinity:
  1363. if (signnegative(st1_ptr))
  1364. arith_invalid(0); /* Infinity scaled by -Infinity */
  1365. return;
  1366. case TW_NaN:
  1367. real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
  1368. return;
  1369. }
  1370. } else if (st0_tag == TW_NaN) {
  1371. if (st1_tag != TAG_Empty) {
  1372. real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
  1373. return;
  1374. }
  1375. }
  1376. #ifdef PARANOID
  1377. if (!((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty))) {
  1378. EXCEPTION(EX_INTERNAL | 0x115);
  1379. return;
  1380. }
  1381. #endif
  1382. /* At least one of st(0), st(1) must be empty */
  1383. FPU_stack_underflow();
  1384. }
  1385. /*---------------------------------------------------------------------------*/
  1386. static FUNC_ST0 const trig_table_a[] = {
  1387. f2xm1, fyl2x, fptan, fpatan,
  1388. fxtract, fprem1, (FUNC_ST0) fdecstp, (FUNC_ST0) fincstp
  1389. };
  1390. void FPU_triga(void)
  1391. {
  1392. (trig_table_a[FPU_rm]) (&st(0), FPU_gettag0());
  1393. }
  1394. static FUNC_ST0 const trig_table_b[] = {
  1395. fprem, fyl2xp1, fsqrt_, fsincos, frndint_, fscale, (FUNC_ST0) fsin, fcos
  1396. };
  1397. void FPU_trigb(void)
  1398. {
  1399. (trig_table_b[FPU_rm]) (&st(0), FPU_gettag0());
  1400. }