0413b54c02
1997-08-10 18:48 Ulrich Drepper <drepper@cygnus.com> * Makeconfig: Define build-programs to no if not set and $(config-os) is none. * Makerules (+depfiles): Don't add $(others) if not build-programs. * Rules (others): Don't depend on $(install-bin), $(install-rootbin) and $(install-sbin) if not build-programs. * Makefile (subdirs): Remove login. * sysdeps/mach/hurd/Subdirs: Add login. * sysdeps/unix/Subdirs: Add login. * sysdeps/generic/sys/mman.h: Test feature macros before defining non-POSIX things. Add MAP_FAILED. * sysdeps/unix/bsd/osf/sys/mman.h: Likewise. * sysdeps/unix/bsd/sun/sunos4/sys/mman.h: Likewise. * sysdeps/unix/bsd/ultrix4/sys/mman.h: Likewise. * sysdeps/unix/sysv/irix4/sys/mman.h: Likewise. * sysdeps/unix/sysv/linux/sys/mman.h: Rewrite to not use kernel header but bits/mman.h. Test feature macros before definitions non-POSIX functions. * sysdeps/unix/sysv/linux/alpha/bits/mman.h: New file. * sysdeps/unix/sysv/linux/i386/bits/mman.h: New file. * sysdeps/unix/sysv/linux/m68k/bits/mman.h: New file. * sysdeps/unix/sysv/linux/mips/bits/mman.h: New file. * sysdeps/unix/sysv/linux/powerpc/bits/mman.h: New file. * sysdeps/unix/sysv/linux/sparc/bits/mman.h: New file. * sysdeps/unix/sysv/linux/sparc64/bits/mman.h: New file. * sysdeps/unix/sysv/linux/alpha/Dist: Add bits/mman.h. * sysdeps/unix/sysv/linux/i386/Dist: Likewise. * sysdeps/unix/sysv/linux/m68k/Dist: Likewise. * sysdeps/unix/sysv/linux/mips/Dist: Likewise. * sysdeps/unix/sysv/linux/powerpc/Dist: Likewise. * sysdeps/unix/sysv/linux/sparc/Dist: Likewise. * sysdeps/unix/sysv/linux/sparc64/Dist: New file. Likewise. * catgets/open_catalog.c (__open_catalog): Compare result of mmap with MAP_FAILED and not -1. * elf/dl-load.c (_dl_map_object_from_fd): Likewise. * elf/dl-minimal.c (malloc): Likewise. * elf/dl-misc.c (_dl_sysdep_read_whole_file): Likewise. * locale/loadlocale.c (_nl_load_locale): Likewise. * locale/programs/localedef.c: Likewise. * malloc/malloc.c (mmap_chunk): Likewise. 
(new_heap): Likewise. * string/stratcliff.c: Likewise. * string/tester.c: Add tests for stpcpy. * gmon/gmon.c (__monstartup): Use calloc instead of malloc+memset. * gmon/sys/gmon.h: Add prototype for write_profiling. * elf/dl-profile.c: Add decsriptions and implement reading of existing data in profiling file. * gmon/sys/gmon_out.h (GMON_SHOBJ_VERSION): New macro for shared lib profiling data. * sysdeps/stub/bits/libc-lock.h (__libc_once_define): Add new first parameter for class. * inet/inet_ntoa.c: Make once control variable static. Correctly handle case where key cannot be retrieved. * inet/Makefile (tests): Add tst-ntoa. * inet/tst-ntoa.c: New file. * manual/time.texi: Document localtime_r, gmtime_r, asctime_r, and ctime_r. Mention that tzname values must not be changed. * manual/users.texi: Document UTMP/WTMP handling functions. Mainly written by Mark Kettenis. * math/libm-test.c (cbrt_test): Add test for number with aboslute value < 1.0. * nss/nss_files/files-XXX.c (internal_setent): If opening of file failed with EGAIN return NSS_STATUS_TRYAGAIN. * nss/nss_files/files-alias.c (internal_setent): Likewise. * sysdeps/generic/bits/utmp.h: Pretty print. * sysdeps/i386/i586/strcpy.S: New file. Much faster implementation. * sysdeps/i386/i586/stpcpy.S: New file. * sysdeps/i386/i686/Implies: Don't fall back on i586 versions since these are less efficient than i486/i386 versions. * sysdeps/libm-i387/e_rem_pio2.c: Add empty file to prevent the version from libm-ieee754 be compiled since the later is not needed. * sysdeps/libm-i387/e_rem_pio2f.c: Likewise. * sysdeps/libm-i387/e_rem_pio2l.c: Likewise. * sysdeps/libm-i387/k_rem_pio2.c: Likewise. * sysdeps/libm-i387/k_rem_pio2f.c: Likewise. * sysdeps/libm-i387/k_rem_pio2l.c: Likewise. * sysdeps/m68k/fpu/e_rem_pio2.c: Likewise. * sysdeps/m68k/fpu/e_rem_pio2f.c: Likewise. * sysdeps/m68k/fpu/e_rem_pio2l.c: Likewise. * sysdeps/m68k/fpu/k_rem_pio2.c: Likewise. * sysdeps/m68k/fpu/k_rem_pio2f.c: Likewise. 
* sysdeps/m68k/fpu/k_rem_pio2l.c: Likewise. * sysdeps/libm-i387/s_cbrt.S: Fix several bugs. * sysdeps/libm-i387/s_cbrtf.S: Likewise. * sysdeps/libm-i387/s_cbrtl.S: Likewise. * sysdeps/unix/sysv/linux/if_index.c (if_indextoname): Correct little bug. * sysdeps/unix/sysv/linux/bits/socket.h (struct msghdr): Make field msg_iovlen of type int. * time/tzfile.c: Change return type of __tzstring to char *. * time/tzset.c: Likewise. Change definition of __tzstring. * time/tzset.c: Interpret no DST information in user provided time zone specification as it is meant: no DST. Patch by Paul Eggert <eggert@twinsun.com>. 1997-07-20 03:01 Geoff Keating <geoffk@ozemail.com.au> * sysdeps/elf/dl-load.c (add_name_to_object): New procedure. (_dl_map_object_from_fd): Use add_name_to_object. (_dl_map_object): If an object's SONAME is used to resolve a dependency, add it to the list of the object's names. * inet/getnameinfo.c: Make `domain' non-const. * sysdeps/unix/sysv/linux/powerpc/kernel_termios.c: Clean up. * math/test-fenv.c (feenv_nomask_test): Don't execute if FE_NOMASK_ENV is not defined, or if fesetenv(FE_NOMASK_ENV) sets errno to ENOSYS. * sysdeps/powerpc/dl-machine.h: Print proper error message on unknown reloc type (rather than using assert). * sysdeps/unix/sysv/linux/powerpc/profil-counter.h: New file. * sysdeps/unix/sysv/linux/powerpc/profil.c: Deleted. 1997-07-16 12:47 Geoff Keating <geoffk@ozemail.com.au> * sysdeps/powerpc/bits/fenv.h (feraiseexcept): New optimising macro. (feclearexcept): New optimising macro. (FE_NOMASK_ENV): Change to procedure so it can enable exceptions. (FE_ENABLED_ENV): Add. (FE_NONIEEE_ENV): Add. * sysdeps/powerpc/bits/fenv_const.c: Add __fe_enabled_env, __fe_nonieee_env; delete __fe_nomask_env. * sysdeps/powerpc/bits/fe_nomask.c: New file (stub warning until it gets implemented in the kernel). * sysdeps/powerpc/fraiseenv.c: Deal with chips that don't have FE_INVALID_SOFTWARE implemented. Use macros for bit names for clarity. 
* sysdeps/powerpc/fsetexcptflag.c: Likewise. * io/ftw.c: Don't compare holes in structures. * sysdeps/unix/sysv/linux/sys/sysmacros.h: Cast the result of the macros to `int', because otherwise it might be `long long' which the calling code is probably not expecting. * sysdeps/libm-ieee754/s_lround.c [NO_LONG_DOUBLE]: Fix a few bugs, document the existence of some more. * sysdeps/powerpc/s_llrint.c: New file. * sysdeps/powerpc/s_lrint.c: New file. * sysdeps/powerpc/s_llround.c: New file. * sysdeps/powerpc/s_lround.c: New file. * sysdeps/powerpc/s_sqrt.c: New file. * sysdeps/powerpc/s_sqrtf.c: New file. * sysdeps/powerpc/w_sqrt.s: New empty file. * sysdeps/powerpc/w_sqrtf.s: New empty file. * sysdeps/powerpc/t_sqrt.c: New file. * sysdeps/powerpc/test-arithf.c: New file. * sysdeps/powerpc/Makefile [subdir=math]: Add t_sqrt to support routines. Add test-arithf to test programs. * sysdeps/powerpc/bits/mathdef.h: Add FP_ILOGB0, FP_ILOGBNAN. * sysdeps/powerpc/strcmp.s: Simplify drastically. Now much neater, and possibly faster (or possibly slower, depending on input). 1997-06-08 22:55 Geoff Keating <geoffk@ozemail.com.au> * sysdeps/powerpc/fenvbits.h: Correct FE_DFL_ENV and FE_NOMASK_ENV macros. * sysdeps/powerpc/s_rint.c: New file. 1997-05-22 08:47 Geoff Keating <geoffk@ozemail.com.au> * sysdeps/powerpc/Makefile [subdir=math]: Add q_* routines. * sysdeps/powerpc/Dist: Add quad_float.h. * sysdeps/powerpc/q_dtoq.c: New file. * sysdeps/powerpc/q_itoq.c: New file. * sysdeps/powerpc/q_lltoq.c: New file. * sysdeps/powerpc/q_neg.c: New file. * sysdeps/powerpc/q_qtoi.c: New file. * sysdeps/powerpc/q_qtoll.c: New file. * sysdeps/powerpc/q_qtos.c: New file. * sysdeps/powerpc/q_qtou.c: New file. * sysdeps/powerpc/q_qtoull.c: New file. * sysdeps/powerpc/q_stoq.c: New file. * sysdeps/powerpc/q_ulltoq.c: New file. * sysdeps/powerpc/q_utoq.c: New file. * sysdeps/powerpc/quad_float.h: New file. * sysdeps/powerpc/test-arith.c: New file. * sysdeps/powerpc/fpu_control.h: Fix _FPU_GETCW. 
* sysdeps/powerpc/fegetround.c: Use mcrfs to be faster and not require a stack frame. * sysdeps/powerpc/bits/fenv.h: Include inline macro for fegetround. 1997-05-18 05:55 Geoff Keating <geoffk@ozemail.com.au> * sysdeps/powerpc/fenv_libc.h (fegetenv_register, fesetenv_register): Add 'volatile'. (set_fpscr_bit, reset_fpscr_bit): New macros, FPSCR_* constants to use with them. * sysdeps/powerpc/s_copysign.S: New file. * sysdeps/powerpc/s_copysignf.s: New file. * sysdeps/powerpc/s_fabs.S: New file. * sysdeps/powerpc/s_fabsf.s: New file. * sysdeps/powerpc/s_isnan.c: New file. * sysdeps/powerpc/s_isnanf.s: New file. * sysdeps/powerpc/s_rintf.c: New file. * sysdeps/powerpc/fenvbits.h: Make FE_INVALID the summary bit in the FPSCR, not the enable bit. * sysdeps/powerpc/fraiseexcpt.c: Consequent change to the above. * sysdeps/powerpc/fclrexcpt.c: Correct. * sysdeps/powerpc/fsetexcptflag.c: Correct. * sysdeps/powerpc/ftestexcpt.c: Is now much simpler. * sysdeps/powerpc/fgetexcptflg.c: Simplify. * sysdeps/powerpc/strlen.s: Schedule better, save 3 clocks :-). * sysdeps/powerpc/dl-machine.h (elf_machine_rela): Add comment explaining some reentrancy issues with lazy PLT entries. 1997-08-09 13:04 Mark Kettenis <kettenis@phys.uva.nl> * login/logout.c (logout): utmpname returns -1 on error. * login/libutil.map: Remove updwtmp. * login/getutline.c: Rename getutline to __getutline and make getutline a weak alias. Make getutxline a weak alias for __getutline. * login/getutid.c: Rename getutid to __getutid and make getutid a weak alias. Make getutxid a weak alias for __getutid. * libc.map: Add getutxid, getutxline. * login/utmpname.c (__utmpname): Reset backend right after backend endutent call. * login/utmp_file.c: Reordered functions. Remove unecessary header files. (getutent_r_file, pututline_file): Do not call setutent_file. At this point the file is guaranteed to be open (assert!). (getutid_r_file, getutline_r_file): Remove check for validity of file descriptor. 
At this point the file is guaranteed to be open. (getutent_r_file, internal_getut_r, getutline_r_file, pututline_file, updwtmp_file): Do not wait when unlocking file. * login/utmp_daemon.c: General cleanup and a bit of reordering. (getutent_r_daemon, pututline_daemon): Do not call setutent_daemon. At this point the socket is guaranteed to be open (assert!). (getutid_r_daemon, getutline_r_daemon): Do not check if daemon_sock is valid. At this point the socket is guaranteed to be open (assert!). * login/getutline_r.c: Remove unnecessary header files. (__getutline_r): Do not call backend setutent. * login/getutid_r.c: Remove unnecessary header files. (__getutid_r): Do not call backend setutent. * login/getutent_r.c: Remove unneccesary header files. (__libc_utmp_unknown_functions): Added getutid_r_unknown, getutline_r_unknown. (setutent_unknown): Only set file backend if setutent for the file backend was successful. (getutent_r_unknown, pututline_unknown): Call setutent_unknown instead of __setutent. Report failure if no backend was selected. (getutid_r_unknown): New function. (getutline_r_unknown): New function. (__endutent): Reset backend. This makes sure all backends are checked on the next setutent call. 1997-08-08 20:20 Thorsten Kukuk <kukuk@vt.uni-paderborn.de> * nis_cache.c: Replace dummy functions. * libc.map: Add xdr_sizeof symbol. * sunrpc/Makefile: Add xdr_sizeof to routines. * sunrpc/rpc/xdr.h: Add xdr_sizeof prototype. * sunrpc/xdr_sizeof.c: New, from tirpc 2.3. 1997-08-08 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/bits/libc-lock.h (__libc_once): Define correctly. 1997-08-07 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/hurd/profil.c (fetch_samples): Put parens in the right place. 1997-08-06 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/hurd/profil.c (fetch_samples): Do arithmetic on PC's in long long to avoid overflow. 
1997-08-07 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/bits/libc-lock.h (__libc_once, __libc_once_define): New macros. 1997-08-06 Andreas Jaeger <aj@arthur.rhein-neckar.de> * nis/Makefile (headers): Remove bits/nislib.h. 1997-08-06 14:54 Ulrich Drepper <drepper@cygnus.com> * sysdeps/mach/hurd/Subdirs: Add login. 1997-08-06 14:23 Klaus Espenlaub <kespenla@hydra.informatik.uni-ulm.de> * db/hash/hash.c (init_hash): Don't use stat() if it doesn't provide the preferred block size. * login/programs/database.c (store_state_entry): Don't compile if there is no ut_type field. (store_state_entry, store_process_entry): Use the ut_tv field for timestamps if supported. * login/programs/utmpdump.c (print_entry): Always use ut_tv field. * login/programs/xtmp.c: Fix numerous xtmp/utmp typos. Use the ut_tv field for timestamps if supported. * login/programs/xtmp.h: Fix xtmp/utmp typo. * sysdeps/posix/defs.c (stdstream): Change (PTR) to (void *). * sysdeps/stub/connect.c (connect): Change to __connect, add alias. * sysdeps/stub/send.c (send): Likewise. * sysdeps/stub/s_exp2f.c: Emit correct stub_warning(). * sysdeps/stub/statfs.c: Move stub_warning() to the usual place. * sysdeps/stub/init-first.c: Add definition of __libc_pid. 1997-08-05 13:28 Philip Blundell <pb@spring.nexus.co.uk> * sysdeps/standalone/arm/bits/errno.h: Add EISDIR, EOPNOTSUPP; tidy up formatting. * Makefile (subdirs): Remove `login'. * sysdeps/unix/Subdirs: New file; build `login' subdirectory for Unix systems. 1997-08-05 Andreas Schwab <schwab@issan.informatik.uni-dortmund.de> * sysdeps/generic/bits/utmpx.h: New file. * sysdeps/mach/hurd/Dist: Add some files. * sysdeps/mips/Dist: Likewise. * sysdeps/mips/mips64/Dist: Likewise. * sysdeps/sparc/Dist: Likewise. * sysdeps/unix/sysv/linux/mips/Dist: Likewise. * sysdeps/unix/sysv/linux/sparc/Dist: Likewise. * sysdeps/mips/mipsel/Dist: New file. * sysdeps/sparc64/elf/Dist: New file. * sysdeps/unix/sysv/linux/sparc64/Dist: New file. 
1997-08-05 Andreas Schwab <schwab@issan.informatik.uni-dortmund.de> * libc.map: Add missing symbols. 1997-08-05 Andreas Jaeger <aj@arthur.rhein-neckar.de> * manual/socket.texi: Correct typos. * manual/math.texi: Correct typos. * manual/time.texi (Formatting Date and Time): Likewise. 1997-08-04 13:06 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * gmon/gmon.c (write_gmon): New function; guts from _mcleanup. (_mcleanup): Use write_gmon. (write_profiling): This function can be safely called at any time to write a current histogram without interfering with ongoing profiling. * sysdeps/mach/hurd/profil.c (fetch_samples): Initialize NSAMPLES. 1997-08-01 17:53 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/hurd/profil.c (fetch_samples): Sample buffer need not be vm_deallocated; it's a stack buffer. (profil_vm_deallocate): Delete prototype. (#include <../mach/RPC_vm_deallocate_rpc.c>): Drop this inclusion. * sysdeps/mach/hurd/Makefile ($(common-objpfx)hurd/../mach/RPC_vm_deallocate_rpc.c): Delete this rule. * sysdeps/mach/hurd/profil.c (fetch_samples): New function, guts from profile_waiter. (profile_waiter): Use fetch_samples. (profil): When turning off profiling, fetch the last bunch of samples before disabling PC sampling. (fetch_samples): Add prototype. 1997-07-30 12:53 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/hurd/Makefile: Give normal rules for the mach RPC source included by profil.c instead of trying to use before-compile grot. 1997-07-23 15:04 Thomas Bushnell, n/BSG <thomas@gnu.ai.mit.edu> * sysdeps/mach/hurd/profil.c (profile_waiter): Do vm_deallocate after releasing lock. Use special RPC stubs and avoid assert, thus making this function entirely independent of the threadvar mechanism and of cthreads. (lock): Convert to be a spin lock instead of a mutex, so that the waiter thread need not use cthreads. Use a fork prepare hook instead of _hurd_fork_locks to make sure we are clean before forking. 
(fork_profil_child): Renamed from fork_profil. (profil_reply_port): New variable. (profil_vm_deallocate, profil_task_get_sampled_pcs): Special RPC stubs made by special hacks. * sysdeps/mach/hurd/Makefile (before-compile): Add the mach RPC source files that profil.c needs if we are in the gmon directory. * mach/setup-thread.c (__mach_setup_thread): Delete avoidance of a cthreads bug that hasn't existed for two years. * stdio-common/printf_fp.c (__printf_fp): Correct rounding of numbers * locale/programs/locale.c (print_escaped): New function. * time/australasia: Likewise. (open_database, synchronize_database, initialize_database): * nss/nss_files/files-netgrp.c (_nss_netgroup_parseline): Don't * Makerules (load-map-file): Correctly handle missing map file. cannot rely on M_SQRT2 being defined. (log1p): Use __M_SQRT2 not M_SQRT2.
550 lines
14 KiB
C
550 lines
14 KiB
C
/* Add or subtract two 128-bit floating point values. C prototype.
|
|
Copyright (C) 1997 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Library General Public License as
|
|
published by the Free Software Foundation; either version 2 of the
|
|
License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Library General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Library General Public
|
|
License along with the GNU C Library; see the file COPYING.LIB. If not,
|
|
write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
Boston, MA 02111-1307, USA. */
|
|
|
|
#include <quad_float.h>
|
|
|
|
/* Add 'a' to 'b' and put the result in 'result', but treat a[0]=axx,
|
|
b[0]=bxx. bxx differs from b[0] only in the high bit, similarly axx. */
|
|
/* Exceptions to raise:
|
|
- Invalid (SNaN)
|
|
- Invalid (Inf-Inf)
|
|
- Overflow
|
|
- Underflow
|
|
- Inexact
|
|
*/
|
|
|
|
/* Handle cases where exponent of a or b is maximum. */
|
|
static void
|
|
handle_max_exponent(unsigned result[4],
|
|
const unsigned a[4], const unsigned b[4],
|
|
const unsigned axx, /* Treat as a[0]. */
|
|
const unsigned bxx, /* Treat as b[0]. */
|
|
const unsigned ax, /* axx >> 16 & 0x7fff. */
|
|
const unsigned bx) /* bxx >> 16 & 0x7fff. */
|
|
{
|
|
int ax_ismax, bx_ismax;
|
|
unsigned a1,a2,a3, b1,b2,b3;
|
|
int a_zeromant, b_zeromant;
|
|
|
|
ax_ismax = ax == 0x7fff;
|
|
bx_ismax = bx == 0x7fff;
|
|
|
|
assert(ax_ismax || bx_ismax);
|
|
|
|
a1 = a[1]; a2 = a[2]; a3 = a[3];
|
|
b1 = b[1]; b2 = b[2]; b3 = b[3];
|
|
|
|
a_zeromant = (axx & 0xffff | a1 | a2 | a3) == 0;
|
|
b_zeromant = (bxx & 0xffff | b1 | b2 | b3) == 0;
|
|
|
|
/* Deal with SNaNs. */
|
|
if ( ax_ismax && !a_zeromant && (axx & 0x8000) == 0
|
|
|| bx_ismax && !b_zeromant && (bxx & 0x8000) == 0)
|
|
{
|
|
set_fpscr_bit(FPSCR_VXSNAN);
|
|
axx |= 0x8000; /* Demote the SNaN to a QNaN (whichever of */
|
|
bxx |= 0x8000; /* a or b it was). */
|
|
}
|
|
/* Deal with Inf-Inf. */
|
|
else if (a_zeromant && b_zeromant && (axx ^ bxx) == 0x80000000)
|
|
{
|
|
set_fpscr_bit(FPSCR_VXISI);
|
|
bxx |= 0x8000; /* Return an appropriate QNaN. */
|
|
}
|
|
|
|
/* Return the lexicographically larger of a or b, ignoring the sign
|
|
bits. */
|
|
if ((axx & 0x7fffffff) > (bxx & 0x7fffffff)) goto return_a;
|
|
else if ((axx & 0x7fffffff) < (bxx & 0x7fffffff)) goto return_b;
|
|
else if (a1 > b1) goto return_a;
|
|
else if (a1 < b1) goto return_b;
|
|
else if (a2 > b2) goto return_a;
|
|
else if (a2 < b2) goto return_b;
|
|
else if (a3 > b3) goto return_a; /* I've clearly been writing too */
|
|
else if (a3 < b3) goto return_b; /* much Fortran... */
|
|
|
|
/* If they are equal except for the sign bits, return 'b'. */
|
|
|
|
return_b:
|
|
result[0] = bxx; result[1] = b1; result[2] = b2; result[3] = b3;
|
|
return;
|
|
|
|
return_a:
|
|
result[0] = axx; result[1] = a1; result[2] = a2; result[3] = a3;
|
|
return;
|
|
}
|
|
|
|
/* Renormalise and output a FP number.

   'r0'..'r3' hold the unnormalised mantissa ('r0' most significant),
   'ax' is its exponent field and the sign is taken from the top bit of
   'axx'.  The mantissa is shifted left until either its leading one
   reaches bit 16 of word 0 or the exponent field would drop below the
   amount still to be shifted, and the packed value is stored in
   'result'.

   This assumes cntlzw(x) yields the number of leading zero bits of x
   and 32 for x == 0 -- TODO confirm against its definition, which is
   not in this file.  */
static void
renormalise_value(unsigned result[4],
		  const unsigned axx,
		  unsigned ax,
		  unsigned r0,
		  unsigned r1,
		  unsigned r2,
		  unsigned r3)
{
  int lshift;	/* Number of bits to shift the mantissa left.  */

  /* Special case for zero.  Checked first so that an all-zero mantissa
     never reaches the shift-count assertions below.  */
  if ((r0 | r1 | r2 | r3) == 0)
    {
      result[0] = axx & 0x80000000;
      result[1] = result[2] = result[3] = 0;
      return;
    }

  if (r0 != 0 || cntlzw(r1) < 16 || 32 > ax-1)
    {
      /* The second term adds cntlzw(r1) only when r0 is zero, i.e.
	 when cntlzw(r0) is 32 and -(32 >> 5) is all ones.  */
      lshift = cntlzw(r0)-15 + (-(cntlzw(r0) >> 5) & cntlzw(r1));
      /* NOTE(review): this can fire for r0 == 0 with cntlzw(r1) == 15
	 (shift of exactly 32), and for small exponents before the
	 clamp below gets a chance to reduce the shift -- confirm the
	 intended bounds.  */
      assert(lshift < 32);
      if (lshift > ax-1)
	{
	  /* Not enough exponent left: shift as far as possible.  */
	  ax--;
	  lshift = ax;
	}

      /* NOTE(review): for lshift == 0 the right shifts below are by 32
	 bits, which ISO C leaves undefined -- presumably a result of
	 zero is expected; verify.  */
      result[0] = ((axx & 0x80000000)
		   | ((ax-lshift) << 16)
		   | ((r0 << lshift) & 0xffff)
		   | ((r1 >> (32-lshift)) & 0xffff));
      result[1] = (r1 << lshift) | (r2 >> (32-lshift));
      result[2] = (r2 << lshift) | (r3 >> (32-lshift));
      result[3] = r3 << lshift;
      return;
    }

  /* From here on r0 is zero, so the mantissa moves left by at least one
     whole word and the last result word is always zero.  */
  result[3] = 0;

  /* Move left by further whole words while the top remaining word is
     empty and there is exponent to spare.  Only a zero word may be
     dropped here; discarding a nonzero r1 would lose the most
     significant bits.  */
  while (r1 == 0 && cntlzw(r2) >= 16 && 64 <= ax-1)
    {
      ax -= 32;
      r1 = r2; r2 = r3; r3 = 0;
    }

  lshift = cntlzw(r1)-15 + (-(cntlzw(r1) >> 5) & cntlzw(r2));
  /* NOTE(review): as above, this is checked before the clamp.  */
  assert(lshift < 32);
  if (lshift > ax-1-32)
    {
      ax--;
      lshift = ax-32;
    }

  result[0] = ((axx & 0x80000000)
	       | ((ax-lshift-32) << 16)
	       | ((r1 << lshift) & 0xffff)
	       | ((r2 >> (32-lshift)) & 0xffff));
  result[1] = (r2 << lshift) | (r3 >> (32-lshift));
  result[2] = r3 << lshift;
}
|
|
|
|
/* Handle the case where one or both numbers are denormalised or zero.
   This case almost never happens, so we don't slow the main code
   with it.

   'axx' and 'bxx' are used in place of a[0] and b[0]; 'ax' and 'bx'
   are their exponent fields, at least one of which must be zero.

   Implemented so far:
     - one operand is a zero and the other is not: the other operand is
       returned unchanged (x + 0 is exactly x);
     - both operands are zeros of the same sign: that zero is returned.

   TODO: the sum of two zeros of opposite sign (whose sign depends on
   the rounding mode) and any sum involving a nonzero denormal are not
   implemented; 'result' is left unwritten for them.  */
static void
handle_min_exponent(unsigned result[4],
		    const unsigned a[4], const unsigned b[4],
		    const unsigned axx,	/* Treat as a[0].  */
		    const unsigned bxx,	/* Treat as b[0].  */
		    const unsigned ax,	/* axx >> 16 & 0x7fff.  */
		    const unsigned bx)	/* bxx >> 16 & 0x7fff.  */
{
  int a_zero, b_zero;

  assert(ax == 0 || bx == 0);

  /* A value is zero when its exponent field and every mantissa bit are
     zero; the sign bit does not matter.  */
  a_zero = ax == 0 && ((axx & 0xffff) | a[1] | a[2] | a[3]) == 0;
  b_zero = bx == 0 && ((bxx & 0xffff) | b[1] | b[2] | b[3]) == 0;

  if (b_zero && (!a_zero || (int)(axx ^ bxx) >= 0))
    {
      /* a + 0 == a; this also covers two zeros with equal signs.  */
      result[0] = axx; result[1] = a[1]; result[2] = a[2]; result[3] = a[3];
      return;
    }

  if (a_zero && !b_zero)
    {
      /* 0 + b == b.  */
      result[0] = bxx; result[1] = b[1]; result[2] = b[2]; result[3] = b[3];
      return;
    }

  /* TODO: zeros of opposite sign, and denormal arithmetic.  */
}
|
|
|
|
/* Add a+b+cin modulo 2^32, put result in 'r' and carry in 'cout'.
   The sum is formed in 64 bits so that the carry out of bit 31 is
   visible.  All inputs are read before either output is written, so
   'r' and 'cout' may name the same objects as the inputs.  */
#define addc(r,cout,a,b,cin) \
  do { \
    unsigned long long addc_tmp \
      = (unsigned long long) (a) + (b) + (cin); \
    (cout) = (unsigned) (addc_tmp >> 32); \
    (r) = (unsigned) addc_tmp; \
  } while (0)
|
|
|
|
/* Calculate a-b-cin modulo 2^32, put result in 'r' and borrow in 'cout'.
   'cin' is a borrow in (0 or 1); 'cout' is 1 exactly when the true
   difference is negative.  A multi-word subtraction therefore starts
   with cin = 0 at the least significant word and feeds each 'cout'
   into the next more significant word, and a final 'cout' of 1 means
   that b was larger than a.  The difference is formed in 64 bits so
   that the borrow is visible in the top bit.  */
#define subc(r,cout,a,b,cin) \
  do { \
    unsigned long long subc_tmp \
      = (unsigned long long) (a) - (b) - (cin); \
    (cout) = (unsigned) (subc_tmp >> 63); \
    (r) = (unsigned) subc_tmp; \
  } while (0)
|
|
|
|
/* Handle the case where both exponents are the same. This requires quite
|
|
a different algorithm than the general case. */
|
|
static void
|
|
handle_equal_exponents(unsigned result[4],
|
|
const unsigned a[4], const unsigned b[4],
|
|
const unsigned axx, /* Treat as a[0]. */
|
|
const unsigned bxx, /* Treat as b[0]. */
|
|
unsigned ax) /* [ab]xx >> 16 & 0x7fff. */
|
|
{
|
|
unsigned a1,a2,a3, b1,b2,b3;
|
|
int roundmode;
|
|
unsigned carry, r0;
|
|
|
|
a1 = a[1]; a2 = a[2]; a3 = a[3];
|
|
b1 = b[1]; b2 = b[2]; b3 = b[3];
|
|
|
|
if ((int)(axx ^ bxx) >= 0)
|
|
{
|
|
int roundmode;
|
|
|
|
/* Adding. */
|
|
roundmode = fegetround();
|
|
|
|
/* What about overflow? */
|
|
if (ax == 0x7ffe)
|
|
{
|
|
/* Oh no! Too big! */
|
|
/* Result:
|
|
rounding result
|
|
-------- ------
|
|
nearest return Inf with sign of a,b
|
|
zero return nearest possible non-Inf value with
|
|
sign of a,b
|
|
+Inf return +Inf if a,b>0, otherwise return
|
|
value just before -Inf.
|
|
-Inf return +Inf if a,b>0, otherwise return
|
|
value just before -Inf.
|
|
*/
|
|
set_fpscr_bit(FPSCR_OX);
|
|
/* Overflow always produces inexact result. */
|
|
set_fpscr_bit(FPSCR_XX);
|
|
|
|
if ( roundmode == FE_TONEAREST
|
|
|| roundmode == FE_UPWARD && (int)axx >= 0
|
|
|| roundmode == FE_DOWNWARD && (int)axx < 0)
|
|
{
|
|
result[3] = result[2] = result[1] = 0;
|
|
result[0] = axx & 0xffff0000 | 0x7fff0000;
|
|
}
|
|
else
|
|
{
|
|
result[3] = result[2] = result[1] = 0xffffffff;
|
|
result[0] = axx & 0xfffe0000 | 0x7ffeffff;
|
|
}
|
|
return;
|
|
}
|
|
|
|
/* We need to worry about rounding/inexact here. Do it like this: */
|
|
if (a3 + b3 & 1)
|
|
{
|
|
/* Need to round. Upwards? */
|
|
set_fpscr_bit(FPSCR_XX);
|
|
carry = ( roundmode == FE_NEAREST && (a3 + b3 & 2) != 0
|
|
|| roundmode == FE_UPWARD && (int)axx >= 0
|
|
|| roundmode == FE_DOWNWARD && (int)axx < 0);
|
|
}
|
|
else
|
|
carry = 0; /* Result will be exact. */
|
|
|
|
/* Perform the addition. */
|
|
addc(a3,carry,a3,b3,carry);
|
|
addc(a2,carry,a2,b2,carry);
|
|
addc(a1,carry,a1,b1,carry);
|
|
r0 = (axx & 0xffff) + (bxx & 0xffff) + carry;
|
|
|
|
/* Shift right by 1. */
|
|
result[3] = a3 >> 1 | a2 << 31;
|
|
result[2] = a2 >> 1 | a1 << 31;
|
|
result[1] = a1 >> 1 | r0 << 31;
|
|
/* Exponent of result is exponent of inputs plus 1.
|
|
Sign of result is common sign of inputs. */
|
|
result[0] = r0 >> 1 & 0xffff | axx + 0x10000 & 0xffff0000;
|
|
}
|
|
else
|
|
{
|
|
/* Subtracting. */
|
|
|
|
/* Perform the subtraction, a-b. */
|
|
subc(a3,carry,a3,b3,0);
|
|
subc(a2,carry,a2,b2,carry);
|
|
subc(a1,carry,a1,b1,carry);
|
|
subc(r0,carry,a0&0xffff,b0&0xffff,carry);
|
|
|
|
/* Maybe we should have calculated b-a... */
|
|
if (carry)
|
|
{
|
|
subc(a3,carry,0,a3,0);
|
|
subc(a2,carry,0,a2,carry);
|
|
subc(a1,carry,0,a1,carry);
|
|
subc(r0,carry,0,r0,carry);
|
|
axx ^= 0x80000000;
|
|
}
|
|
|
|
renormalise_value(result, axx, ax, r0, a1, a2, a3);
|
|
}
|
|
}
|
|
|
|
|
|
/* General-case addition of 'a' and 'b' into 'result', using 'axx' and
   'bxx' in place of a[0] and b[0].

   Operands with a maximum or zero exponent field, and operands with
   equal exponents, are passed on to the dedicated handlers.  Otherwise
   the operand with the smaller exponent is shifted right to line up
   with the other one, and the bits shifted out are collected in 'b4'.

   TODO: this routine is unfinished.  After the mantissas are added,
   'result' is only partly written (words 0 and 1, and only when the
   sum carried into bit 17 of word 0), no rounding is done, and the
   subtraction case is empty.  */
static void
add(unsigned result[4], const unsigned a[4], const unsigned b[4],
    unsigned axx, unsigned bxx)
{
  int ax, bx, diff, carry;
  unsigned a0,a1,a2,a3, b0,b1,b2,b3,b4, sdiff;

  ax = axx >> 16 & 0x7fff;
  bx = bxx >> 16 & 0x7fff;

  /* Deal with NaNs and Inf.  */
  if (ax == 0x7fff || bx == 0x7fff)
    {
      handle_max_exponent(result, a, b, axx, bxx, ax, bx);
      return;
    }
  /* Deal with denorms and zero.  */
  if (ax == 0 || bx == 0)
    {
      handle_min_exponent(result, a, b, axx, bxx, ax, bx);
      return;
    }
  /* Finally, one special case, when both exponents are equal.  */
  if (ax == bx)
    {
      handle_equal_exponents(result, a, b, axx, bxx, ax);
      return;
    }

  /* Top bit set when the signs differ.  */
  sdiff = axx ^ bxx;
  /* Swap a and b if b has a larger magnitude than a, so that a will have
     the larger magnitude.  */
  if (ax < bx)
    {
      const unsigned *t;
      t = b; b = a; a = t;
      diff = bx - ax;
      ax = bx;
      axx = bxx;
    }
  else
    diff = ax - bx;

  /* Unpack the mantissas, making the hidden bit (0x10000) explicit.  */
  a0 = (a[0] & 0xffff) | 0x10000; a1 = a[1]; a2 = a[2]; a3 = a[3];
  b0 = (b[0] & 0xffff) | 0x10000; b1 = b[1]; b2 = b[2]; b3 = b[3];

  /* Shift b right by 'diff' bits.  Whole words are moved first and
     'diff' is reduced to the remaining bit count for that range.
     NOTE(review): outside the first range the reduced 'diff' can be 0,
     which makes the '32-diff' shifts below a shift by 32 bits
     (undefined in ISO C) -- presumably zero is expected; verify.  */
  if (diff < 32)
    {
      b4 = b3 << (32-diff);
      b3 = (b3 >> diff) | (b2 << (32-diff));
      b2 = (b2 >> diff) | (b1 << (32-diff));
      b1 = (b1 >> diff) | (b0 << (32-diff));
      b0 = b0 >> diff;
    }
  else if (diff < 64)
    {
      diff -= 32;
      /* NOTE(review): 'diff' is below 32 here, so '(diff == 32)' is
	 always 0 and all of b3 is OR-ed into b4 -- confirm how the
	 lost bits were meant to be folded in.  */
      b4 = (b3 & 1) | (b3 >> (diff == 32)) | (b2 << (32-diff));
      b3 = (b2 >> diff) | (b1 << (32-diff));
      b2 = (b1 >> diff) | (b0 << (32-diff));
      b1 = b0 >> diff;
      b0 = 0;
    }
  else if (diff < 96)
    {
      /* Two whole words go first; without this reduction every shift
	 count below would be outside 0..31.  */
      diff -= 64;
      b4 = b2 | b3 | (b1 << (32-diff));
      b3 = (b1 >> diff) | (b0 << (32-diff));
      b2 = b0 >> diff;
      b1 = b0 = 0;
    }
  else if (diff < 128)
    {
      /* Three whole words go first.  */
      diff -= 96;
      b4 = b1 | b2 | b3 | (b0 << (32-diff));
      b3 = b0 >> diff;
      b2 = b1 = b0 = 0;
    }
  else
    {
      /* b lies entirely below a's last bit; only its nonzero-ness
	 survives, in b4.  */
      b4 = b0|b1|b2|b3;
      b3 = b2 = b1 = b0 = 0;
    }

  /* Now, two cases: one for addition, one for subtraction.  */
  if ((int)sdiff >= 0)
    {
      /* Addition.  */

      /* Perform the addition.  */
      addc(a3,carry,a3,b3,0);
      addc(a2,carry,a2,b2,carry);
      addc(a1,carry,a1,b1,carry);
      addc(a0,carry,a0,b0,carry);

      if (a0 & 0x20000)
	{
	  /* Need to renormalise by shifting right.  */
	  /* Shift right by 1.  */
	  b4 = b4 | (a3 << 31);
	  a3 = (a3 >> 1) | (a2 << 31);
	  a2 = (a2 >> 1) | (a1 << 31);
	  result[1] = (a1 >> 1) | (a0 << 31);
	  /* Exponent of result is exponent of inputs plus 1.
	     Sign of result is common sign of inputs.  */
	  result[0] = ((a0 >> 1) & 0xffff) | ((axx + 0x10000) & 0xffff0000);
	  /* TODO: round using b4 and store a2/a3 into result[2] and
	     result[3].  */
	}

      /* TODO: the sum that needs no renormalising is not stored.  */
    }
  else
    {
      /* Subtraction.  */

      /* TODO: not written yet.  */
    }
}
|
|
|
|
/* Add the absolute values of two 128-bit floating point values,
|
|
give the result the sign of one of them. The only exception this
|
|
can raise is for SNaN. */
|
|
static void
|
|
aadd(unsigned result[4], const unsigned a[4], const unsigned b[4])
|
|
{
|
|
unsigned ax, bx, xd;
|
|
const unsigned *sml;
|
|
unsigned t0,t1,t2,t3,tx, s0,s1,s2,s3,s4, carry;
|
|
int rmode, xdelta, shift;
|
|
|
|
ax = a[0] >> 16 & 0x7fff;
|
|
bx = b[0] >> 16 & 0x7fff;
|
|
|
|
/* Deal with . */
|
|
if (ax == 0x7fff)
|
|
{
|
|
t0 = a[0]; t1 = a[1]; t2 = a[2]; t3 = a[3];
|
|
/* Check for SNaN. */
|
|
if ((t0 & 0x8000) == 0
|
|
&& (t0 & 0x7fff | t1 | t2 | t3) != 0)
|
|
set_fpscr_bit(FPSCR_VXSNAN);
|
|
/* Return b. */
|
|
result[0] = t0; result[1] = t1; result[2] = t2; result[3] = t3;
|
|
return;
|
|
}
|
|
/* Deal with b==Inf or b==NaN. */
|
|
if (bx == 0x7fff)
|
|
{
|
|
t0 = b[0]; t1 = b[1]; t2 = b[2]; t3 = b[3];
|
|
/* Check for SNaN. */
|
|
if ((t0 & 0x8000) == 0
|
|
&& (t0 & 0x7fff | t1 | t2 | t3) != 0)
|
|
set_fpscr_bit(FPSCR_VXSNAN);
|
|
/* Return b. */
|
|
result[0] = t0; result[1] = t1; result[2] = t2; result[3] = t3;
|
|
return;
|
|
}
|
|
|
|
/* Choose the larger of the two to be 't', and the smaller to be 's'. */
|
|
if (ax > bx)
|
|
{
|
|
t0 = a[0] & 0xffff | (ax != 0) << 16;
|
|
t1 = a[1]; t2 = a[2]; t3 = a[3]; tx = ax;
|
|
s0 = b[0] & 0xffff | (bx != 0) << 16;
|
|
s1 = b[1]; s2 = b[2]; s3 = b[3];
|
|
xd = ax-bx;
|
|
}
|
|
else
|
|
{
|
|
t0 = b[0] & 0xffff | (bx != 0) << 16;
|
|
t1 = b[1]; t2 = b[2]; t3 = b[3]; tx = bx;
|
|
s0 = a[0] & 0xffff | (ax != 0) << 16;
|
|
s1 = a[1]; s2 = a[2]; s3 = a[3];
|
|
sml = a;
|
|
xd = bx-ax;
|
|
}
|
|
|
|
/* Shift 's2' right by 'xd' bits. */
|
|
switch (xd >> 5)
|
|
{
|
|
case 0:
|
|
s4 = 0;
|
|
break;
|
|
case 1:
|
|
s4 = s3; s3 = s2; s2 = s1; s1 = s0; s0 = 0;
|
|
break;
|
|
case 2:
|
|
s4 = s2 | s3 != 0;
|
|
s3 = s1; s2 = s0; s1 = s0 = 0;
|
|
break;
|
|
case 3:
|
|
s4 = s1 | (s3|s2) != 0;
|
|
s3 = s0; s2 = s1 = s0 = 0;
|
|
break;
|
|
default:
|
|
s4 = s0 | (s3|s2|s1) != 0;
|
|
s3 = s2 = s1 = s0 = 0;
|
|
}
|
|
xd = xd & 0x1f;
|
|
if (xd != 0)
|
|
{
|
|
s4 = s4 >> xd | (s4 << 32-xd) != 0 | s3 << 32-xd;
|
|
s3 = s3 >> xd | s2 << 32-xd;
|
|
s2 = s2 >> xd | s1 << 32-xd;
|
|
s1 = s1 >> xd | s0 << 32-xd;
|
|
s0 = s0 >> xd;
|
|
}
|
|
|
|
/* Do the addition. */
|
|
#define addc(r,cout,a,b,cin) \
|
|
do { \
|
|
unsigned long long addc_tmp = (a)+(b)+(cin);
|
|
(cout) = addc_tmp >> 32;
|
|
(r) = addc_tmp;
|
|
}
|
|
addc(t3,carry,t3,s3,0);
|
|
addc(t2,carry,t2,s2,carry);
|
|
addc(t1,carry,t1,s1,carry);
|
|
t0 = t0 + s0 + carry;
|
|
|
|
/* Renormalise. */
|
|
xdelta = 15-cntlzw(t0);
|
|
if (tx + xdelta <= 0x7fff)
|
|
shift = xdelta;
|
|
else
|
|
{
|
|
}
|
|
}
|
|
|
|
/* Add two 128-bit floating point values.

   When the sign bits of 'a' and 'b' agree their magnitudes are added,
   otherwise they are subtracted.  The sign bit is tested with a mask:
   a[0] and b[0] are unsigned, so comparing their exclusive-or against
   zero with '>=' would always be true.

   NOTE(review): asubtract is not defined in the visible part of this
   file -- confirm where it comes from.  */
void
__q_add(unsigned result[4], const unsigned a[4], const unsigned b[4])
{
  if (((a[0] ^ b[0]) & 0x80000000) == 0)
    aadd(result, a, b);
  else
    asubtract(result, a, b);
}
|
|
|
|
/* Subtract two 128-bit floating point values.

   When the sign bits of 'a' and 'b' differ, a - b adds the magnitudes;
   when they agree the magnitudes are subtracted.  The sign bit is
   tested with a mask: a[0] and b[0] are unsigned, so comparing their
   exclusive-or against zero with '<' would always be false.

   NOTE(review): asubtract is not defined in the visible part of this
   file -- confirm where it comes from.  */
void
__q_sub(unsigned result[4], const unsigned a[4], const unsigned b[4])
{
  if (((a[0] ^ b[0]) & 0x80000000) != 0)
    aadd(result, a, b);
  else
    asubtract(result, a, b);
}
|