src/compiler/float-tran.lisp

   1 ;;;; This file contains floating-point-specific transforms, and may be
   2 ;;;; somewhat implementation-dependent in its assumptions of what the
   3 ;;;; formats are.
   4
   5 ;;;; This software is part of the SBCL system. See the README file for
   6 ;;;; more information.
   7 ;;;;
   8 ;;;; This software is derived from the CMU CL system, which was
   9 ;;;; written at Carnegie Mellon University and released into the
  10 ;;;; public domain. The software is in the public domain and is
  11 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
  12 ;;;; files for more information.
  13
  14 (in-package "SB!C")
  15 \f
  16 ;;;; coercions
  17
  18 (defknown %single-float (real) single-float (movable foldable flushable))
  19 (defknown %double-float (real) double-float (movable foldable flushable))
  20
  21 (deftransform float ((n &optional f) (* &optional single-float) *)
  22   '(%single-float n))
  23
  24 (deftransform float ((n f) (* double-float) *)
  25   '(%double-float n))
  26
  27 (deftransform %single-float ((n) (single-float) *)
  28   'n)
  29
  30 (deftransform %double-float ((n) (double-float) *)
  31   'n)
  32
  33 ;;; RANDOM
  34 (macrolet ((frob (fun type)
  35              `(deftransform random ((num &optional state)
  36                                     (,type &optional *) *)
  37                 "Use inline float operations."
  38                 '(,fun num (or state *random-state*)))))
  39   (frob %random-single-float single-float)
  40   (frob %random-double-float double-float))
  41
  42 ;;; Mersenne Twister RNG
  43 ;;;
  44 ;;; FIXME: It's unpleasant to have RANDOM functionality scattered
  45 ;;; through the code this way. It would be nice to move this into the
  46 ;;; same file as the other RANDOM definitions.
  47 (deftransform random ((num &optional state)
  48                       ((integer 1 #.(expt 2 32)) &optional *))
  49   ;; FIXME: I almost conditionalized this as #!+sb-doc. Find some way
  50   ;; of automatically finding #!+sb-doc in proximity to DEFTRANSFORM
  51   ;; to let me scan for places that I made this mistake and didn't
  52   ;; catch myself.
  53   "use inline (UNSIGNED-BYTE 32) operations"
  54   (let ((num-high (numeric-type-high (continuation-type num))))
  55     (when (null num-high)
  56       (give-up-ir1-transform))
  57     (cond ((constant-continuation-p num)
  58            ;; Check the worst case sum absolute error for the random number
  59            ;; expectations.
  60            (let ((rem (rem (expt 2 32) num-high)))
  61              (unless (< (/ (* 2 rem (- num-high rem)) num-high (expt 2 32))
  62                         (expt 2 (- sb!kernel::random-integer-extra-bits)))
  63                (give-up-ir1-transform
  64                 "The random number expectations are inaccurate."))
  65              (if (= num-high (expt 2 32))
  66                  '(random-chunk (or state *random-state*))
  67                  #!-x86 '(rem (random-chunk (or state *random-state*)) num)
  68                  #!+x86
  69                  ;; Use multiplication, which is faster.
  70                  '(values (sb!bignum::%multiply
  71                            (random-chunk (or state *random-state*))
  72                            num)))))
  73           ((> num-high random-fixnum-max)
  74            (give-up-ir1-transform
  75             "The range is too large to ensure an accurate result."))
  76           #!+x86
  77           ((< num-high (expt 2 32))
  78            '(values (sb!bignum::%multiply (random-chunk (or state
  79                                                             *random-state*))
  80                      num)))
  81           (t
  82            '(rem (random-chunk (or state *random-state*)) num)))))
  83 \f
  84 ;;;; float accessors
  85
  86 (defknown make-single-float ((signed-byte 32)) single-float
  87   (movable foldable flushable))
  88
  89 (defknown make-double-float ((signed-byte 32) (unsigned-byte 32)) double-float
  90   (movable foldable flushable))
  91
  92 (defknown single-float-bits (single-float) (signed-byte 32)
  93   (movable foldable flushable))
  94
  95 (defknown double-float-high-bits (double-float) (signed-byte 32)
  96   (movable foldable flushable))
  97
  98 (defknown double-float-low-bits (double-float) (unsigned-byte 32)
  99   (movable foldable flushable))
 100
 101 (deftransform float-sign ((float &optional float2)
 102                           (single-float &optional single-float) *)
 103   (if float2
 104       (let ((temp (gensym)))
 105         `(let ((,temp (abs float2)))
 106           (if (minusp (single-float-bits float)) (- ,temp) ,temp)))
 107       '(if (minusp (single-float-bits float)) -1f0 1f0)))
 108
 109 (deftransform float-sign ((float &optional float2)
 110                           (double-float &optional double-float) *)
 111   (if float2
 112       (let ((temp (gensym)))
 113         `(let ((,temp (abs float2)))
 114           (if (minusp (double-float-high-bits float)) (- ,temp) ,temp)))
 115       '(if (minusp (double-float-high-bits float)) -1d0 1d0)))
 116 \f
 117 ;;;; DECODE-FLOAT, INTEGER-DECODE-FLOAT, and SCALE-FLOAT
 118
 119 (defknown decode-single-float (single-float)
 120   (values single-float single-float-exponent (single-float -1f0 1f0))
 121   (movable foldable flushable))
 122
 123 (defknown decode-double-float (double-float)
 124   (values double-float double-float-exponent (double-float -1d0 1d0))
 125   (movable foldable flushable))
 126
 127 (defknown integer-decode-single-float (single-float)
 128   (values single-float-significand single-float-int-exponent (integer -1 1))
 129   (movable foldable flushable))
 130
 131 (defknown integer-decode-double-float (double-float)
 132   (values double-float-significand double-float-int-exponent (integer -1 1))
 133   (movable foldable flushable))
 134
 135 (defknown scale-single-float (single-float fixnum) single-float
 136   (movable foldable flushable))
 137
 138 (defknown scale-double-float (double-float fixnum) double-float
 139   (movable foldable flushable))
 140
 141 (deftransform decode-float ((x) (single-float) *)
 142   '(decode-single-float x))
 143
 144 (deftransform decode-float ((x) (double-float) *)
 145   '(decode-double-float x))
 146
 147 (deftransform integer-decode-float ((x) (single-float) *)
 148   '(integer-decode-single-float x))
 149
 150 (deftransform integer-decode-float ((x) (double-float) *)
 151   '(integer-decode-double-float x))
 152
 153 (deftransform scale-float ((f ex) (single-float *) *)
 154   (if (and #!+x86 t #!-x86 nil
 155            (csubtypep (continuation-type ex)
 156                       (specifier-type '(signed-byte 32))))
 157       '(coerce (%scalbn (coerce f 'double-float) ex) 'single-float)
 158       '(scale-single-float f ex)))
 159
 160 (deftransform scale-float ((f ex) (double-float *) *)
 161   (if (and #!+x86 t #!-x86 nil
 162            (csubtypep (continuation-type ex)
 163                       (specifier-type '(signed-byte 32))))
 164       '(%scalbn f ex)
 165       '(scale-double-float f ex)))
 166
 167 ;;; What is the CROSS-FLOAT-INFINITY-KLUDGE?
 168 ;;;
 169 ;;; SBCL's own implementation of floating point supports floating
 170 ;;; point infinities. Some of the old CMU CL :PROPAGATE-FLOAT-TYPE and
 171 ;;; :PROPAGATE-FUN-TYPE code, like the DEFOPTIMIZERs below, uses this
 172 ;;; floating point support. Thus, we have to avoid running it on the
 173 ;;; cross-compilation host, since we're not guaranteed that the
 174 ;;; cross-compilation host will support floating point infinities.
 175 ;;;
 176 ;;; If we wanted to live dangerously, we could conditionalize the code
 177 ;;; with #+(OR SBCL SB-XC) instead. That way, if the cross-compilation
 178 ;;; host happened to be SBCL, we'd be able to run the infinity-using
 179 ;;; code. Pro:
 180 ;;;   * SBCL itself gets built with more complete optimization.
 181 ;;; Con:
 182 ;;;   * You get a different SBCL depending on what your cross-compilation
 183 ;;;     host is.
  184 ;;; So far the pros and cons seem to be mostly academic, since
 185 ;;; AFAIK (WHN 2001-08-28) the propagate-foo-type optimizations aren't
 186 ;;; actually important in compiling SBCL itself. If this changes, then
 187 ;;; we have to decide:
 188 ;;;   * Go for simplicity, leaving things as they are.
 189 ;;;   * Go for performance at the expense of conceptual clarity,
 190 ;;;     using #+(OR SBCL SB-XC) and otherwise leaving the build
 191 ;;;     process as is.
 192 ;;;   * Go for performance at the expense of build time, using
 193 ;;;     #+(OR SBCL SB-XC) and also making SBCL do not just
 194 ;;;     make-host-1.sh and make-host-2.sh, but a third step
 195 ;;;     make-host-3.sh where it builds itself under itself. (Such a
 196 ;;;     3-step build process could also help with other things, e.g.
 197 ;;;     using specialized arrays to represent debug information.)
 198 ;;;   * Rewrite the code so that it doesn't depend on unportable
 199 ;;;     floating point infinities.
 200
 201 ;;; optimizers for SCALE-FLOAT. If the float has bounds, new bounds
 202 ;;; are computed for the result, if possible.
 203 #-sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
 204 (progn
 205
 206 (defun scale-float-derive-type-aux (f ex same-arg)
 207   (declare (ignore same-arg))
 208   (flet ((scale-bound (x n)
 209            ;; We need to be a bit careful here and catch any overflows
 210            ;; that might occur. We can ignore underflows which become
 211            ;; zeros.
 212            (set-bound
 213             (handler-case
 214              (scale-float (type-bound-number x) n)
 215              (floating-point-overflow ()
 216                 nil))
 217             (consp x))))
 218     (when (and (numeric-type-p f) (numeric-type-p ex))
 219       (let ((f-lo (numeric-type-low f))
 220             (f-hi (numeric-type-high f))
 221             (ex-lo (numeric-type-low ex))
 222             (ex-hi (numeric-type-high ex))
 223             (new-lo nil)
 224             (new-hi nil))
 225         (when (and f-hi ex-hi)
 226           (setf new-hi (scale-bound f-hi ex-hi)))
 227         (when (and f-lo ex-lo)
 228           (setf new-lo (scale-bound f-lo ex-lo)))
 229         (make-numeric-type :class (numeric-type-class f)
 230                            :format (numeric-type-format f)
 231                            :complexp :real
 232                            :low new-lo
 233                            :high new-hi)))))
 234 (defoptimizer (scale-single-float derive-type) ((f ex))
 235   (two-arg-derive-type f ex #'scale-float-derive-type-aux
 236                        #'scale-single-float t))
 237 (defoptimizer (scale-double-float derive-type) ((f ex))
 238   (two-arg-derive-type f ex #'scale-float-derive-type-aux
 239                        #'scale-double-float t))
 240
 241 ;;; DEFOPTIMIZERs for %SINGLE-FLOAT and %DOUBLE-FLOAT. This makes the
 242 ;;; FLOAT function return the correct ranges if the input has some
 243 ;;; defined range. Quite useful if we want to convert some type of
 244 ;;; bounded integer into a float.
 245 (macrolet
 246     ((frob (fun type)
 247        (let ((aux-name (symbolicate fun "-DERIVE-TYPE-AUX")))
 248          `(progn
 249            (defun ,aux-name (num)
 250              ;; When converting a number to a float, the limits are
 251              ;; the same.
 252              (let* ((lo (bound-func (lambda (x)
 253                                       (coerce x ',type))
 254                                     (numeric-type-low num)))
 255                     (hi (bound-func (lambda (x)
 256                                       (coerce x ',type))
 257                                     (numeric-type-high num))))
 258                (specifier-type `(,',type ,(or lo '*) ,(or hi '*)))))
 259
 260            (defoptimizer (,fun derive-type) ((num))
 261              (one-arg-derive-type num #',aux-name #',fun))))))
 262   (frob %single-float single-float)
 263   (frob %double-float double-float))
 264 ) ; PROGN
 265 \f
 266 ;;;; float contagion
 267
 268 ;;; Do some stuff to recognize when the loser is doing mixed float and
 269 ;;; rational arithmetic, or different float types, and fix it up. If
 270 ;;; we don't, he won't even get so much as an efficiency note.
 271 (deftransform float-contagion-arg1 ((x y) * * :defun-only t :node node)
 272   `(,(continuation-fun-name (basic-combination-fun node))
 273     (float x y) y))
 274 (deftransform float-contagion-arg2 ((x y) * * :defun-only t :node node)
 275   `(,(continuation-fun-name (basic-combination-fun node))
 276     x (float y x)))
 277
 278 (dolist (x '(+ * / -))
 279   (%deftransform x '(function (rational float) *) #'float-contagion-arg1)
 280   (%deftransform x '(function (float rational) *) #'float-contagion-arg2))
 281
 282 (dolist (x '(= < > + * / -))
 283   (%deftransform x '(function (single-float double-float) *)
 284                  #'float-contagion-arg1)
 285   (%deftransform x '(function (double-float single-float) *)
 286                  #'float-contagion-arg2))
 287
 288 ;;; Prevent ZEROP, PLUSP, and MINUSP from losing horribly. We can't in
 289 ;;; general float rational args to comparison, since Common Lisp
 290 ;;; semantics says we are supposed to compare as rationals, but we can
 291 ;;; do it for any rational that has a precise representation as a
 292 ;;; float (such as 0).
 293 (macrolet ((frob (op)
 294              `(deftransform ,op ((x y) (float rational) *)
 295                 "open-code FLOAT to RATIONAL comparison"
 296                 (unless (constant-continuation-p y)
 297                   (give-up-ir1-transform
 298                    "The RATIONAL value isn't known at compile time."))
 299                 (let ((val (continuation-value y)))
 300                   (unless (eql (rational (float val)) val)
 301                     (give-up-ir1-transform
 302                      "~S doesn't have a precise float representation."
 303                      val)))
 304                 `(,',op x (float y x)))))
 305   (frob <)
 306   (frob >)
 307   (frob =))
 308 \f
 309 ;;;; irrational derive-type methods
 310
 311 ;;; Derive the result to be float for argument types in the
 312 ;;; appropriate domain.
 313 #+sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
 314 (dolist (stuff '((asin (real -1.0 1.0))
 315                  (acos (real -1.0 1.0))
 316                  (acosh (real 1.0))
 317                  (atanh (real -1.0 1.0))
 318                  (sqrt (real 0.0))))
 319   (destructuring-bind (name type) stuff
 320     (let ((type (specifier-type type)))
 321       (setf (fun-info-derive-type (fun-info-or-lose name))
 322             (lambda (call)
 323               (declare (type combination call))
 324               (when (csubtypep (continuation-type
 325                                 (first (combination-args call)))
 326                                type)
 327                 (specifier-type 'float)))))))
 328
 329 #+sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
 330 (defoptimizer (log derive-type) ((x &optional y))
 331   (when (and (csubtypep (continuation-type x)
 332                         (specifier-type '(real 0.0)))
 333              (or (null y)
 334                  (csubtypep (continuation-type y)
 335                             (specifier-type '(real 0.0)))))
 336     (specifier-type 'float)))
 337 \f
 338 ;;;; irrational transforms
 339
 340 (defknown (%tan %sinh %asinh %atanh %log %logb %log10 %tan-quick)
 341           (double-float) double-float
 342   (movable foldable flushable))
 343
 344 (defknown (%sin %cos %tanh %sin-quick %cos-quick)
 345   (double-float) (double-float -1.0d0 1.0d0)
 346   (movable foldable flushable))
 347
 348 (defknown (%asin %atan)
 349   (double-float)
 350   (double-float #.(coerce (- (/ pi 2)) 'double-float)
 351                 #.(coerce (/ pi 2) 'double-float))
 352   (movable foldable flushable))
 353
 354 (defknown (%acos)
 355   (double-float) (double-float 0.0d0 #.(coerce pi 'double-float))
 356   (movable foldable flushable))
 357
 358 (defknown (%cosh)
 359   (double-float) (double-float 1.0d0)
 360   (movable foldable flushable))
 361
 362 (defknown (%acosh %exp %sqrt)
 363   (double-float) (double-float 0.0d0)
 364   (movable foldable flushable))
 365
 366 (defknown %expm1
 367   (double-float) (double-float -1d0)
 368   (movable foldable flushable))
 369
 370 (defknown (%hypot)
 371   (double-float double-float) (double-float 0d0)
 372   (movable foldable flushable))
 373
 374 (defknown (%pow)
 375   (double-float double-float) double-float
 376   (movable foldable flushable))
 377
 378 (defknown (%atan2)
 379   (double-float double-float)
 380   (double-float #.(coerce (- pi) 'double-float)
 381                 #.(coerce pi 'double-float))
 382   (movable foldable flushable))
 383
 384 (defknown (%scalb)
 385   (double-float double-float) double-float
 386   (movable foldable flushable))
 387
 388 (defknown (%scalbn)
 389   (double-float (signed-byte 32)) double-float
 390   (movable foldable flushable))
 391
 392 (defknown (%log1p)
 393   (double-float) double-float
 394   (movable foldable flushable))
 395
 396 (macrolet ((def (name prim rtype)
 397              `(progn
 398                (deftransform ,name ((x) (single-float) ,rtype)
 399                  `(coerce (,',prim (coerce x 'double-float)) 'single-float))
 400                (deftransform ,name ((x) (double-float) ,rtype)
 401                  `(,',prim x)))))
 402   (def exp %exp *)
 403   (def log %log float)
 404   (def sqrt %sqrt float)
 405   (def asin %asin float)
 406   (def acos %acos float)
 407   (def atan %atan *)
 408   (def sinh %sinh *)
 409   (def cosh %cosh *)
 410   (def tanh %tanh *)
 411   (def asinh %asinh *)
 412   (def acosh %acosh float)
 413   (def atanh %atanh float))
 414
 415 ;;; The argument range is limited on the x86 FP trig. functions. A
 416 ;;; post-test can detect a failure (and load a suitable result), but
 417 ;;; this test is avoided if possible.
 418 (macrolet ((def (name prim prim-quick)
 419              (declare (ignorable prim-quick))
 420              `(progn
 421                 (deftransform ,name ((x) (single-float) *)
 422                   #!+x86 (cond ((csubtypep (continuation-type x)
 423                                            (specifier-type '(single-float
 424                                                              (#.(- (expt 2f0 64)))
 425                                                              (#.(expt 2f0 64)))))
 426                                 `(coerce (,',prim-quick (coerce x 'double-float))
 427                                   'single-float))
 428                                (t
 429                                 (compiler-note
 430                                  "unable to avoid inline argument range check~@
 431                                   because the argument range (~S) was not within 2^64"
 432                                  (type-specifier (continuation-type x)))
 433                                 `(coerce (,',prim (coerce x 'double-float)) 'single-float)))
 434                   #!-x86 `(coerce (,',prim (coerce x 'double-float)) 'single-float))
 435                (deftransform ,name ((x) (double-float) *)
 436                  #!+x86 (cond ((csubtypep (continuation-type x)
 437                                           (specifier-type '(double-float
 438                                                             (#.(- (expt 2d0 64)))
 439                                                             (#.(expt 2d0 64)))))
 440                                `(,',prim-quick x))
 441                               (t
 442                                (compiler-note
 443                                 "unable to avoid inline argument range check~@
 444                                  because the argument range (~S) was not within 2^64"
 445                                 (type-specifier (continuation-type x)))
 446                                `(,',prim x)))
 447                  #!-x86 `(,',prim x)))))
 448   (def sin %sin %sin-quick)
 449   (def cos %cos %cos-quick)
 450   (def tan %tan %tan-quick))
 451
 452 (deftransform atan ((x y) (single-float single-float) *)
 453   `(coerce (%atan2 (coerce x 'double-float) (coerce y 'double-float))
 454     'single-float))
 455 (deftransform atan ((x y) (double-float double-float) *)
 456   `(%atan2 x y))
 457
 458 (deftransform expt ((x y) ((single-float 0f0) single-float) *)
 459   `(coerce (%pow (coerce x 'double-float) (coerce y 'double-float))
 460     'single-float))
 461 (deftransform expt ((x y) ((double-float 0d0) double-float) *)
 462   `(%pow x y))
 463 (deftransform expt ((x y) ((single-float 0f0) (signed-byte 32)) *)
 464   `(coerce (%pow (coerce x 'double-float) (coerce y 'double-float))
 465     'single-float))
 466 (deftransform expt ((x y) ((double-float 0d0) (signed-byte 32)) *)
 467   `(%pow x (coerce y 'double-float)))
 468
 469 ;;; ANSI says log with base zero returns zero.
 470 (deftransform log ((x y) (float float) float)
 471   '(if (zerop y) y (/ (log x) (log y))))
 472 \f
 473 ;;; Handle some simple transformations.
 474
 475 (deftransform abs ((x) ((complex double-float)) double-float)
 476   '(%hypot (realpart x) (imagpart x)))
 477
 478 (deftransform abs ((x) ((complex single-float)) single-float)
 479   '(coerce (%hypot (coerce (realpart x) 'double-float)
 480                    (coerce (imagpart x) 'double-float))
 481           'single-float))
 482
 483 (deftransform phase ((x) ((complex double-float)) double-float)
 484   '(%atan2 (imagpart x) (realpart x)))
 485
 486 (deftransform phase ((x) ((complex single-float)) single-float)
 487   '(coerce (%atan2 (coerce (imagpart x) 'double-float)
 488                    (coerce (realpart x) 'double-float))
 489           'single-float))
 490
 491 (deftransform phase ((x) ((float)) float)
 492   '(if (minusp (float-sign x))
 493        (float pi x)
 494        (float 0 x)))
 495
 496 ;;; The number is of type REAL.
 497 (defun numeric-type-real-p (type)
 498   (and (numeric-type-p type)
 499        (eq (numeric-type-complexp type) :real)))
 500
 501 ;;; Coerce a numeric type bound to the given type while handling
 502 ;;; exclusive bounds.
 503 (defun coerce-numeric-bound (bound type)
 504   (when bound
 505     (if (consp bound)
 506         (list (coerce (car bound) type))
 507         (coerce bound type))))
 508
 509 #-sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
 510 (progn
 511
 512 ;;;; optimizers for elementary functions
 513 ;;;;
 514 ;;;; These optimizers compute the output range of the elementary
 515 ;;;; function, based on the domain of the input.
 516
 517 ;;; Generate a specifier for a complex type specialized to the same
 518 ;;; type as the argument.
 519 (defun complex-float-type (arg)
 520   (declare (type numeric-type arg))
 521   (let* ((format (case (numeric-type-class arg)
 522                    ((integer rational) 'single-float)
 523                    (t (numeric-type-format arg))))
 524          (float-type (or format 'float)))
 525     (specifier-type `(complex ,float-type))))
 526
 527 ;;; Compute a specifier like '(OR FLOAT (COMPLEX FLOAT)), except float
 528 ;;; should be the right kind of float. Allow bounds for the float
 529 ;;; part too.
 530 (defun float-or-complex-float-type (arg &optional lo hi)
 531   (declare (type numeric-type arg))
 532   (let* ((format (case (numeric-type-class arg)
 533                    ((integer rational) 'single-float)
 534                    (t (numeric-type-format arg))))
 535          (float-type (or format 'float))
 536          (lo (coerce-numeric-bound lo float-type))
 537          (hi (coerce-numeric-bound hi float-type)))
 538     (specifier-type `(or (,float-type ,(or lo '*) ,(or hi '*))
 539                          (complex ,float-type)))))
 540
 541 ;;; Test whether the numeric-type ARG is within in domain specified by
 542 ;;; DOMAIN-LOW and DOMAIN-HIGH, consider negative and positive zero to
 543 ;;; be distinct.
 544 (defun domain-subtypep (arg domain-low domain-high)
 545   (declare (type numeric-type arg)
 546            (type (or real null) domain-low domain-high))
 547   (let* ((arg-lo (numeric-type-low arg))
 548          (arg-lo-val (type-bound-number arg-lo))
 549          (arg-hi (numeric-type-high arg))
 550          (arg-hi-val (type-bound-number arg-hi)))
 551     ;; Check that the ARG bounds are correctly canonicalized.
 552     (when (and arg-lo (floatp arg-lo-val) (zerop arg-lo-val) (consp arg-lo)
 553                (minusp (float-sign arg-lo-val)))
 554       (compiler-note "float zero bound ~S not correctly canonicalized?" arg-lo)
 555       (setq arg-lo '(0l0) arg-lo-val 0l0))
 556     (when (and arg-hi (zerop arg-hi-val) (floatp arg-hi-val) (consp arg-hi)
 557                (plusp (float-sign arg-hi-val)))
 558       (compiler-note "float zero bound ~S not correctly canonicalized?" arg-hi)
 559       (setq arg-hi '(-0l0) arg-hi-val -0l0))
 560     (and (or (null domain-low)
 561              (and arg-lo (>= arg-lo-val domain-low)
 562                   (not (and (zerop domain-low) (floatp domain-low)
 563                             (plusp (float-sign domain-low))
 564                             (zerop arg-lo-val) (floatp arg-lo-val)
 565                             (if (consp arg-lo)
 566                                 (plusp (float-sign arg-lo-val))
 567                                 (minusp (float-sign arg-lo-val)))))))
 568          (or (null domain-high)
 569              (and arg-hi (<= arg-hi-val domain-high)
 570                   (not (and (zerop domain-high) (floatp domain-high)
 571                             (minusp (float-sign domain-high))
 572                             (zerop arg-hi-val) (floatp arg-hi-val)
 573                             (if (consp arg-hi)
 574                                 (minusp (float-sign arg-hi-val))
 575                                 (plusp (float-sign arg-hi-val))))))))))
 576
 577 ;;; Handle monotonic functions of a single variable whose domain is
 578 ;;; possibly part of the real line. ARG is the variable, FCN is the
 579 ;;; function, and DOMAIN is a specifier that gives the (real) domain
 580 ;;; of the function. If ARG is a subset of the DOMAIN, we compute the
 581 ;;; bounds directly. Otherwise, we compute the bounds for the
 582 ;;; intersection between ARG and DOMAIN, and then append a complex
 583 ;;; result, which occurs for the parts of ARG not in the DOMAIN.
 584 ;;;
 585 ;;; Negative and positive zero are considered distinct within
 586 ;;; DOMAIN-LOW and DOMAIN-HIGH.
 587 ;;;
 588 ;;; DEFAULT-LOW and DEFAULT-HIGH are the lower and upper bounds if we
 589 ;;; can't compute the bounds using FCN.
 590 (defun elfun-derive-type-simple (arg fcn domain-low domain-high
 591                                      default-low default-high
 592                                      &optional (increasingp t))
 593   (declare (type (or null real) domain-low domain-high))
 594   (etypecase arg
 595     (numeric-type
 596      (cond ((eq (numeric-type-complexp arg) :complex)
 597             (make-numeric-type :class (numeric-type-class arg)
 598                                :format (numeric-type-format arg)
 599                                :complexp :complex))
 600            ((numeric-type-real-p arg)
 601             ;; The argument is real, so let's find the intersection
 602             ;; between the argument and the domain of the function.
 603             ;; We compute the bounds on the intersection, and for
 604             ;; everything else, we return a complex number of the
 605             ;; appropriate type.
 606             (multiple-value-bind (intersection difference)
 607                 (interval-intersection/difference (numeric-type->interval arg)
 608                                                   (make-interval
 609                                                    :low domain-low
 610                                                    :high domain-high))
 611               (cond
 612                 (intersection
 613                  ;; Process the intersection.
 614                  (let* ((low (interval-low intersection))
 615                         (high (interval-high intersection))
 616                         (res-lo (or (bound-func fcn (if increasingp low high))
 617                                     default-low))
 618                         (res-hi (or (bound-func fcn (if increasingp high low))
 619                                     default-high))
 620                         (format (case (numeric-type-class arg)
 621                                   ((integer rational) 'single-float)
 622                                   (t (numeric-type-format arg))))
 623                         (bound-type (or format 'float))
 624                         (result-type
 625                          (make-numeric-type
 626                           :class 'float
 627                           :format format
 628                           :low (coerce-numeric-bound res-lo bound-type)
 629                           :high (coerce-numeric-bound res-hi bound-type))))
 630                    ;; If the ARG is a subset of the domain, we don't
 631                    ;; have to worry about the difference, because that
 632                    ;; can't occur.
 633                    (if (or (null difference)
 634                            ;; Check whether the arg is within the domain.
 635                            (domain-subtypep arg domain-low domain-high))
 636                        result-type
 637                        (list result-type
 638                              (specifier-type `(complex ,bound-type))))))
 639                 (t
 640                  ;; No intersection so the result must be purely complex.
 641                  (complex-float-type arg)))))
 642            (t
 643             (float-or-complex-float-type arg default-low default-high))))))
 644
 645 (macrolet
 646     ((frob (name domain-low domain-high def-low-bnd def-high-bnd
 647                  &key (increasingp t))
 648        (let ((num (gensym)))
 649          `(defoptimizer (,name derive-type) ((,num))
 650            (one-arg-derive-type
 651             ,num
 652             (lambda (arg)
 653               (elfun-derive-type-simple arg #',name
 654                                         ,domain-low ,domain-high
 655                                         ,def-low-bnd ,def-high-bnd
 656                                         ,increasingp))
 657             #',name)))))
 658   ;; These functions are easy because they are defined for the whole
 659   ;; real line.
 660   (frob exp nil nil 0 nil)
 661   (frob sinh nil nil nil nil)
 662   (frob tanh nil nil -1 1)
 663   (frob asinh nil nil nil nil)
 664
 665   ;; These functions are only defined for part of the real line. The
 666   ;; condition selects the desired part of the line.
 667   (frob asin -1d0 1d0 (- (/ pi 2)) (/ pi 2))
 668   ;; Acos is monotonic decreasing, so we need to swap the function
 669   ;; values at the lower and upper bounds of the input domain.
 670   (frob acos -1d0 1d0 0 pi :increasingp nil)
 671   (frob acosh 1d0 nil nil nil)
 672   (frob atanh -1d0 1d0 -1 1)
 673   ;; Kahan says that (sqrt -0.0) is -0.0, so use a specifier that
 674   ;; includes -0.0.
 675   (frob sqrt -0d0 nil 0 nil))
 676
 677 ;;; Compute bounds for (expt x y). This should be easy since (expt x
 678 ;;; y) = (exp (* y (log x))). However, computations done this way
 679 ;;; have too much roundoff. Thus we have to do it the hard way.
 680 (defun safe-expt (x y)
 681   (handler-case
 682       (expt x y)
 683     (error ()
 684       nil)))
 685
 686 ;;; Handle the case when x >= 1.
 687 (defun interval-expt-> (x y)
 688   (case (sb!c::interval-range-info y 0d0)
 689     ('+
 690      ;; Y is positive and log X >= 0. The range of exp(y * log(x)) is
 691      ;; obviously non-negative. We just have to be careful for
 692      ;; infinite bounds (given by nil).
 693      (let ((lo (safe-expt (type-bound-number (sb!c::interval-low x))
 694                           (type-bound-number (sb!c::interval-low y))))
 695            (hi (safe-expt (type-bound-number (sb!c::interval-high x))
 696                           (type-bound-number (sb!c::interval-high y)))))
 697        (list (sb!c::make-interval :low (or lo 1) :high hi))))
 698     ('-
 699      ;; Y is negative and log x >= 0. The range of exp(y * log(x)) is
 700      ;; obviously [0, 1]. However, underflow (nil) means 0 is the
 701      ;; result.
 702      (let ((lo (safe-expt (type-bound-number (sb!c::interval-high x))
 703                           (type-bound-number (sb!c::interval-low y))))
 704            (hi (safe-expt (type-bound-number (sb!c::interval-low x))
 705                           (type-bound-number (sb!c::interval-high y)))))
 706        (list (sb!c::make-interval :low (or lo 0) :high (or hi 1)))))
 707     (t
 708      ;; Split the interval in half.
 709      (destructuring-bind (y- y+)
 710          (sb!c::interval-split 0 y t)
 711        (list (interval-expt-> x y-)
 712              (interval-expt-> x y+))))))
 713
 714 ;;; Handle the case when x <= 1
 715 (defun interval-expt-< (x y)
 716   (case (sb!c::interval-range-info x 0d0)
 717     ('+
 718      ;; The case of 0 <= x <= 1 is easy
 719      (case (sb!c::interval-range-info y)
 720        ('+
 721         ;; Y is positive and log X <= 0. The range of exp(y * log(x)) is
 722         ;; obviously [0, 1]. We just have to be careful for infinite bounds
 723         ;; (given by nil).
 724         (let ((lo (safe-expt (type-bound-number (sb!c::interval-low x))
 725                              (type-bound-number (sb!c::interval-high y))))
 726               (hi (safe-expt (type-bound-number (sb!c::interval-high x))
 727                              (type-bound-number (sb!c::interval-low y)))))
 728           (list (sb!c::make-interval :low (or lo 0) :high (or hi 1)))))
 729        ('-
 730         ;; Y is negative and log x <= 0. The range of exp(y * log(x)) is
 731         ;; obviously [1, inf].
 732         (let ((hi (safe-expt (type-bound-number (sb!c::interval-low x))
 733                              (type-bound-number (sb!c::interval-low y))))
 734               (lo (safe-expt (type-bound-number (sb!c::interval-high x))
 735                              (type-bound-number (sb!c::interval-high y)))))
 736           (list (sb!c::make-interval :low (or lo 1) :high hi))))
 737        (t
 738         ;; Split the interval in half
 739         (destructuring-bind (y- y+)
 740             (sb!c::interval-split 0 y t)
 741           (list (interval-expt-< x y-)
 742                 (interval-expt-< x y+))))))
 743     ('-
 744      ;; The case where x <= 0. Y MUST be an INTEGER for this to work!
 745      ;; The calling function must insure this! For now we'll just
 746      ;; return the appropriate unbounded float type.
 747      (list (sb!c::make-interval :low nil :high nil)))
 748     (t
 749      (destructuring-bind (neg pos)
 750          (interval-split 0 x t t)
 751        (list (interval-expt-< neg y)
 752              (interval-expt-< pos y))))))
 753
 754 ;;; Compute bounds for (expt x y).
 755 (defun interval-expt (x y)
 756   (case (interval-range-info x 1)
 757     ('+
 758      ;; X >= 1
 759          (interval-expt-> x y))
 760     ('-
 761      ;; X <= 1
 762      (interval-expt-< x y))
 763     (t
 764      (destructuring-bind (left right)
 765          (interval-split 1 x t t)
 766        (list (interval-expt left y)
 767              (interval-expt right y))))))
 768
 769 (defun fixup-interval-expt (bnd x-int y-int x-type y-type)
 770   (declare (ignore x-int))
 771   ;; Figure out what the return type should be, given the argument
 772   ;; types and bounds and the result type and bounds.
 773   (cond ((csubtypep x-type (specifier-type 'integer))
 774          ;; an integer to some power
 775          (case (numeric-type-class y-type)
 776            (integer
 777             ;; Positive integer to an integer power is either an
 778             ;; integer or a rational.
 779             (let ((lo (or (interval-low bnd) '*))
 780                   (hi (or (interval-high bnd) '*)))
 781               (if (and (interval-low y-int)
 782                        (>= (type-bound-number (interval-low y-int)) 0))
 783                   (specifier-type `(integer ,lo ,hi))
 784                   (specifier-type `(rational ,lo ,hi)))))
 785            (rational
 786             ;; Positive integer to rational power is either a rational
 787             ;; or a single-float.
 788             (let* ((lo (interval-low bnd))
 789                    (hi (interval-high bnd))
 790                    (int-lo (if lo
 791                                (floor (type-bound-number lo))
 792                                '*))
 793                    (int-hi (if hi
 794                                (ceiling (type-bound-number hi))
 795                                '*))
 796                    (f-lo (if lo
 797                              (bound-func #'float lo)
 798                              '*))
 799                    (f-hi (if hi
 800                              (bound-func #'float hi)
 801                              '*)))
 802               (specifier-type `(or (rational ,int-lo ,int-hi)
 803                                 (single-float ,f-lo, f-hi)))))
 804            (float
 805             ;; A positive integer to a float power is a float.
 806             (modified-numeric-type y-type
 807                                    :low (interval-low bnd)
 808                                    :high (interval-high bnd)))
 809            (t
 810             ;; A positive integer to a number is a number (for now).
 811             (specifier-type 'number))))
 812         ((csubtypep x-type (specifier-type 'rational))
 813          ;; a rational to some power
 814          (case (numeric-type-class y-type)
 815            (integer
 816             ;; A positive rational to an integer power is always a rational.
 817             (specifier-type `(rational ,(or (interval-low bnd) '*)
 818                                        ,(or (interval-high bnd) '*))))
 819            (rational
 820             ;; A positive rational to rational power is either a rational
 821             ;; or a single-float.
 822             (let* ((lo (interval-low bnd))
 823                    (hi (interval-high bnd))
 824                    (int-lo (if lo
 825                                (floor (type-bound-number lo))
 826                                '*))
 827                    (int-hi (if hi
 828                                (ceiling (type-bound-number hi))
 829                                '*))
 830                    (f-lo (if lo
 831                              (bound-func #'float lo)
 832                              '*))
 833                    (f-hi (if hi
 834                              (bound-func #'float hi)
 835                              '*)))
 836               (specifier-type `(or (rational ,int-lo ,int-hi)
 837                                 (single-float ,f-lo, f-hi)))))
 838            (float
 839             ;; A positive rational to a float power is a float.
 840             (modified-numeric-type y-type
 841                                    :low (interval-low bnd)
 842                                    :high (interval-high bnd)))
 843            (t
 844             ;; A positive rational to a number is a number (for now).
 845             (specifier-type 'number))))
 846         ((csubtypep x-type (specifier-type 'float))
 847          ;; a float to some power
 848          (case (numeric-type-class y-type)
 849            ((or integer rational)
 850             ;; A positive float to an integer or rational power is
 851             ;; always a float.
 852             (make-numeric-type
 853              :class 'float
 854              :format (numeric-type-format x-type)
 855              :low (interval-low bnd)
 856              :high (interval-high bnd)))
 857            (float
 858             ;; A positive float to a float power is a float of the
 859             ;; higher type.
 860             (make-numeric-type
 861              :class 'float
 862              :format (float-format-max (numeric-type-format x-type)
 863                                        (numeric-type-format y-type))
 864              :low (interval-low bnd)
 865              :high (interval-high bnd)))
 866            (t
 867             ;; A positive float to a number is a number (for now)
 868             (specifier-type 'number))))
 869         (t
 870          ;; A number to some power is a number.
 871          (specifier-type 'number))))
 872
 873 (defun merged-interval-expt (x y)
 874   (let* ((x-int (numeric-type->interval x))
 875          (y-int (numeric-type->interval y)))
 876     (mapcar (lambda (type)
 877               (fixup-interval-expt type x-int y-int x y))
 878             (flatten-list (interval-expt x-int y-int)))))
 879
 880 (defun expt-derive-type-aux (x y same-arg)
 881   (declare (ignore same-arg))
 882   (cond ((or (not (numeric-type-real-p x))
 883              (not (numeric-type-real-p y)))
 884          ;; Use numeric contagion if either is not real.
 885          (numeric-contagion x y))
 886         ((csubtypep y (specifier-type 'integer))
 887          ;; A real raised to an integer power is well-defined.
 888          (merged-interval-expt x y))
 889         (t
 890          ;; A real raised to a non-integral power can be a float or a
 891          ;; complex number.
 892          (cond ((or (csubtypep x (specifier-type '(rational 0)))
 893                     (csubtypep x (specifier-type '(float (0d0)))))
 894                 ;; But a positive real to any power is well-defined.
 895                 (merged-interval-expt x y))
 896                (t
 897                 ;; a real to some power. The result could be a real
 898                 ;; or a complex.
 899                 (float-or-complex-float-type (numeric-contagion x y)))))))
 900
 901 (defoptimizer (expt derive-type) ((x y))
 902   (two-arg-derive-type x y #'expt-derive-type-aux #'expt))
 903
 904 ;;; Note we must assume that a type including 0.0 may also include
 905 ;;; -0.0 and thus the result may be complex -infinity + i*pi.
 906 (defun log-derive-type-aux-1 (x)
 907   (elfun-derive-type-simple x #'log 0d0 nil nil nil))
 908
 909 (defun log-derive-type-aux-2 (x y same-arg)
 910   (let ((log-x (log-derive-type-aux-1 x))
 911         (log-y (log-derive-type-aux-1 y))
 912         (accumulated-list nil))
 913     ;; LOG-X or LOG-Y might be union types. We need to run through
 914     ;; the union types ourselves because /-DERIVE-TYPE-AUX doesn't.
 915     (dolist (x-type (prepare-arg-for-derive-type log-x))
 916       (dolist (y-type (prepare-arg-for-derive-type log-y))
 917         (push (/-derive-type-aux x-type y-type same-arg) accumulated-list)))
 918     (apply #'type-union (flatten-list accumulated-list))))
 919
 920 (defoptimizer (log derive-type) ((x &optional y))
 921   (if y
 922       (two-arg-derive-type x y #'log-derive-type-aux-2 #'log)
 923       (one-arg-derive-type x #'log-derive-type-aux-1 #'log)))
 924
 925 (defun atan-derive-type-aux-1 (y)
 926   (elfun-derive-type-simple y #'atan nil nil (- (/ pi 2)) (/ pi 2)))
 927
 928 (defun atan-derive-type-aux-2 (y x same-arg)
 929   (declare (ignore same-arg))
 930   ;; The hard case with two args. We just return the max bounds.
 931   (let ((result-type (numeric-contagion y x)))
 932     (cond ((and (numeric-type-real-p x)
 933                 (numeric-type-real-p y))
 934            (let* (;; FIXME: This expression for FORMAT seems to
 935                   ;; appear multiple times, and should be factored out.
 936                   (format (case (numeric-type-class result-type)
 937                             ((integer rational) 'single-float)
 938                             (t (numeric-type-format result-type))))
 939                   (bound-format (or format 'float)))
 940              (make-numeric-type :class 'float
 941                                 :format format
 942                                 :complexp :real
 943                                 :low (coerce (- pi) bound-format)
 944                                 :high (coerce pi bound-format))))
 945           (t
 946            ;; The result is a float or a complex number
 947            (float-or-complex-float-type result-type)))))
 948
 949 (defoptimizer (atan derive-type) ((y &optional x))
 950   (if x
 951       (two-arg-derive-type y x #'atan-derive-type-aux-2 #'atan)
 952       (one-arg-derive-type y #'atan-derive-type-aux-1 #'atan)))
 953
 954 (defun cosh-derive-type-aux (x)
 955   ;; We note that cosh x = cosh |x| for all real x.
 956   (elfun-derive-type-simple
 957    (if (numeric-type-real-p x)
 958        (abs-derive-type-aux x)
 959        x)
 960    #'cosh nil nil 0 nil))
 961
 962 (defoptimizer (cosh derive-type) ((num))
 963   (one-arg-derive-type num #'cosh-derive-type-aux #'cosh))
 964
 965 (defun phase-derive-type-aux (arg)
 966   (let* ((format (case (numeric-type-class arg)
 967                    ((integer rational) 'single-float)
 968                    (t (numeric-type-format arg))))
 969          (bound-type (or format 'float)))
 970     (cond ((numeric-type-real-p arg)
 971            (case (interval-range-info (numeric-type->interval arg) 0.0)
 972              ('+
 973               ;; The number is positive, so the phase is 0.
 974               (make-numeric-type :class 'float
 975                                  :format format
 976                                  :complexp :real
 977                                  :low (coerce 0 bound-type)
 978                                  :high (coerce 0 bound-type)))
 979              ('-
 980               ;; The number is always negative, so the phase is pi.
 981               (make-numeric-type :class 'float
 982                                  :format format
 983                                  :complexp :real
 984                                  :low (coerce pi bound-type)
 985                                  :high (coerce pi bound-type)))
 986              (t
 987               ;; We can't tell. The result is 0 or pi. Use a union
 988               ;; type for this.
 989               (list
 990                (make-numeric-type :class 'float
 991                                   :format format
 992                                   :complexp :real
 993                                   :low (coerce 0 bound-type)
 994                                   :high (coerce 0 bound-type))
 995                (make-numeric-type :class 'float
 996                                   :format format
 997                                   :complexp :real
 998                                   :low (coerce pi bound-type)
 999                                   :high (coerce pi bound-type))))))
1000           (t
1001            ;; We have a complex number. The answer is the range -pi
1002            ;; to pi. (-pi is included because we have -0.)
1003            (make-numeric-type :class 'float
1004                               :format format
1005                               :complexp :real
1006                               :low (coerce (- pi) bound-type)
1007                               :high (coerce pi bound-type))))))
1008
;;; Type derivation for PHASE, delegating to PHASE-DERIVE-TYPE-AUX.
(defoptimizer (phase derive-type) ((arg))
  (one-arg-derive-type arg
                       #'phase-derive-type-aux
                       #'phase))
1011
1012 ) ; PROGN
1013
;;; REALPART of a (COMPLEX RATIONAL) becomes a direct call to
;;; SB!KERNEL:%REALPART.
(deftransform realpart ((z) ((complex rational)) *)
  '(sb!kernel:%realpart z))
;;; IMAGPART of a (COMPLEX RATIONAL) becomes a direct call to
;;; SB!KERNEL:%IMAGPART.
(deftransform imagpart ((z) ((complex rational)) *)
  '(sb!kernel:%imagpart z))
1018
1019 ;;; Make REALPART and IMAGPART return the appropriate types. This
1020 ;;; should help a lot in optimized code.
(defun realpart-derive-type-aux (type)
  ;; The realpart of a real has the same type and range as the input.
  ;; For a complex number the result has the same class, format and
  ;; bounds as well, except that it's real, not complex. Both cases
  ;; therefore build exactly the same type, so no test on the
  ;; complexness of TYPE is needed.
  (make-numeric-type :class (numeric-type-class type)
                     :format (numeric-type-format type)
                     :complexp :real
                     :low (numeric-type-low type)
                     :high (numeric-type-high type)))
;;; Type derivation for REALPART, delegating to
;;; REALPART-DERIVE-TYPE-AUX. Not defined on the cross-compilation
;;; host.
#-sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
(defoptimizer (realpart derive-type) ((z))
  (one-arg-derive-type z
                       #'realpart-derive-type-aux
                       #'realpart))
;;; Derive the type of (imagpart x) for the numeric type TYPE. The
;;; result always has the class and format of TYPE and is real.
(defun imagpart-derive-type-aux (type)
  (let ((class (numeric-type-class type))
        (format (numeric-type-format type)))
    (multiple-value-bind (low high)
        (if (numeric-type-real-p type)
            ;; The imagpart of a real has the same type as the input,
            ;; except that it's zero. The zero is coerced to the
            ;; format, else the class, else plain REAL.
            (let ((zero (coerce 0 (or format class 'real))))
              (values zero zero))
            ;; We have a complex number. The result has the same type
            ;; as the imaginary part, except that it's real, not
            ;; complex, obviously.
            (values (numeric-type-low type)
                    (numeric-type-high type)))
      (make-numeric-type :class class
                         :format format
                         :complexp :real
                         :low low
                         :high high))))
;;; Type derivation for IMAGPART, delegating to
;;; IMAGPART-DERIVE-TYPE-AUX. Not defined on the cross-compilation
;;; host.
#-sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
(defoptimizer (imagpart derive-type) ((z))
  (one-arg-derive-type z
                       #'imagpart-derive-type-aux
                       #'imagpart))
1068
;;; Derive the type of the one-argument (complex re) for the type
;;; RE-TYPE.
(defun complex-derive-type-aux-1 (re-type)
  (cond ((not (numeric-type-p re-type))
         ;; Nothing more specific is known.
         (specifier-type 'complex))
        (t
         ;; Same class, format and bounds as the argument. The result
         ;; is marked real when the argument type is a subtype of
         ;; RATIONAL, and complex otherwise.
         (let ((complexp (if (csubtypep re-type (specifier-type 'rational))
                             :real
                             :complex)))
           (make-numeric-type :class (numeric-type-class re-type)
                              :format (numeric-type-format re-type)
                              :complexp complexp
                              :low (numeric-type-low re-type)
                              :high (numeric-type-high re-type))))))
1080
;;; Derive the type of the two-argument (complex re im) for the types
;;; RE-TYPE and IM-TYPE. SAME-ARG is ignored.
(defun complex-derive-type-aux-2 (re-type im-type same-arg)
  (declare (ignore same-arg))
  (if (and (numeric-type-p re-type)
           (numeric-type-p im-type))
      ;; Need to check to make sure numeric-contagion returns the
      ;; right type for what we want here.

      ;; Also, what about rational canonicalization, like (complex 5 0)
      ;; is 5?  So, if the result must be complex, we make it so.
      ;; If the result might be complex, which happens only if the
      ;; arguments are rational, we make it a union type of (or
      ;; rational (complex rational)).
      (let ((element-type (numeric-contagion re-type im-type)))
        (if (csubtypep element-type (specifier-type 'rational))
            (type-union element-type
                        (specifier-type
                         `(complex ,(numeric-type-class element-type))))
            ;; Not rational, so the result is always complex. No
            ;; further test is needed in this branch.
            (make-numeric-type :class (numeric-type-class element-type)
                               :format (numeric-type-format element-type)
                               :complexp :complex)))
      (specifier-type 'complex)))
1106
;;; Type derivation for COMPLEX: pick the one- or two-argument worker
;;; depending on whether the imaginary part was supplied. Not defined
;;; on the cross-compilation host.
#-sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
(defoptimizer (complex derive-type) ((realpart &optional imagpart))
  (cond (imagpart
         (two-arg-derive-type realpart imagpart
                              #'complex-derive-type-aux-2 #'complex))
        (t
         (one-arg-derive-type realpart
                              #'complex-derive-type-aux-1 #'complex))))
1112
1113 ;;; Define some transforms for complex operations. We do this in lieu
1114 ;;; of complex operation VOPs.
;; FROB defines, for one float component TYPE, the source transforms
;; that open-code arithmetic and comparison on (COMPLEX TYPE) values in
;; terms of REALPART, IMAGPART and COMPLEX. It is instantiated below
;; for SINGLE-FLOAT and DOUBLE-FLOAT.
(macrolet ((frob (type)
             `(progn
               ;; negation
               (deftransform %negate ((z) ((complex ,type)) *)
                 '(complex (%negate (realpart z)) (%negate (imagpart z))))
               ;; complex addition and subtraction
               (deftransform + ((w z) ((complex ,type) (complex ,type)) *)
                 '(complex (+ (realpart w) (realpart z))
                           (+ (imagpart w) (imagpart z))))
               (deftransform - ((w z) ((complex ,type) (complex ,type)) *)
                 '(complex (- (realpart w) (realpart z))
                           (- (imagpart w) (imagpart z))))
               ;; Add a complex and a real, in either argument order.
               (deftransform + ((w z) ((complex ,type) real) *)
                 '(complex (+ (realpart w) z) (imagpart w)))
               (deftransform + ((z w) (real (complex ,type)) *)
                 '(complex (+ (realpart w) z) (imagpart w)))
               ;; Subtract a real from a complex, and a complex from a
               ;; real (the latter negates the imaginary part).
               (deftransform - ((w z) ((complex ,type) real) *)
                 '(complex (- (realpart w) z) (imagpart w)))
               (deftransform - ((z w) (real (complex ,type)) *)
                 '(complex (- z (realpart w)) (- (imagpart w))))
               ;; Multiply and divide two complex numbers.
               (deftransform * ((x y) ((complex ,type) (complex ,type)) *)
                 '(let* ((rx (realpart x))
                         (ix (imagpart x))
                         (ry (realpart y))
                         (iy (imagpart y)))
                    (complex (- (* rx ry) (* ix iy))
                             (+ (* rx iy) (* ix ry)))))
               ;; The division scales by the ratio R of the smaller to
               ;; the larger (in magnitude) component of the divisor Y,
               ;; so the common denominator DN is computed as
               ;; larger * (1 + R*R) rather than ry*ry + iy*iy.
               (deftransform / ((x y) ((complex ,type) (complex ,type)) *)
                 '(let* ((rx (realpart x))
                         (ix (imagpart x))
                         (ry (realpart y))
                         (iy (imagpart y)))
                    (if (> (abs ry) (abs iy))
                        (let* ((r (/ iy ry))
                               (dn (* ry (+ 1 (* r r)))))
                          (complex (/ (+ rx (* ix r)) dn)
                                   (/ (- ix (* rx r)) dn)))
                        (let* ((r (/ ry iy))
                               (dn (* iy (+ 1 (* r r)))))
                          (complex (/ (+ (* rx r) ix) dn)
                                   (/ (- (* ix r) rx) dn))))))
               ;; Multiply a complex by a real or vice versa.
               (deftransform * ((w z) ((complex ,type) real) *)
                 '(complex (* (realpart w) z) (* (imagpart w) z)))
               (deftransform * ((z w) (real (complex ,type)) *)
                 '(complex (* (realpart w) z) (* (imagpart w) z)))
               ;; Divide a complex by a real.
               (deftransform / ((w z) ((complex ,type) real) *)
                 '(complex (/ (realpart w) z) (/ (imagpart w) z)))
               ;; conjugate of complex number
               (deftransform conjugate ((z) ((complex ,type)) *)
                 '(complex (realpart z) (- (imagpart z))))
               ;; CIS of a real argument of type TYPE
               (deftransform cis ((z) ((,type)) *)
                 '(complex (cos z) (sin z)))
               ;; comparison: complex with complex, and complex with
               ;; real in either argument order
               (deftransform = ((w z) ((complex ,type) (complex ,type)) *)
                 '(and (= (realpart w) (realpart z))
                       (= (imagpart w) (imagpart z))))
               (deftransform = ((w z) ((complex ,type) real) *)
                 '(and (= (realpart w) z) (zerop (imagpart w))))
               (deftransform = ((w z) (real (complex ,type)) *)
                 '(and (= (realpart z) w) (zerop (imagpart z)))))))

  (frob single-float)
  (frob double-float))
1184
1185 ;;; Here are simple optimizers for SIN, COS, and TAN. They do not
1186 ;;; produce a minimal range for the result; the result is the widest
1187 ;;; possible answer. This gets around the problem of doing range
1188 ;;; reduction correctly but still provides useful results when the
1189 ;;; inputs are union types.
1190 #-sb-xc-host ; (See CROSS-FLOAT-INFINITY-KLUDGE.)
1191 (progn
;;; Derive the result type of the trigonometric function FCN applied
;;; to an argument of numeric type ARG.
;;;
;;; DOMAIN is a type: when ARG is a subtype of it, the result bounds
;;; are computed by applying FCN to the bounds of ARG (swapped when
;;; INCREASINGP is false). Otherwise DEF-LO and DEF-HI, when non-NIL,
;;; serve as the result bounds.
(defun trig-derive-type-aux (arg domain fcn
                                 &optional def-lo def-hi (increasingp t))
  (etypecase arg
    (numeric-type
     (cond ((eq (numeric-type-complexp arg) :complex)
            ;; A complex argument gives a complex result of the same
            ;; class and format.
            (make-numeric-type :class (numeric-type-class arg)
                               :format (numeric-type-format arg)
                               :complexp :complex))
           ((not (numeric-type-real-p arg))
            (float-or-complex-float-type arg def-lo def-hi))
           (t
            (let* ((format (if (member (numeric-type-class arg)
                                       '(integer rational))
                               'single-float
                               (numeric-type-format arg)))
                   (bound-type (or format 'float)))
              ;; If the argument is a subset of the "principal" domain
              ;; of the function, we can compute the bounds because
              ;; the function is monotonic. We can't do this in
              ;; general for these periodic functions because we can't
              ;; (and don't want to) do the argument reduction in
              ;; exactly the same way as the functions themselves do
              ;; it.
              (cond ((csubtypep arg domain)
                     (let ((at-low (bound-func fcn (numeric-type-low arg)))
                           (at-high (bound-func fcn (numeric-type-high arg))))
                       (multiple-value-bind (res-lo res-hi)
                           (if increasingp
                               (values at-low at-high)
                               (values at-high at-low))
                         (make-numeric-type
                          :class 'float
                          :format format
                          :low (coerce-numeric-bound res-lo bound-type)
                          :high (coerce-numeric-bound res-hi bound-type)))))
                    (t
                     (make-numeric-type
                      :class 'float
                      :format format
                      :low (and def-lo (coerce def-lo bound-type))
                      :high (and def-hi (coerce def-hi bound-type))))))))))))
1229
;;; Type derivation for SIN. Bounds are computed from the argument
;;; bounds when the argument lies in [-pi/2, pi/2]; otherwise the
;;; result is bounded by -1 and 1.
(defoptimizer (sin derive-type) ((angle))
  (one-arg-derive-type
   angle
   (lambda (angle-type)
     (let ((principal-domain
            (specifier-type `(float ,(- (/ pi 2)) ,(/ pi 2)))))
       (trig-derive-type-aux angle-type principal-domain #'sin -1 1)))
   #'sin))
1241
;;; Type derivation for COS. Bounds are computed from the argument
;;; bounds when the argument lies in [0, pi], where the function is
;;; treated as decreasing; otherwise the result is bounded by -1 and 1.
(defoptimizer (cos derive-type) ((angle))
  (one-arg-derive-type
   angle
   (lambda (angle-type)
     (let ((principal-domain (specifier-type `(float 0d0 ,pi))))
       (trig-derive-type-aux angle-type principal-domain #'cos
                             -1 1
                             nil)))     ; INCREASINGP
   #'cos))
1253
;;; Type derivation for TAN. Bounds are computed from the argument
;;; bounds when the argument lies in [-pi/2, pi/2]; otherwise the
;;; result is left unbounded.
(defoptimizer (tan derive-type) ((angle))
  (one-arg-derive-type
   angle
   (lambda (angle-type)
     (let ((principal-domain
            (specifier-type `(float ,(- (/ pi 2)) ,(/ pi 2)))))
       (trig-derive-type-aux angle-type principal-domain #'tan
                             nil nil)))
   #'tan))
1264
1265 ;;; CONJUGATE always returns the same type as the input type.
1266 ;;;
1267 ;;; FIXME: ANSI allows any subtype of REAL for the components of COMPLEX.
1268 ;;; So what if the input type is (COMPLEX (SINGLE-FLOAT 0 1))?
;; The derived type is simply the type of the argument continuation.
(defoptimizer (conjugate derive-type) ((z))
  (continuation-type z))
1271
;;; Type derivation for CIS: a complex whose part type is the float
;;; format of the argument, or plain FLOAT when the argument type has
;;; no format.
(defoptimizer (cis derive-type) ((num))
  (one-arg-derive-type
   num
   (lambda (arg)
     (let ((part-type (or (numeric-type-format arg) 'float)))
       (specifier-type `(complex ,part-type))))
   #'cis))
1278
1279 ) ; PROGN
1280 \f
1281 ;;;; TRUNCATE, FLOOR, CEILING, and ROUND
1282
;; DEF-UNARY-ROUNDING declares UNARY-FUN as a known function from REAL
;; to INTEGER and transforms calls to FUN whose divisor is absent or
;; the constant 1 into a call to UNARY-FUN, with the remainder
;; computed by subtraction.
(macrolet ((def-unary-rounding (fun unary-fun)
             `(progn
                (defknown ,unary-fun (real) integer
                  (movable foldable flushable))
                (deftransform ,fun ((x &optional by)
                                    (* &optional
                                       (constant-arg (member 1))))
                  '(let ((quotient (,unary-fun x)))
                     (values quotient (- x quotient)))))))
  (def-unary-rounding truncate %unary-truncate)
  (def-unary-rounding round %unary-round))
1293
;;; Convert (TRUNCATE x y) to the obvious implementation. We only want
;;; this under certain conditions (a float X with a float or integer
;;; Y) and let the generic TRUNCATE handle the rest. (Note: if Y = 1,
;;; the divide and multiply by Y should be removed by other
;;; DEFTRANSFORMs.)
(deftransform truncate ((x &optional y)
                        (float &optional (or float integer)))
  ;; A missing divisor is represented by the literal 1 in the expansion.
  (let ((divisor-form (if y 'y 1)))
    `(let ((quotient (%unary-truncate (/ x ,divisor-form))))
       (values quotient
               (- x (* ,divisor-form quotient))))))
1303
;;; Convert FLOOR of a float to TRUNCATE plus a correction step: when
;;; the remainder is non-zero and NUMBER and the divisor have opposite
;;; signs, the quotient is decremented and the divisor is added to the
;;; remainder.
(deftransform floor ((number &optional divisor)
                     (float &optional (or integer float)))
  ;; A missing divisor is represented by the literal 1 in the expansion.
  (let ((divisor-form (if divisor 'divisor 1)))
    `(multiple-value-bind (quot left-over) (truncate number ,divisor-form)
       (cond ((zerop left-over)
              (values quot left-over))
             ((if (minusp ,divisor-form)
                  (plusp number)
                  (minusp number))
              (values (1- quot) (+ left-over ,divisor-form)))
             (t
              (values quot left-over))))))
1314
;;; Convert CEILING of a float to TRUNCATE plus a correction step: when
;;; the remainder is non-zero and NUMBER and the divisor have the same
;;; sign, the quotient is incremented and the divisor is subtracted
;;; from the remainder.
(deftransform ceiling ((number &optional divisor)
                       (float &optional (or integer float)))
  ;; A missing divisor is represented by the literal 1 in the expansion.
  (let ((divisor-form (if divisor 'divisor 1)))
    `(multiple-value-bind (quot left-over) (truncate number ,divisor-form)
       (cond ((zerop left-over)
              (values quot left-over))
             ((if (minusp ,divisor-form)
                  (minusp number)
                  (plusp number))
              (values (1+ quot) (- left-over ,divisor-form)))
             (t
              (values quot left-over))))))