src/compiler/node.lisp

   1 ;;;; structures for the first intermediate representation in the
   2 ;;;; compiler, IR1
   3
   4 ;;;; This software is part of the SBCL system. See the README file for
   5 ;;;; more information.
   6 ;;;;
   7 ;;;; This software is derived from the CMU CL system, which was
   8 ;;;; written at Carnegie Mellon University and released into the
   9 ;;;; public domain. The software is in the public domain and is
  10 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
  11 ;;;; files for more information.
  12
  13 (in-package "SB!C")
  14
  15 ;;; The front-end data structure (IR1) is composed of nodes and
  16 ;;; continuations. The general idea is that continuations contain
  17 ;;; top-down information and nodes contain bottom-up, derived
  18 ;;; information. A continuation represents a place in the code, while
  19 ;;; a node represents code that does something.
  20 ;;;
  21 ;;; This representation is more of a flow-graph than an augmented
  22 ;;; syntax tree. The evaluation order is explicitly represented in the
  23 ;;; linkage by continuations, rather than being implicit in the nodes
  24 ;;; which receive the the results of evaluation. This allows us to
  25 ;;; decouple the flow of results from the flow of control. A
  26 ;;; continuation represents both, but the continuation can represent
  27 ;;; the case of a discarded result by having no DEST.
  28
  29 (def!struct (continuation
  30              (:make-load-form-fun ignore-it)
  31              (:constructor make-continuation (&optional dest)))
  32   ;; an indication of the way that this continuation is currently used
  33   ;;
  34   ;; :UNUSED
  35   ;;    A continuation for which all control-related slots have the
  36   ;;    default values. A continuation is unused during IR1 conversion
  37   ;;    until it is assigned a block, and may be also be temporarily
  38   ;;    unused during later manipulations of IR1. In a consistent
  39   ;;    state there should never be any mention of :UNUSED
  40   ;;    continuations. Next can have a non-null value if the next node
  41   ;;    has already been determined.
  42   ;;
  43   ;; :DELETED
  44   ;;    A continuation that has been deleted from IR1. Any pointers into
  45   ;;    IR1 are cleared. There are two conditions under which a deleted
  46   ;;    continuation may appear in code:
  47   ;;     -- The CONT of the LAST node in a block may be a deleted
  48   ;;        continuation when the original receiver of the continuation's
  49   ;;        value was deleted. Note that DEST in a deleted continuation is
  50   ;;        null, so it is easy to know not to attempt delivering any
  51   ;;        values to the continuation.
  52   ;;     -- Unreachable code that hasn't been deleted yet may receive
  53   ;;        deleted continuations. All such code will be in blocks that
  54   ;;        have DELETE-P set. All unreachable code is deleted by control
  55   ;;        optimization, so the backend doesn't have to worry about this.
  56   ;;
  57   ;; :BLOCK-START
  58   ;;    The continuation that is the START of BLOCK. This is the only kind
  59   ;;    of continuation that can have more than one use. The BLOCK's
  60   ;;    START-USES is a list of all the uses.
  61   ;;
  62   ;; :DELETED-BLOCK-START
  63   ;;    Like :BLOCK-START, but BLOCK has been deleted. A block
  64   ;;    starting continuation is made into a deleted block start when
  65   ;;    the block is deleted, but the continuation still may have
  66   ;;    value semantics. Since there isn't any code left, next is
  67   ;;    null.
  68   ;;
  69   ;; :INSIDE-BLOCK
  70   ;;    A continuation that is the CONT of some node in BLOCK.
  71   (kind :unused :type (member :unused :deleted :inside-block :block-start
  72                               :deleted-block-start))
  73   ;; The node which receives this value, if any. In a deleted
  74   ;; continuation, this is null even though the node that receives
  75   ;; this continuation may not yet be deleted.
  76   (dest nil :type (or node null))
  77   ;; If this is a NODE, then it is the node which is to be evaluated
  78   ;; next. This is always null in :DELETED and :UNUSED continuations,
  79   ;; and will be null in a :INSIDE-BLOCK continuation when this is the
  80   ;; CONT of the LAST.
  81   (next nil :type (or node null))
  82   ;; an assertion on the type of this continuation's value
  83   (asserted-type *wild-type* :type ctype)
  84   ;; cached type of this continuation's value. If NIL, then this must
  85   ;; be recomputed: see CONTINUATION-DERIVED-TYPE.
  86   (%derived-type nil :type (or ctype null))
  87   ;; the node where this continuation is used, if unique. This is always
  88   ;; null in :DELETED and :UNUSED continuations, and is never null in
  89   ;; :INSIDE-BLOCK continuations. In a :BLOCK-START continuation, the
  90   ;; Block's START-USES indicate whether NIL means no uses or more
  91   ;; than one use.
  92   (use nil :type (or node null))
  93   ;; the basic block this continuation is in. This is null only in
  94   ;; :DELETED and :UNUSED continuations. Note that blocks that are
  95   ;; unreachable but still in the DFO may receive deleted
  96   ;; continuations, so it isn't o.k. to assume that any continuation
  97   ;; that you pick up out of its DEST node has a BLOCK.
  98   (block nil :type (or cblock null))
  99   ;; set to true when something about this continuation's value has
 100   ;; changed. See REOPTIMIZE-CONTINUATION. This provides a way for IR1
 101   ;; optimize to determine which operands to a node have changed. If
 102   ;; the optimizer for this node type doesn't care, it can elect not
 103   ;; to clear this flag.
 104   (reoptimize t :type boolean)
 105   ;; an indication of what we have proven about how this contination's
 106   ;; type assertion is satisfied:
 107   ;;
 108   ;; NIL
 109   ;;    No type check is necessary (proven type is a subtype of the assertion.)
 110   ;;
 111   ;; T
 112   ;;    A type check is needed.
 113   ;;
 114   ;; :DELETED
 115   ;;    Don't do a type check, but believe (intersect) the assertion.
 116   ;;    A T check can be changed to :DELETED if we somehow prove the
 117   ;;    check is unnecessary, or if we eliminate it through a policy
 118   ;;    decision.
 119   ;;
 120   ;; :NO-CHECK
 121   ;;    Type check generation sets the slot to this if a check is
 122   ;;    called for, but it believes it has proven that the check won't
 123   ;;    be done for policy reasons or because a safe implementation
 124   ;;    will be used. In the latter case, LTN must ensure that a safe
 125   ;;    implementation *is* used.
 126   ;;
 127   ;; :ERROR
 128   ;;    There is a compile-time type error in some use of this
 129   ;;    continuation. A type check should still be generated, but be
 130   ;;    careful.
 131   ;;
 132   ;; This is computed lazily by CONTINUATION-DERIVED-TYPE, so use
 133   ;; CONTINUATION-TYPE-CHECK instead of the %'ed slot accessor.
 134   (%type-check t :type (member t nil :deleted :no-check :error))
 135   ;; something or other that the back end annotates this continuation with
 136   (info nil)
 137   ;; uses of this continuation in the lexical environment. They are
 138   ;; recorded so that when one continuation is substituted for another
 139   ;; the environment may be updated properly.
 140   (lexenv-uses nil :type list))
 141
 142 (def!method print-object ((x continuation) stream)
 143   (print-unreadable-object (x stream :type t :identity t)))
 144
 145 (defstruct (node (:constructor nil)
 146                  (:copier nil))
 147   ;; the bottom-up derived type for this node. This does not take into
 148   ;; consideration output type assertions on this node (actually on its CONT).
 149   (derived-type *wild-type* :type ctype)
 150   ;; True if this node needs to be optimized. This is set to true
 151   ;; whenever something changes about the value of a continuation
 152   ;; whose DEST is this node.
 153   (reoptimize t :type boolean)
 154   ;; the continuation which receives the value of this node. This also
 155   ;; indicates what we do controlwise after evaluating this node. This
 156   ;; may be null during IR1 conversion.
 157   (cont nil :type (or continuation null))
 158   ;; the continuation that this node is the next of. This is null
 159   ;; during IR1 conversion when we haven't linked the node in yet or
 160   ;; in nodes that have been deleted from the IR1 by UNLINK-NODE.
 161   (prev nil :type (or continuation null))
 162   ;; the lexical environment this node was converted in
 163   (lexenv *lexenv* :type lexenv)
 164   ;; a representation of the source code responsible for generating
 165   ;; this node
 166   ;;
 167   ;; For a form introduced by compilation (does not appear in the
 168   ;; original source), the path begins with a list of all the
 169   ;; enclosing introduced forms. This list is from the inside out,
 170   ;; with the form immediately responsible for this node at the head
 171   ;; of the list.
 172   ;;
 173   ;; Following the introduced forms is a representation of the
 174   ;; location of the enclosing original source form. This transition
 175   ;; is indicated by the magic ORIGINAL-SOURCE-START marker. The first
 176   ;; element of the original source is the "form number", which is the
 177   ;; ordinal number of this form in a depth-first, left-to-right walk
 178   ;; of the truly-top-level form in which this appears.
 179   ;;
 180   ;; Following is a list of integers describing the path taken through
 181   ;; the source to get to this point:
 182   ;;     (K L M ...) => (NTH K (NTH L (NTH M ...)))
 183   ;;
 184   ;; The last element in the list is the top level form number, which
 185   ;; is the ordinal number (in this call to the compiler) of the truly
 186   ;; top level form containing the original source.
 187   (source-path *current-path* :type list)
 188   ;; If this node is in a tail-recursive position, then this is set to
 189   ;; T. At the end of IR1 (in physical environment analysis) this is
 190   ;; computed for all nodes (after cleanup code has been emitted).
 191   ;; Before then, a non-null value indicates that IR1 optimization has
 192   ;; converted a tail local call to a direct transfer.
 193   ;;
 194   ;; If the back-end breaks tail-recursion for some reason, then it
 195   ;; can null out this slot.
 196   (tail-p nil :type boolean))
 197
 198 ;;; Flags that are used to indicate various things about a block, such
 199 ;;; as what optimizations need to be done on it:
 200 ;;; -- REOPTIMIZE is set when something interesting happens the uses of a
 201 ;;;    continuation whose Dest is in this block. This indicates that the
 202 ;;;    value-driven (forward) IR1 optimizations should be done on this block.
 203 ;;; -- FLUSH-P is set when code in this block becomes potentially flushable,
 204 ;;;    usually due to a continuation's DEST becoming null.
 205 ;;; -- TYPE-CHECK is true when the type check phase should be run on this
 206 ;;;    block. IR1 optimize can introduce new blocks after type check has
 207 ;;;    already run. We need to check these blocks, but there is no point in
 208 ;;;    checking blocks we have already checked.
 209 ;;; -- DELETE-P is true when this block is used to indicate that this block
 210 ;;;    has been determined to be unreachable and should be deleted. IR1
 211 ;;;    phases should not attempt to  examine or modify blocks with DELETE-P
 212 ;;;    set, since they may:
 213 ;;;     - be in the process of being deleted, or
 214 ;;;     - have no successors, or
 215 ;;;     - receive :DELETED continuations.
 216 ;;; -- TYPE-ASSERTED, TEST-MODIFIED
 217 ;;;    These flags are used to indicate that something in this block
 218 ;;;    might be of interest to constraint propagation. TYPE-ASSERTED
 219 ;;;    is set when a continuation type assertion is strengthened.
 220 ;;;    TEST-MODIFIED is set whenever the test for the ending IF has
 221 ;;;    changed (may be true when there is no IF.)
 222 (def-boolean-attribute block
 223   reoptimize flush-p type-check delete-p type-asserted test-modified)
 224
 225 (macrolet ((frob (slot)
 226              `(defmacro ,(symbolicate "BLOCK-" slot) (block)
 227                 `(block-attributep (block-flags ,block) ,',slot))))
 228   (frob reoptimize)
 229   (frob flush-p)
 230   (frob type-check)
 231   (frob delete-p)
 232   (frob type-asserted)
 233   (frob test-modified))
 234
 235 ;;; The CBLOCK structure represents a basic block. We include
 236 ;;; SSET-ELEMENT so that we can have sets of blocks. Initially the
 237 ;;; SSET-ELEMENT-NUMBER is null, DFO analysis numbers in reverse DFO.
 238 ;;; During IR2 conversion, IR1 blocks are re-numbered in forward emit
 239 ;;; order. This latter numbering also forms the basis of the block
 240 ;;; numbering in the debug-info (though that is relative to the start
 241 ;;; of the function.)
 242 (defstruct (cblock (:include sset-element)
 243                    (:constructor make-block (start))
 244                    (:constructor make-block-key)
 245                    (:conc-name block-)
 246                    (:predicate block-p)
 247                    (:copier copy-block))
 248   ;; a list of all the blocks that are predecessors/successors of this
 249   ;; block. In well-formed IR1, most blocks will have one successor.
 250   ;; The only exceptions are:
 251   ;;  1. component head blocks (any number)
 252   ;;  2. blocks ending in an IF (1 or 2)
 253   ;;  3. blocks with DELETE-P set (zero)
 254   (pred nil :type list)
 255   (succ nil :type list)
 256   ;; the continuation which heads this block (either a :BLOCK-START or
 257   ;; :DELETED-BLOCK-START), or NIL when we haven't made the start
 258   ;; continuation yet (and in the dummy component head and tail
 259   ;; blocks)
 260   (start nil :type (or continuation null))
 261   ;; a list of all the nodes that have START as their CONT
 262   (start-uses nil :type list)
 263   ;; the last node in this block. This is NIL when we are in the
 264   ;; process of building a block (and in the dummy component head and
 265   ;; tail blocks.)
 266   (last nil :type (or node null))
 267   ;; the forward and backward links in the depth-first ordering of the
 268   ;; blocks. These slots are NIL at beginning/end.
 269   (next nil :type (or null cblock))
 270   (prev nil :type (or null cblock))
 271   ;; This block's attributes: see above.
 272   (flags (block-attributes reoptimize flush-p type-check type-asserted
 273                            test-modified)
 274          :type attributes)
 275   ;; CMU CL had a KILL slot here, documented as "set used by
 276   ;; constraint propagation", which was used in constraint propagation
 277   ;; as a list of LAMBDA-VARs killed, and in copy propagation as an
 278   ;; SSET, representing I dunno what. I (WHN) found this confusing,
 279   ;; and furthermore it caused type errors when I was trying to make
 280   ;; the compiler produce fully general LAMBDA functions directly
 281   ;; (instead of doing as CMU CL always did, producing extra little
 282   ;; functions which return the LAMDBA you need) and therefore taking
 283   ;; a new path through the compiler. So I split this into two:
 284   ;;   KILL-LIST = list of LAMBDA-VARs killed, used in constraint propagation
 285   ;;   KILL-SSET = an SSET value, used in copy propagation
 286   (kill-list nil :type list)
 287   (kill-sset nil :type (or sset null))
 288   ;; other sets used in constraint propagation and/or copy propagation
 289   (gen nil)
 290   (in nil)
 291   (out nil)
 292   ;; the component this block is in, or NIL temporarily during IR1
 293   ;; conversion and in deleted blocks
 294   (component *current-component* :type (or component null))
 295   ;; a flag used by various graph-walking code to determine whether
 296   ;; this block has been processed already or what. We make this
 297   ;; initially NIL so that FIND-INITIAL-DFO doesn't have to scan the
 298   ;; entire initial component just to clear the flags.
 299   (flag nil)
 300   ;; some kind of info used by the back end
 301   (info nil)
 302   ;; If true, then constraints that hold in this block and its
 303   ;; successors by merit of being tested by its IF predecessor.
 304   (test-constraint nil :type (or sset null)))
 305 (def!method print-object ((cblock cblock) stream)
 306   (print-unreadable-object (cblock stream :type t :identity t)
 307     (format stream ":START c~D" (cont-num (block-start cblock)))))
 308
 309 ;;; The BLOCK-ANNOTATION class is inherited (via :INCLUDE) by
 310 ;;; different BLOCK-INFO annotation structures so that code
 311 ;;; (specifically control analysis) can be shared.
 312 (defstruct (block-annotation (:constructor nil)
 313                              (:copier nil))
 314   ;; The IR1 block that this block is in the INFO for.
 315   (block (missing-arg) :type cblock)
 316   ;; the next and previous block in emission order (not DFO). This
 317   ;; determines which block we drop though to, and also used to chain
 318   ;; together overflow blocks that result from splitting of IR2 blocks
 319   ;; in lifetime analysis.
 320   (next nil :type (or block-annotation null))
 321   (prev nil :type (or block-annotation null)))
 322
 323 ;;; A COMPONENT structure provides a handle on a connected piece of
 324 ;;; the flow graph. Most of the passes in the compiler operate on
 325 ;;; COMPONENTs rather than on the entire flow graph.
 326 ;;;
 327 ;;; According to the CMU CL internals/front.tex, the reason for
 328 ;;; separating compilation into COMPONENTs is
 329 ;;;   to increase the efficiency of large block compilations. In
 330 ;;;   addition to improving locality of reference and reducing the
 331 ;;;   size of flow analysis problems, this allows back-end data
 332 ;;;   structures to be reclaimed after the compilation of each
 333 ;;;   component.
 334 (defstruct (component (:copier nil))
 335   ;; the kind of component
 336   ;;
 337   ;; (The terminology here is left over from before
 338   ;; sbcl-0.pre7.34.flaky5.2, when there was no such thing as
 339   ;; FUNCTIONAL-HAS-EXTERNAL-REFERENCES-P, so that Python was
 340   ;; incapable of building standalone :EXTERNAL functions, but instead
 341   ;; had to implement things like #'CL:COMPILE as FUNCALL of a little
 342   ;; toplevel stub whose sole purpose was to return an :EXTERNAL
 343   ;; function.)
 344   ;;
 345   ;; The possibilities are:
 346   ;;   NIL
 347   ;;     an ordinary component, containing non-top-level code
 348   ;;   :TOPLEVEL
 349   ;;     a component containing only load-time code
 350   ;;   :COMPLEX-TOPLEVEL
 351   ;;     In the old system, before FUNCTIONAL-HAS-EXTERNAL-REFERENCES-P
 352   ;;     was defined, this was necessarily a component containing both
 353   ;;     top level and run-time code. Now this state is also used for
 354   ;;     a component with HAS-EXTERNAL-REFERENCES-P functionals in it.
 355   ;;   :INITIAL
 356   ;;     the result of initial IR1 conversion, on which component
 357   ;;     analysis has not been done
 358   ;;   :DELETED
 359   ;;     debris left over from component analysis
 360   ;;
 361   ;; See also COMPONENT-TOPLEVELISH-P.
 362   (kind nil :type (member nil :toplevel :complex-toplevel :initial :deleted))
 363   ;; the blocks that are the dummy head and tail of the DFO
 364   ;;
 365   ;; Entry/exit points have these blocks as their
 366   ;; predecessors/successors. Null temporarily. The start and return
 367   ;; from each non-deleted function is linked to the component head
 368   ;; and tail. Until physical environment analysis links NLX entry
 369   ;; stubs to the component head, every successor of the head is a
 370   ;; function start (i.e. begins with a BIND node.)
 371   (head nil :type (or null cblock))
 372   (tail nil :type (or null cblock))
 373   ;; This becomes a list of the CLAMBDA structures for all functions
 374   ;; in this component. OPTIONAL-DISPATCHes are represented only by
 375   ;; their XEP and other associated lambdas. This doesn't contain any
 376   ;; deleted or LET lambdas.
 377   ;;
 378   ;; Note that logical associations between CLAMBDAs and COMPONENTs
 379   ;; seem to exist for a while before this is initialized. See e.g.
 380   ;; the NEW-FUNS slot. In particular, I got burned by writing some
 381   ;; code to use this value to decide which components need
 382   ;; LOCALL-ANALYZE-COMPONENT, when it turns out that
 383   ;; LOCALL-ANALYZE-COMPONENT had a role in initializing this value
 384   ;; (and DFO stuff does too, maybe). Also, even after it's
 385   ;; initialized, it might change as CLAMBDAs are deleted or merged.
 386   ;; -- WHN 2001-09-30
 387   (lambdas () :type list)
 388   ;; a list of FUNCTIONALs for functions that are newly converted, and
 389   ;; haven't been local-call analyzed yet. Initially functions are not
 390   ;; in the LAMBDAS list. Local call analysis moves them there
 391   ;; (possibly as LETs, or implicitly as XEPs if an OPTIONAL-DISPATCH.)
 392   ;; Between runs of local call analysis there may be some debris of
 393   ;; converted or even deleted functions in this list.
 394   (new-funs () :type list)
 395   ;; If this is true, then there is stuff in this component that could
 396   ;; benefit from further IR1 optimization.
 397   (reoptimize t :type boolean)
 398   ;; If this is true, then the control flow in this component was
 399   ;; messed up by IR1 optimizations, so the DFO should be recomputed.
 400   (reanalyze nil :type boolean)
 401   ;; some sort of name for the code in this component
 402   (name "<unknown>" :type simple-string)
 403   ;; some kind of info used by the back end
 404   (info nil)
 405   ;; the SOURCE-INFO structure describing where this component was
 406   ;; compiled from
 407   (source-info *source-info* :type source-info)
 408   ;; count of the number of inline expansions we have done while
 409   ;; compiling this component, to detect infinite or exponential
 410   ;; blowups
 411   (inline-expansions 0 :type index)
 412   ;; a map from combination nodes to things describing how an
 413   ;; optimization of the node failed. The description is an alist
 414   ;; (TRANSFORM . ARGS), where TRANSFORM is the structure describing
 415   ;; the transform that failed, and ARGS is either a list of format
 416   ;; arguments for the note, or the FUN-TYPE that would have
 417   ;; enabled the transformation but failed to match.
 418   (failed-optimizations (make-hash-table :test 'eq) :type hash-table)
 419   ;; This is similar to NEW-FUNS, but is used when a function has
 420   ;; already been analyzed, but new references have been added by
 421   ;; inline expansion. Unlike NEW-FUNS, this is not disjoint from
 422   ;; COMPONENT-LAMBDAS.
 423   (reanalyze-funs nil :type list))
 424 (defprinter (component :identity t)
 425   name
 426   (reanalyze :test reanalyze))
 427
 428 ;;; Before sbcl-0.7.0, there were :TOPLEVEL things which were magical
 429 ;;; in multiple ways. That's since been refactored into the orthogonal
 430 ;;; properties "optimized for locall with no arguments" and "externally
 431 ;;; visible/referenced (so don't delete it)". The code <0.7.0 did a lot
 432 ;;; of tests a la (EQ KIND :TOP_LEVEL) in the "don't delete it?" sense;
 433 ;;; this function is a sort of literal translation of those tests into
 434 ;;; the new world.
 435 ;;;
 436 ;;; FIXME: After things settle down, bare :TOPLEVEL might go away, at
 437 ;;; which time it might be possible to replace the COMPONENT-KIND
 438 ;;; :TOPLEVEL mess with a flag COMPONENT-HAS-EXTERNAL-REFERENCES-P
 439 ;;; along the lines of FUNCTIONAL-HAS-EXTERNAL-REFERENCES-P.
 440 (defun lambda-toplevelish-p (clambda)
 441   (or (eql (lambda-kind clambda) :toplevel)
 442       (lambda-has-external-references-p clambda)))
 443 (defun component-toplevelish-p (component)
 444   (member (component-kind component)
 445           '(:toplevel :complex-toplevel)))
 446
 447 ;;; A CLEANUP structure represents some dynamic binding action. Blocks
 448 ;;; are annotated with the current CLEANUP so that dynamic bindings
 449 ;;; can be removed when control is transferred out of the binding
 450 ;;; environment. We arrange for changes in dynamic bindings to happen
 451 ;;; at block boundaries, so that cleanup code may easily be inserted.
 452 ;;; The "mess-up" action is explicitly represented by a funny function
 453 ;;; call or ENTRY node.
 454 ;;;
 455 ;;; We guarantee that CLEANUPs only need to be done at block boundaries
 456 ;;; by requiring that the exit continuations initially head their
 457 ;;; blocks, and then by not merging blocks when there is a cleanup
 458 ;;; change.
 459 (defstruct (cleanup (:copier nil))
 460   ;; the kind of thing that has to be cleaned up
 461   (kind (missing-arg)
 462         :type (member :special-bind :catch :unwind-protect :block :tagbody))
 463   ;; the node that messes things up. This is the last node in the
 464   ;; non-messed-up environment. Null only temporarily. This could be
 465   ;; deleted due to unreachability.
 466   (mess-up nil :type (or node null))
 467   ;; a list of all the NLX-INFO structures whose NLX-INFO-CLEANUP is
 468   ;; this cleanup. This is filled in by physical environment analysis.
 469   (nlx-info nil :type list))
 470 (defprinter (cleanup :identity t)
 471   kind
 472   mess-up
 473   (nlx-info :test nlx-info))
 474
 475 ;;; A PHYSENV represents the result of physical environment analysis.
 476 ;;;
 477 ;;; As far as I can tell from reverse engineering, this IR1 structure
 478 ;;; represents the physical environment (which is probably not the
 479 ;;; standard Lispy term for this concept, but I dunno what is the
 480 ;;; standard term): those things in the lexical environment which a
 481 ;;; LAMBDA actually interacts with. Thus in
 482 ;;;   (DEFUN FROB-THINGS (THINGS)
 483 ;;;     (DOLIST (THING THINGS)
 484 ;;;       (BLOCK FROBBING-ONE-THING
 485 ;;;         (MAPCAR (LAMBDA (PATTERN)
 486 ;;;                   (WHEN (FITS-P THING PATTERN)
 487 ;;;                     (RETURN-FROM FROB-THINGS (LIST :FIT THING PATTERN))))
 488 ;;;                 *PATTERNS*))))
 489 ;;; the variables THINGS, THING, and PATTERN and the block names
 490 ;;; FROB-THINGS and FROBBING-ONE-THING are all in the inner LAMBDA's
 491 ;;; lexical environment, but of those only THING, PATTERN, and
 492 ;;; FROB-THINGS are in its physical environment. In IR1, we largely
 493 ;;; just collect the names of these things; in IR2 an IR2-PHYSENV
 494 ;;; structure is attached to INFO and used to keep track of
 495 ;;; associations between these names and less-abstract things (like
 496 ;;; TNs, or eventually stack slots and registers). -- WHN 2001-09-29
 497 (defstruct (physenv (:copier nil))
 498   ;; the function that allocates this physical environment
 499   (lambda (missing-arg) :type clambda :read-only t)
 500   #| ; seems not to be used as of sbcl-0.pre7.51
 501   ;; a list of all the lambdas that allocate variables in this
 502   ;; physical environment
 503   (lambdas nil :type list)
 504   |#
 505   ;; This ultimately converges to a list of all the LAMBDA-VARs and
 506   ;; NLX-INFOs needed from enclosing environments by code in this
 507   ;; physical environment. In the meantime, it may be
 508   ;;   * NIL at object creation time
 509   ;;   * a superset of the correct result, generated somewhat later
 510   ;;   * smaller and smaller sets converging to the correct result as
 511   ;;     we notice and delete unused elements in the superset
 512   (closure nil :type list)
 513   ;; a list of NLX-INFO structures describing all the non-local exits
 514   ;; into this physical environment
 515   (nlx-info nil :type list)
 516   ;; some kind of info used by the back end
 517   (info nil))
 518 (defprinter (physenv :identity t)
 519   lambda
 520   (closure :test closure)
 521   (nlx-info :test nlx-info))
 522
 523 ;;; An TAIL-SET structure is used to accumulate information about
 524 ;;; tail-recursive local calls. The "tail set" is effectively the
 525 ;;; transitive closure of the "is called tail-recursively by"
 526 ;;; relation.
 527 ;;;
 528 ;;; All functions in the same tail set share the same TAIL-SET
 529 ;;; structure. Initially each function has its own TAIL-SET, but when
 530 ;;; IR1-OPTIMIZE-RETURN notices a tail local call, it joins the tail
 531 ;;; sets of the called function and the calling function.
 532 ;;;
 533 ;;; The tail set is somewhat approximate, because it is too early to
 534 ;;; be sure which calls will be tail-recursive. Any call that *might*
 535 ;;; end up tail-recursive causes TAIL-SET merging.
 536 (defstruct (tail-set)
 537   ;; a list of all the LAMBDAs in this tail set
 538   (funs nil :type list)
 539   ;; our current best guess of the type returned by these functions.
 540   ;; This is the union across all the functions of the return node's
 541   ;; RESULT-TYPE, excluding local calls.
 542   (type *wild-type* :type ctype)
 543   ;; some info used by the back end
 544   (info nil))
 545 (defprinter (tail-set :identity t)
 546   funs
 547   type
 548   (info :test info))
 549
 550 ;;; The NLX-Info structure is used to collect various information
 551 ;;; about non-local exits. This is effectively an annotation on the
 552 ;;; CONTINUATION, although it is accessed by searching in the
 553 ;;; PHYSENV-NLX-INFO.
 554 (def!struct (nlx-info (:make-load-form-fun ignore-it))
 555   ;; the cleanup associated with this exit. In a catch or
 556   ;; unwind-protect, this is the :CATCH or :UNWIND-PROTECT cleanup,
 557   ;; and not the cleanup for the escape block. The CLEANUP-KIND of
 558   ;; this thus provides a good indication of what kind of exit is
 559   ;; being done.
 560   (cleanup (missing-arg) :type cleanup)
 561   ;; the continuation exited to (the CONT of the EXIT nodes). If this
 562   ;; exit is from an escape function (CATCH or UNWIND-PROTECT), then
 563   ;; physical environment analysis deletes the escape function and
 564   ;; instead has the %NLX-ENTRY use this continuation.
 565   ;;
 566   ;; This slot is primarily an indication of where this exit delivers
 567   ;; its values to (if any), but it is also used as a sort of name to
 568   ;; allow us to find the NLX-Info that corresponds to a given exit.
 569   ;; For this purpose, the Entry must also be used to disambiguate,
 570   ;; since exits to different places may deliver their result to the
 571   ;; same continuation.
 572   (continuation (missing-arg) :type continuation)
 573   ;; the entry stub inserted by physical environment analysis. This is
 574   ;; a block containing a call to the %NLX-Entry funny function that
 575   ;; has the original exit destination as its successor. Null only
 576   ;; temporarily.
 577   (target nil :type (or cblock null))
 578   ;; some kind of info used by the back end
 579   info)
 580 (defprinter (nlx-info :identity t)
 581   continuation
 582   target
 583   info)
 584 \f
 585 ;;;; LEAF structures
 586
 587 ;;; Variables, constants and functions are all represented by LEAF
 588 ;;; structures. A reference to a LEAF is indicated by a REF node. This
 589 ;;; allows us to easily substitute one for the other without actually
 590 ;;; hacking the flow graph.
 591 (def!struct (leaf (:make-load-form-fun ignore-it)
 592                   (:constructor nil))
 593   ;; (For public access to this slot, use LEAF-SOURCE-NAME.)
 594   ;;
 595   ;; the name of LEAF as it appears in the source, e.g. 'FOO or '(SETF
 596   ;; FOO) or 'N or '*Z*, or the special .ANONYMOUS. value if there's
 597   ;; no name for this thing in the source (as can happen for
 598   ;; FUNCTIONALs, e.g. for anonymous LAMBDAs or for functions for
 599   ;; top-level forms; and can also happen for anonymous constants) or
 600   ;; perhaps also if the match between the name and the thing is
 601   ;; skewed enough (e.g. for macro functions or method functions) that
 602   ;; we don't want to have that name affect compilation
 603   ;;
 604   ;; The value of this slot in can affect ordinary runtime behavior,
 605   ;; e.g. of special variables and known functions, not just debugging.
 606   ;;
 607   ;; See also the LEAF-DEBUG-NAME function and the
 608   ;; FUNCTIONAL-%DEBUG-NAME slot.
 609   (%source-name (missing-arg)
 610                 :type (or symbol (and cons (satisfies legal-fun-name-p)))
 611                 :read-only t)
 612   ;; the type which values of this leaf must have
 613   (type *universal-type* :type ctype)
 614   ;; where the TYPE information came from:
 615   ;;  :DECLARED, from a declaration.
 616   ;;  :ASSUMED, from uses of the object.
 617   ;;  :DEFINED, from examination of the definition.
 618   ;; FIXME: This should be a named type. (LEAF-WHERE-FROM? Or
 619   ;; perhaps just WHERE-FROM, since it's not just used in LEAF,
 620   ;; but also in various DEFINE-INFO-TYPEs in globaldb.lisp,
 621   ;; and very likely elsewhere too.)
 622   (where-from :assumed :type (member :declared :assumed :defined))
 623   ;; list of the REF nodes for this leaf
 624   (refs () :type list)
 625   ;; true if there was ever a REF or SET node for this leaf. This may
 626   ;; be true when REFS and SETS are null, since code can be deleted.
 627   (ever-used nil :type boolean)
 628   ;; some kind of info used by the back end
 629   (info nil))
 630
 631 ;;; LEAF name operations
 632 ;;;
 633 ;;; KLUDGE: wants CLOS..
 634 (defun leaf-has-source-name-p (leaf)
 635   (not (eq (leaf-%source-name leaf)
 636            '.anonymous.)))
 637 (defun leaf-source-name (leaf)
 638   (aver (leaf-has-source-name-p leaf))
 639   (leaf-%source-name leaf))
 640 (defun leaf-debug-name (leaf)
 641   (if (functional-p leaf)
 642       ;; FUNCTIONALs have additional %DEBUG-NAME behavior.
 643       (functional-debug-name leaf)
 644       ;; Other objects just use their source name.
 645       ;;
 646       ;; (As of sbcl-0.pre7.85, there are a few non-FUNCTIONAL
 647       ;; anonymous objects, (anonymous constants..) and those would
 648       ;; fail here if we ever tried to get debug names from them, but
 649       ;; it looks as though it's never interesting to get debug names
 650       ;; from them, so it's moot. -- WHN)
 651       (leaf-source-name leaf)))
 652
 653 ;;; The CONSTANT structure is used to represent known constant values.
 654 ;;; If NAME is not null, then it is the name of the named constant
 655 ;;; which this leaf corresponds to, otherwise this is an anonymous
 656 ;;; constant.
 657 (def!struct (constant (:include leaf))
 658   ;; the value of the constant
 659   (value nil :type t))
 660 (defprinter (constant :identity t)
 661   (%source-name :test %source-name)
 662   value)
 663
 664 ;;; The BASIC-VAR structure represents information common to all
 665 ;;; variables which don't correspond to known local functions.
 666 (def!struct (basic-var (:include leaf)
 667                        (:constructor nil))
 668   ;; Lists of the set nodes for this variable.
 669   (sets () :type list))
 670
 671 ;;; The GLOBAL-VAR structure represents a value hung off of the symbol
 672 ;;; NAME. We use a :CONSTANT VAR when we know that the thing is a
 673 ;;; constant, but don't know what the value is at compile time.
 674 (def!struct (global-var (:include basic-var))
 675   ;; kind of variable described
 676   (kind (missing-arg)
 677         :type (member :special :global-function :global)))
 678 (defprinter (global-var :identity t)
 679   %source-name
 680   (type :test (not (eq type *universal-type*)))
 681   (where-from :test (not (eq where-from :assumed)))
 682   kind)
 683
 684 ;;; The SLOT-ACCESSOR structure represents slot accessor functions. It
 685 ;;; is a subtype of GLOBAL-VAR to make it look more like a normal
 686 ;;; function.
 687 (def!struct (slot-accessor (:include global-var
 688                                      (where-from :defined)
 689                                      (kind :global-function)))
 690   ;; The description of the structure that this is an accessor for.
 691   (for (missing-arg) :type sb!xc:class)
 692   ;; The slot description of the slot.
 693   (slot (missing-arg)))
 694 (defprinter (slot-accessor :identity t)
 695   %source-name
 696   for
 697   slot)
 698
 699 ;;; A DEFINED-FUN represents a function that is defined in the same
 700 ;;; compilation block, or that has an inline expansion, or that has a
 701 ;;; non-NIL INLINEP value. Whenever we change the INLINEP state (i.e.
 702 ;;; an inline proclamation) we copy the structure so that former
 703 ;;; INLINEP values are preserved.
 704 (def!struct (defined-fun (:include global-var
 705                                    (where-from :defined)
 706                                    (kind :global-function)))
 707   ;; The values of INLINEP and INLINE-EXPANSION initialized from the
 708   ;; global environment.
 709   (inlinep nil :type inlinep)
 710   (inline-expansion nil :type (or cons null))
 711   ;; the block-local definition of this function (either because it
 712   ;; was semi-inline, or because it was defined in this block). If
 713   ;; this function is not an entry point, then this may be deleted or
 714   ;; LET-converted. Null if we haven't converted the expansion yet.
 715   (functional nil :type (or functional null)))
 716 (defprinter (defined-fun :identity t)
 717   %source-name
 718   inlinep
 719   (functional :test functional))
 720 \f
 721 ;;;; function stuff
 722
 723 ;;; We default the WHERE-FROM and TYPE slots to :DEFINED and FUNCTION.
 724 ;;; We don't normally manipulate function types for defined functions,
 725 ;;; but if someone wants to know, an approximation is there.
 726 (def!struct (functional (:include leaf
 727                                   (%source-name '.anonymous.)
 728                                   (where-from :defined)
 729                                   (type (specifier-type 'function))))
 730   ;; (For public access to this slot, use LEAF-DEBUG-NAME.)
 731   ;;
 732   ;; the name of FUNCTIONAL for debugging purposes, or NIL if we
 733   ;; should just let the SOURCE-NAME fall through
 734   ;;
 735   ;; Unlike the SOURCE-NAME slot, this slot's value should never
 736   ;; affect ordinary code behavior, only debugging/diagnostic behavior.
 737   ;;
 738   ;; The value of this slot can be anything, except that it shouldn't
 739   ;; be a legal function name, since otherwise debugging gets
 740   ;; confusing. (If a legal function name is a good name for the
 741   ;; function, it should be in %SOURCE-NAME, and then we shouldn't
 742   ;; need a %DEBUG-NAME.) In SBCL as of 0.pre7.87, it's always a
 743   ;; string unless it's NIL, since that's how CMU CL represented debug
 744   ;; names. However, eventually I (WHN) think it we should start using
 745   ;; list values instead, since they have much nicer print properties
 746   ;; (abbreviation, skipping package prefixes when unneeded, and
 747   ;; renaming package prefixes when we do things like renaming SB!EXT
 748   ;; to SB-EXT).
 749   ;;
 750   ;; E.g. for the function which implements (DEFUN FOO ...), we could
 751   ;; have
 752   ;;   %SOURCE-NAME=FOO
 753   ;;   %DEBUG-NAME=NIL
 754   ;; for the function which implements the top level form
 755   ;; (IN-PACKAGE :FOO) we could have
 756   ;;   %SOURCE-NAME=NIL
 757   ;;   %DEBUG-NAME="top level form (IN-PACKAGE :FOO)"
 758   ;; for the function which implements FOO in
 759   ;;   (DEFUN BAR (...) (FLET ((FOO (...) ...)) ...))
 760   ;; we could have
 761   ;;   %SOURCE-NAME=FOO
 762   ;;   %DEBUG-NAME="FLET FOO in BAR"
 763   ;; and for the function which implements FOO in
 764   ;;   (DEFMACRO FOO (...) ...)
 765   ;; we could have
 766   ;;   %SOURCE-NAME=FOO (or maybe .ANONYMOUS.?)
 767   ;;   %DEBUG-NAME="DEFMACRO FOO"
 768   (%debug-name nil
 769                :type (or null (not (satisfies legal-fun-name-p)))
 770                :read-only t)
 771   ;; some information about how this function is used. These values
 772   ;; are meaningful:
 773   ;;
 774   ;;    NIL
 775   ;;    an ordinary function, callable using local call
 776   ;;
 777   ;;    :LET
 778   ;;    a lambda that is used in only one local call, and has in
 779   ;;    effect been substituted directly inline. The return node is
 780   ;;    deleted, and the result is computed with the actual result
 781   ;;    continuation for the call.
 782   ;;
 783   ;;    :MV-LET
 784   ;;    Similar to :LET, but the call is an MV-CALL.
 785   ;;
 786   ;;    :ASSIGNMENT
 787   ;;    similar to a LET, but can have other than one call as long as
 788   ;;    there is at most one non-tail call.
 789   ;;
 790   ;;    :OPTIONAL
 791   ;;    a lambda that is an entry-point for an optional-dispatch.
 792   ;;    Similar to NIL, but requires greater caution, since local call
 793   ;;    analysis may create new references to this function. Also, the
 794   ;;    function cannot be deleted even if it has *no* references. The
 795   ;;    OPTIONAL-DISPATCH is in the LAMDBA-OPTIONAL-DISPATCH.
 796   ;;
 797   ;;    :EXTERNAL
 798   ;;    an external entry point lambda. The function it is an entry
 799   ;;    for is in the ENTRY-FUN slot.
 800   ;;
 801   ;;    :TOPLEVEL
 802   ;;    a top level lambda, holding a compiled top level form.
 803   ;;    Compiled very much like NIL, but provides an indication of
 804   ;;    top level context. A :TOPLEVEL lambda should have *no*
 805   ;;    references. Its ENTRY-FUN is a self-pointer.
 806   ;;
 807   ;;    :TOPLEVEL-XEP
 808   ;;    After a component is compiled, we clobber any top level code
 809   ;;    references to its non-closure XEPs with dummy FUNCTIONAL
 810   ;;    structures having this kind. This prevents the retained
 811   ;;    top level code from holding onto the IR for the code it
 812   ;;    references.
 813   ;;
 814   ;;    :ESCAPE
 815   ;;    :CLEANUP
 816   ;;    special functions used internally by CATCH and UNWIND-PROTECT.
 817   ;;    These are pretty much like a normal function (NIL), but are
 818   ;;    treated specially by local call analysis and stuff. Neither
 819   ;;    kind should ever be given an XEP even though they appear as
 820   ;;    args to funny functions. An :ESCAPE function is never actually
 821   ;;    called, and thus doesn't need to have code generated for it.
 822   ;;
 823   ;;    :DELETED
 824   ;;    This function has been found to be uncallable, and has been
 825   ;;    marked for deletion.
 826   (kind nil :type (member nil :optional :deleted :external :toplevel
 827                           :escape :cleanup :let :mv-let :assignment
 828                           :toplevel-xep))
 829   ;; Is this a function that some external entity (e.g. the fasl dumper)
 830   ;; refers to, so that even when it appears to have no references, it
 831   ;; shouldn't be deleted? In the old days (before
 832   ;; sbcl-0.pre7.37.flaky5.2) this was sort of implicitly true when
 833   ;; KIND was :TOPLEVEL. Now it must be set explicitly, both for
 834   ;; :TOPLEVEL functions and for any other kind of functions that we
 835   ;; want to dump or return from #'CL:COMPILE or whatever.
 836   (has-external-references-p nil)
 837   ;; In a normal function, this is the external entry point (XEP)
 838   ;; lambda for this function, if any. Each function that is used
 839   ;; other than in a local call has an XEP, and all of the
 840   ;; non-local-call references are replaced with references to the
 841   ;; XEP.
 842   ;;
 843   ;; In an XEP lambda (indicated by the :EXTERNAL kind), this is the
 844   ;; function that the XEP is an entry-point for. The body contains
 845   ;; local calls to all the actual entry points in the function. In a
 846   ;; :TOPLEVEL lambda (which is its own XEP) this is a self-pointer.
 847   ;;
 848   ;; With all other kinds, this is null.
 849   (entry-fun nil :type (or functional null))
 850   ;; the value of any inline/notinline declaration for a local function
 851   (inlinep nil :type inlinep)
 852   ;; If we have a lambda that can be used as in inline expansion for
 853   ;; this function, then this is it. If there is no source-level
 854   ;; lambda corresponding to this function then this is Null (but then
 855   ;; INLINEP will always be NIL as well.)
 856   (inline-expansion nil :type list)
 857   ;; the lexical environment that the inline-expansion should be converted in
 858   (lexenv *lexenv* :type lexenv)
 859   ;; the original function or macro lambda list, or :UNSPECIFIED if
 860   ;; this is a compiler created function
 861   (arg-documentation nil :type (or list (member :unspecified)))
 862   ;; various rare miscellaneous info that drives code generation & stuff
 863   (plist () :type list))
 864 (defprinter (functional :identity t)
 865   %source-name
 866   %debug-name)
 867
 868 ;;; FUNCTIONAL name operations
 869 (defun functional-debug-name (functional)
 870   ;; FUNCTIONAL-%DEBUG-NAME takes precedence over FUNCTIONAL-SOURCE-NAME
 871   ;; here because we want different debug names for the functions in
 872   ;; DEFUN FOO and FLET FOO even though they have the same source name.
 873   (or (functional-%debug-name functional)
 874       ;; Note that this will cause an error if the function is
 875       ;; anonymous. In SBCL (as opposed to CMU CL) we make all
 876       ;; FUNCTIONALs have debug names. The CMU CL code didn't bother
 877       ;; in many FUNCTIONALs, especially those which were likely to be
 878       ;; optimized away before the user saw them. However, getting
 879       ;; that right requires a global understanding of the code,
 880       ;; which seems bad, so we just require names for everything.
 881       (leaf-source-name functional)))
 882
 883 ;;; The CLAMBDA only deals with required lexical arguments. Special,
 884 ;;; optional, keyword and rest arguments are handled by transforming
 885 ;;; into simpler stuff.
 886 (def!struct (clambda (:include functional)
 887                      (:conc-name lambda-)
 888                      (:predicate lambda-p)
 889                      (:constructor make-lambda)
 890                      (:copier copy-lambda))
 891   ;; list of LAMBDA-VAR descriptors for arguments
 892   (vars nil :type list :read-only t)
 893   ;; If this function was ever a :OPTIONAL function (an entry-point
 894   ;; for an OPTIONAL-DISPATCH), then this is that OPTIONAL-DISPATCH.
 895   ;; The optional dispatch will be :DELETED if this function is no
 896   ;; longer :OPTIONAL.
 897   (optional-dispatch nil :type (or optional-dispatch null))
 898   ;; the BIND node for this LAMBDA. This node marks the beginning of
 899   ;; the lambda, and serves to explicitly represent the lambda binding
 900   ;; semantics within the flow graph representation. This is null in
 901   ;; deleted functions, and also in LETs where we deleted the call and
 902   ;; bind (because there are no variables left), but have not yet
 903   ;; actually deleted the LAMBDA yet.
 904   (bind nil :type (or bind null))
 905   ;; the RETURN node for this LAMBDA, or NIL if it has been deleted.
 906   ;; This marks the end of the lambda, receiving the result of the
 907   ;; body. In a LET, the return node is deleted, and the body delivers
 908   ;; the value to the actual continuation. The return may also be
 909   ;; deleted if it is unreachable.
 910   (return nil :type (or creturn null))
 911   ;; If this CLAMBDA is a LET, then this slot holds the LAMBDA whose
 912   ;; LETS list we are in, otherwise it is a self-pointer.
 913   (home nil :type (or clambda null))
 914   ;; all the lambdas that have been LET-substituted in this lambda.
 915   ;; This is only non-null in lambdas that aren't LETs.
 916   (lets nil :type list)
 917   ;; all the ENTRY nodes in this function and its LETs, or null in a LET
 918   (entries nil :type list)
 919   ;; CLAMBDAs which are locally called by this lambda, and other
 920   ;; objects (closed-over LAMBDA-VARs and XEPs) which this lambda
 921   ;; depends on in such a way that DFO shouldn't put them in separate
 922   ;; components.
 923   (calls-or-closes nil :type list)
 924   ;; the TAIL-SET that this LAMBDA is in. This is null during creation.
 925   ;;
 926   ;; In CMU CL, and old SBCL, this was also NILed out when LET
 927   ;; conversion happened. That caused some problems, so as of
 928   ;; sbcl-0.pre7.37.flaky5.2 when I was trying to get the compiler to
 929   ;; emit :EXTERNAL functions directly, and so now the value
 930   ;; is no longer NILed out in LET conversion, but instead copied
 931   ;; (so that any further optimizations on the rest of the tail
 932   ;; set won't modify the value) if necessary.
 933   (tail-set nil :type (or tail-set null))
 934   ;; the structure which represents the phsical environment that this
 935   ;; function's variables are allocated in. This is filled in by
 936   ;; physical environment analysis. In a LET, this is EQ to our home's
 937   ;; physical environment.
 938   (physenv nil :type (or physenv null))
 939   ;; In a LET, this is the NODE-LEXENV of the combination node. We
 940   ;; retain it so that if the LET is deleted (due to a lack of vars),
 941   ;; we will still have caller's lexenv to figure out which cleanup is
 942   ;; in effect.
 943   (call-lexenv nil :type (or lexenv null)))
 944 (defprinter (clambda :conc-name lambda- :identity t)
 945   %source-name
 946   %debug-name
 947   (type :test (not (eq type *universal-type*)))
 948   (where-from :test (not (eq where-from :assumed)))
 949   (vars :prin1 (mapcar #'leaf-source-name vars)))
 950
 951 ;;; The OPTIONAL-DISPATCH leaf is used to represent hairy lambdas. It
 952 ;;; is a FUNCTIONAL, like LAMBDA. Each legal number of arguments has a
 953 ;;; function which is called when that number of arguments is passed.
 954 ;;; The function is called with all the arguments actually passed. If
 955 ;;; additional arguments are legal, then the LEXPR style MORE-ENTRY
 956 ;;; handles them. The value returned by the function is the value
 957 ;;; which results from calling the OPTIONAL-DISPATCH.
 958 ;;;
 959 ;;; The theory is that each entry-point function calls the next entry
 960 ;;; point tail-recursively, passing all the arguments passed in and
 961 ;;; the default for the argument the entry point is for. The last
 962 ;;; entry point calls the real body of the function. In the presence
 963 ;;; of SUPPLIED-P args and other hair, things are more complicated. In
 964 ;;; general, there is a distinct internal function that takes the
 965 ;;; SUPPLIED-P args as parameters. The preceding entry point calls
 966 ;;; this function with NIL filled in for the SUPPLIED-P args, while
 967 ;;; the current entry point calls it with T in the SUPPLIED-P
 968 ;;; positions.
 969 ;;;
 970 ;;; Note that it is easy to turn a call with a known number of
 971 ;;; arguments into a direct call to the appropriate entry-point
 972 ;;; function, so functions that are compiled together can avoid doing
 973 ;;; the dispatch.
 974 (def!struct (optional-dispatch (:include functional))
 975   ;; the original parsed argument list, for anyone who cares
 976   (arglist nil :type list)
 977   ;; true if &ALLOW-OTHER-KEYS was supplied
 978   (allowp nil :type boolean)
 979   ;; true if &KEY was specified (which doesn't necessarily mean that
 980   ;; there are any &KEY arguments..)
 981   (keyp nil :type boolean)
 982   ;; the number of required arguments. This is the smallest legal
 983   ;; number of arguments.
 984   (min-args 0 :type unsigned-byte)
 985   ;; the total number of required and optional arguments. Args at
 986   ;; positions >= to this are &REST, &KEY or illegal args.
 987   (max-args 0 :type unsigned-byte)
 988   ;; list of the LAMBDAs which are the entry points for non-rest,
 989   ;; non-key calls. The entry for MIN-ARGS is first, MIN-ARGS+1
 990   ;; second, ... MAX-ARGS last. The last entry-point always calls the
 991   ;; main entry; in simple cases it may be the main entry.
 992   (entry-points nil :type list)
 993   ;; an entry point which takes MAX-ARGS fixed arguments followed by
 994   ;; an argument context pointer and an argument count. This entry
 995   ;; point deals with listifying rest args and parsing keywords. This
 996   ;; is null when extra arguments aren't legal.
 997   (more-entry nil :type (or clambda null))
 998   ;; the main entry-point into the function, which takes all arguments
 999   ;; including keywords as fixed arguments. The format of the
1000   ;; arguments must be determined by examining the arglist. This may
1001   ;; be used by callers that supply at least MAX-ARGS arguments and
1002   ;; know what they are doing.
1003   (main-entry nil :type (or clambda null)))
1004 (defprinter (optional-dispatch :identity t)
1005   %source-name
1006   %debug-name
1007   (type :test (not (eq type *universal-type*)))
1008   (where-from :test (not (eq where-from :assumed)))
1009   arglist
1010   allowp
1011   keyp
1012   min-args
1013   max-args
1014   (entry-points :test entry-points)
1015   (more-entry :test more-entry)
1016   main-entry)
1017
1018 ;;; The ARG-INFO structure allows us to tack various information onto
1019 ;;; LAMBDA-VARs during IR1 conversion. If we use one of these things,
1020 ;;; then the var will have to be massaged a bit before it is simple
1021 ;;; and lexical.
1022 (def!struct arg-info
1023   ;; true if this arg is to be specially bound
1024   (specialp nil :type boolean)
1025   ;; the kind of argument being described. Required args only have arg
1026   ;; info structures if they are special.
1027   (kind (missing-arg)
1028         :type (member :required :optional :keyword :rest
1029                       :more-context :more-count))
1030   ;; If true, this is the VAR for SUPPLIED-P variable of a keyword or
1031   ;; optional arg. This is true for keywords with non-constant
1032   ;; defaults even when there is no user-specified supplied-p var.
1033   (supplied-p nil :type (or lambda-var null))
1034   ;; the default for a keyword or optional, represented as the
1035   ;; original Lisp code. This is set to NIL in &KEY arguments that are
1036   ;; defaulted using the SUPPLIED-P arg.
1037   (default nil :type t)
1038   ;; the actual key for a &KEY argument. Note that in ANSI CL this is
1039   ;; not necessarily a keyword: (DEFUN FOO (&KEY ((BAR BAR))) ...).
1040   (key nil :type symbol))
1041 (defprinter (arg-info :identity t)
1042   (specialp :test specialp)
1043   kind
1044   (supplied-p :test supplied-p)
1045   (default :test default)
1046   (key :test key))
1047
1048 ;;; The LAMBDA-VAR structure represents a lexical lambda variable.
1049 ;;; This structure is also used during IR1 conversion to describe
1050 ;;; lambda arguments which may ultimately turn out not to be simple
1051 ;;; and lexical.
1052 ;;;
1053 ;;; LAMBDA-VARs with no REFs are considered to be deleted; physical
1054 ;;; environment analysis isn't done on these variables, so the back
1055 ;;; end must check for and ignore unreferenced variables. Note that a
1056 ;;; deleted LAMBDA-VAR may have sets; in this case the back end is
1057 ;;; still responsible for propagating the SET-VALUE to the set's CONT.
1058 (def!struct (lambda-var (:include basic-var))
1059   ;; true if this variable has been declared IGNORE
1060   (ignorep nil :type boolean)
1061   ;; the CLAMBDA that this var belongs to. This may be null when we are
1062   ;; building a lambda during IR1 conversion.
1063   (home nil :type (or null clambda))
1064   ;; This is set by physical environment analysis if it chooses an
1065   ;; indirect (value cell) representation for this variable because it
1066   ;; is both set and closed over.
1067   (indirect nil :type boolean)
1068   ;; The following two slots are only meaningful during IR1 conversion
1069   ;; of hairy lambda vars:
1070   ;;
1071   ;; The ARG-INFO structure which holds information obtained from
1072   ;; &keyword parsing.
1073   (arg-info nil :type (or arg-info null))
1074   ;; if true, the GLOBAL-VAR structure for the special variable which
1075   ;; is to be bound to the value of this argument
1076   (specvar nil :type (or global-var null))
1077   ;; Set of the CONSTRAINTs on this variable. Used by constraint
1078   ;; propagation. This is left null by the lambda pre-pass if it
1079   ;; determine that this is a set closure variable, and is thus not a
1080   ;; good subject for flow analysis.
1081   (constraints nil :type (or sset null)))
1082 (defprinter (lambda-var :identity t)
1083   %source-name
1084   (type :test (not (eq type *universal-type*)))
1085   (where-from :test (not (eq where-from :assumed)))
1086   (ignorep :test ignorep)
1087   (arg-info :test arg-info)
1088   (specvar :test specvar))
1089 \f
1090 ;;;; basic node types
1091
1092 ;;; A REF represents a reference to a LEAF. REF-REOPTIMIZE is
1093 ;;; initially (and forever) NIL, since REFs don't receive any values
1094 ;;; and don't have any IR1 optimizer.
1095 (defstruct (ref (:include node (:reoptimize nil))
1096                 (:constructor make-ref (derived-type leaf))
1097                 (:copier nil))
1098   ;; The leaf referenced.
1099   (leaf nil :type leaf))
1100 (defprinter (ref :identity t)
1101   leaf)
1102
1103 ;;; Naturally, the IF node always appears at the end of a block.
1104 ;;; NODE-CONT is a dummy continuation, and is there only to keep
1105 ;;; people happy.
1106 (defstruct (cif (:include node)
1107                 (:conc-name if-)
1108                 (:predicate if-p)
1109                 (:constructor make-if)
1110                 (:copier copy-if))
1111   ;; CONTINUATION for the predicate
1112   (test (missing-arg) :type continuation)
1113   ;; the blocks that we execute next in true and false case,
1114   ;; respectively (may be the same)
1115   (consequent (missing-arg) :type cblock)
1116   (alternative (missing-arg) :type cblock))
1117 (defprinter (cif :conc-name if- :identity t)
1118   (test :prin1 (continuation-use test))
1119   consequent
1120   alternative)
1121
1122 (defstruct (cset (:include node
1123                            (derived-type *universal-type*))
1124                  (:conc-name set-)
1125                  (:predicate set-p)
1126                  (:constructor make-set)
1127                  (:copier copy-set))
1128   ;; descriptor for the variable set
1129   (var (missing-arg) :type basic-var)
1130   ;; continuation for the value form
1131   (value (missing-arg) :type continuation))
1132 (defprinter (cset :conc-name set- :identity t)
1133   var
1134   (value :prin1 (continuation-use value)))
1135
1136 ;;; The BASIC-COMBINATION structure is used to represent both normal
1137 ;;; and multiple value combinations. In a local function call, this
1138 ;;; node appears at the end of its block and the body of the called
1139 ;;; function appears as the successor. The NODE-CONT remains the
1140 ;;; continuation which receives the value of the call.
1141 (defstruct (basic-combination (:include node)
1142                               (:constructor nil)
1143                               (:copier nil))
1144   ;; continuation for the function
1145   (fun (missing-arg) :type continuation)
1146   ;; list of CONTINUATIONs for the args. In a local call, an argument
1147   ;; continuation may be replaced with NIL to indicate that the
1148   ;; corresponding variable is unreferenced, and thus no argument
1149   ;; value need be passed.
1150   (args nil :type list)
1151   ;; the kind of function call being made. :LOCAL means that this is a
1152   ;; local call to a function in the same component, and that argument
1153   ;; syntax checking has been done, etc. Calls to known global
1154   ;; functions are represented by storing the FUNCTION-INFO for the
1155   ;; function in this slot. :FULL is a call to an (as yet) unknown
1156   ;; function. :ERROR is like :FULL, but means that we have discovered
1157   ;; that the call contains an error, and should not be reconsidered
1158   ;; for optimization.
1159   (kind :full :type (or (member :local :full :error) function-info))
1160   ;; some kind of information attached to this node by the back end
1161   (info nil))
1162
1163 ;;; The COMBINATION node represents all normal function calls,
1164 ;;; including FUNCALL. This is distinct from BASIC-COMBINATION so that
1165 ;;; an MV-COMBINATION isn't COMBINATION-P.
1166 (defstruct (combination (:include basic-combination)
1167                         (:constructor make-combination (fun))
1168                         (:copier nil)))
1169 (defprinter (combination :identity t)
1170   (fun :prin1 (continuation-use fun))
1171   (args :prin1 (mapcar (lambda (x)
1172                          (if x
1173                              (continuation-use x)
1174                              "<deleted>"))
1175                        args)))
1176
1177 ;;; An MV-COMBINATION is to MULTIPLE-VALUE-CALL as a COMBINATION is to
1178 ;;; FUNCALL. This is used to implement all the multiple-value
1179 ;;; receiving forms.
1180 (defstruct (mv-combination (:include basic-combination)
1181                            (:constructor make-mv-combination (fun))
1182                            (:copier nil)))
1183 (defprinter (mv-combination)
1184   (fun :prin1 (continuation-use fun))
1185   (args :prin1 (mapcar #'continuation-use args)))
1186
1187 ;;; The BIND node marks the beginning of a lambda body and represents
1188 ;;; the creation and initialization of the variables.
1189 (defstruct (bind (:include node)
1190                  (:copier nil))
1191   ;; the lambda we are binding variables for. Null when we are
1192   ;; creating the LAMBDA during IR1 translation.
1193   (lambda nil :type (or clambda null)))
1194 (defprinter (bind)
1195   lambda)
1196
1197 ;;; The RETURN node marks the end of a lambda body. It collects the
1198 ;;; return values and represents the control transfer on return. This
1199 ;;; is also where we stick information used for TAIL-SET type
1200 ;;; inference.
1201 (defstruct (creturn (:include node)
1202                     (:conc-name return-)
1203                     (:predicate return-p)
1204                     (:constructor make-return)
1205                     (:copier copy-return))
1206   ;; the lambda we are returning from. Null temporarily during
1207   ;; ir1tran.
1208   (lambda nil :type (or clambda null))
1209   ;; the continuation which yields the value of the lambda
1210   (result (missing-arg) :type continuation)
1211   ;; the union of the node-derived-type of all uses of the result
1212   ;; other than by a local call, intersected with the result's
1213   ;; asserted-type. If there are no non-call uses, this is
1214   ;; *EMPTY-TYPE*
1215   (result-type *wild-type* :type ctype))
1216 (defprinter (creturn :conc-name return- :identity t)
1217   lambda
1218   result-type)
1219 \f
1220 ;;;; non-local exit support
1221 ;;;;
1222 ;;;; In IR1, we insert special nodes to mark potentially non-local
1223 ;;;; lexical exits.
1224
1225 ;;; The ENTRY node serves to mark the start of the dynamic extent of a
1226 ;;; lexical exit. It is the mess-up node for the corresponding :Entry
1227 ;;; cleanup.
1228 (defstruct (entry (:include node)
1229                   (:copier nil))
1230   ;; All of the Exit nodes for potential non-local exits to this point.
1231   (exits nil :type list)
1232   ;; The cleanup for this entry. NULL only temporarily.
1233   (cleanup nil :type (or cleanup null)))
1234 (defprinter (entry :identity t))
1235
1236 ;;; The EXIT node marks the place at which exit code would be emitted,
1237 ;;; if necessary. This is interposed between the uses of the exit
1238 ;;; continuation and the exit continuation's DEST. Instead of using
1239 ;;; the returned value being delivered directly to the exit
1240 ;;; continuation, it is delivered to our VALUE continuation. The
1241 ;;; original exit continuation is the exit node's CONT.
1242 (defstruct (exit (:include node)
1243                  (:copier nil))
1244   ;; the ENTRY node that this is an exit for. If null, this is a
1245   ;; degenerate exit. A degenerate exit is used to "fill" an empty
1246   ;; block (which isn't allowed in IR1.) In a degenerate exit, Value
1247   ;; is always also null.
1248   (entry nil :type (or entry null))
1249   ;; the continuation yielding the value we are to exit with. If NIL,
1250   ;; then no value is desired (as in GO).
1251   (value nil :type (or continuation null)))
1252 (defprinter (exit :identity t)
1253   (entry :test entry)
1254   (value :test value))
1255 \f
1256 ;;;; miscellaneous IR1 structures
1257
1258 (defstruct (undefined-warning
1259             #-no-ansi-print-object
1260             (:print-object (lambda (x s)
1261                              (print-unreadable-object (x s :type t)
1262                                (prin1 (undefined-warning-name x) s))))
1263             (:copier nil))
1264   ;; the name of the unknown thing
1265   (name nil :type (or symbol list))
1266   ;; the kind of reference to NAME
1267   (kind (missing-arg) :type (member :function :type :variable))
1268   ;; the number of times this thing was used
1269   (count 0 :type unsigned-byte)
1270   ;; a list of COMPILER-ERROR-CONTEXT structures describing places
1271   ;; where this thing was used. Note that we only record the first
1272   ;; *UNDEFINED-WARNING-LIMIT* calls.
1273   (warnings () :type list))
1274 \f
1275 ;;; a helper for the POLICY macro, defined late here so that the
1276 ;;; various type tests can be inlined
1277 (declaim (ftype (function ((or list lexenv node functional)) list)
1278                 %coerce-to-policy))
1279 (defun %coerce-to-policy (thing)
1280   (let ((result (etypecase thing
1281                   (list thing)
1282                   (lexenv (lexenv-policy thing))
1283                   (node (lexenv-policy (node-lexenv thing)))
1284                   (functional (lexenv-policy (functional-lexenv thing))))))
1285     ;; Test the first element of the list as a rudimentary sanity
1286     ;; that it really does look like a valid policy.
1287     (aver (or (null result) (policy-quality-name-p (caar result))))
1288     ;; Voila.
1289     result))
1290 \f
1291 ;;;; Freeze some structure types to speed type testing.
1292
1293 #!-sb-fluid
1294 (declaim (freeze-type node leaf lexenv continuation cblock component cleanup
1295                       physenv tail-set nlx-info))