ghc/compiler/simplCore/OccurAnal.lhs

   1 %
   2 % (c) The GRASP/AQUA Project, Glasgow University, 1992-1998
   3 %
   4 %************************************************************************
   5 %*                                                                      *
   6 \section[OccurAnal]{Occurrence analysis pass}
   7 %*                                                                      *
   8 %************************************************************************
   9
   10 The occurrence analyser traverses a core expression, returning a new
  11 core expression with (hopefully) improved usage information.
  12
  13 \begin{code}
  14 module OccurAnal (
  15         occurAnalyseBinds, occurAnalyseGlobalExpr, occurAnalyseRule
  16     ) where
  17
  18 #include "HsVersions.h"
  19
  20 import CoreSyn
  21 import CoreFVs          ( idRuleVars )
  22 import CoreUtils        ( exprIsTrivial )
  23 import Id               ( isDataConId, isOneShotLambda, setOneShotLambda,
  24                           idOccInfo, setIdOccInfo,
  25                           isExportedId, modifyIdInfo, idInfo, idArity,
  26                           idSpecialisation, isLocalId,
  27                           idType, idUnique, Id
  28                         )
  29 import IdInfo           ( copyIdInfo )
  30 import BasicTypes       ( OccInfo(..), isOneOcc )
  31
  32 import VarSet
  33 import VarEnv
  34
  35 import Type             ( isFunTy, dropForAlls )
  36 import Maybes           ( orElse )
  37 import Digraph          ( stronglyConnCompR, SCC(..) )
  38 import PrelNames        ( buildIdKey, foldrIdKey, runSTRepIdKey, augmentIdKey )
  39 import Unique           ( Unique )
  40 import UniqFM           ( keysUFM )
  41 import Util             ( zipWithEqual, mapAndUnzip )
  42 import Outputable
  43 \end{code}
  44
  45
  46 %************************************************************************
  47 %*                                                                      *
  48 \subsection[OccurAnal-main]{Counting occurrences: main function}
  49 %*                                                                      *
  50 %************************************************************************
  51
  52 Here's the externally-callable interface:
  53
  54 \begin{code}
  55 occurAnalyseGlobalExpr :: CoreExpr -> CoreExpr
  56 occurAnalyseGlobalExpr expr
  57   =     -- Top level expr, so no interesting free vars, and
  58         -- discard occurence info returned
  59     snd (occAnal (initOccEnv emptyVarSet) expr)
  60
  61 occurAnalyseRule :: CoreRule -> CoreRule
  62 occurAnalyseRule rule@(BuiltinRule _ _) = rule
  63 occurAnalyseRule (Rule str act tpl_vars tpl_args rhs)
  64                 -- Add occ info to tpl_vars, rhs
  65   = Rule str act tpl_vars' tpl_args rhs'
  66   where
  67     (rhs_uds, rhs') = occAnal (initOccEnv (mkVarSet tpl_vars)) rhs
  68     (_, tpl_vars')  = tagBinders rhs_uds tpl_vars
  69 \end{code}
  70
  71
  72 %************************************************************************
  73 %*                                                                      *
  74 \subsection{Top level stuff}
  75 %*                                                                      *
  76 %************************************************************************
  77
   78 In @occurAnalyseBinds@ we do indirection-shorting.  That is, if we have this:
   79
   80         x_local = <expression>
   81         ...
   82         x_exported = x_local
   83
   84 where x_exported is exported, and x_local is not, then we replace it with this:
  85
  86         x_local = x_exported
  87         x_exported = <expression>
  88         ...
  89
  90 Without this we never get rid of the x_exported = x_local thing.  This
   91 saves a gratuitous jump (from \tr{x_exported} to \tr{x_local}), and
  92 makes strictness information propagate better.  This used to happen in
  93 the final phase, but it's tidier to do it here.
  94
  95 If more than one exported thing is equal to a local thing (i.e., the
  96 local thing really is shared), then we do one only:
  97 \begin{verbatim}
  98         x_local = ....
  99         x_exported1 = x_local
 100         x_exported2 = x_local
 101 ==>
 102         x_exported1 = ....
 103
 104         x_exported2 = x_exported1
 105 \end{verbatim}
 106
 107 We rely on prior eta reduction to simplify things like
 108 \begin{verbatim}
 109         x_exported = /\ tyvars -> x_local tyvars
 110 ==>
 111         x_exported = x_local
 112 \end{verbatim}
  113 Hence, there's a possibility of leaving unchanged something like this:
 114 \begin{verbatim}
 115         x_local = ....
 116         x_exported1 = x_local Int
 117 \end{verbatim}
 118 By the time we've thrown away the types in STG land this
 119 could be eliminated.  But I don't think it's very common
 120 and it's dangerous to do this fiddling in STG land
  121 because we might eliminate a binding that's mentioned in the
 122 unfolding for something.
 123
 124 \begin{code}
  125 occurAnalyseBinds :: [CoreBind] -> [CoreBind]
  126 -- Occurrence-analyse a list of bindings, eliminating indirections on the way
  127 occurAnalyseBinds binds
  128   = binds'
  129   where
  130     (_, _, binds') = go (initOccEnv emptyVarSet) binds
  131
  132     go :: OccEnv -> [CoreBind]
  133        -> (UsageDetails,        -- Occurrence info
  134            IdEnv Id,            -- Indirection elimination info
  135                                 --   Maps local-id -> exported-id, but it embodies
  136                                 --   bindings of the form exported-id = local-id in
  137                                 --   the argument to go
  138            [CoreBind])          -- Occ-analysed bindings, less the exported-id=local-id ones
  139
  140     go env [] = (emptyDetails, emptyVarEnv, [])
  141         -- The tail's results (scope_usage, ind_env) are needed to process the head binding
  142     go env (bind : binds)
  143       = let
  144             new_env                        = env `addNewCands` (bindersOf bind)
  145             (scope_usage, ind_env, binds') = go new_env binds
  146             (final_usage, new_binds)       = occAnalBind env (zapBind ind_env bind) scope_usage
  147                                                 -- NB: I zap before occur-analysing, so
  148                                                 -- I don't need to worry about getting the
  149                                                 -- occ info on the new bindings right.
  150         in
  151         case bind of
  152             NonRec exported_id (Var local_id)
  153                 | shortMeOut ind_env exported_id local_id
  154                 -- Special case for eliminating indirections: the binding is dropped
  155                 --   and recorded in ind_env instead.
  156                 --   Note: it's a shortcoming that this only works for
  157                 --         non-recursive bindings.  Eliminating indirections
  158                 --         makes perfect sense for recursive bindings too, but it's harder
  159                 -> (scope_usage, ind_env', binds')
  160                 where
  161                    ind_env' = extendVarEnv ind_env local_id exported_id
  162
  163             other ->    -- Ho ho! The normal case
  164                      (final_usage, ind_env, new_binds ++ binds')
 165
 166
 167 -- Deal with any indirections
 168 zapBind ind_env (NonRec bndr rhs)
 169   | bndr `elemVarEnv` ind_env                      = Rec (zap ind_env (bndr,rhs))
 170                 -- The Rec isn't strictly necessary, but it's convenient
 171 zapBind ind_env (Rec pairs)
 172   | or [id `elemVarEnv` ind_env | (id,_) <- pairs] = Rec (concat (map (zap ind_env) pairs))
 173
 174 zapBind ind_env bind = bind
 175
 176 zap ind_env pair@(local_id,rhs)
 177   = case lookupVarEnv ind_env local_id of
 178         Nothing          -> [pair]
 179         Just exported_id -> [(local_id, Var exported_id),
 180                              (exported_id', rhs)]
 181                          where
 182                             exported_id' = modifyIdInfo (copyIdInfo (idInfo local_id)) exported_id
 183
 184 shortMeOut ind_env exported_id local_id
 185 -- The if-then-else stuff is just so I can get a pprTrace to see
 186 -- how often I don't get shorting out becuase of IdInfo stuff
 187   = if isExportedId exported_id &&              -- Only if this is exported
 188
 189        isLocalId local_id &&                    -- Only if this one is defined in this
 190                                                 --      module, so that we *can* change its
 191                                                 --      binding to be the exported thing!
 192
 193        not (isExportedId local_id) &&           -- Only if this one is not itself exported,
 194                                                 --      since the transformation will nuke it
 195
 196        not (local_id `elemVarEnv` ind_env)      -- Only if not already substituted for
 197     then
 198         True
 199
 200 {- No longer needed
 201         if shortableIdInfo (idInfo exported_id)         -- Only if its IdInfo is 'shortable'
 202                                                         -- (see the defn of IdInfo.shortableIdInfo)
 203         then True
 204         else
 205 #ifdef DEBUG
 206           pprTrace "shortMeOut:" (ppr exported_id)
 207 #endif
 208                                                 False
 209 -}
 210     else
 211         False
 212 \end{code}
 213
 214
 215 %************************************************************************
 216 %*                                                                      *
  217 \subsection[OccurAnal-bindings]{Counting occurrences: bindings and expressions}
 218 %*                                                                      *
 219 %************************************************************************
 220
 221 Bindings
 222 ~~~~~~~~
 223
 224 \begin{code}
  225 type IdWithOccInfo = Id                 -- An Id after tagging by tagBinder/tagBinders
  226
  227 type Node details = (details, Unique, [Unique]) -- Graph node for stronglyConnCompR: payload, the
  228                                                 -- binder's Unique, Uniques of the things it mentions
  229 type Details1     = (Id, UsageDetails, CoreExpr)        -- Binder, usage of its RHS, analysed RHS
  230 type Details2     = (IdWithOccInfo, CoreExpr)           -- Tagged binder, analysed RHS
 231
 232
 233 occAnalBind :: OccEnv
 234             -> CoreBind
 235             -> UsageDetails             -- Usage details of scope
 236             -> (UsageDetails,           -- Of the whole let(rec)
 237                 [CoreBind])
 238
 239 occAnalBind env (NonRec binder rhs) body_usage
 240   | not (binder `usedIn` body_usage)            -- It's not mentioned
 241   = (body_usage, [])
 242
 243   | otherwise                   -- It's mentioned in the body
 244   = (final_body_usage `combineUsageDetails` rhs_usage,
 245      [NonRec tagged_binder rhs'])
 246
 247   where
 248     (final_body_usage, tagged_binder) = tagBinder body_usage binder
 249     (rhs_usage, rhs')                 = occAnalRhs env binder rhs
 250 \end{code}
 251
 252 Dropping dead code for recursive bindings is done in a very simple way:
 253
 254         the entire set of bindings is dropped if none of its binders are
 255         mentioned in its body; otherwise none are.
 256
 257 This seems to miss an obvious improvement.
 258 @
 259         letrec  f = ...g...
 260                 g = ...f...
 261         in
 262         ...g...
 263
 264 ===>
 265
 266         letrec f = ...g...
 267                g = ...(...g...)...
 268         in
 269         ...g...
 270 @
 271
 272 Now @f@ is unused. But dependency analysis will sort this out into a
 273 @letrec@ for @g@ and a @let@ for @f@, and then @f@ will get dropped.
 274 It isn't easy to do a perfect job in one blow.  Consider
 275
 276 @
 277         letrec f = ...g...
 278                g = ...h...
 279                h = ...k...
 280                k = ...m...
 281                m = ...m...
 282         in
 283         ...m...
 284 @
 285
 286
 287 \begin{code}
  288 occAnalBind env (Rec pairs) body_usage
  289   = foldr (_scc_ "occAnalBind.dofinal" do_final_bind) (body_usage, []) sccs
  290   where
  291     binders = map fst pairs
  292     rhs_env = env `addNewCands` binders
  293         -- Every RHS is analysed in rhs_env, i.e. env extended with all the group's binders
  294     analysed_pairs :: [Details1]
  295     analysed_pairs  = [ (bndr, rhs_usage, rhs')
  296                       | (bndr, rhs) <- pairs,
  297                         let (rhs_usage, rhs') = occAnalRhs rhs_env bndr rhs
  298                       ]
  299         -- The foldr above feeds each SCC the usage accumulated from the SCCs after it
  300     sccs :: [SCC (Node Details1)]
  301     sccs = _scc_ "occAnalBind.scc" stronglyConnCompR edges
  302
  303
  304     ---- stuff for dependency analysis of binds -------------------------------
  305     edges :: [Node Details1]
  306     edges = _scc_ "occAnalBind.assoc"
  307             [ (details, idUnique id, edges_from rhs_usage)
  308             | details@(id, rhs_usage, rhs) <- analysed_pairs
  309             ]
  310
  311         -- (a -> b) means a mentions b
  312         -- Given the usage details (a UFM that gives occ info for each free var of
  313         -- the RHS) we can get the list of free vars -- or rather their Unique keys --
  314         -- by just extracting the keys from the finite map.  Grimy, but fast.
  315         -- Previously we had this:
  316         --      [ bndr | bndr <- bndrs,
  317         --               maybeToBool (lookupVarEnv rhs_usage bndr)]
  318         -- which has n**2 cost, and this meant that edges_from alone
  319         -- consumed 10% of total runtime!
  320     edges_from :: UsageDetails -> [Unique]
  321     edges_from rhs_usage = _scc_ "occAnalBind.edges_from"
  322                            keysUFM rhs_usage
  323
  324     ---- stuff to "re-constitute" bindings from dependency-analysis info ------
  325
  326         -- Non-recursive SCC: becomes a NonRec binding, or is dropped if unused
  327     do_final_bind (AcyclicSCC ((bndr, rhs_usage, rhs'), _, _)) (body_usage, binds_so_far)
  328       | not (bndr `usedIn` body_usage)
  329       = (body_usage, binds_so_far)                      -- Dead code
  330       | otherwise
  331       = (combined_usage, new_bind : binds_so_far)
  332       where
  333         total_usage                   = combineUsageDetails body_usage rhs_usage
  334         (combined_usage, tagged_bndr) = tagBinder total_usage bndr
  335         new_bind                      = NonRec tagged_bndr rhs'
  336
  337         -- Recursive SCC: becomes a Rec binding (ordered by reOrderRec), or is dropped
  338     do_final_bind (CyclicSCC cycle) (body_usage, binds_so_far)
  339       | not (any (`usedIn` body_usage) bndrs)           -- NB: look at body_usage, not total_usage
  340       = (body_usage, binds_so_far)                      -- Dead code
  341       | otherwise
  342       = (combined_usage, final_bind:binds_so_far)
  343       where
  344         details                        = [details   | (details, _, _) <- cycle]
  345         bndrs                          = [bndr      | (bndr, _, _)      <- details]
  346         rhs_usages                     = [rhs_usage | (_, rhs_usage, _) <- details]
  347         total_usage                    = foldr combineUsageDetails body_usage rhs_usages
  348         (combined_usage, tagged_bndrs) = tagBinders total_usage bndrs
  349         final_bind                     = Rec (reOrderRec env new_cycle)
  350                 -- Pair each tagged binder with its analysed RHS, keeping the graph keys
  351         new_cycle = CyclicSCC (zipWithEqual "occAnalBind" mk_new_bind tagged_bndrs cycle)
  352         mk_new_bind tagged_bndr ((_, _, rhs'), key, keys) = ((tagged_bndr, rhs'), key, keys)
 353 \end{code}
 354
 355 @reOrderRec@ is applied to the list of (binder,rhs) pairs for a cyclic
 356 strongly connected component (there's guaranteed to be a cycle).  It returns the
 357 same pairs, but
 358         a) in a better order,
 359         b) with some of the Ids having a IMustNotBeINLINEd pragma
 360
 361 The "no-inline" Ids are sufficient to break all cycles in the SCC.  This means
 362 that the simplifier can guarantee not to loop provided it never records an inlining
 363 for these no-inline guys.
 364
 365 Furthermore, the order of the binds is such that if we neglect dependencies
 366 on the no-inline Ids then the binds are topologically sorted.  This means
  367 that the simplifier will generally do a good job if it works from top to bottom,
 368 recording inlinings for any Ids which aren't marked as "no-inline" as it goes.
 369
 370 ==============
 371 [June 98: I don't understand the following paragraphs, and I've
 372           changed the a=b case again so that it isn't a special case any more.]
 373
 374 Here's a case that bit me:
 375
 376         letrec
 377                 a = b
 378                 b = \x. BIG
 379         in
 380         ...a...a...a....
 381
 382 Re-ordering doesn't change the order of bindings, but there was no loop-breaker.
 383
 384 My solution was to make a=b bindings record b as Many, rather like INLINE bindings.
 385 Perhaps something cleverer would suffice.
 386 ===============
 387
 388 You might think that you can prevent non-termination simply by making
 389 sure that we simplify a recursive binding's RHS in an environment that
 390 simply clones the recursive Id.  But no.  Consider
 391
 392                 letrec f = \x -> let z = f x' in ...
 393
 394                 in
 395                 let n = f y
 396                 in
 397                 case n of { ... }
 398
 399 We bind n to its *simplified* RHS, we then *re-simplify* it when
 400 we inline n.  Then we may well inline f; and then the same thing
 401 happens with z!
 402
 403 I don't think it's possible to prevent non-termination by environment
 404 manipulation in this way.  Apart from anything else, successive
 405 iterations of the simplifier may unroll recursive loops in cases like
  406 that above.  The idea of breaking every recursive loop with an
 407 IMustNotBeINLINEd pragma is much much better.
 408
 409
 410 \begin{code}
  411 reOrderRec
  412         :: OccEnv
  413         -> SCC (Node Details2)
  414         -> [Details2]
  415                         -- Sorted into a plausible order.  Enough of the Ids have
  416                         --      dontINLINE pragmas that there are no loops left.
  417
  418         -- Non-recursive case
  419 reOrderRec env (AcyclicSCC (bind, _, _)) = [bind]
  420
  421         -- Common case of simple self-recursion: the sole binder is the loop breaker
  422 reOrderRec env (CyclicSCC [bind])
  423   = [(setIdOccInfo tagged_bndr IAmALoopBreaker, rhs)]
  424   where
  425     ((tagged_bndr, rhs), _, _) = bind
  426         -- General case: a cycle of several bindings
  427 reOrderRec env (CyclicSCC (bind : binds))
  428   =     -- Choose a loop breaker, mark it no-inline,
  429         -- do SCC analysis on the rest, and recursively sort them out
  430     concat (map (reOrderRec env) (stronglyConnCompR unchosen))
  431     ++
  432     [(setIdOccInfo tagged_bndr IAmALoopBreaker, rhs)]
  433         -- NB: the chosen loop breaker comes last in the result
  434   where
  435     (chosen_pair, unchosen) = choose_loop_breaker bind (score bind) [] binds
  436     (tagged_bndr, rhs)      = chosen_pair
  437
  438         -- This loop looks for the bind with the lowest score
  439         -- to pick as the loop  breaker.  The rest accumulate in acc.
  440     choose_loop_breaker (details,_,_) loop_sc acc []
  441         = (details, acc)        -- Done
  442
  443     choose_loop_breaker loop_bind loop_sc acc (bind : binds)
  444         | sc < loop_sc  -- Lower score so pick this new one
  445         = choose_loop_breaker bind sc (loop_bind : acc) binds
  446
  447         | otherwise     -- No lower so don't pick it (on a tie the earlier bind is kept)
  448         = choose_loop_breaker loop_bind loop_sc (bind : acc) binds
  449         where
  450           sc = score bind
  451
  452     score :: Node Details2 -> Int       -- Higher score => less likely to be picked as loop breaker
  453     score ((bndr, rhs), _, _)
  454         | exprIsTrivial rhs        = 4  -- Practically certain to be inlined
  455                 -- Used to have also: && not (isExportedId bndr)
  456                 -- But I found this sometimes cost an extra iteration when we have
  457                 --      rec { d = (a,b); a = ...df...; b = ...df...; df = d }
  458                 -- where df is the exported dictionary. Then df makes a really
  459                 -- bad choice for loop breaker
  460
  461         | not_fun_ty (idType bndr) = 3  -- Data types help with cases
  462                 -- This used to have a lower score than inlineCandidate, but
  463                 -- it's *really* helpful if dictionaries get inlined fast,
  464                 -- so I'm experimenting with giving higher priority to data-typed things
  465
  466         | inlineCandidate bndr rhs = 2  -- Likely to be inlined
  467
  468         | not (isEmptyCoreRules (idSpecialisation bndr)) = 1
  469                 -- Avoid things with specialisations; we'd like
  470                 -- to take advantage of them in the subsequent bindings
  471
  472         | otherwise = 0
  473         -- An InlineMe-annotated RHS, or a binder whose occurrence info is isOneOcc
  474     inlineCandidate :: Id -> CoreExpr -> Bool
  475     inlineCandidate id (Note InlineMe _) = True
  476     inlineCandidate id rhs               = isOneOcc (idOccInfo id)
  477
  478         -- Real example (the Enum Ordering instance from PrelBase):
  479         --      rec     f = \ x -> case d of (p,q,r) -> p x
  480         --              g = \ x -> case d of (p,q,r) -> q x
  481         --              d = (v, f, g)
  482         --
  483         -- Here, f and g occur just once; but we can't inline them into d.
  484         -- On the other hand we *could* simplify those case expressions if
  485         -- we didn't stupidly choose d as the loop breaker.
  486         -- But we won't because constructor args are marked "Many".
  487         -- not_fun_ty: after dropping any foralls, the type is not a function type
  488     not_fun_ty ty = not (isFunTy (dropForAlls ty))
 489 \end{code}
 490
 491 @occAnalRhs@ deals with the question of bindings where the Id is marked
 492 by an INLINE pragma.  For these we record that anything which occurs
  493 in its RHS occurs many times.  This pessimistically assumes that the
 494 inlined binder also occurs many times in its scope, but if it doesn't
 495 we'll catch it next time round.  At worst this costs an extra simplifier pass.
 496 ToDo: try using the occurrence info for the inline'd binder.
 497
 498 [March 97] We do the same for atomic RHSs.  Reason: see notes with reOrderRec.
 499 [June 98, SLPJ]  I've undone this change; I don't understand it.  See notes with reOrderRec.
 500
 501
 502 \begin{code}
  503 occAnalRhs :: OccEnv
  504            -> Id -> CoreExpr    -- Binder and rhs
  505            -> (UsageDetails, CoreExpr)
  506 -- Analyse a binding's RHS, then add an occurrence for each of the binder's idRuleVars
  507 occAnalRhs env id rhs
  508   = (final_usage, rhs')
  509   where
  510     (rhs_usage, rhs') = occAnal (rhsCtxt env) rhs
  511         -- Note that we use an rhsCtxt.  This tells the occ anal that it's
  512         -- looking at an RHS, which has an effect in occAnalApp
  513         --
  514         -- But there's a problem.  Consider
  515         --      x1 = a0 : []
  516         --      x2 = a1 : x1
  517         --      x3 = a2 : x2
  518         --      g  = f x2
  519         -- First time round, it looks as if x1 and x2 occur as an arg of a
  520         -- let-bound constructor ==> give them a many-occurrence.
  521         -- But then x3 is inlined (unconditionally as it happens) and
  522         -- next time round, x2 will be, and the next time round x1 will be
  523         -- Result: multiple simplifier iterations.  Sigh.
  524         -- Possible solution: use rhsCtxt for things that occur just once...
  525
  526         -- [March 98] A new wrinkle is that if the binder has specialisations inside
  527         -- it then we count the specialised Ids as "extra rhs's".  That way
  528         -- the "parent" keeps the specialised "children" alive.  If the parent
  529         -- dies (because it isn't referenced any more), then the children will
  530         -- die too unless they are already referenced directly.
  531
  532     final_usage = foldVarSet add rhs_usage (idRuleVars id)
  533     add v u = addOneOcc u v NoOccInfo           -- Give a non-committal binder info
  534                                                 -- (i.e manyOcc) because many copies
  535                                                 -- of the specialised thing can appear
 536 \end{code}
 537
 538 Expressions
 539 ~~~~~~~~~~~
 540 \begin{code}
 541 occAnal :: OccEnv
 542         -> CoreExpr
 543         -> (UsageDetails,       -- Gives info only about the "interesting" Ids
 544             CoreExpr)
 545
 546 occAnal env (Type t)  = (emptyDetails, Type t)
 547
 548 occAnal env (Var v)
 549   = (var_uds, Var v)
 550   where
 551     var_uds | isCandidate env v = unitVarEnv v oneOcc
 552             | otherwise         = emptyDetails
 553
 554     -- At one stage, I gathered the idRuleVars for v here too,
 555     -- which in a way is the right thing to do.
 556     -- But that went wrong right after specialisation, when
 557     -- the *occurrences* of the overloaded function didn't have any
 558     -- rules in them, so the *specialised* versions looked as if they
 559     -- weren't used at all.
 560
 561 \end{code}
 562
 563 We regard variables that occur as constructor arguments as "dangerousToDup":
 564
 565 \begin{verbatim}
 566 module A where
 567 f x = let y = expensive x in
 568       let z = (True,y) in
 569       (case z of {(p,q)->q}, case z of {(p,q)->q})
 570 \end{verbatim}
 571
 572 We feel free to duplicate the WHNF (True,y), but that means
 573 that y may be duplicated thereby.
 574
 575 If we aren't careful we duplicate the (expensive x) call!
 576 Constructors are rather like lambdas in this way.
 577
 578 \begin{code}
 579 occAnal env expr@(Lit lit) = (emptyDetails, expr)
 580 \end{code}
 581
 582 \begin{code}
 583 occAnal env (Note InlineMe body)
 584   = case occAnal env body of { (usage, body') ->
 585     (mapVarEnv markMany usage, Note InlineMe body')
 586     }
 587
 588 occAnal env (Note note@(SCC cc) body)
 589   = case occAnal env body of { (usage, body') ->
 590     (mapVarEnv markInsideSCC usage, Note note body')
 591     }
 592
 593 occAnal env (Note note body)
 594   = case occAnal env body of { (usage, body') ->
 595     (usage, Note note body')
 596     }
 597 \end{code}
 598
 599 \begin{code}
 600 occAnal env app@(App fun arg)
 601   = occAnalApp env (collectArgs app) False
 602
 603 -- Ignore type variables altogether
 604 --   (a) occurrences inside type lambdas only not marked as InsideLam
 605 --   (b) type variables not in environment
 606
 607 occAnal env expr@(Lam x body) | isTyVar x
 608   = case occAnal env body of { (body_usage, body') ->
 609     (body_usage, Lam x body')
 610     }
 611
  612 -- For value lambdas we do a special hack.  Consider
  613 --      (\x. \y. ...x...)
  614 -- If we did nothing, x is used inside the \y, so would be marked
  615 -- as dangerous to dup.  But in the common case where the abstraction
  616 -- is applied to two arguments this is over-pessimistic.
  617 -- So instead, we just mark each binder with its occurrence
  618 -- info in the *body* of the multiple lambda.
  619 -- Then, the simplifier is careful when partially applying lambdas.
  620
  621 occAnal env expr@(Lam _ _)
  622   = case occAnal env_body body of { (body_usage, body') ->
  623     let
  624         (final_usage, tagged_binders) = tagBinders body_usage binders
  625         --      URGH!  Sept 99: we don't seem to be able to use binders' here, because
  626         --      we get linear-typed things in the resulting program that we can't handle yet.
  627         --      (e.g. PrelShow)  TODO
  628         --      (binders' is presumably the third result of oneShotGroup, ignored below)
  629         really_final_usage = if linear then
  630                                 final_usage
  631                              else
  632                                 mapVarEnv markInsideLam final_usage
  633     in
  634     (really_final_usage,
  635      mkLams tagged_binders body') }
  636   where
  637     (binders, body)   = collectBinders expr     -- All the leading lambda binders at once
  638     (linear, env1, _) = oneShotGroup env binders
  639     env2              = env1 `addNewCands` binders      -- Add in-scope binders
  640     env_body          = vanillaCtxt env2                -- Body is (no longer) an RhsContext
 641
  642 occAnal env (Case scrut bndr alts)
  643   = case mapAndUnzip (occAnalAlt alt_env bndr) alts of { (alts_usage_s, alts')   ->
  644     case occAnal (vanillaCtxt env) scrut                    of { (scrut_usage, scrut') ->
  645         -- No need for rhsCtxt
  646     let
  647         alts_usage  = foldr1 combineAltsUsageDetails alts_usage_s
  648         alts_usage' = addCaseBndrUsage alts_usage
  649         (alts_usage1, tagged_bndr) = tagBinder alts_usage' bndr
  650         total_usage = scrut_usage `combineUsageDetails` alts_usage1
  651     in
  652     total_usage `seq` (total_usage, Case scrut' tagged_bndr alts') }}
  653   where
  654     alt_env = env `addNewCand` bndr
  655         -- NOTE(review): the foldr1 above assumes alts is non-empty -- confirm
  656         -- The case binder gets a usage of either "many" or "dead", never "one".
  657         -- Reason: we like to inline single occurrences, to eliminate a binding,
  658         -- but inlining a case binder *doesn't* eliminate a binding.
  659         -- We *don't* want to transform
  660         --      case x of w { (p,q) -> f w }
  661         -- into
  662         --      case x of w { (p,q) -> f (p,q) }
  663     addCaseBndrUsage usage = case lookupVarEnv usage bndr of
  664                                 Nothing  -> usage
  665                                 Just occ -> extendVarEnv usage bndr (markMany occ)
 666
 667 occAnal env (Let bind body)
 668   = case occAnal new_env body            of { (body_usage, body') ->
 669     case occAnalBind env bind body_usage of { (final_usage, new_binds) ->
 670        (final_usage, mkLets new_binds body') }}
 671   where
 672     new_env = env `addNewCands` (bindersOf bind)
 673
 674 occAnalArgs env args
 675   = case mapAndUnzip (occAnal arg_env) args of  { (arg_uds_s, args') ->
 676     (foldr combineUsageDetails emptyDetails arg_uds_s, args')}
 677   where
 678     arg_env = vanillaCtxt env
 679 \end{code}
 680
 681 Applications are dealt with specially because we want
 682 the "build hack" to work.
 683
 684 \begin{code}
  685 -- Hack for build, augment, foldr, runSTRep (see args_stuff); NB: is_rhs is not used in either clause
  686 occAnalApp env (Var fun, args) is_rhs
  687   = case args_stuff of { (args_uds, args') ->
  688     let
  689         -- We mark the free vars of the argument of a constructor or PAP
  690         -- as "many", if it is the RHS of a let(rec).
  691         -- This means that nothing gets inlined into a constructor argument
  692         -- position, which is what we want.  Typically those constructor
  693         -- arguments are just variables, or trivial expressions.
  694         --
  695         -- This is the *whole point* of the isRhsEnv predicate
  696         final_args_uds
  697                 | isRhsEnv env,
  698                   isDataConId fun || valArgCount args < idArity fun
  699                 = mapVarEnv markMany args_uds
  700                 | otherwise = args_uds
  701     in
  702     (fun_uds `combineUsageDetails` final_args_uds, mkApps (Var fun) args') }
  703   where
  704     fun_uniq = idUnique fun
  705         -- The function itself counts as one occurrence if it is a candidate
  706     fun_uds | isCandidate env fun = unitVarEnv fun oneOcc
  707             | otherwise           = emptyDetails
  708         -- For the known functions below, one particular argument gets a special context
  709     args_stuff  | fun_uniq == buildIdKey    = appSpecial env 2 [True,True]  args
  710                 | fun_uniq == augmentIdKey  = appSpecial env 2 [True,True]  args
  711                 | fun_uniq == foldrIdKey    = appSpecial env 3 [False,True] args
  712                 | fun_uniq == runSTRepIdKey = appSpecial env 2 [True]       args
  713                         -- (foldr k z xs) may call k many times, but it never
  714                         -- shares a partial application of k; hence [False,True]
  715                         -- This means we can optimise
  716                         --      foldr (\x -> let v = ...x... in \y -> ...v...) z xs
  717                         -- by floating in the v
  718
  719                 | otherwise = occAnalArgs env args
  720
  721         -- General case: the function part is not a variable
  722 occAnalApp env (fun, args) is_rhs
  723   = case occAnal (addAppCtxt env args) fun of   { (fun_uds, fun') ->
  724         -- The addAppCtxt is a bit cunning.  One iteration of the simplifier
  725         -- often leaves behind beta redexs like
  726         --      (\x y -> e) a1 a2
  727         -- Here we would like to mark x,y as one-shot, and treat the whole
  728         -- thing much like a let.  We do this by pushing some True items
  729         -- onto the context stack.
  730
  731     case occAnalArgs env args of        { (args_uds, args') ->
  732     let
  733         final_uds = fun_uds `combineUsageDetails` args_uds
  734     in
  735     (final_uds, mkApps fun' args') }}
 736
 737 appSpecial :: OccEnv
 738            -> Int -> CtxtTy     -- Argument number, and context to use for it
 739            -> [CoreExpr]
 740            -> (UsageDetails, [CoreExpr])
             -- Analyse an argument list in which the n'th element (counting
             -- from 1, and counting every element of the list) is analysed
             -- with the supplied linearity context instead of an empty one.
             -- Returns the combined usage of all arguments together with the
             -- analysed arguments, in their original order.
 741 appSpecial env n ctxt args
 742   = go n args
 743   where
             -- Arguments up to and including the magic one are analysed in a
             -- vanilla (non-RHS) environment with an empty linearity context.
 744     arg_env = vanillaCtxt env
 745
 746     go n [] = (emptyDetails, [])        -- Too few args
 747
 748     go 1 (arg:args)                     -- The magic arg
             -- The magic argument gets 'ctxt'; everything after it is handed
             -- to the ordinary occAnalArgs with the original environment.
 749       = case occAnal (setCtxt arg_env ctxt) arg of      { (arg_uds, arg') ->
 750         case occAnalArgs env args of                    { (args_uds, args') ->
 751         (combineUsageDetails arg_uds args_uds, arg':args') }}
 752
 753     go n (arg:args)
             -- Not there yet: analyse this argument plainly and count down.
 754       = case occAnal arg_env arg of     { (arg_uds, arg') ->
 755         case go (n-1) args of           { (args_uds, args') ->
 756         (combineUsageDetails arg_uds args_uds, arg':args') }}
 757 \end{code}
 758
 759
 760 Case alternatives
 761 ~~~~~~~~~~~~~~~~~
 762 If the case binder occurs at all, the other binders effectively do too.
 763 For example
 764         case e of x { (a,b) -> rhs }
 765 is rather like
 766         let x = (a,b) in rhs
 767 If e turns out to be (e1,e2) we indeed get something like
 768         let a = e1; b = e2; x = (a,b) in rhs
 769
 770 \begin{code}
 771 occAnalAlt env case_bndr (con, bndrs, rhs)
             -- Analyse one case alternative.  The pattern binders are added to
             -- the candidate set before the right-hand side is analysed.
             -- Returns the usage of the alternative with the pattern binders
             -- removed, and the alternative with its (possibly tagged) binders
             -- and analysed right-hand side.
 772   = case occAnal (env `addNewCands` bndrs) rhs of { (rhs_usage, rhs') ->
 773     let
             -- tagBinders both deletes the binders from the usage and
             -- annotates each binder with what was recorded for it.
 774         (final_usage, tagged_bndrs) = tagBinders rhs_usage bndrs
 775         final_bndrs | case_bndr `elemVarEnv` final_usage = bndrs
 776                     | otherwise                         = tagged_bndrs
 777                 -- Leave the binders untagged if the case
 778                 -- binder occurs at all; see note above
 779     in
 780     (final_usage, (con, final_bndrs, rhs')) }
 781 \end{code}
 782
 783
 784 %************************************************************************
 785 %*                                                                      *
 786 \subsection[OccurAnal-types]{OccEnv}
 787 %*                                                                      *
 788 %************************************************************************
 789
 790 \begin{code}
 791 data OccEnv
             -- The environment passed down through the analysis.
             -- It has three positional fields:
 792   = OccEnv IdSet        -- In-scope Ids; we gather info about these only
 793            OccEncl      -- Enclosing context information
 794            CtxtTy       -- Tells about linearity
 794            CtxtTy       -- Tells about linearity
 795
 796 -- OccEncl is used to control whether to inline into constructor arguments
 797 -- For example:
 798 --      x = (p,q)               -- Don't inline p or q
 799 --      y = /\a -> (p a, q a)   -- Still don't inline p or q
 800 --      z = f (p,q)             -- Do inline p,q; it may make a rule fire
 801 -- So OccEncl tells enough about the context to know what to do when
 802 -- we encounter a constructor application or PAP.
 803
 804 data OccEncl
             -- Describes the immediately enclosing context; tested by isRhsEnv.
 805   = OccRhs              -- RHS of let(rec), albeit perhaps inside a type lambda
 806                         -- Don't inline into constructor args here
 807   | OccVanilla          -- Argument of function, body of lambda, scrutinee of case etc.
 808                         -- Do inline into constructor args here
 809
 810 type CtxtTy = [Bool]
 811         -- []           No info
 812         --
 813         -- True:ctxt    Analysing a function-valued expression that will be
 814         --                      applied just once
 815         --
 816         -- False:ctxt   Analysing a function-valued expression that may
 817         --                      be applied many times; but when it is,
 818         --                      the CtxtTy inside applies
             --
             -- oneShotGroup consumes one element of this list for each Id
             -- binder of a lambda group; addAppCtxt pushes one True per value
             -- argument of an application.
 819
 820 initOccEnv :: VarSet -> OccEnv
             -- Starting environment: the given variables are the candidates,
             -- the enclosing context is OccRhs, and there is no linearity info.
 821 initOccEnv vars = OccEnv vars OccRhs []
 822
 823 isRhsEnv (OccEnv _ OccRhs     _) = True        -- enclosing context is OccRhs
 824 isRhsEnv (OccEnv _ OccVanilla _) = False       -- any other (vanilla) context
 825
 826 isCandidate :: OccEnv -> Id -> Bool
             -- True iff the Id is in the environment's candidate set, i.e. it is
             -- one of the Ids we are gathering usage information about.
             -- Only the candidate set is inspected; the other fields are ignored.
 827 isCandidate (OccEnv cands encl _) id = id `elemVarSet` cands
 828
 829 addNewCands :: OccEnv -> [Id] -> OccEnv
             -- Extend the candidate set with a list of Ids; the enclosing
             -- context and the linearity context are left unchanged.
 830 addNewCands (OccEnv cands encl ctxt) ids
 831   = OccEnv (cands `unionVarSet` mkVarSet ids) encl ctxt
 832
 833 addNewCand :: OccEnv -> Id -> OccEnv
             -- Single-Id version of addNewCands: extend the candidate set with
             -- one Id, leaving the other two fields unchanged.
 834 addNewCand (OccEnv cands encl ctxt) id
 835   = OccEnv (extendVarSet cands id) encl ctxt
 836
 837 setCtxt :: OccEnv -> CtxtTy -> OccEnv
             -- Replace (not extend) the linearity context; the candidate set and
             -- the enclosing context are kept.
 838 setCtxt (OccEnv cands encl _) ctxt = OccEnv cands encl ctxt
 839
 840 oneShotGroup :: OccEnv -> [CoreBndr] -> (Bool, OccEnv, [CoreBndr])
 841         -- True <=> this is a one-shot linear lambda group
 842         -- The [CoreBndr] are the binders.
 843
 844         -- The result binders have one-shot-ness set that they might not have had originally.
 845         -- This happens in (build (\cn -> e)).  Here the occurrence analyser
 846         -- linearity context knows that c,n are one-shot, and it records that fact in
 847         -- the binder. This is useful to guide subsequent float-in/float-out transformations
 848
 849 oneShotGroup (OccEnv cands encl ctxt) bndrs
 850   = case go ctxt bndrs [] of
             -- The returned environment carries whatever linearity context is
             -- left over after the binders have consumed their share.
 851         (new_ctxt, new_bndrs) -> (all is_one_shot new_bndrs, OccEnv cands encl new_ctxt, new_bndrs)
 852   where
             -- Only an Id that is a one-shot lambda counts; any other binder in
             -- the group makes the Bool result False.
 853     is_one_shot b = isId b && isOneShotLambda b
 854
             -- go walks the binders left to right, accumulating them in reverse.
 855     go ctxt [] rev_bndrs = (ctxt, reverse rev_bndrs)
 856
             -- An Id binder consumes one context element; if that element is
             -- True the binder is marked one-shot.  A non-Id binder fails the
             -- guard and falls through to the last equation.
 857     go (lin_ctxt:ctxt) (bndr:bndrs) rev_bndrs
 858         | isId bndr = go ctxt bndrs (bndr':rev_bndrs)
 859         where
 860           bndr' | lin_ctxt  = setOneShotLambda bndr
 861                 | otherwise = bndr
 862
             -- Either the context is exhausted or the binder is not an Id:
             -- keep the binder as it is and leave the context untouched.
 863     go ctxt (bndr:bndrs) rev_bndrs = go ctxt bndrs (bndr:rev_bndrs)
 864
 865
 866 vanillaCtxt (OccEnv cands _ _) = OccEnv cands OccVanilla []    -- keep candidates; vanilla context, no linearity info
 867 rhsCtxt     (OccEnv cands _ _) = OccEnv cands OccRhs     []    -- keep candidates; RHS context, no linearity info
 868
 869 addAppCtxt (OccEnv cands encl ctxt) args
             -- Push one True (applied just once) onto the front of the linearity
             -- context for each value argument, as counted by valArgCount.
 870   = OccEnv cands encl (replicate (valArgCount args) True ++ ctxt)
 871 \end{code}
 872
 873 %************************************************************************
 874 %*                                                                      *
 875 \subsection[OccurAnal-usage]{UsageDetails}
 876 %*                                                                      *
 877 %************************************************************************
 878
 879 \begin{code}
 880 type UsageDetails = IdEnv OccInfo       -- A finite map from ids to their usage
             -- An Id with no entry has no recorded occurrence; setBinderOcc
             -- treats a missing entry as IAmDead.
 881
 882 combineUsageDetails, combineAltsUsageDetails
 883         :: UsageDetails -> UsageDetails -> UsageDetails
             -- Both functions take the union of two usage maps; they differ only
             -- in how they merge the entries of an Id present in both maps.
 884
             -- Entries present in both maps are merged with addOccInfo.
 885 combineUsageDetails usage1 usage2
 886   = plusVarEnv_C addOccInfo usage1 usage2
 887
             -- Entries present in both maps are merged with orOccInfo, which is
             -- the combiner for branches of a case.
 888 combineAltsUsageDetails usage1 usage2
 889   = plusVarEnv_C orOccInfo usage1 usage2
 890
 891 addOneOcc :: UsageDetails -> Id -> OccInfo -> UsageDetails
             -- Record one more piece of occurrence info for a single Id, merging
             -- with any existing entry via addOccInfo.  Implemented by building a
             -- one-element map and taking the union.
 892 addOneOcc usage id info
 893   = plusVarEnv_C addOccInfo usage (unitVarEnv id info)
 894         -- ToDo: make this more efficient
 895
 896 emptyDetails = (emptyVarEnv :: UsageDetails)   -- usage map with no entries
 897
 898 usedIn :: Id -> UsageDetails -> Bool
             -- An exported Id always counts as used, whatever the usage map says;
             -- any other Id is used iff it has an entry in the map.
 899 v `usedIn` details =  isExportedId v || v `elemVarEnv` details
 900
 901 tagBinders :: UsageDetails          -- Of scope
 902            -> [Id]                  -- Binders
 903            -> (UsageDetails,        -- Details with binders removed
 904               [IdWithOccInfo])    -- Tagged binders
 905
 906 tagBinders usage binders
 907  = let
             -- The binders are tagged from the original 'usage' (before
             -- deletion), since that is where their entries live.
 908      usage' = usage `delVarEnvList` binders
 909      uss    = map (setBinderOcc usage) binders
 910    in
             -- seq evaluates the trimmed map before the pair is returned.
 911    usage' `seq` (usage', uss)
 912
 913 tagBinder :: UsageDetails           -- Of scope
 914           -> Id                     -- Binder
 915           -> (UsageDetails,         -- Details with the binder removed
 916               IdWithOccInfo)        -- Tagged binder
 917
 918 tagBinder usage binder
 919  = let
             -- Single-binder version of tagBinders: the binder is tagged from
             -- the original 'usage', and removed from the returned map.
 920      usage'  = usage `delVarEnv` binder
 921      binder' = setBinderOcc usage binder
 922    in
             -- seq evaluates the trimmed map before the pair is returned.
 923    usage' `seq` (usage', binder')
 924
 925 setBinderOcc :: UsageDetails -> CoreBndr -> CoreBndr
             -- Annotate a binder with its occurrence info:
             --   * a type variable is returned unchanged;
             --   * an exported Id ends up with NoOccInfo (it is only rewritten
             --     if it does not already have NoOccInfo);
             --   * any other Id gets its entry from the usage map, or IAmDead
             --     if it has no entry.
 926 setBinderOcc usage bndr
 927   | isTyVar bndr      = bndr
 928   | isExportedId bndr = case idOccInfo bndr of
 929                           NoOccInfo -> bndr
 930                           other     -> setIdOccInfo bndr NoOccInfo
 931             -- Don't use local usage info for visible-elsewhere things
 932             -- BUT *do* erase any IAmALoopBreaker annotation, because we're
 933             -- about to re-generate it and it shouldn't be "sticky"
 934
 935   | otherwise = setIdOccInfo bndr occ_info
 936   where
 937     occ_info = lookupVarEnv usage bndr `orElse` IAmDead
 938 \end{code}
 939
 940
 941 %************************************************************************
 942 %*                                                                      *
 943 \subsection{Operations over OccInfo}
 944 %*                                                                      *
 945 %************************************************************************
 946
 947 \begin{code}
 948 oneOcc :: OccInfo
             -- A single occurrence.  The first field is the "inside a lambda"
             -- flag (set to True by markInsideLam); the second is the
             -- "one branch" flag (set to False by orOccInfo).
 949 oneOcc = OneOcc False True
 950
 951 markMany, markInsideLam, markInsideSCC :: OccInfo -> OccInfo
 952
             -- Dead stays dead; anything else loses its precise info.
 953 markMany IAmDead = IAmDead
 954 markMany other   = NoOccInfo
 955
             -- Treated exactly like markMany.
 956 markInsideSCC occ = markMany occ
 957
             -- A OneOcc has its inside-lambda flag set, keeping its one-branch
             -- flag; every other OccInfo is returned unchanged.
 958 markInsideLam (OneOcc _ one_br) = OneOcc True one_br
 959 markInsideLam occ               = occ
 960
 961 addOccInfo, orOccInfo :: OccInfo -> OccInfo -> OccInfo
 962
             -- addOccInfo: IAmDead is the identity; combining any two non-dead
             -- infos gives NoOccInfo.
 963 addOccInfo IAmDead info2 = info2
 964 addOccInfo info1 IAmDead = info1
 965 addOccInfo info1 info2   = NoOccInfo
 966
 967 -- (orOccInfo orig new) is used
 968 -- when combining occurrence info from branches of a case
 969
             -- IAmDead is again the identity.  Two OneOccs stay a OneOcc: the
             -- inside-lambda flags are or-ed and the one-branch flag becomes
             -- False.  Every other combination gives NoOccInfo.
 970 orOccInfo IAmDead info2 = info2
 971 orOccInfo info1 IAmDead = info1
 972 orOccInfo (OneOcc in_lam1 one_branch1)
 973           (OneOcc in_lam2 one_branch2)
 974   = OneOcc (in_lam1 || in_lam2)
 975            False        -- False, because it occurs in both branches
 976
 977 orOccInfo info1 info2 = NoOccInfo
 978 \end{code}