Don't inline a loop breaker, even if it has an INLINE pragma

[ghc-hetmet.git] / compiler / simplCore / SimplUtils.lhs
diff --git a/compiler/simplCore/SimplUtils.lhs b/compiler/simplCore/SimplUtils.lhs

index c541096..1511a2f 100644 (file)
--- a/compiler/simplCore/SimplUtils.lhs
+++ b/compiler/simplCore/SimplUtils.lhs
@@ -11,12 +11,13 @@ module SimplUtils (
         -- Inlining,
         preInlineUnconditionally, postInlineUnconditionally, 
         activeInline, activeRule, 
         -- Inlining,
         preInlineUnconditionally, postInlineUnconditionally, 
         activeInline, activeRule, 
+        simplEnvForGHCi, simplEnvForRules, simplGentlyForInlineRules,
  
         -- The continuation type
         SimplCont(..), DupFlag(..), ArgInfo(..),
         contIsDupable, contResultType, contIsTrivial, contArgs, dropArgs, 
         countValArgs, countArgs, 
  
         -- The continuation type
         SimplCont(..), DupFlag(..), ArgInfo(..),
         contIsDupable, contResultType, contIsTrivial, contArgs, dropArgs, 
         countValArgs, countArgs, 
-       mkBoringStop, mkLazyArgStop, contIsRhsOrArg,
+       mkBoringStop, mkRhsStop, mkLazyArgStop, contIsRhsOrArg,
         interestingCallContext, 
  
         interestingArg, mkArgInfo,
         interestingCallContext, 
  
         interestingArg, mkArgInfo,
@@ -152,6 +153,9 @@ instance Outputable DupFlag where
  mkBoringStop :: SimplCont
  mkBoringStop = Stop BoringCtxt
  
  mkBoringStop :: SimplCont
  mkBoringStop = Stop BoringCtxt
  
+mkRhsStop :: SimplCont -- See Note [RHS of lets] in CoreUnfold
+mkRhsStop = Stop (ArgCtxt False)
+
  mkLazyArgStop :: CallCtxt -> SimplCont
  mkLazyArgStop cci = Stop cci
  
  mkLazyArgStop :: CallCtxt -> SimplCont
  mkLazyArgStop cci = Stop cci
  
@@ -260,8 +264,9 @@ interestingCallContext cont
    where
      interesting (Select _ bndr _ _ _)
         | isDeadBinder bndr = CaseCtxt
    where
      interesting (Select _ bndr _ _ _)
         | isDeadBinder bndr = CaseCtxt
-       | otherwise         = ArgCtxt False 2   -- If the binder is used, this
+       | otherwise         = ArgCtxt False     -- If the binder is used, this
                                                 -- is like a strict let
                                                 -- is like a strict let
+                                               -- See Note [RHS of lets] in CoreUnfold
                 
      interesting (ApplyTo _ arg _ cont)
         | isTypeArg arg = interesting cont
                 
      interesting (ApplyTo _ arg _ cont)
         | isTypeArg arg = interesting cont
@@ -394,8 +399,8 @@ interestingArgContext rules call_cont
      go (CoerceIt _ c)       = go c
      go (Stop cci)            = interesting cci
  
      go (CoerceIt _ c)       = go c
      go (Stop cci)            = interesting cci
  
-    interesting (ArgCtxt rules _) = rules
-    interesting _                 = False
+    interesting (ArgCtxt rules) = rules
+    interesting _               = False
  \end{code}
  
  
  \end{code}
  
  
@@ -406,18 +411,58 @@ interestingArgContext rules call_cont
  %*                                                                     *
  %************************************************************************
  
  %*                                                                     *
  %************************************************************************
  
-Inlining is controlled partly by the SimplifierMode switch.  This has two
-settings:
+\begin{code}
+simplEnvForGHCi :: SimplEnv
+simplEnvForGHCi = mkSimplEnv allOffSwitchChecker $
+                  SimplGently { sm_rules = False, sm_inline = False }
+   -- Do not do any inlining, in case we expose some unboxed
+   -- tuple stuff that confuses the bytecode interpreter
+
+simplEnvForRules :: SimplEnv
+simplEnvForRules = mkSimplEnv allOffSwitchChecker $
+                   SimplGently { sm_rules = True, sm_inline = False }
+
+simplGentlyForInlineRules :: SimplifierMode
+simplGentlyForInlineRules = SimplGently { sm_rules = True, sm_inline = True }
+       -- Simplify as much as possible, subject to the usual "gentle" rules
+\end{code}
  
  
+Inlining is controlled partly by the SimplifierMode switch.  This has two
+settings
+       
         SimplGently     (a) Simplifying before specialiser/full laziness
         SimplGently     (a) Simplifying before specialiser/full laziness
-                       (b) Simplifiying inside INLINE pragma
+                       (b) Simplifiying inside InlineRules
                         (c) Simplifying the LHS of a rule
                         (d) Simplifying a GHCi expression or Template 
                                 Haskell splice
  
         SimplPhase n _   Used at all other times
  
                         (c) Simplifying the LHS of a rule
                         (d) Simplifying a GHCi expression or Template 
                                 Haskell splice
  
         SimplPhase n _   Used at all other times
  
-The key thing about SimplGently is that it does no call-site inlining.
+Note [Gentle mode]
+~~~~~~~~~~~~~~~~~~
+Gentle mode has a separate boolean flag to control
+       a) inlining (sm_inline flag)
+       b) rules    (sm_rules  flag)
+A key invariant about Gentle mode is that it is treated as the EARLIEST
+phase.  Something is inlined if the sm_inline flag is on AND the thing
+is inlinable in the earliest phase.  This is important. Example
+
+  {-# INLINE [~1] g #-}
+  g = ...
+  
+  {-# INLINE f #-}
+  f x = g (g x)
+
+If we were to inline g into f's inlining, then an importing module would
+never be able to do
+       f e --> g (g e) ---> RULE fires
+because the InlineRule for f has had g inlined into it.
+
+On the other hand, it is bad not to do ANY inlining into an
+InlineRule, because then recursive knots in instance declarations
+don't get unravelled.
+
+However, *sometimes* SimplGently must do no call-site inlining at all.
  Before full laziness we must be careful not to inline wrappers,
  because doing so inhibits floating
      e.g. ...(case f x of ...)...
  Before full laziness we must be careful not to inline wrappers,
  because doing so inhibits floating
      e.g. ...(case f x of ...)...
@@ -431,11 +476,11 @@ running it, we don't want to use -O2.  Indeed, we don't want to inline
  anything, because the byte-code interpreter might get confused about 
  unboxed tuples and suchlike.
  
  anything, because the byte-code interpreter might get confused about 
  unboxed tuples and suchlike.
  
-INLINE pragmas
-~~~~~~~~~~~~~~
-We don't simplify inside InlineRules (which come from INLINE pragmas).
-It really is important to switch off inlinings inside such
-expressions.  Consider the following example 
+Note [Simplifying gently inside InlineRules]
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+We don't do much simplification inside InlineRules (which come from
+INLINE pragmas).  It really is important to switch off inlinings
+inside such expressions.  Consider the following example
  
         let f = \pq -> BIG
         in
  
         let f = \pq -> BIG
         in
@@ -444,16 +489,14 @@ expressions.  Consider the following example
         in ...g...g...g...g...g...
  
  Now, if that's the ONLY occurrence of f, it will be inlined inside g,
         in ...g...g...g...g...g...
  
  Now, if that's the ONLY occurrence of f, it will be inlined inside g,
-and thence copied multiple times when g is inlined.
-
+and thence copied multiple times when g is inlined.  
  
  
-This function may be inlinined in other modules, so we
-don't want to remove (by inlining) calls to functions that have
-specialisations, or that may have transformation rules in an importing
-scope.
+This function may be inlinined in other modules, so we don't want to
+remove (by inlining) calls to functions that have specialisations, or
+that may have transformation rules in an importing scope.
  
  E.g.   {-# INLINE f #-}
  
  E.g.   {-# INLINE f #-}
-               f x = ...g...
+       f x = ...g...
  
  and suppose that g is strict *and* has specialisations.  If we inline
  g's wrapper, we deny f the chance of getting the specialised version
  
  and suppose that g is strict *and* has specialisations.  If we inline
  g's wrapper, we deny f the chance of getting the specialised version
@@ -471,15 +514,14 @@ continuation.  That's why the keep_inline predicate returns True for
  ArgOf continuations.  It shouldn't do any harm not to dissolve the
  inline-me note under these circumstances.
  
  ArgOf continuations.  It shouldn't do any harm not to dissolve the
  inline-me note under these circumstances.
  
-Note that the result is that we do very little simplification
-inside an InlineMe.  
+Although we do very little simplification inside an InlineRule,
+the RHS is simplified as normal.  For example:
  
         all xs = foldr (&&) True xs
         any p = all . map p  {-# INLINE any #-}
  
  
         all xs = foldr (&&) True xs
         any p = all . map p  {-# INLINE any #-}
  
-Problem: any won't get deforested, and so if it's exported and the
-importer doesn't use the inlining, (eg passes it as an arg) then we
-won't get deforestation at all.  We havn't solved this problem yet!
+The RHS of 'any' will get optimised and deforested; but the InlineRule
+will still mention the original RHS.
  
  
  preInlineUnconditionally
  
  
  preInlineUnconditionally
@@ -546,6 +588,18 @@ seems a bit fragile.
  Conclusion: inline top level things gaily until Phase 0 (the last
  phase), at which point don't.
  
  Conclusion: inline top level things gaily until Phase 0 (the last
  phase), at which point don't.
  
+Note [pre/postInlineUnconditionally in gentle mode]
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+Even in gentle mode we want to do preInlineUnconditionally.  The
+reason is that too little clean-up happens if you don't inline
+use-once things.  Also a bit of inlining is *good* for full laziness;
+it can expose constant sub-expressions.  Example in
+spectral/mandel/Mandel.hs, where the mandelset function gets a useful
+let-float if you inline windowToViewport
+
+However, as usual for Gentle mode, do not inline things that are
+inactive in the intial stages.  See Note [Gentle mode].
+
  \begin{code}
  preInlineUnconditionally :: SimplEnv -> TopLevelFlag -> InId -> InExpr -> Bool
  preInlineUnconditionally env top_lvl bndr rhs
  \begin{code}
  preInlineUnconditionally :: SimplEnv -> TopLevelFlag -> InId -> InExpr -> Bool
  preInlineUnconditionally env top_lvl bndr rhs
@@ -558,7 +612,8 @@ preInlineUnconditionally env top_lvl bndr rhs
    where
      phase = getMode env
      active = case phase of
    where
      phase = getMode env
      active = case phase of
-                  SimplGently    -> isEarlyActive act
+                  SimplGently {} -> isEarlyActive act
+                       -- See Note [pre/postInlineUnconditionally in gentle mode]
                    SimplPhase n _ -> isActive n act
      act = idInlineActivation bndr
  
                    SimplPhase n _ -> isActive n act
      act = idInlineActivation bndr
  
@@ -715,21 +770,21 @@ postInlineUnconditionally env top_lvl bndr occ_info rhs unfolding
  
    where
      active = case getMode env of
  
    where
      active = case getMode env of
-                  SimplGently    -> isAlwaysActive act
+                  SimplGently {} -> isEarlyActive act
+                       -- See Note [pre/postInlineUnconditionally in gentle mode]
                    SimplPhase n _ -> isActive n act
      act = idInlineActivation bndr
  
  activeInline :: SimplEnv -> OutId -> Bool
  activeInline env id
                    SimplPhase n _ -> isActive n act
      act = idInlineActivation bndr
  
  activeInline :: SimplEnv -> OutId -> Bool
  activeInline env id
+  | isNonRuleLoopBreaker (idOccInfo id)          -- Things with an INLINE pragma may have 
+                                         -- an unfolding *and* be a loop breaker
+  = False                                -- (maybe the knot is not yet untied)
+  | otherwise
    = case getMode env of
    = case getMode env of
-      SimplGently -> False
-       -- No inlining at all when doing gentle stuff,
-       -- except for local things that occur once (pre/postInlineUnconditionally)
-       -- The reason is that too little clean-up happens if you 
-       -- don't inline use-once things.   Also a bit of inlining is *good* for
-       -- full laziness; it can expose constant sub-expressions.
-       -- Example in spectral/mandel/Mandel.hs, where the mandelset 
-       -- function gets a useful let-float if you inline windowToViewport
+      SimplGently { sm_inline = inlining_on } 
+         -> inlining_on && isEarlyActive act
+       -- See Note [Gentle mode]
  
         -- NB: we used to have a second exception, for data con wrappers.
         -- On the grounds that we use gentle mode for rule LHSs, and 
  
         -- NB: we used to have a second exception, for data con wrappers.
         -- On the grounds that we use gentle mode for rule LHSs, and 
@@ -749,13 +804,15 @@ activeRule dflags env
    = Nothing    -- Rewriting is off
    | otherwise
    = case getMode env of
    = Nothing    -- Rewriting is off
    | otherwise
    = case getMode env of
-       SimplGently    -> Just isAlwaysActive
+      SimplGently { sm_rules = rules_on } 
+        | rules_on  -> Just isEarlyActive
+        | otherwise -> Nothing
                         -- Used to be Nothing (no rules in gentle mode)
                         -- Main motivation for changing is that I wanted
                         --      lift String ===> ...
                         -- to work in Template Haskell when simplifying
                         -- splices, so we get simpler code for literal strings
                         -- Used to be Nothing (no rules in gentle mode)
                         -- Main motivation for changing is that I wanted
                         --      lift String ===> ...
                         -- to work in Template Haskell when simplifying
                         -- splices, so we get simpler code for literal strings
-       SimplPhase n _ -> Just (isActive n)
+      SimplPhase n _ -> Just (isActive n)
  \end{code}
  
  Note [InlineRule and postInlineUnconditionally]
  \end{code}
  
  Note [InlineRule and postInlineUnconditionally]