[project @ 2001-01-09 17:43:57 by rrt]

[ghc-hetmet.git] / ghc / compiler / stranal / WorkWrap.lhs
diff --git a/ghc/compiler/stranal/WorkWrap.lhs b/ghc/compiler/stranal/WorkWrap.lhs

index d919b73..371920a 100644 (file)
--- a/ghc/compiler/stranal/WorkWrap.lhs
+++ b/ghc/compiler/stranal/WorkWrap.lhs
@@ -9,27 +9,21 @@ module WorkWrap ( wwTopBinds, mkWrapper ) where
  #include "HsVersions.h"
  
  import CoreSyn
-import CoreUnfold      ( Unfolding, certainlySmallEnoughToInline, calcUnfoldingGuidance )
-import CmdLineOpts     ( opt_UF_CreationThreshold , opt_D_verbose_core2core, 
-                          opt_D_dump_worker_wrapper
-                       )
-import CoreLint                ( beginPass, endPass )
-import CoreUtils       ( coreExprType, exprArity )
-import Const           ( Con(..) )
-import DataCon         ( DataCon )
+import CoreUnfold      ( certainlyWillInline )
+import CoreLint                ( showPass, endPass )
+import CoreUtils       ( exprType )
  import MkId            ( mkWorkerId )
-import Id              ( Id, idType, getIdStrictness, setIdArity, 
-                         setIdStrictness, getIdDemandInfo,
-                         setIdWorkerInfo, getIdCprInfo )
-import VarSet
+import Id              ( Id, idType, idStrictness, idArity, isOneShotLambda,
+                         setIdStrictness, idInlinePragma, 
+                         setIdWorkerInfo, idCprInfo, setInlinePragma )
  import Type            ( Type, isNewType, splitForAllTys, splitFunTys )
  import IdInfo          ( mkStrictnessInfo, noStrictnessInfo, StrictnessInfo(..),
-                         CprInfo(..), exactArity
+                         CprInfo(..), InlinePragInfo(..), isNeverInlinePrag,
+                         WorkerInfo(..)
                         )
-import Demand           ( Demand, wwLazy )
-import SaLib
+import Demand           ( Demand )
  import UniqSupply      ( UniqSupply, initUs_, returnUs, thenUs, mapUs, getUniqueUs, UniqSM )
-import UniqSet
+import CmdLineOpts
  import WwLib
  import Outputable
  \end{code}
@@ -62,20 +56,21 @@ info for exported values).
  
  \begin{code}
  
-wwTopBinds :: UniqSupply
-            -> [CoreBind]
-            -> IO [CoreBind]
+wwTopBinds :: DynFlags 
+          -> UniqSupply
+          -> [CoreBind]
+          -> IO [CoreBind]
  
-wwTopBinds us binds
+wwTopBinds dflags us binds
    = do {
-       beginPass "Worker Wrapper binds";
+       showPass dflags "Worker Wrapper binds";
  
         -- Create worker/wrappers, and mark binders with their
         -- "strictness info" [which encodes their worker/wrapper-ness]
         let { binds' = workersAndWrappers us binds };
  
-       endPass "Worker Wrapper binds" (opt_D_dump_worker_wrapper || 
-                                        opt_D_verbose_core2core) binds'
+       endPass dflags "Worker Wrapper binds" 
+               Opt_D_dump_worker_wrapper binds'
      }
  \end{code}
  
@@ -125,17 +120,13 @@ wwBind (Rec pairs)
  annotations that can be used. Remember it is @wwBind@ that does the
  matching by looking for strict arguments of the correct type.
  @wwExpr@ is a version that just returns the ``Plain'' Tree.
-???????????????? ToDo
  
  \begin{code}
  wwExpr :: CoreExpr -> UniqSM CoreExpr
  
  wwExpr e@(Type _)   = returnUs e
  wwExpr e@(Var _)    = returnUs e
-
-wwExpr e@(Con con args)
- = mapUs wwExpr args   `thenUs` \ args' ->
-   returnUs (Con con args')
+wwExpr e@(Lit _)    = returnUs e
  
  wwExpr (Lam binder expr)
    = wwExpr expr                        `thenUs` \ new_expr ->
@@ -194,33 +185,57 @@ tryWW     :: Bool                         -- True <=> a non-recursive binding
                                         -- if two, then a worker and a
                                         -- wrapper.
  tryWW non_rec fn_id rhs
-  | (non_rec &&                -- Don't split if its non-recursive and small
-     certainlySmallEnoughToInline (calcUnfoldingGuidance opt_UF_CreationThreshold rhs)
-       -- No point in worker/wrappering something that is going to be
+  | isNeverInlinePrag inline_prag || arity == 0
+  =    -- Don't split things that will never be inlined
+    returnUs [ (fn_id, rhs) ]
+
+  | non_rec && not do_coerce_ww && certainlyWillInline fn_id
+       -- No point in worker/wrappering a function that is going to be
         -- INLINEd wholesale anyway.  If the strictness analyser is run
         -- twice, this test also prevents wrappers (which are INLINEd)
         -- from being re-done.
-    )
-
-  || arity == 0                -- Don't split if it's not a function
+       --
+       -- The do_coerce_ww test is so that
+       -- a function with a coerce should w/w to get rid
+       -- of the coerces, which can significantly improve its arity.
+       -- Example:  f []     = return [] :: IO [Int]
+       --           f (x:xs) = return (x:xs)
+       -- If we aren't careful we end up with
+       --      f = \ x -> case x of {
+       --                   x:xs -> __coerce (IO [Int]) (\ s -> (# s, x:xs #)
+       --                   []   -> lvl_sJ8
+       --
+       --
+       -- OUT OF DATE NOTE, kept for info:
+       -- It's out of date because now wrappers look very cheap 
+       -- even when they are inlined.
+       --   In this case we add an INLINE pragma to the RHS.  Why?
+       --   Because consider
+       --        f = \x -> g x x
+       --        g = \yz -> ...                -- And g is strict
+       --   Then f is small, so we don't w/w it.  But g is big, and we do, so
+       --   g's wrapper will get inlined in f's RHS, which makes f look big now.
+       --   So f doesn't get inlined, but it is strict and we have failed to w/w it.
+  = returnUs [ (fn_id, rhs) ]
  
-  || not (do_strict_ww || do_cpr_ww || do_coerce_ww)
+  | not (do_strict_ww || do_cpr_ww || do_coerce_ww)
    = returnUs [ (fn_id, rhs) ]
  
    | otherwise          -- Do w/w split
-  = mkWwBodies fun_ty arity wrap_dmds cpr_info `thenUs` \ (work_args, wrap_fn, work_fn) ->
-    getUniqueUs                                        `thenUs` \ work_uniq ->
+  = mkWwBodies fun_ty arity wrap_dmds result_bot one_shots cpr_info    `thenUs` \ (work_demands, wrap_fn, work_fn) ->
+    getUniqueUs                                                                `thenUs` \ work_uniq ->
      let
-       work_rhs     = work_fn rhs
-       work_demands = [getIdDemandInfo v | v <- work_args, isId v]
-       proto_work_id            = mkWorkerId work_uniq fn_id (coreExprType work_rhs) 
+       work_rhs      = work_fn rhs
+       proto_work_id = mkWorkerId work_uniq fn_id (exprType work_rhs) 
+                       `setInlinePragma` inline_prag
+
         work_id | has_strictness = proto_work_id `setIdStrictness` mkStrictnessInfo (work_demands, result_bot)
                 | otherwise      = proto_work_id
  
         wrap_rhs = wrap_fn work_id
         wrap_id  = fn_id `setIdStrictness`      wrapper_strictness
-                         `setIdWorkerInfo`     Just work_id
-                        `setIdArity`           exactArity arity
+                         `setIdWorkerInfo`     HasWorker work_id arity
+                        `setInlinePragma`      NoInlinePragInfo        -- Put it on the worker instead
                 -- Add info to the wrapper:
                 --      (a) we want to set its arity
                 --      (b) we want to pin on its revised strictness info
@@ -228,40 +243,53 @@ tryWW non_rec fn_id rhs
      in
      returnUs ([(work_id, work_rhs), (wrap_id, wrap_rhs)])
         -- Worker first, because wrapper mentions it
+       -- mkWwBodies has already built a wrap_rhs with an INLINE pragma wrapped around it
    where
      fun_ty = idType fn_id
-    arity  = exprArity rhs
-
-    strictness_info                      = getIdStrictness fn_id
-    StrictnessInfo arg_demands result_bot = strictness_info
-    has_strictness                       = case strictness_info of
-                                               StrictnessInfo _ _ -> True
-                                               other              -> False
-                       
-    do_strict_ww = has_strictness && worthSplitting wrap_dmds result_bot
-
-       -- NB: There maybe be more items in arg_demands than arity, because
-       -- the strictness info is semantic and looks through InlineMe and Scc Notes, 
-       -- whereas arity does not
-    demands_for_visible_args = take arity arg_demands
-    remaining_arg_demands    = drop arity arg_demands
-
-    wrap_dmds | has_strictness = setUnpackStrategy demands_for_visible_args
-             | otherwise      = take arity (repeat wwLazy)
-
-    wrapper_strictness | has_strictness = mkStrictnessInfo (wrap_dmds ++ remaining_arg_demands, result_bot)
+    arity  = idArity fn_id     -- The arity is set by the simplifier using exprEtaExpandArity
+                               -- So it may be more than the number of top-level-visible lambdas
+
+    inline_prag  = idInlinePragma fn_id
+
+    strictness_info           = idStrictness fn_id
+    has_strictness           = case strictness_info of
+                                       StrictnessInfo _ _ -> True
+                                       NoStrictnessInfo   -> False
+    (arg_demands, result_bot) = case strictness_info of
+                                       StrictnessInfo d r -> (d,  r)
+                                       NoStrictnessInfo   -> ([], False)
+
+    wrap_dmds = setUnpackStrategy arg_demands
+    do_strict_ww = WARN( has_strictness && not result_bot && arity < length arg_demands && worthSplitting wrap_dmds result_bot, 
+                        text "Insufficient arity" <+> ppr fn_id <+> ppr arity <+> ppr arg_demands )
+                   (result_bot || arity >= length arg_demands) -- Only if there's enough visible arity
+                &&                                             -- (else strictness info isn't valid)
+                                                               -- 
+                   worthSplitting wrap_dmds result_bot         -- And it's useful
+       -- worthSplitting returns False for an empty list of demands,
+       -- and hence do_strict_ww is False if arity is zero
+       -- Also it's false if there is no strictness (arg_demands is [])
+
+    wrapper_strictness | has_strictness = mkStrictnessInfo (wrap_dmds, result_bot)
                        | otherwise      = noStrictnessInfo
  
         -------------------------------------------------------------
-    cpr_info     = getIdCprInfo fn_id
-    has_cpr_info = case cpr_info of
-                       CPRInfo _ -> True
-                       other     -> False
-
-    do_cpr_ww = has_cpr_info
+    cpr_info  = idCprInfo fn_id
+    do_cpr_ww = arity > 0 &&
+               case cpr_info of
+                       ReturnsCPR -> True
+                       other      -> False
  
         -------------------------------------------------------------
      do_coerce_ww = check_for_coerce arity fun_ty
+       -- We are willing to do a w/w even if the arity is zero.
+       --      x = coerce t E
+       -- ==>
+       --      x' = E
+       --      x  = coerce t x'
+
+       -------------------------------------------------------------
+    one_shots = get_one_shots rhs
  
  -- See if there's a Coerce before we run out of arity;
  -- if so, it's worth trying a w/w split.  Reason: we find
@@ -278,6 +306,16 @@ check_for_coerce arity ty
    where
      (_, tau)         = splitForAllTys ty
      (arg_tys, res_ty) = splitFunTys tau
+
+-- If the original function has one-shot arguments, it is important to
+-- make the wrapper and worker have corresponding one-shot arguments too.
+-- Otherwise we spuriously float stuff out of case-expression join points,
+-- which is very annoying.
+get_one_shots (Lam b e)
+  | isId b    = isOneShotLambda b : get_one_shots e
+  | otherwise = get_one_shots e
+get_one_shots (Note _ e) = get_one_shots e
+get_one_shots other     = noOneShotInfo
  \end{code}
  
  
@@ -295,12 +333,15 @@ the function and the name of its worker, and we want to make its body (the wrapp
  mkWrapper :: Type              -- Wrapper type
           -> Int                -- Arity
           -> [Demand]           -- Wrapper strictness info
+         -> Bool               -- Function returns bottom
           -> CprInfo            -- Wrapper cpr info
           -> UniqSM (Id -> CoreExpr)    -- Wrapper body, missing worker Id
  
-mkWrapper fun_ty arity demands cpr_info
-  = mkWwBodies fun_ty arity demands cpr_info   `thenUs` \ (_, wrap_fn, _) ->
+mkWrapper fun_ty arity demands res_bot cpr_info
+  = mkWwBodies fun_ty arity demands res_bot noOneShotInfo cpr_info     `thenUs` \ (_, wrap_fn, _) ->
      returnUs wrap_fn
+
+noOneShotInfo = repeat False
  \end{code}