+ vect_rhs bndr rhs = localV
+ . inBind bndr
+ $ vectExpr rhs
+
+vectExpr e@(_, AnnLam bndr _)
+ | isId bndr = vectFnExpr True e
+{-
+onlyIfV (isEmptyVarSet fvs) (vectScalarLam bs $ deAnnotate body)
+ `orElseV` vectLam True fvs bs body
+ where
+ (bs,body) = collectAnnValBinders e
+-}
+
+vectExpr e = cantVectorise "Can't vectorise expression" (ppr $ deAnnotate e)
+
+-- Vectorise an expression that occurs in function position.
+--
+-- For a lambda whose first binder is a value binder, all leading value
+-- binders are collected and two strategies are combined with orElseV:
+--
+--   * vectScalarLam, attempted only when the lambda has no free variables;
+--   * vectLam, which is handed the 'inline' flag.
+--
+-- Every other expression is passed on to vectExpr unchanged.
+vectFnExpr :: Bool -> CoreExprWithFVs -> VM VExpr
+vectFnExpr inline lam@(fvs, AnnLam bndr _)
+  | isId bndr = scalar_attempt `orElseV` closure_attempt
+  where
+    (val_bndrs, lam_body) = collectAnnValBinders lam
+
+    scalar_attempt  = onlyIfV (isEmptyVarSet fvs)
+                              (vectScalarLam val_bndrs (deAnnotate lam_body))
+    closure_attempt = vectLam inline fvs val_bndrs lam_body
+vectFnExpr _ other = vectExpr other
+
+
+-- Vectorise a lambda as a scalar function, if it qualifies.
+--
+-- The guarded action only runs (via onlyIfV) when every argument type and
+-- the result type is Int, Float or Double, and the body is a scalar
+-- expression with respect to the global scalars extended by the arguments.
+-- In that case the lambda is hoisted as "fn", wrapped into a scalar closure
+-- that is hoisted as "clo", and the closure variable is returned together
+-- with its liftPA counterpart.
+vectScalarLam :: [Var] -> CoreExpr -> VM VExpr
+vectScalarLam args body
+  = do
+      known_scalars <- globalScalars
+      let scope = extendVarSetList known_scalars args
+      onlyIfV (and [ all scalar_ty param_tys
+                   , scalar_ty result_ty
+                   , scalar_expr scope body ])
+        $ do
+            fn_var  <- hoistExpr (fsLit "fn") (mkLams args body)
+            zipf    <- zipScalars param_tys result_ty
+            clo     <- scalarClosure param_tys result_ty
+                                     (Var fn_var)
+                                     (App zipf (Var fn_var))
+            clo_var <- hoistExpr (fsLit "clo") clo
+            lclo    <- liftPA (Var clo_var)
+            return (Var clo_var, lclo)
+  where
+    param_tys = map idType args
+    result_ty = exprType body
+
+    -- A scalar type is one of the nullary type constructors Int, Float
+    -- or Double.
+    scalar_ty ty
+      = case splitTyConApp_maybe ty of
+          Just (tc, []) -> tc `elem` [intTyCon, floatTyCon, doubleTyCon]
+          _             -> False
+
+    -- A scalar expression consists solely of variables from the given set,
+    -- literals of scalar type, and applications of such expressions.
+    scalar_expr vars (Var v)       = v `elemVarSet` vars
+    scalar_expr _    lit@(Lit _)   = scalar_ty (exprType lit)
+    scalar_expr vars (App fun arg) = scalar_expr vars fun && scalar_expr vars arg
+    scalar_expr _    _             = False
+
+-- Vectorise a lambda abstraction by building closures for it.
+--
+-- The free variables in 'fvs' that have an entry in the local variable
+-- environment are captured and become extra leading binders of the
+-- vectorised lambda.  The argument types and the result type are
+-- vectorised, the lambda itself is vectorised inside hoistPolyVExpr, and
+-- the result is handed to buildClosures.  When 'inline' is True the
+-- generated lambda is additionally wrapped with vInlineMe.
+vectLam :: Bool -> VarSet -> [Var] -> CoreExprWithFVs -> VM VExpr
+vectLam inline fvs bs body
+  = do
+      tyvars    <- localTyVars
+      (vs, vvs) <- readLEnv captured
+
+      arg_tys   <- mapM (vectType . idType) bs
+      res_ty    <- vectType (exprType (deAnnotate body))
+
+      buildClosures tyvars vvs arg_tys res_ty $
+        hoistPolyVExpr tyvars $ do
+          lc <- builtin liftingContext
+          (vbndrs, vbody) <- vectBndrsIn (vs ++ bs) (vectExpr body)
+          return (wrap (vLams lc vbndrs vbody))
+  where
+    -- Free variables paired with their entry in the local environment;
+    -- variables without an entry are dropped.
+    captured env
+      = unzip [ (fv, vfv)
+              | fv <- varSetElems fvs
+              , Just vfv <- [lookupVarEnv (local_vars env) fv] ]
+
+    wrap
+      | inline    = vInlineMe
+      | otherwise = id
+
+-- Vectorise the application of an expression to type arguments.
+--
+-- Only a variable in head position is supported (handled by vectPolyVar);
+-- for anything else vectorisation is abandoned with cantVectorise, which
+-- is given the offending type application for the message.
+vectTyAppExpr :: CoreExprWithFVs -> [Type] -> VM VExpr
+vectTyAppExpr expr tys
+  = case expr of
+      (_, AnnVar v) -> vectPolyVar v tys
+      _             -> cantVectorise "Can't vectorise expression"
+                                     (ppr (mkTyApps (deAnnotate expr) tys))
+
+-- We convert
+--
+-- case e :: t of v { ... }
+--
+-- to
+--
+-- V: let v' = e in case v' of _ { ... }
+-- L: let v' = e in case v' `cast` ... of _ { ... }
+--
+-- When lifting, we have to do it this way because v must have the type
+-- [:V(T):] but the scrutinee must be cast to the representation type. We also
+-- have to handle the case where v is a wild var correctly.
+--
+
+-- FIXME: this is too lazy
+--
+-- Vectorise a case expression whose alternatives match on data
+-- constructors.
+--
+-- Arguments, in order: a type constructor (looked up with lookupTyCon),
+-- type arguments (unused in every equation), the scrutinee, the case
+-- binder, the result type of the case, and the alternatives.  The
+-- equations are tried in this order:
+--
+--   * exactly one alternative that is DEFAULT, or a constructor pattern
+--     binding no fields: delegated to vectAlgCaseNoFields;
+--   * exactly one constructor alternative with fields: built with
+--     vCaseProd;
+--   * anything else: the alternatives are sorted (DEFAULT first, then by
+--     constructor tag), each right-hand side is vectorised under
+--     packLiftingContext, and the lifted results are merged by combinePA.
+vectAlgCase :: TyCon -> [Type] -> CoreExprWithFVs -> Var -> Type
+            -> [(AltCon, [Var], CoreExprWithFVs)]
+            -> VM VExpr
+vectAlgCase _tycon _ty_args scrut bndr ty [(DEFAULT, [], body)]
+  = vectAlgCaseNoFields scrut bndr ty body
+
+vectAlgCase _tycon _ty_args scrut bndr ty [(DataAlt _, [], body)]
+  = vectAlgCaseNoFields scrut bndr ty body
+
+vectAlgCase tycon _ty_args scrut bndr ty [(DataAlt dc, bndrs, body)]
+  = do
+      vtycon     <- maybeV (lookupTyCon tycon)
+      (vty, lty) <- vectAndLiftType ty
+      vrhs       <- vectExpr scrut
+      (vbndr, (vfields, vbody))
+                 <- bind_scrut (vectBndrsIn bndrs (vectExpr body))
+
+      (vscrut, arr_tc, _arg_tys) <- mkVScrut (vVar vbndr)
+      vdc        <- maybeV (lookupDataCon dc)
+      let [arr_dc] = tyConDataCons arr_tc
+      repr       <- mkRepr vtycon
+      shape_vars <- arrShapeVars repr
+      return (vLet (vNonRec vbndr vrhs)
+                   (vCaseProd vscrut vty lty vdc arr_dc shape_vars vfields vbody))
+  where
+    -- A dead case binder is replaced by a new one named "scrut".
+    bind_scrut
+      | isDeadBinder bndr = vectBndrNewIn bndr (fsLit "scrut")
+      | otherwise         = vectBndrIn bndr
+
+vectAlgCase tycon _ty_args scrut bndr ty alts
+  = do
+      vtycon     <- maybeV (lookupTyCon tycon)
+      (vty, lty) <- vectAndLiftType ty
+      repr       <- mkRepr vtycon
+      shape_vars <- arrShapeVars repr
+      (len, sel, indices) <- arrSelector repr (map Var shape_vars)
+
+      (vbndr, valts) <- bind_scrut (mapM (vect_alt sel vty lty) sorted_alts)
+      let (vdcs, vfieldss, lfieldss, vbodies) = unzip4 valts
+
+      vrhs <- vectExpr scrut
+      (vscrut, arr_tc, _arg_tys) <- mkVScrut (vVar vbndr)
+      let [arr_dc] = tyConDataCons arr_tc
+
+      let (vect_scrut, lift_scrut) = vscrut
+          (vect_rhss, lift_rhss)   = unzip vbodies
+
+      vdummy <- newDummyVar (exprType vect_scrut)
+      ldummy <- newDummyVar (exprType lift_scrut)
+      let vect_alts = zipWith3 (\vdc vfields rhs -> (DataAlt vdc, vfields, rhs))
+                               vdcs vfieldss vect_rhss
+          vect_case = Case vect_scrut vdummy vty vect_alts
+
+      merged <- combinePA vty len sel indices lift_rhss
+      let lift_case = Case lift_scrut ldummy lty
+                        [(DataAlt arr_dc, shape_vars ++ concat lfieldss, merged)]
+
+      return (vLet (vNonRec vbndr vrhs) (vect_case, lift_case))
+  where
+    -- A dead case binder is replaced by a new one named "scrut".
+    bind_scrut
+      | isDeadBinder bndr = vectBndrNewIn bndr (fsLit "scrut")
+      | otherwise         = vectBndrIn bndr
+
+    -- Alternatives ordered with DEFAULT first, then by constructor tag.
+    sorted_alts = sortBy by_con alts
+
+    by_con (con1, _, _) (con2, _, _) = cmp_con con1 con2
+
+    cmp_con (DataAlt dc1) (DataAlt dc2) = compare (dataConTag dc1) (dataConTag dc2)
+    cmp_con DEFAULT       DEFAULT       = EQ
+    cmp_con DEFAULT       _             = LT
+    cmp_con _             DEFAULT       = GT
+    cmp_con _             _             = panic "vectAlgCase/cmp"
+
+    -- Vectorise one constructor alternative; any other kind of alternative
+    -- is a panic.
+    vect_alt sel vty lty (DataAlt dc, fields, rhs)
+      = do
+          vdc <- maybeV (lookupDataCon dc)
+          let tag     = mkDataConTag vdc
+              rhs_fvs = freeVarsOf rhs `delVarSetList` fields
+              vect_rhs len = packLiftingContext len sel tag rhs_fvs vty lty
+                                                (vectExpr rhs)
+          (vfields, lfields, vrhs) <- with_alt_bndrs fields vect_rhs
+          return (vdc, vfields, lfields, vrhs)
+    vect_alt _ _ _ _ = panic "vectAlgCase/proc_alt"
+
+    -- Run the continuation with a length expression for the alternative.
+    -- Without field binders, a fresh "voids" array variable supplies the
+    -- length and is returned as the only lifted binder.
+    with_alt_bndrs [] k
+      = do
+          void_tc <- builtin voidTyCon
+          let void_ty = mkTyConApp void_tc []
+          arr_ty  <- mkPArrayType void_ty
+          voids   <- newLocalVar (fsLit "voids") arr_ty
+          len     <- lengthPA void_ty (Var voids)
+          result  <- k len
+          return ([], [voids], result)
+
+    -- With field binders, the length is taken from the first binder's
+    -- lifted variable; the binders are only in scope inside localV.
+    with_alt_bndrs fields k
+      = localV $ do
+          vpairs <- mapM vectBndr fields
+          let (vfields, lfields) = unzip vpairs
+              vfirst : _ = vfields
+              lfirst : _ = lfields
+          len    <- lengthPA (idType vfirst) (Var lfirst)
+          result <- k len
+          return (vfields, lfields, result)
+
+-- Vectorise a case with a single alternative that binds no constructor
+-- fields: the scrutinee, the result type and the body (with the case
+-- binder in scope) are vectorised, in that order, and combined with
+-- vCaseDEFAULT.
+vectAlgCaseNoFields :: CoreExprWithFVs -> Var -> Type -> CoreExprWithFVs
+                    -> VM VExpr
+vectAlgCaseNoFields scrut bndr ty body
+  = do
+      vscrut         <- vectExpr scrut
+      (vty, lty)     <- vectAndLiftType ty
+      (vbndr, vbody) <- vectBndrIn bndr (vectExpr body)
+      return (vCaseDEFAULT vscrut vbndr vty lty vbody)
+
+-- Run the vectorisation action 'p' with its local free variables packed.
+--
+-- A selector expression is formed by applying the selectPAIntPrimVar
+-- builtin to 'shape' and 'tag' and is bound to a fresh "sel#" variable.
+-- Inside localV, every local identifier in 'fvs' is repacked with
+-- packFreeVar before 'p' runs.  The vectorised half of p's result is
+-- returned unchanged; the lifted half becomes
+--
+--   let sel# = <selector> in
+--   case len of lc { DEFAULT -> let <packed bindings> in <lifted result>
+--                  ; 0       -> <emptyPA vty> }
+--
+-- where lc is the builtin lifting-context variable and the case has
+-- result type 'lty'.
+packLiftingContext :: CoreExpr -> CoreExpr -> CoreExpr -> VarSet
+                   -> Type -> Type -> VM VExpr -> VM VExpr
+packLiftingContext len shape tag fvs vty lty p
+  = do
+      select  <- builtin selectPAIntPrimVar
+      let sel_rhs = mkApps (Var select) [shape, tag]
+      sel_var <- newLocalVar (fsLit "sel#") (exprType sel_rhs)
+      lc_var  <- builtin liftingContext
+      localV $ do
+        packed <- mapM (packFreeVar (Var lc_var) (Var sel_var))
+                       (filter isLocalId (varSetElems fvs))
+        (vexpr, lexpr) <- p
+        empty_arr <- emptyPA vty
+        let non_empty_alt = (DEFAULT, [], mkLets (concat packed) lexpr)
+            empty_alt     = (LitAlt (mkMachInt 0), [], empty_arr)
+            guarded       = Case len lc_var lty [non_empty_alt, empty_alt]
+        return (vexpr, Let (NonRec sel_var sel_rhs) guarded)
+
+-- Produce the binding that packs one free variable.
+--
+-- If lookupVar reports 'v' as a local variable with the pair (vv, lv),
+-- lv is cloned, the clone is bound to the packPA expression built from
+-- lv, 'len' and 'sel', and the local environment is updated so that 'v'
+-- maps to (vv, clone).  The result is that single non-recursive binding.
+-- For any other lookup result nothing is changed and no bindings are
+-- returned.
+packFreeVar :: CoreExpr -> CoreExpr -> Var -> VM [CoreBind]
+packFreeVar len sel v = lookupVar v >>= pack_binding
+  where
+    pack_binding (Local (vv, lv))
+      = do
+          packed_var <- cloneVar lv
+          packed_rhs <- packPA (idType vv) (Var lv) len sel
+          updLEnv $ \env ->
+            env { local_vars = extendVarEnv (local_vars env) v (vv, packed_var) }
+          return [NonRec packed_var packed_rhs]
+    pack_binding _ = return []