[project @ 2003-03-27 17:59:09 by sof]

[ghc-hetmet.git] / ghc / compiler / basicTypes / Literal.lhs
diff --git a/ghc/compiler/basicTypes/Literal.lhs b/ghc/compiler/basicTypes/Literal.lhs

index d2f6509..32815b9 100644 (file)
--- a/ghc/compiler/basicTypes/Literal.lhs
+++ b/ghc/compiler/basicTypes/Literal.lhs
@@ -8,15 +8,20 @@ module Literal
         ( Literal(..)           -- Exported to ParseIface
         , mkMachInt, mkMachWord
         , mkMachInt64, mkMachWord64
-       , isLitLitLit, maybeLitLit, litIsDupable,
+       , isLitLitLit, maybeLitLit, litSize
+       , litIsDupable, litIsTrivial
         , literalType, literalPrimRep
         , hashLiteral
  
-       , inIntRange, inWordRange, tARGET_MAX_INT
+       , inIntRange, inWordRange, tARGET_MAX_INT, inCharRange
+       , isZeroLit
  
-       , word2IntLit, int2WordLit, char2IntLit, int2CharLit
+       , word2IntLit, int2WordLit
+       , narrow8IntLit, narrow16IntLit, narrow32IntLit
+       , narrow8WordLit, narrow16WordLit, narrow32WordLit
+       , char2IntLit, int2CharLit
         , float2IntLit, int2FloatLit, double2IntLit, int2DoubleLit
-       , addr2IntLit, int2AddrLit, float2DoubleLit, double2FloatLit
+       , nullAddrLit, float2DoubleLit, double2FloatLit
         ) where
  
  #include "HsVersions.h"
@@ -25,15 +30,21 @@ import TysPrim              ( charPrimTy, addrPrimTy, floatPrimTy, doublePrimTy,
                           intPrimTy, wordPrimTy, int64PrimTy, word64PrimTy
                         )
  import PrimRep         ( PrimRep(..) )
-import Type            ( Type, typePrimRep )
+import TcType          ( Type, tcCmpType )
+import Type            ( typePrimRep )
  import PprType         ( pprParendType )
  import CStrings                ( pprFSInCStyle )
  
  import Outputable
+import FastTypes
+import FastString
+import Binary
  import Util            ( thenCmp )
  
-import Ratio           ( numerator, denominator )
-import FastString      ( uniqueOfFS )
+import Ratio           ( numerator )
+import FastString      ( uniqueOfFS, lengthFS )
+import DATA_INT                ( Int8,  Int16,  Int32 )
+import DATA_WORD       ( Word8, Word16, Word32 )
  import Char            ( ord, chr )
  \end{code}
  
@@ -60,6 +71,9 @@ tARGET_MIN_INT = -2147483648
  tARGET_MAX_INT =  2147483647
  #endif
  tARGET_MAX_WORD = (tARGET_MAX_INT * 2) + 1
+
+tARGET_MAX_CHAR :: Int
+tARGET_MAX_CHAR = 0x10ffff
  \end{code}
   
  
@@ -86,27 +100,89 @@ data Literal
    =    ------------------
         -- First the primitive guys
      MachChar   Int             -- Char#        At least 31 bits
-  | MachStr    FAST_STRING
+  | MachStr    FastString
  
    | MachAddr   Integer -- Whatever this machine thinks is a "pointer"
  
-  | MachInt    Integer         -- Int#         At least 32 bits
+  | MachInt    Integer         -- Int#         At least WORD_SIZE_IN_BITS bits
    | MachInt64  Integer         -- Int64#       At least 64 bits
-  | MachWord   Integer         -- Word#        At least 32 bits
+  | MachWord   Integer         -- Word#        At least WORD_SIZE_IN_BITS bits
    | MachWord64 Integer         -- Word64#      At least 64 bits
  
    | MachFloat  Rational
    | MachDouble Rational
  
+        -- MachLabel is used (only) for the literal derived from a 
+       -- "foreign label" declaration.
         -- string argument is the name of a symbol.  This literal
         -- refers to the *address* of the label.
-  | MachLabel   FAST_STRING            -- always an Addr#
+  | MachLabel   FastString             -- always an Addr#
+               (Maybe Int)             -- the size (in bytes) of the arguments
+                                       -- the label expects. Only applicable with
+                                       -- 'stdcall' labels.
+                                       -- Just x => "@<x>" will be appended to label
+                                       --           name when emitting asm.
  
         -- lit-lits only work for via-C compilation, hence they
         -- are deprecated.  The string is emitted verbatim into
         -- the C file, and can therefore be any C expression,
         -- macro call, #defined constant etc.
-  | MachLitLit  FAST_STRING Type       -- Type might be Addr# or Int# etc
+  | MachLitLit  FastString Type        -- Type might be Addr# or Int# etc
+\end{code}
+
+The Binary instance is written by hand, because the type argument of
+MachLitLit must be left out of the serialised form.
+
+\begin{code}
+-- Hand-written so that the Type field of MachLitLit stays out of the
+-- encoding.  A literal is written as a one-byte constructor tag followed
+-- by the constructor's fields; the tag numbers used by put_ and get must
+-- be kept in step.
+instance Binary Literal where
+    put_ bh (MachChar aa)     = do putByte bh 0; put_ bh aa
+    put_ bh (MachStr ab)      = do putByte bh 1; put_ bh ab
+    put_ bh (MachAddr ac)     = do putByte bh 2; put_ bh ac
+    put_ bh (MachInt ad)      = do putByte bh 3; put_ bh ad
+    put_ bh (MachInt64 ae)    = do putByte bh 4; put_ bh ae
+    put_ bh (MachWord af)     = do putByte bh 5; put_ bh af
+    put_ bh (MachWord64 ag)   = do putByte bh 6; put_ bh ag
+    put_ bh (MachFloat ah)    = do putByte bh 7; put_ bh ah
+    put_ bh (MachDouble ai)   = do putByte bh 8; put_ bh ai
+    put_ bh (MachLabel aj mb) = do putByte bh 9; put_ bh aj ; put_ bh mb
+    -- Only the string of a lit-lit is written; its Type is dropped and
+    -- is therefore not available again after reading (see get, tag 10).
+    put_ bh (MachLitLit ak _) = do putByte bh 10; put_ bh ak
+
+    get bh = do
+           h <- getByte bh
+           case h of
+             0  -> do aa <- get bh
+                      return (MachChar aa)
+             1  -> do ab <- get bh
+                      return (MachStr ab)
+             2  -> do ac <- get bh
+                      return (MachAddr ac)
+             3  -> do ad <- get bh
+                      return (MachInt ad)
+             4  -> do ae <- get bh
+                      return (MachInt64 ae)
+             5  -> do af <- get bh
+                      return (MachWord af)
+             6  -> do ag <- get bh
+                      return (MachWord64 ag)
+             7  -> do ah <- get bh
+                      return (MachFloat ah)
+             8  -> do ai <- get bh
+                      return (MachDouble ai)
+             9  -> do aj <- get bh
+                      mb <- get bh
+                      return (MachLabel aj mb)
+             -- The Type was never written, so a placeholder that fails
+             -- if it is ever demanded stands in for it.
+             10 -> do ak <- get bh
+                      return (MachLitLit ak (error "MachLitLit: no type"))
+             -- Any other tag means the input is not a literal written by put_
+             _  -> error ("Binary.get(Literal): unknown tag " ++ show h)
  \end{code}
  
  \begin{code}
@@ -134,22 +210,44 @@ instance Ord Literal where
  \begin{code}
  mkMachInt, mkMachWord, mkMachInt64, mkMachWord64 :: Integer -> Literal
  
-mkMachInt  x   = ASSERT2( inIntRange x,  integer x ) MachInt x
-mkMachWord x   = ASSERT2( inWordRange x, integer x ) MachWord x
-mkMachInt64  x = MachInt64 x   -- Assertions?
-mkMachWord64 x = MachWord64 x  -- Ditto?
+mkMachInt  x   = -- ASSERT2( inIntRange x,  integer x ) 
+                -- The assertion does not hold: out-of-range Int# literals are allowed.
+                -- For example, one can write (int2Word# 0xffff0000) to
+                -- get a particular Word bit-pattern, and there's no other
+                -- convenient way to write such literals, which is why we allow it.
+                MachInt x
+mkMachWord x   = -- ASSERT2( inWordRange x, integer x ) 
+                MachWord x
+mkMachInt64  x = MachInt64 x
+mkMachWord64 x = MachWord64 x
  
  inIntRange, inWordRange :: Integer -> Bool
  inIntRange  x = x >= tARGET_MIN_INT && x <= tARGET_MAX_INT
  inWordRange x = x >= 0             && x <= tARGET_MAX_WORD
+
+inCharRange :: Int -> Bool
+inCharRange c =  c >= 0 && c <= tARGET_MAX_CHAR
+
+isZeroLit :: Literal -> Bool
+isZeroLit (MachInt    0) = True
+isZeroLit (MachInt64  0) = True
+isZeroLit (MachWord   0) = True
+isZeroLit (MachWord64 0) = True
+isZeroLit (MachFloat  0) = True
+isZeroLit (MachDouble 0) = True
+isZeroLit other                 = False
  \end{code}
  
         Coercions
         ~~~~~~~~~
  \begin{code}
-word2IntLit, int2WordLit, char2IntLit, int2CharLit,
- float2IntLit, int2FloatLit, double2IntLit, int2DoubleLit,
- addr2IntLit, int2AddrLit, float2DoubleLit, double2FloatLit :: Literal -> Literal
+word2IntLit, int2WordLit,
+  narrow8IntLit, narrow16IntLit, narrow32IntLit,
+  narrow8WordLit, narrow16WordLit, narrow32WordLit,
+  char2IntLit, int2CharLit,
+  float2IntLit, int2FloatLit, double2IntLit, int2DoubleLit,
+  float2DoubleLit, double2FloatLit
+  :: Literal -> Literal
  
  word2IntLit (MachWord w) 
    | w > tARGET_MAX_INT = MachInt (w - tARGET_MAX_WORD - 1)
@@ -159,20 +257,27 @@ int2WordLit (MachInt i)
    | i < 0     = MachWord (1 + tARGET_MAX_WORD + i)     -- (-1)  --->  tARGET_MAX_WORD
    | otherwise = MachWord i
  
+narrow8IntLit    (MachInt  i) = MachInt  (toInteger (fromInteger i :: Int8))
+narrow16IntLit   (MachInt  i) = MachInt  (toInteger (fromInteger i :: Int16))
+narrow32IntLit   (MachInt  i) = MachInt  (toInteger (fromInteger i :: Int32))
+narrow8WordLit   (MachWord w) = MachWord (toInteger (fromInteger w :: Word8))
+narrow16WordLit  (MachWord w) = MachWord (toInteger (fromInteger w :: Word16))
+narrow32WordLit  (MachWord w) = MachWord (toInteger (fromInteger w :: Word32))
+
  char2IntLit (MachChar c) = MachInt  (toInteger c)
  int2CharLit (MachInt  i) = MachChar (fromInteger i)
  
  float2IntLit (MachFloat f) = MachInt   (truncate    f)
  int2FloatLit (MachInt   i) = MachFloat (fromInteger i)
  
-double2IntLit (MachFloat f) = MachInt    (truncate    f)
+double2IntLit (MachDouble f) = MachInt    (truncate    f)
  int2DoubleLit (MachInt   i) = MachDouble (fromInteger i)
  
-addr2IntLit (MachAddr a) = MachInt  a
-int2AddrLit (MachInt  i) = MachAddr i
-
  float2DoubleLit (MachFloat  f) = MachDouble f
  double2FloatLit (MachDouble d) = MachFloat  d
+
+nullAddrLit :: Literal
+nullAddrLit = MachAddr 0
  \end{code}
  
         Predicates
@@ -184,11 +289,27 @@ isLitLitLit _                  = False
  maybeLitLit (MachLitLit s t) = Just (s,t)
  maybeLitLit _               = Nothing
  
+litIsTrivial :: Literal -> Bool
+-- A literal is trivial when duplicating it carries no penalty at all
+-- (c.f. CoreUtils.exprIsTrivial); only string literals are not trivial.
+litIsTrivial lit = case lit of
+                     MachStr _ -> False
+                     _         -> True
+
  litIsDupable :: Literal -> Bool
-       -- True if code space does not go bad if we duplicate this literal
-       -- False principally of strings
+-- True if code space does not go bad if we duplicate this literal
+--     c.f. CoreUtils.exprIsDupable
+-- Currently we treat it just like litIsTrivial
  litIsDupable (MachStr _) = False
  litIsDupable other      = True
+
+litSize :: Literal -> Int
+-- Size estimate used by CoreUnfold.sizeExpr.  Every literal counts at
+-- least 1, otherwise an application such as  f "x"  might be too small;
+-- a string adds one more unit for every four of its length (lengthFS).
+litSize lit = case lit of
+                MachStr str -> 1 + (lengthFS str `div` 4)
+                _           -> 1
  \end{code}
  
         Types
@@ -204,7 +325,7 @@ literalType (MachInt64  _)    = int64PrimTy
  literalType (MachWord64  _)      = word64PrimTy
  literalType (MachFloat _)        = floatPrimTy
  literalType (MachDouble _)       = doublePrimTy
-literalType (MachLabel _)        = addrPrimTy
+literalType (MachLabel _ _)      = addrPrimTy
  literalType (MachLitLit _ ty)    = ty
  \end{code}
  
@@ -220,7 +341,7 @@ literalPrimRep (MachInt64 _)          = Int64Rep
  literalPrimRep (MachWord64 _)    = Word64Rep
  literalPrimRep (MachFloat _)     = FloatRep
  literalPrimRep (MachDouble _)    = DoubleRep
-literalPrimRep (MachLabel _)     = AddrRep
+literalPrimRep (MachLabel _ _)   = AddrRep
  literalPrimRep (MachLitLit _ ty)  = typePrimRep ty
  \end{code}
  
@@ -237,22 +358,22 @@ cmpLit (MachInt64     a)   (MachInt64        b)   = a `compare` b
  cmpLit (MachWord64    a)   (MachWord64    b)   = a `compare` b
  cmpLit (MachFloat     a)   (MachFloat     b)   = a `compare` b
  cmpLit (MachDouble    a)   (MachDouble    b)   = a `compare` b
-cmpLit (MachLabel     a)   (MachLabel      b)   = a `compare` b
-cmpLit (MachLitLit    a b) (MachLitLit    c d)  = (a `compare` c) `thenCmp` (b `compare` d)
-cmpLit lit1               lit2                 | litTag lit1 _LT_ litTag lit2 = LT
+cmpLit (MachLabel     a _) (MachLabel      b _) = a `compare` b
+cmpLit (MachLitLit    a b) (MachLitLit    c d)  = (a `compare` c) `thenCmp` (b `tcCmpType` d)
+cmpLit lit1               lit2                 | litTag lit1 <# litTag lit2 = LT
                                                 | otherwise                    = GT
  
-litTag (MachChar      _)   = ILIT(1)
-litTag (MachStr       _)   = ILIT(2)
-litTag (MachAddr      _)   = ILIT(3)
-litTag (MachInt       _)   = ILIT(4)
-litTag (MachWord      _)   = ILIT(5)
-litTag (MachInt64     _)   = ILIT(6)
-litTag (MachWord64    _)   = ILIT(7)
-litTag (MachFloat     _)   = ILIT(8)
-litTag (MachDouble    _)   = ILIT(9)
-litTag (MachLabel     _)   = ILIT(10)
-litTag (MachLitLit    _ _) = ILIT(11)
+litTag (MachChar      _)   = _ILIT(1)
+litTag (MachStr       _)   = _ILIT(2)
+litTag (MachAddr      _)   = _ILIT(3)
+litTag (MachInt       _)   = _ILIT(4)
+litTag (MachWord      _)   = _ILIT(5)
+litTag (MachInt64     _)   = _ILIT(6)
+litTag (MachWord64    _)   = _ILIT(7)
+litTag (MachFloat     _)   = _ILIT(8)
+litTag (MachDouble    _)   = _ILIT(9)
+litTag (MachLabel   _ _)   = _ILIT(10)
+litTag (MachLitLit  _ _)   = _ILIT(11)
  \end{code}
  
         Printing
@@ -265,7 +386,6 @@ pprLit lit
    = getPprStyle $ \ sty ->
      let
        code_style  = codeStyle  sty
-      iface_style = ifaceStyle sty
      in
      case lit of
        MachChar ch | code_style -> hcat [ptext SLIT("(C_)"), text (show ch)]
@@ -290,23 +410,32 @@ pprLit lit
        MachWord64 w | code_style -> pprHexVal w
                    | otherwise  -> ptext SLIT("__word64") <+> integer w
  
-      MachFloat f | code_style -> ptext SLIT("(StgFloat)") <> rational f
+      MachFloat f | code_style -> ptext SLIT("(StgFloat)") <> code_rational f
                    | otherwise  -> ptext SLIT("__float") <+> rational f
  
-      MachDouble d | iface_style && d < 0 -> parens (rational d)
-                  | otherwise            -> rational d
+      MachDouble d | code_style -> code_rational d
+                  | otherwise  -> rational d
  
        MachAddr p | code_style -> ptext SLIT("(void*)") <> integer p
                  | otherwise  -> ptext SLIT("__addr") <+> integer p
  
-      MachLabel l | code_style -> ptext SLIT("(&") <> ptext l <> char ')'
-                 | otherwise  -> ptext SLIT("__label") <+> pprHsString l
+      MachLabel l mb
+         | code_style -> ptext SLIT("(&") <> ftext l <> char ')'
+        | otherwise  -> ptext SLIT("__label") <+> 
+            case mb of
+              Nothing -> pprHsString l
+              Just x  -> doubleQuotes (text (unpackFS l ++ '@':show x))
  
-      MachLitLit s ty | code_style  -> ptext s
+      MachLitLit s ty | code_style  -> ftext s
                       | otherwise   -> parens (hsep [ptext SLIT("__litlit"), 
                                                      pprHsString s,
                                                      pprParendType ty])
  
+-- Negative floating literals in code style are wrapped in parentheses so
+-- that the sign cannot interact with the surrounding syntax.
+code_rational :: Rational -> SDoc
+code_rational d = if d < 0 then parens (rational d) else rational d
+
  pprIntVal :: Integer -> SDoc
  -- Print negative integers with parens to be sure it's unambiguous
  pprIntVal i | i < 0     = parens (integer i)
@@ -346,7 +475,7 @@ hashLiteral (MachWord i)    = hashInteger i
  hashLiteral (MachWord64 i)     = hashInteger i
  hashLiteral (MachFloat r)      = hashRational r
  hashLiteral (MachDouble r)     = hashRational r
-hashLiteral (MachLabel s)       = hashFS s
+hashLiteral (MachLabel s _)     = hashFS s
  hashLiteral (MachLitLit s _)    = hashFS s
  
  hashRational :: Rational -> Int
@@ -357,6 +486,6 @@ hashInteger i = 1 + abs (fromInteger (i `rem` 10000))
                 -- The 1+ is to avoid zero, which is a Bad Number
                 -- since we use * to combine hash values
  
-hashFS :: FAST_STRING -> Int
-hashFS s = IBOX( uniqueOfFS s )
+hashFS :: FastString -> Int
+hashFS s = iBox (uniqueOfFS s)
  \end{code}