X-Git-Url: http://git.megacz.com/?a=blobdiff_plain;f=ghc%2Fcompiler%2FbasicTypes%2FLiteral.lhs;h=1e39e65a55394df277c3905bf9f5f38cc50d4fac;hb=ba2843abdfe6f055777e4e66e8add769fce31d29;hp=016cc8e332abaf14dbcd90372c4d4360b2fb0e0c;hpb=f6d1d276e759f97c80bec8974343322b28ea0545;p=ghc-hetmet.git

diff --git a/ghc/compiler/basicTypes/Literal.lhs b/ghc/compiler/basicTypes/Literal.lhs
index 016cc8e..1e39e65 100644
--- a/ghc/compiler/basicTypes/Literal.lhs
+++ b/ghc/compiler/basicTypes/Literal.lhs
@@ -8,15 +8,20 @@ module Literal
 	( Literal(..)		-- Exported to ParseIface
 	, mkMachInt, mkMachWord
 	, mkMachInt64, mkMachWord64
-	, isLitLitLit, maybeLitLit
+	, isLitLitLit, maybeLitLit, litSize
+	, litIsDupable, litIsTrivial
 	, literalType, literalPrimRep
 	, hashLiteral
 
-	, inIntRange, inWordRange
+	, inIntRange, inWordRange, tARGET_MAX_INT, inCharRange
+	, isZeroLit
 
-	, word2IntLit, int2WordLit, char2IntLit, int2CharLit
+	, word2IntLit, int2WordLit
+	, narrow8IntLit, narrow16IntLit, narrow32IntLit
+	, narrow8WordLit, narrow16WordLit, narrow32WordLit
+	, char2IntLit, int2CharLit
 	, float2IntLit, int2FloatLit, double2IntLit, int2DoubleLit
-	, addr2IntLit, int2AddrLit, float2DoubleLit, double2FloatLit
+	, nullAddrLit, float2DoubleLit, double2FloatLit
 	) where
 
 #include "HsVersions.h"
@@ -24,19 +29,22 @@ module Literal
 import TysPrim		( charPrimTy, addrPrimTy, floatPrimTy, doublePrimTy,
 			  intPrimTy, wordPrimTy, int64PrimTy, word64PrimTy
 			)
-import Name		( hashName )
 import PrimRep		( PrimRep(..) )
-import TyCon		( isNewTyCon )
-import Type		( Type, typePrimRep )
+import TcType		( Type, tcCmpType )
+import Type		( typePrimRep )
 import PprType		( pprParendType )
-import Demand		( Demand )
-import CStrings		( charToC, charToEasyHaskell, pprFSInCStyle )
+import CStrings		( pprFSInCStyle )
 
 import Outputable
+import FastTypes
+import FastString
+import Binary
 import Util		( thenCmp )
 
-import Ratio 		( numerator, denominator )
-import FastString	( uniqueOfFS )
+import Ratio 		( numerator )
+import FastString	( uniqueOfFS, lengthFS )
+import DATA_INT		( Int8,  Int16,  Int32 )
+import DATA_WORD	( Word8, Word16, Word32 )
 import Char		( ord, chr )
 \end{code}
 
@@ -63,6 +71,9 @@ tARGET_MIN_INT = -2147483648
 tARGET_MAX_INT =  2147483647
 #endif
 tARGET_MAX_WORD = (tARGET_MAX_INT * 2) + 1
+
+tARGET_MAX_CHAR :: Int
+tARGET_MAX_CHAR = 0x10ffff
 \end{code}
  
 
@@ -88,20 +99,90 @@ function applications, etc., etc., has not yet been done.
 data Literal
   =	------------------
 	-- First the primitive guys
-    MachChar	Char
-  | MachStr	FAST_STRING
+    MachChar	Int             -- Char#        At least 31 bits
+  | MachStr	FastString
 
-  | MachAddr	Integer	-- Whatever this machine thinks is a "pointer"
+  | MachNullAddr                -- the NULL pointer, the only pointer value
+                                -- that can be represented as a Literal.
 
-  | MachInt	Integer		-- Int#		At least 32 bits
+  | MachInt	Integer		-- Int#		At least WORD_SIZE_IN_BITS bits
   | MachInt64	Integer		-- Int64#	At least 64 bits
-  | MachWord	Integer		-- Word#	At least 32 bits
+  | MachWord	Integer		-- Word#	At least WORD_SIZE_IN_BITS bits
   | MachWord64	Integer		-- Word64#	At least 64 bits
 
   | MachFloat	Rational
   | MachDouble	Rational
 
-  | MachLitLit  FAST_STRING Type	-- Type might be Add# or Int# etc
+        -- MachLabel is used (only) for the literal derived from a
+	-- "foreign label" declaration.
+	-- The string argument is the name of a symbol.  This literal
+	-- refers to the *address* of the label.
+  | MachLabel   FastString		-- always an Addr#
+  		(Maybe Int)             -- the size (in bytes) of the arguments
+					-- the label expects. Only applicable with
+					-- 'stdcall' labels.
+					-- Just x => "@<x>" will be appended to label
+					--           name when emitting asm.
+
+	-- lit-lits only work for via-C compilation, hence they
+	-- are deprecated.  The string is emitted verbatim into
+	-- the C file, and can therefore be any C expression,
+	-- macro call, #defined constant etc.
+  | MachLitLit  FastString Type	-- Type might be Addr# or Int# etc
+\end{code}
+
+Binary instance: must do this manually, because we don't want the type
+arg of MachLitLit involved.
+
+\begin{code}
+instance Binary Literal where
+    put_ bh (MachChar aa)     = do putByte bh 0; put_ bh aa
+    put_ bh (MachStr ab)      = do putByte bh 1; put_ bh ab
+    put_ bh (MachNullAddr)    = do putByte bh 2
+    put_ bh (MachInt ad)      = do putByte bh 3; put_ bh ad
+    put_ bh (MachInt64 ae)    = do putByte bh 4; put_ bh ae
+    put_ bh (MachWord af)     = do putByte bh 5; put_ bh af
+    put_ bh (MachWord64 ag)   = do putByte bh 6; put_ bh ag
+    put_ bh (MachFloat ah)    = do putByte bh 7; put_ bh ah
+    put_ bh (MachDouble ai)   = do putByte bh 8; put_ bh ai
+    put_ bh (MachLabel aj mb) = do putByte bh 9; put_ bh aj ; put_ bh mb
+    put_ bh (MachLitLit ak _) = do putByte bh 10; put_ bh ak  -- the type arg is deliberately not written
+    get bh = do
+	    h <- getByte bh  -- constructor tag; must mirror the numbering used by put_
+	    case h of
+	      0 -> do
+		    aa <- get bh
+		    return (MachChar aa)
+	      1 -> do
+		    ab <- get bh
+		    return (MachStr ab)
+	      2 -> return MachNullAddr
+	      3 -> do
+		    ad <- get bh
+		    return (MachInt ad)
+	      4 -> do
+		    ae <- get bh
+		    return (MachInt64 ae)
+	      5 -> do
+		    af <- get bh
+		    return (MachWord af)
+	      6 -> do
+		    ag <- get bh
+		    return (MachWord64 ag)
+	      7 -> do
+		    ah <- get bh
+		    return (MachFloat ah)
+	      8 -> do
+		    ai <- get bh
+		    return (MachDouble ai)
+	      9 -> do
+		    aj <- get bh
+		    mb <- get bh
+		    return (MachLabel aj mb)
+	      10 -> do  -- put_ wrote no type, so a placeholder that fails if forced stands in for it
+		    ak <- get bh
+		    return (MachLitLit ak (error "MachLitLit: no type"))
+	      _ -> error ("Binary.get(Literal): unknown tag " ++ show h)  -- corrupt or newer-format input
 \end{code}
 
 \begin{code}
@@ -129,45 +210,74 @@ instance Ord Literal where
 \begin{code}
 mkMachInt, mkMachWord, mkMachInt64, mkMachWord64 :: Integer -> Literal
 
-mkMachInt  x   = ASSERT2( inIntRange x,  integer x ) MachInt x
-mkMachWord x   = ASSERT2( inWordRange x, integer x ) MachWord x
-mkMachInt64  x = MachInt64 x	-- Assertions?
-mkMachWord64 x = MachWord64 x	-- Ditto?
+mkMachInt  x   = -- ASSERT2( inIntRange x,  integer x ) 
+	 	 -- Not true: you can write out of range Int# literals
+		 -- For example, one can write (intToWord# 0xffff0000) to
+		 -- get a particular Word bit-pattern, and there's no other
+		 -- convenient way to write such literals, which is why we allow it.
+		 MachInt x
+mkMachWord x   = -- ASSERT2( inWordRange x, integer x ) 
+		 MachWord x
+mkMachInt64  x = MachInt64 x
+mkMachWord64 x = MachWord64 x
 
 inIntRange, inWordRange :: Integer -> Bool
 inIntRange  x = x >= tARGET_MIN_INT && x <= tARGET_MAX_INT
 inWordRange x = x >= 0		    && x <= tARGET_MAX_WORD
+
+inCharRange :: Int -> Bool
+inCharRange c =  c >= 0 && c <= tARGET_MAX_CHAR
+
+isZeroLit :: Literal -> Bool
+isZeroLit (MachInt    0) = True
+isZeroLit (MachInt64  0) = True
+isZeroLit (MachWord   0) = True
+isZeroLit (MachWord64 0) = True
+isZeroLit (MachFloat  0) = True
+isZeroLit (MachDouble 0) = True
+isZeroLit other		 = False
 \end{code}
 
 	Coercions
 	~~~~~~~~~
 \begin{code}
-word2IntLit, int2WordLit, char2IntLit, int2CharLit,
- float2IntLit, int2FloatLit, double2IntLit, int2DoubleLit,
- addr2IntLit, int2AddrLit, float2DoubleLit, double2FloatLit :: Literal -> Literal
+word2IntLit, int2WordLit,
+  narrow8IntLit, narrow16IntLit, narrow32IntLit,
+  narrow8WordLit, narrow16WordLit, narrow32WordLit,
+  char2IntLit, int2CharLit,
+  float2IntLit, int2FloatLit, double2IntLit, int2DoubleLit,
+  float2DoubleLit, double2FloatLit
+  :: Literal -> Literal
 
 word2IntLit (MachWord w) 
-  | w > tARGET_MAX_INT = MachInt ((-1) + tARGET_MAX_WORD - w)
+  | w > tARGET_MAX_INT = MachInt (w - tARGET_MAX_WORD - 1)
   | otherwise	       = MachInt w
 
 int2WordLit (MachInt i)
   | i < 0     = MachWord (1 + tARGET_MAX_WORD + i)	-- (-1)  --->  tARGET_MAX_WORD
   | otherwise = MachWord i
 
-char2IntLit (MachChar c) = MachInt  (toInteger (ord c))
-int2CharLit (MachInt  i) = MachChar (chr (fromInteger i))
+narrow8IntLit    (MachInt  i) = MachInt  (toInteger (fromInteger i :: Int8))
+narrow16IntLit   (MachInt  i) = MachInt  (toInteger (fromInteger i :: Int16))
+narrow32IntLit   (MachInt  i) = MachInt  (toInteger (fromInteger i :: Int32))
+narrow8WordLit   (MachWord w) = MachWord (toInteger (fromInteger w :: Word8))
+narrow16WordLit  (MachWord w) = MachWord (toInteger (fromInteger w :: Word16))
+narrow32WordLit  (MachWord w) = MachWord (toInteger (fromInteger w :: Word32))
+
+char2IntLit (MachChar c) = MachInt  (toInteger c)
+int2CharLit (MachInt  i) = MachChar (fromInteger i)
 
 float2IntLit (MachFloat f) = MachInt   (truncate    f)
 int2FloatLit (MachInt   i) = MachFloat (fromInteger i)
 
-double2IntLit (MachFloat f) = MachInt    (truncate    f)
+double2IntLit (MachDouble f) = MachInt    (truncate    f)
 int2DoubleLit (MachInt   i) = MachDouble (fromInteger i)
 
-addr2IntLit (MachAddr a) = MachInt  a
-int2AddrLit (MachInt  i) = MachAddr i
-
 float2DoubleLit (MachFloat  f) = MachDouble f
 double2FloatLit (MachDouble d) = MachFloat  d
+
+nullAddrLit :: Literal
+nullAddrLit = MachNullAddr
 \end{code}
 
 	Predicates
@@ -178,6 +288,28 @@ isLitLitLit _	    	     = False
 
 maybeLitLit (MachLitLit s t) = Just (s,t)
 maybeLitLit _		     = Nothing
+
+litIsTrivial :: Literal -> Bool
+-- True if there is absolutely no penalty to duplicating the literal
+--	c.f. CoreUtils.exprIsTrivial
+-- False principally of strings
+litIsTrivial (MachStr _) = False
+litIsTrivial other	 = True
+
+litIsDupable :: Literal -> Bool
+-- True if code space does not go bad if we duplicate this literal
+--	c.f. CoreUtils.exprIsDupable
+-- Currently we treat it just like litIsTrivial
+litIsDupable (MachStr _) = False
+litIsDupable other	 = True
+
+litSize :: Literal -> Int
+-- Used by CoreUnfold.sizeExpr
+litSize (MachStr str) = 1 + (lengthFS str `div` 4)
+	-- Every literal has size at least 1, otherwise
+	-- 	f "x" 
+	-- might be too small
+litSize _other	      = 1
 \end{code}
 
 	Types
@@ -186,13 +318,14 @@ maybeLitLit _		     = Nothing
 literalType :: Literal -> Type
 literalType (MachChar _)	  = charPrimTy
 literalType (MachStr  _)	  = addrPrimTy
-literalType (MachAddr _)	  = addrPrimTy
+literalType (MachNullAddr)	  = addrPrimTy
 literalType (MachInt  _)	  = intPrimTy
 literalType (MachWord  _)	  = wordPrimTy
 literalType (MachInt64  _)	  = int64PrimTy
 literalType (MachWord64  _)	  = word64PrimTy
 literalType (MachFloat _)	  = floatPrimTy
 literalType (MachDouble _)	  = doublePrimTy
+literalType (MachLabel _ _)	  = addrPrimTy
 literalType (MachLitLit _ ty)	  = ty
 \end{code}
 
@@ -201,13 +334,14 @@ literalPrimRep :: Literal -> PrimRep
 
 literalPrimRep (MachChar _)	  = CharRep
 literalPrimRep (MachStr _)	  = AddrRep  -- specifically: "char *"
-literalPrimRep (MachAddr  _)	  = AddrRep
+literalPrimRep (MachNullAddr)	  = AddrRep
 literalPrimRep (MachInt _) 	  = IntRep
 literalPrimRep (MachWord _) 	  = WordRep
 literalPrimRep (MachInt64 _)	  = Int64Rep
 literalPrimRep (MachWord64 _)	  = Word64Rep
 literalPrimRep (MachFloat _)	  = FloatRep
 literalPrimRep (MachDouble _)	  = DoubleRep
+literalPrimRep (MachLabel _ _)	  = AddrRep
 literalPrimRep (MachLitLit _ ty)  = typePrimRep ty
 \end{code}
 
@@ -217,49 +351,50 @@ literalPrimRep (MachLitLit _ ty)  = typePrimRep ty
 \begin{code}
 cmpLit (MachChar      a)   (MachChar	   b)   = a `compare` b
 cmpLit (MachStr       a)   (MachStr	   b)   = a `compare` b
-cmpLit (MachAddr      a)   (MachAddr	   b)   = a `compare` b
+cmpLit (MachNullAddr)      (MachNullAddr)       = EQ
 cmpLit (MachInt       a)   (MachInt	   b)   = a `compare` b
 cmpLit (MachWord      a)   (MachWord	   b)   = a `compare` b
 cmpLit (MachInt64     a)   (MachInt64	   b)   = a `compare` b
 cmpLit (MachWord64    a)   (MachWord64	   b)   = a `compare` b
 cmpLit (MachFloat     a)   (MachFloat	   b)   = a `compare` b
 cmpLit (MachDouble    a)   (MachDouble	   b)   = a `compare` b
-cmpLit (MachLitLit    a b) (MachLitLit    c d)  = (a `compare` c) `thenCmp` (b `compare` d)
-cmpLit lit1		   lit2		        | litTag lit1 _LT_ litTag lit2 = LT
+cmpLit (MachLabel     a b) (MachLabel      c d) = (a `compare` c) `thenCmp` (b `compare` d)  -- the stdcall size is part of the emitted symbol
+cmpLit (MachLitLit    a b) (MachLitLit    c d)  = (a `compare` c) `thenCmp` (b `tcCmpType` d)
+cmpLit lit1		   lit2		        | litTag lit1 <# litTag lit2 = LT
 					        | otherwise  		       = GT
 
-litTag (MachChar      _)   = ILIT(1)
-litTag (MachStr       _)   = ILIT(2)
-litTag (MachAddr      _)   = ILIT(3)
-litTag (MachInt       _)   = ILIT(4)
-litTag (MachWord      _)   = ILIT(5)
-litTag (MachInt64     _)   = ILIT(6)
-litTag (MachWord64    _)   = ILIT(7)
-litTag (MachFloat     _)   = ILIT(8)
-litTag (MachDouble    _)   = ILIT(9)
-litTag (MachLitLit    _ _) = ILIT(10)
+litTag (MachChar      _)   = _ILIT(1)
+litTag (MachStr       _)   = _ILIT(2)
+litTag (MachNullAddr)      = _ILIT(3)
+litTag (MachInt       _)   = _ILIT(4)
+litTag (MachWord      _)   = _ILIT(5)
+litTag (MachInt64     _)   = _ILIT(6)
+litTag (MachWord64    _)   = _ILIT(7)
+litTag (MachFloat     _)   = _ILIT(8)
+litTag (MachDouble    _)   = _ILIT(9)
+litTag (MachLabel   _ _)   = _ILIT(10)
+litTag (MachLitLit  _ _)   = _ILIT(11)
 \end{code}
 
 	Printing
 	~~~~~~~~
 * MachX (i.e. unboxed) things are printed unadornded (e.g. 3, 'a', "foo")
-  exceptions: MachFloat and MachAddr get an initial keyword prefix
+  exceptions: some literals (e.g. MachFloat, MachWord64, MachNullAddr, MachLabel, MachLitLit) get an initial keyword prefix.
 
 \begin{code}
 pprLit lit
   = getPprStyle $ \ sty ->
     let
       code_style  = codeStyle  sty
-      iface_style = ifaceStyle sty
     in
     case lit of
-      MachChar ch | code_style  -> hcat [ptext SLIT("(C_)"), char '\'', 
-					 text (charToC ch), char '\'']
-	          | iface_style -> char '\'' <> text (charToEasyHaskell ch) <> char '\''
-		  | otherwise   -> text ['\'', ch, '\'']
+      MachChar ch | code_style -> hcat [ptext SLIT("(C_)"), text (show ch)]
+	          | otherwise  -> pprHsChar ch
 
       MachStr s | code_style -> pprFSInCStyle s
-	        | otherwise  -> pprFSAsString s
+	        | otherwise  -> pprHsString s
+      -- Warning: printing MachStr in code_style assumes it contains
+      -- only characters '\0'..'\xFF'!
 
       MachInt i | code_style && i == tARGET_MIN_INT -> parens (integer (i+1) <> text "-1")
 				-- Avoid a problem whereby gcc interprets
@@ -275,20 +410,32 @@ pprLit lit
       MachWord64 w | code_style -> pprHexVal w
 		   | otherwise  -> ptext SLIT("__word64") <+> integer w
 
-      MachFloat f | code_style -> ptext SLIT("(StgFloat)") <> rational f
+      MachFloat f | code_style -> ptext SLIT("(StgFloat)") <> code_rational f
                   | otherwise  -> ptext SLIT("__float") <+> rational f
 
-      MachDouble d | iface_style && d < 0 -> parens (rational d)
-		   | otherwise            -> rational d
+      MachDouble d | code_style -> code_rational d
+		   | otherwise  -> rational d
+
+      MachNullAddr | code_style -> ptext SLIT("(void*)0")
+	           | otherwise  -> ptext SLIT("__NULL")
 
-      MachAddr p | code_style -> ptext SLIT("(void*)") <> integer p
-	         | otherwise  -> ptext SLIT("__addr") <+> integer p
+      MachLabel l mb
+         | code_style -> ptext SLIT("(&") <> ftext l <> char ')'
+	 | otherwise  -> ptext SLIT("__label") <+> 
+	     case mb of
+	       Nothing -> pprHsString l
+	       Just x  -> doubleQuotes (text (unpackFS l ++ '@':show x))
 
-      MachLitLit s ty | code_style  -> ptext s
+      MachLitLit s ty | code_style  -> ftext s
 		      | otherwise   -> parens (hsep [ptext SLIT("__litlit"), 
-						     pprFSAsString s,
+						     pprHsString s,
 						     pprParendType ty])
 
+-- negative floating literals in code style need parentheses to avoid
+-- interacting with surrounding syntax.
+code_rational d | d < 0     = parens (rational d)
+                | otherwise = rational d
+
 pprIntVal :: Integer -> SDoc
 -- Print negative integers with parens to be sure it's unambiguous
 pprIntVal i | i < 0     = parens (integer i)
@@ -319,15 +466,16 @@ Hash values should be zero or a positive integer.  No negatives please.
 
 \begin{code}
 hashLiteral :: Literal -> Int
-hashLiteral (MachChar c)    	= ord c + 1000	-- Keep it out of range of common ints
+hashLiteral (MachChar c)    	= c + 1000	-- Keep it out of range of common ints
 hashLiteral (MachStr s)     	= hashFS s
-hashLiteral (MachAddr i)    	= hashInteger i
+hashLiteral (MachNullAddr)    	= 1	-- Not 0: zero is a Bad Number when hashes are combined with *
 hashLiteral (MachInt i)   	= hashInteger i
 hashLiteral (MachInt64 i) 	= hashInteger i
 hashLiteral (MachWord i)   	= hashInteger i
 hashLiteral (MachWord64 i) 	= hashInteger i
 hashLiteral (MachFloat r)   	= hashRational r
 hashLiteral (MachDouble r)  	= hashRational r
+hashLiteral (MachLabel s _)     = hashFS s
 hashLiteral (MachLitLit s _)    = hashFS s
 
 hashRational :: Rational -> Int
@@ -338,6 +486,6 @@ hashInteger i = 1 + abs (fromInteger (i `rem` 10000))
 		-- The 1+ is to avoid zero, which is a Bad Number
 		-- since we use * to combine hash values
 
-hashFS :: FAST_STRING -> Int
-hashFS s = IBOX( uniqueOfFS s )
+hashFS :: FastString -> Int
+hashFS s = iBox (uniqueOfFS s)
 \end{code}