X-Git-Url: http://git.megacz.com/?a=blobdiff_plain;f=ghc%2Fcompiler%2Futils%2FPrimPacked.lhs;h=f2d034dcee619b86e0b92fd5fb78763130cdaf86;hb=2a2efb720c0fdc06fe749f96f284b00b30f8f3f7;hp=d6b25c45402442e02dc6f6a86cb2fbe7cb5a9253;hpb=4054c720d8fe5e4e9bae01d444c01addc2c32aba;p=ghc-hetmet.git diff --git a/ghc/compiler/utils/PrimPacked.lhs b/ghc/compiler/utils/PrimPacked.lhs index d6b25c4..f2d034d 100644 --- a/ghc/compiler/utils/PrimPacked.lhs +++ b/ghc/compiler/utils/PrimPacked.lhs @@ -8,136 +8,166 @@ of bytes (character strings). Used by the interface lexer input subsystem, mostly. \begin{code} -{-# OPTIONS -fvia-C -monly-3-regs #-} -module PrimPacked - ( - strLength, -- :: _Addr -> Int - copyPrefixStr, -- :: _Addr -> Int -> ByteArray Int - copySubStr, -- :: _Addr -> Int -> Int -> ByteArray Int - copySubStrBA, -- :: ByteArray Int -> Int -> Int -> ByteArray Int - - eqStrPrefix, -- :: Addr# -> ByteArray# -> Int# -> Bool - eqCharStrPrefix, -- :: Addr# -> Addr# -> Int# -> Bool - eqStrPrefixBA, -- :: ByteArray# -> ByteArray# -> Int# -> Int# -> Bool - eqCharStrPrefixBA, -- :: Addr# -> ByteArray# -> Int# -> Int# -> Bool - - addrOffset# -- :: Addr# -> Int# -> Addr# - ) where +{-# OPTIONS -optc-DNON_POSIX_SOURCE #-} + +module PrimPacked ( + Ptr(..), nullPtr, plusAddr#, + BA(..), + packString, -- :: String -> (Int, BA) + unpackNBytesBA, -- :: BA -> Int -> [Char] + strLength, -- :: Ptr CChar -> Int + copyPrefixStr, -- :: Addr# -> Int -> BA + copySubStrBA, -- :: BA -> Int -> Int -> BA + eqStrPrefix, -- :: Addr# -> ByteArray# -> Int# -> Bool + eqStrPrefixBA, -- :: ByteArray# -> ByteArray# -> Int# -> Int# -> Bool + ) where -- This #define suppresses the "import FastString" that -- HsVersions otherwise produces #define COMPILING_FAST_STRING #include "HsVersions.h" -import GlaExts -#if __GLASGOW_HASKELL__ < 411 -import PrelAddr ( Addr(..) ) -#else -import Addr ( Addr(..) ) -#endif -import ST +import GLAEXTS +import UNSAFE_IO ( unsafePerformIO ) + +import MONAD_ST import Foreign -#if __GLASGOW_HASKELL__ < 301 -import ArrBase ( StateAndMutableByteArray#(..), - StateAndByteArray#(..) ) -import STBase -#elif __GLASGOW_HASKELL__ < 400 -import PrelArr ( StateAndMutableByteArray#(..), - StateAndByteArray#(..) ) +#if __GLASGOW_HASKELL__ < 503 import PrelST #else -import PrelST +import GHC.ST +#endif + +#if __GLASGOW_HASKELL__ >= 504 +import GHC.Ptr ( Ptr(..) ) +#elif __GLASGOW_HASKELL__ >= 500 +import Ptr ( Ptr(..) ) +#endif + +#if __GLASGOW_HASKELL__ < 504 +import PrelIOBase ( IO(..) ) +#else +import GHC.IOBase ( IO(..) ) +#endif +\end{code} + +Compatibility: 4.08 didn't have the Ptr type. + +\begin{code} +#if __GLASGOW_HASKELL__ <= 408 +data Ptr a = Ptr Addr# deriving (Eq, Ord) + +nullPtr :: Ptr a +nullPtr = Ptr (int2Addr# 0#) +#endif + +#if __GLASGOW_HASKELL__ <= 500 +-- plusAddr# is a primop in GHC > 5.00 +plusAddr# :: Addr# -> Int# -> Addr# +plusAddr# a# i# = int2Addr# (addr2Int# a# +# i#) #endif +\end{code} + +Wrapper types for bytearrays + +\begin{code} +data BA = BA ByteArray# +data MBA s = MBA (MutableByteArray# s) +\end{code} -\end{code} +\begin{code} +packString :: String -> (Int, BA) +packString str = (l, arr) + where + l@(I# length#) = length str + + arr = runST (do + ch_array <- new_ps_array length# + -- fill in packed string from "str" + fill_in ch_array 0# str + -- freeze the puppy: + freeze_ps_array ch_array length# + ) + + fill_in :: MBA s -> Int# -> [Char] -> ST s () + fill_in arr_in# idx [] = + return () + fill_in arr_in# idx (C# c : cs) = + write_ps_array arr_in# idx c >> + fill_in arr_in# (idx +# 1#) cs +\end{code} -Return the length of a @\\NUL@ terminated character string: +Unpacking a string \begin{code} -strLength :: Addr -> Int -strLength a = - unsafePerformIO ( - _ccall_ strlen a >>= \ len@(I# _) -> - return len - ) -{-# NOINLINE strLength #-} +unpackNBytesBA :: BA -> Int -> [Char] +unpackNBytesBA (BA bytes) (I# len) + = unpack 0# + where + unpack nh + | nh >=# len = [] + | otherwise = C# ch : unpack (nh +# 1#) + where + ch = indexCharArray# bytes nh \end{code} -Copying a char string prefix into a byte array, -{\em assuming} the prefix does not contain any -NULs. +Copying a char string prefix into a byte array. \begin{code} -copyPrefixStr :: Addr -> Int -> ByteArray Int -copyPrefixStr (A# a) len@(I# length#) = - runST ( - {- allocate an array that will hold the string - (not forgetting the NUL at the end) - -} - (new_ps_array (length# +# 1#)) >>= \ ch_array -> -{- Revert back to Haskell-only solution for the moment. - _ccall_ memcpy ch_array (A# a) len >>= \ () -> - write_ps_array ch_array length# (chr# 0#) >> --} - -- fill in packed string from "addr" - fill_in ch_array 0# >> - -- freeze the puppy: - freeze_ps_array ch_array length# >>= \ barr -> - return barr ) - where - fill_in :: MutableByteArray s Int -> Int# -> ST s () - - fill_in arr_in# idx +copyPrefixStr :: Addr# -> Int -> BA +copyPrefixStr a# len@(I# length#) = copy' length# + where + copy' length# = runST (do + {- allocate an array that will hold the string + -} + ch_array <- new_ps_array length# + {- Revert back to Haskell-only solution for the moment. + _ccall_ memcpy ch_array (A# a) len >>= \ () -> + write_ps_array ch_array length# (chr# 0#) >> + -} + -- fill in packed string from "addr" + fill_in ch_array 0# + -- freeze the puppy: + freeze_ps_array ch_array length# + ) + + fill_in :: MBA s -> Int# -> ST s () + fill_in arr_in# idx | idx ==# length# - = write_ps_array arr_in# idx (chr# 0#) >> - return () + = return () | otherwise - = case (indexCharOffAddr# a idx) of { ch -> + = case (indexCharOffAddr# a# idx) of { ch -> write_ps_array arr_in# idx ch >> fill_in arr_in# (idx +# 1#) } - \end{code} Copying out a substring, assume a 0-indexed string: (and positive lengths, thank you). \begin{code} -copySubStr :: Addr -> Int -> Int -> ByteArray Int -copySubStr a start length = - unsafePerformIO ( - _casm_ `` %r= (char *)((char *)%0 + (int)%1); '' a start - >>= \ a_start -> - return (copyPrefixStr a_start length)) - --- step on (char *) pointer by x units. -addrOffset# :: Addr# -> Int# -> Addr# -addrOffset# a# i# = - case unsafePerformIO (_casm_ ``%r=(char *)((char *)%0 + (int)%1); '' (A# a#) (I# i#)) of - A# a -> a - -copySubStrBA :: ByteArray Int -> Int -> Int -> ByteArray Int -#if __GLASGOW_HASKELL__ >= 405 -copySubStrBA (ByteArray _ _ barr#) (I# start#) len@(I# length#) = -#else -copySubStrBA (ByteArray _ barr#) (I# start#) len@(I# length#) = +#ifdef UNUSED +copySubStr :: Addr# -> Int -> Int -> BA +copySubStr a# (I# start#) length = + copyPrefixStr (a# `plusAddr#` start#) length #endif - runST ( - {- allocate an array that will hold the string - (not forgetting the NUL at the end) - -} - new_ps_array (length# +# 1#) >>= \ ch_array -> - -- fill in packed string from "addr" - fill_in ch_array 0# >> - -- freeze the puppy: - freeze_ps_array ch_array length#) - where - fill_in :: MutableByteArray s Int -> Int# -> ST s () - - fill_in arr_in# idx + +copySubStrBA :: BA -> Int -> Int -> BA +copySubStrBA (BA barr#) (I# start#) len@(I# length#) = ba + where + ba = runST (do + -- allocate an array that will hold the string + ch_array <- new_ps_array length# + -- fill in packed string from "addr" + fill_in ch_array 0# + -- freeze the puppy: + freeze_ps_array ch_array length# + ) + + fill_in :: MBA s -> Int# -> ST s () + fill_in arr_in# idx | idx ==# length# - = write_ps_array arr_in# idx (chr# 0#) >> - return () + = return () | otherwise = case (indexCharArray# barr# (start# +# idx)) of { ch -> write_ps_array arr_in# idx ch >> @@ -148,55 +178,28 @@ copySubStrBA (ByteArray _ barr#) (I# start#) len@(I# length#) = [Copied from PackBase; no real reason -- UGH] \begin{code} -new_ps_array :: Int# -> ST s (MutableByteArray s Int) -write_ps_array :: MutableByteArray s Int -> Int# -> Char# -> ST s () -freeze_ps_array :: MutableByteArray s Int -> Int# -> ST s (ByteArray Int) +new_ps_array :: Int# -> ST s (MBA s) +write_ps_array :: MBA s -> Int# -> Char# -> ST s () +freeze_ps_array :: MBA s -> Int# -> ST s BA -new_ps_array size = ST $ \ s -> -#if __GLASGOW_HASKELL__ < 400 - case (newCharArray# size s) of { StateAndMutableByteArray# s2# barr# -> - STret s2# (MutableByteArray bot barr#) } -#elif __GLASGOW_HASKELL__ < 405 - case (newCharArray# size s) of { (# s2#, barr# #) -> - (# s2#, MutableByteArray bot barr# #) } -#elif __GLASGOW_HASKELL__ < 411 - case (newCharArray# size s) of { (# s2#, barr# #) -> - (# s2#, MutableByteArray bot bot barr# #) } -#else /* 411 and higher */ - case (newByteArray# size s) of { (# s2#, barr# #) -> - (# s2#, MutableByteArray bot bot barr# #) } +#if __GLASGOW_HASKELL__ < 411 +#define NEW_BYTE_ARRAY newCharArray# +#else +#define NEW_BYTE_ARRAY newPinnedByteArray# #endif - where - bot = error "new_ps_array" -#if __GLASGOW_HASKELL__ < 400 -write_ps_array (MutableByteArray _ barr#) n ch = ST $ \ s# -> - case writeCharArray# barr# n ch s# of { s2# -> - STret s2# () } -#elif __GLASGOW_HASKELL__ < 405 -write_ps_array (MutableByteArray _ barr#) n ch = ST $ \ s# -> - case writeCharArray# barr# n ch s# of { s2# -> - (# s2#, () #) } -#else -write_ps_array (MutableByteArray _ _ barr#) n ch = ST $ \ s# -> +new_ps_array size = ST $ \ s -> + case (NEW_BYTE_ARRAY size s) of { (# s2#, barr# #) -> + (# s2#, MBA barr# #) } + +write_ps_array (MBA barr#) n ch = ST $ \ s# -> case writeCharArray# barr# n ch s# of { s2# -> (# s2#, () #) } -#endif -- same as unsafeFreezeByteArray -#if __GLASGOW_HASKELL__ < 400 -freeze_ps_array (MutableByteArray _ arr#) len# = ST $ \ s# -> - case unsafeFreezeByteArray# arr# s# of { StateAndByteArray# s2# frozen# -> - STret s2# (ByteArray (0,I# len#) frozen#) } -#elif __GLASGOW_HASKELL__ < 405 -freeze_ps_array (MutableByteArray _ arr#) len# = ST $ \ s# -> - case unsafeFreezeByteArray# arr# s# of { (# s2#, frozen# #) -> - (# s2#, ByteArray (0,I# len#) frozen# #) } -#else -freeze_ps_array (MutableByteArray _ _ arr#) len# = ST $ \ s# -> +freeze_ps_array (MBA arr#) len# = ST $ \ s# -> case unsafeFreezeByteArray# arr# s# of { (# s2#, frozen# #) -> - (# s2#, ByteArray 0 (I# len#) frozen# #) } -#endif + (# s2#, BA frozen# #) } \end{code} @@ -205,70 +208,58 @@ Compare two equal-length strings for equality: \begin{code} eqStrPrefix :: Addr# -> ByteArray# -> Int# -> Bool eqStrPrefix a# barr# len# = - unsafePerformIO ( -#if __GLASGOW_HASKELL__ < 405 - _ccall_ strncmp (A# a#) (ByteArray bot barr#) (I# len#) >>= \ (I# x#) -> -#else - _ccall_ strncmp (A# a#) (ByteArray bot bot barr#) (I# len#) >>= \ (I# x#) -> -#endif - return (x# ==# 0#)) - where -#if __GLASGOW_HASKELL__ < 405 - bot :: (Int,Int) -#else - bot :: Int -#endif - bot = error "eqStrPrefix" + inlinePerformIO $ do + x <- memcmp_ba a# barr# (I# len#) + return (x == 0) +#ifdef UNUSED eqCharStrPrefix :: Addr# -> Addr# -> Int# -> Bool eqCharStrPrefix a1# a2# len# = - unsafePerformIO ( - _ccall_ strncmp (A# a1#) (A# a2#) (I# len#) >>= \ (I# x#) -> - return (x# ==# 0#)) + inlinePerformIO $ do + x <- memcmp a1# a2# (I# len#) + return (x == 0) +#endif eqStrPrefixBA :: ByteArray# -> ByteArray# -> Int# -> Int# -> Bool eqStrPrefixBA b1# b2# start# len# = - unsafePerformIO ( - _casm_ ``%r=(int)strncmp((char *)%0+(int)%1,%2,%3); '' -#if __GLASGOW_HASKELL__ < 405 - (ByteArray bot b2#) -#else - (ByteArray bot bot b2#) -#endif - (I# start#) -#if __GLASGOW_HASKELL__ < 405 - (ByteArray bot b1#) -#else - (ByteArray bot bot b1#) -#endif - (I# len#) >>= \ (I# x#) -> - return (x# ==# 0#)) - where -#if __GLASGOW_HASKELL__ < 405 - bot :: (Int,Int) -#else - bot :: Int -#endif - bot = error "eqStrPrefixBA" + inlinePerformIO $ do + x <- memcmp_baoff_ba b2# (I# start#) b1# (I# len#) + return (x == 0) +#ifdef UNUSED eqCharStrPrefixBA :: Addr# -> ByteArray# -> Int# -> Int# -> Bool eqCharStrPrefixBA a# b2# start# len# = - unsafePerformIO ( - _casm_ ``%r=(int)strncmp((char *)%0+(int)%1,%2,%3); '' -#if __GLASGOW_HASKELL__ < 405 - (ByteArray bot b2#) -#else - (ByteArray bot bot b2#) + inlinePerformIO $ do + x <- memcmp_baoff b2# (I# start#) a# (I# len#) + return (x == 0) #endif - (I# start#) - (A# a#) - (I# len#) >>= \ (I# x#) -> - return (x# ==# 0#)) - where -#if __GLASGOW_HASKELL__ < 405 - bot :: (Int,Int) +\end{code} + +\begin{code} +-- Just like unsafePerformIO, but we inline it. This is safe when +-- there are no side effects, and improves performance. +{-# INLINE inlinePerformIO #-} +inlinePerformIO :: IO a -> a +inlinePerformIO (IO m) = case m realWorld# of (# _, r #) -> r + +#if __GLASGOW_HASKELL__ <= 408 +strLength (Ptr a#) = ghc_strlen a# +foreign import ccall unsafe "ghc_strlen" + ghc_strlen :: Addr# -> Int #else - bot :: Int +foreign import ccall unsafe "ghc_strlen" + strLength :: Ptr () -> Int #endif - bot = error "eqCharStrPrefixBA" + +foreign import ccall unsafe "ghc_memcmp" + memcmp :: Addr# -> Addr# -> Int -> IO Int + +foreign import ccall unsafe "ghc_memcmp" + memcmp_ba :: Addr# -> ByteArray# -> Int -> IO Int + +foreign import ccall unsafe "ghc_memcmp_off" + memcmp_baoff :: ByteArray# -> Int -> Addr# -> Int -> IO Int + +foreign import ccall unsafe "ghc_memcmp_off" + memcmp_baoff_ba :: ByteArray# -> Int -> ByteArray# -> Int -> IO Int \end{code}