-----------------------------------------------------------------------------
---
+-- |
-- Module : Text.Regex.Posix
--- Copyright : (c) The University of Glasgow 2001
--- License : BSD-style (see the file libraries/core/LICENSE)
+-- Copyright : (c) The University of Glasgow 2002
+-- License : BSD-style (see the file libraries/base/LICENSE)
--
-- Maintainer : libraries@haskell.org
-- Stability : experimental
--- Portability : non-portable (only on platforms that provide POSIX regexps)
---
--- $Id: Posix.hsc,v 1.2 2001/08/17 12:50:35 simonmar Exp $
+-- Portability : non-portable (needs POSIX regexps)
--
-- Interface to the POSIX regular expression library.
--- ToDo: detect regex library with configure.
--- ToDo: should have an interface using PackedStrings.
--
-----------------------------------------------------------------------------
+-- ToDo: should have an interface using PackedStrings.
+
module Text.Regex.Posix (
+ -- * The @Regex@ type
Regex, -- abstract
+ -- * Compiling a regular expression
regcomp, -- :: String -> Int -> IO Regex
+ -- ** Flags for regcomp
+ regExtended, -- (flag to regcomp) use extended regex syntax
+ regIgnoreCase, -- (flag to regcomp) ignore case when matching
+ regNewline, -- (flag to regcomp) '.' doesn't match newline
+
+ -- * Matching a regular expression
regexec, -- :: Regex -- pattern
-- -> String -- string to match
-- -> IO (Maybe (String, -- everything before match
-- String, -- everything after match
-- [String])) -- subexpression matches
- regExtended, -- (flag to regcomp) use extended regex syntax
- regIgnoreCase, -- (flag to regcomp) ignore case when matching
- regNewline -- (flag to regcomp) '.' doesn't match newline
) where
+#include <sys/types.h>
#include "regex.h"
import Prelude
import Foreign
import Foreign.C
+-- | A compiled regular expression
newtype Regex = Regex (ForeignPtr CRegex)
-- -----------------------------------------------------------------------------
-- regcomp
-regcomp :: String -> Int -> IO Regex
+-- | Compiles a regular expression
+regcomp
+ :: String -- ^ The regular expression to compile
+ -> Int -- ^ Flags (summed together)
+ -> IO Regex -- ^ Returns: the compiled regular expression
regcomp pattern flags = do
+#ifdef __HUGS__
+ regex_fptr <- mallocForeignPtrBytes (#const sizeof(regex_t))
+#else
regex_ptr <- mallocBytes (#const sizeof(regex_t))
regex_fptr <- newForeignPtr regex_ptr (regfree regex_ptr)
- withCString pattern $ \cstr -> do
- r <- c_regcomp regex_fptr cstr (fromIntegral flags)
- if (r == 0)
- then return (Regex regex_fptr)
- else error "Text.Regex.Posix.regcomp: error in pattern" -- ToDo
-
+#endif /* __HUGS__ */
+ r <- withCString pattern $ \cstr ->
+ withForeignPtr regex_fptr $ \p ->
+ c_regcomp p cstr (fromIntegral flags)
+#ifdef __HUGS__
+ addForeignPtrFinalizer regex_fptr ptr_regfree
+#endif
+ if (r == 0)
+ then return (Regex regex_fptr)
+ else error "Text.Regex.Posix.regcomp: error in pattern" -- ToDo
+
+#ifndef __HUGS__
regfree :: Ptr CRegex -> IO ()
regfree p_regex = do
c_regfree p_regex
free p_regex
+#endif /* __HUGS__ */
-- -----------------------------------------------------------------------------
-- regexec
-regexec :: Regex -- pattern
- -> String -- string to match
- -> IO (Maybe (String, -- everything before match
- String, -- matched portion
- String, -- everything after match
- [String])) -- subexpression matches
+-- | Matches a regular expression against a string
+regexec :: Regex -- ^ Compiled regular expression
+ -> String -- ^ String to match against
+ -> IO (Maybe (String, String, String, [String]))
+ -- ^ Returns: 'Nothing' if the regex did not match the
+ -- string, or:
+ --
+ -- @
+ -- 'Just' (everything before match,
+ -- matched portion,
+ -- everything after match,
+ -- subexpression matches)
+ -- @
regexec (Regex regex_fptr) str = do
withCString str $ \cstr -> do
- nsub <- withForeignPtr regex_fptr $ \p -> (#peek regex_t, re_nsub) p
- let nsub_int = fromIntegral (nsub :: CSize)
- allocaBytes ((1 + nsub_int) * (#const sizeof(regmatch_t))) $ \p_match -> do
+ withForeignPtr regex_fptr $ \regex_ptr -> do
+ nsub <- (#peek regex_t, re_nsub) regex_ptr
+ let nsub_int = fromIntegral (nsub :: CSize)
+ allocaBytes ((1 + nsub_int) * (#const sizeof(regmatch_t))) $ \p_match -> do
-- add one because index zero covers the whole match
- r <- c_regexec regex_fptr cstr (1 + nsub) p_match 0{-no flags for now-}
+ r <- c_regexec regex_ptr cstr (1 + nsub) p_match 0{-no flags for now-}
- if (r /= 0) then return Nothing else do
+ if (r /= 0) then return Nothing else do
- (before,match,after) <- matched_parts str p_match
+ (before,match,after) <- matched_parts str p_match
- sub_strs <-
+ sub_strs <-
mapM (unpack str) $ take nsub_int $ tail $
iterate (`plusPtr` (#const sizeof(regmatch_t))) p_match
- return (Just (before, match, after, sub_strs))
+ return (Just (before, match, after, sub_strs))
matched_parts :: String -> Ptr CRegMatch -> IO (String, String, String)
matched_parts string p_match = do
-- Flags for regexec
#enum Int,, \
REG_NOTBOL, \
- REG_NOTEOL \
+ REG_NOTEOL
-- Return values from regexec
#enum Int,, \
type CRegex = ()
type CRegMatch = ()
-foreign import "regcomp" unsafe
- c_regcomp :: ForeignPtr CRegex -> CString -> CInt -> IO CInt
+foreign import ccall unsafe "regcomp"
+ c_regcomp :: Ptr CRegex -> CString -> CInt -> IO CInt
-foreign import "regfree" unsafe
+#ifdef __HUGS__
+foreign import ccall unsafe "&regfree"
+ ptr_regfree :: FunPtr (Ptr CRegex -> IO ())
+#else
+foreign import ccall unsafe "regfree"
c_regfree :: Ptr CRegex -> IO ()
+#endif /* __HUGS__ */
-foreign import "regexec" unsafe
- c_regexec :: ForeignPtr CRegex -> CString -> CSize
+foreign import ccall unsafe "regexec"
+ c_regexec :: Ptr CRegex -> CString -> CSize
-> Ptr CRegMatch -> CInt -> IO CInt