Safe Haskell | Safe |
---|---|
Language | Haskell2010 |
- data M c
- empty :: M c
- eps :: M c
- char :: c -> M c
- charRange :: Enum c => c -> c -> M c
- anyChar :: (Bounded c, Enum c) => M c
- appends :: [M c] -> M c
- unions :: [M c] -> M c
- star :: M c -> M c
- string :: [c] -> M c
- nullable :: M c -> Bool
- derivate :: (Eq c, Enum c, Bounded c) => c -> M c -> M c
- generate :: Int -> M c -> [[c]]
- toKleene :: Kleene c k => M c -> k
- isEmpty :: M c -> Bool
- isEps :: M c -> Bool
Documentation
Regular expression which has no restrictions on the elements.
Therefore we can have Monad
instance, i.e. have a regexp where
characters are regexps themselves.
Because there are no optimisations, it's better to work over small alphabets. On the other hand, we can work over infinite alphabets, if we only use small amount of symbols!
>>>
putPretty $ string [True, False]
^10$
>>>
let re = string [True, False, True]
>>>
let re' = re >>= \b -> if b then char () else star (char ())
>>>
putPretty re'
^..*.$
MChars [c] | One of the characters |
MAppend [M c] | Concatenation |
MUnion [c] [M c] | Union |
MStar (M c) | Kleene star |
Monad M Source # | |
Functor M Source # | |
Applicative M Source # | |
Foldable M Source # | |
Traversable M Source # | |
(Eq c, Enum c, Bounded c) => Match c (M c) Source # | |
(Eq c, Enum c, Bounded c) => Derivate c (M c) Source # | |
Kleene c (M c) Source # | |
Eq c => Eq (M c) Source # | |
Ord c => Ord (M c) Source # | |
Show c => Show (M c) Source # | |
(~) * c Char => IsString (M c) Source # | |
Semigroup (M c) Source # | |
Monoid (M c) Source # | |
(Eq c, Enum c, Bounded c, Arbitrary c) => Arbitrary (M c) Source # | |
CoArbitrary c => CoArbitrary (M c) Source # | |
JoinSemiLattice (M c) Source # | |
BoundedJoinSemiLattice (M c) Source # | |
(Pretty c, Eq c) => Pretty (M c) Source # | |
Construction
Empty regex. Doesn't accept anything.
>>>
putPretty (empty :: M Bool)
^[]$
>>>
putPretty (bottom :: M Bool)
^[]$
match (empty :: M Bool) (s :: String) === False
Empty string. Note: different than empty
.
>>>
putPretty (eps :: M Bool)
^$
>>>
putPretty (mempty :: M Bool)
^$
match (eps :: M Bool) s === null (s :: String)
charRange :: Enum c => c -> c -> M c Source #
Note: we know little about c
.
>>>
putPretty $ charRange 'a' 'z'
^[abcdefghijklmnopqrstuvwxyz]$
anyChar :: (Bounded c, Enum c) => M c Source #
Any character. Note: different than dot!
>>>
putPretty (anyChar :: M Bool)
^[01]$
Literal string.
>>>
putPretty ("foobar" :: M Char)
^foobar$
>>>
putPretty ("(.)" :: M Char)
^\(\.\)$
>>>
putPretty $ string [False, True]
^01$
Derivative
nullable :: M c -> Bool Source #
We say that a regular expression r is nullable if the language it defines contains the empty string.
>>>
nullable eps
True
>>>
nullable (star "x")
True
>>>
nullable "foo"
False
derivate :: (Eq c, Enum c, Bounded c) => c -> M c -> M c Source #
Intuitively, the derivative of a language \(\mathcal{L} \subset \Sigma^\star\) with respect to a symbol \(a \in \Sigma\) is the language that includes only those suffixes of strings with a leading symbol \(a\) in \(\mathcal{L}\).
>>>
putPretty $ derivate 'f' "foobar"
^oobar$
>>>
putPretty $ derivate 'x' $ "xyz" \/ "abc"
^yz$
>>>
putPretty $ derivate 'x' $ star "xyz"
^yz(xyz)*$
Generation
Generate random strings of the language M c
describes.
>>>
let example = traverse_ print . take 3 . generate 42
>>>
example "abc"
"abc" "abc" "abc"
>>>
example $ star $ "a" \/ "b"
"ababbb" "baab" "abbababaa"
xx >>> example empty
expensive-prop> all (match r) $ take 10 $ generate 42 (r :: M Bool)
Conversion
toKleene :: Kleene c k => M c -> k Source #
Convert to Kleene
>>>
let re = charRange 'a' 'z'
>>>
putPretty re
^[abcdefghijklmnopqrstuvwxyz]$
>>>
putPretty (toKleene re :: RE Char)
^[a-z]$