Brzozowski derivatives are neat, but good old denotational semantics of regular expressions can be very elegant too:

data RE = Empty | Eps | Ch Char | App RE RE | Alt RE RE | Star RE

foldRE :: p -> p -> (Char -> p) -> (p -> p -> p) -> (p -> p -> p) -> (p -> p) -> RE -> p
foldRE emp eps ch app alt star = go where
  go = \case
    Empty -> emp
    Eps -> eps
    Ch c -> ch c
    App p q -> app (go p) (go q)
    Alt p q -> alt (go p) (go q)
    Star p -> star (go p)

recognise :: RE -> String -> [String]
recognise =
  foldRE (pure empty) pure (\c -> \case x : xs | c == x -> [xs]; _ -> [])
    (>=>) (liftA2 (<|>)) (\p -> fix (\t -> liftA2 (<|>) pure (p >=> t)))

#haskell

    • jaror@kbin.socialOP
      link
      fedilink
      arrow-up
      1
      ·
      1 year ago

      @mangoiv perhaps it is slightly easier to read like this?

      data RE = Empty | Eps | Ch Char | App RE RE | Alt RE RE | Star RE
      
      data REalg a = REalg
        { emp :: a
        , eps :: a
        , ch :: Char -> a
        , app :: a -> a -> a
        , alt :: a -> a -> a
        , star :: a -> a
        }
      
      foldRE :: REalg a -> RE -> a
      foldRE alg = go where
        go = \case
          Empty -> emp alg
          Eps -> eps alg
          Ch c -> ch alg c
          App p q -> app alg (go p) (go q)
          Alt p q -> alt alg (go p) (go q)
          Star p -> star alg (go p)
      
      recognise :: RE -> StateT String [] ()
      recognise = foldRE REalg
        { emp = empty
        , eps = pure ()
        , ch = \c -> StateT (\case x : xs | c == x -> [((), xs)]; _ -> [])
        , app = (*>)
        , alt = (&lt;|>)
        , star = \p -> fix (\t -> p *> t &lt;|> pure ())
        }