Permalink
Fetching contributors…
Cannot retrieve contributors at this time
47 lines (39 sloc) 1.4 KB
-- This script processes the following source file:
--
-- http://unicode.org/Public/UNIDATA/CaseFolding.txt
module CaseFolding
(
CaseFolding(..)
, Fold(..)
, parseCF
, mapCF
) where
import Arsec
-- | One parsed entry: the four fields are filled, in order, by the
-- entry parser in 'entries'.
data Fold = Fold
  { code    :: Char
    -- ^ The character the entry is about (first field of the line).
  , status  :: Char
    -- ^ Single-character status; the parser accepts one of @C@, @F@,
    -- @S@ or @T@.
  , mapping :: [Char]
    -- ^ The characters that 'code' maps to.
  , name    :: String
    -- ^ Text of the trailing @# ...@ remark on the entry's line.
  } deriving (Eq, Ord, Show)
-- | The result of parsing a whole input file: the comments collected
-- before the first entry, and the entries themselves.
data CaseFolding = CF
  { cfComments :: [Comment]
    -- ^ Comments parsed ahead of the first entry.
  , cfFolding  :: [Fold]
    -- ^ Parsed entries, in the order they were parsed.
  } deriving (Show)
-- | Parser for a complete input: any number of leading comments, then
-- any number of entries, each of which may be followed by further
-- comments (those trailing comments are discarded).
entries :: Parser CaseFolding
entries = do
  leading <- many comment
  folds   <- many (foldLine <* many comment)
  return (CF leading folds)
  where
    -- A single entry: character, separator, status, separator, mapped
    -- characters, then the literal "# " and the rest of the line up to
    -- the terminating newline.
    foldLine :: Parser Fold
    foldLine = do
      c <- unichar
      _ <- semi
      s <- oneOf "CFST"
      _ <- semi
      m <- unichars
      _ <- string "# "
      n <- manyTill anyToken (char '\n')
      return (Fold c s m n)
-- | Read the file at the given path and run 'entries' over its
-- contents.  The path is also handed to 'parse' as the source name.
-- Yields either the parse error or the parsed 'CaseFolding'.
parseCF :: FilePath -> IO (Either ParseError CaseFolding)
parseCF path = do
  contents <- readFile path
  return (parse entries path contents)
-- | Render the parsed entries as lines of generated Haskell source that
-- define a function called @foldMapping@.
--
-- The result consists of, in order:
--
-- 1. a type signature and a @NOINLINE@ pragma for @foldMapping@;
-- 2. one commented clause per selected entry (each list element holds
--    two physical lines: the @-- name@ comment and the clause itself);
-- 3. a final catch-all clause that yields @toLower c@.
--
-- An entry is selected when its status is @C@ or @F@ and its mapping is
-- not simply @[toLower code]@; entries of the latter kind are already
-- covered by the catch-all clause.  The comments held in the
-- 'CaseFolding' value are ignored.
mapCF :: CaseFolding -> [String]
mapCF (CF _ folds) = header ++ map clause (filter wanted folds) ++ [fallback]
  where
    header =
      [ "foldMapping :: forall s. Char -> s -> Step (CC s) Char"
      , "{-# NOINLINE foldMapping #-}"
      ]

    -- Catch-all clause, emitted last so the specific clauses match first.
    fallback = "foldMapping c s = Yield (toLower c) (CC s '\\0' '\\0')"

    clause f =
      "-- " ++ name f ++ "\n" ++
      "foldMapping " ++ showC (code f) ++ " s = Yield " ++ x ++
      " (CC s " ++ y ++ " " ++ z ++ ")"
      where
        nul = showC '\0'
        -- Exactly three rendered characters are needed: pad a short
        -- mapping with NUL and ignore anything past the third character.
        -- Every list shape is matched, so this cannot fail at runtime.
        (x, y, z) = case map showC (mapping f) of
          []            -> (nul, nul, nul)
          [a]           -> (a, nul, nul)
          [a, b]        -> (a, b, nul)
          a : b : c : _ -> (a, b, c)

    wanted f =
      status f `elem` "CF" &&
      mapping f /= [toLower (code f)]