-- | A program to sanitize an HTML tag to a Haskell function.
--
module Util.Sanitize
( sanitize
, keywords
, prelude
) where
import Data.Char (toLower, toUpper)
import Data.Set (Set)
import qualified Data.Set as S
-- | Sanitize a tag. This function returns a name that can be used as
-- combinator in haskell source code.
--
-- Examples:
--
-- > sanitize "class" == "class_"
-- > sanitize "http-equiv" == "httpEquiv"
--
sanitize :: String -> String
sanitize = appendUnderscore . removeDashOrColon . map toLower
where
-- Remove a dash, replacing it by camelcase notation
--
-- Example:
--
-- > removeDashOrColon "foo-bar" == "fooBar"
--
removeDashOrColon ('-' : x : xs) = toUpper x : removeDashOrColon xs
removeDashOrColon (':' : x : xs) = toUpper x : removeDashOrColon xs
removeDashOrColon (x : xs) = x : removeDashOrColon xs
removeDashOrColon [] = []
appendUnderscore t | t `S.member` keywords = t ++ "_"
| t `S.member` prelude = t ++ "_"
| otherwise = t
-- | A set of standard Haskell keywords, which cannot be used as combinators.
--
keywords :: Set String
keywords = S.fromList
[ "case", "class", "data", "default", "deriving", "do", "else", "if"
, "import", "in", "infix", "infixl", "infixr", "instance" , "let", "module"
, "newtype", "of", "then", "type", "where"
]
-- | Set of functions from the Prelude, which we do not use as combinators.
--
prelude :: Set String
prelude = S.fromList
[ "abs", "acos", "acosh", "all", "and", "any", "appendFile", "asTypeOf"
, "asin", "asinh", "atan", "atan2", "atanh", "break", "catch", "ceiling"
, "compare", "concat", "concatMap", "const", "cos", "cosh", "curry", "cycle"
, "decodeFloat", "div", "divMod", "drop", "dropWhile", "either", "elem"
, "encodeFloat", "enumFrom", "enumFromThen", "enumFromThenTo", "enumFromTo"
, "error", "even", "exp", "exponent", "fail", "filter", "flip"
, "floatDigits", "floatRadix", "floatRange", "floor", "fmap", "foldl"
, "foldl1", "foldr", "foldr1", "fromEnum", "fromInteger", "fromIntegral"
, "fromRational", "fst", "gcd", "getChar", "getContents", "getLine", "head"
, "id", "init", "interact", "ioError", "isDenormalized", "isIEEE"
, "isInfinite", "isNaN", "isNegativeZero", "iterate", "last", "lcm"
, "length", "lex", "lines", "log", "logBase", "lookup", "map", "mapM"
, "mapM_", "max", "maxBound", "maximum", "maybe", "min", "minBound"
, "minimum", "mod", "negate", "not", "notElem", "null", "odd", "or"
, "otherwise", "pi", "pred", "print", "product", "properFraction", "putChar"
, "putStr", "putStrLn", "quot", "quotRem", "read", "readFile", "readIO"
, "readList", "readLn", "readParen", "reads", "readsPrec", "realToFrac"
, "recip", "rem", "repeat", "replicate", "return", "reverse", "round"
, "scaleFloat", "scanl", "scanl1", "scanr", "scanr1", "seq", "sequence"
, "sequence_", "show", "showChar", "showList", "showParen", "showString"
, "shows", "showsPrec", "significand", "signum", "sin", "sinh", "snd"
, "span", "splitAt", "sqrt", "subtract", "succ", "sum", "tail", "take"
, "takeWhile", "tan", "tanh", "toEnum", "toInteger", "toRational"
, "truncate", "text", "uncurry", "undefined", "unlines", "until", "unwords", "unzip"
, "unzip3", "userError", "words", "writeFile", "zip", "zip3", "zipWith"
, "zipWith3"
]