{- Copyright 2012-2019 Vidar Holen This file is part of ShellCheck. https://www.shellcheck.net ShellCheck is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. ShellCheck is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . -} {-# LANGUAGE DeriveGeneric, DeriveAnyClass, DeriveTraversable, PatternSynonyms #-} module ShellCheck.AST where import GHC.Generics (Generic) import Control.Monad.Identity import Control.DeepSeq import Text.Parsec import qualified ShellCheck.Regex as Re import Prelude hiding (id) newtype Id = Id Int deriving (Show, Eq, Ord, Generic, NFData) data Quoted = Quoted | Unquoted deriving (Show, Eq) data Dashed = Dashed | Undashed deriving (Show, Eq) data AssignmentMode = Assign | Append deriving (Show, Eq) newtype FunctionKeyword = FunctionKeyword Bool deriving (Show, Eq) newtype FunctionParentheses = FunctionParentheses Bool deriving (Show, Eq) data CaseType = CaseBreak | CaseFallThrough | CaseContinue deriving (Show, Eq) newtype Root = Root Token data Token = OuterToken Id (InnerToken Token) deriving (Show) data InnerToken t = Inner_TA_Binary String t t | Inner_TA_Assignment String t t | Inner_TA_Variable String [t] | Inner_TA_Expansion [t] | Inner_TA_Sequence [t] | Inner_TA_Trinary t t t | Inner_TA_Unary String t | Inner_TC_And ConditionType String t t | Inner_TC_Binary ConditionType String t t | Inner_TC_Group ConditionType t | Inner_TC_Nullary ConditionType t | Inner_TC_Or ConditionType String t t | Inner_TC_Unary ConditionType String t | Inner_TC_Empty ConditionType | Inner_T_AND_IF | Inner_T_AndIf t t | Inner_T_Arithmetic t | Inner_T_Array [t] | Inner_T_IndexedElement [t] t -- Store the index as string, and parse as arithmetic or string later | Inner_T_UnparsedIndex SourcePos String | Inner_T_Assignment AssignmentMode String [t] t | Inner_T_Backgrounded t | Inner_T_Backticked [t] | Inner_T_Bang | Inner_T_Banged t | Inner_T_BraceExpansion [t] | Inner_T_BraceGroup [t] | Inner_T_CLOBBER | Inner_T_Case | Inner_T_CaseExpression t [(CaseType, [t], [t])] | Inner_T_Condition ConditionType t | Inner_T_DGREAT | Inner_T_DLESS | Inner_T_DLESSDASH | Inner_T_DSEMI | Inner_T_Do | Inner_T_DollarArithmetic t | Inner_T_DollarBraced Bool t | Inner_T_DollarBracket t | Inner_T_DollarDoubleQuoted [t] | Inner_T_DollarExpansion [t] | Inner_T_DollarSingleQuoted String | Inner_T_DollarBraceCommandExpansion [t] | Inner_T_Done | Inner_T_DoubleQuoted [t] | Inner_T_EOF | Inner_T_Elif | Inner_T_Else | Inner_T_Esac | Inner_T_Extglob String [t] | Inner_T_FdRedirect String t | Inner_T_Fi | Inner_T_For | Inner_T_ForArithmetic t t t [t] | Inner_T_ForIn String [t] [t] | Inner_T_Function FunctionKeyword FunctionParentheses String t | Inner_T_GREATAND | Inner_T_Glob String | Inner_T_Greater | Inner_T_HereDoc Dashed Quoted String [t] | Inner_T_HereString t | Inner_T_If | Inner_T_IfExpression [([t],[t])] [t] | Inner_T_In | Inner_T_IoFile t t | Inner_T_IoDuplicate t String | Inner_T_LESSAND | Inner_T_LESSGREAT | Inner_T_Lbrace | Inner_T_Less | Inner_T_Literal String | Inner_T_Lparen | Inner_T_NEWLINE | Inner_T_NormalWord [t] | Inner_T_OR_IF | Inner_T_OrIf t t | Inner_T_ParamSubSpecialChar String -- e.g. '%' in ${foo%bar} or '/' in ${foo/bar/baz} | Inner_T_Pipeline [t] [t] -- [Pipe separators] [Commands] | Inner_T_ProcSub String [t] | Inner_T_Rbrace | Inner_T_Redirecting [t] t | Inner_T_Rparen | Inner_T_Script t [t] -- Shebang T_Literal, followed by script. | Inner_T_Select | Inner_T_SelectIn String [t] [t] | Inner_T_Semi | Inner_T_SimpleCommand [t] [t] | Inner_T_SingleQuoted String | Inner_T_Subshell [t] | Inner_T_Then | Inner_T_Until | Inner_T_UntilExpression [t] [t] | Inner_T_While | Inner_T_WhileExpression [t] [t] | Inner_T_Annotation [Annotation] t | Inner_T_Pipe String | Inner_T_CoProc (Maybe String) t | Inner_T_CoProcBody t | Inner_T_Include t | Inner_T_SourceCommand t t | Inner_T_BatsTest t t deriving (Show, Eq, Functor, Foldable, Traversable) data Annotation = DisableComment Integer Integer -- [from, to) | EnableComment String | SourceOverride String | ShellOverride String | SourcePath String deriving (Show, Eq) data ConditionType = DoubleBracket | SingleBracket deriving (Show, Eq) pattern T_AND_IF id = OuterToken id Inner_T_AND_IF pattern T_Bang id = OuterToken id Inner_T_Bang pattern T_Case id = OuterToken id Inner_T_Case pattern TC_Empty id typ = OuterToken id (Inner_TC_Empty typ) pattern T_CLOBBER id = OuterToken id Inner_T_CLOBBER pattern T_DGREAT id = OuterToken id Inner_T_DGREAT pattern T_DLESS id = OuterToken id Inner_T_DLESS pattern T_DLESSDASH id = OuterToken id Inner_T_DLESSDASH pattern T_Do id = OuterToken id Inner_T_Do pattern T_DollarSingleQuoted id str = OuterToken id (Inner_T_DollarSingleQuoted str) pattern T_Done id = OuterToken id Inner_T_Done pattern T_DSEMI id = OuterToken id Inner_T_DSEMI pattern T_Elif id = OuterToken id Inner_T_Elif pattern T_Else id = OuterToken id Inner_T_Else pattern T_EOF id = OuterToken id Inner_T_EOF pattern T_Esac id = OuterToken id Inner_T_Esac pattern T_Fi id = OuterToken id Inner_T_Fi pattern T_For id = OuterToken id Inner_T_For pattern T_Glob id str = OuterToken id (Inner_T_Glob str) pattern T_GREATAND id = OuterToken id Inner_T_GREATAND pattern T_Greater id = OuterToken id Inner_T_Greater pattern T_If id = OuterToken id Inner_T_If pattern T_In id = OuterToken id Inner_T_In pattern T_Lbrace id = OuterToken id Inner_T_Lbrace pattern T_Less id = OuterToken id Inner_T_Less pattern T_LESSAND id = OuterToken id Inner_T_LESSAND pattern T_LESSGREAT id = OuterToken id Inner_T_LESSGREAT pattern T_Literal id str = OuterToken id (Inner_T_Literal str) pattern T_Lparen id = OuterToken id Inner_T_Lparen pattern T_NEWLINE id = OuterToken id Inner_T_NEWLINE pattern T_OR_IF id = OuterToken id Inner_T_OR_IF pattern T_ParamSubSpecialChar id str = OuterToken id (Inner_T_ParamSubSpecialChar str) pattern T_Pipe id str = OuterToken id (Inner_T_Pipe str) pattern T_Rbrace id = OuterToken id Inner_T_Rbrace pattern T_Rparen id = OuterToken id Inner_T_Rparen pattern T_Select id = OuterToken id Inner_T_Select pattern T_Semi id = OuterToken id Inner_T_Semi pattern T_SingleQuoted id str = OuterToken id (Inner_T_SingleQuoted str) pattern T_Then id = OuterToken id Inner_T_Then pattern T_UnparsedIndex id pos str = OuterToken id (Inner_T_UnparsedIndex pos str) pattern T_Until id = OuterToken id Inner_T_Until pattern T_While id = OuterToken id Inner_T_While pattern TA_Assignment id op t1 t2 = OuterToken id (Inner_TA_Assignment op t1 t2) pattern TA_Binary id op t1 t2 = OuterToken id (Inner_TA_Binary op t1 t2) pattern TA_Expansion id t = OuterToken id (Inner_TA_Expansion t) pattern T_AndIf id t u = OuterToken id (Inner_T_AndIf t u) pattern T_Annotation id anns t = OuterToken id (Inner_T_Annotation anns t) pattern T_Arithmetic id c = OuterToken id (Inner_T_Arithmetic c) pattern T_Array id t = OuterToken id (Inner_T_Array t) pattern TA_Sequence id l = OuterToken id (Inner_TA_Sequence l) pattern T_Assignment id mode var indices value = OuterToken id (Inner_T_Assignment mode var indices value) pattern TA_Trinary id t1 t2 t3 = OuterToken id (Inner_TA_Trinary t1 t2 t3) pattern TA_Unary id op t1 = OuterToken id (Inner_TA_Unary op t1) pattern TA_Variable id str t = OuterToken id (Inner_TA_Variable str t) pattern T_Backgrounded id l = OuterToken id (Inner_T_Backgrounded l) pattern T_Backticked id list = OuterToken id (Inner_T_Backticked list) pattern T_Banged id l = OuterToken id (Inner_T_Banged l) pattern T_BatsTest id name t = OuterToken id (Inner_T_BatsTest name t) pattern T_BraceExpansion id list = OuterToken id (Inner_T_BraceExpansion list) pattern T_BraceGroup id l = OuterToken id (Inner_T_BraceGroup l) pattern TC_And id typ str t1 t2 = OuterToken id (Inner_TC_And typ str t1 t2) pattern T_CaseExpression id word cases = OuterToken id (Inner_T_CaseExpression word cases) pattern TC_Binary id typ op lhs rhs = OuterToken id (Inner_TC_Binary typ op lhs rhs) pattern TC_Group id typ token = OuterToken id (Inner_TC_Group typ token) pattern TC_Nullary id typ token = OuterToken id (Inner_TC_Nullary typ token) pattern T_Condition id typ token = OuterToken id (Inner_T_Condition typ token) pattern T_CoProcBody id t = OuterToken id (Inner_T_CoProcBody t) pattern T_CoProc id var body = OuterToken id (Inner_T_CoProc var body) pattern TC_Or id typ str t1 t2 = OuterToken id (Inner_TC_Or typ str t1 t2) pattern TC_Unary id typ op token = OuterToken id (Inner_TC_Unary typ op token) pattern T_DollarArithmetic id c = OuterToken id (Inner_T_DollarArithmetic c) pattern T_DollarBraceCommandExpansion id list = OuterToken id (Inner_T_DollarBraceCommandExpansion list) pattern T_DollarBraced id braced op = OuterToken id (Inner_T_DollarBraced braced op) pattern T_DollarBracket id c = OuterToken id (Inner_T_DollarBracket c) pattern T_DollarDoubleQuoted id list = OuterToken id (Inner_T_DollarDoubleQuoted list) pattern T_DollarExpansion id list = OuterToken id (Inner_T_DollarExpansion list) pattern T_DoubleQuoted id list = OuterToken id (Inner_T_DoubleQuoted list) pattern T_Extglob id str l = OuterToken id (Inner_T_Extglob str l) pattern T_FdRedirect id v t = OuterToken id (Inner_T_FdRedirect v t) pattern T_ForArithmetic id a b c group = OuterToken id (Inner_T_ForArithmetic a b c group) pattern T_ForIn id v w l = OuterToken id (Inner_T_ForIn v w l) pattern T_Function id a b name body = OuterToken id (Inner_T_Function a b name body) pattern T_HereDoc id d q str l = OuterToken id (Inner_T_HereDoc d q str l) pattern T_HereString id word = OuterToken id (Inner_T_HereString word) pattern T_IfExpression id conditions elses = OuterToken id (Inner_T_IfExpression conditions elses) pattern T_Include id script = OuterToken id (Inner_T_Include script) pattern T_IndexedElement id indices t = OuterToken id (Inner_T_IndexedElement indices t) pattern T_IoDuplicate id op num = OuterToken id (Inner_T_IoDuplicate op num) pattern T_IoFile id op file = OuterToken id (Inner_T_IoFile op file) pattern T_NormalWord id list = OuterToken id (Inner_T_NormalWord list) pattern T_OrIf id t u = OuterToken id (Inner_T_OrIf t u) pattern T_Pipeline id l1 l2 = OuterToken id (Inner_T_Pipeline l1 l2) pattern T_ProcSub id typ l = OuterToken id (Inner_T_ProcSub typ l) pattern T_Redirecting id redirs cmd = OuterToken id (Inner_T_Redirecting redirs cmd) pattern T_Script id shebang list = OuterToken id (Inner_T_Script shebang list) pattern T_SelectIn id v w l = OuterToken id (Inner_T_SelectIn v w l) pattern T_SimpleCommand id vars cmds = OuterToken id (Inner_T_SimpleCommand vars cmds) pattern T_SourceCommand id includer t_include = OuterToken id (Inner_T_SourceCommand includer t_include) pattern T_Subshell id l = OuterToken id (Inner_T_Subshell l) pattern T_UntilExpression id c l = OuterToken id (Inner_T_UntilExpression c l) pattern T_WhileExpression id c l = OuterToken id (Inner_T_WhileExpression c l) {-# COMPLETE T_AND_IF, T_Bang, T_Case, TC_Empty, T_CLOBBER, T_DGREAT, T_DLESS, T_DLESSDASH, T_Do, T_DollarSingleQuoted, T_Done, T_DSEMI, T_Elif, T_Else, T_EOF, T_Esac, T_Fi, T_For, T_Glob, T_GREATAND, T_Greater, T_If, T_In, T_Lbrace, T_Less, T_LESSAND, T_LESSGREAT, T_Literal, T_Lparen, T_NEWLINE, T_OR_IF, T_ParamSubSpecialChar, T_Pipe, T_Rbrace, T_Rparen, T_Select, T_Semi, T_SingleQuoted, T_Then, T_UnparsedIndex, T_Until, T_While, TA_Assignment, TA_Binary, TA_Expansion, T_AndIf, T_Annotation, T_Arithmetic, T_Array, TA_Sequence, T_Assignment, TA_Trinary, TA_Unary, TA_Variable, T_Backgrounded, T_Backticked, T_Banged, T_BatsTest, T_BraceExpansion, T_BraceGroup, TC_And, T_CaseExpression, TC_Binary, TC_Group, TC_Nullary, T_Condition, T_CoProcBody, T_CoProc, TC_Or, TC_Unary, T_DollarArithmetic, T_DollarBraceCommandExpansion, T_DollarBraced, T_DollarBracket, T_DollarDoubleQuoted, T_DollarExpansion, T_DoubleQuoted, T_Extglob, T_FdRedirect, T_ForArithmetic, T_ForIn, T_Function, T_HereDoc, T_HereString, T_IfExpression, T_Include, T_IndexedElement, T_IoDuplicate, T_IoFile, T_NormalWord, T_OrIf, T_Pipeline, T_ProcSub, T_Redirecting, T_Script, T_SelectIn, T_SimpleCommand, T_SourceCommand, T_Subshell, T_UntilExpression, T_WhileExpression #-} instance Eq Token where OuterToken _ a == OuterToken _ b = a == b analyze :: Monad m => (Token -> m ()) -> (Token -> m ()) -> (Token -> m Token) -> Token -> m Token analyze f g i = round where round t@(OuterToken id it) = do f t newIt <- traverse round it g t i (OuterToken id newIt) getId :: Token -> Id getId (OuterToken id _) = id blank :: Monad m => Token -> m () blank = const $ return () doAnalysis :: Monad m => (Token -> m ()) -> Token -> m Token doAnalysis f = analyze f blank return doStackAnalysis :: Monad m => (Token -> m ()) -> (Token -> m ()) -> Token -> m Token doStackAnalysis startToken endToken = analyze startToken endToken return doTransform :: (Token -> Token) -> Token -> Token doTransform i = runIdentity . analyze blank blank (return . i)