{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE TypeFamilies #-}
{-# LANGUAGE FlexibleInstances #-}
{-# LANGUAGE MultiParamTypeClasses #-}
{-# LANGUAGE DeriveDataTypeable #-}
{-# LANGUAGE DeriveGeneric #-}
{-# LANGUAGE TypeOperators #-}
{-# LANGUAGE FlexibleContexts #-}

module XSaiga.TypeAg2 where

import XSaiga.Getts
import Data.Text as T hiding (map)
import XSaiga.ShowText
import Control.Arrow
import Data.Bifunctor
import Data.Biapplicative
import Data.List (nub,union)
import qualified Data.Map.Strict as Map
import Control.Monad.State.Strict
--import Control.Applicative
import qualified Data.Data as Data

import GHC.Generics
import Data.Hashable
import Debug.Trace
import Generic.Data (gconIndex)

--The kind of quantifier/determiner attached to a GettsIntersect node
data GettsIntersectType = GI_NounAnd | GI_Most | GI_Every | GI_Which | GI_HowMany | GI_None | GI_Number Int deriving (Eq, Ord)

--Renders the word that treeToParsedSentence prints for an intersection.
--Every constructor has an equation: GI_None used to be missing, so showing it
--(or any GettsTree containing it, through the derived Show) crashed at runtime.
instance Show GettsIntersectType where
    show GI_NounAnd = "intersect_fdbr"
    show GI_Most = "most"
    show GI_Every = "every"
    show GI_Which = "which"
    show GI_HowMany = "how many"
    show GI_None = "none"
    --small numbers are spelled out, everything else falls back to digits
    show (GI_Number 0) = "zero"
    show (GI_Number 1) = "one"
    show (GI_Number 2) = "two"
    show (GI_Number 3) = "three"
    show (GI_Number x) = show x

--The kind of conjunction attached to a GettsUnion node
data GettsUnionType = GU_NounOr | GU_NounAnd deriving (Eq, Ord)

--Renders the label that is printed for a union
instance Show GettsUnionType where
    show kind = case kind of
        GU_NounOr  -> "nounor"
        GU_NounAnd -> "nounand"

--ReducedTriplestore represents the local triplestore that the semantics operate on.
--It pairs a list of triples with the cardinality of the set of entities within the triplestore.
--The cardinality is wrapped in Maybe because it may not have been retrieved.
--Alternative representation: Map from events to (property,entity)?
--Also, COULD store a special triple, like ("ev_triplestore", "cardinality", cardinality)
--using pure* to access the cardinality?
type ReducedTriplestore = ([Triple], Maybe Cardinality)
--Second component of the pair: for a ReducedTriplestore, the (optional) cardinality
getCardinality = snd
--First component of the pair: for a ReducedTriplestore, the list of triples
getTriples = fst

--idea: the tree should be fully applied whenever it is stored
--If made fine grained enough, this may suffice for memoization
--A TF a is a function that computes an a from a ReducedTriplestore
type TF a = ReducedTriplestore -> a

--newtype TFMemo a = TFMemo (TF (State (Map.Map GettsTree FDBR) a), Maybe GettsTree)

--A SemFunc is really just a tuple of two functions:
--the semantic function itself (a) and its Treeify'd counterpart (Treeify a),
--which has the same arity but produces a GettsTree
type SemFunc a = (a, Treeify a)

--convenience functions for TFMemo
{-
getGetts (TFMemo a) = snd a
getSem (TFMemo a) = fst a

instance Functor TFMemo where
    fmap f m = TFMemo (\triples -> fmap f (getSem m triples), Nothing)

instance Applicative TFMemo where
    --(<*>) :: TFMemo (a -> b) -> TFMemo a -> TFMemo b
    f <*> m = TFMemo (f', Nothing)
        where
            f' triples = (getSem f triples) <*> (getSem m triples)
    --f <*> m = f >>= (\f' -> m >>= (\a -> return $ f' a))
    pure a = TFMemo (const $ return a, Nothing)

instance Monad TFMemo where
    m >>= f = TFMemo (f', Nothing)
        where
            f' triples = getSem m triples >>= (\a -> getSem (f a) triples)
    return = pure
-}

--OBSERVATIONS:
{-
 * we didn't even use liftM anywhere for TFMemoT
 * we didn't use TFMemoT as a monad anywhere even
 * we actually lost performance when not memoizing GettsPropFDBR (1.62 vs 1.22 observed on highly ambiguous query)
 * we improved performance slightly using Strict map and Strict state
 * we improved performance slightly by re-using the state between ambiguous parses
 * so, do we need to overcomplicate with Nothing?  for now, lets not do this.
 * liftS/T vs wrapS/V -- can we just get SemFunc to do our work for us?  as it turns out, yes, for no real additional cost
   all memoized denotations are now in terms of the original SemFunc definitions using this

 * significant slowdown in ambiguous queries from fact that SPARQL queries are not cached between parses
   it may be ideal to collect ALL parses at once and then make a reduced triplestore from that
   above IMPLEMENTED to GREAT effect!
   and also fix our representation of how reduced triplestores are stored to alleviate the slowdown

 * could we make a wrap-style function that can handle N-arity?  probably needs TH

 * TODO: pre-populate GettsMembers FDBRs, EntEvProp FDBRs, and optimize [Triple] for faster GettsPropFDBR queries
 could we eliminate [Triple] altogether and do everything right from the FDBR cache?  probably not, but worth thinking about

-}

--A computation from t into the monad m, paired with a value of type g
--(TFMemo instantiates g with GettsTree)
newtype TFMemoT t g m a = TFMemoT (t -> m a, g)

--The g component (second element) of a TFMemoT
getGetts (TFMemoT (_, tag)) = tag

--The computation component (first element) of a TFMemoT
getSem (TFMemoT (run, _)) = run

--TFMemo a: a computation over a ReducedTriplestore that runs in a State monad whose
--state is a map from GettsTree to Result (the memo table), tagged with the GettsTree
--that names the computation.
--this could be made into a monad if we use Maybe GettsTree... but it is not a useful one
type TFMemo = TFMemoT ReducedTriplestore GettsTree (State (Map.Map GettsTree Result))

--moon >>= (\moon_fdbr -> spins >>= (\spin_fdbr -> a'' moon_fdbr spins_fdbr))

--the idea: bind erases the name but keeps the memoized computation
--so liftM* works as expected
--liftS* can be used to keep names for things
--does this uphold the monad laws?

--A GettsTree is a symbolic description of a query.  TFMemo uses it as the key of its
--memo table, and flattenGetts'' collapses it into the flat list of triplestore
--retrievals (GettsFlat) that have to be performed.
data GettsTree =
      GettsNone -- TODO MEMO: NOT to be used for memoization (replace with Maybe GettsTree in termphrases/superphrases?)
    | GettsPNoun Text --contributes no retrievals when flattened
    | GettsMembers Text --the named set whose members are retrieved
    | GettsTP Text Relation [GettsTree] --a property, a relation and child trees (flattening expects every child to be a GettsPrep)
    | GettsPrep [Text] (Maybe Ordering) GettsTree --TODO memoized superlatives
    | GettsIntersect GettsIntersectType GettsTree GettsTree --representing result of intersect_fdbr (only evs from 2nd tree are kept)
    | GettsUnion GettsUnionType GettsTree GettsTree --representing result of "union" of fdbrs.  Keeps everything.
    | GettsYesNo GettsTree --flattened as its subtree alone
    | GettsPropTmph Text GettsTree --flattened as its subtree alone
    | GettsAttachP Text GettsTree --a deferred gettsAttachP: it is applied to the subtree during flattening
    | GettsPropFDBR [Text] [Text] --props and events, used for memoizing filter_evs
    | GettsComplement GettsTree --flattening additionally requests the properties used to count all entities
    deriving (Eq, Show, Ord)

--Render an optional value with show; Nothing becomes the empty string
showOrd :: Show a => Maybe a -> String
showOrd = maybe "" show

--Render a list of Texts as "[a,b,c]": comma separated, no spaces, wrapped in brackets.
--NOTE: this shadows Prelude's showList, so uses must be module-qualified.
showList items = T.cons '[' (T.snoc (T.intercalate "," items) ']')

--Render a GettsTree as a bracketed, human readable "parsed sentence".
--Every constructor of GettsTree has an equation, so the function is total:
--GettsPropFDBR used to be `undefined` and GettsComplement was not handled at all,
--which made rendering such trees crash.
treeToParsedSentence :: GettsTree -> Text
treeToParsedSentence = render
  where
    render GettsNone = ""
    render (GettsPNoun t) = t
    render (GettsMembers t) = t
    render (GettsTP sub (rel, _, _) preps) = T.concat [rel, "_(", sub, ") ", XSaiga.TypeAg2.showList $ map render preps]
    render (GettsPrep props ord tree) = T.concat ["(", XSaiga.TypeAg2.showList props, ", ", T.pack $ showOrd ord, render tree, ")"]
    render (GettsIntersect t t1 t2) = binary (T.pack $ show t) t1 t2
    render (GettsUnion t t1 t2) = binary (T.pack $ show t) t1 t2
    render (GettsYesNo t) = render t
    render (GettsPropTmph t tree) = T.concat [t, render tree]
    render (GettsAttachP t tree) = T.concat [t, render tree]
    render (GettsPropFDBR props evs) = T.concat ["(propfdbr ", XSaiga.TypeAg2.showList props, " ", XSaiga.TypeAg2.showList evs, ")"]
    render (GettsComplement tree) = T.concat ["(not ", render tree, ")"]

    --"(label lhs rhs)"; the right operand and its separating space are
    --dropped when it renders to the empty text (e.g. GettsNone)
    binary label lhs rhs =
        T.concat $ ["(", label, " ", render lhs] ++ rhsPart ++ [")"]
      where
        rhsText = render rhs
        rhsPart = if T.null rhsText then [] else [" ", rhsText]


--The three kinds of flat retrieval as a single sum type.
--NOTE(review): GettsFlat below is built from the type aliases of the same names,
--not from this type; it looks unused within this file -- confirm before removing
data GettsFlatTypes =
    FGettsMembers Text
  | FGettsT [Text] Text
  | FGettsCardinality [Text] --the list of properties that is used to count the total number of entities

--A set name whose members are to be retrieved
type FGettsMembers = Text
--A list of properties together with the name of a relation
type FGettsT = ([Text], Text)
--The properties used to count the total number of entities (empty when no count is needed)
type FGettsCardinality = [Text] --Maybe?

--The flattened form of a GettsTree: the sets to fetch, the (props, relation) queries
--to run, and the properties to use for a cardinality query
type GettsFlat = ([FGettsMembers], [FGettsT], FGettsCardinality)

--Convert a function signature to a Getts style function
--Keeps same kind, same arity
--This is a closed type family, so the equations are tried from top to bottom
type family Treeify x where
  --Treeify ((TF a -> b) -> c) = Treeify (TF a -> b) -> Treeify c
  --Treeify (TF a -> b) = GettsTree -> Treeify b
  Treeify (TF a) = GettsTree --a triplestore computation becomes a single tree
  Treeify (a -> b) = Treeify a -> Treeify b --any other function is converted argument by argument
  Treeify a = GettsTree --everything else becomes a tree
  --Treeify _ = GettsTree

--TODO: Abstract tree into separate datastructure as Foldable and Traversable
--It seems to me there are five layers:
{-

User layer: GettsT, GettsPrep, GettsAttachP ... these are like semantic "words"
Unparsed Tree layer: GettsSubQuery, GettsList, GettsNode ... this is like the parse tree of those "words"
Semantic (condensed) layer: Group SubQuery, List, Node, etc... into GettsTP, keeping tree
Flattened layer: Only a list of GettsMembers and a list of GettsTP (flattened tree)
Optimization layer: Knowledge to reduce queries (subsets, GettsTP of same type)

Semantic tree layer
Flattened layer

-}

--wrapS* memoizes SemFuncs
--wrapT* does not (but still uses memoization in the arguments)
--TODO: could TF/Memo Result be changed to TF/Memo c?
--Memoize a nullary SemFunc: the tree is the key into the memo table held in the State.
--On a hit the stored Result is returned, otherwise it is computed and stored.
wrapS0 :: SemFunc (TF Result) -> TFMemo Result
wrapS0 (sem, tree) = TFMemoT (memoised, tree)
  where
    memoised store = gets (Map.lookup tree) >>= maybe compute return
      where
        compute = do
            let res = sem store
            modify (Map.insert tree res)
            return res

--Memoize a unary SemFunc.  The key is the tree function applied to the argument's tree.
--The argument is only evaluated on a cache miss; its value is then handed to the
--semantic function as a constant TF.
wrapS1 :: SemFunc (TF a -> TF Result) -> TFMemo a -> TFMemo Result
wrapS1 (sem, mkTree) arg = TFMemoT (memoised, key)
  where
    key = mkTree (getGetts arg)
    memoised store = gets (Map.lookup key) >>= maybe compute return
      where
        compute = do
            argVal <- getSem arg store
            let res = sem (const argVal) store
            modify (Map.insert key res)
            return res

--Memoize a binary SemFunc.  The key is the tree function applied to both argument trees.
--On a cache miss the arguments are evaluated left to right and passed on as constant TFs.
wrapS2 :: SemFunc (TF a -> TF b -> TF Result) -> TFMemo a -> TFMemo b -> TFMemo Result
wrapS2 (sem, mkTree) a b = TFMemoT (memoised, key)
  where
    key = mkTree (getGetts a) (getGetts b)
    memoised store = do
        cached <- gets (Map.lookup key)
        case cached of
            Just hit -> return hit
            Nothing -> do
                lhs <- getSem a store
                rhs <- getSem b store
                let res = sem (const lhs) (const rhs) store
                modify (Map.insert key res)
                return res

--Lift a nullary function and its tree into TFMemo without touching the memo table
wrapT0 :: (TF a, GettsTree) -> TFMemo a
wrapT0 (sem, tree) = TFMemoT (return . sem, tree)

--Lift a unary function into TFMemo.  The result itself is not memoized, but the
--argument is evaluated through its own (possibly memoized) computation.
wrapT1 :: (TF a -> TF b, GettsTree -> GettsTree) -> TFMemo a -> TFMemo b
wrapT1 (sem, mkTree) arg = TFMemoT (run, mkTree (getGetts arg))
  where
    run store = do
        argVal <- getSem arg store
        return (sem (const argVal) store)

--Lift a binary function into TFMemo.  The result itself is not memoized; the
--arguments are evaluated left to right through their own computations.
wrapT2 :: (TF a -> TF b -> TF c, GettsTree -> GettsTree -> GettsTree) -> TFMemo a -> TFMemo b -> TFMemo c
wrapT2 (sem, mkTree) a b = TFMemoT (run, mkTree (getGetts a) (getGetts b))
  where
    run store = combine <$> getSem a store <*> getSem b store
      where
        combine lhs rhs = sem (const lhs) (const rhs) store

--NEW: convert from biapplicative form to regular function application
--this is a one way conversion, unless you have the property that the tuple elements are "invariant" with respect to each other

--A type-level function to "tie" two functions together into a series of functions each taking a pair argument
--e.g. BiappFunc (a1 -> a2 -> r) (b1 -> b2 -> s) = (a1, b1) -> (a2, b2) -> (r, s)
--The second equation is the base case: once either side is no longer a function, the two results are paired up
type family BiappFunc x y where
    BiappFunc (a1 -> a2) (b1 -> b2) = (a1, b1) -> BiappFunc a2 b2
    BiappFunc x y = (x, y)

--Implementation of the "tie" function above
--tieFunc is the value-level counterpart of the BiappFunc type family
class BiappFuncImpl x y where
    tieFunc :: x -> y -> BiappFunc x y

--Recursive case: both sides are functions, so take a pair of arguments, feed one
--component to each side and carry on with the two results
instance {-# OVERLAPPING #-} (BiappFuncImpl a2 b2) => BiappFuncImpl (a1 -> a2) (b1 -> b2) where
    tieFunc f g = (\(a, b) -> tieFunc (f a) (g b))

--Base case: usable only where BiappFunc a b reduces to the plain pair (a, b)
instance (BiappFunc a b ~ (a, b)) => BiappFuncImpl a b where
    tieFunc a b = (a, b)

--Convert a pair of functions (such as a `SemFunc a`) to function application form:
--the two components are tied together with tieFunc
fromBiapp (sem, tree) = tieFunc sem tree
--toBiapp :: (a, b) -> (a2, b2) -> ... -> (a -> a2 -> ..., b -> b2 ->...)
--TODO: make more general -- support generalized biapplicative?
--fromBiapp :: Biapplicative p (a1 -> a2) (b1 -> b2) -> p a1 b1 -> p a2 b2
--fromBiapp b x = (b <<*>> x) <<*> ...
--TODO: support higher order functions as well using `extract` function

--So, you get the original behaviour by doing convBiapp $ termor, convBiapp $ a, etc...
--This allows biapplicative form to be used for easy extraction, and function application form for convenience
--It would be nice to get rid of the overlapping instances though!

--TODO: restrict arity of b (same kind as a)
--Pair a semantic function with its tree-building counterpart
semFunc :: a -> Treeify a -> SemFunc a
semFunc sem tree = (sem, tree)

--Just for presentation purposes: a TF is a function, so each of these instances
--ignores its argument and prints a fixed label naming the result type
instance Show (TF FDBR) where
  show = const "TF FDBR"

instance (Show a) => Show (TF (State (Map.Map GettsTree FDBR) a)) where
  show = const "TF State"

instance Show (TF GFDBR) where
  show = const "TF GFDBR"

instance Show (TF Text) where
  show = const "TF Text"


--Unclean -- Foldable would help
--TODO: filter duplicates
--TODO: make [SemFunc a] not used with gatherPreps, apply directly to verb?
--Would avoid GettsPreps situation

--apply over the intersect_entevimages, remember evs of im2 are preserved and im1 are discarded
--Attach the property `prop` to the transitive-verb node(s) of a tree.
--Intersections and unions are descended on their second subtree only; a GettsTP
--receives an extra GettsPrep child carrying the property.
--A nested GettsAttachP is resolved first (GettsAttachP p t stands for gettsAttachP p t,
--which is how flattenGetts'' treats it).  Any other constructor cannot take a
--property; it used to die with an anonymous pattern-match failure and now reports
--the offending property and tree.
gettsAttachP :: T.Text -> GettsTree -> GettsTree
gettsAttachP prop (GettsIntersect t x y) = GettsIntersect t x (gettsAttachP prop y)
gettsAttachP prop (GettsUnion t x y) = GettsUnion t x (gettsAttachP prop y)
gettsAttachP prop (GettsTP p rel sub) = GettsTP p rel ((GettsPrep [prop] Nothing GettsNone):sub) --is this correct?  should i go back to the old way?  does cardinality have to match?
gettsAttachP prop (GettsAttachP inner sub) = gettsAttachP prop (gettsAttachP inner sub)
gettsAttachP prop tree = error $ "gettsAttachP: cannot attach property " ++ show prop ++ " to " ++ show tree
--TODO MEMO -- altering tree may affect identity for memoization
--IDEA!!  create a GettsAttachP node instead and only during flattening will it have any effect -- prevents altering trees

--TODO: flattenGetts needs information about list of entity properties to count in the triplestore (to be used in a count query)
--Flatten a GettsTree into the retrievals it needs (see GettsFlat).
--allEntProps: the properties used to count all entities; they are only requested
--when the tree contains a GettsComplement.
--Trees that cannot be flattened (a bare GettsPrep, a GettsPropFDBR, or a GettsTP whose
--children are not all GettsPrep) raise an error naming the problem; the latter two
--used to fail with anonymous pattern-match errors.
flattenGetts'' :: [T.Text] -> GettsTree -> GettsFlat
flattenGetts'' allEntProps = go
  where
    go :: GettsTree -> GettsFlat
    go GettsNone = ([], [], [])
    go (GettsPNoun _) = ([], [], [])
    go (GettsMembers set) = ([set], [], [])
    go (GettsYesNo fdbr) = go fdbr
    go (GettsIntersect _ i1 i2) = merge (go i1) (go i2)
    go (GettsUnion _ i1 i2) = merge (go i1) (go i2)
    go (GettsPrep _ _ _) = error "Cannot flatten prep directly" --TODO
    go (GettsPropTmph _ sub) = go sub --TODO MEMO!
    go (GettsAttachP prop sub) = go $ gettsAttachP prop sub
    go (GettsTP prop (rel, _, _) preps) =
        --one query for the relation, over the verb's own property plus every
        --preposition property, merged with whatever the preposition subtrees need
        let props = nub $ prop : Prelude.concatMap prepProps preps
        in Prelude.foldr merge ([], [(props, rel)], []) $ map (go . prepSub) preps
    go (GettsComplement tree) = merge ([], [], allEntProps) (go tree) --FIXME
    go tree@(GettsPropFDBR _ _) = error $ "Cannot flatten GettsPropFDBR directly: " ++ show tree

    --the children of a GettsTP must all be GettsPrep nodes
    prepProps (GettsPrep p _ _) = p
    prepProps other = notAPrep other

    prepSub (GettsPrep _ _ sub) = sub
    prepSub other = notAPrep other

    notAPrep other = error $ "Cannot flatten GettsTP: child is not a GettsPrep: " ++ show other

--TODO: refactor... expose to user somehow (triplestore retriever builder?)
--flattenGetts'' specialised to the Solarman entity properties
flattenGetts :: GettsTree -> GettsFlat
flattenGetts tree = flattenGetts'' solarmanProps tree
  where
    solarmanProps = ["subject","object","with_implement", "location"] --the Solarman props
--TODO: denotation of "thing" or "entity" == above?

--Combine two flattened queries: the set and relation lists are appended (duplicates
--are kept), the cardinality properties are combined with Data.List's union
merge :: GettsFlat -> GettsFlat -> GettsFlat
merge (sets1, trans1, card1) (sets2, trans2, card2) =
    ( sets1 ++ sets2
    , trans1 ++ trans2
    , card1 `union` card2
    )

--Infix way of building a SemFunc: semantic function on the left, its tree on the right
(>|<) :: a -> Treeify a -> SemFunc a
sem >|< tree = (sem, tree)

--Remove redundancy from a flattened query: duplicate sets and cardinality properties
--are dropped, and queries over the same relation are merged into a single query
--whose property list is the duplicate-free concatenation of the individual ones
flatOptimize :: GettsFlat -> GettsFlat
flatOptimize (members, gettsTPs, comp) = (nub members, Prelude.foldr absorb [] gettsTPs, nub comp)
  where
    --fold one (props, rel) query into the queries collected so far
    absorb (props, rel) acc
        | Prelude.any ((== rel) . snd) acc = map (mergeInto props rel) acc
        | otherwise = (props, rel) : acc

    --add props to an already collected entry when it is about the same relation
    mergeInto props rel entry@(p, r)
        | r == rel = (nub $ props ++ p, rel)
        | otherwise = entry

--TODO: the triplestore itself, [Triple], should maybe be ([Triple], Maybe Int) for cardinality?
--      this would at least make the #entities information available...
--      but then, how do we specify which props to count?
-- TODO: maybe good opportunity to specify comp properties here?
--Run the retrievals of a flattened query against a triplestore and collect the results.
--The member triples come first, followed by the relation triples.  The cardinality is
--only queried when the list of cardinality properties is non-empty; otherwise it is Nothing.
getReducedTriplestore :: (TripleStore m) => m -> GettsFlat -> IO ReducedTriplestore
getReducedTriplestore ev_data (sets, trans, compProps) = do
  memberTriples <- mapM (getts_triples_members ev_data) sets
  relTriples <- mapM (\(props, rel) -> getts_triples_entevprop_type ev_data props rel) trans
  cardinality <-
      if Prelude.null compProps
          then return Nothing
          else Just <$> getts_cardinality_allents ev_data compProps
  return (Prelude.concat (memberTriples ++ relTriples), cardinality)

--Abort with a message showing the two values that could not be unioned
unionerr lhs rhs = error (Prelude.concat ["attempt to union: ", show lhs, " with ", show rhs]) --TODO: debugging

--TODO OLD
{-gettsIdentity f GettsNone y = y
gettsIdentity f x GettsNone = x
gettsIdentity f x y = f x y

gettsIntersect = gettsIdentity GettsIntersect

--TODO: make this a proper union
gettsUnion = gettsIdentity GettsUnion
-}

--Apply a tree-building function to the placeholder tree GettsNone
gettsApply :: (GettsTree -> r) -> r
gettsApply = ($ GettsNone)

--NOTE MEMO: only use gettsApply here for unique naming, not for memoizing individual semantic functions
--NOTE MEMO: what do we do if we have unmemoized stuff?
--NOTE MEMO: assume all top level things are named, because otherwise we can't query the database
--cannot use sequenceA because it would look like
--with (a (telescope (by (a (person))))) instead of (with ( a telescope )), (by (a person))
--TODO: augment with superlative
--Turn a list of prepositions given as SemFuncs into GettsPrep nodes.  Each subtree is
--obtained by applying the tree half of the SemFunc to GettsNone.
gatherPreps' :: [([T.Text], Maybe Ordering, SemFunc (TF a -> TF b))] -> [GettsTree]
gatherPreps' = map toPrep
  where
    toPrep (props, ord, semfunc) = GettsPrep props ord (gettsApply (snd semfunc))

--Turn a list of prepositions given as TFMemo functions into GettsPrep nodes.  Each
--subtree is the identifier computed by applyGettsPrep.
gatherPreps :: [([T.Text], Maybe Ordering, TFMemo a -> TFMemo b)] -> [GettsTree]
gatherPreps = map toPrep --test with undefined to prove
  where
    toPrep (props, ord, prep) = GettsPrep props ord (applyGettsPrep prep)

--used ONLY to get a unique identifier for prepositions:
--the function is applied to a placeholder whose tree is GettsNone and whose
--computation raises an error if it is ever evaluated; only the resulting tree is kept
applyGettsPrep :: (TFMemo a -> TFMemo b) -> GettsTree
applyGettsPrep g = getGetts (g placeholder)
  where
    placeholder = TFMemoT (error "Should not eval!", GettsNone)

--OBSERVATION: top level things need names for sure.  the only time we don't want to name things is sometimes inside other computations.
--a top level expression without a name will cause the entire expression to not have a name
--but that also means we can't retrieve anything from the triplestore because we will have Nothing to query it with
--it would be nice to guarantee that top level things will always have a name, and provide an escape hatch for those inside computations that don't contribute to the name of other things
--in practice, it's only inside transitive verbs we need more control over this
--in particular, the predicates in here need that control
--if we pass Nothing in, we forbid them from memoizing
--since they may appear at the top level, the same denotation must be used inside and outside
--therefore, that denotation needs to account for this
--if we make GettsIntersect have a Maybe GettsTree as the last argument, we can remove GettsNone
--but this complicates liftS* a bit: (FDBR -> FDBR -> FDBR) -> (GettsTree -> Maybe GettsTree -> Maybe GettsTree) -> ...?

--a <<*>> moon <<*>> spins...
--PUBLIC INTERFACE (TODO)
--TODO: make_fdbr_with_prop is DANGEROUS
--Get members of named set
--get_members :: (TripleStore m) => m -> Text -> IO FDBR
--get_members = getts_members
--SemFunc for the members of a named set: the semantic half reads them from the
--triplestore with pure_getts_members, the tree half is GettsMembers set
get_members' :: Text -> SemFunc (TF Result)
get_members' set = members >|< GettsMembers set
  where
    members store = FDBR (pure_getts_members store set)
--NOTE: should we have get_not_members?  how do we get cardinalities?
--Example: GettsComplement (GettsMembers "moon") -- this means the "not" should have something in it about the cardinality
--like AttachCardinality?

--Memoized version of get_members'
get_members :: Text -> TFMemo Result
get_members set = wrapS0 (get_members' set)

--TODO: revise this for new transitive verb definition.  should not assume these fields in general.
--NOTE: how do we handle "not" here?  need cardinality... how do we request it and fill it in here?
--SemFunc for the subjects of all events of the given type.  The semantic half builds
--an FDBR over the "subject" property; the tree half is a GettsTP on "subject" with
--the relation (ev_type, "subject", "object") and no prepositions
get_subjs_of_event_type' :: Text -> SemFunc (TF Result)
get_subjs_of_event_type' ev_type = subjects >|< GettsTP "subject" (ev_type, "subject", "object") []
  where
    subjects store = FDBR $ make_fdbr_with_prop (pure_getts_triples_entevprop_type store ["subject"] ev_type) "subject"

--Memoized version of get_subjs_of_event_type'
get_subjs_of_event_type :: Text -> TFMemo Result
get_subjs_of_event_type ev_type = wrapS0 (get_subjs_of_event_type' ev_type)

--constrName :: Data.Data a => a -> T.Text
--constrName = T.pack . show . Data.toConstr

--constrName = T.pack . gconName

{-
class Name a where
  constrName :: a -> String
instance {# OVERLAPPING #} Name a => Name (r -> a) where
  constrName f = constrName (f undefined)
instance (Data.Data a) => Name a where
  constrName = show . toConstr
-}

--constrName :: Data.Data a => a -> Data.ConIndex
--constrName = Data.constrIndex . Data.toConstr

--instance (Generic a, Generic b) => Generic (a -> b) where

--constrName :: (HasConstructor (Rep a), Generic a) => a -> Text
--constrName = pack . genericConstrName . from

{-class HasConstructor (f :: * -> *) where
  genericConstrName :: f x -> String

instance HasConstructor f => HasConstructor (D1 c f) where
  genericConstrName (M1 x) = genericConstrName x

instance (HasConstructor x, HasConstructor y) => HasConstructor (x :+: y) where
  genericConstrName (L1 l) = genericConstrName l
  genericConstrName (R1 r) = genericConstrName r

instance Constructor c => HasConstructor (C1 c f) where
  genericConstrName = conName
-}

--Identify the constructor of a value through Generic.Data's gconIndex.
--Written with an explicit argument so that the definition does not fall under the
--monomorphism restriction.
constrName x = gconIndex x

--Denotes either a set of examples or a set of exceptions
--Inspired from Frost,Boulos (2004)
data Result = FDBR FDBR | ComplementFDBR FDBR

--The FDBR carried by a Result, whichever constructor wraps it
getFDBR res = case res of
    FDBR examples -> examples
    ComplementFDBR exceptions -> exceptions

--A function that computes a Cardinality from a Result
type CardinalityFunction = Result -> Cardinality

--The attribute values, one constructor per kind of value.
--Most constructors wrap a TFMemo computation or a function between TFMemo computations.
--NOTE: the record selectors are partial.  Each selector is only defined for the
--constructors that declare it (e.g. getAVAL for VAL/MaxVal/RepVal, getAVALS for
--NOUNCLA_VAL/VERBPH_VAL/ADJ_VAL); applying it to any other constructor is a runtime error.
data AttValue = VAL             {getAVAL    ::   Int}
              | MaxVal          {getAVAL    ::   Int}
              | RepVal          {getAVAL    ::   Int}
              | Res             {getRVAL    ::   DisplayTree}
              | B_OP            {getB_OP    ::   (Int -> Int -> Int)}
              | U_OP            {getU_OP    ::   (Int -> Int)}
              | SENT_VAL        {getSV      ::   TFMemo Result }
              | NOUNCLA_VAL     {getAVALS   ::   TFMemo Result }
              | VERBPH_VAL      {getAVALS   ::   TFMemo Result }
              | ADJ_VAL         {getAVALS   ::   TFMemo Result } --TODO: treat adjective like termph whose argument is a moon?
              | TERMPH_VAL      {getTVAL    ::   TFMemo Result -> TFMemo Result}
              | DET_VAL         {getDVAL    ::   TFMemo Result -> TFMemo Result -> TFMemo Result}
              | VERB_VAL        {getBR      ::   Relation } --stores relation, "subject" and "object". TODO: need to expand on later for "used"
          | RELPRON_VAL     {getRELVAL  ::   TFMemo Result -> TFMemo Result -> TFMemo Result}
          | NOUNJOIN_VAL    {getNJVAL   ::   TFMemo Result -> TFMemo Result -> TFMemo Result}
          | VBPHJOIN_VAL    {getVJVAL   ::   TFMemo Result -> TFMemo Result -> TFMemo Result}
          | TERMPHJOIN_VAL  {getTJVAL   ::   (TFMemo Result -> TFMemo Result) -> (TFMemo Result -> TFMemo Result) -> TFMemo Result -> TFMemo Result }
          | SUPERPHSTART_VAL  {getSUPERPHSTARTVAL :: ()}
          | SUPER_VAL       {getSUPERVAL ::  Ordering}
          | SUPERPH_VAL     {getSUPERPHVAL :: (Ordering, TFMemo Result -> TFMemo Result)}
          | PREP_VAL       {getPREPVAL ::   [([Text], Maybe Ordering, TFMemo Result -> TFMemo Result)]} -- used in "hall discovered phobos with a telescope" as "with".
          | PREPN_VAL       {getPREPNVAL :: [Text]} --used for mapping between prepositions and their corresponding identifiers in the database.  I.e., "in" -> ["location", "year"]
          | PREPNPH_VAL     {getPREPNPHVAL :: [Text]}
          | PREPPH_VAL      {getPREPPHVAL :: ([Text], Maybe Ordering, TFMemo Result -> TFMemo Result)}
          | TERMPHNOT_VAL   {getTERMPHNOTVAL :: (TFMemo Result -> TFMemo Result) -> (TFMemo Result -> TFMemo Result)}  --"not" (as in not-hall)
          | PREFIX_VAL      {getPREFIXVAL :: TFMemo Result -> TFMemo Result} -- "non-" (as in "non moon")
          | ADVERB_VAL      {getADVERBVAL :: TFMemo Result -> TFMemo Result} -- "not" (as in "not spins")
          | LINKINGVB_VAL   {getLINKVAL ::   TFMemo Result -> TFMemo Result}
          | SENTJOIN_VAL    {getSJVAL   ::   TFMemo Result -> TFMemo Result -> TFMemo Result}
          | DOT_VAL         {getDOTVAL  ::   TFMemo Text}
          | QM_VAL          {getQMVAL   ::   TFMemo Text}
          | QUEST_VAL       {getQUVAL   ::   TFMemo Text}
          | QUEST1_VAL      {getQU1VAL  ::   TFMemo Result -> TFMemo Text}
          | QUEST2_VAL      {getQU2VAL  ::   TFMemo Result -> TFMemo Text}
          | QUEST6_VAL      {getQU6VAL  ::   TFMemo Result -> TFMemo Text}
          | QUEST3_VAL      {getQU3VAL  ::   TFMemo Result -> TFMemo Result -> TFMemo Text}
          | YEAR_VAL        {getYEARVAL ::   Int}
          deriving(Generic)

--            | RESULT [sys_message]
--Also called a "NodeName"
--TODO: Split ALeaf out from here, and make this an enum!  ALeaf is used for terminals
--ALeaf is the only constructor with a field (a strict Text); all others are plain labels
data MemoL    = Start | Tree | Num | Emp | ALeaf !Text | Expr | Op  | ET
              | Pnoun|Cnoun|Adj|Det|Intransvb|Transvb|Linkingvb|Relpron|Termphjoin|Verbphjoin|Nounjoin|Preps|Prepph|Super|Superph|SuperphStart|Prepn|Prepnph|Prepyear|Joinyear|Indefpron|Sentjoin|Quest1|Quest2|Quest3|Quest4a|Quest4b
              | Snouncla|Relnouncla|Nouncla|Adjs|Detph|Transvbph|Verbph|Termph|Jointermph|Joinvbph|Sent|Two_sent|Question|Quest4|Query|Year|Quest5|Quest6|Adverb|Prefix|Termphnot
                deriving (Eq,Ord,Show,Generic)

--Hashable instance with no explicit methods: it relies on the class defaults
--(which is why MemoL derives Generic)
instance Hashable MemoL

--Enumeration of identifiers; every constructor is nullary, hence the derived Enum
data Id       = O0|S0 |S1|S2|S3|S4|S5|S6|S7|S8|S9|T0|T1 | T2 | T3 |T4 | N1| N2 | N3 | E0 |E1 |E2 | O1| LHS  deriving (Eq,Ord,Show,Enum,Generic)
                -- basic IDs for identifying each NT

--Hashable instance with no explicit methods: it relies on the class defaults
instance Hashable Id

{-

attFunc
 = [
    (VAL,getAVAL), (MaxVal,getAVAL), (SubVal,getAVAL), (RepVal,getAVAL), (Res,getRVAL), (B_OP,getB_OP),(U_OP,getU_OP),(SENT_VAL,getSV),(ErrorVal,getEVAL),
    (NOUNCLA_VAL,getAVALS),(VERBPH_VAL,getAVALS),(ADJ_VAL,getAVALS),(TERMPH_VAL,getTVAL),(DET_VAL,getDVAL),(VERB_VAL,getBR),(RELPRON_VAL,getRELVAL),(NOUNJOIN_VAL,getNJVAL),
    (VBPHJOIN_VAL,getVJVAL),(TERMPHJOIN_VAL,getTJVAL),(PREP_VAL,getPREPVAL),(LINKINGVB_VAL,getLINKVAL),(SENTJOIN_VAL,getSJVAL),(DOT_VAL,getDOTVAL),(QM_VAL,getQMVAL),(QUEST1_VAL,getQU1VAL),
    (QUEST2_VAL,getQU2VAL),(QUEST3_VAL,getQU3VAL)
   ]
-}
--An entity is referred to by a Text identifier
type Entity         =  Text
--type Bin_Rel        =  [(Entity,Entity)] -- [(Int, Int)]
--type Relation     = (ES -> Bool) -> FDBR
--A relation is a triple of Texts.  get_subjs_of_event_type' builds one as
--(event type, "subject", "object"); flattening and printing only use the first component
type Relation = (Text, Text, Text)

--A tree whose leaves (N) carry an Int and whose branches (B) carry a list of subtrees;
--it is the payload of the Res constructor of AttValue
data DisplayTree = B [DisplayTree]
                 | N Int
                   deriving (Show, Eq, Data.Data)

--instance Show AttValue where
--    show x = "AttValue"

--Only the constructors holding plain data print their payload; the operator
--constructors print just their name and everything else prints as "AttValue"
instance Show AttValue where
    show att = case att of
        VAL j    -> "VAL "    ++ show j
        MaxVal j -> "MaxVal " ++ show j
        --SubVal j -> "SubVal " ++ show j
        RepVal j -> "RepVal " ++ show j
        Res j    -> "Tree: "  ++ show j
        B_OP _   -> "B_OP"
        U_OP _   -> "U_OP"
        _        -> "AttValue"
    {-show (SENT_VAL j) = show j
    show (ErrorVal j) =  j
    show (NOUNCLA_VAL j) = "NOUNCLA_VAL " ++ unwords $ map fst j
    show (VERBPH_VAL j)  = "VERBPH_VAL " ++ unwords $ map fst j
    show (ADJ_VAL    j)  = "ADJ_VLA " ++ unwords $ map fst j
    show (TERMPH_VAL j)  = "TERMPH_VAL "
    show (DET_VAL j)     = "DET_VAL "
    show (VERB_VAL j)    =  "VERB_VAL " ++ j
    show (RELPRON_VAL j)  = "RELPRON_VAL "
    show (NOUNJOIN_VAL j)  = "NOUNJOIN_VAL "
    show (VBPHJOIN_VAL j)  = "VBPHJOIN_VAL "
    show (TERMPHJOIN_VAL j)  = "TERMPHJOIN_VAL "
    show (PREP_VAL j)  = "PREP_VAL "
    show (LINKINGVB_VAL j)  = "LINKINGVB_VAL "
    show (SENTJOIN_VAL j)  = "SENTJOIN_VAL "
    show (DOT_VAL j) = j
    show (QM_VAL j) = j
    show (QUEST_VAL j) = j
    show (QUEST1_VAL j)  = "QUEST1_VAL"
    show (QUEST2_VAL j)  = "QUEST2_VAL"
    show (QUEST3_VAL j)  = "SENTJOIN_VAL"-}

--TODO: find a better way to do this
--NOTE: this is only here because of the expression problem in Haskell
--Ideally, you do this with the EqC typeclass and then it gets handled properly in AGParser2
--Instead, we define equality as equality up to the constructor used to generate the AttValue
{-instance Eq AttValue where
    (VAL  _)           ==  (VAL  _)     = True
    (MaxVal _)         ==  (MaxVal _)   = True
    (RepVal _)         ==  (RepVal _)   = True
    (Res _)            ==  (Res _)      = True
    (B_OP _)           ==  (B_OP _)     = True
    (U_OP _)           ==  (U_OP _)     = True
    (SENT_VAL _)       ==  (SENT_VAL _) = True
    (NOUNCLA_VAL _)    ==  (NOUNCLA_VAL _) = True
    (VERBPH_VAL _)     ==  (VERBPH_VAL _) = True
    (ADJ_VAL _)        ==  (ADJ_VAL _) = True
    (TERMPH_VAL _)     ==  (TERMPH_VAL _) = True
    (DET_VAL _)        ==  (DET_VAL _) = True
    (VERB_VAL _)       ==  (VERB_VAL _) = True
    (RELPRON_VAL _)    ==  (RELPRON_VAL _) = True
    (NOUNJOIN_VAL _)   ==  (NOUNJOIN_VAL _) = True
    (VBPHJOIN_VAL _)   ==  (VBPHJOIN_VAL _) = True
    (TERMPHJOIN_VAL _) ==  (TERMPHJOIN_VAL _) = True
    (LINKINGVB_VAL _)  ==  (LINKINGVB_VAL _) = True
    (SENTJOIN_VAL _)   ==  (SENTJOIN_VAL _) = True
    (DOT_VAL _)        ==  (DOT_VAL _) = True
    (QM_VAL _)         ==  (QM_VAL _) = True
    (QUEST_VAL _)      ==  (QUEST_VAL _) = True
    (QUEST1_VAL _)     ==  (QUEST1_VAL _) = True
    (QUEST2_VAL _)     ==  (QUEST2_VAL _) = True
    (QUEST3_VAL _)     ==  (QUEST3_VAL _) = True
    (QUEST6_VAL _)     ==  (QUEST6_VAL _) = True
    (PREP_VAL _)      ==  (PREP_VAL _) = True
    (PREPN_VAL _)     ==  (PREPN_VAL _) = True
    (PREPNPH_VAL _)   ==  (PREPNPH_VAL _) = True
    (PREPPH_VAL _)    ==  (PREPPH_VAL _) = True
    (YEAR_VAL _)      ==  (YEAR_VAL _) = True
    (SUPERPHSTART_VAL _) ==  (SUPERPHSTART_VAL _) = True
    (SUPER_VAL _)     ==  (SUPER_VAL _) = True
    (SUPERPH_VAL _)   ==  (SUPERPH_VAL _) = True
    _                  ==  _              = False
-}

--------- *********************** --------------
-- needs to be simplified --
--This seems to be used in the "left hand side" "right hand side" code... interpret arg1 as LHS and arg2 as RHS
--if attempting to assign arg2 to arg1, only do it if the rules match

{-
setAtt (MaxVal _)   (MaxVal s)       = [MaxVal s]
setAtt (RepVal _)   (RepVal s)       = [RepVal s]
setAtt (VAL _)      (VAL s)          = [VAL s]
setAtt (Res _)      (Res s)          = [Res s]

setAtt (NOUNCLA_VAL _)  (NOUNCLA_VAL s)    = [NOUNCLA_VAL s]
setAtt (ADJ_VAL _)      (ADJ_VAL s)        = [ADJ_VAL s]
setAtt (TERMPH_VAL _)   (TERMPH_VAL s)     = [TERMPH_VAL s]
setAtt (VERBPH_VAL _)   (VERBPH_VAL s)     = [VERBPH_VAL s]
setAtt (SENT_VAL   _)   (SENT_VAL   s)     = [SENT_VAL s]
setAtt (QUEST_VAL  _)   (QUEST_VAL  s)     = [QUEST_VAL s]
setAtt (QUEST1_VAL  _)   (QUEST1_VAL  s)     = [QUEST1_VAL s]
setAtt (QUEST2_VAL  _)   (QUEST2_VAL  s)     = [QUEST2_VAL s]
setAtt (QUEST3_VAL  _)   (QUEST3_VAL  s)     = [QUEST3_VAL s]
setAtt (QUEST6_VAL  _)   (QUEST6_VAL  s)     = [QUEST6_VAL s]

setAtt (PREP_VAL _) (PREP_VAL s) = [PREP_VAL s]
setAtt (PREPN_VAL _) (PREPN_VAL s) = [PREPN_VAL s]
setAtt (PREPNPH_VAL _) (PREPNPH_VAL s) = [PREPNPH_VAL s]
setAtt (PREPPH_VAL _) (PREPPH_VAL s) = [PREPPH_VAL s]
setAtt (YEAR_VAL _) (YEAR_VAL s) = [YEAR_VAL s]

setAtt (SUPERPHSTART_VAL _) (SUPERPHSTART_VAL s) = [SUPERPHSTART_VAL s]
setAtt (SUPER_VAL _) (SUPER_VAL s) = [SUPER_VAL s]
setAtt (SUPERPH_VAL _) (SUPERPH_VAL s) = [SUPERPH_VAL s]
-}

--appears that ErrorVal is used as a sort of sentinel value -- all things that attempt to set to this should be treated as an error
--setAtt _ (ErrorVal s)   = [ErrorVal s]
--------- *********************** --------------