module Biobase.TrainingData.Manip where
import Data.List (sort,sortBy)
import Data.Ord (comparing)
import Biobase.Secondary.PseudoKnots
import Biobase.TrainingData
type TDmanip = Either TrainingData TrainingData
removePK rpk td@TrainingData{..}
  | not rpk   = td
  | otherwise = td{secondary = removeByCounting secondary}
fRemoveTriplets False td = td
fRemoveTriplets True td@TrainingData{..} = td{secondary = sort $ rmTs secondary} where
  rmTs [] = []
  rmTs (x:xs)
    | length ts == 1 = if worst x ts
                         then rmTs xs
                         else rmTs . filter (/= head ts) $ x:xs 
    | length ts >= 2 = rmTs xs 
    | otherwise = x : rmTs xs
    where
      ts = triplets x xs
      triplets ((i,j),_) zs = filter (\((k,l),_) -> i==k || i==l || j==k || j==l) zs
      worst z zs = last (sortBy (comparing snd) $ z : zs) == z