module Biobase.TrainingData.Manip where
import Data.List (sort,sortBy)
import Data.Ord (comparing)
import Biobase.Secondary.PseudoKnots
import Biobase.TrainingData
type TDmanip = Either TrainingData TrainingData
removePK rpk td@TrainingData{..}
| not rpk = td
| otherwise = td{secondary = removeByCounting secondary}
fRemoveTriplets False td = td
fRemoveTriplets True td@TrainingData{..} = td{secondary = sort $ rmTs secondary} where
rmTs [] = []
rmTs (x:xs)
| length ts == 1 = if worst x ts
then rmTs xs
else rmTs . filter (/= head ts) $ x:xs
| length ts >= 2 = rmTs xs
| otherwise = x : rmTs xs
where
ts = triplets x xs
triplets ((i,j),_) zs = filter (\((k,l),_) -> i==k || i==l || j==k || j==l) zs
worst z zs = last (sortBy (comparing snd) $ z : zs) == z