-- imageduplicates/src/Data/BKTree.hs
--
-- 61 lines
-- 1.8 KiB
-- Haskell

{-# LANGUAGE DeriveFoldable #-}
{-# LANGUAGE DeriveFunctor #-}
{-# LANGUAGE DeriveGeneric #-}
{-# LANGUAGE DeriveTraversable #-}
{-# LANGUAGE KindSignatures #-}
{-# LANGUAGE LambdaCase #-}
{-# LANGUAGE ScopedTypeVariables #-}
{-# LANGUAGE TemplateHaskell #-}
{-# LANGUAGE TypeFamilies #-}
module Data.BKTree where
import Data.Functor.Foldable
import Data.Functor.Foldable.TH
import GHC.Generics (Generic)
-- | A point with two 'Int' coordinates. It exists for testing purposes only,
-- as a small concrete type to store in a tree.
data Point
  = Point Int Int
  deriving (Show)
-- | Taxicab (L1) distance: the sum of the absolute coordinate differences.
instance Metric Point where
  distance (Point x1 y1) (Point x2 y2) = dx + dy
    where
      dx = abs (x1 - x2)
      dy = abs (y1 - y2)
-- | Types whose values have an integer distance between them.
--
-- Nothing here enforces it, but the pruning done by 'search' is only sound
-- when 'distance' behaves like a real metric: non-negative, symmetric, and
-- obeying the triangle inequality. Instances are expected to guarantee that.
class Metric a where
  -- | Distance between two values.
  distance :: a -> a -> Int
-- | A BK-tree: a search tree over values that have a 'Metric' distance.
data BKTree a
  = -- | A tree holding no elements.
    Empty
  | -- | An element together with its subtrees. When the tree is built with
    -- 'insert', each subtree is keyed by the distance between this element
    -- and the elements filed under it, with at most one subtree per distance.
    Node a [(Int, BKTree a)]
  deriving (Show, Generic)
-- Template Haskell splice from "Data.Functor.Foldable.TH": generates the base
-- functor @BKTreeF@ (constructors @EmptyF@ and @NodeF@) for 'BKTree', which is
-- what allows 'search' to fold the tree with 'cata'.
-- As a top-level splice it must stay below the 'BKTree' declaration and above
-- any code that mentions the generated names.
makeBaseFunctor ''BKTree
-- | The tree with no elements.
empty :: BKTree a
empty = Empty
-- | A tree holding exactly one element, built by inserting it into 'empty'.
singleton :: Metric a => a -> BKTree a
singleton = (`insert` empty)
-- | Add an element to the tree.
--
-- Inserting into 'Empty' produces a leaf. Otherwise the distance from the new
-- element to the node's element picks the subtree to descend into; if no
-- subtree has that key yet, a new leaf is appended after the existing ones.
-- There is no special case for distance 0, so duplicates are stored too.
insert :: Metric a => a -> BKTree a -> BKTree a
insert new tree = case tree of
  Empty -> Node new []
  Node pivot kids -> Node pivot (place (distance new pivot) kids)
  where
    -- Walk the keyed subtrees in order: recurse into the one whose key
    -- matches, or append a fresh leaf once the list is exhausted.
    place key [] = [(key, Node new [])]
    place key ((k, sub) : rest)
      | key == k = (k, insert new sub) : rest
      | otherwise = (k, sub) : place key rest
-- | @search radius query tree@ collects the stored elements lying within
-- @radius@ of @query@.
--
-- At each node the element itself is kept when its distance to the query is
-- at most the radius. Only subtrees whose key lies in
-- @[distance - radius, distance + radius]@ contribute; for a true metric the
-- triangle inequality guarantees the others cannot contain a match. A node's
-- own element comes first in the result, followed by the matches from its
-- subtrees in stored order.
search :: forall a. Metric a => Int -> a -> BKTree a -> [a]
search radius query = cata collect
  where
    -- Algebra for the fold: every child already carries the result list of
    -- its subtree, paired with the subtree's distance key.
    collect :: BKTreeF a [a] -> [a]
    collect EmptyF = []
    collect (NodeF x keyed)
      | here <= radius = x : fromSubtrees
      | otherwise = fromSubtrees
      where
        here = distance query x
        withinBand key = key <= here + radius && key >= here - radius
        fromSubtrees = concatMap snd (filter (withinBand . fst) keyed)