Safe Haskell	None
Language	Haskell2010

Math.Clustering.Spectral.Sparse

Synopsis

newtype B = B {
- unB :: SpMatrix Double
}
newtype B1 = B1 {
- unB1 :: SpMatrix Double
}
newtype B2 = B2 {
- unB2 :: SpMatrix Double
}
type AdjacencyMatrix = SpMatrix Double
spectral :: Int -> Int -> B -> [SpVector Double]
spectralCluster :: B -> LabelVector
spectralClusterK :: Int -> Int -> B -> LabelVector
spectralNorm :: Int -> Int -> AdjacencyMatrix -> [SpVector Double]
spectralClusterNorm :: AdjacencyMatrix -> LabelVector
spectralClusterKNorm :: Int -> Int -> AdjacencyMatrix -> LabelVector
getB :: Bool -> SpMatrix Double -> B
b1ToB2 :: B1 -> B2
getSimilarityFromB2 :: B2 -> Int -> Int -> Double

Documentation

newtype B Source #

Constructors

B
Fields unB :: SpMatrix Double

Instances

Show B Source #
Instance details Defined in Math.Clustering.Spectral.Sparse Methods showsPrec :: Int -> B -> ShowS # show :: B -> String # showList :: [B] -> ShowS #

newtype B1 Source #

Constructors

B1
Fields unB1 :: SpMatrix Double

Instances

Show B1 Source #
Instance details Defined in Math.Clustering.Spectral.Sparse Methods showsPrec :: Int -> B1 -> ShowS # show :: B1 -> String # showList :: [B1] -> ShowS #

newtype B2 Source #

Constructors

B2
Fields unB2 :: SpMatrix Double

Instances

Show B2 Source #
Instance details Defined in Math.Clustering.Spectral.Sparse Methods showsPrec :: Int -> B2 -> ShowS # show :: B2 -> String # showList :: [B2] -> ShowS #

type AdjacencyMatrix = SpMatrix Double Source #

spectral :: Int -> Int -> B -> [SpVector Double] Source #

Returns the left singular vectors of a sparse spectral process, starting from the second (or from the Nth) and continuing onward for E vectors. Assumes the columns are features and rows are observations. B is the normalized matrix (from getB). See Shu et al., "Efficient Spectral Neighborhood Blocking for Entity Resolution", 2011.

spectralCluster :: B -> LabelVector Source #

Returns a vector of cluster labels for two groups by finding the second left singular vector of a special normalized matrix. Assumes the columns are features and rows are observations. B is the normalized matrix (from getB). See Shu et al., "Efficient Spectral Neighborhood Blocking for Entity Resolution", 2011.

spectralClusterK :: Int -> Int -> B -> LabelVector Source #

Returns a vector of cluster labels for two groups by finding the second left singular vector and onward of a special normalized matrix and running kmeans on them. Assumes the columns are features and rows are observations. B is the normalized matrix (from getB). See Shu et al., "Efficient Spectral Neighborhood Blocking for Entity Resolution", 2011.

spectralNorm :: Int -> Int -> AdjacencyMatrix -> [SpVector Double] Source #

Returns the eigenvectors of the symmetric normalized Laplacian L, starting from the one with the second smallest eigenvalue (or from the Nth smallest) and continuing onward for E eigenvectors. Computes real symmetric part of L, so ensure the input is real and symmetric. Diagonal should be 0s for adjacency matrix. Uses I + Lnorm instead of I - Lnorm to find the second largest singular value instead of the second smallest for Lnorm.

spectralClusterNorm :: AdjacencyMatrix -> LabelVector Source #

Returns the eigenvector with the second smallest eigenvalue of the symmetric normalized Laplacian L. Computes real symmetric part of L, so ensure the input is real and symmetric. Diagonal should be 0s for adjacency matrix. Clusters the eigenvector by sign.

spectralClusterKNorm :: Int -> Int -> AdjacencyMatrix -> LabelVector Source #

Returns the eigenvector with the second smallest eigenvalue and onward of the symmetric normalized Laplacian L. Computes real symmetric part of L, so ensure the input is real and symmetric. Diagonal should be 0s for adjacency matrix. Clusters the eigenvectors using kmeans into k groups.

getB :: Bool -> SpMatrix Double -> B Source #

Get the normalized matrix B from an input matrix where the features are columns and rows are observations. Optionally, do not normalize.

b1ToB2 :: B1 -> B2 Source #

Normalize the input matrix by column. Here, columns are features.

getSimilarityFromB2 :: B2 -> Int -> Int -> Double Source #

Get the cosine similarity between two rows using B2.