-- Hoogle documentation, generated by Haddock -- See Hoogle, http://www.haskell.org/hoogle/ -- | Classical data sets for statistics and machine learning -- -- Classical machine learning and statistics datasets from the UCI -- Machine Learning Repository and other sources. -- -- The datasets package defines two different kinds of datasets: -- -- -- --
--   import Numeric.Datasets (getDataset)
--   import Numeric.Datasets.Iris (iris)
--   import Numeric.Datasets.Abalone (abalone)
--   
--   main = do
--     -- The Iris data set is embedded
--     print (length iris)
--     print (head iris)
--     -- The Abalone dataset is fetched
--     abas <- getDataset abalone
--     print (length abas)
--     print (head abas)
--   
@package datasets @version 0.2.0.3 -- | Old Faithful Geyser Eruption data -- -- Article: http://web.pdx.edu/~jfreder/M212/oldfaithful.pdf -- -- These data from: -- http://www2.stat.duke.edu/courses/Fall02/sta290/datasets/geyser -- -- For more data, see -- http://www.geyserstudy.org/geyser.aspx?pGeyserNo=OLDFAITHFUL module Numeric.Datasets.OldFaithful data OldFaithful OF :: Int -> Double -> Double -> OldFaithful -- | Recording day. 1-8: 1978, 16-23: 1979 [recordingDay] :: OldFaithful -> Int -- | waiting time until next eruption [waiting] :: OldFaithful -> Double -- | duration of eruption in minutes [duration] :: OldFaithful -> Double oldFaithful :: [OldFaithful] -- | Anscombe's quartet -- -- Four datasets with nearly identical statistical properties -- -- Wikipedia article: -- https://en.wikipedia.org/wiki/Anscombe%27s_quartet module Numeric.Datasets.Anscombe anscombe :: [[(Double, Double)]] anscombe1 :: [(Double, Double)] anscombe2 :: [(Double, Double)] anscombe3 :: [(Double, Double)] anscombe4 :: [(Double, Double)] -- | The datasets package defines two different kinds of datasets: -- -- -- -- This module defines the getDataset function for fetching -- datasets and utilities for defining new data sets. It is only necessary -- to import this module when using fetched data sets. Embedded data sets -- can be imported directly. 
module Numeric.Datasets -- | Load a dataset, using the system temporary directory as a cache getDataset :: Dataset a -> IO [a] -- | A dataset is defined as a function from the caching directory (the -- directory for caching downloaded datasets) to the IO action that loads -- the data type Dataset a = FilePath -> IO [a] data Source URL :: String -> Source -- | Define a dataset from a pre-processing function and a source for a CSV -- file csvDatasetPreprocess :: FromRecord a => (ByteString -> ByteString) -> Source -> Dataset a -- | Define a dataset from a source for a CSV file csvDataset :: FromRecord a => Source -> Dataset a jsonDataset :: FromJSON a => Source -> Dataset a -- | Get a ByteString from the specified Source getFileFromSource :: FilePath -> Source -> IO (ByteString) parseCSV :: FromRecord a => (ByteString -> ByteString) -> ByteString -> [a] parseJSON :: FromJSON a => ByteString -> [a] -- | Turn dashes to CamelCase dashToCamelCase :: String -> String -- | Parse a field, first turning dashes to CamelCase parseDashToCamelField :: Read a => Field -> Parser a -- | Parse something, based on its read instance parseReadField :: Read a => Field -> Parser a -- | Drop lines from a bytestring dropLines :: Int -> ByteString -> ByteString -- | Turn US-style decimals starting with a period (e.g. .2) into something -- Haskell can parse (e.g. 
0.2) fixAmericanDecimals :: ByteString -> ByteString -- | Convert a Fixed-width format to a CSV fixedWidthToCSV :: ByteString -> ByteString -- | Abalone data set -- -- UCI ML Repository link -- https://archive.ics.uci.edu/ml/datasets/abalone module Numeric.Datasets.Abalone data Sex M :: Sex F :: Sex I :: Sex data Abalone Abalone :: Sex -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Int -> Abalone [sex] :: Abalone -> Sex [abaloneLength] :: Abalone -> Double [diameter] :: Abalone -> Double [height] :: Abalone -> Double [wholeWeight] :: Abalone -> Double [shuckedWeight] :: Abalone -> Double [visceraWeight] :: Abalone -> Double [shellWeight] :: Abalone -> Double [rings] :: Abalone -> Int abalone :: Dataset Abalone instance GHC.Generics.Generic Numeric.Datasets.Abalone.Abalone instance GHC.Read.Read Numeric.Datasets.Abalone.Abalone instance GHC.Show.Show Numeric.Datasets.Abalone.Abalone instance GHC.Generics.Generic Numeric.Datasets.Abalone.Sex instance GHC.Classes.Eq Numeric.Datasets.Abalone.Sex instance GHC.Read.Read Numeric.Datasets.Abalone.Sex instance GHC.Show.Show Numeric.Datasets.Abalone.Sex instance Data.Csv.Conversion.FromField Numeric.Datasets.Abalone.Sex instance Data.Csv.Conversion.FromRecord Numeric.Datasets.Abalone.Abalone -- | Adult (AKA Census Income) dataset. 
-- -- UCI ML Repository link -- http://archive.ics.uci.edu/ml/datasets/Adult module Numeric.Datasets.Adult data WorkClass Private :: WorkClass SelfEmpNotInc :: WorkClass SelfEmpInc :: WorkClass FederalGov :: WorkClass LocalGov :: WorkClass StateGov :: WorkClass WithoutPay :: WorkClass NeverWorked :: WorkClass data MaritalStatus MarriedCivSpouse :: MaritalStatus Divorced :: MaritalStatus NeverMarried :: MaritalStatus Separated :: MaritalStatus Widowed :: MaritalStatus MarriedSpouseAbsent :: MaritalStatus MarriedAFSpouse :: MaritalStatus data Occupation TechSupport :: Occupation CraftRepair :: Occupation OtherService :: Occupation Sales :: Occupation ExecManagerial :: Occupation ProfSpecialty :: Occupation HandlersCleaners :: Occupation MachineOpInspct :: Occupation AdmClerical :: Occupation FarmingFishing :: Occupation TransportMoving :: Occupation PrivHouseServ :: Occupation ProtectiveServ :: Occupation ArmedForces :: Occupation data Relationship Wife :: Relationship OwnChild :: Relationship Husband :: Relationship NotInFamily :: Relationship OtherRelative :: Relationship Unmarried :: Relationship data Race White :: Race AsianPacIslander :: Race AmerIndianEskimo :: Race Other :: Race Black :: Race data Sex Female :: Sex Male :: Sex data Income GT50K :: Income LE50K :: Income data Adult Adult :: Int -> Maybe WorkClass -> Int -> Text -> Int -> MaritalStatus -> Maybe Occupation -> Relationship -> Race -> Sex -> Int -> Int -> Int -> Text -> Income -> Adult [age] :: Adult -> Int [workClass] :: Adult -> Maybe WorkClass [finalWeight] :: Adult -> Int [education] :: Adult -> Text [educationNum] :: Adult -> Int [maritalStatus] :: Adult -> MaritalStatus [occupation] :: Adult -> Maybe Occupation [relationship] :: Adult -> Relationship [race] :: Adult -> Race [sex] :: Adult -> Sex [capitalGain] :: Adult -> Int [capitalLoss] :: Adult -> Int [hoursPerWeek] :: Adult -> Int [nativeCountry] :: Adult -> Text [income] :: Adult -> Income adult :: Dataset Adult adultTestSet :: Dataset 
Adult instance GHC.Generics.Generic Numeric.Datasets.Adult.Adult instance GHC.Read.Read Numeric.Datasets.Adult.Adult instance GHC.Show.Show Numeric.Datasets.Adult.Adult instance GHC.Generics.Generic Numeric.Datasets.Adult.Income instance GHC.Classes.Eq Numeric.Datasets.Adult.Income instance GHC.Read.Read Numeric.Datasets.Adult.Income instance GHC.Show.Show Numeric.Datasets.Adult.Income instance GHC.Generics.Generic Numeric.Datasets.Adult.Sex instance GHC.Classes.Eq Numeric.Datasets.Adult.Sex instance GHC.Read.Read Numeric.Datasets.Adult.Sex instance GHC.Show.Show Numeric.Datasets.Adult.Sex instance GHC.Generics.Generic Numeric.Datasets.Adult.Race instance GHC.Classes.Eq Numeric.Datasets.Adult.Race instance GHC.Read.Read Numeric.Datasets.Adult.Race instance GHC.Show.Show Numeric.Datasets.Adult.Race instance GHC.Generics.Generic Numeric.Datasets.Adult.Relationship instance GHC.Classes.Eq Numeric.Datasets.Adult.Relationship instance GHC.Read.Read Numeric.Datasets.Adult.Relationship instance GHC.Show.Show Numeric.Datasets.Adult.Relationship instance GHC.Generics.Generic Numeric.Datasets.Adult.Occupation instance GHC.Classes.Eq Numeric.Datasets.Adult.Occupation instance GHC.Read.Read Numeric.Datasets.Adult.Occupation instance GHC.Show.Show Numeric.Datasets.Adult.Occupation instance GHC.Generics.Generic Numeric.Datasets.Adult.MaritalStatus instance GHC.Classes.Eq Numeric.Datasets.Adult.MaritalStatus instance GHC.Read.Read Numeric.Datasets.Adult.MaritalStatus instance GHC.Show.Show Numeric.Datasets.Adult.MaritalStatus instance GHC.Generics.Generic Numeric.Datasets.Adult.WorkClass instance GHC.Classes.Eq Numeric.Datasets.Adult.WorkClass instance GHC.Read.Read Numeric.Datasets.Adult.WorkClass instance GHC.Show.Show Numeric.Datasets.Adult.WorkClass instance Data.Csv.Conversion.FromField Numeric.Datasets.Adult.WorkClass instance Data.Csv.Conversion.FromField Numeric.Datasets.Adult.MaritalStatus instance Data.Csv.Conversion.FromField Numeric.Datasets.Adult.Occupation instance 
Data.Csv.Conversion.FromField Numeric.Datasets.Adult.Relationship instance Data.Csv.Conversion.FromField Numeric.Datasets.Adult.Race instance Data.Csv.Conversion.FromField Numeric.Datasets.Adult.Sex instance Data.Csv.Conversion.FromField Numeric.Datasets.Adult.Income instance Data.Csv.Conversion.FromRecord Numeric.Datasets.Adult.Adult -- | BostonHousing Data set -- -- scikit-learn calls this "boston" and UCI calls it Housing -- -- UCI ML Repository link -- http://mlr.cs.umass.edu/ml/datasets/housing module Numeric.Datasets.BostonHousing data BostonHousing BostonHousing :: Double -> Double -> Double -> Bool -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> BostonHousing [crimeRate] :: BostonHousing -> Double [zoned] :: BostonHousing -> Double [industrial] :: BostonHousing -> Double [charlesRiver] :: BostonHousing -> Bool [nitricOxides] :: BostonHousing -> Double [rooms] :: BostonHousing -> Double [age] :: BostonHousing -> Double [distance] :: BostonHousing -> Double [radialHwy] :: BostonHousing -> Double [tax] :: BostonHousing -> Double [ptRatio] :: BostonHousing -> Double [b] :: BostonHousing -> Double [lowerStatus] :: BostonHousing -> Double [medianValue] :: BostonHousing -> Double bostonHousing :: Dataset BostonHousing instance GHC.Generics.Generic Numeric.Datasets.BostonHousing.BostonHousing instance GHC.Read.Read Numeric.Datasets.BostonHousing.BostonHousing instance GHC.Show.Show Numeric.Datasets.BostonHousing.BostonHousing instance Data.Csv.Conversion.FromRecord Numeric.Datasets.BostonHousing.BostonHousing -- | Breast Cancer Wisconsin (Diagnostic) Data Set -- -- Repository link: -- http://mlr.cs.umass.edu/ml/datasets/Breast+Cancer+Wisconsin+%28Diagnostic%29 module Numeric.Datasets.BreastCancerWisconsin data Diagnosis Malignant :: Diagnosis Benign :: Diagnosis data Prognosis Recurrent :: Prognosis Nonrecurrent :: Prognosis intToDiagnosis :: Int -> Diagnosis data BreastCancerEntry BreastCancerEntry :: Int -> 
Int -> Int -> Int -> Int -> Int -> Maybe Int -> Int -> Int -> Int -> Diagnosis -> BreastCancerEntry [sampleCodeNumber] :: BreastCancerEntry -> Int [clumpThickness] :: BreastCancerEntry -> Int [uniformityCellSize] :: BreastCancerEntry -> Int [uniformityCellShape] :: BreastCancerEntry -> Int [marginalAdhesion] :: BreastCancerEntry -> Int [singleEpithelialCellSize] :: BreastCancerEntry -> Int [bareNuclei] :: BreastCancerEntry -> Maybe Int [blandChromatin] :: BreastCancerEntry -> Int [normalNucleoli] :: BreastCancerEntry -> Int [mitosis] :: BreastCancerEntry -> Int [sampleClass] :: BreastCancerEntry -> Diagnosis breastCancerDatabase :: Dataset BreastCancerEntry data DiagnosticBreastCancer DiagnosticBreastCancer :: Int -> Diagnosis -> CellFeatures -> DiagnosticBreastCancer [diagnosticID] :: DiagnosticBreastCancer -> Int [diagnosis] :: DiagnosticBreastCancer -> Diagnosis [diagnosticCells] :: DiagnosticBreastCancer -> CellFeatures data PrognosticBreastCancer PrognosticBreastCancer :: Int -> Prognosis -> CellFeatures -> PrognosticBreastCancer [prognosticID] :: PrognosticBreastCancer -> Int [prognosis] :: PrognosticBreastCancer -> Prognosis [prognosticCells] :: PrognosticBreastCancer -> CellFeatures data CellFeatures CellFeatures :: Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> CellFeatures [radius] :: CellFeatures -> Double [perimeter] :: CellFeatures -> Double [area] :: CellFeatures -> Double [smoothness] :: CellFeatures -> Double [compactness] :: CellFeatures -> Double [concavity] :: CellFeatures -> Double [concavePoints] :: CellFeatures -> Double [symmetry] :: CellFeatures -> Double [fractalDimension] :: CellFeatures -> Double charToDiagnosis :: String -> Diagnosis charToPrognosis :: String -> Prognosis diagnosticBreastCancer :: Dataset DiagnosticBreastCancer prognosticBreastCancer :: Dataset PrognosticBreastCancer instance GHC.Generics.Generic Numeric.Datasets.BreastCancerWisconsin.DiagnosticBreastCancer instance 
GHC.Read.Read Numeric.Datasets.BreastCancerWisconsin.DiagnosticBreastCancer instance GHC.Show.Show Numeric.Datasets.BreastCancerWisconsin.DiagnosticBreastCancer instance GHC.Generics.Generic Numeric.Datasets.BreastCancerWisconsin.PrognosticBreastCancer instance GHC.Read.Read Numeric.Datasets.BreastCancerWisconsin.PrognosticBreastCancer instance GHC.Show.Show Numeric.Datasets.BreastCancerWisconsin.PrognosticBreastCancer instance GHC.Generics.Generic Numeric.Datasets.BreastCancerWisconsin.CellFeatures instance GHC.Read.Read Numeric.Datasets.BreastCancerWisconsin.CellFeatures instance GHC.Show.Show Numeric.Datasets.BreastCancerWisconsin.CellFeatures instance GHC.Generics.Generic Numeric.Datasets.BreastCancerWisconsin.BreastCancerEntry instance GHC.Read.Read Numeric.Datasets.BreastCancerWisconsin.BreastCancerEntry instance GHC.Show.Show Numeric.Datasets.BreastCancerWisconsin.BreastCancerEntry instance GHC.Generics.Generic Numeric.Datasets.BreastCancerWisconsin.Prognosis instance GHC.Classes.Eq Numeric.Datasets.BreastCancerWisconsin.Prognosis instance GHC.Read.Read Numeric.Datasets.BreastCancerWisconsin.Prognosis instance GHC.Show.Show Numeric.Datasets.BreastCancerWisconsin.Prognosis instance GHC.Generics.Generic Numeric.Datasets.BreastCancerWisconsin.Diagnosis instance GHC.Classes.Eq Numeric.Datasets.BreastCancerWisconsin.Diagnosis instance GHC.Read.Read Numeric.Datasets.BreastCancerWisconsin.Diagnosis instance GHC.Show.Show Numeric.Datasets.BreastCancerWisconsin.Diagnosis instance Data.Csv.Conversion.FromRecord Numeric.Datasets.BreastCancerWisconsin.BreastCancerEntry instance Data.Csv.Conversion.FromRecord Numeric.Datasets.BreastCancerWisconsin.DiagnosticBreastCancer instance Data.Csv.Conversion.FromRecord Numeric.Datasets.BreastCancerWisconsin.PrognosticBreastCancer instance Data.Csv.Conversion.FromRecord Numeric.Datasets.BreastCancerWisconsin.CellFeatures -- | Car dataset -- -- UCI ML Repository link -- https://archive.ics.uci.edu/ml/datasets/car module 
Numeric.Datasets.Car data RelScore Low :: RelScore Med :: RelScore High :: RelScore VeryHigh :: RelScore data RelSize Small :: RelSize Medium :: RelSize Big :: RelSize data Acceptability Unacceptable :: Acceptability Acceptable :: Acceptability Good :: Acceptability VeryGood :: Acceptability data Count N :: Int -> Count NOrMore :: Int -> Count More :: Count data Car Car :: RelScore -> RelScore -> Count -> Count -> RelSize -> RelScore -> Acceptability -> Car [buying] :: Car -> RelScore [maintenance] :: Car -> RelScore [doors] :: Car -> Count [persons] :: Car -> Count [luggageBoot] :: Car -> RelSize [safety] :: Car -> RelScore [acceptability] :: Car -> Acceptability car :: Dataset Car instance GHC.Generics.Generic Numeric.Datasets.Car.Car instance GHC.Read.Read Numeric.Datasets.Car.Car instance GHC.Show.Show Numeric.Datasets.Car.Car instance GHC.Generics.Generic Numeric.Datasets.Car.Count instance GHC.Classes.Eq Numeric.Datasets.Car.Count instance GHC.Read.Read Numeric.Datasets.Car.Count instance GHC.Show.Show Numeric.Datasets.Car.Count instance GHC.Generics.Generic Numeric.Datasets.Car.Acceptability instance GHC.Classes.Eq Numeric.Datasets.Car.Acceptability instance GHC.Read.Read Numeric.Datasets.Car.Acceptability instance GHC.Show.Show Numeric.Datasets.Car.Acceptability instance GHC.Generics.Generic Numeric.Datasets.Car.RelSize instance GHC.Classes.Eq Numeric.Datasets.Car.RelSize instance GHC.Read.Read Numeric.Datasets.Car.RelSize instance GHC.Show.Show Numeric.Datasets.Car.RelSize instance GHC.Generics.Generic Numeric.Datasets.Car.RelScore instance GHC.Classes.Eq Numeric.Datasets.Car.RelScore instance GHC.Read.Read Numeric.Datasets.Car.RelScore instance GHC.Show.Show Numeric.Datasets.Car.RelScore instance Data.Csv.Conversion.FromField Numeric.Datasets.Car.RelScore instance Data.Csv.Conversion.FromField Numeric.Datasets.Car.RelSize instance Data.Csv.Conversion.FromField Numeric.Datasets.Car.Acceptability instance Data.Csv.Conversion.FromField 
Numeric.Datasets.Car.Count instance Data.Csv.Conversion.FromRecord Numeric.Datasets.Car.Car -- | The classical Iris dataset, due to R.A. Fisher. -- -- UCI ML Repository link -- https://archive.ics.uci.edu/ml/datasets/Iris module Numeric.Datasets.Iris data IrisClass Setosa :: IrisClass Versicolor :: IrisClass Virginica :: IrisClass data Iris Iris :: Double -> Double -> Double -> Double -> IrisClass -> Iris [sepalLength] :: Iris -> Double [sepalWidth] :: Iris -> Double [petalLength] :: Iris -> Double [petalWidth] :: Iris -> Double [irisClass] :: Iris -> IrisClass iris :: [Iris] instance GHC.Generics.Generic Numeric.Datasets.Iris.Iris instance GHC.Read.Read Numeric.Datasets.Iris.Iris instance GHC.Show.Show Numeric.Datasets.Iris.Iris instance GHC.Generics.Generic Numeric.Datasets.Iris.IrisClass instance GHC.Classes.Eq Numeric.Datasets.Iris.IrisClass instance GHC.Read.Read Numeric.Datasets.Iris.IrisClass instance GHC.Show.Show Numeric.Datasets.Iris.IrisClass instance Data.Csv.Conversion.FromField Numeric.Datasets.Iris.IrisClass instance Data.Csv.Conversion.FromRecord Numeric.Datasets.Iris.Iris -- | Michelson's speed of light dataset - five repeated measurements of the -- speed of light. -- -- Data from -- https://github.com/datasets-io/michelson-speed-of-light -- -- The embedded dataset is Copyright (c) 2015 The Compute.io Authors. module Numeric.Datasets.Michelson michelson :: [[Double]] -- | Florence Nightingale's count of injuries in the Crimean War, used for -- her rose plots -- -- Data from https://github.com/datasets-io/nightingales-rose -- -- The embedded dataset is Copyright (c) 2015 The Compute.io Authors. 
module Numeric.Datasets.Nightingale data Nightingale Nightingale :: UTCTime -> Int -> Int -> Int -> Int -> Nightingale [date] :: Nightingale -> UTCTime [army_size] :: Nightingale -> Int [disease] :: Nightingale -> Int [wounds] :: Nightingale -> Int [other] :: Nightingale -> Int nightingale :: [Nightingale] instance GHC.Generics.Generic Numeric.Datasets.Nightingale.Nightingale instance GHC.Read.Read Numeric.Datasets.Nightingale.Nightingale instance GHC.Show.Show Numeric.Datasets.Nightingale.Nightingale instance Data.Aeson.Types.FromJSON.FromJSON Numeric.Datasets.Nightingale.Nightingale -- | Wine Data set -- -- UCI ML Repository link http://mlr.cs.umass.edu/ml/datasets/Wine module Numeric.Datasets.Wine data Wine Wine :: Int -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Double -> Int -> Wine [wineClass] :: Wine -> Int [alcohol] :: Wine -> Double [malicAcid] :: Wine -> Double [ash] :: Wine -> Double [ashAlcalinity] :: Wine -> Double [magnesium] :: Wine -> Double [totalPhenols] :: Wine -> Double [flavanoids] :: Wine -> Double [nonflavanoidPhenols] :: Wine -> Double [proanthocyanins] :: Wine -> Double [colorIntensity] :: Wine -> Double [hue] :: Wine -> Double [dilutedOD280toOD315] :: Wine -> Double [proline] :: Wine -> Int wine :: Dataset Wine instance GHC.Generics.Generic Numeric.Datasets.Wine.Wine instance GHC.Read.Read Numeric.Datasets.Wine.Wine instance GHC.Show.Show Numeric.Datasets.Wine.Wine instance Data.Csv.Conversion.FromRecord Numeric.Datasets.Wine.Wine