Safe Haskell | None |
---|---|
Language | Haskell2010 |
Exposes some of Spark's joining algorithms.
- join :: Column ref1 key -> Column ref1 value1 -> Column ref2 key -> Column ref2 value2 -> Dataset (key, value1, value2)
- join' :: DynColumn -> DynColumn -> DynColumn -> DynColumn -> DataFrame
- joinInner :: Column ref1 key -> Column ref1 value1 -> Column ref2 key -> Column ref2 value2 -> Dataset (key, value1, value2)
- joinInner' :: DynColumn -> DynColumn -> DynColumn -> DynColumn -> DataFrame
- joinObs :: HasCallStack => Column ref val -> LocalData val' -> Dataset (val, val')
- joinObs' :: DynColumn -> LocalFrame -> DataFrame
Documentation
join :: Column ref1 key -> Column ref1 value1 -> Column ref2 key -> Column ref2 value2 -> Dataset (key, value1, value2) Source #
Standard (inner) join on two sets of data.
join' :: DynColumn -> DynColumn -> DynColumn -> DynColumn -> DataFrame Source #
Untyped version of the standard join.
joinInner :: Column ref1 key -> Column ref1 value1 -> Column ref2 key -> Column ref2 value2 -> Dataset (key, value1, value2) Source #
Explicit inner join.
joinInner' :: DynColumn -> DynColumn -> DynColumn -> DynColumn -> DataFrame Source #
Untyped version of the inner join.
joinObs :: HasCallStack => Column ref val -> LocalData val' -> Dataset (val, val') Source #
Broadcasts an observable alongside a dataset to make it available as an extra column.
joinObs' :: DynColumn -> LocalFrame -> DataFrame Source #
Broadcasts an observable alongside a dataset to make it available as an extra column.
The resulting dataframe has 2 columns:
- one column called values
- one column called broadcast
Note: this is a low-level operation. Users may want to use broadcastObs instead.