{- Copyright (C) 2010 Scott R Parish Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. -} -- | A driver for MongoDB -- -- This module lets you connect to MongoDB, do inserts, queries, -- updates, etc. Also has many convience functions inspired by HDBC -- such as more easily converting between the BsonValue types and -- native Haskell types. -- -- * Tutorial for this driver: -- -- -- * Map/Reduce example for this driver: -- -- -- * MongoDB: -- -- module Database.MongoDB ( -- * Connection Connection, ConnectOpt(..), connect, connectOnPort, conClose, disconnect, dropDatabase, connectCluster, connectClusterOnPort, serverInfo, serverShutdown, databasesInfo, databaseNames, -- * Database Database, MongoDBCollectionInvalid, Password, Username, ColCreateOpt(..), collectionNames, createCollection, dropCollection, renameCollection, runCommand, validateCollection, auth, addUser, login, logout, -- * Collection Collection, FieldSelector, FullCollection, NumToSkip, NumToReturn, Selector, QueryOpt(..), UpdateFlag(..), count, countMatching, delete, insert, insertMany, query, remove, update, save, -- * Convenience collection operations find, findOne, quickFind, quickFind', -- * Query Helpers whereClause, -- * Cursor Cursor, allDocs, allDocs', finish, nextDoc, -- * Index Key, Unique, Direction(..), createIndex, dropIndex, dropIndexes, indexInformation, -- * Map-Reduce MapReduceOpt(..), mapReduce, mapReduceWScopes, runMapReduce, runMapReduceWScopes, mapReduceResults, ) where import Control.Exception import Control.Monad import Data.Binary() import Data.Binary.Get import Data.Binary.Put import Data.Bits import Data.ByteString.Char8 (pack) import Data.ByteString.Internal (c2w) import qualified Data.ByteString.Lazy as L import qualified Data.ByteString.Lazy.UTF8 as L8 import Data.Digest.OpenSSL.MD5 import Data.Int import Data.IORef import qualified Data.List as List import Data.Maybe import Data.Typeable import Database.MongoDB.BSON as BSON import Database.MongoDB.Util import qualified Network import Network.Socket hiding (connect, send, sendTo, recv, recvFrom) import Prelude hiding (getContents) import System.IO import System.IO.Unsafe import System.Random -- | A list of handles to database connections data Connection = Connection { cHandle :: IORef Handle, cRand :: IORef [Int], cOidGen :: ObjectIdGen } data ConnectOpt = SlaveOK -- ^ It's fine to connect to the slave deriving (Show, Eq) -- | Establish a connection to a MongoDB server connect :: HostName -> [ConnectOpt] -> IO Connection connect = flip connectOnPort (Network.PortNumber 27017) -- | Establish 
connections to a list of MongoDB servers connectCluster :: [HostName] -> [ConnectOpt] -> IO Connection connectCluster xs = connectClusterOnPort (fmap (flip (,) $ Network.PortNumber 27017) xs) -- | Establish connections to a list of MongoDB servers specifying each port. connectClusterOnPort :: [(HostName, Network.PortID)] -> [ConnectOpt] -> IO Connection connectClusterOnPort [] _ = throwOpFailure "No hostnames in list" connectClusterOnPort servers opts = newConnection servers opts -- | Establish a connection to a MongoDB server on a non-standard port connectOnPort :: HostName -> Network.PortID -> [ConnectOpt] -> IO Connection connectOnPort host port = newConnection [(host, port)] newConnection :: [(HostName, Network.PortID)] -> [ConnectOpt] -> IO Connection newConnection servers opts = do r <- newStdGen let ns = randomRs (fromIntegral (minBound :: Int32), fromIntegral (maxBound :: Int32)) r nsRef <- newIORef ns hRef <- openHandle (head servers) >>= newIORef oidGen <- mkObjectIdGen let c = Connection hRef nsRef oidGen res <- isMaster c if fromBson (fromLookup $ List.lookup (s2L "ismaster") res) == (1::Int) || isJust (List.elemIndex SlaveOK opts) then return c else case List.lookup (s2L "remote") res of Nothing -> throwConFailure "Couldn't find master to connect to" Just server -> do hRef' <- openHandle (splitHostPort $ fromBson server) >>= newIORef return $ c {cHandle = hRef'} openHandle :: (HostName, Network.PortID) -> IO Handle openHandle (host, port) = do h <- Network.connectTo host port hSetBuffering h NoBuffering return h getHandle :: Connection -> IO Handle getHandle c = readIORef $ cHandle c cPut :: Connection -> L.ByteString -> IO () cPut c msg = getHandle c >>= flip L.hPut msg -- | Close database connection conClose :: Connection -> IO () conClose c = readIORef (cHandle c) >>= hClose -- | Information about the databases on the server. databasesInfo :: Connection -> IO BsonDoc databasesInfo c = runCommand c (s2L "admin") $ toBsonDoc [("listDatabases", BsonInt32 1)] -- | Return a list of database names on the server. databaseNames :: Connection -> IO [Database] databaseNames c = do info <- databasesInfo c let (BsonArray dbs) = fromLookup $ List.lookup (s2L "databases") info names = mapMaybe (List.lookup (s2L "name") . fromBson) dbs return $ List.map fromBson (names::[BsonValue]) -- | Alias for 'conClose' disconnect :: Connection -> IO () disconnect = conClose -- | Drop a database. dropDatabase :: Connection -> Database -> IO () dropDatabase c db = do _ <- runCommand c db $ toBsonDoc [("dropDatabase", BsonInt32 1)] return () isMaster :: Connection -> IO BsonDoc isMaster c = runCommand c (s2L "admin") $ toBsonDoc [("ismaster", BsonInt32 1)] -- | Get information about the MongoDB server we're connected to. serverInfo :: Connection -> IO BsonDoc serverInfo c = runCommand c (s2L "admin") $ toBsonDoc [("buildinfo", BsonInt32 1)] -- | Shut down the MongoDB server. -- -- Force a clean exit, flushing and closing all data files. -- Note that it will wait until all ongoing operations are complete. serverShutdown :: Connection -> IO BsonDoc serverShutdown c = runCommand c (s2L "admin") $ toBsonDoc [("shutdown", BsonInt32 1)] -- | Return a list of collections in /Database/. collectionNames :: Connection -> Database -> IO [FullCollection] collectionNames c db = do docs <- quickFind' c (L.append db $ s2L ".system.namespaces") empty let names = flip List.map docs $ fromBson . fromLookup . 
List.lookup (s2L "name") return $ List.filter (L.notElem $ c2w '$') names data ColCreateOpt = CCOSize Int64 -- ^ Desired initial size for the -- collection (in bytes). must be -- less than or equal to -- 10000000000. For capped -- collections this size is the max -- size of the collection. | CCOCapped Bool -- ^ If 'True', this is a capped collection. | CCOMax Int64 -- ^ Maximum number of objects if capped. deriving (Show, Eq) colCreateOptToBson :: ColCreateOpt -> (String, BsonValue) colCreateOptToBson (CCOSize sz) = ("size", toBson sz) colCreateOptToBson (CCOCapped b) = ("capped", toBson b) colCreateOptToBson (CCOMax m) = ("max", toBson m) -- | Create a new collection in this database. -- -- Normally collection creation is automatic. This function should -- only be needed if you want to specify 'ColCreateOpt's on creation. -- 'MongoDBCollectionInvalid' is thrown if the collection already -- exists. createCollection :: Connection -> FullCollection -> [ColCreateOpt] -> IO () createCollection c col opts = do (db, col') <- validateCollectionName col dbcols <- collectionNames c db when (col `List.elem` dbcols) $ throwColInvalid $ "Collection already exists: " ++ show col let cmd = ("create", toBson col') : List.map colCreateOptToBson opts _ <- runCommand c db $ toBsonDoc cmd return () -- | Drop a collection. dropCollection :: Connection -> FullCollection -> IO () dropCollection c col = do let (db, col') = splitFullCol col _ <- runCommand c db $ toBsonDoc [("drop", toBson col')] return () -- | Rename a collection--first /FullCollection/ argument is the -- existing name, the second is the new name. At the moment this command -- can also be used to move a collection between databases. renameCollection :: Connection -> FullCollection -> FullCollection -> IO () renameCollection c col newName = do _ <- validateCollectionName col _ <- runCommand c (s2L "admin") $ toBsonDoc [("renameCollection", toBson col), ("to", toBson newName)] return () -- | Return a string of validation info about the collection. -- -- Example output (note this probably can/will change with different -- versions of the server): -- -- > validate -- > details: 0x7fe5cc2c1da4 ofs:e7da4 -- > firstExtent:0:24100 ns:test.foo.bar -- > lastExtent:0:24100 ns:test.foo.bar -- > # extents:1 -- > datasize?:180 nrecords?:5 lastExtentSize:1024 -- > padding:1 -- > first extent: -- > loc:0:24100 xnext:null xprev:null -- > nsdiag:test.foo.bar -- > size:1024 firstRecord:0:241e4 lastRecord:0:24280 -- > 5 objects found, nobj:5 -- > 260 bytes data w/headers -- > 180 bytes data wout/headers -- > deletedList: 0100100000000000000 -- > deleted: n: 4 size: 588 -- > nIndexes:1 -- > test.foo.bar.$_id_ keys:5 validateCollection :: Connection -> FullCollection -> IO String validateCollection c col = do let (db, col') = splitFullCol col res <- runCommand c db $ toBsonDoc [("validate", toBson col')] return $ fromBson $ fromLookup $ List.lookup (s2L "result") res splitFullCol :: FullCollection -> (Database, Collection) splitFullCol col = (L.takeWhile (c2w '.' /=) col, L.tail $ L.dropWhile (c2w '.' /=) col) splitHostPort :: String -> (HostName, Network.PortID) splitHostPort hp = (host, port) where host = List.takeWhile (':' /=) hp port = case List.dropWhile (':' /=) hp of "" -> Network.PortNumber 27017 pstr -> Network.Service $ List.tail pstr -- | Run a database command. Usually this is unneeded as driver wraps -- all of the commands for you (eg 'createCollection', -- 'dropCollection', etc). 
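--
-- A minimal usage sketch (illustrative, not from the original
-- documentation): it assumes a live 'Connection' @con@, the
-- @OverloadedStrings@ extension for the lazy 'Database' name, and
-- 'toBsonDoc' and 'BsonInt32' from "Database.MongoDB.BSON". This is
-- the same command that 'serverInfo' wraps:
--
-- > info <- runCommand con "admin" $ toBsonDoc [("buildinfo", BsonInt32 1)]
-- > print info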
runCommand :: Connection -> Database -> BsonDoc -> IO BsonDoc runCommand c db cmd = do mres <- findOne c (L.append db $ s2L ".$cmd") cmd let res = fromLookup mres when (BsonDouble 1.0 /= fromLookup (List.lookup (s2L "ok") res)) $ throwOpFailure $ "command \"" ++ show cmd ++ "\" failed: " ++ fromBson (fromLookup $ List.lookup (s2L "errmsg") res) return res -- | An Iterator over the results of a query. Use 'nextDoc' to get each -- successive result document, or 'allDocs' or 'allDocs'' to get lazy or -- strict lists of results. data Cursor = Cursor { curCon :: Connection, curID :: IORef Int64, curNumToRet :: Int32, curCol :: FullCollection, curDocBytes :: IORef L.ByteString, curClosed :: IORef Bool } data Opcode = OPReply -- 1 Reply to a client request. responseTo is set | OPMsg -- 1000 generic msg command followed by a string | OPUpdate -- 2001 update document | OPInsert -- 2002 insert new document | OPGetByOid -- 2003 is this used? | OPQuery -- 2004 query a collection | OPGetMore -- 2005 Get more data from a query. See Cursors | OPDelete -- 2006 Delete documents | OPKillCursors -- 2007 Tell database client is done with a cursor deriving (Show, Eq) data MongoDBInternalError = MongoDBInternalError String deriving (Eq, Show, Read) mongoDBInternalError :: TyCon mongoDBInternalError = mkTyCon "Database.MongoDB.MongoDBInternalError" instance Typeable MongoDBInternalError where typeOf _ = mkTyConApp mongoDBInternalError [] instance Exception MongoDBInternalError data MongoDBCollectionInvalid = MongoDBCollectionInvalid String deriving (Eq, Show, Read) mongoDBCollectionInvalid :: TyCon mongoDBCollectionInvalid = mkTyCon "Database.MongoDB.MongoDBcollectionInvalid" instance Typeable MongoDBCollectionInvalid where typeOf _ = mkTyConApp mongoDBCollectionInvalid [] instance Exception MongoDBCollectionInvalid throwColInvalid :: String -> a throwColInvalid = throw . MongoDBCollectionInvalid data MongoDBOperationFailure = MongoDBOperationFailure String deriving (Eq, Show, Read) mongoDBOperationFailure :: TyCon mongoDBOperationFailure = mkTyCon "Database.MongoDB.MongoDBoperationFailure" instance Typeable MongoDBOperationFailure where typeOf _ = mkTyConApp mongoDBOperationFailure [] instance Exception MongoDBOperationFailure throwOpFailure :: String -> a throwOpFailure = throw . MongoDBOperationFailure data MongoDBConnectionFailure = MongoDBConnectionFailure String deriving (Eq, Show, Read) mongoDBConnectionFailure :: TyCon mongoDBConnectionFailure = mkTyCon "Database.MongoDB.MongoDBconnectionFailure" instance Typeable MongoDBConnectionFailure where typeOf _ = mkTyConApp mongoDBConnectionFailure [] instance Exception MongoDBConnectionFailure throwConFailure :: String -> a throwConFailure = throw . MongoDBConnectionFailure fromOpcode :: Opcode -> Int32 fromOpcode OPReply = 1 fromOpcode OPMsg = 1000 fromOpcode OPUpdate = 2001 fromOpcode OPInsert = 2002 fromOpcode OPGetByOid = 2003 fromOpcode OPQuery = 2004 fromOpcode OPGetMore = 2005 fromOpcode OPDelete = 2006 fromOpcode OPKillCursors = 2007 toOpcode :: Int32 -> Opcode toOpcode 1 = OPReply toOpcode 1000 = OPMsg toOpcode 2001 = OPUpdate toOpcode 2002 = OPInsert toOpcode 2003 = OPGetByOid toOpcode 2004 = OPQuery toOpcode 2005 = OPGetMore toOpcode 2006 = OPDelete toOpcode 2007 = OPKillCursors toOpcode n = throw $ MongoDBInternalError $ "Got unexpected Opcode: " ++ show n -- | The name of a database. type Database = L8.ByteString -- | The full collection name. 
-- The full collection name is the concatenation of the database name
-- with the collection name, using a @.@ for the concatenation. For
-- example, for the database @foo@ and the collection @bar@, the full
-- collection name is @foo.bar@.
type FullCollection = L8.ByteString

-- | The same as 'FullCollection' but without the 'Database' prefix.
type Collection = L8.ByteString

-- | A 'BsonDoc' representing restrictions for a query much like the
-- /where/ part of an SQL query.
type Selector = BsonDoc

-- | A list of field names that limits the fields in the returned
-- documents. The list can contain zero or more elements, each of
-- which is the name of a field that should be returned. An empty list
-- means that no limiting is done and all fields are returned.
type FieldSelector = [L8.ByteString]

type RequestID = Int32

-- | Sets the number of documents to omit - starting from the first
-- document in the resulting dataset - when returning the result of
-- the query.
type NumToSkip = Int32

-- | This controls how many documents are returned at a time. The
-- cursor works by requesting /NumToReturn/ documents, which are then
-- immediately all transferred over the network; these are held locally
-- until those /NumToReturn/ are all consumed, and then the network
-- will be hit again for the next /NumToReturn/ documents.
--
-- If the value @0@ is given, the database will choose the number of
-- documents to return.
--
-- Otherwise, choosing a good value is very dependent on the document size
-- and the way the cursor is being used.
type NumToReturn = Int32

type Username = String
type Password = String
type JSCode = L8.ByteString

-- | Options that control the behavior of a 'query' operation.
data QueryOpt = QOTailableCursor
              | QOSlaveOK
              | QOOpLogReplay
              | QONoCursorTimeout
              deriving (Show)

fromQueryOpts :: [QueryOpt] -> Int32
fromQueryOpts opts = List.foldl (.|.) 0 $ fmap toVal opts
    where
      toVal QOTailableCursor = 2
      toVal QOSlaveOK = 4
      toVal QOOpLogReplay = 8
      toVal QONoCursorTimeout = 16

-- | Options that affect the behavior of an 'update' operation.
data UpdateFlag = UFUpsert
                | UFMultiupdate
                deriving (Show, Enum)

fromUpdateFlags :: [UpdateFlag] -> Int32
fromUpdateFlags flags = List.foldl (.|.) 0 $
                        flip fmap flags $ (1 `shiftL`) . fromEnum

-- | Return the number of documents in /FullCollection/.
count :: Connection -> FullCollection -> IO Integer
count c col = countMatching c col empty

-- | Return the number of documents in /FullCollection/ matching /Selector/.
countMatching :: Connection -> FullCollection -> Selector -> IO Integer
countMatching c col sel = do
  let (db, col') = splitFullCol col
  res <- runCommand c db $ toBsonDoc [("count", toBson col'),
                                      ("query", toBson sel)]
  let cnt = (fromBson $ fromLookup $ List.lookup (s2L "n") res :: Double)
  return $ truncate cnt

-- | Delete documents matching /Selector/ from the given /FullCollection/.
delete :: Connection -> FullCollection -> Selector -> IO RequestID
delete c col sel = do
  let body = runPut $ do
               putI32 0
               putCol col
               putI32 0
               putBsonDoc sel
  (reqID, msg) <- packMsg c OPDelete body
  cPut c msg
  return reqID

-- | An alias for 'delete'.
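--
-- A usage sketch (illustrative names): remove every document whose
-- @author@ field matches, assuming a 'Connection' @con@,
-- @OverloadedStrings@ for the 'FullCollection' name, and 'toBsonDoc'
-- and 'toBson' from "Database.MongoDB.BSON":
--
-- > _ <- remove con "mydb.posts" $
-- >        toBsonDoc [("author", toBson ("spammer" :: String))]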
remove :: Connection -> FullCollection -> Selector -> IO RequestID
remove = delete

moveOidToFrontOrGen :: Connection -> BsonDoc -> IO BsonDoc
moveOidToFrontOrGen c doc =
    case List.lookup (s2L "_id") doc of
      Nothing -> do
        oid <- genObjectId $ cOidGen c
        return $ (s2L "_id", oid) : doc
      Just oid -> do
        let keyEq = (\(k1, _) (k2, _) -> k1 == k2)
            delByKey = \k -> List.deleteBy keyEq (k, undefined)
        return $ (s2L "_id", oid) : delByKey (s2L "_id") doc

-- | Insert a single document into /FullCollection/ returning the /_id/ field.
insert :: Connection -> FullCollection -> BsonDoc -> IO BsonValue
insert c col doc = do
  doc' <- moveOidToFrontOrGen c doc
  let body = runPut $ do
               putI32 0
               putCol col
               putBsonDoc doc'
  (_reqID, msg) <- packMsg c OPInsert body
  cPut c msg
  return $ snd $ head doc'

-- | Insert a list of documents into /FullCollection/ returning the
-- /_id/ field for each one in the same order as they were given.
insertMany :: Connection -> FullCollection -> [BsonDoc] -> IO [BsonValue]
insertMany c col docs = do
  docs' <- mapM (moveOidToFrontOrGen c) docs
  let body = runPut $ do
               putI32 0
               putCol col
               forM_ docs' putBsonDoc
  (_, msg) <- packMsg c OPInsert body
  cPut c msg
  return $ List.map (snd . head) docs'

-- | Open a cursor to find documents. If you need full functionality,
-- see 'query'.
find :: Connection -> FullCollection -> Selector -> IO Cursor
find c col sel = query c col [] 0 0 sel []

-- | Query, but only return the first result, if any.
findOne :: Connection -> FullCollection -> Selector -> IO (Maybe BsonDoc)
findOne c col sel = query c col [] 0 (-1) sel [] >>= nextDoc

-- | Perform a query and return the result as a lazy list. Be sure to
-- understand the comments about using the lazy list given for
-- 'allDocs'.
quickFind :: Connection -> FullCollection -> Selector -> IO [BsonDoc]
quickFind c col sel = find c col sel >>= allDocs

-- | Perform a query and return the result as a strict list.
quickFind' :: Connection -> FullCollection -> Selector -> IO [BsonDoc]
quickFind' c col sel = find c col sel >>= allDocs'

-- | Open a cursor to find documents in /FullCollection/ that match
-- /Selector/. See the documentation for each argument's type for
-- information about how it affects the query.
query :: Connection -> FullCollection -> [QueryOpt] -> NumToSkip
      -> NumToReturn -> Selector -> FieldSelector -> IO Cursor
query c col opts nskip ret sel fsel = do
  h <- getHandle c
  let body = runPut $ do
               putI32 $ fromQueryOpts opts
               putCol col
               putI32 nskip
               putI32 ret
               putBsonDoc sel
               case fsel of
                 [] -> putNothing
                 _ -> putBsonDoc $ toBsonDoc $ List.zip fsel $ repeat $ BsonInt32 1
  (reqID, msg) <- packMsg c OPQuery body
  L.hPut h msg
  hdr <- getHeader h
  assert (OPReply == hOp hdr) $ return ()
  assert (hRespTo hdr == reqID) $ return ()
  reply <- getReply h
  assert (rRespFlags reply == 0) $ return ()
  docBytes <- L.hGet h (fromIntegral $ hMsgLen hdr - 16 - 20) >>= newIORef
  closed <- newIORef False
  cid <- newIORef $ rCursorID reply
  return Cursor {
               curCon = c,
               curID = cid,
               curNumToRet = ret,
               curCol = col,
               curDocBytes = docBytes,
               curClosed = closed
             }

-- | Update documents with /BsonDoc/ in /FullCollection/ that match /Selector/.
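--
-- A usage sketch (illustrative names and values): upsert a person
-- record, assuming a 'Connection' @con@, @OverloadedStrings@, and the
-- BSON helpers from "Database.MongoDB.BSON":
--
-- > _ <- update con "mydb.people" [UFUpsert]
-- >        (toBsonDoc [("name", toBson ("alice" :: String))])
-- >        (toBsonDoc [("name", toBson ("alice" :: String)),
-- >                    ("age", BsonInt32 30)])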
update :: Connection -> FullCollection -> [UpdateFlag] -> Selector
       -> BsonDoc -> IO RequestID
update c col flags sel obj = do
  let body = runPut $ do
               putI32 0
               putCol col
               putI32 $ fromUpdateFlags flags
               putBsonDoc sel
               putBsonDoc obj
  (reqID, msg) <- packMsg c OPUpdate body
  cPut c msg
  return reqID

-- | Log into the MongoDB /Database/ attached to the /Connection/.
login :: Connection -> Database -> Username -> Password -> IO BsonDoc
login c db user pass = do
  doc <- runCommand c db (toBsonDoc [("getnonce", toBson (1 :: Int))])
  let nonce = fromBson $ fromLookup $ List.lookup (s2L "nonce") doc :: String
      digest = md5sum $ pack $ nonce ++ user ++
               md5sum (pack (user ++ ":mongo:" ++ pass))
      request = toBsonDoc [("authenticate", toBson (1 :: Int)),
                           ("user", toBson user),
                           ("nonce", toBson nonce),
                           ("key", toBson digest)]
    in runCommand c db request

auth :: Connection -> Database -> Username -> Password -> IO BsonDoc
auth = login

logout :: Connection -> Database -> IO ()
logout c db = runCommand c db (toBsonDoc [(s2L "logout", BsonInt32 1)]) >>
              return ()

-- | Create a new user in the current /Database/.
addUser :: Connection -> Database -> Username -> Password -> IO BsonDoc
addUser c db user pass = do
  let userDoc = toBsonDoc [(s2L "user", toBson user)]
      fdb = L.append db (s2L ".system.users")
  doc <- findOne c fdb userDoc
  let pwd = md5sum $ pack (user ++ ":mongo:" ++ pass)
      doc' = (s2L "pwd", toBson pwd) :
             List.deleteBy (\(k1,_) (k2,_) -> (k1 == k2))
                           (s2L user, undefined) (fromMaybe userDoc doc)
  _ <- save c fdb doc'
  return doc'

data MapReduceOpt
    = MROptQuery BsonDoc     -- ^ query filter object
    -- | MRSort ???? TODO
    | MROptLimit Int64       -- ^ number of objects to return from
                             -- collection
    | MROptOut L8.ByteString -- ^ output-collection name
    | MROptKeepTemp          -- ^ If set, the generated collection is
                             -- not treated as temporary, as it will
                             -- be by default. When /MROptOut/ is
                             -- specified, the collection is
                             -- automatically made permanent.
    | MROptFinalize JSCode   -- ^ function to apply to all the
                             -- results when finished
    | MROptScope BsonDoc     -- ^ can pass in variables that can be
                             -- accessed from map/reduce/finalize
    | MROptVerbose           -- ^ provide statistics on job execution
                             -- time

mrOptToTuple :: MapReduceOpt -> (String, BsonValue)
mrOptToTuple (MROptQuery q)    = ("query", BsonDoc q)
mrOptToTuple (MROptLimit l)    = ("limit", BsonInt64 l)
mrOptToTuple (MROptOut c)      = ("out", BsonString c)
mrOptToTuple MROptKeepTemp     = ("keeptemp", BsonBool True)
mrOptToTuple (MROptFinalize f) = ("finalize", BsonJSCode f)
mrOptToTuple (MROptScope s)    = ("scope", BsonDoc s)
mrOptToTuple MROptVerbose      = ("verbose", BsonBool True)

-- | Issue a map/reduce command and return the results metadata. If
-- all you care about is the actual map/reduce results, you might want
-- to use the 'mapReduce' command instead.
--
-- The results meta-document will look something like this:
--
-- > {"result": "tmp.mr.mapreduce_1268095152_14",
-- >  "timeMillis": 67,
-- >  "counts": {"input": 4,
-- >             "emit": 6,
-- >             "output": 3},
-- >  "ok": 1.0}
--
-- The /result/ field is the name of the collection, within the same
-- database, that contains the results of the map/reduce.
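--
-- A sketch of a tag-count job (illustrative; the collection name and
-- javascript are assumptions): with a 'Connection' @con@ and
-- @OverloadedStrings@ for the 'FullCollection', 'Database', and
-- 'JSCode' values:
--
-- > md <- runMapReduce con "mydb.posts"
-- >         "function () { this.tags.forEach(function (t) { emit(t, 1); }); }"
-- >         "function (k, vs) { var n = 0; vs.forEach(function (v) { n += v; }); return n; }"
-- >         []
-- > results <- mapReduceResults con "mydb" md >>= allDocs'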
runMapReduce :: Connection -> FullCollection
             -> JSCode -- ^ mapping javascript function
             -> JSCode -- ^ reducing javascript function
             -> [MapReduceOpt]
             -> IO BsonDoc
runMapReduce c fc m r opts = do
  let (db, col) = splitFullCol fc
      doc = [("mapreduce", toBson col),
             ("map", BsonJSCode m),
             ("reduce", BsonJSCode r)] ++ List.map mrOptToTuple opts
  runCommand c db $ toBsonDoc doc

-- | Issue a map/reduce command with associated scopes and return the
-- results metadata. If all you care about is the actual map/reduce
-- results, you might want to use the 'mapReduce' command instead.
--
-- See 'runMapReduce' for more information about the form of the
-- result metadata.
runMapReduceWScopes :: Connection -> FullCollection
                    -> JSCode -- ^ mapping javascript function
                    -> BsonDoc -- ^ Scope for mapping function
                    -> JSCode -- ^ reducing javascript function
                    -> BsonDoc -- ^ Scope for reducing function
                    -> [MapReduceOpt]
                    -> IO BsonDoc
runMapReduceWScopes c fc m ms r rs opts = do
  let (db, col) = splitFullCol fc
      doc = [("mapreduce", toBson col),
             ("map", BsonJSCodeWScope m ms),
             ("reduce", BsonJSCodeWScope r rs)] ++ List.map mrOptToTuple opts
  runCommand c db $ toBsonDoc doc

-- | Given the result metadata from a 'runMapReduce' command (or
-- 'runMapReduceWScopes'), issue the 'find' command that will produce
-- the actual map/reduce results.
mapReduceResults :: Connection -> Database -> BsonDoc -> IO Cursor
mapReduceResults c db r = do
  let col = case List.lookup (s2L "result") r of
              Just bCol -> fromBson bCol
              Nothing -> throwOpFailure "No 'result' in mapReduce response"
      fc = L.append (L.append db $ s2L ".") col
  find c fc []

-- | Run map/reduce and produce a cursor on the results.
mapReduce :: Connection -> FullCollection
          -> JSCode -- ^ mapping javascript function
          -> JSCode -- ^ reducing javascript function
          -> [MapReduceOpt]
          -> IO Cursor
mapReduce c fc m r opts =
    runMapReduce c fc m r opts >>= mapReduceResults c (fst $ splitFullCol fc)

-- | Run map/reduce with associated scopes and produce a cursor on the
-- results.
mapReduceWScopes :: Connection -> FullCollection
                 -> JSCode -- ^ mapping javascript function
                 -> BsonDoc -- ^ Scope for mapping function
                 -> JSCode -- ^ reducing javascript function
                 -> BsonDoc -- ^ Scope for reducing function
                 -> [MapReduceOpt]
                 -> IO Cursor
mapReduceWScopes c fc m ms r rs opts =
    runMapReduceWScopes c fc m ms r rs opts >>=
    mapReduceResults c (fst $ splitFullCol fc)

-- | Conveniently store the /BsonDoc/ in the /FullCollection/: if an
-- @_id@ is present in the /BsonDoc/ then it already has a place in the
-- DB, so we update it using the @_id@; otherwise we insert it.
save :: Connection -> FullCollection -> BsonDoc -> IO BsonValue
save c fc doc =
    case List.lookup (s2L "_id") doc of
      Nothing -> insert c fc doc
      Just oid -> update c fc [UFUpsert] (toBsonDoc [("_id", oid)]) doc >>
                  return oid

-- | Use this in place of the query portion of a select-type query.
-- It uses javascript and a scope supplied by a /BsonDoc/ to evaluate
-- documents in the database for retrieval.
-- -- Example: -- -- > findOne conn mycoll $ whereClause "this.name == (name1 + name2)" -- > Just (toBsonDoc [("name1", toBson "mar"), ("name2", toBson "tha")]) whereClause :: String -> Maybe BsonDoc -> BsonDoc whereClause qry Nothing = toBsonDoc [("$where", BsonJSCode (s2L qry))] whereClause qry (Just scope) = toBsonDoc [("$where", BsonJSCodeWScope (s2L qry) scope)] data Hdr = Hdr { hMsgLen :: Int32, -- hReqID :: Int32, hRespTo :: Int32, hOp :: Opcode } deriving (Show) data Reply = Reply { rRespFlags :: Int32, rCursorID :: Int64 -- rStartFrom :: Int32, -- rNumReturned :: Int32 } deriving (Show) getHeader :: Handle -> IO Hdr getHeader h = do hdrBytes <- L.hGet h 16 return $ flip runGet hdrBytes $ do msgLen <- getI32 skip 4 -- reqID <- getI32 respTo <- getI32 op <- getI32 return $ Hdr msgLen respTo $ toOpcode op getReply :: Handle -> IO Reply getReply h = do replyBytes <- L.hGet h 20 return $ flip runGet replyBytes $ do respFlags <- getI32 cursorID <- getI64 skip 4 -- startFrom <- getI32 skip 4 -- numReturned <- getI32 return $ Reply respFlags cursorID -- | Return one document or Nothing if there are no more. -- Automatically closes the cursor when last document is read nextDoc :: Cursor -> IO (Maybe BsonDoc) nextDoc cur = do closed <- readIORef $ curClosed cur if closed then return Nothing else do docBytes <- readIORef $ curDocBytes cur cid <- readIORef $ curID cur case L.length docBytes of 0 -> if cid == 0 then writeIORef (curClosed cur) True >> return Nothing else getMore cur _ -> do let (doc, docBytes') = getFirstDoc docBytes writeIORef (curDocBytes cur) docBytes' return $ Just doc -- | Return a lazy list of all (of the rest) of the documents in the -- cursor. This works much like hGetContents--it will lazily read the -- cursor data out of the database as the list is used. The cursor is -- automatically closed when the list has been fully read. -- -- If you manually finish the cursor before consuming off this list -- you won't get all the original documents in the cursor. -- -- If you don't consume to the end of the list, you must manually -- close the cursor or you will leak the cursor, which may also leak -- on the database side. allDocs :: Cursor -> IO [BsonDoc] allDocs cur = unsafeInterleaveIO $ do doc <- nextDoc cur case doc of Nothing -> return [] Just d -> liftM (d :) (allDocs cur) -- | Returns a strict list of all (of the rest) of the documents in -- the cursor. This means that all of the documents will immediately -- be read out of the database and loaded into memory. 
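--
-- A consumption sketch (illustrative names): fetch matching documents
-- strictly, assuming a 'Connection' @con@, @OverloadedStrings@, and
-- the BSON helpers from "Database.MongoDB.BSON":
--
-- > cur  <- find con "mydb.posts" $
-- >           toBsonDoc [("author", toBson ("alice" :: String))]
-- > docs <- allDocs' cur
-- > mapM_ print docs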
allDocs' :: Cursor -> IO [BsonDoc] allDocs' cur = do doc <- nextDoc cur case doc of Nothing -> return [] Just d -> liftM (d :) (allDocs' cur) getFirstDoc :: L.ByteString -> (BsonDoc, L.ByteString) getFirstDoc docBytes = flip runGet docBytes $ do doc <- getBsonDoc docBytes' <- getRemainingLazyByteString return (doc, docBytes') getMore :: Cursor -> IO (Maybe BsonDoc) getMore cur = do h <- getHandle $ curCon cur cid <- readIORef $ curID cur let body = runPut $ do putI32 0 putCol $ curCol cur putI32 $ curNumToRet cur putI64 cid (reqID, msg) <- packMsg (curCon cur) OPGetMore body L.hPut h msg hdr <- getHeader h assert (OPReply == hOp hdr) $ return () assert (hRespTo hdr == reqID) $ return () reply <- getReply h assert (rRespFlags reply == 0) $ return () case rCursorID reply of 0 -> writeIORef (curID cur) 0 ncid -> assert (ncid == cid) $ return () docBytes <- (L.hGet h $ fromIntegral $ hMsgLen hdr - 16 - 20) case L.length docBytes of 0 -> writeIORef (curClosed cur) True >> return Nothing _ -> do let (doc, docBytes') = getFirstDoc docBytes writeIORef (curDocBytes cur) docBytes' return $ Just doc -- | Manually close a cursor -- usually not needed if you use -- 'allDocs', 'allDocs'', or 'nextDoc'. finish :: Cursor -> IO () finish cur = do h <- getHandle $ curCon cur cid <- readIORef $ curID cur unless (cid == 0) $ do let body = runPut $ do putI32 0 putI32 1 putI64 cid (_reqID, msg) <- packMsg (curCon cur) OPKillCursors body L.hPut h msg writeIORef (curClosed cur) True return () -- | The field key to index on. type Key = L8.ByteString -- | Direction to index. data Direction = Ascending | Descending deriving (Show, Eq) fromDirection :: Direction -> Int fromDirection Ascending = 1 fromDirection Descending = - 1 -- | Should this index guarantee uniqueness? type Unique = Bool -- | Create a new index on /FullCollection/ on the list of /Key/ / -- /Direction/ pairs. createIndex :: Connection -> FullCollection -> [(Key, Direction)] -> Unique -> IO L8.ByteString createIndex c col keys uniq = do let (db, _col') = splitFullCol col name = indexName keys keysDoc = flip fmap keys $ \(k, d) -> (k, toBson $ fromDirection d :: BsonValue) _ <- insert c (L.append db $ s2L ".system.indexes") $ toBsonDoc [("name", toBson name), ("ns", toBson col), ("key", toBson keysDoc), ("unique", toBson uniq)] return name -- | Drop the specified index on the given /FullCollection/. dropIndex :: Connection -> FullCollection -> [(Key, Direction)] -> IO () dropIndex c col keys = do let (db, col') = splitFullCol col name = indexName keys _ <- runCommand c db $ toBsonDoc [("deleteIndexes", toBson col'), ("index", toBson name)] return () -- | Drop all indexes on /FullCollection/. dropIndexes :: Connection -> FullCollection -> IO () dropIndexes c col = do let (db, col') = splitFullCol col _ <- runCommand c db $ toBsonDoc [("deleteIndexes", toBson col'), ("index", toBson "*")] return () -- | Return a BsonDoc describing the existing indexes on /FullCollection/. -- -- With the current server versions (1.2) this will return documents -- such as: -- -- > {"key": {"lastname": -1, "firstname": 1}, -- > "name": "lastname_-1_firstname_1", -- > "ns": "mydb.people", -- > "unique": true} -- -- Which is a single key that indexes on @lastname@ (descending) and -- then @firstname@ (ascending) on the collection @people@ of the -- database @mydb@ with a uniqueness requirement. 
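--
-- A sketch (illustrative collection name): create the index described
-- above and read it back, assuming a 'Connection' @con@ and
-- @OverloadedStrings@ for the 'FullCollection' and 'Key' values:
--
-- > _    <- createIndex con "mydb.people"
-- >           [("lastname", Descending), ("firstname", Ascending)] True
-- > idxs <- indexInformation con "mydb.people"
-- > mapM_ print idxs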
indexInformation :: Connection -> FullCollection -> IO [BsonDoc]
indexInformation c col = do
  let (db, _col') = splitFullCol col
  quickFind' c (L.append db $ s2L ".system.indexes") $
             toBsonDoc [("ns", toBson col)]

indexName :: [(Key, Direction)] -> L8.ByteString
indexName = L.intercalate (s2L "_") . List.map partName
    where partName (k, Ascending)  = L.append k $ s2L "_1"
          partName (k, Descending) = L.append k $ s2L "_-1"

putCol :: Collection -> Put
putCol col = putLazyByteString col >> putNull

packMsg :: Connection -> Opcode -> L.ByteString -> IO (RequestID, L.ByteString)
packMsg c op body = do
  reqID <- randNum c
  let msg = runPut $ do
              putI32 $ fromIntegral $ L.length body + 16
              putI32 reqID
              putI32 0
              putI32 $ fromOpcode op
              putLazyByteString body
  return (reqID, msg)

randNum :: Connection -> IO Int32
randNum Connection { cRand = nsRef } = atomicModifyIORef nsRef $ \ns ->
                                       (List.tail ns,
                                        fromIntegral $ List.head ns)

s2L :: String -> L8.ByteString
s2L = L8.fromString

validateCollectionName :: FullCollection -> IO (Database, Collection)
validateCollectionName col = do
  let (db, col') = splitFullCol col
  when (s2L ".." `List.elem` L.group col) $
       throwColInvalid $ "Collection can't contain \"..\": " ++ show col
  when (c2w '$' `L.elem` col &&
        not (s2L "oplog.$main" `L.isPrefixOf` col' ||
             s2L "$cmd" `L.isPrefixOf` col')) $
       throwColInvalid $ "Collection can't contain '$': " ++ show col
  when (L.head col == c2w '.' || L.last col == c2w '.') $
       throwColInvalid $ "Collection can't start or end with '.': " ++ show col
  return (db, col')

fromLookup :: Maybe a -> a
fromLookup (Just m) = m
fromLookup Nothing  = throwColInvalid "cannot find key"
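-- A small end-to-end sketch of the API above (illustrative only): it
-- assumes a server on localhost port 27017, the @OverloadedStrings@
-- extension for the lazy ByteString collection names, and 'toBsonDoc'
-- and 'toBson' from "Database.MongoDB.BSON".
--
-- > main :: IO ()
-- > main = do
-- >   con <- connect "127.0.0.1" []
-- >   _ <- insert con "mydb.people" $
-- >          toBsonDoc [("name", toBson ("alice" :: String))]
-- >   mdoc <- findOne con "mydb.people" $
-- >             toBsonDoc [("name", toBson ("alice" :: String))]
-- >   print mdoc
-- >   disconnect con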