{- Copyright (C) 2010 Scott R Parish Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. -} module Database.MongoDB ( connect, connectOnPort, conClose, delete, insert, insertMany, query, remove, update, find, quickFind, quickFind', allDocs, allDocs', finish, nextDoc, Collection, FieldSelector, NumToSkip, NumToReturn, RequestID, Selector, Opcode(..), QueryOpt(..), UpdateFlag(..), ) where import Control.Exception import Control.Monad import Data.Binary import Data.Binary.Get import Data.Binary.Put import Data.Bits import Data.ByteString.Char8 hiding (find) import qualified Data.ByteString.Lazy as L import Data.Int import Data.IORef import qualified Data.List as List import Data.Typeable import Database.MongoDB.BSON import Database.MongoDB.Util import qualified Network import Network.Socket hiding (connect, send, sendTo, recv, recvFrom) import Prelude hiding (getContents) import System.IO import System.IO.Unsafe import System.Random data Connection = Connection { cHandle :: Handle, cRand :: IORef [Int] } connect :: HostName -> IO Connection connect = flip connectOnPort $ Network.PortNumber 27017 connectOnPort :: HostName -> Network.PortID -> IO Connection connectOnPort host port = do h <- Network.connectTo host port hSetBuffering h NoBuffering r <- newStdGen let ns = randomRs (fromIntegral (minBound :: Int32), fromIntegral (maxBound :: Int32)) r nsRef <- newIORef ns return $ Connection { cHandle = h, cRand = nsRef } conClose :: Connection -> IO () conClose = hClose . cHandle data Cursor = Cursor { curCon :: Connection, curID :: IORef Int64, curNumToRet :: Int32, curCol :: Collection, curDocBytes :: IORef L.ByteString, curClosed :: IORef Bool } data Opcode = OP_REPLY -- 1 Reply to a client request. responseTo is set | OP_MSG -- 1000 generic msg command followed by a string | OP_UPDATE -- 2001 update document | OP_INSERT -- 2002 insert new document | OP_GET_BY_OID -- 2003 is this used? | OP_QUERY -- 2004 query a collection | OP_GET_MORE -- 2005 Get more data from a query. See Cursors | OP_DELETE -- 2006 Delete documents | OP_KILL_CURSORS -- 2007 Tell database client is done with a cursor deriving (Show, Eq) data MongoDBInternalError = MongoDBInternalError String deriving (Eq, Show, Read) mongoDBInternalError :: TyCon mongoDBInternalError = mkTyCon "Database.MongoDB.MongoDBInternalError" instance Typeable MongoDBInternalError where typeOf _ = mkTyConApp mongoDBInternalError [] instance Exception MongoDBInternalError fromOpcode :: Opcode -> Int32 fromOpcode OP_REPLY = 1 fromOpcode OP_MSG = 1000 fromOpcode OP_UPDATE = 2001 fromOpcode OP_INSERT = 2002 fromOpcode OP_GET_BY_OID = 2003 fromOpcode OP_QUERY = 2004 fromOpcode OP_GET_MORE = 2005 fromOpcode OP_DELETE = 2006 fromOpcode OP_KILL_CURSORS = 2007 toOpcode :: Int32 -> Opcode toOpcode 1 = OP_REPLY toOpcode 1000 = OP_MSG toOpcode 2001 = OP_UPDATE toOpcode 2002 = OP_INSERT toOpcode 2003 = OP_GET_BY_OID toOpcode 2004 = OP_QUERY toOpcode 2005 = OP_GET_MORE toOpcode 2006 = OP_DELETE toOpcode 2007 = OP_KILL_CURSORS toOpcode n = throw $ MongoDBInternalError $ "Got unexpected Opcode: " ++ show n type Collection = String type Selector = BsonDoc type FieldSelector = BsonDoc type RequestID = Int32 type NumToSkip = Int32 type NumToReturn = Int32 data QueryOpt = QO_TailableCursor | QO_SlaveOK | QO_OpLogReplay | QO_NoCursorTimeout deriving (Show) fromQueryOpts :: [QueryOpt] -> Int32 fromQueryOpts opts = List.foldl (.|.) 0 $ fmap toVal opts where toVal QO_TailableCursor = 2 toVal QO_SlaveOK = 4 toVal QO_OpLogReplay = 8 toVal QO_NoCursorTimeout = 16 data UpdateFlag = UF_Upsert | UF_Multiupdate deriving (Show, Enum) fromUpdateFlags :: [UpdateFlag] -> Int32 fromUpdateFlags flags = List.foldl (.|.) 0 $ flip fmap flags $ (1 `shiftL`) . fromEnum delete :: Connection -> Collection -> Selector -> IO RequestID delete c col sel = do let body = runPut $ do putI32 0 putCol col putI32 0 put sel (reqID, msg) <- packMsg c OP_DELETE body L.hPut (cHandle c) msg return reqID remove :: Connection -> Collection -> Selector -> IO RequestID remove = delete insert :: Connection -> Collection -> BsonDoc -> IO RequestID insert c col doc = do let body = runPut $ do putI32 0 putCol col put doc (reqID, msg) <- packMsg c OP_INSERT body L.hPut (cHandle c) msg return reqID insertMany :: Connection -> Collection -> [BsonDoc] -> IO RequestID insertMany c col docs = do let body = runPut $ do putI32 0 putCol col forM_ docs put (reqID, msg) <- packMsg c OP_INSERT body L.hPut (cHandle c) msg return reqID {- | Open a cursor to find documents. If you need full functionality, see 'query' -} find :: Connection -> Collection -> Selector -> IO Cursor find c col sel = query c col [] 0 0 sel Nothing {- | Perform a query and return the result as a lazy list. Be sure to understand the comments about using the lazy list given for 'allDocs'. -} quickFind :: Connection -> Collection -> Selector -> IO [BsonDoc] quickFind c col sel = find c col sel >>= allDocs {- | Perform a query and return the result as a strict list. -} quickFind' :: Connection -> Collection -> Selector -> IO [BsonDoc] quickFind' c col sel = find c col sel >>= allDocs' query :: Connection -> Collection -> [QueryOpt] -> NumToSkip -> NumToReturn -> Selector -> Maybe FieldSelector -> IO Cursor query c col opts nskip ret sel fsel = do let h = cHandle c let body = runPut $ do putI32 $ fromQueryOpts opts putCol col putI32 nskip putI32 ret put sel case fsel of Nothing -> putNothing Just _ -> put fsel (reqID, msg) <- packMsg c OP_QUERY body L.hPut h msg hdr <- getHeader h assert (OP_REPLY == hOp hdr) $ return () assert (hRespTo hdr == reqID) $ return () reply <- getReply h assert (rRespFlags reply == 0) $ return () docBytes <- (L.hGet h $ fromIntegral $ hMsgLen hdr - 16 - 20) >>= newIORef closed <- newIORef False cid <- newIORef $ rCursorID reply return $ Cursor { curCon = c, curID = cid, curNumToRet = ret, curCol = col, curDocBytes = docBytes, curClosed = closed } update :: Connection -> Collection -> [UpdateFlag] -> Selector -> BsonDoc -> IO RequestID update c col flags sel obj = do let body = runPut $ do putI32 0 putCol col putI32 $ fromUpdateFlags flags put sel put obj (reqID, msg) <- packMsg c OP_UPDATE body L.hPut (cHandle c) msg return reqID data Hdr = Hdr { hMsgLen :: Int32, -- hReqID :: Int32, hRespTo :: Int32, hOp :: Opcode } deriving (Show) data Reply = Reply { rRespFlags :: Int32, rCursorID :: Int64 -- rStartFrom :: Int32, -- rNumReturned :: Int32 } deriving (Show) getHeader :: Handle -> IO Hdr getHeader h = do hdrBytes <- L.hGet h 16 return $ flip runGet hdrBytes $ do msgLen <- getI32 skip 4 -- reqID <- getI32 respTo <- getI32 op <- getI32 return $ Hdr msgLen respTo $ toOpcode op getReply :: Handle -> IO Reply getReply h = do replyBytes <- L.hGet h 20 return $ flip runGet replyBytes $ do respFlags <- getI32 cursorID <- getI64 skip 4 -- startFrom <- getI32 skip 4 -- numReturned <- getI32 return $ (Reply respFlags cursorID) {- | Return one document or Nothing if there are no more. Automatically closes the curosr when last document is read -} nextDoc :: Cursor -> IO (Maybe BsonDoc) nextDoc cur = do closed <- readIORef $ curClosed cur case closed of True -> return Nothing False -> do docBytes <- readIORef $ curDocBytes cur cid <- readIORef $ curID cur case L.length docBytes of 0 -> if cid == 0 then writeIORef (curClosed cur) True >> return Nothing else getMore cur _ -> do let (doc, docBytes') = getFirstDoc docBytes writeIORef (curDocBytes cur) docBytes' return $ Just doc {- | Return a lazy list of all (of the rest) of the documents in the cursor. This works much like hGetContents--it will lazily read the cursor data out of the database as the list is used. The cursor is automatically closed when the list has been fully read. If you manually finish the cursor before consuming off this list you won't get all the original documents in the cursor. If you don't consume to the end of the list, you must manually close the cursor or you will leak the cursor, which may also leak on the database side. -} allDocs :: Cursor -> IO [BsonDoc] allDocs cur = unsafeInterleaveIO $ do doc <- nextDoc cur case doc of Nothing -> return [] Just d -> allDocs cur >>= return . (d :) {- | Returns a strict list of all (of the rest) of the documents in the cursor. This means that all of the documents will immediately be read out of the database and loaded into memory. -} allDocs' :: Cursor -> IO [BsonDoc] allDocs' cur = do doc <- nextDoc cur case doc of Nothing -> return [] Just d -> allDocs' cur >>= return . (d :) getFirstDoc :: L.ByteString -> (BsonDoc, L.ByteString) getFirstDoc docBytes = flip runGet docBytes $ do doc <- get docBytes' <- getRemainingLazyByteString return (doc, docBytes') getMore :: Cursor -> IO (Maybe BsonDoc) getMore cur = do let h = cHandle $ curCon cur cid <- readIORef $ curID cur let body = runPut $ do putI32 0 putCol $ curCol cur putI32 $ curNumToRet cur putI64 cid (reqID, msg) <- packMsg (curCon cur) OP_GET_MORE body L.hPut h msg hdr <- getHeader h assert (OP_REPLY == hOp hdr) $ return () assert (hRespTo hdr == reqID) $ return () reply <- getReply h assert (rRespFlags reply == 0) $ return () case rCursorID reply of 0 -> writeIORef (curID cur) 0 ncid -> assert (ncid == cid) $ return () docBytes <- (L.hGet h $ fromIntegral $ hMsgLen hdr - 16 - 20) case L.length docBytes of 0 -> writeIORef (curClosed cur) True >> return Nothing _ -> do let (doc, docBytes') = getFirstDoc docBytes writeIORef (curDocBytes cur) docBytes' return $ Just doc {- Manually close a cursor -- usually not needed. -} finish :: Cursor -> IO () finish cur = do let h = cHandle $ curCon cur cid <- readIORef $ curID cur let body = runPut $ do putI32 0 putI32 1 putI64 cid (_reqID, msg) <- packMsg (curCon cur) OP_KILL_CURSORS body L.hPut h msg writeIORef (curClosed cur) True return () putCol :: Collection -> Put putCol col = putByteString (pack col) >> putNull packMsg :: Connection -> Opcode -> L.ByteString -> IO (RequestID, L.ByteString) packMsg c op body = do reqID <- randNum c let msg = runPut $ do putI32 $ fromIntegral $ L.length body + 16 putI32 reqID putI32 0 putI32 $ fromOpcode op putLazyByteString body return (reqID, msg) randNum :: Connection -> IO Int32 randNum Connection { cRand = nsRef } = atomicModifyIORef nsRef $ \ns -> (List.tail ns, fromIntegral $ List.head ns)