{-# LANGUAGE AllowAmbiguousTypes #-}
{-# LANGUAGE GeneralizedNewtypeDeriving #-}
{-# LANGUAGE LambdaCase #-}
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE RecordWildCards #-}
{-# LANGUAGE ScopedTypeVariables #-}
{-# LANGUAGE TypeApplications #-}
{-# LANGUAGE ViewPatterns #-}
{-# LANGUAGE DerivingStrategies #-}
{-# LANGUAGE BangPatterns #-}
{-# LANGUAGE TypeFamilies #-}
{-# LANGUAGE InstanceSigs #-}
{-# OPTIONS_HADDOCK not-home #-}
module FlatBuffers.Internal.Read where
import Control.Monad ( (>=>), join )
import Data.Binary.Get ( Get )
import qualified Data.Binary.Get as G
import qualified Data.ByteString as BS
import Data.ByteString.Lazy ( ByteString )
import qualified Data.ByteString.Lazy as BSL
import qualified Data.ByteString.Lazy.Internal as BSL
import qualified Data.ByteString.Unsafe as BSU
import Data.Coerce ( coerce )
import Data.Functor ( (<&>) )
import Data.Int
import qualified Data.List as L
import Data.Text ( Text )
import qualified Data.Text.Encoding as T
import qualified Data.Text.Encoding.Error as T
import Data.Word
import FlatBuffers.Internal.Constants
import FlatBuffers.Internal.FileIdentifier ( FileIdentifier(..), HasFileIdentifier(..) )
import FlatBuffers.Internal.Types
import FlatBuffers.Internal.Util ( Positive, positive )
import Prelude hiding ( length )
type ReadError = String
newtype TableIndex = TableIndex { unTableIndex :: Word16 }
deriving newtype (Show, Num)
newtype VOffset = VOffset { unVOffset :: Word16 }
deriving newtype (Show, Num, Real, Ord, Enum, Integral, Eq)
newtype OffsetFromRoot = OffsetFromRoot Int32
deriving newtype (Show, Num, Real, Ord, Enum, Integral, Eq)
data Table a = Table
{ vtable :: !Position
, tablePos :: !PositionInfo
}
newtype Struct a = Struct
{ structPos :: Position
}
data Union a
= Union !a
| UnionNone
| UnionUnknown !Word8
type Position = ByteString
data PositionInfo = PositionInfo
{ posRoot :: !Position
, posCurrent :: !Position
, posOffsetFromRoot :: !OffsetFromRoot
}
class HasPosition a where
getPosition :: a -> Position
move :: Integral i => a -> i -> a
instance HasPosition ByteString where
getPosition = id
move bs offset = BSL.drop (fromIntegral @_ @Int64 offset) bs
instance HasPosition PositionInfo where
getPosition = posCurrent
move PositionInfo{..} offset =
PositionInfo
{ posRoot = posRoot
, posCurrent = move posCurrent offset
, posOffsetFromRoot = posOffsetFromRoot + OffsetFromRoot (fromIntegral @_ @Int32 offset)
}
decode :: ByteString -> Either ReadError (Table a)
decode root = readTable initialPos
where
initialPos = PositionInfo root root 0
checkFileIdentifier :: forall a. HasFileIdentifier a => ByteString -> Bool
checkFileIdentifier = checkFileIdentifier' (getFileIdentifier @a)
checkFileIdentifier' :: FileIdentifier -> ByteString -> Bool
checkFileIdentifier' (unFileIdentifier -> fileIdent) bs =
actualFileIdent == BSL.fromStrict fileIdent
where
actualFileIdent =
BSL.take fileIdentifierSize .
BSL.drop uoffsetSize $
bs
{-# INLINE moveToElem #-}
moveToElem :: HasPosition pos => pos -> Int32 -> Int32 -> pos
moveToElem pos elemSize ix =
let elemOffset = int32Size + (ix * elemSize)
in move pos elemOffset
{-# INLINE checkIndexBounds #-}
checkIndexBounds :: Int32 -> Int32 -> Int32
checkIndexBounds ix length
| ix < 0 = error ("FlatBuffers.Internal.Read.index: negative index: " <> show ix)
| ix >= length = error ("FlatBuffers.Internal.Read.index: index too large: " <> show ix)
| otherwise = ix
{-# INLINE inlineVectorToList #-}
inlineVectorToList :: HasPosition pos => Get a -> pos -> Either ReadError [a]
inlineVectorToList get (getPosition -> pos) =
flip runGet pos $ do
len <- G.getInt32le
sequence $ L.replicate (fromIntegral @Int32 @Int len) get
class VectorElement a where
data Vector a
length :: Vector a -> Either ReadError Int32
index :: Vector a -> Int32 -> Either ReadError a
index vec ix = unsafeIndex vec . checkIndexBounds ix =<< length vec
unsafeIndex :: Vector a -> Int32 -> Either ReadError a
toList :: Vector a -> Either ReadError [a]
instance VectorElement Word8 where
newtype Vector Word8 = VectorWord8 Position
deriving newtype HasPosition
length = readInt32
index vec ix = byteStringSafeIndex (coerce vec) . (+ int32Size) . checkIndexBounds ix =<< length vec
unsafeIndex vec ix = byteStringSafeIndex (coerce vec) (int32Size + ix)
toList vec =
length vec <&> \len ->
BSL.unpack $
BSL.take (fromIntegral @Int32 @Int64 len) $
BSL.drop int32Size
(coerce vec)
instance VectorElement Word16 where
newtype Vector Word16 = VectorWord16 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readWord16 . moveToElem vec word16Size
toList = inlineVectorToList G.getWord16le
instance VectorElement Word32 where
newtype Vector Word32 = VectorWord32 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readWord32 . moveToElem vec word32Size
toList = inlineVectorToList G.getWord32le
instance VectorElement Word64 where
newtype Vector Word64 = VectorWord64 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readWord64 . moveToElem vec word64Size
toList = inlineVectorToList G.getWord64le
instance VectorElement Int8 where
newtype Vector Int8 = VectorInt8 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readInt8 . moveToElem vec int8Size
toList = inlineVectorToList G.getInt8
instance VectorElement Int16 where
newtype Vector Int16 = VectorInt16 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readInt16 . moveToElem vec int16Size
toList = inlineVectorToList G.getInt16le
instance VectorElement Int32 where
newtype Vector Int32 = VectorInt32 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readInt32 . moveToElem vec int32Size
toList = inlineVectorToList G.getInt32le
instance VectorElement Int64 where
newtype Vector Int64 = VectorInt64 Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readInt64 . moveToElem vec int64Size
toList = inlineVectorToList G.getInt64le
instance VectorElement Float where
newtype Vector Float = VectorFloat Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readFloat . moveToElem vec floatSize
toList = inlineVectorToList G.getFloatle
instance VectorElement Double where
newtype Vector Double = VectorDouble Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readDouble . moveToElem vec doubleSize
toList = inlineVectorToList G.getDoublele
instance VectorElement Bool where
newtype Vector Bool = VectorBool Position
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readBool . moveToElem vec boolSize
toList (VectorBool pos) = fmap word8ToBool <$> toList (VectorWord8 pos)
instance VectorElement Text where
newtype Vector Text = VectorText Position
length (VectorText pos) = readInt32 pos
unsafeIndex (VectorText pos) = readText . moveToElem pos textRefSize
toList :: Vector Text -> Either ReadError [Text]
toList (VectorText pos) = do
offsets <- toList (VectorInt32 pos)
L.reverse <$> go offsets 0 []
where
go :: [Int32] -> Int32 -> [Text] -> Either ReadError [Text]
go [] _ acc = Right acc
go (offset : xs) ix acc = do
let textPos = move pos (offset + (ix * 4) + 4)
text <- join $ runGet readText' textPos
go xs (ix + 1) (text : acc)
instance VectorElement (Struct a) where
data Vector (Struct a) = VectorStruct
{ vectorStructStructSize :: !InlineSize
, vectorStructPos :: !Position
}
length = readInt32 . vectorStructPos
unsafeIndex (VectorStruct structSize pos) =
let elemSize = fromIntegral @InlineSize @Int32 structSize
in Right . readStruct . moveToElem pos elemSize
toList vec@(VectorStruct structSize pos) =
length vec <&> \len ->
go len (move pos (int32Size :: Int64))
where
go :: Int32 -> Position -> [Struct a]
go 0 _ = []
go !len pos =
let head = readStruct pos
tail = go (len - 1) (move pos structSize)
in head : tail
instance VectorElement (Table a) where
newtype Vector (Table a) = VectorTable PositionInfo
deriving newtype HasPosition
length = readInt32
unsafeIndex vec = readTable . coerce . moveToElem vec tableRefSize
toList (VectorTable vectorPos) = do
offsets <- toList (VectorInt32 (posCurrent vectorPos))
go offsets 0
where
go :: [Int32] -> Int32 -> Either ReadError [Table a]
go [] _ = Right []
go (offset : offsets) !ix = do
let tablePos = move vectorPos (offset + (ix * 4) + 4)
table <- readTable' tablePos
tables <- go offsets (ix + 1)
pure (table : tables)
instance VectorElement (Union a) where
data Vector (Union a) = VectorUnion
{ vectorUnionTypesPos :: !(Vector Word8)
, vectorUnionValuesPos :: !PositionInfo
, vectorUnionReadElem :: !(Positive Word8 -> PositionInfo -> Either ReadError (Union a))
}
length = length . vectorUnionTypesPos
unsafeIndex (VectorUnion typesPos valuesPos readElem) ix = do
unionType <- unsafeIndex typesPos ix
case positive unionType of
Nothing -> Right UnionNone
Just unionType' -> do
tablePos <- readUOffsetAndSkip $ moveToElem valuesPos tableRefSize ix
readElem unionType' tablePos
toList (VectorUnion typesPos valuesPos readElem) = do
unionTypes <- toList typesPos
offsets <- toList (VectorInt32 (posCurrent valuesPos))
go unionTypes offsets 0
where
go :: [Word8] -> [Int32] -> Int32 -> Either ReadError [Union a]
go [] [] _ = Right []
go (unionType : unionTypes) (offset : offsets) !ix = do
union <-
case positive unionType of
Nothing -> Right UnionNone
Just unionType' ->
let tablePos = move valuesPos (offset + (ix * 4) + 4)
in readElem unionType' tablePos
unions <- go unionTypes offsets (ix + 1)
pure (union : unions)
go _ _ _ = Left "Union vector: 'type vector' and 'value vector' do not have the same length."
{-# INLINE readStructField #-}
readStructField :: (Position -> a) -> VOffset -> Struct s -> a
readStructField read voffset (Struct bs) =
read (move bs voffset)
{-# INLINE readTableFieldOpt #-}
readTableFieldOpt :: (PositionInfo -> Either ReadError a) -> TableIndex -> Table t -> Either ReadError (Maybe a)
readTableFieldOpt read ix t = do
mbOffset <- tableIndexToVOffset t ix
traverse (\offset -> read (move (tablePos t) offset)) mbOffset
{-# INLINE readTableFieldReq #-}
readTableFieldReq :: (PositionInfo -> Either ReadError a) -> TableIndex -> String -> Table t -> Either ReadError a
readTableFieldReq read ix name t = do
mbOffset <- tableIndexToVOffset t ix
case mbOffset of
Nothing -> missingField name
Just offset -> read (move (tablePos t) offset)
{-# INLINE readTableFieldWithDef #-}
readTableFieldWithDef :: (PositionInfo -> Either ReadError a) -> TableIndex -> a -> Table t -> Either ReadError a
readTableFieldWithDef read ix dflt t =
tableIndexToVOffset t ix >>= \case
Nothing -> Right dflt
Just offset -> read (move (tablePos t) offset)
{-# INLINE readTableFieldUnion #-}
readTableFieldUnion :: (Positive Word8 -> PositionInfo -> Either ReadError (Union a)) -> TableIndex -> Table t -> Either ReadError (Union a)
readTableFieldUnion read ix t =
readTableFieldWithDef readWord8 (ix - 1) 0 t >>= \unionType ->
case positive unionType of
Nothing -> Right UnionNone
Just unionType' ->
tableIndexToVOffset t ix >>= \case
Nothing -> Left "Union: 'union type' found but 'union value' is missing."
Just offset -> readUOffsetAndSkip (move (tablePos t) offset) >>= read unionType'
readTableFieldUnionVectorOpt ::
(Positive Word8 -> PositionInfo -> Either ReadError (Union a))
-> TableIndex
-> Table t
-> Either ReadError (Maybe (Vector (Union a)))
readTableFieldUnionVectorOpt read ix t =
tableIndexToVOffset t (ix - 1) >>= \case
Nothing -> Right Nothing
Just typesOffset ->
tableIndexToVOffset t ix >>= \case
Nothing -> Left "Union vector: 'type vector' found but 'value vector' is missing."
Just valuesOffset ->
Just <$> readUnionVector read (move (tablePos t) typesOffset) (move (tablePos t) valuesOffset)
readTableFieldUnionVectorReq ::
(Positive Word8 -> PositionInfo -> Either ReadError (Union a))
-> TableIndex
-> String
-> Table t
-> Either ReadError (Vector (Union a))
readTableFieldUnionVectorReq read ix name t =
tableIndexToVOffset t (ix - 1) >>= \case
Nothing -> missingField name
Just typesOffset ->
tableIndexToVOffset t ix >>= \case
Nothing -> Left "Union vector: 'type vector' found but 'value vector' is missing."
Just valuesOffset ->
readUnionVector read (move (tablePos t) typesOffset) (move (tablePos t) valuesOffset)
{-# INLINE readInt8 #-}
readInt8 :: HasPosition a => a -> Either ReadError Int8
readInt8 (getPosition -> pos) = runGet G.getInt8 pos
{-# INLINE readInt16 #-}
readInt16 :: HasPosition a => a -> Either ReadError Int16
readInt16 (getPosition -> pos) = runGet G.getInt16le pos
{-# INLINE readInt32 #-}
readInt32 :: HasPosition a => a -> Either ReadError Int32
readInt32 (getPosition -> pos) = runGet G.getInt32le pos
{-# INLINE readInt64 #-}
readInt64 :: HasPosition a => a -> Either ReadError Int64
readInt64 (getPosition -> pos) = runGet G.getInt64le pos
{-# INLINE readWord8 #-}
readWord8 :: HasPosition a => a -> Either ReadError Word8
readWord8 (getPosition -> pos) = runGet G.getWord8 pos
{-# INLINE readWord16 #-}
readWord16 :: HasPosition a => a -> Either ReadError Word16
readWord16 (getPosition -> pos) = runGet G.getWord16le pos
{-# INLINE readWord32 #-}
readWord32 :: HasPosition a => a -> Either ReadError Word32
readWord32 (getPosition -> pos) = runGet G.getWord32le pos
{-# INLINE readWord64 #-}
readWord64 :: HasPosition a => a -> Either ReadError Word64
readWord64 (getPosition -> pos) = runGet G.getWord64le pos
{-# INLINE readFloat #-}
readFloat :: HasPosition a => a -> Either ReadError Float
readFloat (getPosition -> pos) = runGet G.getFloatle pos
{-# INLINE readDouble #-}
readDouble :: HasPosition a => a -> Either ReadError Double
readDouble (getPosition -> pos) = runGet G.getDoublele pos
{-# INLINE readBool #-}
readBool :: HasPosition a => a -> Either ReadError Bool
readBool p = word8ToBool <$> readWord8 p
{-# INLINE word8ToBool #-}
word8ToBool :: Word8 -> Bool
word8ToBool 0 = False
word8ToBool _ = True
readPrimVector ::
(Position -> Vector a)
-> PositionInfo
-> Either ReadError (Vector a)
readPrimVector vecConstructor (posCurrent -> pos) =
vecConstructor <$> readUOffsetAndSkip pos
readTableVector :: PositionInfo -> Either ReadError (Vector (Table a))
readTableVector pos =
VectorTable <$> readUOffsetAndSkip pos
readStructVector :: forall a. IsStruct a => PositionInfo -> Either ReadError (Vector (Struct a))
readStructVector (posCurrent -> pos) =
VectorStruct (structSizeOf @a) <$> readUOffsetAndSkip pos
readUnionVector ::
(Positive Word8 -> PositionInfo -> Either ReadError (Union a))
-> PositionInfo
-> PositionInfo
-> Either ReadError (Vector (Union a))
readUnionVector readUnion typesPos valuesPos =
do
typesVec <- readPrimVector VectorWord8 typesPos
valuesVec <- readUOffsetAndSkip valuesPos
Right $! VectorUnion
typesVec
valuesVec
readUnion
{-# INLINE readText #-}
readText :: HasPosition a => a -> Either ReadError Text
readText (getPosition -> pos) =
join $ flip runGet pos $ do
uoffset <- G.getInt32le
G.skip (fromIntegral @Int32 @Int (uoffset - uoffsetSize))
readText'
{-# INLINE readText' #-}
readText' :: Get (Either ReadError Text)
readText' = do
strLength <- G.getInt32le
bs <- G.getByteString $ fromIntegral @Int32 @Int strLength
pure $! case T.decodeUtf8' bs of
Right t -> Right t
Left (T.DecodeError msg byteMaybe) ->
case byteMaybe of
Just byte -> Left $ "UTF8 decoding error (byte " <> show byte <> "): " <> msg
Nothing -> Left $ "UTF8 decoding error: " <> msg
Left _ -> error "the impossible happened"
{-# INLINE readTable #-}
readTable :: PositionInfo -> Either ReadError (Table t)
readTable = readUOffsetAndSkip >=> readTable'
{-# INLINE readTable' #-}
readTable' :: PositionInfo -> Either ReadError (Table t)
readTable' tablePos =
readInt32 tablePos <&> \soffset ->
let vtableOffsetFromRoot = coerce (posOffsetFromRoot tablePos) - soffset
vtable = move (posRoot tablePos) vtableOffsetFromRoot
in Table vtable tablePos
{-# INLINE readStruct #-}
readStruct :: HasPosition a => a -> Struct s
readStruct = Struct . getPosition
{-# INLINE tableIndexToVOffset #-}
tableIndexToVOffset :: Table t -> TableIndex -> Either ReadError (Maybe VOffset)
tableIndexToVOffset Table{..} ix =
flip runGet vtable $ do
vtableSize <- G.getWord16le
let vtableIndex = 4 + (unTableIndex ix * 2)
if vtableIndex >= vtableSize
then pure Nothing
else do
G.skip (fromIntegral @Word16 @Int vtableIndex - 2)
G.getWord16le <&> \case
0 -> Nothing
word16 -> Just (VOffset word16)
{-# INLINE readUOffsetAndSkip #-}
readUOffsetAndSkip :: HasPosition pos => pos -> Either ReadError pos
readUOffsetAndSkip pos =
move pos <$> readInt32 pos
{-# INLINE runGet #-}
runGet :: Get a -> ByteString -> Either ReadError a
runGet get bs =
case G.runGetOrFail get bs of
Right (_, _, a) -> Right a
Left (_, _, msg) -> Left msg
{-# NOINLINE missingField #-}
missingField :: String -> Either ReadError a
missingField fieldName =
Left $ "Missing required table field: " <> fieldName
{-# INLINE byteStringSafeIndex #-}
byteStringSafeIndex :: ByteString -> Int32 -> Either ReadError Word8
byteStringSafeIndex !cs0 !i =
index' cs0 i
where index' BSL.Empty _ = Left "not enough bytes"
index' (BSL.Chunk c cs) n
| fromIntegral @Int32 @Int n >= BS.length c =
index' cs (n - fromIntegral @Int @Int32 (BS.length c))
| otherwise = Right $! BSU.unsafeIndex c (fromIntegral @Int32 @Int n)