module Data.Avro.Decode.Lazy.Deconflict
( deconflict
, deconflictNoResolve
) where
import Control.Applicative ((<|>))
import Data.Avro.Decode.Lazy.Convert (fromStrictValue)
import Data.Avro.Decode.Lazy.LazyValue as T
import Data.Avro.Schema as S
import qualified Data.Foldable as Foldable
import Data.HashMap.Strict (HashMap)
import qualified Data.HashMap.Strict as HashMap
import Data.List (find)
import Data.List.NonEmpty (NonEmpty (..))
import qualified Data.List.NonEmpty as NE
import qualified Data.Map as M
import Data.Semigroup ((<>))
import qualified Data.Set as Set
import Data.Text (Text)
import qualified Data.Text as Text
import qualified Data.Text.Encoding as Text
import Data.Vector (Vector)
import qualified Data.Vector as V
deconflict :: Schema
-> Schema
-> T.LazyValue Type
-> T.LazyValue Type
deconflict writerSchema readerSchema =
deconflictNoResolve (S.expandNamedTypes writerSchema) (S.expandNamedTypes readerSchema)
deconflictNoResolve :: Schema
-> Schema
-> T.LazyValue Type
-> T.LazyValue Type
deconflictNoResolve writerSchema readerSchema =
deconflictValue writerSchema readerSchema
deconflictValue :: Type -> Type -> T.LazyValue Type -> T.LazyValue Type
deconflictValue writerSchema readerSchema v
| writerSchema == readerSchema = v
| otherwise = go writerSchema readerSchema v
where
go :: Type -> Type -> T.LazyValue Type -> T.LazyValue Type
go _ _ val@(T.Error _) = val
go (S.Array aTy) (S.Array bTy) (T.Array vec) =
T.Array $ fmap (go aTy bTy) vec
go (S.Map aTy) (S.Map bTy) (T.Map mp) =
T.Map $ fmap (go aTy bTy) mp
go a@S.Enum {} b@S.Enum {} val
| name a == name b = deconflictEnum a b val
go a@S.Fixed {} b@S.Fixed {} val
| name a == name b && size a == size b = val
go a@S.Record {} b@S.Record {} val
| name a == name b = deconflictRecord a b val
go (S.Union xs) (S.Union ys) (T.Union _ tyVal val) =
withSchemaIn tyVal xs $ \sch -> deconflictReaderUnion sch ys val
go nonUnion (S.Union ys) val =
deconflictReaderUnion nonUnion ys val
go (S.Union xs) nonUnion (T.Union _ tyVal val) =
withSchemaIn tyVal xs $ \sch -> deconflictValue sch nonUnion val
go eTy dTy val =
case val of
T.Int i32 | dTy == S.Long -> T.Long (fromIntegral i32)
| dTy == S.Float -> T.Float (fromIntegral i32)
| dTy == S.Double -> T.Double (fromIntegral i32)
T.Long i64 | dTy == S.Float -> T.Float (fromIntegral i64)
| dTy == S.Double -> T.Double (fromIntegral i64)
T.Float f | dTy == S.Double -> T.Double (realToFrac f)
T.String s | dTy == S.Bytes -> T.Bytes (Text.encodeUtf8 s)
T.Bytes bs | dTy == S.String -> T.String (Text.decodeUtf8 bs)
_ -> T.Error $ "Can not resolve differing writer and reader schemas: " ++ show (eTy, dTy)
deconflictEnum :: Type -> Type -> T.LazyValue Type -> T.LazyValue Type
deconflictEnum e d val@(T.Enum _ _ _txt) = val
withSchemaIn :: (Foldable f, Functor f)
=> Schema
-> f Schema
-> (Schema -> LazyValue Schema)
-> LazyValue Schema
withSchemaIn schema schemas f =
case findType schema schemas of
Nothing -> T.Error $ "Incorrect payload: union " <> (show . Foldable.toList $ typeName <$> schemas) <> " does not contain schema " <> Text.unpack (typeName schema)
Just found -> f found
deconflictReaderUnion :: Type -> Vector Type -> T.LazyValue Type -> T.LazyValue Type
deconflictReaderUnion valueType unionTypes val =
let hdl [] = T.Error $ "No corresponding union value for " <> Text.unpack (typeName valueType)
hdl (d:rest) =
case deconflictValue valueType d val of
T.Error _ -> hdl rest
v -> T.Union unionTypes d v
in hdl (V.toList unionTypes)
deconflictRecord :: Type -> Type -> T.LazyValue Type -> T.LazyValue Type
deconflictRecord writerSchema readerSchema (T.Record ty fldVals) =
T.Record readerSchema . HashMap.fromList $ fmap (deconflictFields fldVals (fields writerSchema)) (fields readerSchema)
deconflictFields :: HashMap Text (T.LazyValue Type) -> [Field] -> Field -> (Text,T.LazyValue Type)
deconflictFields hm writerFields readerField =
let
mbWriterField = findField readerField writerFields
mbValue = HashMap.lookup (fldName readerField) hm
in case (mbWriterField, mbValue, fldDefault readerField) of
(Just w, Just x,_) -> (fldName readerField, deconflictValue (fldType w) (fldType readerField) x)
(_, Just x,_) -> (fldName readerField, x)
(_, _,Just def) -> (fldName readerField, fromStrictValue def)
(_,Nothing,Nothing) -> (fldName readerField, T.Error ("No field and no default for " ++ show (fldName readerField)))
findField :: Field -> [Field] -> Maybe Field
findField f fs =
let
byName = find (\x -> fldName x == fldName f) fs
allNames fld = Set.fromList (fldName fld : fldAliases fld)
fNames = allNames f
sameField = not . Set.null . Set.intersection fNames . allNames
byAliases = find sameField fs
in byName <|> byAliases
findType :: Foldable f => Schema -> f Schema -> Maybe Schema
findType schema =
let tn = typeName schema
in Foldable.find ((tn ==) . typeName)