{-# LANGUAGE Safe #-} -- | -- Module : Data.Text.Encoding.Base32 -- Copyright : (c) 2019-2020 Emily Pillmore -- License : BSD-style -- -- Maintainer : Emily Pillmore <emilypi@cohomolo.gy> -- Stability : stable -- Portability : non-portable -- -- This module contains 'Data.Text.Text'-valued combinators for -- implementing the RFC 4648 specification of the Base32 -- encoding format. This includes strictly padded/unpadded decoding variants, as well as -- internal and external validation for canonicity. -- module Data.Text.Encoding.Base32 ( encodeBase32 , decodeBase32 , decodeBase32With , encodeBase32Unpadded , decodeBase32Unpadded , decodeBase32UnpaddedWith , decodeBase32Padded , decodeBase32PaddedWith -- , decodeBase32Lenient , isBase32 , isValidBase32 ) where import Data.Bifunctor (first) import Data.ByteString (ByteString) import qualified Data.ByteString.Base32 as B32 import Data.Text (Text) import qualified Data.Text.Encoding as T import Data.Text.Encoding.Base32.Error (Base32Error(..)) -- | Encode a 'Text' value in Base32 with padding. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Examples__: -- -- >>> encodeBase32 "Sun" -- "KN2W4===" -- encodeBase32 :: Text -> Text encodeBase32 = B32.encodeBase32 . T.encodeUtf8 {-# INLINE encodeBase32 #-} -- | Decode an arbitrarily padded Base32-encoded 'Text' value. If its length is not a multiple -- of 4, then padding chars will be added to fill out the input to a multiple of -- 4 for safe decoding as base32 encodings are optionally padded. -- -- /Note:/ This function makes sure that decoding is total by deferring to -- 'T.decodeLatin1'. This will always round trip for any valid Base32-encoded -- text value, but it may not round trip for bad inputs. The onus is on the -- caller to make sure inputs are valid. If unsure, defer to `decodeBase32With` -- and pass in a custom decode function. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Examples__: -- -- >>> decodeBase32 "KN2W4===" -- Right "Sun" -- -- >>> decodeBase32 "KN2W4" -- Right "Sun" -- -- >>> decodeBase32 "KN2W===" -- Left "Base32-encoded bytestring has invalid padding" -- decodeBase32 :: Text -> Either Text Text decodeBase32 = fmap T.decodeLatin1 . B32.decodeBase32 . T.encodeUtf8 {-# INLINE decodeBase32 #-} -- | Attempt to decode a 'Text' value as Base32, converting from -- 'ByteString' to 'Text' according to some encoding function. In practice, -- This is something like 'decodeUtf8'', which may produce an error. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Example__: -- -- @ -- 'decodeBase32With' 'T.decodeUtf8'' -- :: 'ByteString' -> 'Either' ('Base32Error' 'UnicodeException') 'Text' -- @ -- decodeBase32With :: (ByteString -> Either err Text) -- ^ convert a bytestring to text (e.g. 'T.decodeUtf8'') -> ByteString -- ^ Input text to decode -> Either (Base32Error err) Text decodeBase32With f t = case B32.decodeBase32 t of Left de -> Left $ DecodeError de Right a -> first ConversionError (f a) {-# INLINE decodeBase32With #-} -- | Encode a 'Text' value in Base32 without padding. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Examples__: -- -- >>> encodeBase32Unpadded "Sun" -- "KN2W4" -- encodeBase32Unpadded :: Text -> Text encodeBase32Unpadded = B32.encodeBase32Unpadded . T.encodeUtf8 {-# INLINE encodeBase32Unpadded #-} -- | Decode an unpadded Base32 encoded 'Text' value. -- -- /Note:/ This function makes sure that decoding is total by deferring to -- 'T.decodeLatin1'. This will always round trip for any valid Base32-encoded -- text value, but it may not round trip for bad inputs. The onus is on the -- caller to make sure inputs are valid. If unsure, defer to `decodeBase32WUnpaddedWith` -- and pass in a custom decode function. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Examples__: -- -- >>> decodeBase32Unpadded "KN2W4" -- Right "Sun" -- -- >>> decodeBase32Unpadded "KN2W4===" -- Left "Base32-encoded bytestring has invalid padding" -- decodeBase32Unpadded :: Text -> Either Text Text decodeBase32Unpadded = fmap T.decodeLatin1 . B32.decodeBase32Unpadded . T.encodeUtf8 {-# INLINE decodeBase32Unpadded #-} -- | Attempt to decode an unpadded 'ByteString' value as Base32, converting from -- 'ByteString' to 'Text' according to some encoding function. In practice, -- This is something like 'decodeUtf8'', which may produce an error. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Example__: -- -- @ -- 'decodeBase32UnpaddedWith' 'T.decodeUtf8'' -- :: 'ByteString' -> 'Either' ('Base32Error' 'UnicodeException') 'Text' -- @ -- decodeBase32UnpaddedWith :: (ByteString -> Either err Text) -- ^ convert a bytestring to text (e.g. 'T.decodeUtf8'') -> ByteString -- ^ Input text to decode -> Either (Base32Error err) Text decodeBase32UnpaddedWith f t = case B32.decodeBase32Unpadded t of Left de -> Left $ DecodeError de Right a -> first ConversionError (f a) {-# INLINE decodeBase32UnpaddedWith #-} -- | Decode an padded Base32 encoded 'Text' value -- -- /Note:/ This function makes sure that decoding is total by deferring to -- 'T.decodeLatin1'. This will always round trip for any valid Base32-encoded -- text value, but it may not round trip for bad inputs. The onus is on the -- caller to make sure inputs are valid. If unsure, defer to `decodeBase32PaddedWith` -- and pass in a custom decode function. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Examples__: -- -- >>> decodeBase32Padded "KN2W4===" -- Right "Sun" -- -- >>> decodeBase32Padded "KN2W4" -- Left "Base32-encoded bytestring requires padding" -- decodeBase32Padded :: Text -> Either Text Text decodeBase32Padded = fmap T.decodeLatin1 . B32.decodeBase32Padded . T.encodeUtf8 {-# INLINE decodeBase32Padded #-} -- | Attempt to decode a padded 'ByteString' value as Base32, converting from -- 'ByteString' to 'Text' according to some encoding function. In practice, -- This is something like 'decodeUtf8'', which may produce an error. -- -- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6> -- -- === __Example__: -- -- @ -- 'decodeBase32PaddedWith' 'T.decodeUtf8'' -- :: 'ByteString' -> 'Either' ('Base32Error' 'UnicodeException') 'Text' -- @ -- decodeBase32PaddedWith :: (ByteString -> Either err Text) -- ^ convert a bytestring to text (e.g. 'T.decodeUtf8'') -> ByteString -- ^ Input text to decode -> Either (Base32Error err) Text decodeBase32PaddedWith f t = case B32.decodeBase32Padded t of Left de -> Left $ DecodeError de Right a -> first ConversionError (f a) {-# INLINE decodeBase32PaddedWith #-} -- -- | Leniently decode a Base32-encoded 'Text' value. This function -- -- will not generate parse errors. If input data contains padding chars, -- -- then the input will be parsed up until the first pad character. -- -- -- -- __Note:__ This is not RFC 4648-compliant. -- -- -- decodeBase32Lenient :: Text -> Text -- decodeBase32Lenient = T.decodeUtf8 -- . B32.decodeBase32Lenient -- . T.encodeUtf8 -- {-# INLINE decodeBase32Lenient #-} -- | Tell whether a 'Text' value is Base32-encoded -- -- === __Examples__: -- -- >>> isBase32 "KN2W4" -- True -- -- >>> isBase32 "KN2W4===" -- True -- -- >>> isBase32 "KN2W4==" -- False -- isBase32 :: Text -> Bool isBase32 = B32.isBase32 . T.encodeUtf8 {-# INLINE isBase32 #-} -- | Tell whether a 'Text' value is a valid Base32 format. -- -- This will not tell you whether or not this is a correct Base32 representation, -- only that it conforms to the correct shape. To check whether it is a true -- Base32 encoded 'Text' value, use 'isBase32'. -- -- === __Examples__: -- -- >>> isValidBase32 "KN2W4" -- True -- -- >>> isValidBase32 "KN2W4=" -- False -- -- >>> isValidBase32 "KN2W4%" -- False -- isValidBase32 :: Text -> Bool isValidBase32 = B32.isValidBase32 . T.encodeUtf8 {-# INLINE isValidBase32 #-}