225 lines
6.9 KiB
Haskell
225 lines
6.9 KiB
Haskell
{-# LANGUAGE BangPatterns #-}
|
|
{-# LANGUAGE MagicHash #-}
|
|
{-# LANGUAGE OverloadedStrings #-}
|
|
{-# LANGUAGE Trustworthy #-}
|
|
-- |
-- Module : Data.ByteString.Base32
-- Copyright : (c) 2019-2023 Emily Pillmore
-- License : BSD-style
--
-- Maintainer : Emily Pillmore <emilypi@cohomolo.gy>
-- Stability : stable
-- Portability : non-portable
--
-- This module contains 'Data.ByteString.ByteString'-valued combinators for
-- implementing the RFC 4648 specification of the Base32
-- encoding format. This includes padded and unpadded decoding variants, as well as
-- internal and external validation for canonicity.
--
|
|
module Data.ByteString.Base32
|
|
( -- * Encoding
|
|
encodeBase32
|
|
, encodeBase32'
|
|
, encodeBase32Unpadded
|
|
, encodeBase32Unpadded'
|
|
-- * Decoding
|
|
, decodeBase32
|
|
, decodeBase32Unpadded
|
|
, decodeBase32Padded
|
|
-- , decodeBase32Lenient
|
|
-- * Validation
|
|
, isBase32
|
|
, isValidBase32
|
|
) where
|
|
|
|
|
|
import qualified Data.ByteString as BS
|
|
import Data.ByteString.Internal (ByteString(..))
|
|
import Data.ByteString.Base32.Internal
|
|
import Data.ByteString.Base32.Internal.Tables
|
|
import Data.Either (isRight)
|
|
import Data.Text (Text)
|
|
import qualified Data.Text.Encoding as T
|
|
|
|
import System.IO.Unsafe (unsafeDupablePerformIO)
|
|
|
|
|
|
-- | Render a 'ByteString' as padded Base32, returned as 'Text'.
--
-- The input is encoded with 'encodeBase32'' and the resulting bytes are
-- then read back as UTF-8 text.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> encodeBase32 "Sun"
-- "KN2W4==="
--
encodeBase32 :: ByteString -> Text
encodeBase32 bs = T.decodeUtf8 (encodeBase32' bs)
{-# INLINE encodeBase32 #-}
|
|
|
|
-- | Render a 'ByteString' as padded Base32, returned as a 'ByteString'.
--
-- The encoder is handed the 32-character alphabet @A-Z@ followed by @2-7@
-- as a primitive string literal.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> encodeBase32' "Sun"
-- "KN2W4==="
--
encodeBase32' :: ByteString -> ByteString
encodeBase32' bs = encodeBase32_ "ABCDEFGHIJKLMNOPQRSTUVWXYZ234567"# bs
{-# INLINE encodeBase32' #-}
|
|
|
|
-- | Decode a Base32-encoded 'ByteString' whose trailing padding may be
-- present or absent.
--
-- The empty input decodes to itself. Otherwise the input length modulo 8
-- selects the behaviour: a remainder of 0 is decoded as is; remainders of
-- 2, 4, 5 and 7 have 6, 4, 3 and 1 @=@ characters appended, respectively,
-- so the decoder always sees a multiple of 8; every other remainder is
-- rejected as an invalid size. For remainders 4, 5 and 7 the decode is
-- additionally routed through 'validateLastNPads'.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> decodeBase32 "KN2W4==="
-- Right "Sun"
--
-- >>> decodeBase32 "KN2W4"
-- Right "Sun"
--
-- >>> decodeBase32 "KN2W==="
-- Left "Base32-encoded bytestring has invalid padding"
--
decodeBase32 :: ByteString -> Either Text ByteString
decodeBase32 bs
  | BS.null bs = Right bs
  | otherwise = case BS.length bs `rem` 8 of
      0 -> unsafeDupablePerformIO $ decodeBase32_ stdDecodeTable bs
      2 -> unsafeDupablePerformIO $ decodeWithPads "======"
      4 -> validateLastNPads 2 bs $ decodeWithPads "===="
      5 -> validateLastNPads 3 bs $ decodeWithPads "==="
      7 -> validateLastNPads 5 bs $ decodeWithPads "="
      _ -> Left "Base32-encoded bytestring has invalid size"
  where
    -- Decode the input after extending it with the given run of pad bytes.
    decodeWithPads pads = decodeBase32_ stdDecodeTable (BS.append bs pads)
{-# INLINE decodeBase32 #-}
|
|
|
|
-- | Render a 'ByteString' as unpadded Base32, returned as 'Text'.
--
-- The input is encoded with 'encodeBase32Unpadded'' and the resulting bytes
-- are then read back as UTF-8 text.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> encodeBase32Unpadded "Sun"
-- "KN2W4"
--
encodeBase32Unpadded :: ByteString -> Text
encodeBase32Unpadded bs = T.decodeUtf8 (encodeBase32Unpadded' bs)
{-# INLINE encodeBase32Unpadded #-}
|
|
|
|
-- | Render a 'ByteString' as unpadded Base32, returned as a 'ByteString'.
--
-- The no-padding encoder is handed the 32-character alphabet @A-Z@ followed
-- by @2-7@ as a primitive string literal.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> encodeBase32Unpadded' "Sun"
-- "KN2W4"
--
encodeBase32Unpadded' :: ByteString -> ByteString
encodeBase32Unpadded' bs = encodeBase32NoPad_ "ABCDEFGHIJKLMNOPQRSTUVWXYZ234567"# bs
{-# INLINE encodeBase32Unpadded' #-}
|
|
|
|
-- | Decode a Base32-encoded 'ByteString' that carries no padding.
--
-- The empty input decodes to itself. Otherwise the input length modulo 8
-- selects the behaviour: remainders of 0, 4, 5 and 7 are decoded through
-- 'validateLastNPads' with a count of 1, after appending 0, 4, 3 and 1 @=@
-- characters respectively; a remainder of 2 has 6 @=@ characters appended
-- and is handed straight to the decoder; every other remainder is rejected
-- as an invalid size.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> decodeBase32Unpadded "KN2W4"
-- Right "Sun"
--
-- >>> decodeBase32Unpadded "KN2W4==="
-- Left "Base32-encoded bytestring has invalid padding"
--
decodeBase32Unpadded :: ByteString -> Either Text ByteString
decodeBase32Unpadded bs
  | BS.null bs = Right bs
  | otherwise = case BS.length bs `rem` 8 of
      0 -> checkedDecode $ decodeBase32_ stdDecodeTable bs
      2 -> unsafeDupablePerformIO $ decodeWithPads "======"
      4 -> checkedDecode $ decodeWithPads "===="
      5 -> checkedDecode $ decodeWithPads "==="
      7 -> checkedDecode $ decodeWithPads "="
      _ -> Left "Base32-encoded bytestring has invalid size"
  where
    -- Run a decode action behind the single-character padding check on the
    -- caller's original (un-extended) input.
    checkedDecode action = validateLastNPads 1 bs action

    -- Decode the input after extending it with the given run of pad bytes.
    decodeWithPads pads = decodeBase32_ stdDecodeTable (BS.append bs pads)
{-# INLINE decodeBase32Unpadded #-}
|
|
|
|
-- | Decode a Base32-encoded 'ByteString' that is required to be padded.
--
-- The empty input decodes to itself. Otherwise the input length must be a
-- multiple of 8: lengths leaving a remainder of 1, 3 or 6 are reported as
-- an invalid size, any other non-zero remainder is reported as missing
-- padding, and only a remainder of 0 reaches the decoder.
--
-- See: <https://tools.ietf.org/html/rfc4648#section-6 RFC-4648 section 6>
--
-- === __Examples__:
--
-- >>> decodeBase32Padded "KN2W4==="
-- Right "Sun"
--
-- >>> decodeBase32Padded "KN2W4"
-- Left "Base32-encoded bytestring requires padding"
--
decodeBase32Padded :: ByteString -> Either Text ByteString
decodeBase32Padded bs
  | BS.null bs = Right bs
  | otherwise = case BS.length bs `rem` 8 of
      0 -> unsafeDupablePerformIO $ decodeBase32_ stdDecodeTable bs
      leftover
        | leftover `elem` [1, 3, 6] ->
            Left "Base32-encoded bytestring has invalid size"
        | otherwise ->
            Left "Base32-encoded bytestring requires padding"
{-# INLINE decodeBase32Padded #-}
|
|
|
|
-- -- | Leniently decode an unpadded Base32-encoded 'ByteString' value. This function
-- -- will not generate parse errors. If input data contains padding chars,
-- -- then the input will be parsed up until the first pad character.
-- --
-- -- __Note:__ This is not RFC 4648-compliant.
-- --
-- decodeBase32Lenient :: ByteString -> ByteString
-- decodeBase32Lenient = decodeBase32Lenient_ decodeB32Table
-- {-# INLINE decodeBase32Lenient #-}
|
|
|
|
-- | Report whether a 'ByteString' is a Base32 encoding, padded or unpadded.
--
-- The input must first pass 'isValidBase32'; only then is it run through
-- 'decodeBase32', and the answer is whether that decode succeeded.
--
-- === __Examples__:
--
-- >>> isBase32 "KN2W4"
-- True
--
-- >>> isBase32 "KN2W4==="
-- True
--
-- >>> isBase32 "KN2W4=="
-- False
--
isBase32 :: ByteString -> Bool
isBase32 bs
  | isValidBase32 bs = isRight (decodeBase32 bs)
  | otherwise = False
{-# INLINE isBase32 #-}
|
|
|
|
-- | Report whether a 'ByteString' has the shape of a Base32 value.
--
-- This is a shape check only (alphabet, padding, size); it does not
-- establish that the value is a correct Base32 representation. Use
-- 'isBase32' to check that the value actually decodes.
--
-- The check is delegated to 'validateBase32' with the alphabet @A-Z@
-- followed by @2-7@.
--
-- === __Examples__:
--
-- >>> isValidBase32 "KN2W4"
-- True
--
-- >>> isValidBase32 "KN2W4="
-- False
--
-- >>> isValidBase32 "KN2W4%"
-- False
--
isValidBase32 :: ByteString -> Bool
isValidBase32 bs = validateBase32 "ABCDEFGHIJKLMNOPQRSTUVWXYZ234567" bs
{-# INLINE isValidBase32 #-}
|