{- Copyright © 2007 Magnus Therning
 -
 - This file is part of dataenc.
 -
 - Dataenc is free software: you can redistribute it and/or modify it under
 - the terms of the GNU Lesser General Public License as published by the
 - Free Software Foundation, either version 3 of the License, or (at your
 - option) any later version.
 -
 - Dataenc is distributed in the hope that it will be useful, but WITHOUT
 - ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 - FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
 - License for more details.
 -
 - You should have received a copy of the GNU Lesser General Public License
 - along with dataenc.  If not, see <http://www.gnu.org/licenses/>
 -}

-- | Uuencoding module.
--
-- Uuencoding is notoriously badly specified.  This implementation is
-- compatible with the GNU Sharutils
-- (<http://www.gnu.org/software/sharutils/>).
module Codec.Binary.Uu
    ( encode
    , decode
    , decode'
    , chop
    , unchop
    ) where

import Control.Monad
import Data.Array
import Data.Bits
import Data.Maybe
import Data.Word
import qualified Data.Map as M

-- {{{1 alphabet
-- | The 64 characters of the uuencode alphabet, ordered by the 6-bit value
-- they represent.  Value 0 is written as a backquote; values 1 to 63 are the
-- consecutive characters from @\'!\'@ up to @\'_\'@.
uuAlphabet :: String
uuAlphabet = '`' : ['!' .. '_']

-- {{{1 encodeArray
-- | Lookup table from a 6-bit value (0 to 63) to its uuencode character.
encodeArray :: Array Word8 Char
encodeArray = listArray (0, 63) uuAlphabet

-- {{{1 decodeMap
-- | Inverse of 'encodeArray': maps a uuencode character to its 6-bit value.
-- It is derived from 'encodeArray' so that the two tables always agree.
decodeMap :: M.Map Char Word8
decodeMap = M.fromList [ (c, i) | (i, c) <- assocs encodeArray ]

-- {{{1 encode
-- | Translate a list of 6-bit values into their uuencode characters.
encodeSextets :: [Word8] -> String
encodeSextets = map (encodeArray !)

-- | Encode data.
--
-- Every group of three octets becomes four characters.  A trailing group of
-- one octet becomes two characters and a trailing group of two octets becomes
-- three characters; no padding is added.
encode :: [Word8] -> String
encode [] = ""
encode [o] = encodeSextets
    [ o `shiftR` 2
    , o `shiftL` 4 .&. 0x3f
    ]
encode [o1, o2] = encodeSextets
    [ o1 `shiftR` 2
    , (o1 `shiftL` 4 .|. o2 `shiftR` 4) .&. 0x3f
    , o2 `shiftL` 2 .&. 0x3f
    ]
encode (o1 : o2 : o3 : os) = encodeSextets
    [ o1 `shiftR` 2
    , (o1 `shiftL` 4 .|. o2 `shiftR` 4) .&. 0x3f
    , (o2 `shiftL` 2 .|. o3 `shiftR` 6) .&. 0x3f
    , o3 .&. 0x3f
    ] ++ encode os

-- {{{1 decode
-- | Decode data (lazy).
--
-- Each successfully decoded octet is wrapped in 'Just'.  Decoding stops at
-- the first problem (a character outside the uuencode alphabet, or a single
-- dangling character at the end) and the result is then terminated by one
-- 'Nothing'.
decode' :: String -> [Maybe Word8]
decode' = dec . map (`M.lookup` decodeMap)
  where
    -- Reassemble octets from adjacent 6-bit values.  The shifts are done in
    -- 'Word8', so bits shifted past the top are dropped.
    first a b = a `shiftL` 2 .|. b `shiftR` 4
    second b c = b `shiftL` 4 .|. c `shiftR` 2
    third c d = c `shiftL` 6 .|. d

    dec [] = []
    dec [Just a, Just b] = [Just (first a b)]
    dec [Just a, Just b, Just c] = [Just (first a b), Just (second b c)]
    dec (Just a : Just b : Just c : Just d : rest) =
        Just (first a b) : Just (second b c) : Just (third c d) : dec rest
    dec _ = [Nothing]

-- | Decode data (strict).
--
-- Returns 'Nothing' if any part of the input fails to decode.
decode :: String -> Maybe [Word8]
decode = sequence . decode'

-- {{{1 chop
-- | Chop up a string in parts.  Each string in the resulting list is
-- prepended with the length according to the uuencode \"specification\".
--
-- /Notes:/
--
-- * The number of encoded characters on each full line is
--   @(n - 1) `div` 4 * 4@.  The @-1@ comes from the need to prepend the
--   length.  Keeping it to a multiple of 4 means that strings returned from
--   'encode' can be chopped without requiring any changes.
--
-- * That number is clamped to the range 4 to 84.  Fewer than 4 characters
--   per line would make no progress through the input, and more than 84
--   characters would need a length symbol beyond the 64-character alphabet.
--
-- * The length of lines in GNU's sharutils is 61.
--
-- * A line whose encoded length is @1@ modulo 4 cannot have been produced by
--   'encode'; forcing its length character raises an error.
chop :: Int     -- ^ line length including the length character
                --   (effective range @5 <= n <= 85@; other values are clamped)
    -> String   -- ^ encoded data, as produced by 'encode'
    -> [String]
chop _ "" = []
chop n s = (lenChar : encLine) : chop n rest
  where
    encLen = max 4 (min 84 ((n - 1) `div` 4 * 4))
    (encLine, rest) = splitAt encLen s
    -- Number of octets represented by the characters on this line.
    actLen = case length encLine `divMod` 4 of
        (l, 0) -> l * 3
        (l, 2) -> l * 3 + 1
        (l, 3) -> l * 3 + 2
        _ -> error "Codec.Binary.Uu.chop: dangling character in encoded data"
    lenChar = encodeArray ! fromIntegral actLen

-- {{{1 unchop
-- | Concatenate the strings into one long string.  Each string is assumed to
-- be prepended with the length according to the uuencode specification.
--
-- Characters beyond the number indicated by the length character are
-- dropped.  Empty strings contribute nothing to the result.  A length
-- character outside the uuencode alphabet raises an error.
unchop :: [String] -> String
unchop = concatMap singleUnchop
  where
    singleUnchop [] = ""
    singleUnchop (l : cs) = take (encodedLength (octetCount l)) cs

    -- Number of octets announced by a line's length character.
    octetCount :: Char -> Int
    octetCount l = case M.lookup l decodeMap of
        Just v -> fromIntegral v
        Nothing -> error "Codec.Binary.Uu.unchop: invalid length character"

    -- Number of encoded characters needed to represent that many octets.
    encodedLength k = case k `divMod` 3 of
        (q, 0) -> q * 4
        (q, 1) -> q * 4 + 2
        (q, _) -> q * 4 + 3