1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
|
--------------------------------------------------------------------
-- |
-- Module : Codec.MIME.Decode
-- Copyright : (c) Galois, Inc. 2006..2008
-- License : BSD3
--
-- Maintainer: Don Stewart <dons@galois.com>
-- Stability : provisional
-- Portability:
--
--------------------------------------------------------------------
module Codec.MIME.Decode where
import Data.Char
import Codec.MIME.QuotedPrintable as QP
import Codec.MIME.Base64 as Base64
decodeBody :: String -> String -> String
decodeBody enc body =
case map toLower enc of
"base64" -> map (chr.fromIntegral) $ Base64.decode body
"quoted-printable" -> QP.decode body
_ -> body
-- Decoding of RFC 2047's "encoded-words' production
-- (as used in email-headers and some HTTP header cases
-- (AtomPub's Slug: header))
decodeWord :: String -> Maybe (String, String)
decodeWord str =
case str of
'=':'?':xs ->
case dropLang $ break (\ch -> ch =='?' || ch == '*') xs of
(cs,_:x:'?':bs)
| isKnownCharset (map toLower cs) ->
case toLower x of
'q' -> decodeQ cs (break (=='?') bs)
'b' -> decodeB cs (break (=='?') bs)
_ -> Nothing
_ -> Nothing
_ -> Nothing
where
isKnownCharset cs = cs `elem` ["iso-8859-1", "us-ascii"]
-- ignore RFC 2231 extension of permitting a language tag to be supplied
-- after the charset.
dropLang (as,'*':bs) = (as,dropWhile (/='?') bs)
dropLang (as,bs) = (as,bs)
decodeQ cset (fs,'?':'=':rs) = Just (fromCharset cset (QP.decode fs),rs)
decodeQ _ _ = Nothing
decodeB cset (fs,'?':'=':rs) =
Just (fromCharset cset (Base64.decodeToString fs),rs)
decodeB _ _ = Nothing
fromCharset _cset cs = cs
decodeWords :: String -> String
decodeWords "" = ""
decodeWords (x:xs)
| isSpace x = x : decodeWords xs
| otherwise =
case decodeWord (x:xs) of
Nothing -> x : decodeWords xs
Just (as,bs) -> as ++ decodeWords bs
|