aboutsummaryrefslogblamecommitdiffstats
path: root/lib/stdlib/src/base64.erl
blob: 6ff6020e53dc773ed4df86dace15b1f9b1301178 (plain) (tree)
1
2
3
4
5


                   
                                                        
   










                                                                           









                                                                           

                                                                

                                 
 
                                                 
                                              
                                     

                                            
                                          
                                            
                                
 
                                 

                                              

                                  
                             
                                  
                            
 
                            
       








                                              


                                
                                                   
 

































                                                                          
 
                                 

                                                

                                  
                             
                                  
                            
 
                                      

                                                

                                       
                                  
                                       
                                 
 


                                                                     
 
                                                 

                                                

                                            
                                          
                                            
                                
 
                                                      

                                                

                                                 
                                               
                                                 
                                     
 








                                                                     
        
                          

      






                                                        

        








                                                         

        








                                                                 

        

































                                                                        
        
 
















                                                                   
             














                                                                          
        











































                                                                        
             








                                                                
                                                      















                                                                               
                            
                    

                                    
        
                     

      
                                
                    

                                        

        
                                    
                    

                                            

        
                                        
                    



                                                                              

        



























                                                                                     







                                          



































                                                                        
                 
      
                       
                   
                             


                                          



                                                                           
             





















                                                                                    






                                                                    
%%
%% %CopyrightBegin%
%% 
%% Copyright Ericsson AB 2007-2017. All Rights Reserved.
%% 
%% Licensed under the Apache License, Version 2.0 (the "License");
%% you may not use this file except in compliance with the License.
%% You may obtain a copy of the License at
%%
%%     http://www.apache.org/licenses/LICENSE-2.0
%%
%% Unless required by applicable law or agreed to in writing, software
%% distributed under the License is distributed on an "AS IS" BASIS,
%% WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
%% See the License for the specific language governing permissions and
%% limitations under the License.
%% 
%% %CopyrightEnd%
%%
%% Description: Implements base 64 encode and decode. See RFC4648.

-module(base64).

-export([encode/1, decode/1, mime_decode/1,
	 encode_to_string/1, decode_to_string/1, mime_decode_to_string/1]).

%% The following type is a subtype of string() for return values
%% of (some) functions of this module.
-type ascii_string() :: [1..255].
-type ascii_binary() :: binary().

-spec encode_to_string(Data) -> Base64String when
      Data :: ascii_string() | ascii_binary(),
      Base64String :: ascii_string().

encode_to_string(Bin) when is_binary(Bin) ->
    encode_to_string(binary_to_list(Bin));
encode_to_string(List) when is_list(List) ->
    encode_list_to_string(List).

-spec encode(Data) -> Base64 when
      Data :: ascii_string() | ascii_binary(),
      Base64 :: ascii_binary().

encode(Bin) when is_binary(Bin) ->
    encode_binary(Bin, <<>>);
encode(List) when is_list(List) ->
    encode_list(List, <<>>).

encode_list_to_string([]) ->
    [];
encode_list_to_string([B1]) ->
    [b64e(B1 bsr 2),
     b64e((B1 band 3) bsl 4), $=, $=];
encode_list_to_string([B1,B2]) ->
    [b64e(B1 bsr 2),
     b64e(((B1 band 3) bsl 4) bor (B2 bsr 4)),
     b64e((B2 band 15) bsl 2), $=];
encode_list_to_string([B1,B2,B3|Ls]) ->
    BB = (B1 bsl 16) bor (B2 bsl 8) bor B3,
    [b64e(BB bsr 18),
     b64e((BB bsr 12) band 63), 
     b64e((BB bsr 6) band 63),
     b64e(BB band 63) | encode_list_to_string(Ls)].

encode_binary(<<>>, A) ->
    A;
encode_binary(<<B1:8>>, A) ->
    <<A/binary,(b64e(B1 bsr 2)):8,(b64e((B1 band 3) bsl 4)):8,$=:8,$=:8>>;
encode_binary(<<B1:8, B2:8>>, A) ->
    <<A/binary,(b64e(B1 bsr 2)):8,
      (b64e(((B1 band 3) bsl 4) bor (B2 bsr 4))):8,
      (b64e((B2 band 15) bsl 2)):8, $=:8>>;
encode_binary(<<B1:8, B2:8, B3:8, Ls/bits>>, A) ->
    BB = (B1 bsl 16) bor (B2 bsl 8) bor B3,
    encode_binary(Ls,
                  <<A/binary,(b64e(BB bsr 18)):8,
                    (b64e((BB bsr 12) band 63)):8,
                    (b64e((BB bsr 6) band 63)):8,
                    (b64e(BB band 63)):8>>).

encode_list([], A) ->
    A;
encode_list([B1], A) ->
    <<A/binary,(b64e(B1 bsr 2)):8,(b64e((B1 band 3) bsl 4)):8,$=:8,$=:8>>;
encode_list([B1,B2], A) ->
    <<A/binary,(b64e(B1 bsr 2)):8,
      (b64e(((B1 band 3) bsl 4) bor (B2 bsr 4))):8,
      (b64e((B2 band 15) bsl 2)):8, $=:8>>;
encode_list([B1,B2,B3|Ls], A) ->
    BB = (B1 bsl 16) bor (B2 bsl 8) bor B3,
    encode_list(Ls,
                <<A/binary,(b64e(BB bsr 18)):8,
                  (b64e((BB bsr 12) band 63)):8,
                  (b64e((BB bsr 6) band 63)):8,
                  (b64e(BB band 63)):8>>).

%% mime_decode strips away all characters not Base64 before
%% converting, whereas decode crashes if an illegal character is found

-spec decode(Base64) -> Data when
      Base64 :: ascii_string() | ascii_binary(),
      Data :: ascii_binary().

decode(Bin) when is_binary(Bin) ->
    decode_binary(Bin, <<>>);
decode(List) when is_list(List) ->
    decode_list(List, <<>>).

-spec mime_decode(Base64) -> Data when
      Base64 :: ascii_string() | ascii_binary(),
      Data :: ascii_binary().

mime_decode(Bin) when is_binary(Bin) ->
    mime_decode_binary(Bin, <<>>);
mime_decode(List) when is_list(List) ->
    mime_decode_list(List, <<>>).

%% mime_decode_to_string strips away all characters not Base64 before
%% converting, whereas decode_to_string crashes if an illegal
%% character is found

-spec decode_to_string(Base64) -> DataString when
      Base64 :: ascii_string() | ascii_binary(),
      DataString :: ascii_string().

decode_to_string(Bin) when is_binary(Bin) ->
    decode_to_string(binary_to_list(Bin));
decode_to_string(List) when is_list(List) ->
    decode_list_to_string(List).

-spec mime_decode_to_string(Base64) -> DataString when
      Base64 :: ascii_string() | ascii_binary(),
      DataString :: ascii_string().

mime_decode_to_string(Bin) when is_binary(Bin) ->
    mime_decode_to_string(binary_to_list(Bin));
mime_decode_to_string(List) when is_list(List) ->
    mime_decode_list_to_string(List).

%% Skipping pad character if not at end of string. Also liberal about
%% excess padding and skipping of other illegal (non-base64 alphabet)
%% characters. See section 3.3 of RFC4648
mime_decode_list([0 | Cs], A) ->
    mime_decode_list(Cs, A);
mime_decode_list([C1 | Cs], A) ->
    case b64d(C1) of
        B1 when is_integer(B1) -> mime_decode_list(Cs, A, B1);
        _ -> mime_decode_list(Cs, A)  % eq is padding
    end;
mime_decode_list([], A) ->
    A.

mime_decode_list([0 | Cs], A, B1) ->
    mime_decode_list(Cs, A, B1);
mime_decode_list([C2 | Cs], A, B1) ->
    case b64d(C2) of
        B2 when is_integer(B2) ->
            mime_decode_list(Cs, A, B1, B2);
        _ -> mime_decode_list(Cs, A, B1) % eq is padding
    end.

mime_decode_list([0 | Cs], A, B1, B2) ->
    mime_decode_list(Cs, A, B1, B2);
mime_decode_list([C3 | Cs], A, B1, B2) ->
    case b64d(C3) of
        B3 when is_integer(B3) ->
            mime_decode_list(Cs, A, B1, B2, B3);
        eq=B3 ->
            mime_decode_list_after_eq(Cs, A, B1, B2, B3);
        _ -> mime_decode_list(Cs, A, B1, B2)
    end.

mime_decode_list([0 | Cs], A, B1, B2, B3) ->
    mime_decode_list(Cs, A, B1, B2, B3);
mime_decode_list([C4 | Cs], A, B1, B2, B3) ->
    case b64d(C4) of
        B4 when is_integer(B4) ->
            mime_decode_list(Cs, <<A/bits,B1:6,B2:6,B3:6,B4:6>>);
        eq ->
            mime_decode_list_after_eq(Cs, A, B1, B2, B3);
        _ -> mime_decode_list(Cs, A, B1, B2, B3)
    end.

mime_decode_list_after_eq([0 | Cs], A, B1, B2, B3) ->
    mime_decode_list_after_eq(Cs, A, B1, B2, B3);
mime_decode_list_after_eq([C | Cs], A, B1, B2, B3) ->
    case b64d(C) of
        B when is_integer(B) ->
            %% More valid data, skip the eq as invalid
            case B3 of
                eq -> mime_decode_list(Cs, A, B1, B2, B);
                _ -> mime_decode_list(Cs, <<A/bits,B1:6,B2:6,B3:6,B:6>>)
            end;
        _ -> mime_decode_list_after_eq(Cs, A, B1, B2, B3)
    end;
mime_decode_list_after_eq([], A, B1, B2, eq) ->
    <<A/binary,B1:6,(B2 bsr 4):2>>;
mime_decode_list_after_eq([], A, B1, B2, B3) ->
    <<A/binary,B1:6,B2:6,(B3 bsr 2):4>>.

mime_decode_binary(<<0:8, Cs/bits>>, A) ->
    mime_decode_binary(Cs, A);
mime_decode_binary(<<C1:8, Cs/bits>>, A) ->
    case b64d(C1) of
        B1 when is_integer(B1) -> mime_decode_binary(Cs, A, B1);
        _ -> mime_decode_binary(Cs, A)  % eq is padding
    end;
mime_decode_binary(<<>>, A) ->
    A.

mime_decode_binary(<<0:8, Cs/bits>>, A, B1) ->
    mime_decode_binary(Cs, A, B1);
mime_decode_binary(<<C2:8, Cs/bits>>, A, B1) ->
    case b64d(C2) of
        B2 when is_integer(B2) ->
            mime_decode_binary(Cs, A, B1, B2);
        _ -> mime_decode_binary(Cs, A, B1) % eq is padding
    end.

mime_decode_binary(<<0:8, Cs/bits>>, A, B1, B2) ->
    mime_decode_binary(Cs, A, B1, B2);
mime_decode_binary(<<C3:8, Cs/bits>>, A, B1, B2) ->
    case b64d(C3) of
        B3 when is_integer(B3) ->
            mime_decode_binary(Cs, A, B1, B2, B3);
        eq=B3 ->
            mime_decode_binary_after_eq(Cs, A, B1, B2, B3);
        _ -> mime_decode_binary(Cs, A, B1, B2)
    end.

mime_decode_binary(<<0:8, Cs/bits>>, A, B1, B2, B3) ->
    mime_decode_binary(Cs, A, B1, B2, B3);
mime_decode_binary(<<C4:8, Cs/bits>>, A, B1, B2, B3) ->
    case b64d(C4) of
        B4 when is_integer(B4) ->
            mime_decode_binary(Cs, <<A/bits,B1:6,B2:6,B3:6,B4:6>>);
        eq ->
            mime_decode_binary_after_eq(Cs, A, B1, B2, B3);
        _ -> mime_decode_binary(Cs, A, B1, B2, B3)
    end.

mime_decode_binary_after_eq(<<0:8, Cs/bits>>, A, B1, B2, B3) ->
    mime_decode_binary_after_eq(Cs, A, B1, B2, B3);
mime_decode_binary_after_eq(<<C:8, Cs/bits>>, A, B1, B2, B3) ->
    case b64d(C) of
        B when is_integer(B) ->
            %% More valid data, skip the eq as invalid
            case B3 of
                eq -> mime_decode_binary(Cs, A, B1, B2, B);
                _ -> mime_decode_binary(Cs, <<A/bits,B1:6,B2:6,B3:6,B:6>>)
            end;
        _ -> mime_decode_binary_after_eq(Cs, A, B1, B2, B3)
    end;
mime_decode_binary_after_eq(<<>>, A, B1, B2, eq) ->
    <<A/binary,B1:6,(B2 bsr 4):2>>;
mime_decode_binary_after_eq(<<>>, A, B1, B2, B3) ->
    <<A/binary,B1:6,B2:6,(B3 bsr 2):4>>.

mime_decode_list_to_string([0 | Cs]) ->
    mime_decode_list_to_string(Cs);
mime_decode_list_to_string([C1 | Cs]) ->
    case b64d(C1) of
        B1 when is_integer(B1) -> mime_decode_list_to_string(Cs, B1);
        _ -> mime_decode_list_to_string(Cs) % eq is padding
    end;
mime_decode_list_to_string([]) ->
    [].

mime_decode_list_to_string([0 | Cs], B1) ->
    mime_decode_list_to_string(Cs, B1);
mime_decode_list_to_string([C2 | Cs], B1) ->
    case b64d(C2) of
        B2 when is_integer(B2) ->
            mime_decode_list_to_string(Cs, B1, B2);
        _ -> mime_decode_list_to_string(Cs, B1) % eq is padding
    end.

mime_decode_list_to_string([0 | Cs], B1, B2) ->
    mime_decode_list_to_string(Cs, B1, B2);
mime_decode_list_to_string([C3 | Cs], B1, B2) ->
    case b64d(C3) of
        B3 when is_integer(B3) ->
            mime_decode_list_to_string(Cs, B1, B2, B3);
        eq=B3 -> mime_decode_list_to_string_after_eq(Cs, B1, B2, B3);
        _ -> mime_decode_list_to_string(Cs, B1, B2)
    end.

mime_decode_list_to_string([0 | Cs], B1, B2, B3) ->
    mime_decode_list_to_string(Cs, B1, B2, B3);
mime_decode_list_to_string([C4 | Cs], B1, B2, B3) ->
    case b64d(C4) of
        B4 when is_integer(B4) ->
            Bits4x6 = (B1 bsl 18) bor (B2 bsl 12) bor (B3 bsl 6) bor B4,
            Octet1 = Bits4x6 bsr 16,
            Octet2 = (Bits4x6 bsr 8) band 16#ff,
            Octet3 = Bits4x6 band 16#ff,
            [Octet1, Octet2, Octet3 | mime_decode_list_to_string(Cs)];
        eq ->
            mime_decode_list_to_string_after_eq(Cs, B1, B2, B3);
        _ -> mime_decode_list_to_string(Cs, B1, B2, B3)
    end.

mime_decode_list_to_string_after_eq([0 | Cs], B1, B2, B3) ->
    mime_decode_list_to_string_after_eq(Cs, B1, B2, B3);
mime_decode_list_to_string_after_eq([C | Cs], B1, B2, B3) ->
    case b64d(C) of
        B when is_integer(B) ->
            %% More valid data, skip the eq as invalid
            case B3 of
                eq -> mime_decode_list_to_string(Cs, B1, B2, B);
                _ ->
                    Bits4x6 = (B1 bsl 18) bor (B2 bsl 12) bor (B3 bsl 6) bor B,
                    Octet1 = Bits4x6 bsr 16,
                    Octet2 = (Bits4x6 bsr 8) band 16#ff,
                    Octet3 = Bits4x6 band 16#ff,
                    [Octet1, Octet2, Octet3 | mime_decode_list_to_string(Cs)]
            end;
        _ -> mime_decode_list_to_string_after_eq(Cs, B1, B2, B3)
    end;
mime_decode_list_to_string_after_eq([], B1, B2, eq) ->
    binary_to_list(<<B1:6,(B2 bsr 4):2>>);
mime_decode_list_to_string_after_eq([], B1, B2, B3) ->
    binary_to_list(<<B1:6,B2:6,(B3 bsr 2):4>>).

decode_list([C1 | Cs], A) ->
    case b64d(C1) of
        ws -> decode_list(Cs, A);
        B1 -> decode_list(Cs, A, B1)
    end;
decode_list([], A) ->
    A.

decode_list([C2 | Cs], A, B1) ->
    case b64d(C2) of
        ws -> decode_list(Cs, A, B1);
        B2 -> decode_list(Cs, A, B1, B2)
    end.

decode_list([C3 | Cs], A, B1, B2) ->
    case b64d(C3) of
        ws -> decode_list(Cs, A, B1, B2);
        B3 -> decode_list(Cs, A, B1, B2, B3)
    end.

decode_list([C4 | Cs], A, B1, B2, B3) ->
    case b64d(C4) of
        ws                -> decode_list(Cs, A, B1, B2, B3);
        eq when B3 =:= eq -> only_ws(Cs, <<A/binary,B1:6,(B2 bsr 4):2>>);
        eq                -> only_ws(Cs, <<A/binary,B1:6,B2:6,(B3 bsr 2):4>>);
        B4                -> decode_list(Cs, <<A/binary,B1:6,B2:6,B3:6,B4:6>>)
    end.

decode_binary(<<C1:8, Cs/bits>>, A) ->
    case b64d(C1) of
        ws -> decode_binary(Cs, A);
        B1 -> decode_binary(Cs, A, B1)
    end;
decode_binary(<<>>, A) ->
    A.

decode_binary(<<C2:8, Cs/bits>>, A, B1) ->
    case b64d(C2) of
        ws -> decode_binary(Cs, A, B1);
        B2 -> decode_binary(Cs, A, B1, B2)
    end.

decode_binary(<<C3:8, Cs/bits>>, A, B1, B2) ->
    case b64d(C3) of
        ws -> decode_binary(Cs, A, B1, B2);
        B3 -> decode_binary(Cs, A, B1, B2, B3)
    end.

decode_binary(<<C4:8, Cs/bits>>, A, B1, B2, B3) ->
    case b64d(C4) of
        ws                -> decode_binary(Cs, A, B1, B2, B3);
        eq when B3 =:= eq -> only_ws_binary(Cs, <<A/binary,B1:6,(B2 bsr 4):2>>);
        eq                -> only_ws_binary(Cs, <<A/binary,B1:6,B2:6,(B3 bsr 2):4>>);
        B4                -> decode_binary(Cs, <<A/binary,B1:6,B2:6,B3:6,B4:6>>)
    end.

only_ws_binary(<<>>, A) ->
    A;
only_ws_binary(<<C:8, Cs/bits>>, A) ->
    case b64d(C) of
        ws -> only_ws_binary(Cs, A);
        _ -> erlang:error(function_clause)
    end.

decode_list_to_string([C1 | Cs]) ->
    case b64d(C1) of
        ws -> decode_list_to_string(Cs);
        B1 -> decode_list_to_string(Cs, B1)
    end;
decode_list_to_string([]) ->
    [].

decode_list_to_string([C2 | Cs], B1) ->
    case b64d(C2) of
        ws -> decode_list_to_string(Cs, B1);
        B2 -> decode_list_to_string(Cs, B1, B2)
    end.

decode_list_to_string([C3 | Cs], B1, B2) ->
    case b64d(C3) of
        ws -> decode_list_to_string(Cs, B1, B2);
        B3 -> decode_list_to_string(Cs, B1, B2, B3)
    end.

decode_list_to_string([C4 | Cs], B1, B2, B3) ->
    case b64d(C4) of
        ws ->
            decode_list_to_string(Cs, B1, B2, B3);
        eq when B3 =:= eq ->
            only_ws(Cs, binary_to_list(<<B1:6,(B2 bsr 4):2>>));
        eq ->
            only_ws(Cs, binary_to_list(<<B1:6,B2:6,(B3 bsr 2):4>>));
        B4 ->
            Bits4x6 = (B1 bsl 18) bor (B2 bsl 12) bor (B3 bsl 6) bor B4,
            Octet1 = Bits4x6 bsr 16,
            Octet2 = (Bits4x6 bsr 8) band 16#ff,
            Octet3 = Bits4x6 band 16#ff,
            [Octet1, Octet2, Octet3 | decode_list_to_string(Cs)]
    end.

only_ws([], A) ->
    A;
only_ws([C | Cs], A) ->
    case b64d(C) of
        ws -> only_ws(Cs, A);
        _ -> erlang:error(function_clause)
    end.

%%%========================================================================
%%% Internal functions
%%%========================================================================

%% accessors 
-compile({inline, [{b64d, 1}]}).
%% One-based decode map.
b64d(X) ->
    element(X,
            {bad,bad,bad,bad,bad,bad,bad,bad,ws,ws,bad,bad,ws,bad,bad, %1-15
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad, %16-31
             ws,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,62,bad,bad,bad,63, %32-47
             52,53,54,55,56,57,58,59,60,61,bad,bad,bad,eq,bad,bad, %48-63
             bad,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,
             15,16,17,18,19,20,21,22,23,24,25,bad,bad,bad,bad,bad,
             bad,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,
             41,42,43,44,45,46,47,48,49,50,51,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,
             bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad,bad}).

-compile({inline, [{b64e, 1}]}).
b64e(X) ->
    element(X+1,
	    {$A, $B, $C, $D, $E, $F, $G, $H, $I, $J, $K, $L, $M, $N,
	     $O, $P, $Q, $R, $S, $T, $U, $V, $W, $X, $Y, $Z,
	     $a, $b, $c, $d, $e, $f, $g, $h, $i, $j, $k, $l, $m, $n,
	     $o, $p, $q, $r, $s, $t, $u, $v, $w, $x, $y, $z,
	     $0, $1, $2, $3, $4, $5, $6, $7, $8, $9, $+, $/}).