diff options
Diffstat (limited to 'lib/stdlib')
| -rw-r--r-- | lib/stdlib/doc/src/io.xml | 95 | ||||
| -rw-r--r-- | lib/stdlib/src/erl_lint.erl | 8 | ||||
| -rw-r--r-- | lib/stdlib/src/io_lib.erl | 58 | ||||
| -rw-r--r-- | lib/stdlib/src/io_lib_format.erl | 43 | ||||
| -rw-r--r-- | lib/stdlib/test/io_SUITE.erl | 87 | 
5 files changed, 202 insertions, 89 deletions
| diff --git a/lib/stdlib/doc/src/io.xml b/lib/stdlib/doc/src/io.xml index 72c774e6ef..f1037ec76b 100644 --- a/lib/stdlib/doc/src/io.xml +++ b/lib/stdlib/doc/src/io.xml @@ -137,11 +137,11 @@  Hello world!  ok</pre>          <p>The general format of a control sequence is <c>~F.P.PadModC</c>.</p> -        <p>Character <c>C</c> determines the type of control sequence -          to be used, <c>F</c> and <c>P</c> are optional numeric -          arguments. If <c>F</c>, <c>P</c>, or <c>Pad</c> is <c>*</c>, -          the next argument in <c>Data</c> is used as the numeric value -          of <c>F</c> or <c>P</c>.</p> +        <p>The character <c>C</c> determines the type of control sequence +          to be used. It is the only required field. All of <c>F</c>, +          <c>P</c>, <c>Pad</c>, and <c>Mod</c> are optional. For example, +          to use a <c>#</c> for <c>Pad</c> but use the default values for +          <c>F</c> and <c>P</c>, you can write <c>~..#C</c>.</p>          <list type="bulleted">          <item>            <p><c>F</c> is the <c>field width</c> of the printed argument. A @@ -167,13 +167,26 @@ ok</pre>              The default padding character is <c>' '</c> (space).</p>          </item>          <item> -          <p><c>Mod</c> is the control sequence modifier. It is either a -            single character (<c>t</c>, for Unicode -            translation, and <c>l</c>, for stopping <c>p</c> and -            <c>P</c> from detecting printable characters) -            that changes the interpretation of <c>Data</c>.</p> +          <p><c>Mod</c> is the control sequence modifier. This is +            one or more characters that change the interpretation of +            <c>Data</c>. The current modifiers are <c>t</c>, for Unicode +            translation, and <c>l</c>, for stopping <c>p</c> and <c>P</c> +            from detecting printable characters.</p>          </item>        </list> +        <p>If <c>F</c>, <c>P</c>, or <c>Pad</c> is a <c>*</c> character, +        the next argument in <c>Data</c> is used as the value. +        For example:</p> +        <pre> +1> <input>io:fwrite("~*.*.0f~n",[9, 5, 3.14159265]).</input> +003.14159 +ok</pre> +        <p>To use a literal <c>*</c> character as <c>Pad</c>, it must be +          passed as an argument:</p> +        <pre> +2> <input>io:fwrite("~*.*.*f~n",[9, 5, $*, 3.14159265]).</input> +**3.14159 +ok</pre>          <p><em>Available control sequences:</em></p>          <taglist>            <tag><c>~</c></tag> @@ -277,10 +290,9 @@ ok                <c>~w</c>, but breaks terms whose printed representation                is longer than one line into many lines and indents each                line sensibly. Left-justification is not supported. -              It also tries to detect lists of -              printable characters and to output these as strings. The -              Unicode translation modifier is used for determining -              what characters are printable, for example:</p> +              It also tries to detect flat lists of +              printable characters and output these as strings. +              For example:</p>              <pre>  1> <input>T = [{attributes,[[{id,age,1.50000},{mode,explicit},</input>  <input>{typename,"INTEGER"}], [{id,cho},{mode,explicit},{typename,'Cho'}]]},</input> @@ -302,7 +314,7 @@ ok   {mode,implicit}]  ok</pre>              <p>The field width specifies the maximum line length. -              Defaults to 80. The precision specifies the initial +              It defaults to 80. The precision specifies the initial                indentation of the term. It defaults to the number of                characters printed on this line in the <em>same</em> call to                <seealso marker="#write/1"><c>write/1</c></seealso> or @@ -332,18 +344,53 @@ ok  [{a,[97]},   {b,[98]}]  ok</pre> -            <p>Binaries that look like UTF-8 encoded strings are -              output with the string syntax if the Unicode translation -              modifier is specified:</p> +            <p>The Unicode translation modifier <c>t</c> specifies how to treat +              characters outside the Latin-1 range of codepoints, in +              atoms, strings, and binaries. For example, printing an atom +              containing a character > 255:</p> +            <pre> +8> <input>io:fwrite("~p~n",[list_to_atom([1024])]).</input> +'\x{400}' +ok +9> <input>io:fwrite("~tp~n",[list_to_atom([1024])]).</input> +'Ѐ' +ok</pre> +            <p>By default, Erlang only detects lists of characters +              in the Latin-1 range as strings, but the <c>+pc unicode</c> +              flag can be used to change this (see <seealso +              marker="#printable_range/0"> +              <c>printable_range/0</c></seealso> for details). For example:</p> +            <pre> +10> <input>io:fwrite("~p~n",[[214]]).</input> +"Ö" +ok +11> <input>io:fwrite("~p~n",[[1024]]).</input> +[1024] +ok +12> <input>io:fwrite("~tp~n",[[1024]]).</input> +[1024] +ok +</pre> +            <p>but if Erlang was started with <c>+pc unicode</c>:</p>              <pre> -9> <input>io:fwrite("~p~n",[[1024]]).</input> +13> <input>io:fwrite("~p~n",[[1024]]).</input>  [1024] -10> <input>io:fwrite("~tp~n",[[1024]]).</input> -"\x{400}" -11> <input>io:fwrite("~tp~n", [<<128,128>>]).</input> +ok +14> <input>io:fwrite("~tp~n",[[1024]]).</input> +"Ѐ" +ok</pre> +            <p>Similarly, binaries that look like UTF-8 encoded strings +              are output with the binary string syntax if the <c>t</c> +              modifier is specified:</p> +            <pre> +15> <input>io:fwrite("~p~n", [<<208,128>>]).</input> +<<208,128>> +ok +16> <input>io:fwrite("~tp~n", [<<208,128>>]).</input> +<<"Ѐ"/utf8>> +ok +17> <input>io:fwrite("~tp~n", [<<128,128>>]).</input>  <<128,128>> -12> <input>io:fwrite("~tp~n", [<<208,128>>]).</input> -<<"\x{400}"/utf8>>  ok</pre>            </item>            <tag><c>W</c></tag> diff --git a/lib/stdlib/src/erl_lint.erl b/lib/stdlib/src/erl_lint.erl index 1930c462e8..9a62d21d34 100644 --- a/lib/stdlib/src/erl_lint.erl +++ b/lib/stdlib/src/erl_lint.erl @@ -3971,6 +3971,8 @@ extract_sequence(3, [$.,_|Fmt], Need) ->      extract_sequence(4, Fmt, Need);  extract_sequence(3, Fmt, Need) ->      extract_sequence(4, Fmt, Need); +extract_sequence(4, [$t, $l | Fmt], Need) -> +    extract_sequence(4, [$l, $t | Fmt], Need);  extract_sequence(4, [$t, $c | Fmt], Need) ->      extract_sequence(5, [$c|Fmt], Need);  extract_sequence(4, [$t, $s | Fmt], Need) -> @@ -3987,8 +3989,14 @@ extract_sequence(4, [$t, C | _Fmt], _Need) ->      {error,"invalid control ~t" ++ [C]};  extract_sequence(4, [$l, $p | Fmt], Need) ->      extract_sequence(5, [$p|Fmt], Need); +extract_sequence(4, [$l, $t, $p | Fmt], Need) -> +    extract_sequence(5, [$p|Fmt], Need);  extract_sequence(4, [$l, $P | Fmt], Need) ->      extract_sequence(5, [$P|Fmt], Need); +extract_sequence(4, [$l, $t, $P | Fmt], Need) -> +    extract_sequence(5, [$P|Fmt], Need); +extract_sequence(4, [$l, $t, C | _Fmt], _Need) -> +    {error,"invalid control ~lt" ++ [C]};  extract_sequence(4, [$l, C | _Fmt], _Need) ->      {error,"invalid control ~l" ++ [C]};  extract_sequence(4, Fmt, Need) -> diff --git a/lib/stdlib/src/io_lib.erl b/lib/stdlib/src/io_lib.erl index cacd9f2524..e37c13093b 100644 --- a/lib/stdlib/src/io_lib.erl +++ b/lib/stdlib/src/io_lib.erl @@ -931,7 +931,7 @@ limit_term(Term, Depth) ->  limit(_, 0) -> '...';  limit([H|T]=L, D) ->      if -	D =:= 1 -> '...'; +	D =:= 1 -> ['...'];  	true ->              case printable_list(L) of                  true -> L; @@ -944,7 +944,7 @@ limit(Term, D) when is_map(Term) ->  limit({}=T, _D) -> T;  limit(T, D) when is_tuple(T) ->      if -	D =:= 1 -> '...'; +	D =:= 1 -> {'...'};  	true ->              list_to_tuple([limit(element(1, T), D-1)|                             limit_tail(tl(tuple_to_list(T)), D-1)]) @@ -961,32 +961,29 @@ limit_tail(Other, D) ->  %% Cannot limit maps properly since there is no guarantee that  %% maps:from_list() creates a map with the same internal ordering of -%% the selected associations as in Map. +%% the selected associations as in Map. Instead of subtracting one +%% from the depth as the map associations are traversed (as is done +%% for tuples and lists), the same depth is applied to each and every +%% (returned) association.  limit_map(Map, D) -> -    limit_map(maps:iterator(Map), D, []). +    %% Keep one extra association to make sure the final ',...' is included. +    limit_map_body(maps:iterator(Map), D + 1, D, []). -limit_map(_I, 0, Acc) -> +limit_map_body(_I, 0, _D0, Acc) ->      maps:from_list(Acc); -limit_map(I, D, Acc) -> +limit_map_body(I, D, D0, Acc) ->      case maps:next(I) of          {K, V, NextI} -> -            limit_map(NextI, D-1, [{K,V} | Acc]); +            limit_map_body(NextI, D-1, D0, [limit_map_assoc(K, V, D0) | Acc]);          none ->              maps:from_list(Acc)      end. -%%     maps:from_list(limit_map_body(erts_internal:maps_to_list(Map, D), D)). +limit_map_assoc(K, V, D) -> +    %% Keep keys as are to avoid creating duplicated keys. +    {K, limit(V, D - 1)}. -%% limit_map_body(_, 0) -> [{'...', '...'}]; -%% limit_map_body([], _) -> []; -%% limit_map_body([{K,V}], D) -> [limit_map_assoc(K, V, D)]; -%% limit_map_body([{K,V}|KVs], D) -> -%%     [limit_map_assoc(K, V, D) | limit_map_body(KVs, D-1)]. - -%% limit_map_assoc(K, V, D) -> -%%     {limit(K, D-1), limit(V, D-1)}. - -limit_bitstring(B, _D) -> B. %% Keeps all printable binaries. +limit_bitstring(B, _D) -> B. % Keeps all printable binaries.  test_limit(_, 0) -> throw(limit);  test_limit([H|T]=L, D) when is_integer(D) -> @@ -1022,18 +1019,21 @@ test_limit_tuple(T, I, Sz, D) ->      test_limit(element(I, T), D-1),      test_limit_tuple(T, I+1, Sz, D-1). -test_limit_map(_Map, _D) -> ok. -%%     test_limit_map_body(erts_internal:maps_to_list(Map, D), D). +test_limit_map(Map, D) -> +    test_limit_map_body(maps:iterator(Map), D). -%% test_limit_map_body(_, 0) -> throw(limit); -%% test_limit_map_body([], _) -> ok; -%% test_limit_map_body([{K,V}], D) -> test_limit_map_assoc(K, V, D); -%% test_limit_map_body([{K,V}|KVs], D) -> -%%     test_limit_map_assoc(K, V, D), -%%     test_limit_map_body(KVs, D-1). +test_limit_map_body(_I, 0) -> throw(limit); % cannot happen +test_limit_map_body(I, D) -> +    case maps:next(I) of +        {K, V, NextI} -> +            test_limit_map_assoc(K, V, D), +            test_limit_map_body(NextI, D-1); +        none -> +            ok +    end. -%% test_limit_map_assoc(K, V, D) -> -%%     test_limit(K, D-1), -%%     test_limit(V, D-1). +test_limit_map_assoc(K, V, D) -> +    test_limit(K, D - 1), +    test_limit(V, D - 1).  test_limit_bitstring(_, _) -> ok. diff --git a/lib/stdlib/src/io_lib_format.erl b/lib/stdlib/src/io_lib_format.erl index e345810ca0..64edbf1824 100644 --- a/lib/stdlib/src/io_lib_format.erl +++ b/lib/stdlib/src/io_lib_format.erl @@ -95,7 +95,7 @@ print([]) ->      [].  print(C, F, Ad, P, Pad, Encoding, Strings) -> -    [$~] ++ print_field_width(F, Ad) ++ print_precision(P) ++ +    [$~] ++ print_field_width(F, Ad) ++ print_precision(P, Pad) ++          print_pad_char(Pad) ++ print_encoding(Encoding) ++          print_strings(Strings) ++ [C]. @@ -103,8 +103,9 @@ print_field_width(none, _Ad) -> "";  print_field_width(F, left) -> integer_to_list(-F);  print_field_width(F, right) -> integer_to_list(F). -print_precision(none) -> ""; -print_precision(P) -> [$. | integer_to_list(P)]. +print_precision(none, $\s) -> ""; +print_precision(none, _Pad) -> ".";  % pad must be second dot +print_precision(P, _Pad) -> [$. | integer_to_list(P)].  print_pad_char($\s) -> ""; % default, no need to make explicit  print_pad_char(Pad) -> [$., Pad]. @@ -126,25 +127,23 @@ collect_cseq(Fmt0, Args0) ->      {F,Ad,Fmt1,Args1} = field_width(Fmt0, Args0),      {P,Fmt2,Args2} = precision(Fmt1, Args1),      {Pad,Fmt3,Args3} = pad_char(Fmt2, Args2), -    {Encoding,Fmt4,Args4} = encoding(Fmt3, Args3), -    {Strings,Fmt5,Args5} = strings(Fmt4, Args4), -    {C,As,Fmt6,Args6} = collect_cc(Fmt5, Args5), -    FormatSpec = #{control_char => C, args => As, width => F, adjust => Ad, -                   precision => P, pad_char => Pad, encoding => Encoding, -                   strings => Strings}, -    {FormatSpec,Fmt6,Args6}. - -encoding([$t|Fmt],Args) -> -    true = hd(Fmt) =/= $l, -    {unicode,Fmt,Args}; -encoding(Fmt,Args) -> -    {latin1,Fmt,Args}. - -strings([$l|Fmt],Args) -> -    true = hd(Fmt) =/= $t, -    {false,Fmt,Args}; -strings(Fmt,Args) -> -    {true,Fmt,Args}. +    Spec0 = #{width => F, +              adjust => Ad, +              precision => P, +              pad_char => Pad, +              encoding => latin1, +              strings => true}, +    {Spec1,Fmt4} = modifiers(Fmt3, Spec0), +    {C,As,Fmt5,Args4} = collect_cc(Fmt4, Args3), +    Spec2 = Spec1#{control_char => C, args => As}, +    {Spec2,Fmt5,Args4}. + +modifiers([$t|Fmt], Spec) -> +    modifiers(Fmt, Spec#{encoding => unicode}); +modifiers([$l|Fmt], Spec) -> +    modifiers(Fmt, Spec#{strings => false}); +modifiers(Fmt, Spec) -> +    {Spec, Fmt}.  field_width([$-|Fmt0], Args0) ->      {F,Fmt,Args} = field_value(Fmt0, Args0), diff --git a/lib/stdlib/test/io_SUITE.erl b/lib/stdlib/test/io_SUITE.erl index 45363c0592..6f4e7ad7e0 100644 --- a/lib/stdlib/test/io_SUITE.erl +++ b/lib/stdlib/test/io_SUITE.erl @@ -1905,29 +1905,61 @@ otp_10836(Suite) when is_list(Suite) ->  %% OTP-10755. The 'l' modifier  otp_10755(Suite) when is_list(Suite) -> +    %% printing plain ascii characters      S = "string",      "\"string\"" = fmt("~p", [S]),      "[115,116,114,105,110,103]" = fmt("~lp", [S]),      "\"string\"" = fmt("~P", [S, 2]),      "[115|...]" = fmt("~lP", [S, 2]), -    {'EXIT',{badarg,_}} = (catch fmt("~ltp", [S])), -    {'EXIT',{badarg,_}} = (catch fmt("~tlp", [S])), -    {'EXIT',{badarg,_}} = (catch fmt("~ltP", [S])), -    {'EXIT',{badarg,_}} = (catch fmt("~tlP", [S])), +    %% printing latin1 chars, with and without modifiers +    T = {[255],list_to_atom([255]),[a,b,c]}, +    "{\"ÿ\",ÿ,[a,b,c]}" = fmt("~p", [T]), +    "{\"ÿ\",ÿ,[a,b,c]}" = fmt("~tp", [T]), +    "{[255],ÿ,[a,b,c]}" = fmt("~lp", [T]), +    "{[255],ÿ,[a,b,c]}" = fmt("~ltp", [T]), +    "{[255],ÿ,[a,b,c]}" = fmt("~tlp", [T]), +    "{\"ÿ\",ÿ,...}" = fmt("~P", [T,3]), +    "{\"ÿ\",ÿ,...}" = fmt("~tP", [T,3]), +    "{[255],ÿ,...}" = fmt("~lP", [T,3]), +    "{[255],ÿ,...}" = fmt("~ltP", [T,3]), +    "{[255],ÿ,...}" = fmt("~tlP", [T,3]), +    %% printing unicode chars, with and without modifiers +    U = {[666],list_to_atom([666]),[a,b,c]}, +    "{[666],'\\x{29A}',[a,b,c]}" = fmt("~p", [U]), +    case io:printable_range() of +        unicode -> +            "{\"ʚ\",'ʚ',[a,b,c]}" = fmt("~tp", [U]), +            "{\"ʚ\",'ʚ',...}" = fmt("~tP", [U,3]); +        latin1 -> +            "{[666],'ʚ',[a,b,c]}" = fmt("~tp", [U]), +            "{[666],'ʚ',...}" = fmt("~tP", [U,3]) +    end, +    "{[666],'\\x{29A}',[a,b,c]}" = fmt("~lp", [U]), +    "{[666],'ʚ',[a,b,c]}" = fmt("~ltp", [U]), +    "{[666],'ʚ',[a,b,c]}" = fmt("~tlp", [U]), +    "{[666],'\\x{29A}',...}" = fmt("~P", [U,3]), +    "{[666],'\\x{29A}',...}" = fmt("~lP", [U,3]), +    "{[666],'ʚ',...}" = fmt("~ltP", [U,3]), +    "{[666],'ʚ',...}" = fmt("~tlP", [U,3]), +    %% the compiler should catch uses of ~l with other than pP      Text =          "-module(l_mod).\n"          "-export([t/0]).\n"          "t() ->\n"          "    S = \"string\",\n" -        "    io:format(\"~ltp\", [S]),\n" -        "    io:format(\"~tlp\", [S]),\n" -        "    io:format(\"~ltP\", [S, 1]),\n" -        "    io:format(\"~tlP\", [S, 1]).\n", +        "    io:format(\"~lw\", [S]),\n" +        "    io:format(\"~lW\", [S, 1]),\n" +        "    io:format(\"~ltw\", [S]),\n" +        "    io:format(\"~tlw\", [S]),\n" +        "    io:format(\"~ltW\", [S, 1]),\n" +        "    io:format(\"~tlW\", [S, 1]).\n",      {ok,l_mod,[{_File,Ws}]} = compile_file("l_mod.erl", Text, Suite), -    ["format string invalid (invalid control ~lt)", -     "format string invalid (invalid control ~tl)", -     "format string invalid (invalid control ~lt)", -     "format string invalid (invalid control ~tl)"] = +    ["format string invalid (invalid control ~lw)", +     "format string invalid (invalid control ~lW)", +     "format string invalid (invalid control ~ltw)", +     "format string invalid (invalid control ~ltw)", +     "format string invalid (invalid control ~ltW)", +     "format string invalid (invalid control ~ltW)"] =          [lists:flatten(M:format_error(E)) || {_L,M,E} <- Ws],      ok. @@ -2005,6 +2037,7 @@ writes(N, F1) ->  format_string(_Config) ->      %% All but padding is tested by fmt/2. +    "xxxxxxxsss" = fmt("~10..xs", ["sss"]),      "xxxxxxsssx" = fmt("~10.4.xs", ["sss"]),      "xxxxxxsssx" = fmt("~10.4.*s", [$x, "sss"]),      ok. @@ -2384,19 +2417,36 @@ limit_term(_Config) ->      {_, 2} = limt({a,b,c,[d,e]}, 2),      {_, 2} = limt({a,b,c,[d,e]}, 3),      {_, 2} = limt({a,b,c,[d,e]}, 4), +    T0 = [1|{a,b,c}], +    {_, 2} = limt(T0, 2), +    {_, 2} = limt(T0, 3), +    {_, 2} = limt(T0, 4),      {_, 1} = limt(<<"foo">>, 18), +    {_, 2} = limt({"",[1,2]}, 3), +    {_, 2} = limt({"",{1,2}}, 3), +    true = limt_pp({"123456789012345678901234567890",{1,2}}, 3),      ok = blimt(<<"123456789012345678901234567890">>), +    true = limt_pp(<<"123456789012345678901234567890">>, 3), +    {_, 2} = limt({<<"kljlkjsl">>,[1,2,3,4]}, 4),      {_, 1} = limt(<<7:3>>, 2),      {_, 1} = limt(<<7:21>>, 2),      {_, 1} = limt([], 2),      {_, 1} = limt({}, 2), +    {_, 1} = limt({"", ""}, 4),      {_, 1} = limt(#{}, 2), -    {_, 1} = limt(#{[] => {}}, 2), +    {_, 2} = limt(#{[] => {}}, 1), +    {_, 2} = limt(#{[] => {}}, 2),      {_, 1} = limt(#{[] => {}}, 3),      T = #{[] => {},[a] => [b]}, -    {_, 1} = limt(T, 2), +    {_, 1} = limt(T, 0), +    {_, 2} = limt(T, 1), +    {_, 2} = limt(T, 2),      {_, 1} = limt(T, 3),      {_, 1} = limt(T, 4), +    T2 = #{[] => {},{} => []}, +    {_, 2} = limt(T2, 1), +    {_, 2} = limt(T2, 2), +    {_, 1} = limt(T2, 3),      ok.  blimt(Binary) -> @@ -2430,3 +2480,12 @@ limt(Term, Depth) when is_integer(Depth) ->  form(Term, Depth) ->      lists:flatten(io_lib:format("~W", [Term, Depth])). + +limt_pp(Term, Depth) when is_integer(Depth) -> +    T1 = io_lib:limit_term(Term, Depth), +    S = pp(Term, Depth), +    S1 = pp(T1, Depth), +    S1 =:= S. + +pp(Term, Depth) -> +    lists:flatten(io_lib:format("~P", [Term, Depth])). | 
