aboutsummaryrefslogtreecommitdiffstats
path: root/lib/stdlib
diff options
context:
space:
mode:
authorPéter Dimitrov <[email protected]>2017-10-31 13:24:13 +0100
committerPéter Dimitrov <[email protected]>2017-10-31 15:05:17 +0100
commita4c3f8d3b270b9c21caabcd084bf55049b5bc700 (patch)
tree614c1f1d5fc63b4df252d3153ba7243a68a7fe04 /lib/stdlib
parent7a4d4e183ae5567d6242184b8268918904c872c6 (diff)
downloadotp-a4c3f8d3b270b9c21caabcd084bf55049b5bc700.tar.gz
otp-a4c3f8d3b270b9c21caabcd084bf55049b5bc700.tar.bz2
otp-a4c3f8d3b270b9c21caabcd084bf55049b5bc700.zip
stdlib: Fix case normalization (normalize/1)
Diffstat (limited to 'lib/stdlib')
-rw-r--r--lib/stdlib/src/uri_string.erl35
1 files changed, 31 insertions, 4 deletions
diff --git a/lib/stdlib/src/uri_string.erl b/lib/stdlib/src/uri_string.erl
index 2c73e38324..b8e0432fd6 100644
--- a/lib/stdlib/src/uri_string.erl
+++ b/lib/stdlib/src/uri_string.erl
@@ -296,12 +296,14 @@
URIString :: uri_string(),
NormalizedURI :: uri_string().
normalize(URIString) ->
- %% Case normalization and percent-encoding normalization are achieved
- %% by running parse and recompose on the input URI string.
+ %% Percent-encoding normalization and case normalization for
+ %% percent-encoded triplets are achieved by running parse and
+ %% recompose on the input URI string.
recompose(
normalize_path_segment(
normalize_scheme_based(
- parse(URIString)))).
+ normalize_case(
+ parse(URIString))))).
%%-------------------------------------------------------------------------
@@ -1894,7 +1896,32 @@ form_urldecode(<<H,_/binary>>, _Acc) ->
%% Helper functions for normalize
%%-------------------------------------------------------------------------
-%% RFC 3986
+%% 6.2.2.1. Case Normalization
+normalize_case(#{scheme := Scheme, host := Host} = Map) ->
+ Map#{scheme => to_lower(Scheme),
+ host => to_lower(Host)};
+normalize_case(#{host := Host} = Map) ->
+ Map#{host => to_lower(Host)};
+normalize_case(#{scheme := Scheme} = Map) ->
+ Map#{scheme => to_lower(Scheme)};
+normalize_case(#{} = Map) ->
+ Map.
+
+
+to_lower(Cs) when is_list(Cs) ->
+ B = convert_binary(Cs, utf8, utf8),
+ convert_list(to_lower(B), utf8);
+to_lower(Cs) when is_binary(Cs) ->
+ to_lower(Cs, <<>>).
+%%
+to_lower(<<C,Cs/binary>>, Acc) when $A =< C, C =< $Z ->
+ to_lower(Cs, <<Acc/binary,(C + 32)>>);
+to_lower(<<C,Cs/binary>>, Acc) ->
+ to_lower(Cs, <<Acc/binary,C>>);
+to_lower(<<>>, Acc) ->
+ Acc.
+
+
%% 6.2.2.3. Path Segment Normalization
%% 5.2.4. Remove Dot Segments
normalize_path_segment(Map) ->