Use a more efficient variant of string:to_lower to improve performance.

After much testing and experimentation of all kinds, I find lists to be both faster and lighter on memory than binaries for request-line and headers handling. This is more than likely due to the fact that headers are very short and thus do not benefit from the advantages of refc binaries, meaning they're copied, just like lists. The memory usage discrepancy is still a mystery for the most part, although the hoops needed to perform operations on the binaries are probably responsible for the extra memory use. I'm thus giving up on trying to use binaries for request-line and headers. Instead, this commit further improves the performance of the lists code, making lists 5% faster than binaries. Lists are easier to work with too, so I guess it's all a big win for everyone. Of course, the request body is still read as a binary; we're using the binary type where it performs best.
author: Loïc Hoguin <[email protected]> 2011-03-27 01:16:11 +0100
committer: Loïc Hoguin <[email protected]> 2011-03-27 01:16:11 +0100
commit: d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3 (patch)
tree: f6692301fa8f811ad3e8c042875bd576aba290f1 /src
parent: 5726aa3d85c0b8642b90d698b15fee8e5a0281fb (diff)
download: cowboy-d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3.tar.gz
cowboy-d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3.tar.bz2
cowboy-d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3.zip
1 files changed, 38 insertions, 2 deletions
diff --git a/src/cowboy_http_protocol.erl b/src/cowboy_http_protocol.erl
index 55ecd34..6242fdd 100644
--- a/src/cowboy_http_protocol.erl
+++ b/src/cowboy_http_protocol.erl
@@ -97,7 +97,7 @@ wait_header(Req, State=#state{socket=Socket,
 	Value::string()} | http_eoh, Req::#http_req{}, State::#state{}) -> ok.
 header({http_header, _I, 'Host', _R, RawHost}, Req=#http_req{path=Path,
 		host=undefined}, State=#state{dispatch=Dispatch}) ->
-	RawHost2 = string:to_lower(RawHost),
+	RawHost2 = string_to_lower(RawHost),
 	Host = cowboy_dispatcher:split_host(RawHost2),
 	%% @todo We probably want to filter the Host and Path here to allow
 	%%       things like url rewriting.
@@ -220,7 +220,43 @@ connection_to_atom("keep-alive") ->
 connection_to_atom("close") ->
 	close;
 connection_to_atom(Connection) ->
-	case string:to_lower(Connection) of
+	case string_to_lower(Connection) of
 		"close" -> close;
 		_Any -> keepalive
 	end.
+
+%% More efficient implementation of string:to_lower.
+%% We are excluding a few characters on purpose.
+-spec string_to_lower(string()) -> string().
+string_to_lower(L) ->
+	[char_to_lower(C) || C <- L].
+
+%% We gain noticeable speed by matching each value directly.
+-spec char_to_lower(char()) -> char().
+char_to_lower($A) -> $a;
+char_to_lower($B) -> $b;
+char_to_lower($C) -> $c;
+char_to_lower($D) -> $d;
+char_to_lower($E) -> $e;
+char_to_lower($F) -> $f;
+char_to_lower($G) -> $g;
+char_to_lower($H) -> $h;
+char_to_lower($I) -> $i;
+char_to_lower($J) -> $j;
+char_to_lower($K) -> $k;
+char_to_lower($L) -> $l;
+char_to_lower($M) -> $m;
+char_to_lower($N) -> $n;
+char_to_lower($O) -> $o;
+char_to_lower($P) -> $p;
+char_to_lower($Q) -> $q;
+char_to_lower($R) -> $r;
+char_to_lower($S) -> $s;
+char_to_lower($T) -> $t;
+char_to_lower($U) -> $u;
+char_to_lower($V) -> $v;
+char_to_lower($W) -> $w;
+char_to_lower($X) -> $x;
+char_to_lower($Y) -> $y;
+char_to_lower($Z) -> $z;
+char_to_lower(Ch) -> Ch.
author	Loïc Hoguin <[email protected]>	2011-03-27 01:16:11 +0100
committer	Loïc Hoguin <[email protected]>	2011-03-27 01:16:11 +0100
commit	d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3 (patch)
tree	f6692301fa8f811ad3e8c042875bd576aba290f1 /src
parent	5726aa3d85c0b8642b90d698b15fee8e5a0281fb (diff)
download	cowboy-d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3.tar.gz cowboy-d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3.tar.bz2 cowboy-d0d9b0e8b363b456bd0b9e5fbdebc90f055546c3.zip