cowboy_bstr.erl 4.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135
  1. %% Copyright (c) 2011-2014, Loïc Hoguin <essen@ninenines.eu>
  2. %%
  3. %% Permission to use, copy, modify, and/or distribute this software for any
  4. %% purpose with or without fee is hereby granted, provided that the above
  5. %% copyright notice and this permission notice appear in all copies.
  6. %%
  7. %% THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
  8. %% WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
  9. %% MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
  10. %% ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
  11. %% WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
  12. %% ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
  13. %% OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
  14. %% @doc Binary string manipulation.
  15. -module(cowboy_bstr).
  16. %% Binary strings.
  17. -export([capitalize_token/1]).
  18. -export([to_lower/1]).
  19. -export([to_upper/1]).
  20. %% Characters.
  21. -export([char_to_lower/1]).
  22. -export([char_to_upper/1]).
  23. %% @doc Capitalize a token.
  24. %%
  25. %% The first letter and all letters after a dash are capitalized.
  26. %% This is the form seen for header names in the HTTP/1.1 RFC and
  27. %% others. Note that using this form isn't required, as header name
  28. %% are case insensitive, and it is only provided for use with eventual
  29. %% badly implemented clients.
  30. -spec capitalize_token(B) -> B when B::binary().
  31. capitalize_token(B) ->
  32. capitalize_token(B, true, <<>>).
  33. capitalize_token(<<>>, _, Acc) ->
  34. Acc;
  35. capitalize_token(<< $-, Rest/bits >>, _, Acc) ->
  36. capitalize_token(Rest, true, << Acc/binary, $- >>);
  37. capitalize_token(<< C, Rest/bits >>, true, Acc) ->
  38. capitalize_token(Rest, false, << Acc/binary, (char_to_upper(C)) >>);
  39. capitalize_token(<< C, Rest/bits >>, false, Acc) ->
  40. capitalize_token(Rest, false, << Acc/binary, (char_to_lower(C)) >>).
  41. %% @doc Convert a binary string to lowercase.
  42. -spec to_lower(B) -> B when B::binary().
  43. to_lower(B) ->
  44. << << (char_to_lower(C)) >> || << C >> <= B >>.
  45. %% @doc Convert a binary string to uppercase.
  46. -spec to_upper(B) -> B when B::binary().
  47. to_upper(B) ->
  48. << << (char_to_upper(C)) >> || << C >> <= B >>.
  49. %% @doc Convert [A-Z] characters to lowercase.
  50. %% @end
  51. %% We gain noticeable speed by matching each value directly.
  52. -spec char_to_lower(char()) -> char().
  53. char_to_lower($A) -> $a;
  54. char_to_lower($B) -> $b;
  55. char_to_lower($C) -> $c;
  56. char_to_lower($D) -> $d;
  57. char_to_lower($E) -> $e;
  58. char_to_lower($F) -> $f;
  59. char_to_lower($G) -> $g;
  60. char_to_lower($H) -> $h;
  61. char_to_lower($I) -> $i;
  62. char_to_lower($J) -> $j;
  63. char_to_lower($K) -> $k;
  64. char_to_lower($L) -> $l;
  65. char_to_lower($M) -> $m;
  66. char_to_lower($N) -> $n;
  67. char_to_lower($O) -> $o;
  68. char_to_lower($P) -> $p;
  69. char_to_lower($Q) -> $q;
  70. char_to_lower($R) -> $r;
  71. char_to_lower($S) -> $s;
  72. char_to_lower($T) -> $t;
  73. char_to_lower($U) -> $u;
  74. char_to_lower($V) -> $v;
  75. char_to_lower($W) -> $w;
  76. char_to_lower($X) -> $x;
  77. char_to_lower($Y) -> $y;
  78. char_to_lower($Z) -> $z;
  79. char_to_lower(Ch) -> Ch.
  80. %% @doc Convert [a-z] characters to uppercase.
  81. -spec char_to_upper(char()) -> char().
  82. char_to_upper($a) -> $A;
  83. char_to_upper($b) -> $B;
  84. char_to_upper($c) -> $C;
  85. char_to_upper($d) -> $D;
  86. char_to_upper($e) -> $E;
  87. char_to_upper($f) -> $F;
  88. char_to_upper($g) -> $G;
  89. char_to_upper($h) -> $H;
  90. char_to_upper($i) -> $I;
  91. char_to_upper($j) -> $J;
  92. char_to_upper($k) -> $K;
  93. char_to_upper($l) -> $L;
  94. char_to_upper($m) -> $M;
  95. char_to_upper($n) -> $N;
  96. char_to_upper($o) -> $O;
  97. char_to_upper($p) -> $P;
  98. char_to_upper($q) -> $Q;
  99. char_to_upper($r) -> $R;
  100. char_to_upper($s) -> $S;
  101. char_to_upper($t) -> $T;
  102. char_to_upper($u) -> $U;
  103. char_to_upper($v) -> $V;
  104. char_to_upper($w) -> $W;
  105. char_to_upper($x) -> $X;
  106. char_to_upper($y) -> $Y;
  107. char_to_upper($z) -> $Z;
  108. char_to_upper(Ch) -> Ch.
  109. %% Tests.
  110. -ifdef(TEST).
  111. capitalize_token_test_() ->
  112. %% {Header, Result}
  113. Tests = [
  114. {<<"heLLo-woRld">>, <<"Hello-World">>},
  115. {<<"Sec-Websocket-Version">>, <<"Sec-Websocket-Version">>},
  116. {<<"Sec-WebSocket-Version">>, <<"Sec-Websocket-Version">>},
  117. {<<"sec-websocket-version">>, <<"Sec-Websocket-Version">>},
  118. {<<"SEC-WEBSOCKET-VERSION">>, <<"Sec-Websocket-Version">>},
  119. {<<"Sec-WebSocket--Version">>, <<"Sec-Websocket--Version">>},
  120. {<<"Sec-WebSocket---Version">>, <<"Sec-Websocket---Version">>}
  121. ],
  122. [{H, fun() -> R = capitalize_token(H) end} || {H, R} <- Tests].
  123. -endif.