123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440 |
- %% Copyright (c) 2014, Loïc Hoguin <essen@ninenines.eu>
- %%
- %% Permission to use, copy, modify, and/or distribute this software for any
- %% purpose with or without fee is hereby granted, provided that the above
- %% copyright notice and this permission notice appear in all copies.
- %%
- %% THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
- %% WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
- %% MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
- %% ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
- %% WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
- %% ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
- %% OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
- -module(cow_http_hd).
- -export([parse_accept/1]).
- -export([parse_accept_charset/1]).
- -export([parse_accept_encoding/1]).
- -export([parse_accept_language/1]).
- -export([parse_connection/1]).
- -export([parse_content_length/1]).
- -export([parse_content_type/1]).
- -export([parse_date/1]).
- -export([parse_etag/1]).
- -export([parse_expect/1]).
- -export([parse_if_match/1]).
- -export([parse_if_modified_since/1]).
- -export([parse_if_none_match/1]).
- -export([parse_if_unmodified_since/1]).
- -export([parse_last_modified/1]).
- -export([parse_max_forwards/1]).
- -export([parse_transfer_encoding/1]).
- -export([parse_upgrade/1]).
- -type etag() :: {weak | strong, binary()}.
- -export_type([etag/0]).
- -type media_type() :: {binary(), binary(), [{binary(), binary()}]}.
- -export_type([media_type/0]).
- -type qvalue() :: 0..1000.
- -export_type([qvalue/0]).
- -include("cow_inline.hrl").
- -ifdef(TEST).
- -include_lib("triq/include/triq.hrl").
- ows() ->
- list(oneof([$\s, $\t])).
- alpha_chars() -> "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ".
- alphanum_chars() -> "0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ".
- alpha() ->
- oneof(alpha_chars()).
- alphanum() ->
- oneof(alphanum_chars()).
- tchar() ->
- frequency([
- {1, oneof([$!, $#, $$, $%, $&, $', $*, $+, $-, $., $^, $_, $`, $|, $~])},
- {99, oneof(alphanum_chars())}
- ]).
- token() ->
- ?LET(T,
- non_empty(list(tchar())),
- list_to_binary(T)).
- obs_text() ->
- [128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,143,144,145,
- 146,147,148,149,150,151,152,153,154,155,156,157,158,159,160,161,162,163,
- 164,165,166,167,168,169,170,171,172,173,174,175,176,177,178,179,180,181,
- 182,183,184,185,186,187,188,189,190,191,192,193,194,195,196,197,198,199,
- 200,201,202,203,204,205,206,207,208,209,210,211,212,213,214,215,216,217,
- 218,219,220,221,222,223,224,225,226,227,228,229,230,231,232,233,234,235,
- 236,237,238,239,240,241,242,243,244,245,246,247,248,249,250,251,252,253,
- 254,255].
- qdtext() ->
- frequency([
- {99, oneof("\t\s!#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[]^_`abcdefghijklmnopqrstuvwxyz{|}~")},
- {1, oneof(obs_text())}
- ]).
- quoted_pair() ->
- [$\\, frequency([
- {99, oneof("\t\s!\"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\\]^_`abcdefghijklmnopqrstuvwxyz{|}~")},
- {1, oneof(obs_text())}
- ])].
- quoted_string() ->
- [$", list(frequency([{100, qdtext()}, {1, quoted_pair()}])), $"].
- %% Helper function for ( token / quoted-string ) values.
- unquote([$", V, $"]) -> unquote(V, <<>>);
- unquote(V) -> V.
- unquote([], Acc) -> Acc;
- unquote([[$\\, C]|Tail], Acc) -> unquote(Tail, << Acc/binary, C >>);
- unquote([C|Tail], Acc) -> unquote(Tail, << Acc/binary, C >>).
- parameter() ->
- ?SUCHTHAT({K, _, _, _},
- {token(), oneof([token(), quoted_string()]), ows(), ows()},
- K =/= <<"q">>).
- weight() ->
- frequency([
- {90, int(0, 1000)},
- {10, undefined}
- ]).
- %% Helper function for weight's qvalue formatting.
- qvalue_to_iodata(0) -> <<"0">>;
- qvalue_to_iodata(Q) when Q < 10 -> [<<"0.00">>, integer_to_binary(Q)];
- qvalue_to_iodata(Q) when Q < 100 -> [<<"0.0">>, integer_to_binary(Q)];
- qvalue_to_iodata(Q) when Q < 1000 -> [<<"0.">>, integer_to_binary(Q)];
- qvalue_to_iodata(1000) -> <<"1">>.
- -endif.
- %% @doc Parse the Accept header.
- -spec parse_accept(binary()) -> [{media_type(), qvalue(), [binary() | {binary(), binary()}]}].
- parse_accept(<<"*/*">>) ->
- [{{<<"*">>, <<"*">>, []}, 1000, []}];
- parse_accept(Accept) ->
- media_range_list(Accept, []).
- media_range_list(<<>>, Acc) -> lists:reverse(Acc);
- media_range_list(<< $\s, R/bits >>, Acc) -> media_range_list(R, Acc);
- media_range_list(<< $\t, R/bits >>, Acc) -> media_range_list(R, Acc);
- media_range_list(<< $,, R/bits >>, Acc) -> media_range_list(R, Acc);
- media_range_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_range_type, R, Acc, <<>>)
- end.
- media_range_type(<< $/, R/bits >>, Acc, T) -> media_range_subtype(R, Acc, T, <<>>);
- %% Special clause for badly behaving user agents that send * instead of */*.
- media_range_type(<< $;, R/bits >>, Acc, <<"*">>) -> media_range_before_param(R, Acc, <<"*">>, <<"*">>, []);
- media_range_type(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_range_type, R, Acc, T)
- end.
- media_range_subtype(<<>>, Acc, T, S) when S =/= <<>> -> lists:reverse([{{T, S, []}, 1000, []}|Acc]);
- media_range_subtype(<< $,, R/bits >>, Acc, T, S) when S =/= <<>> -> media_range_list(R, [{{T, S, []}, 1000, []}|Acc]);
- media_range_subtype(<< $;, R/bits >>, Acc, T, S) when S =/= <<>> -> media_range_before_param(R, Acc, T, S, []);
- media_range_subtype(<< $\s, R/bits >>, Acc, T, S) when S =/= <<>> -> media_range_before_semicolon(R, Acc, T, S, []);
- media_range_subtype(<< $\t, R/bits >>, Acc, T, S) when S =/= <<>> -> media_range_before_semicolon(R, Acc, T, S, []);
- media_range_subtype(<< C, R/bits >>, Acc, T, S) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_range_subtype, R, Acc, T, S)
- end.
- media_range_before_semicolon(<<>>, Acc, T, S, P) -> lists:reverse([{{T, S, lists:reverse(P)}, 1000, []}|Acc]);
- media_range_before_semicolon(<< $,, R/bits >>, Acc, T, S, P) -> media_range_list(R, [{{T, S, lists:reverse(P)}, 1000, []}|Acc]);
- media_range_before_semicolon(<< $;, R/bits >>, Acc, T, S, P) -> media_range_before_param(R, Acc, T, S, P);
- media_range_before_semicolon(<< $\s, R/bits >>, Acc, T, S, P) -> media_range_before_semicolon(R, Acc, T, S, P);
- media_range_before_semicolon(<< $\t, R/bits >>, Acc, T, S, P) -> media_range_before_semicolon(R, Acc, T, S, P).
- media_range_before_param(<< $\s, R/bits >>, Acc, T, S, P) -> media_range_before_param(R, Acc, T, S, P);
- media_range_before_param(<< $\t, R/bits >>, Acc, T, S, P) -> media_range_before_param(R, Acc, T, S, P);
- %% Special clause for badly behaving user agents that send .123 instead of 0.123.
- media_range_before_param(<< $q, $=, $., R/bits >>, Acc, T, S, P) -> media_range_broken_weight(R, Acc, T, S, P);
- media_range_before_param(<< $q, $=, R/bits >>, Acc, T, S, P) -> media_range_weight(R, Acc, T, S, P);
- media_range_before_param(<< C, R/bits >>, Acc, T, S, P) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_range_param, R, Acc, T, S, P, <<>>)
- end.
- media_range_param(<< $=, $", R/bits >>, Acc, T, S, P, K) -> media_range_quoted(R, Acc, T, S, P, K, <<>>);
- media_range_param(<< $=, R/bits >>, Acc, T, S, P, K) -> media_range_value(R, Acc, T, S, P, K, <<>>);
- media_range_param(<< C, R/bits >>, Acc, T, S, P, K) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_range_param, R, Acc, T, S, P, K)
- end.
- media_range_quoted(<< $", R/bits >>, Acc, T, S, P, K, V) -> media_range_before_semicolon(R, Acc, T, S, [{K, V}|P]);
- media_range_quoted(<< $\\, C, R/bits >>, Acc, T, S, P, K, V) when ?IS_VCHAR(C) -> media_range_quoted(R, Acc, T, S, P, K, << V/binary, C >>);
- media_range_quoted(<< C, R/bits >>, Acc, T, S, P, K, V) when ?IS_VCHAR(C) -> media_range_quoted(R, Acc, T, S, P, K, << V/binary, C >>).
- media_range_value(<<>>, Acc, T, S, P, K, V) -> lists:reverse([{{T, S, lists:reverse([{K, V}|P])}, 1000, []}|Acc]);
- media_range_value(<< $,, R/bits >>, Acc, T, S, P, K, V) -> media_range_list(R, [{{T, S, lists:reverse([{K, V}|P])}, 1000, []}|Acc]);
- media_range_value(<< $;, R/bits >>, Acc, T, S, P, K, V) -> media_range_before_param(R, Acc, T, S, [{K, V}|P]);
- media_range_value(<< $\s, R/bits >>, Acc, T, S, P, K, V) -> media_range_before_semicolon(R, Acc, T, S, [{K, V}|P]);
- media_range_value(<< $\t, R/bits >>, Acc, T, S, P, K, V) -> media_range_before_semicolon(R, Acc, T, S, [{K, V}|P]);
- media_range_value(<< C, R/bits >>, Acc, T, S, P, K, V) when ?IS_TOKEN(C) -> media_range_value(R, Acc, T, S, P, K, << V/binary, C >>).
- %% Special function for badly behaving user agents that send .123 instead of 0.123.
- media_range_broken_weight(<< A, B, C, R/bits >>, Acc, T, S, P)
- when A >= $0, A =< $9, B >= $0, B =< $9, C >= $0, C =< $9 ->
- accept_before_semicolon(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10 + (C - $0), []);
- media_range_broken_weight(<< A, B, R/bits >>, Acc, T, S, P)
- when A >= $0, A =< $9, B >= $0, B =< $9 ->
- accept_before_semicolon(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10, []);
- media_range_broken_weight(<< A, R/bits >>, Acc, T, S, P)
- when A >= $0, A =< $9 ->
- accept_before_semicolon(R, Acc, T, S, P, (A - $0) * 100, []).
- media_range_weight(<< "1.000", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 1000, []);
- media_range_weight(<< "1.00", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 1000, []);
- media_range_weight(<< "1.0", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 1000, []);
- media_range_weight(<< "1.", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 1000, []);
- media_range_weight(<< "1", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 1000, []);
- media_range_weight(<< "0.", A, B, C, R/bits >>, Acc, T, S, P)
- when A >= $0, A =< $9, B >= $0, B =< $9, C >= $0, C =< $9 ->
- accept_before_semicolon(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10 + (C - $0), []);
- media_range_weight(<< "0.", A, B, R/bits >>, Acc, T, S, P)
- when A >= $0, A =< $9, B >= $0, B =< $9 ->
- accept_before_semicolon(R, Acc, T, S, P, (A - $0) * 100 + (B - $0) * 10, []);
- media_range_weight(<< "0.", A, R/bits >>, Acc, T, S, P)
- when A >= $0, A =< $9 ->
- accept_before_semicolon(R, Acc, T, S, P, (A - $0) * 100, []);
- media_range_weight(<< "0.", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 0, []);
- media_range_weight(<< "0", R/bits >>, Acc, T, S, P) -> accept_before_semicolon(R, Acc, T, S, P, 0, []).
- accept_before_semicolon(<<>>, Acc, T, S, P, Q, E) -> lists:reverse([{{T, S, lists:reverse(P)}, Q, lists:reverse(E)}|Acc]);
- accept_before_semicolon(<< $,, R/bits >>, Acc, T, S, P, Q, E) -> media_range_list(R, [{{T, S, lists:reverse(P)}, Q, lists:reverse(E)}|Acc]);
- accept_before_semicolon(<< $;, R/bits >>, Acc, T, S, P, Q, E) -> accept_before_ext(R, Acc, T, S, P, Q, E);
- accept_before_semicolon(<< $\s, R/bits >>, Acc, T, S, P, Q, E) -> accept_before_semicolon(R, Acc, T, S, P, Q, E);
- accept_before_semicolon(<< $\t, R/bits >>, Acc, T, S, P, Q, E) -> accept_before_semicolon(R, Acc, T, S, P, Q, E).
- accept_before_ext(<< $\s, R/bits >>, Acc, T, S, P, Q, E) -> accept_before_ext(R, Acc, T, S, P, Q, E);
- accept_before_ext(<< $\t, R/bits >>, Acc, T, S, P, Q, E) -> accept_before_ext(R, Acc, T, S, P, Q, E);
- accept_before_ext(<< C, R/bits >>, Acc, T, S, P, Q, E) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(accept_ext, R, Acc, T, S, P, Q, E, <<>>)
- end.
- accept_ext(<<>>, Acc, T, S, P, Q, E, K) -> lists:reverse([{{T, S, lists:reverse(P)}, Q, lists:reverse([K|E])}|Acc]);
- accept_ext(<< $,, R/bits >>, Acc, T, S, P, Q, E, K) -> media_range_list(R, [{{T, S, lists:reverse(P)}, Q, lists:reverse([K|E])}|Acc]);
- accept_ext(<< $;, R/bits >>, Acc, T, S, P, Q, E, K) -> accept_before_ext(R, Acc, T, S, P, Q, [K|E]);
- accept_ext(<< $\s, R/bits >>, Acc, T, S, P, Q, E, K) -> accept_before_semicolon(R, Acc, T, S, P, Q, [K|E]);
- accept_ext(<< $\t, R/bits >>, Acc, T, S, P, Q, E, K) -> accept_before_semicolon(R, Acc, T, S, P, Q, [K|E]);
- accept_ext(<< $=, $", R/bits >>, Acc, T, S, P, Q, E, K) -> accept_quoted(R, Acc, T, S, P, Q, E, K, <<>>);
- accept_ext(<< $=, R/bits >>, Acc, T, S, P, Q, E, K) -> accept_value(R, Acc, T, S, P, Q, E, K, <<>>);
- accept_ext(<< C, R/bits >>, Acc, T, S, P, Q, E, K) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(accept_ext, R, Acc, T, S, P, Q, E, K)
- end.
- accept_quoted(<< $", R/bits >>, Acc, T, S, P, Q, E, K, V) -> accept_before_semicolon(R, Acc, T, S, P, Q, [{K, V}|E]);
- accept_quoted(<< $\\, C, R/bits >>, Acc, T, S, P, Q, E, K, V) when ?IS_VCHAR(C) -> accept_quoted(R, Acc, T, S, P, Q, E, K, << V/binary, C >>);
- accept_quoted(<< C, R/bits >>, Acc, T, S, P, Q, E, K, V) when ?IS_VCHAR(C) -> accept_quoted(R, Acc, T, S, P, Q, E, K, << V/binary, C >>).
- accept_value(<<>>, Acc, T, S, P, Q, E, K, V) -> lists:reverse([{{T, S, lists:reverse(P)}, Q, lists:reverse([{K, V}|E])}|Acc]);
- accept_value(<< $,, R/bits >>, Acc, T, S, P, Q, E, K, V) -> media_range_list(R, [{{T, S, lists:reverse(P)}, Q, lists:reverse([{K, V}|E])}|Acc]);
- accept_value(<< $;, R/bits >>, Acc, T, S, P, Q, E, K, V) -> accept_before_ext(R, Acc, T, S, P, Q, [{K, V}|E]);
- accept_value(<< $\s, R/bits >>, Acc, T, S, P, Q, E, K, V) -> accept_before_semicolon(R, Acc, T, S, P, Q, [{K, V}|E]);
- accept_value(<< $\t, R/bits >>, Acc, T, S, P, Q, E, K, V) -> accept_before_semicolon(R, Acc, T, S, P, Q, [{K, V}|E]);
- accept_value(<< C, R/bits >>, Acc, T, S, P, Q, E, K, V) when ?IS_TOKEN(C) -> accept_value(R, Acc, T, S, P, Q, E, K, << V/binary, C >>).
- -ifdef(TEST).
- accept_ext() ->
- oneof([token(), parameter()]).
- accept_params() ->
- frequency([
- {90, []},
- {10, list(accept_ext())}
- ]).
- accept() ->
- ?LET({T, S, P, W, E},
- {token(), token(), list(parameter()), weight(), accept_params()},
- {T, S, P, W, E, iolist_to_binary([T, $/, S,
- [[OWS1, $;, OWS2, K, $=, V] || {K, V, OWS1, OWS2} <- P],
- case W of
- undefined -> [];
- _ -> [
- [<<";q=">>, qvalue_to_iodata(W)],
- [case Ext of
- {K, V, OWS1, OWS2} -> [OWS1, $;, OWS2, K, $=, V];
- K -> [$;, K]
- end || Ext <- E]]
- end])}
- ).
- prop_parse_accept() ->
- ?FORALL(L,
- non_empty(list(accept())),
- begin
- << _, Accept/binary >> = iolist_to_binary([[$,, A] || {_, _, _, _, _, A} <- L]),
- ResL = parse_accept(Accept),
- CheckedL = [begin
- ExpectedP = [{?INLINE_LOWERCASE_BC(K), unquote(V)} || {K, V, _, _} <- P],
- ExpectedE = [case Ext of
- {K, V, _, _} -> {?INLINE_LOWERCASE_BC(K), unquote(V)};
- K -> ?INLINE_LOWERCASE_BC(K)
- end || Ext <- E],
- ResT =:= ?INLINE_LOWERCASE_BC(T)
- andalso ResS =:= ?INLINE_LOWERCASE_BC(S)
- andalso ResP =:= ExpectedP
- andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
- andalso ((W =:= undefined andalso ResE =:= []) orelse (W =/= undefined andalso ResE =:= ExpectedE))
- end || {{T, S, P, W, E, _}, {{ResT, ResS, ResP}, ResW, ResE}} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end
- ).
- parse_accept_test_() ->
- Tests = [
- {<<>>, []},
- {<<" ">>, []},
- {<<"audio/*; q=0.2, audio/basic">>, [
- {{<<"audio">>, <<"*">>, []}, 200, []},
- {{<<"audio">>, <<"basic">>, []}, 1000, []}
- ]},
- {<<"text/plain; q=0.5, text/html, "
- "text/x-dvi; q=0.8, text/x-c">>, [
- {{<<"text">>, <<"plain">>, []}, 500, []},
- {{<<"text">>, <<"html">>, []}, 1000, []},
- {{<<"text">>, <<"x-dvi">>, []}, 800, []},
- {{<<"text">>, <<"x-c">>, []}, 1000, []}
- ]},
- {<<"text/*, text/html, text/html;level=1, */*">>, [
- {{<<"text">>, <<"*">>, []}, 1000, []},
- {{<<"text">>, <<"html">>, []}, 1000, []},
- {{<<"text">>, <<"html">>, [{<<"level">>, <<"1">>}]}, 1000, []},
- {{<<"*">>, <<"*">>, []}, 1000, []}
- ]},
- {<<"text/*;q=0.3, text/html;q=0.7, text/html;level=1, "
- "text/html;level=2;q=0.4, */*;q=0.5">>, [
- {{<<"text">>, <<"*">>, []}, 300, []},
- {{<<"text">>, <<"html">>, []}, 700, []},
- {{<<"text">>, <<"html">>, [{<<"level">>, <<"1">>}]}, 1000, []},
- {{<<"text">>, <<"html">>, [{<<"level">>, <<"2">>}]}, 400, []},
- {{<<"*">>, <<"*">>, []}, 500, []}
- ]},
- {<<"text/html;level=1;quoted=\"hi hi hi\";"
- "q=0.123;standalone;complex=gits, text/plain">>, [
- {{<<"text">>, <<"html">>,
- [{<<"level">>, <<"1">>}, {<<"quoted">>, <<"hi hi hi">>}]}, 123,
- [<<"standalone">>, {<<"complex">>, <<"gits">>}]},
- {{<<"text">>, <<"plain">>, []}, 1000, []}
- ]},
- {<<"text/html, image/gif, image/jpeg, *; q=.2, */*; q=.2">>, [
- {{<<"text">>, <<"html">>, []}, 1000, []},
- {{<<"image">>, <<"gif">>, []}, 1000, []},
- {{<<"image">>, <<"jpeg">>, []}, 1000, []},
- {{<<"*">>, <<"*">>, []}, 200, []},
- {{<<"*">>, <<"*">>, []}, 200, []}
- ]}
- ],
- [{V, fun() -> R = parse_accept(V) end} || {V, R} <- Tests].
- parse_accept_error_test_() ->
- Tests = [
- <<"audio/basic, */;q=0.5">>,
- <<"audio/, audio/basic">>,
- <<"aud\tio/basic">>,
- <<"audio/basic;t=\"zero \\", 0, " woo\"">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_accept(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_accept() ->
- horse:repeat(20000,
- parse_accept(<<"text/*;q=0.3, text/html;q=0.7, text/html;level=1, "
- "text/html;level=2;q=0.4, */*;q=0.5">>)
- ).
- -endif.
- %% @doc Parse the Accept-Charset header.
- -spec parse_accept_charset(binary()) -> [{binary(), qvalue()}].
- parse_accept_charset(Charset) ->
- nonempty(conneg_list(Charset, [])).
- conneg_list(<<>>, Acc) -> lists:reverse(Acc);
- conneg_list(<< $\s, R/bits >>, Acc) -> conneg_list(R, Acc);
- conneg_list(<< $\t, R/bits >>, Acc) -> conneg_list(R, Acc);
- conneg_list(<< $\,, R/bits >>, Acc) -> conneg_list(R, Acc);
- conneg_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(conneg, R, Acc, <<>>)
- end.
- conneg(<<>>, Acc, T) -> lists:reverse([{T, 1000}|Acc]);
- conneg(<< $,, R/bits >>, Acc, T) -> conneg_list(R, [{T, 1000}|Acc]);
- conneg(<< $;, R/bits >>, Acc, T) -> conneg_before_weight(R, Acc, T);
- conneg(<< $\s, R/bits >>, Acc, T) -> conneg_before_semicolon(R, Acc, T);
- conneg(<< $\t, R/bits >>, Acc, T) -> conneg_before_semicolon(R, Acc, T);
- conneg(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(conneg, R, Acc, T)
- end.
- conneg_before_semicolon(<<>>, Acc, T) -> lists:reverse([{T, 1000}|Acc]);
- conneg_before_semicolon(<< $,, R/bits >>, Acc, T) -> conneg_list(R, [{T, 1000}|Acc]);
- conneg_before_semicolon(<< $;, R/bits >>, Acc, T) -> conneg_before_weight(R, Acc, T);
- conneg_before_semicolon(<< $\s, R/bits >>, Acc, T) -> conneg_before_semicolon(R, Acc, T);
- conneg_before_semicolon(<< $\t, R/bits >>, Acc, T) -> conneg_before_semicolon(R, Acc, T).
- conneg_before_weight(<< $\s, R/bits >>, Acc, T) -> conneg_before_weight(R, Acc, T);
- conneg_before_weight(<< $\t, R/bits >>, Acc, T) -> conneg_before_weight(R, Acc, T);
- conneg_before_weight(<< $q, $=, R/bits >>, Acc, T) -> conneg_weight(R, Acc, T);
- %% Special clause for broken user agents that confuse ; and , separators.
- conneg_before_weight(<< C, R/bits >>, Acc, T) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(conneg, R, [{T, 1000}|Acc], <<>>)
- end.
- conneg_weight(<< "1.000", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
- conneg_weight(<< "1.00", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
- conneg_weight(<< "1.0", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
- conneg_weight(<< "1.", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
- conneg_weight(<< "1", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 1000}|Acc]);
- conneg_weight(<< "0.", A, B, C, R/bits >>, Acc, T)
- when A >= $0, A =< $9, B >= $0, B =< $9, C >= $0, C =< $9 ->
- conneg_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10 + (C - $0)}|Acc]);
- conneg_weight(<< "0.", A, B, R/bits >>, Acc, T)
- when A >= $0, A =< $9, B >= $0, B =< $9 ->
- conneg_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10}|Acc]);
- conneg_weight(<< "0.", A, R/bits >>, Acc, T)
- when A >= $0, A =< $9 ->
- conneg_list_sep(R, [{T, (A - $0) * 100}|Acc]);
- conneg_weight(<< "0.", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 0}|Acc]);
- conneg_weight(<< "0", R/bits >>, Acc, T) -> conneg_list_sep(R, [{T, 0}|Acc]).
- conneg_list_sep(<<>>, Acc) -> lists:reverse(Acc);
- conneg_list_sep(<< $\s, R/bits >>, Acc) -> conneg_list_sep(R, Acc);
- conneg_list_sep(<< $\t, R/bits >>, Acc) -> conneg_list_sep(R, Acc);
- conneg_list_sep(<< $,, R/bits >>, Acc) -> conneg_list(R, Acc).
- -ifdef(TEST).
- accept_charset() ->
- ?LET({C, W},
- {token(), weight()},
- {C, W, iolist_to_binary([C, case W of
- undefined -> [];
- _ -> [<<";q=">>, qvalue_to_iodata(W)]
- end])}
- ).
- prop_parse_accept_charset() ->
- ?FORALL(L,
- non_empty(list(accept_charset())),
- begin
- << _, AcceptCharset/binary >> = iolist_to_binary([[$,, A] || {_, _, A} <- L]),
- ResL = parse_accept_charset(AcceptCharset),
- CheckedL = [begin
- ResC =:= ?INLINE_LOWERCASE_BC(Ch)
- andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
- end || {{Ch, W, _}, {ResC, ResW}} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_accept_charset_test_() ->
- Tests = [
- {<<"iso-8859-5, unicode-1-1;q=0.8">>, [
- {<<"iso-8859-5">>, 1000},
- {<<"unicode-1-1">>, 800}
- ]},
- %% Some user agents send this invalid value for the Accept-Charset header
- {<<"ISO-8859-1;utf-8;q=0.7,*;q=0.7">>, [
- {<<"iso-8859-1">>, 1000},
- {<<"utf-8">>, 700},
- {<<"*">>, 700}
- ]}
- ],
- [{V, fun() -> R = parse_accept_charset(V) end} || {V, R} <- Tests].
- parse_accept_charset_error_test_() ->
- Tests = [
- <<>>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_accept_charset(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_accept_charset() ->
- horse:repeat(20000,
- parse_accept_charset(<<"iso-8859-5, unicode-1-1;q=0.8">>)
- ).
- -endif.
- %% @doc Parse the Accept-Encoding header.
- -spec parse_accept_encoding(binary()) -> [{binary(), qvalue()}].
- parse_accept_encoding(Encoding) ->
- conneg_list(Encoding, []).
- -ifdef(TEST).
- accept_encoding() ->
- ?LET({E, W},
- {token(), weight()},
- {E, W, iolist_to_binary([E, case W of
- undefined -> [];
- _ -> [<<";q=">>, qvalue_to_iodata(W)]
- end])}
- ).
- prop_parse_accept_encoding() ->
- ?FORALL(L,
- non_empty(list(accept_encoding())),
- begin
- << _, AcceptEncoding/binary >> = iolist_to_binary([[$,, A] || {_, _, A} <- L]),
- ResL = parse_accept_encoding(AcceptEncoding),
- CheckedL = [begin
- ResE =:= ?INLINE_LOWERCASE_BC(E)
- andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
- end || {{E, W, _}, {ResE, ResW}} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_accept_encoding_test_() ->
- Tests = [
- {<<>>, []},
- {<<"*">>, [{<<"*">>, 1000}]},
- {<<"compress, gzip">>, [
- {<<"compress">>, 1000},
- {<<"gzip">>, 1000}
- ]},
- {<<"compress;q=0.5, gzip;q=1.0">>, [
- {<<"compress">>, 500},
- {<<"gzip">>, 1000}
- ]},
- {<<"gzip;q=1.0, identity; q=0.5, *;q=0">>, [
- {<<"gzip">>, 1000},
- {<<"identity">>, 500},
- {<<"*">>, 0}
- ]}
- ],
- [{V, fun() -> R = parse_accept_encoding(V) end} || {V, R} <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_accept_encoding() ->
- horse:repeat(20000,
- parse_accept_encoding(<<"gzip;q=1.0, identity; q=0.5, *;q=0">>)
- ).
- -endif.
- %% @doc Parse the Accept-Language header.
- -spec parse_accept_language(binary()) -> [{binary(), qvalue()}].
- parse_accept_language(LanguageRange) ->
- nonempty(language_range_list(LanguageRange, [])).
- language_range_list(<<>>, Acc) -> lists:reverse(Acc);
- language_range_list(<< $\s, R/bits >>, Acc) -> language_range_list(R, Acc);
- language_range_list(<< $\t, R/bits >>, Acc) -> language_range_list(R, Acc);
- language_range_list(<< $\,, R/bits >>, Acc) -> language_range_list(R, Acc);
- language_range_list(<< $*, R/bits >>, Acc) -> language_range_before_semicolon(R, Acc, <<"*">>);
- language_range_list(<< C, R/bits >>, Acc) when ?IS_ALPHA(C) ->
- case C of
- ?INLINE_LOWERCASE(language_range, R, Acc, 1, <<>>)
- end.
- language_range(<<>>, Acc, _, T) -> lists:reverse([{T, 1000}|Acc]);
- language_range(<< $,, R/bits >>, Acc, _, T) -> language_range_list(R, [{T, 1000}|Acc]);
- language_range(<< $;, R/bits >>, Acc, _, T) -> language_range_before_weight(R, Acc, T);
- language_range(<< $\s, R/bits >>, Acc, _, T) -> language_range_before_semicolon(R, Acc, T);
- language_range(<< $\t, R/bits >>, Acc, _, T) -> language_range_before_semicolon(R, Acc, T);
- language_range(<< $-, R/bits >>, Acc, _, T) -> language_range_sub(R, Acc, 0, << T/binary, $- >>);
- language_range(<< _, _/bits >>, _, 8, _) -> error(badarg);
- language_range(<< C, R/bits >>, Acc, N, T) when ?IS_ALPHA(C) ->
- case C of
- ?INLINE_LOWERCASE(language_range, R, Acc, N + 1, T)
- end.
- language_range_sub(<<>>, Acc, N, T) when N > 0 -> lists:reverse([{T, 1000}|Acc]);
- language_range_sub(<< $,, R/bits >>, Acc, N, T) when N > 0 -> language_range_list(R, [{T, 1000}|Acc]);
- language_range_sub(<< $;, R/bits >>, Acc, N, T) when N > 0 -> language_range_before_weight(R, Acc, T);
- language_range_sub(<< $\s, R/bits >>, Acc, N, T) when N > 0 -> language_range_before_semicolon(R, Acc, T);
- language_range_sub(<< $\t, R/bits >>, Acc, N, T) when N > 0 -> language_range_before_semicolon(R, Acc, T);
- language_range_sub(<< $-, R/bits >>, Acc, N, T) when N > 0 -> language_range_sub(R, Acc, 0, << T/binary, $- >>);
- language_range_sub(<< _, _/bits >>, _, 8, _) -> error(badarg);
- language_range_sub(<< C, R/bits >>, Acc, N, T) when ?IS_ALPHA(C); ?IS_DIGIT(C) ->
- case C of
- ?INLINE_LOWERCASE(language_range_sub, R, Acc, N + 1, T)
- end.
- language_range_before_semicolon(<<>>, Acc, T) -> lists:reverse([{T, 1000}|Acc]);
- language_range_before_semicolon(<< $,, R/bits >>, Acc, T) -> language_range_list(R, [{T, 1000}|Acc]);
- language_range_before_semicolon(<< $;, R/bits >>, Acc, T) -> language_range_before_weight(R, Acc, T);
- language_range_before_semicolon(<< $\s, R/bits >>, Acc, T) -> language_range_before_semicolon(R, Acc, T);
- language_range_before_semicolon(<< $\t, R/bits >>, Acc, T) -> language_range_before_semicolon(R, Acc, T).
- language_range_before_weight(<< $\s, R/bits >>, Acc, T) -> language_range_before_weight(R, Acc, T);
- language_range_before_weight(<< $\t, R/bits >>, Acc, T) -> language_range_before_weight(R, Acc, T);
- language_range_before_weight(<< $q, $=, R/bits >>, Acc, T) -> language_range_weight(R, Acc, T);
- %% Special clause for broken user agents that confuse ; and , separators.
- language_range_before_weight(<< C, R/bits >>, Acc, T) when ?IS_ALPHA(C) ->
- case C of
- ?INLINE_LOWERCASE(language_range, R, [{T, 1000}|Acc], 1, <<>>)
- end.
- language_range_weight(<< "1.000", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
- language_range_weight(<< "1.00", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
- language_range_weight(<< "1.0", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
- language_range_weight(<< "1.", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
- language_range_weight(<< "1", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 1000}|Acc]);
- language_range_weight(<< "0.", A, B, C, R/bits >>, Acc, T)
- when A >= $0, A =< $9, B >= $0, B =< $9, C >= $0, C =< $9 ->
- language_range_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10 + (C - $0)}|Acc]);
- language_range_weight(<< "0.", A, B, R/bits >>, Acc, T)
- when A >= $0, A =< $9, B >= $0, B =< $9 ->
- language_range_list_sep(R, [{T, (A - $0) * 100 + (B - $0) * 10}|Acc]);
- language_range_weight(<< "0.", A, R/bits >>, Acc, T)
- when A >= $0, A =< $9 ->
- language_range_list_sep(R, [{T, (A - $0) * 100}|Acc]);
- language_range_weight(<< "0.", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 0}|Acc]);
- language_range_weight(<< "0", R/bits >>, Acc, T) -> language_range_list_sep(R, [{T, 0}|Acc]).
- language_range_list_sep(<<>>, Acc) -> lists:reverse(Acc);
- language_range_list_sep(<< $\s, R/bits >>, Acc) -> language_range_list_sep(R, Acc);
- language_range_list_sep(<< $\t, R/bits >>, Acc) -> language_range_list_sep(R, Acc);
- language_range_list_sep(<< $,, R/bits >>, Acc) -> language_range_list(R, Acc).
- -ifdef(TEST).
- language_tag() ->
- oneof([
- [alpha()],
- [alpha(), alpha()],
- [alpha(), alpha(), alpha()],
- [alpha(), alpha(), alpha(), alpha()],
- [alpha(), alpha(), alpha(), alpha(), alpha()],
- [alpha(), alpha(), alpha(), alpha(), alpha(), alpha()],
- [alpha(), alpha(), alpha(), alpha(), alpha(), alpha(), alpha()],
- [alpha(), alpha(), alpha(), alpha(), alpha(), alpha(), alpha(), alpha()]
- ]).
- language_subtag() ->
- [$-, oneof([
- [alphanum()],
- [alphanum(), alphanum()],
- [alphanum(), alphanum(), alphanum()],
- [alphanum(), alphanum(), alphanum(), alphanum()],
- [alphanum(), alphanum(), alphanum(), alphanum(), alphanum()],
- [alphanum(), alphanum(), alphanum(), alphanum(), alphanum(), alphanum()],
- [alphanum(), alphanum(), alphanum(), alphanum(), alphanum(), alphanum(), alphanum()],
- [alphanum(), alphanum(), alphanum(), alphanum(), alphanum(), alphanum(), alphanum(), alphanum()]
- ])].
- language_range() ->
- [language_tag(), list(language_subtag())].
- accept_language() ->
- ?LET({R, W},
- {language_range(), weight()},
- {iolist_to_binary(R), W, iolist_to_binary([R, case W of
- undefined -> [];
- _ -> [<<";q=">>, qvalue_to_iodata(W)]
- end])}
- ).
- prop_parse_accept_language() ->
- ?FORALL(L,
- non_empty(list(accept_language())),
- begin
- << _, AcceptLanguage/binary >> = iolist_to_binary([[$,, A] || {_, _, A} <- L]),
- ResL = parse_accept_language(AcceptLanguage),
- CheckedL = [begin
- ResR =:= ?INLINE_LOWERCASE_BC(R)
- andalso (ResW =:= W orelse (W =:= undefined andalso ResW =:= 1000))
- end || {{R, W, _}, {ResR, ResW}} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_accept_language_test_() ->
- Tests = [
- {<<"da, en-gb;q=0.8, en;q=0.7">>, [
- {<<"da">>, 1000},
- {<<"en-gb">>, 800},
- {<<"en">>, 700}
- ]},
- {<<"en, en-US, en-cockney, i-cherokee, x-pig-latin, es-419">>, [
- {<<"en">>, 1000},
- {<<"en-us">>, 1000},
- {<<"en-cockney">>, 1000},
- {<<"i-cherokee">>, 1000},
- {<<"x-pig-latin">>, 1000},
- {<<"es-419">>, 1000}
- ]}
- ],
- [{V, fun() -> R = parse_accept_language(V) end} || {V, R} <- Tests].
- parse_accept_language_error_test_() ->
- Tests = [
- <<>>,
- <<"loooooong">>,
- <<"en-us-loooooong">>,
- <<"419-en-us">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_accept_language(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_accept_language() ->
- horse:repeat(20000,
- parse_accept_language(<<"da, en-gb;q=0.8, en;q=0.7">>)
- ).
- -endif.
- %% @doc Parse the Connection header.
- -spec parse_connection(binary()) -> [binary()].
- parse_connection(<<"close">>) ->
- [<<"close">>];
- parse_connection(<<"keep-alive">>) ->
- [<<"keep-alive">>];
- parse_connection(Connection) ->
- nonempty(token_ci_list(Connection, [])).
- -ifdef(TEST).
- prop_parse_connection() ->
- ?FORALL(L,
- non_empty(list(token())),
- begin
- << _, Connection/binary >> = iolist_to_binary([[$,, C] || C <- L]),
- ResL = parse_connection(Connection),
- CheckedL = [?INLINE_LOWERCASE_BC(Co) =:= ResC || {Co, ResC} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_connection_test_() ->
- Tests = [
- {<<"close">>, [<<"close">>]},
- {<<"ClOsE">>, [<<"close">>]},
- {<<"Keep-Alive">>, [<<"keep-alive">>]},
- {<<"keep-alive, Upgrade">>, [<<"keep-alive">>, <<"upgrade">>]}
- ],
- [{V, fun() -> R = parse_connection(V) end} || {V, R} <- Tests].
- parse_connection_error_test_() ->
- Tests = [
- <<>>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_connection(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_connection_close() ->
- horse:repeat(200000,
- parse_connection(<<"close">>)
- ).
- horse_parse_connection_keepalive() ->
- horse:repeat(200000,
- parse_connection(<<"keep-alive">>)
- ).
- horse_parse_connection_keepalive_upgrade() ->
- horse:repeat(200000,
- parse_connection(<<"keep-alive, upgrade">>)
- ).
- -endif.
- %% @doc Parse the Content-Length header.
- %%
- %% The value has at least one digit, and may be followed by whitespace.
- -spec parse_content_length(binary()) -> non_neg_integer().
- parse_content_length(<< $0 >>) -> 0;
- parse_content_length(<< $0, R/bits >>) -> number(R, 0);
- parse_content_length(<< $1, R/bits >>) -> number(R, 1);
- parse_content_length(<< $2, R/bits >>) -> number(R, 2);
- parse_content_length(<< $3, R/bits >>) -> number(R, 3);
- parse_content_length(<< $4, R/bits >>) -> number(R, 4);
- parse_content_length(<< $5, R/bits >>) -> number(R, 5);
- parse_content_length(<< $6, R/bits >>) -> number(R, 6);
- parse_content_length(<< $7, R/bits >>) -> number(R, 7);
- parse_content_length(<< $8, R/bits >>) -> number(R, 8);
- parse_content_length(<< $9, R/bits >>) -> number(R, 9).
- -ifdef(TEST).
- prop_parse_content_length() ->
- ?FORALL(
- X,
- non_neg_integer(),
- X =:= parse_content_length(integer_to_binary(X))
- ).
- parse_content_length_test_() ->
- Tests = [
- {<<"0">>, 0},
- {<<"42 ">>, 42},
- {<<"69\t">>, 69},
- {<<"1337">>, 1337},
- {<<"3495">>, 3495},
- {<<"1234567890">>, 1234567890},
- {<<"1234567890 ">>, 1234567890}
- ],
- [{V, fun() -> R = parse_content_length(V) end} || {V, R} <- Tests].
- parse_content_length_error_test_() ->
- Tests = [
- <<>>,
- <<"123, 123">>,
- <<"4.17">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_content_length(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_content_length_zero() ->
- horse:repeat(100000,
- parse_content_length(<<"0">>)
- ).
- horse_parse_content_length_giga() ->
- horse:repeat(100000,
- parse_content_length(<<"1234567890">>)
- ).
- -endif.
- %% @doc Parse the Content-Type header.
- -spec parse_content_type(binary()) -> media_type().
- parse_content_type(<< C, R/bits >>) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_type, R, <<>>)
- end.
- media_type(<< $/, C, R/bits >>, T) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_subtype, R, T, <<>>)
- end;
- media_type(<< C, R/bits >>, T) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_type, R, T)
- end.
- media_subtype(<<>>, T, S) -> {T, S, []};
- media_subtype(<< $;, R/bits >>, T, S) -> media_before_param(R, T, S, []);
- media_subtype(<< $\s, R/bits >>, T, S) -> media_before_semicolon(R, T, S, []);
- media_subtype(<< $\t, R/bits >>, T, S) -> media_before_semicolon(R, T, S, []);
- media_subtype(<< C, R/bits >>, T, S) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_subtype, R, T, S)
- end.
- media_before_semicolon(<<>>, T, S, P) -> {T, S, lists:reverse(P)};
- media_before_semicolon(<< $;, R/bits >>, T, S, P) -> media_before_param(R, T, S, P);
- media_before_semicolon(<< $\s, R/bits >>, T, S, P) -> media_before_semicolon(R, T, S, P);
- media_before_semicolon(<< $\t, R/bits >>, T, S, P) -> media_before_semicolon(R, T, S, P).
- media_before_param(<< $\s, R/bits >>, T, S, P) -> media_before_param(R, T, S, P);
- media_before_param(<< $\t, R/bits >>, T, S, P) -> media_before_param(R, T, S, P);
- media_before_param(<< "charset=", $", R/bits >>, T, S, P) -> media_charset_quoted(R, T, S, P, <<>>);
- media_before_param(<< "charset=", R/bits >>, T, S, P) -> media_charset(R, T, S, P, <<>>);
- media_before_param(<< C, R/bits >>, T, S, P) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_param, R, T, S, P, <<>>)
- end.
- media_charset_quoted(<< $", R/bits >>, T, S, P, V) ->
- media_before_semicolon(R, T, S, [{<<"charset">>, V}|P]);
- media_charset_quoted(<< $\\, C, R/bits >>, T, S, P, V) when ?IS_VCHAR(C) ->
- case C of
- ?INLINE_LOWERCASE(media_charset_quoted, R, T, S, P, V)
- end;
- media_charset_quoted(<< C, R/bits >>, T, S, P, V) when ?IS_VCHAR(C) ->
- case C of
- ?INLINE_LOWERCASE(media_charset_quoted, R, T, S, P, V)
- end.
- media_charset(<<>>, T, S, P, V) -> {T, S, lists:reverse([{<<"charset">>, V}|P])};
- media_charset(<< $;, R/bits >>, T, S, P, V) -> media_before_param(R, T, S, [{<<"charset">>, V}|P]);
- media_charset(<< $\s, R/bits >>, T, S, P, V) -> media_before_semicolon(R, T, S, [{<<"charset">>, V}|P]);
- media_charset(<< $\t, R/bits >>, T, S, P, V) -> media_before_semicolon(R, T, S, [{<<"charset">>, V}|P]);
- media_charset(<< C, R/bits >>, T, S, P, V) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_charset, R, T, S, P, V)
- end.
- media_param(<< $=, $", R/bits >>, T, S, P, K) -> media_quoted(R, T, S, P, K, <<>>);
- media_param(<< $=, R/bits >>, T, S, P, K) -> media_value(R, T, S, P, K, <<>>);
- media_param(<< C, R/bits >>, T, S, P, K) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(media_param, R, T, S, P, K)
- end.
- media_quoted(<< $", R/bits >>, T, S, P, K, V) -> media_before_semicolon(R, T, S, [{K, V}|P]);
- media_quoted(<< $\\, C, R/bits >>, T, S, P, K, V) when ?IS_VCHAR(C) -> media_quoted(R, T, S, P, K, << V/binary, C >>);
- media_quoted(<< C, R/bits >>, T, S, P, K, V) when ?IS_VCHAR(C) -> media_quoted(R, T, S, P, K, << V/binary, C >>).
- media_value(<<>>, T, S, P, K, V) -> {T, S, lists:reverse([{K, V}|P])};
- media_value(<< $;, R/bits >>, T, S, P, K, V) -> media_before_param(R, T, S, [{K, V}|P]);
- media_value(<< $\s, R/bits >>, T, S, P, K, V) -> media_before_semicolon(R, T, S, [{K, V}|P]);
- media_value(<< $\t, R/bits >>, T, S, P, K, V) -> media_before_semicolon(R, T, S, [{K, V}|P]);
- media_value(<< C, R/bits >>, T, S, P, K, V) when ?IS_TOKEN(C) -> media_value(R, T, S, P, K, << V/binary, C >>).
- -ifdef(TEST).
- media_type_parameter() ->
- frequency([
- {90, parameter()},
- {10, {<<"charset">>, oneof([token(), quoted_string()]), <<>>, <<>>}}
- ]).
- media_type() ->
- ?LET({T, S, P},
- {token(), token(), list(media_type_parameter())},
- {T, S, P, iolist_to_binary([T, $/, S, [[OWS1, $;, OWS2, K, $=, V] || {K, V, OWS1, OWS2} <- P]])}
- ).
- prop_parse_content_type() ->
- ?FORALL({T, S, P, MediaType},
- media_type(),
- begin
- {ResT, ResS, ResP} = parse_content_type(MediaType),
- ExpectedP = [case ?INLINE_LOWERCASE_BC(K) of
- <<"charset">> -> {<<"charset">>, ?INLINE_LOWERCASE_BC(unquote(V))};
- LowK -> {LowK, unquote(V)}
- end || {K, V, _, _} <- P],
- ResT =:= ?INLINE_LOWERCASE_BC(T)
- andalso ResS =:= ?INLINE_LOWERCASE_BC(S)
- andalso ResP =:= ExpectedP
- end
- ).
- parse_content_type_test_() ->
- Tests = [
- {<<"text/html;charset=utf-8">>,
- {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
- {<<"text/html;charset=UTF-8">>,
- {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
- {<<"Text/HTML;Charset=\"utf-8\"">>,
- {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
- {<<"text/html; charset=\"utf-8\"">>,
- {<<"text">>, <<"html">>, [{<<"charset">>, <<"utf-8">>}]}},
- {<<"text/html; charset=ISO-8859-4">>,
- {<<"text">>, <<"html">>, [{<<"charset">>, <<"iso-8859-4">>}]}},
- {<<"text/plain; charset=iso-8859-4">>,
- {<<"text">>, <<"plain">>, [{<<"charset">>, <<"iso-8859-4">>}]}},
- {<<"multipart/form-data \t;Boundary=\"MultipartIsUgly\"">>,
- {<<"multipart">>, <<"form-data">>, [
- {<<"boundary">>, <<"MultipartIsUgly">>}
- ]}},
- {<<"foo/bar; one=FirstParam; two=SecondParam">>,
- {<<"foo">>, <<"bar">>, [
- {<<"one">>, <<"FirstParam">>},
- {<<"two">>, <<"SecondParam">>}
- ]}}
- ],
- [{V, fun() -> R = parse_content_type(V) end} || {V, R} <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_content_type() ->
- horse:repeat(200000,
- parse_content_type(<<"text/html;charset=utf-8">>)
- ).
- -endif.
- %% @doc Parse the Date header.
- -spec parse_date(binary()) -> calendar:datetime().
- parse_date(Date) ->
- cow_date:parse_date(Date).
- -ifdef(TEST).
- parse_date_test_() ->
- Tests = [
- {<<"Tue, 15 Nov 1994 08:12:31 GMT">>, {{1994, 11, 15}, {8, 12, 31}}}
- ],
- [{V, fun() -> R = parse_date(V) end} || {V, R} <- Tests].
- -endif.
- %% @doc Parse the ETag header.
- -spec parse_etag(binary()) -> etag().
- parse_etag(<< $W, $/, $", R/bits >>) ->
- etag(R, weak, <<>>);
- parse_etag(<< $", R/bits >>) ->
- etag(R, strong, <<>>).
- etag(<< $", R/bits >>, Strength, Tag) ->
- ws_end(R),
- {Strength, Tag};
- etag(<< C, R/bits >>, Strength, Tag) when ?IS_ETAGC(C) ->
- etag(R, Strength, << Tag/binary, C >>).
- -ifdef(TEST).
- etagc() ->
- ?SUCHTHAT(C, int(16#21, 16#ff), C =/= 16#22 andalso C =/= 16#7f).
- etag() ->
- ?LET({Strength, Tag},
- {oneof([weak, strong]), list(etagc())},
- begin
- TagBin = list_to_binary(Tag),
- {{Strength, TagBin},
- case Strength of
- weak -> << $W, $/, $", TagBin/binary, $" >>;
- strong -> << $", TagBin/binary, $" >>
- end}
- end).
- prop_parse_etag() ->
- ?FORALL({Tag, TagBin},
- etag(),
- Tag =:= parse_etag(TagBin)).
- parse_etag_test_() ->
- Tests = [
- {<<"\"xyzzy\"">>, {strong, <<"xyzzy">>}},
- {<<"W/\"xyzzy\"">>, {weak, <<"xyzzy">>}},
- {<<"\"\"">>, {strong, <<>>}}
- ],
- [{V, fun() -> R = parse_etag(V) end} || {V, R} <- Tests].
- parse_etag_error_test_() ->
- Tests = [
- <<>>,
- <<"\"">>,
- <<"W">>,
- <<"W/">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_etag(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_etag() ->
- horse:repeat(200000,
- parse_etag(<<"W/\"xyzzy\"">>)
- ).
- -endif.
- %% @doc Parse the Expect header.
- -spec parse_expect(binary()) -> continue.
- parse_expect(<<"100-continue", Rest/bits >>) ->
- ws_end(Rest),
- continue;
- parse_expect(<<"100-", C, O, N, T, I, M, U, E, Rest/bits >>)
- when C =:= $C orelse C =:= $c, O =:= $O orelse O =:= $o,
- N =:= $N orelse N =:= $n, T =:= $T orelse T =:= $t,
- I =:= $I orelse I =:= $i, M =:= $N orelse M =:= $n,
- U =:= $U orelse U =:= $u, E =:= $E orelse E =:= $e ->
- ws_end(Rest),
- continue.
- -ifdef(TEST).
- expect() ->
- ?LET(E,
- [$1, $0, $0, $-,
- oneof([$c, $C]), oneof([$o, $O]), oneof([$n, $N]),
- oneof([$t, $T]), oneof([$i, $I]), oneof([$n, $N]),
- oneof([$u, $U]), oneof([$e, $E])],
- list_to_binary(E)).
- prop_parse_expect() ->
- ?FORALL(E, expect(), continue =:= parse_expect(E)).
- parse_expect_test_() ->
- Tests = [
- <<"100-continue">>,
- <<"100-CONTINUE">>,
- <<"100-Continue">>,
- <<"100-CoNtInUe">>,
- <<"100-continue ">>
- ],
- [{V, fun() -> continue = parse_expect(V) end} || V <- Tests].
- parse_expect_error_test_() ->
- Tests = [
- <<>>,
- <<" ">>,
- <<"200-OK">>,
- <<"Cookies">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_expect(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_expect() ->
- horse:repeat(200000,
- parse_expect(<<"100-continue">>)
- ).
- -endif.
- %% @doc Parse the If-Match header.
- -spec parse_if_match(binary()) -> '*' | [etag()].
- parse_if_match(<<"*">>) ->
- '*';
- parse_if_match(IfMatch) ->
- nonempty(etag_list(IfMatch, [])).
- etag_list(<<>>, Acc) -> lists:reverse(Acc);
- etag_list(<< $\s, R/bits >>, Acc) -> etag_list(R, Acc);
- etag_list(<< $\t, R/bits >>, Acc) -> etag_list(R, Acc);
- etag_list(<< $,, R/bits >>, Acc) -> etag_list(R, Acc);
- etag_list(<< $W, $/, $", R/bits >>, Acc) -> etag(R, Acc, weak, <<>>);
- etag_list(<< $", R/bits >>, Acc) -> etag(R, Acc, strong, <<>>).
- etag(<< $", R/bits >>, Acc, Strength, Tag) -> etag_list_sep(R, [{Strength, Tag}|Acc]);
- etag(<< C, R/bits >>, Acc, Strength, Tag) when ?IS_ETAGC(C) -> etag(R, Acc, Strength, << Tag/binary, C >>).
- etag_list_sep(<<>>, Acc) -> lists:reverse(Acc);
- etag_list_sep(<< $\s, R/bits >>, Acc) -> etag_list_sep(R, Acc);
- etag_list_sep(<< $\t, R/bits >>, Acc) -> etag_list_sep(R, Acc);
- etag_list_sep(<< $,, R/bits >>, Acc) -> etag_list(R, Acc).
- -ifdef(TEST).
- prop_parse_if_match() ->
- ?FORALL(L,
- non_empty(list(etag())),
- begin
- << _, IfMatch/binary >> = iolist_to_binary([[$,, T] || {_, T} <- L]),
- ResL = parse_if_match(IfMatch),
- CheckedL = [T =:= ResT || {{T, _}, ResT} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_if_match_test_() ->
- Tests = [
- {<<"\"xyzzy\"">>, [{strong, <<"xyzzy">>}]},
- {<<"\"xyzzy\", \"r2d2xxxx\", \"c3piozzzz\"">>,
- [{strong, <<"xyzzy">>}, {strong, <<"r2d2xxxx">>}, {strong, <<"c3piozzzz">>}]},
- {<<"*">>, '*'}
- ],
- [{V, fun() -> R = parse_if_match(V) end} || {V, R} <- Tests].
- parse_if_match_error_test_() ->
- Tests = [
- <<>>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_if_match(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_if_match() ->
- horse:repeat(200000,
- parse_if_match(<<"\"xyzzy\", \"r2d2xxxx\", \"c3piozzzz\"">>)
- ).
- -endif.
- %% @doc Parse the If-Modified-Since header.
- -spec parse_if_modified_since(binary()) -> calendar:datetime().
- parse_if_modified_since(IfModifiedSince) ->
- cow_date:parse_date(IfModifiedSince).
- -ifdef(TEST).
- parse_if_modified_since_test_() ->
- Tests = [
- {<<"Sat, 29 Oct 1994 19:43:31 GMT">>, {{1994, 10, 29}, {19, 43, 31}}}
- ],
- [{V, fun() -> R = parse_if_modified_since(V) end} || {V, R} <- Tests].
- -endif.
- %% @doc Parse the If-None-Match header.
- -spec parse_if_none_match(binary()) -> '*' | [etag()].
- parse_if_none_match(<<"*">>) ->
- '*';
- parse_if_none_match(IfNoneMatch) ->
- nonempty(etag_list(IfNoneMatch, [])).
- -ifdef(TEST).
- parse_if_none_match_test_() ->
- Tests = [
- {<<"\"xyzzy\"">>, [{strong, <<"xyzzy">>}]},
- {<<"W/\"xyzzy\"">>, [{weak, <<"xyzzy">>}]},
- {<<"\"xyzzy\", \"r2d2xxxx\", \"c3piozzzz\"">>,
- [{strong, <<"xyzzy">>}, {strong, <<"r2d2xxxx">>}, {strong, <<"c3piozzzz">>}]},
- {<<"W/\"xyzzy\", W/\"r2d2xxxx\", W/\"c3piozzzz\"">>,
- [{weak, <<"xyzzy">>}, {weak, <<"r2d2xxxx">>}, {weak, <<"c3piozzzz">>}]},
- {<<"*">>, '*'}
- ],
- [{V, fun() -> R = parse_if_none_match(V) end} || {V, R} <- Tests].
- parse_if_none_match_error_test_() ->
- Tests = [
- <<>>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_if_none_match(V)) end} || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_if_none_match() ->
- horse:repeat(200000,
- parse_if_none_match(<<"W/\"xyzzy\", W/\"r2d2xxxx\", W/\"c3piozzzz\"">>)
- ).
- -endif.
- %% @doc Parse the If-Unmodified-Since header.
- -spec parse_if_unmodified_since(binary()) -> calendar:datetime().
- parse_if_unmodified_since(IfModifiedSince) ->
- cow_date:parse_date(IfModifiedSince).
- -ifdef(TEST).
- parse_if_unmodified_since_test_() ->
- Tests = [
- {<<"Sat, 29 Oct 1994 19:43:31 GMT">>, {{1994, 10, 29}, {19, 43, 31}}}
- ],
- [{V, fun() -> R = parse_if_unmodified_since(V) end} || {V, R} <- Tests].
- -endif.
- %% @doc Parse the Last-Modified header.
- -spec parse_last_modified(binary()) -> calendar:datetime().
- parse_last_modified(LastModified) ->
- cow_date:parse_date(LastModified).
- -ifdef(TEST).
- parse_last_modified_test_() ->
- Tests = [
- {<<"Tue, 15 Nov 1994 12:45:26 GMT">>, {{1994, 11, 15}, {12, 45, 26}}}
- ],
- [{V, fun() -> R = parse_last_modified(V) end} || {V, R} <- Tests].
- -endif.
- %% @doc Parse the Max-Forwards header.
- -spec parse_max_forwards(binary()) -> integer().
- parse_max_forwards(<< $0, R/bits >>) -> number(R, 0);
- parse_max_forwards(<< $1, R/bits >>) -> number(R, 1);
- parse_max_forwards(<< $2, R/bits >>) -> number(R, 2);
- parse_max_forwards(<< $3, R/bits >>) -> number(R, 3);
- parse_max_forwards(<< $4, R/bits >>) -> number(R, 4);
- parse_max_forwards(<< $5, R/bits >>) -> number(R, 5);
- parse_max_forwards(<< $6, R/bits >>) -> number(R, 6);
- parse_max_forwards(<< $7, R/bits >>) -> number(R, 7);
- parse_max_forwards(<< $8, R/bits >>) -> number(R, 8);
- parse_max_forwards(<< $9, R/bits >>) -> number(R, 9).
- -ifdef(TEST).
- prop_parse_max_forwards() ->
- ?FORALL(
- X,
- non_neg_integer(),
- X =:= parse_max_forwards(integer_to_binary(X))
- ).
- parse_max_forwards_test_() ->
- Tests = [
- {<<"0">>, 0},
- {<<"42 ">>, 42},
- {<<"69\t">>, 69},
- {<<"1337">>, 1337},
- {<<"1234567890">>, 1234567890},
- {<<"1234567890 ">>, 1234567890}
- ],
- [{V, fun() -> R = parse_max_forwards(V) end} || {V, R} <- Tests].
- parse_max_forwards_error_test_() ->
- Tests = [
- <<>>,
- <<"123, 123">>,
- <<"4.17">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_content_length(V)) end} || V <- Tests].
- -endif.
- %% @doc Parse the Transfer-Encoding header.
- %%
- %% @todo This function does not support parsing of transfer-parameter.
- -spec parse_transfer_encoding(binary()) -> [binary()].
- parse_transfer_encoding(<<"chunked">>) ->
- [<<"chunked">>];
- parse_transfer_encoding(TransferEncoding) ->
- nonempty(token_ci_list(TransferEncoding, [])).
- -ifdef(TEST).
- prop_parse_transfer_encoding() ->
- ?FORALL(L,
- non_empty(list(token())),
- begin
- << _, TransferEncoding/binary >> = iolist_to_binary([[$,, C] || C <- L]),
- ResL = parse_transfer_encoding(TransferEncoding),
- CheckedL = [?INLINE_LOWERCASE_BC(Co) =:= ResC || {Co, ResC} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_transfer_encoding_test_() ->
- Tests = [
- {<<"a , , , ">>, [<<"a">>]},
- {<<" , , , a">>, [<<"a">>]},
- {<<"a , , b">>, [<<"a">>, <<"b">>]},
- {<<"chunked">>, [<<"chunked">>]},
- {<<"chunked, something">>, [<<"chunked">>, <<"something">>]},
- {<<"gzip, chunked">>, [<<"gzip">>, <<"chunked">>]}
- ],
- [{V, fun() -> R = parse_transfer_encoding(V) end} || {V, R} <- Tests].
- parse_transfer_encoding_error_test_() ->
- Tests = [
- <<>>,
- <<" ">>,
- <<" , ">>,
- <<",,,">>,
- <<"a b">>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_transfer_encoding(V)) end}
- || V <- Tests].
- -endif.
- -ifdef(PERF).
- horse_parse_transfer_encoding_chunked() ->
- horse:repeat(200000,
- parse_transfer_encoding(<<"chunked">>)
- ).
- horse_parse_transfer_encoding_custom() ->
- horse:repeat(200000,
- parse_transfer_encoding(<<"chunked, something">>)
- ).
- -endif.
- %% @doc Parse the Upgrade header.
- %%
- %% It is unclear from the RFC whether the values here are
- %% case sensitive.
- %%
- %% We handle them in a case insensitive manner because they
- %% are described as case insensitive in the Websocket RFC.
- -spec parse_upgrade(binary()) -> [binary()].
- parse_upgrade(Upgrade) ->
- nonempty(protocol_list(Upgrade, [])).
- protocol_list(<<>>, Acc) -> lists:reverse(Acc);
- protocol_list(<< $\s, R/bits >>, Acc) -> protocol_list(R, Acc);
- protocol_list(<< $\t, R/bits >>, Acc) -> protocol_list(R, Acc);
- protocol_list(<< $,, R/bits >>, Acc) -> protocol_list(R, Acc);
- protocol_list(<< C, R/bits >>, Acc) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(protocol_name, R, Acc, <<>>)
- end.
- protocol_name(<<>>, Acc, P) -> lists:reverse([P|Acc]);
- protocol_name(<< $\s, R/bits >>, Acc, P) -> protocol_list_sep(R, [P|Acc]);
- protocol_name(<< $\t, R/bits >>, Acc, P) -> protocol_list_sep(R, [P|Acc]);
- protocol_name(<< $,, R/bits >>, Acc, P) -> protocol_list(R, [P|Acc]);
- protocol_name(<< $/, C, R/bits >>, Acc, P) ->
- case C of
- ?INLINE_LOWERCASE(protocol_version, R, Acc, << P/binary, $/ >>)
- end;
- protocol_name(<< C, R/bits >>, Acc, P) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(protocol_name, R, Acc, P)
- end.
- protocol_version(<<>>, Acc, P) -> lists:reverse([P|Acc]);
- protocol_version(<< $\s, R/bits >>, Acc, P) -> protocol_list_sep(R, [P|Acc]);
- protocol_version(<< $\t, R/bits >>, Acc, P) -> protocol_list_sep(R, [P|Acc]);
- protocol_version(<< $,, R/bits >>, Acc, P) -> protocol_list(R, [P|Acc]);
- protocol_version(<< C, R/bits >>, Acc, P) when ?IS_TOKEN(C) ->
- case C of
- ?INLINE_LOWERCASE(protocol_version, R, Acc, P)
- end.
- protocol_list_sep(<<>>, Acc) -> lists:reverse(Acc);
- protocol_list_sep(<< $\s, R/bits >>, Acc) -> protocol_list_sep(R, Acc);
- protocol_list_sep(<< $\t, R/bits >>, Acc) -> protocol_list_sep(R, Acc);
- protocol_list_sep(<< $,, R/bits >>, Acc) -> protocol_list(R, Acc).
- -ifdef(TEST).
- protocols() ->
- ?LET(P,
- oneof([token(), [token(), $/, token()]]),
- iolist_to_binary(P)).
- prop_parse_upgrade() ->
- ?FORALL(L,
- non_empty(list(protocols())),
- begin
- << _, Upgrade/binary >> = iolist_to_binary([[$,, P] || P <- L]),
- ResL = parse_upgrade(Upgrade),
- CheckedL = [?INLINE_LOWERCASE_BC(P) =:= ResP || {P, ResP} <- lists:zip(L, ResL)],
- [true] =:= lists:usort(CheckedL)
- end).
- parse_upgrade_test_() ->
- Tests = [
- {<<"HTTP/2.0, SHTTP/1.3, IRC/6.9, RTA/x11">>,
- [<<"http/2.0">>, <<"shttp/1.3">>, <<"irc/6.9">>, <<"rta/x11">>]},
- {<<"HTTP/2.0">>, [<<"http/2.0">>]}
- ],
- [{V, fun() -> R = parse_transfer_encoding(V) end} || {V, R} <- Tests].
- parse_upgrade_error_test_() ->
- Tests = [
- <<>>
- ],
- [{V, fun() -> {'EXIT', _} = (catch parse_upgrade(V)) end}
- || V <- Tests].
- -endif.
- %% Internal.
- %% Only return if the list is not empty.
- nonempty(L) when L =/= [] -> L.
- %% Parse a number optionally followed by whitespace.
- number(<< $0, R/bits >>, Acc) -> number(R, Acc * 10);
- number(<< $1, R/bits >>, Acc) -> number(R, Acc * 10 + 1);
- number(<< $2, R/bits >>, Acc) -> number(R, Acc * 10 + 2);
- number(<< $3, R/bits >>, Acc) -> number(R, Acc * 10 + 3);
- number(<< $4, R/bits >>, Acc) -> number(R, Acc * 10 + 4);
- number(<< $5, R/bits >>, Acc) -> number(R, Acc * 10 + 5);
- number(<< $6, R/bits >>, Acc) -> number(R, Acc * 10 + 6);
- number(<< $7, R/bits >>, Acc) -> number(R, Acc * 10 + 7);
- number(<< $8, R/bits >>, Acc) -> number(R, Acc * 10 + 8);
- number(<< $9, R/bits >>, Acc) -> number(R, Acc * 10 + 9);
- number(<< $\s, R/bits >>, Acc) -> ws_end(R), Acc;
- number(<< $\t, R/bits >>, Acc) -> ws_end(R), Acc;
- number(<<>>, Acc) -> Acc.
- ws_end(<< $\s, R/bits >>) -> ws_end(R);
- ws_end(<< $\t, R/bits >>) -> ws_end(R);
- ws_end(<<>>) -> ok.
- %% Parse a list of case insensitive tokens.
- token_ci_list(<<>>, Acc) -> lists:reverse(Acc);
- token_ci_list(<< $\s, R/bits >>, Acc) -> token_ci_list(R, Acc);
- token_ci_list(<< $\t, R/bits >>, Acc) -> token_ci_list(R, Acc);
- token_ci_list(<< $,, R/bits >>, Acc) -> token_ci_list(R, Acc);
- token_ci_list(<< C, R/bits >>, Acc) ->
- case C of
- ?INLINE_LOWERCASE(token_ci_list, R, Acc, <<>>)
- end.
- token_ci_list(<<>>, Acc, T) -> lists:reverse([T|Acc]);
- token_ci_list(<< $\s, R/bits >>, Acc, T) -> token_ci_list_sep(R, Acc, T);
- token_ci_list(<< $\t, R/bits >>, Acc, T) -> token_ci_list_sep(R, Acc, T);
- token_ci_list(<< $,, R/bits >>, Acc, T) -> token_ci_list(R, [T|Acc]);
- token_ci_list(<< C, R/bits >>, Acc, T) ->
- case C of
- ?INLINE_LOWERCASE(token_ci_list, R, Acc, T)
- end.
- token_ci_list_sep(<<>>, Acc, T) -> lists:reverse([T|Acc]);
- token_ci_list_sep(<< $\s, R/bits >>, Acc, T) -> token_ci_list_sep(R, Acc, T);
- token_ci_list_sep(<< $\t, R/bits >>, Acc, T) -> token_ci_list_sep(R, Acc, T);
- token_ci_list_sep(<< $,, R/bits >>, Acc, T) -> token_ci_list(R, [T|Acc]).
|